{"current_steps": 1, "total_steps": 17941, "loss": 1.7989, "learning_rate": 3.3333333333333335e-07, "epoch": 5.573825316314587e-05, "percentage": 0.01, "elapsed_time": "0:00:10", "remaining_time": "2 days, 4:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2, "total_steps": 17941, "loss": 1.996, "learning_rate": 6.666666666666667e-07, "epoch": 0.00011147650632629174, "percentage": 0.01, "elapsed_time": "0:00:19", "remaining_time": "1 day, 23:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3, "total_steps": 17941, "loss": 1.8613, "learning_rate": 1.0000000000000002e-06, "epoch": 0.0001672147594894376, "percentage": 0.02, "elapsed_time": "0:00:27", "remaining_time": "1 day, 21:32:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 17941, "loss": 1.8904, "learning_rate": 1.3333333333333334e-06, "epoch": 0.00022295301265258348, "percentage": 0.02, "elapsed_time": "0:00:35", "remaining_time": "1 day, 20:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5, "total_steps": 17941, "loss": 2.0151, "learning_rate": 1.6666666666666667e-06, "epoch": 0.0002786912658157293, "percentage": 0.03, "elapsed_time": "0:00:44", "remaining_time": "1 day, 20:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 17941, "loss": 1.9774, "learning_rate": 2.0000000000000003e-06, "epoch": 0.0003344295189788752, "percentage": 0.03, "elapsed_time": "0:00:52", "remaining_time": "1 day, 19:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7, "total_steps": 17941, "loss": 1.8994, "learning_rate": 2.3333333333333336e-06, "epoch": 0.0003901677721420211, "percentage": 0.04, "elapsed_time": "0:01:01", "remaining_time": "1 day, 19:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 17941, "loss": 1.894, "learning_rate": 2.666666666666667e-06, "epoch": 0.00044590602530516696, "percentage": 0.04, "elapsed_time": "0:01:09", "remaining_time": "1 day, 19:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9, "total_steps": 17941, "loss": 2.0865, "learning_rate": 3e-06, "epoch": 0.0005016442784683128, "percentage": 0.05, "elapsed_time": "0:01:18", "remaining_time": "1 day, 19:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 17941, "loss": 1.9688, "learning_rate": 3.3333333333333333e-06, "epoch": 0.0005573825316314586, "percentage": 0.06, "elapsed_time": "0:01:26", "remaining_time": "1 day, 19:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11, "total_steps": 17941, "loss": 1.8239, "learning_rate": 3.666666666666667e-06, "epoch": 0.0006131207847946045, "percentage": 0.06, "elapsed_time": "0:01:35", "remaining_time": "1 day, 19:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 17941, "loss": 2.0367, "learning_rate": 4.000000000000001e-06, "epoch": 0.0006688590379577504, "percentage": 0.07, "elapsed_time": "0:01:43", "remaining_time": "1 day, 18:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13, "total_steps": 17941, "loss": 1.9817, "learning_rate": 4.333333333333334e-06, "epoch": 0.0007245972911208963, "percentage": 0.07, "elapsed_time": "0:01:51", "remaining_time": "1 day, 18:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 17941, "loss": 2.01, "learning_rate": 4.666666666666667e-06, "epoch": 0.0007803355442840422, "percentage": 0.08, "elapsed_time": "0:02:00", "remaining_time": "1 day, 18:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 17941, "loss": 1.8419, "learning_rate": 5e-06, "epoch": 0.000836073797447188, "percentage": 0.08, "elapsed_time": "0:02:08", "remaining_time": "1 day, 18:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 17941, "loss": 1.8663, "learning_rate": 5.333333333333334e-06, "epoch": 0.0008918120506103339, "percentage": 0.09, "elapsed_time": "0:02:17", "remaining_time": "1 day, 18:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17, "total_steps": 17941, "loss": 2.2089, "learning_rate": 5.666666666666667e-06, "epoch": 0.0009475503037734797, "percentage": 0.09, "elapsed_time": "0:02:25", "remaining_time": "1 day, 18:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 17941, "loss": 2.0842, "learning_rate": 6e-06, "epoch": 0.0010032885569366257, "percentage": 0.1, "elapsed_time": "0:02:34", "remaining_time": "1 day, 18:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19, "total_steps": 17941, "loss": 1.755, "learning_rate": 6.333333333333334e-06, "epoch": 0.0010590268100997716, "percentage": 0.11, "elapsed_time": "0:02:42", "remaining_time": "1 day, 18:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 17941, "loss": 2.2494, "learning_rate": 6.666666666666667e-06, "epoch": 0.0011147650632629172, "percentage": 0.11, "elapsed_time": "0:02:51", "remaining_time": "1 day, 18:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21, "total_steps": 17941, "loss": 2.0236, "learning_rate": 7.000000000000001e-06, "epoch": 0.0011705033164260631, "percentage": 0.12, "elapsed_time": "0:02:59", "remaining_time": "1 day, 18:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 17941, "loss": 1.8295, "learning_rate": 7.333333333333334e-06, "epoch": 0.001226241569589209, "percentage": 0.12, "elapsed_time": "0:03:08", "remaining_time": "1 day, 18:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23, "total_steps": 17941, "loss": 2.1311, "learning_rate": 7.666666666666667e-06, "epoch": 0.001281979822752355, "percentage": 0.13, "elapsed_time": "0:03:16", "remaining_time": "1 day, 18:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 17941, "loss": 1.888, "learning_rate": 8.000000000000001e-06, "epoch": 0.0013377180759155008, "percentage": 0.13, "elapsed_time": "0:03:25", "remaining_time": "1 day, 18:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 17941, "loss": 1.6625, "learning_rate": 8.333333333333334e-06, "epoch": 0.0013934563290786467, "percentage": 0.14, "elapsed_time": "0:03:33", "remaining_time": "1 day, 18:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 17941, "loss": 2.0062, "learning_rate": 8.666666666666668e-06, "epoch": 0.0014491945822417925, "percentage": 0.14, "elapsed_time": "0:03:41", "remaining_time": "1 day, 18:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27, "total_steps": 17941, "loss": 1.7991, "learning_rate": 9e-06, "epoch": 0.0015049328354049384, "percentage": 0.15, "elapsed_time": "0:03:50", "remaining_time": "1 day, 18:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 17941, "loss": 2.0728, "learning_rate": 9.333333333333334e-06, "epoch": 0.0015606710885680843, "percentage": 0.16, "elapsed_time": "0:03:58", "remaining_time": "1 day, 18:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29, "total_steps": 17941, "loss": 1.808, "learning_rate": 9.666666666666667e-06, "epoch": 0.0016164093417312302, "percentage": 0.16, "elapsed_time": "0:04:07", "remaining_time": "1 day, 18:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 17941, "loss": 1.9738, "learning_rate": 1e-05, "epoch": 0.001672147594894376, "percentage": 0.17, "elapsed_time": "0:04:15", "remaining_time": "1 day, 18:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 31, "total_steps": 17941, "loss": 2.0967, "learning_rate": 1.0333333333333333e-05, "epoch": 0.001727885848057522, "percentage": 0.17, "elapsed_time": "0:04:24", "remaining_time": "1 day, 18:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 17941, "loss": 1.6821, "learning_rate": 1.0666666666666667e-05, "epoch": 0.0017836241012206678, "percentage": 0.18, "elapsed_time": "0:04:32", "remaining_time": "1 day, 18:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 33, "total_steps": 17941, "loss": 1.8442, "learning_rate": 1.1000000000000001e-05, "epoch": 0.0018393623543838135, "percentage": 0.18, "elapsed_time": "0:04:41", "remaining_time": "1 day, 18:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 17941, "loss": 2.0705, "learning_rate": 1.1333333333333334e-05, "epoch": 0.0018951006075469594, "percentage": 0.19, "elapsed_time": "0:04:49", "remaining_time": "1 day, 18:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 17941, "loss": 1.7944, "learning_rate": 1.1666666666666668e-05, "epoch": 0.0019508388607101053, "percentage": 0.2, "elapsed_time": "0:04:58", "remaining_time": "1 day, 18:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 17941, "loss": 2.0, "learning_rate": 1.2e-05, "epoch": 0.0020065771138732514, "percentage": 0.2, "elapsed_time": "0:05:06", "remaining_time": "1 day, 18:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 37, "total_steps": 17941, "loss": 2.1365, "learning_rate": 1.2333333333333334e-05, "epoch": 0.0020623153670363973, "percentage": 0.21, "elapsed_time": "0:05:14", "remaining_time": "1 day, 18:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 17941, "loss": 1.8569, "learning_rate": 1.2666666666666668e-05, "epoch": 0.002118053620199543, "percentage": 0.21, "elapsed_time": "0:05:23", "remaining_time": "1 day, 18:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 39, "total_steps": 17941, "loss": 1.9313, "learning_rate": 1.3000000000000001e-05, "epoch": 0.0021737918733626886, "percentage": 0.22, "elapsed_time": "0:05:32", "remaining_time": "1 day, 18:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 17941, "loss": 1.8843, "learning_rate": 1.3333333333333333e-05, "epoch": 0.0022295301265258345, "percentage": 0.22, "elapsed_time": "0:05:40", "remaining_time": "1 day, 18:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 41, "total_steps": 17941, "loss": 1.929, "learning_rate": 1.3666666666666666e-05, "epoch": 0.0022852683796889804, "percentage": 0.23, "elapsed_time": "0:05:49", "remaining_time": "1 day, 18:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 17941, "loss": 2.0276, "learning_rate": 1.4000000000000001e-05, "epoch": 0.0023410066328521262, "percentage": 0.23, "elapsed_time": "0:05:57", "remaining_time": "1 day, 18:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 43, "total_steps": 17941, "loss": 1.949, "learning_rate": 1.4333333333333334e-05, "epoch": 0.002396744886015272, "percentage": 0.24, "elapsed_time": "0:06:06", "remaining_time": "1 day, 18:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 17941, "loss": 2.2978, "learning_rate": 1.4666666666666668e-05, "epoch": 0.002452483139178418, "percentage": 0.25, "elapsed_time": "0:06:14", "remaining_time": "1 day, 18:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 17941, "loss": 1.9125, "learning_rate": 1.5e-05, "epoch": 0.002508221392341564, "percentage": 0.25, "elapsed_time": "0:06:23", "remaining_time": "1 day, 18:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 17941, "loss": 1.8533, "learning_rate": 1.5333333333333334e-05, "epoch": 0.00256395964550471, "percentage": 0.26, "elapsed_time": "0:06:32", "remaining_time": "1 day, 18:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 47, "total_steps": 17941, "loss": 1.9015, "learning_rate": 1.5666666666666667e-05, "epoch": 0.0026196978986678557, "percentage": 0.26, "elapsed_time": "0:06:40", "remaining_time": "1 day, 18:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 17941, "loss": 1.682, "learning_rate": 1.6000000000000003e-05, "epoch": 0.0026754361518310016, "percentage": 0.27, "elapsed_time": "0:06:49", "remaining_time": "1 day, 18:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 49, "total_steps": 17941, "loss": 2.0425, "learning_rate": 1.6333333333333335e-05, "epoch": 0.0027311744049941474, "percentage": 0.27, "elapsed_time": "0:06:57", "remaining_time": "1 day, 18:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 17941, "loss": 1.8745, "learning_rate": 1.6666666666666667e-05, "epoch": 0.0027869126581572933, "percentage": 0.28, "elapsed_time": "0:07:06", "remaining_time": "1 day, 18:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 51, "total_steps": 17941, "loss": 1.8872, "learning_rate": 1.7000000000000003e-05, "epoch": 0.002842650911320439, "percentage": 0.28, "elapsed_time": "0:07:14", "remaining_time": "1 day, 18:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 17941, "loss": 2.0187, "learning_rate": 1.7333333333333336e-05, "epoch": 0.002898389164483585, "percentage": 0.29, "elapsed_time": "0:07:22", "remaining_time": "1 day, 18:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 53, "total_steps": 17941, "loss": 2.0231, "learning_rate": 1.7666666666666668e-05, "epoch": 0.002954127417646731, "percentage": 0.3, "elapsed_time": "0:07:31", "remaining_time": "1 day, 18:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 17941, "loss": 1.8641, "learning_rate": 1.8e-05, "epoch": 0.003009865670809877, "percentage": 0.3, "elapsed_time": "0:07:39", "remaining_time": "1 day, 18:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 17941, "loss": 2.215, "learning_rate": 1.8333333333333333e-05, "epoch": 0.0030656039239730227, "percentage": 0.31, "elapsed_time": "0:07:48", "remaining_time": "1 day, 18:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 17941, "loss": 1.9232, "learning_rate": 1.866666666666667e-05, "epoch": 0.0031213421771361686, "percentage": 0.31, "elapsed_time": "0:07:57", "remaining_time": "1 day, 18:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 57, "total_steps": 17941, "loss": 1.8452, "learning_rate": 1.9e-05, "epoch": 0.0031770804302993145, "percentage": 0.32, "elapsed_time": "0:08:06", "remaining_time": "1 day, 18:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 17941, "loss": 1.5623, "learning_rate": 1.9333333333333333e-05, "epoch": 0.0032328186834624604, "percentage": 0.32, "elapsed_time": "0:08:14", "remaining_time": "1 day, 18:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 59, "total_steps": 17941, "loss": 1.7901, "learning_rate": 1.9666666666666666e-05, "epoch": 0.0032885569366256063, "percentage": 0.33, "elapsed_time": "0:08:23", "remaining_time": "1 day, 18:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 17941, "loss": 1.8802, "learning_rate": 2e-05, "epoch": 0.003344295189788752, "percentage": 0.33, "elapsed_time": "0:08:31", "remaining_time": "1 day, 18:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 61, "total_steps": 17941, "loss": 1.8334, "learning_rate": 2.0333333333333334e-05, "epoch": 0.003400033442951898, "percentage": 0.34, "elapsed_time": "0:08:39", "remaining_time": "1 day, 18:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 17941, "loss": 2.1029, "learning_rate": 2.0666666666666666e-05, "epoch": 0.003455771696115044, "percentage": 0.35, "elapsed_time": "0:08:48", "remaining_time": "1 day, 18:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 63, "total_steps": 17941, "loss": 2.0333, "learning_rate": 2.1e-05, "epoch": 0.00351150994927819, "percentage": 0.35, "elapsed_time": "0:08:56", "remaining_time": "1 day, 18:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 17941, "loss": 1.6012, "learning_rate": 2.1333333333333335e-05, "epoch": 0.0035672482024413357, "percentage": 0.36, "elapsed_time": "0:09:05", "remaining_time": "1 day, 18:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 17941, "loss": 2.0818, "learning_rate": 2.1666666666666667e-05, "epoch": 0.003622986455604481, "percentage": 0.36, "elapsed_time": "0:09:14", "remaining_time": "1 day, 18:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 17941, "loss": 1.9022, "learning_rate": 2.2000000000000003e-05, "epoch": 0.003678724708767627, "percentage": 0.37, "elapsed_time": "0:09:22", "remaining_time": "1 day, 18:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 67, "total_steps": 17941, "loss": 1.7435, "learning_rate": 2.2333333333333335e-05, "epoch": 0.003734462961930773, "percentage": 0.37, "elapsed_time": "0:09:31", "remaining_time": "1 day, 18:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 17941, "loss": 1.7816, "learning_rate": 2.2666666666666668e-05, "epoch": 0.003790201215093919, "percentage": 0.38, "elapsed_time": "0:09:39", "remaining_time": "1 day, 18:19:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 69, "total_steps": 17941, "loss": 1.672, "learning_rate": 2.3000000000000003e-05, "epoch": 0.0038459394682570647, "percentage": 0.38, "elapsed_time": "0:09:48", "remaining_time": "1 day, 18:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 17941, "loss": 1.771, "learning_rate": 2.3333333333333336e-05, "epoch": 0.0039016777214202106, "percentage": 0.39, "elapsed_time": "0:09:56", "remaining_time": "1 day, 18:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 71, "total_steps": 17941, "loss": 1.9594, "learning_rate": 2.3666666666666668e-05, "epoch": 0.0039574159745833564, "percentage": 0.4, "elapsed_time": "0:10:05", "remaining_time": "1 day, 18:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 17941, "loss": 1.8492, "learning_rate": 2.4e-05, "epoch": 0.004013154227746503, "percentage": 0.4, "elapsed_time": "0:10:13", "remaining_time": "1 day, 18:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 73, "total_steps": 17941, "loss": 1.798, "learning_rate": 2.4333333333333336e-05, "epoch": 0.004068892480909648, "percentage": 0.41, "elapsed_time": "0:10:22", "remaining_time": "1 day, 18:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 17941, "loss": 1.6625, "learning_rate": 2.466666666666667e-05, "epoch": 0.0041246307340727945, "percentage": 0.41, "elapsed_time": "0:10:30", "remaining_time": "1 day, 18:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 17941, "loss": 2.1015, "learning_rate": 2.5e-05, "epoch": 0.00418036898723594, "percentage": 0.42, "elapsed_time": "0:10:38", "remaining_time": "1 day, 18:16:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 17941, "loss": 1.9176, "learning_rate": 2.5333333333333337e-05, "epoch": 0.004236107240399086, "percentage": 0.42, "elapsed_time": "0:10:47", "remaining_time": "1 day, 18:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 77, "total_steps": 17941, "loss": 1.8244, "learning_rate": 2.5666666666666666e-05, "epoch": 0.004291845493562232, "percentage": 0.43, "elapsed_time": "0:10:55", "remaining_time": "1 day, 18:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 17941, "loss": 1.851, "learning_rate": 2.6000000000000002e-05, "epoch": 0.004347583746725377, "percentage": 0.43, "elapsed_time": "0:11:04", "remaining_time": "1 day, 18:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 79, "total_steps": 17941, "loss": 1.8332, "learning_rate": 2.633333333333333e-05, "epoch": 0.0044033219998885235, "percentage": 0.44, "elapsed_time": "0:11:12", "remaining_time": "1 day, 18:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 17941, "loss": 1.8357, "learning_rate": 2.6666666666666667e-05, "epoch": 0.004459060253051669, "percentage": 0.45, "elapsed_time": "0:11:21", "remaining_time": "1 day, 18:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 81, "total_steps": 17941, "loss": 1.8162, "learning_rate": 2.7000000000000002e-05, "epoch": 0.004514798506214815, "percentage": 0.45, "elapsed_time": "0:11:29", "remaining_time": "1 day, 18:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 17941, "loss": 1.9187, "learning_rate": 2.733333333333333e-05, "epoch": 0.004570536759377961, "percentage": 0.46, "elapsed_time": "0:11:38", "remaining_time": "1 day, 18:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 83, "total_steps": 17941, "loss": 1.9235, "learning_rate": 2.7666666666666667e-05, "epoch": 0.004626275012541107, "percentage": 0.46, "elapsed_time": "0:11:46", "remaining_time": "1 day, 18:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 17941, "loss": 1.9148, "learning_rate": 2.8000000000000003e-05, "epoch": 0.0046820132657042525, "percentage": 0.47, "elapsed_time": "0:11:55", "remaining_time": "1 day, 18:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 17941, "loss": 1.9738, "learning_rate": 2.8333333333333335e-05, "epoch": 0.004737751518867399, "percentage": 0.47, "elapsed_time": "0:12:03", "remaining_time": "1 day, 18:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 17941, "loss": 1.6872, "learning_rate": 2.8666666666666668e-05, "epoch": 0.004793489772030544, "percentage": 0.48, "elapsed_time": "0:12:11", "remaining_time": "1 day, 18:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 87, "total_steps": 17941, "loss": 1.9944, "learning_rate": 2.9e-05, "epoch": 0.004849228025193691, "percentage": 0.48, "elapsed_time": "0:12:20", "remaining_time": "1 day, 18:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 17941, "loss": 1.7542, "learning_rate": 2.9333333333333336e-05, "epoch": 0.004904966278356836, "percentage": 0.49, "elapsed_time": "0:12:28", "remaining_time": "1 day, 18:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 89, "total_steps": 17941, "loss": 1.9534, "learning_rate": 2.9666666666666672e-05, "epoch": 0.004960704531519982, "percentage": 0.5, "elapsed_time": "0:12:37", "remaining_time": "1 day, 18:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 17941, "loss": 1.7684, "learning_rate": 3e-05, "epoch": 0.005016442784683128, "percentage": 0.5, "elapsed_time": "0:12:45", "remaining_time": "1 day, 18:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 91, "total_steps": 17941, "loss": 1.9028, "learning_rate": 3.0333333333333337e-05, "epoch": 0.005072181037846274, "percentage": 0.51, "elapsed_time": "0:12:54", "remaining_time": "1 day, 18:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 17941, "loss": 1.8876, "learning_rate": 3.066666666666667e-05, "epoch": 0.00512791929100942, "percentage": 0.51, "elapsed_time": "0:13:02", "remaining_time": "1 day, 18:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 93, "total_steps": 17941, "loss": 1.7623, "learning_rate": 3.1e-05, "epoch": 0.005183657544172566, "percentage": 0.52, "elapsed_time": "0:13:11", "remaining_time": "1 day, 18:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 17941, "loss": 1.7103, "learning_rate": 3.1333333333333334e-05, "epoch": 0.005239395797335711, "percentage": 0.52, "elapsed_time": "0:13:19", "remaining_time": "1 day, 18:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 17941, "loss": 1.537, "learning_rate": 3.1666666666666666e-05, "epoch": 0.005295134050498858, "percentage": 0.53, "elapsed_time": "0:13:28", "remaining_time": "1 day, 18:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 17941, "loss": 1.6681, "learning_rate": 3.2000000000000005e-05, "epoch": 0.005350872303662003, "percentage": 0.54, "elapsed_time": "0:13:36", "remaining_time": "1 day, 18:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 97, "total_steps": 17941, "loss": 2.1339, "learning_rate": 3.233333333333333e-05, "epoch": 0.005406610556825149, "percentage": 0.54, "elapsed_time": "0:13:45", "remaining_time": "1 day, 18:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 17941, "loss": 1.7591, "learning_rate": 3.266666666666667e-05, "epoch": 0.005462348809988295, "percentage": 0.55, "elapsed_time": "0:13:54", "remaining_time": "1 day, 18:11:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 99, "total_steps": 17941, "loss": 1.901, "learning_rate": 3.3e-05, "epoch": 0.005518087063151441, "percentage": 0.55, "elapsed_time": "0:14:02", "remaining_time": "1 day, 18:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 17941, "loss": 1.5989, "learning_rate": 3.3333333333333335e-05, "epoch": 0.005573825316314587, "percentage": 0.56, "elapsed_time": "0:14:11", "remaining_time": "1 day, 18:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 101, "total_steps": 17941, "loss": 1.7429, "learning_rate": 3.366666666666667e-05, "epoch": 0.005629563569477733, "percentage": 0.56, "elapsed_time": "0:14:19", "remaining_time": "1 day, 18:11:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 17941, "loss": 1.9885, "learning_rate": 3.4000000000000007e-05, "epoch": 0.005685301822640878, "percentage": 0.57, "elapsed_time": "0:14:28", "remaining_time": "1 day, 18:10:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 103, "total_steps": 17941, "loss": 1.8521, "learning_rate": 3.433333333333333e-05, "epoch": 0.005741040075804025, "percentage": 0.57, "elapsed_time": "0:14:36", "remaining_time": "1 day, 18:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 17941, "loss": 1.8404, "learning_rate": 3.466666666666667e-05, "epoch": 0.00579677832896717, "percentage": 0.58, "elapsed_time": "0:14:45", "remaining_time": "1 day, 18:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 17941, "loss": 1.8081, "learning_rate": 3.5e-05, "epoch": 0.005852516582130316, "percentage": 0.59, "elapsed_time": "0:14:53", "remaining_time": "1 day, 18:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 17941, "loss": 1.8672, "learning_rate": 3.5333333333333336e-05, "epoch": 0.005908254835293462, "percentage": 0.59, "elapsed_time": "0:15:02", "remaining_time": "1 day, 18:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 107, "total_steps": 17941, "loss": 1.7029, "learning_rate": 3.566666666666667e-05, "epoch": 0.005963993088456607, "percentage": 0.6, "elapsed_time": "0:15:10", "remaining_time": "1 day, 18:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 17941, "loss": 1.5455, "learning_rate": 3.6e-05, "epoch": 0.006019731341619754, "percentage": 0.6, "elapsed_time": "0:15:18", "remaining_time": "1 day, 18:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 109, "total_steps": 17941, "loss": 1.9576, "learning_rate": 3.633333333333333e-05, "epoch": 0.006075469594782899, "percentage": 0.61, "elapsed_time": "0:15:27", "remaining_time": "1 day, 18:08:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 17941, "loss": 1.9341, "learning_rate": 3.6666666666666666e-05, "epoch": 0.0061312078479460455, "percentage": 0.61, "elapsed_time": "0:15:35", "remaining_time": "1 day, 18:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 111, "total_steps": 17941, "loss": 1.9828, "learning_rate": 3.7e-05, "epoch": 0.006186946101109191, "percentage": 0.62, "elapsed_time": "0:15:44", "remaining_time": "1 day, 18:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 17941, "loss": 2.0277, "learning_rate": 3.733333333333334e-05, "epoch": 0.006242684354272337, "percentage": 0.62, "elapsed_time": "0:15:52", "remaining_time": "1 day, 18:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 113, "total_steps": 17941, "loss": 1.7702, "learning_rate": 3.766666666666667e-05, "epoch": 0.006298422607435483, "percentage": 0.63, "elapsed_time": "0:16:01", "remaining_time": "1 day, 18:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 17941, "loss": 1.9062, "learning_rate": 3.8e-05, "epoch": 0.006354160860598629, "percentage": 0.64, "elapsed_time": "0:16:09", "remaining_time": "1 day, 18:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 17941, "loss": 1.8527, "learning_rate": 3.8333333333333334e-05, "epoch": 0.0064098991137617745, "percentage": 0.64, "elapsed_time": "0:16:18", "remaining_time": "1 day, 18:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 17941, "loss": 1.8439, "learning_rate": 3.866666666666667e-05, "epoch": 0.006465637366924921, "percentage": 0.65, "elapsed_time": "0:16:26", "remaining_time": "1 day, 18:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 117, "total_steps": 17941, "loss": 2.0114, "learning_rate": 3.9000000000000006e-05, "epoch": 0.006521375620088066, "percentage": 0.65, "elapsed_time": "0:16:34", "remaining_time": "1 day, 18:06:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 17941, "loss": 1.6951, "learning_rate": 3.933333333333333e-05, "epoch": 0.0065771138732512125, "percentage": 0.66, "elapsed_time": "0:16:43", "remaining_time": "1 day, 18:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 119, "total_steps": 17941, "loss": 1.9907, "learning_rate": 3.966666666666667e-05, "epoch": 0.006632852126414358, "percentage": 0.66, "elapsed_time": "0:16:51", "remaining_time": "1 day, 18:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 17941, "loss": 1.7934, "learning_rate": 4e-05, "epoch": 0.006688590379577504, "percentage": 0.67, "elapsed_time": "0:17:00", "remaining_time": "1 day, 18:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 121, "total_steps": 17941, "loss": 1.6549, "learning_rate": 4.0333333333333336e-05, "epoch": 0.00674432863274065, "percentage": 0.67, "elapsed_time": "0:17:08", "remaining_time": "1 day, 18:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 17941, "loss": 1.9666, "learning_rate": 4.066666666666667e-05, "epoch": 0.006800066885903796, "percentage": 0.68, "elapsed_time": "0:17:17", "remaining_time": "1 day, 18:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 123, "total_steps": 17941, "loss": 2.024, "learning_rate": 4.1e-05, "epoch": 0.0068558051390669415, "percentage": 0.69, "elapsed_time": "0:17:25", "remaining_time": "1 day, 18:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 17941, "loss": 1.6993, "learning_rate": 4.133333333333333e-05, "epoch": 0.006911543392230088, "percentage": 0.69, "elapsed_time": "0:17:34", "remaining_time": "1 day, 18:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 17941, "loss": 2.0135, "learning_rate": 4.166666666666667e-05, "epoch": 0.006967281645393233, "percentage": 0.7, "elapsed_time": "0:17:43", "remaining_time": "1 day, 18:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 17941, "loss": 1.9444, "learning_rate": 4.2e-05, "epoch": 0.00702301989855638, "percentage": 0.7, "elapsed_time": "0:17:51", "remaining_time": "1 day, 18:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 127, "total_steps": 17941, "loss": 1.6977, "learning_rate": 4.233333333333334e-05, "epoch": 0.007078758151719525, "percentage": 0.71, "elapsed_time": "0:18:00", "remaining_time": "1 day, 18:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 17941, "loss": 1.7938, "learning_rate": 4.266666666666667e-05, "epoch": 0.007134496404882671, "percentage": 0.71, "elapsed_time": "0:18:08", "remaining_time": "1 day, 18:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 129, "total_steps": 17941, "loss": 2.1036, "learning_rate": 4.3e-05, "epoch": 0.007190234658045817, "percentage": 0.72, "elapsed_time": "0:18:17", "remaining_time": "1 day, 18:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 17941, "loss": 2.0052, "learning_rate": 4.3333333333333334e-05, "epoch": 0.007245972911208962, "percentage": 0.72, "elapsed_time": "0:18:25", "remaining_time": "1 day, 18:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 131, "total_steps": 17941, "loss": 1.7815, "learning_rate": 4.3666666666666666e-05, "epoch": 0.007301711164372109, "percentage": 0.73, "elapsed_time": "0:18:34", "remaining_time": "1 day, 18:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 17941, "loss": 1.7225, "learning_rate": 4.4000000000000006e-05, "epoch": 0.007357449417535254, "percentage": 0.74, "elapsed_time": "0:18:42", "remaining_time": "1 day, 18:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 133, "total_steps": 17941, "loss": 1.5821, "learning_rate": 4.433333333333334e-05, "epoch": 0.0074131876706984, "percentage": 0.74, "elapsed_time": "0:18:51", "remaining_time": "1 day, 18:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 17941, "loss": 1.7831, "learning_rate": 4.466666666666667e-05, "epoch": 0.007468925923861546, "percentage": 0.75, "elapsed_time": "0:18:59", "remaining_time": "1 day, 18:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 17941, "loss": 1.7933, "learning_rate": 4.5e-05, "epoch": 0.007524664177024692, "percentage": 0.75, "elapsed_time": "0:19:07", "remaining_time": "1 day, 18:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 17941, "loss": 1.697, "learning_rate": 4.5333333333333335e-05, "epoch": 0.007580402430187838, "percentage": 0.76, "elapsed_time": "0:19:16", "remaining_time": "1 day, 18:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 137, "total_steps": 17941, "loss": 1.8226, "learning_rate": 4.566666666666667e-05, "epoch": 0.007636140683350984, "percentage": 0.76, "elapsed_time": "0:19:24", "remaining_time": "1 day, 18:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 17941, "loss": 1.9071, "learning_rate": 4.600000000000001e-05, "epoch": 0.007691878936514129, "percentage": 0.77, "elapsed_time": "0:19:33", "remaining_time": "1 day, 18:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 139, "total_steps": 17941, "loss": 1.8796, "learning_rate": 4.633333333333333e-05, "epoch": 0.007747617189677276, "percentage": 0.77, "elapsed_time": "0:19:41", "remaining_time": "1 day, 18:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 17941, "loss": 1.7765, "learning_rate": 4.666666666666667e-05, "epoch": 0.007803355442840421, "percentage": 0.78, "elapsed_time": "0:19:50", "remaining_time": "1 day, 18:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 141, "total_steps": 17941, "loss": 1.9653, "learning_rate": 4.7e-05, "epoch": 0.007859093696003567, "percentage": 0.79, "elapsed_time": "0:19:59", "remaining_time": "1 day, 18:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 17941, "loss": 1.9019, "learning_rate": 4.7333333333333336e-05, "epoch": 0.007914831949166713, "percentage": 0.79, "elapsed_time": "0:20:08", "remaining_time": "1 day, 18:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 143, "total_steps": 17941, "loss": 1.8028, "learning_rate": 4.766666666666667e-05, "epoch": 0.00797057020232986, "percentage": 0.8, "elapsed_time": "0:20:16", "remaining_time": "1 day, 18:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 17941, "loss": 1.8229, "learning_rate": 4.8e-05, "epoch": 0.008026308455493006, "percentage": 0.8, "elapsed_time": "0:20:25", "remaining_time": "1 day, 18:03:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 17941, "loss": 1.8648, "learning_rate": 4.8333333333333334e-05, "epoch": 0.00808204670865615, "percentage": 0.81, "elapsed_time": "0:20:33", "remaining_time": "1 day, 18:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 17941, "loss": 1.7499, "learning_rate": 4.866666666666667e-05, "epoch": 0.008137784961819296, "percentage": 0.81, "elapsed_time": "0:20:42", "remaining_time": "1 day, 18:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 147, "total_steps": 17941, "loss": 1.9345, "learning_rate": 4.9e-05, "epoch": 0.008193523214982443, "percentage": 0.82, "elapsed_time": "0:20:50", "remaining_time": "1 day, 18:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 17941, "loss": 2.0028, "learning_rate": 4.933333333333334e-05, "epoch": 0.008249261468145589, "percentage": 0.82, "elapsed_time": "0:20:59", "remaining_time": "1 day, 18:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 149, "total_steps": 17941, "loss": 2.0291, "learning_rate": 4.966666666666667e-05, "epoch": 0.008304999721308734, "percentage": 0.83, "elapsed_time": "0:21:07", "remaining_time": "1 day, 18:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 17941, "loss": 2.0909, "learning_rate": 5e-05, "epoch": 0.00836073797447188, "percentage": 0.84, "elapsed_time": "0:21:16", "remaining_time": "1 day, 18:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 151, "total_steps": 17941, "loss": 1.75, "learning_rate": 5.0333333333333335e-05, "epoch": 0.008416476227635026, "percentage": 0.84, "elapsed_time": "0:21:24", "remaining_time": "1 day, 18:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 17941, "loss": 1.8499, "learning_rate": 5.0666666666666674e-05, "epoch": 0.008472214480798173, "percentage": 0.85, "elapsed_time": "0:21:33", "remaining_time": "1 day, 18:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 153, "total_steps": 17941, "loss": 1.9604, "learning_rate": 5.1000000000000006e-05, "epoch": 0.008527952733961317, "percentage": 0.85, "elapsed_time": "0:21:41", "remaining_time": "1 day, 18:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 17941, "loss": 1.813, "learning_rate": 5.133333333333333e-05, "epoch": 0.008583690987124463, "percentage": 0.86, "elapsed_time": "0:21:49", "remaining_time": "1 day, 18:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 17941, "loss": 1.7692, "learning_rate": 5.166666666666667e-05, "epoch": 0.00863942924028761, "percentage": 0.86, "elapsed_time": "0:21:58", "remaining_time": "1 day, 18:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 17941, "loss": 1.8756, "learning_rate": 5.2000000000000004e-05, "epoch": 0.008695167493450754, "percentage": 0.87, "elapsed_time": "0:22:06", "remaining_time": "1 day, 18:01:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 157, "total_steps": 17941, "loss": 2.0465, "learning_rate": 5.2333333333333336e-05, "epoch": 0.0087509057466139, "percentage": 0.88, "elapsed_time": "0:22:15", "remaining_time": "1 day, 18:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 17941, "loss": 1.9387, "learning_rate": 5.266666666666666e-05, "epoch": 0.008806643999777047, "percentage": 0.88, "elapsed_time": "0:22:24", "remaining_time": "1 day, 18:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 159, "total_steps": 17941, "loss": 1.7746, "learning_rate": 5.300000000000001e-05, "epoch": 0.008862382252940193, "percentage": 0.89, "elapsed_time": "0:22:32", "remaining_time": "1 day, 18:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 17941, "loss": 1.7729, "learning_rate": 5.333333333333333e-05, "epoch": 0.008918120506103338, "percentage": 0.89, "elapsed_time": "0:22:41", "remaining_time": "1 day, 18:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 161, "total_steps": 17941, "loss": 1.7488, "learning_rate": 5.3666666666666666e-05, "epoch": 0.008973858759266484, "percentage": 0.9, "elapsed_time": "0:22:49", "remaining_time": "1 day, 18:00:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 17941, "loss": 1.8962, "learning_rate": 5.4000000000000005e-05, "epoch": 0.00902959701242963, "percentage": 0.9, "elapsed_time": "0:22:58", "remaining_time": "1 day, 18:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 163, "total_steps": 17941, "loss": 1.8141, "learning_rate": 5.433333333333334e-05, "epoch": 0.009085335265592777, "percentage": 0.91, "elapsed_time": "0:23:06", "remaining_time": "1 day, 18:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 17941, "loss": 1.5107, "learning_rate": 5.466666666666666e-05, "epoch": 0.009141073518755921, "percentage": 0.91, "elapsed_time": "0:23:14", "remaining_time": "1 day, 18:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 17941, "loss": 2.1324, "learning_rate": 5.500000000000001e-05, "epoch": 0.009196811771919068, "percentage": 0.92, "elapsed_time": "0:23:23", "remaining_time": "1 day, 17:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 17941, "loss": 1.7378, "learning_rate": 5.5333333333333334e-05, "epoch": 0.009252550025082214, "percentage": 0.93, "elapsed_time": "0:23:31", "remaining_time": "1 day, 17:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 167, "total_steps": 17941, "loss": 1.7654, "learning_rate": 5.566666666666667e-05, "epoch": 0.00930828827824536, "percentage": 0.93, "elapsed_time": "0:23:40", "remaining_time": "1 day, 17:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 17941, "loss": 1.8091, "learning_rate": 5.6000000000000006e-05, "epoch": 0.009364026531408505, "percentage": 0.94, "elapsed_time": "0:23:48", "remaining_time": "1 day, 17:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 169, "total_steps": 17941, "loss": 1.6823, "learning_rate": 5.633333333333334e-05, "epoch": 0.009419764784571651, "percentage": 0.94, "elapsed_time": "0:23:57", "remaining_time": "1 day, 17:59:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 17941, "loss": 1.7736, "learning_rate": 5.666666666666667e-05, "epoch": 0.009475503037734798, "percentage": 0.95, "elapsed_time": "0:24:05", "remaining_time": "1 day, 17:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 171, "total_steps": 17941, "loss": 2.0331, "learning_rate": 5.6999999999999996e-05, "epoch": 0.009531241290897944, "percentage": 0.95, "elapsed_time": "0:24:14", "remaining_time": "1 day, 17:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 17941, "loss": 1.8546, "learning_rate": 5.7333333333333336e-05, "epoch": 0.009586979544061089, "percentage": 0.96, "elapsed_time": "0:24:23", "remaining_time": "1 day, 17:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 173, "total_steps": 17941, "loss": 2.0427, "learning_rate": 5.766666666666667e-05, "epoch": 0.009642717797224235, "percentage": 0.96, "elapsed_time": "0:24:31", "remaining_time": "1 day, 17:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 17941, "loss": 1.7323, "learning_rate": 5.8e-05, "epoch": 0.009698456050387381, "percentage": 0.97, "elapsed_time": "0:24:40", "remaining_time": "1 day, 17:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 17941, "loss": 2.2, "learning_rate": 5.833333333333334e-05, "epoch": 0.009754194303550527, "percentage": 0.98, "elapsed_time": "0:24:48", "remaining_time": "1 day, 17:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 17941, "loss": 1.5879, "learning_rate": 5.866666666666667e-05, "epoch": 0.009809932556713672, "percentage": 0.98, "elapsed_time": "0:24:56", "remaining_time": "1 day, 17:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 177, "total_steps": 17941, "loss": 1.6043, "learning_rate": 5.9e-05, "epoch": 0.009865670809876818, "percentage": 0.99, "elapsed_time": "0:25:06", "remaining_time": "1 day, 17:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 17941, "loss": 1.8772, "learning_rate": 5.9333333333333343e-05, "epoch": 0.009921409063039965, "percentage": 0.99, "elapsed_time": "0:25:14", "remaining_time": "1 day, 17:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 179, "total_steps": 17941, "loss": 1.7887, "learning_rate": 5.966666666666667e-05, "epoch": 0.009977147316203111, "percentage": 1.0, "elapsed_time": "0:25:22", "remaining_time": "1 day, 17:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 17941, "loss": 1.7228, "learning_rate": 6e-05, "epoch": 0.010032885569366256, "percentage": 1.0, "elapsed_time": "0:25:31", "remaining_time": "1 day, 17:58:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 181, "total_steps": 17941, "loss": 1.7767, "learning_rate": 6.033333333333334e-05, "epoch": 0.010088623822529402, "percentage": 1.01, "elapsed_time": "0:25:39", "remaining_time": "1 day, 17:58:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 17941, "loss": 2.002, "learning_rate": 6.066666666666667e-05, "epoch": 0.010144362075692548, "percentage": 1.01, "elapsed_time": "0:25:48", "remaining_time": "1 day, 17:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 183, "total_steps": 17941, "loss": 1.7755, "learning_rate": 6.1e-05, "epoch": 0.010200100328855693, "percentage": 1.02, "elapsed_time": "0:25:56", "remaining_time": "1 day, 17:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 17941, "loss": 1.7244, "learning_rate": 6.133333333333334e-05, "epoch": 0.01025583858201884, "percentage": 1.03, "elapsed_time": "0:26:05", "remaining_time": "1 day, 17:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 17941, "loss": 1.8041, "learning_rate": 6.166666666666667e-05, "epoch": 0.010311576835181985, "percentage": 1.03, "elapsed_time": "0:26:13", "remaining_time": "1 day, 17:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 17941, "loss": 1.7813, "learning_rate": 6.2e-05, "epoch": 0.010367315088345132, "percentage": 1.04, "elapsed_time": "0:26:22", "remaining_time": "1 day, 17:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 187, "total_steps": 17941, "loss": 1.9419, "learning_rate": 6.233333333333334e-05, "epoch": 0.010423053341508276, "percentage": 1.04, "elapsed_time": "0:26:30", "remaining_time": "1 day, 17:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 17941, "loss": 1.6804, "learning_rate": 6.266666666666667e-05, "epoch": 0.010478791594671423, "percentage": 1.05, "elapsed_time": "0:26:39", "remaining_time": "1 day, 17:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 189, "total_steps": 17941, "loss": 1.8406, "learning_rate": 6.3e-05, "epoch": 0.010534529847834569, "percentage": 1.05, "elapsed_time": "0:26:47", "remaining_time": "1 day, 17:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 17941, "loss": 1.9451, "learning_rate": 6.333333333333333e-05, "epoch": 0.010590268100997715, "percentage": 1.06, "elapsed_time": "0:26:55", "remaining_time": "1 day, 17:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 191, "total_steps": 17941, "loss": 1.7783, "learning_rate": 6.366666666666668e-05, "epoch": 0.01064600635416086, "percentage": 1.06, "elapsed_time": "0:27:04", "remaining_time": "1 day, 17:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 17941, "loss": 1.8944, "learning_rate": 6.400000000000001e-05, "epoch": 0.010701744607324006, "percentage": 1.07, "elapsed_time": "0:27:12", "remaining_time": "1 day, 17:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 193, "total_steps": 17941, "loss": 1.8799, "learning_rate": 6.433333333333333e-05, "epoch": 0.010757482860487153, "percentage": 1.08, "elapsed_time": "0:27:21", "remaining_time": "1 day, 17:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 17941, "loss": 1.8651, "learning_rate": 6.466666666666666e-05, "epoch": 0.010813221113650299, "percentage": 1.08, "elapsed_time": "0:27:29", "remaining_time": "1 day, 17:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 17941, "loss": 1.6938, "learning_rate": 6.500000000000001e-05, "epoch": 0.010868959366813443, "percentage": 1.09, "elapsed_time": "0:27:38", "remaining_time": "1 day, 17:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 17941, "loss": 1.756, "learning_rate": 6.533333333333334e-05, "epoch": 0.01092469761997659, "percentage": 1.09, "elapsed_time": "0:27:46", "remaining_time": "1 day, 17:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 197, "total_steps": 17941, "loss": 1.8388, "learning_rate": 6.566666666666666e-05, "epoch": 0.010980435873139736, "percentage": 1.1, "elapsed_time": "0:27:55", "remaining_time": "1 day, 17:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 17941, "loss": 2.0311, "learning_rate": 6.6e-05, "epoch": 0.011036174126302882, "percentage": 1.1, "elapsed_time": "0:28:04", "remaining_time": "1 day, 17:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 199, "total_steps": 17941, "loss": 2.0285, "learning_rate": 6.633333333333334e-05, "epoch": 0.011091912379466027, "percentage": 1.11, "elapsed_time": "0:28:12", "remaining_time": "1 day, 17:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 17941, "loss": 1.7062, "learning_rate": 6.666666666666667e-05, "epoch": 0.011147650632629173, "percentage": 1.11, "elapsed_time": "0:28:21", "remaining_time": "1 day, 17:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 201, "total_steps": 17941, "loss": 1.916, "learning_rate": 6.7e-05, "epoch": 0.01120338888579232, "percentage": 1.12, "elapsed_time": "0:28:29", "remaining_time": "1 day, 17:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 17941, "loss": 1.9394, "learning_rate": 6.733333333333333e-05, "epoch": 0.011259127138955466, "percentage": 1.13, "elapsed_time": "0:28:38", "remaining_time": "1 day, 17:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 203, "total_steps": 17941, "loss": 2.248, "learning_rate": 6.766666666666667e-05, "epoch": 0.01131486539211861, "percentage": 1.13, "elapsed_time": "0:28:46", "remaining_time": "1 day, 17:55:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 17941, "loss": 1.835, "learning_rate": 6.800000000000001e-05, "epoch": 0.011370603645281757, "percentage": 1.14, "elapsed_time": "0:28:55", "remaining_time": "1 day, 17:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 17941, "loss": 1.7373, "learning_rate": 6.833333333333333e-05, "epoch": 0.011426341898444903, "percentage": 1.14, "elapsed_time": "0:29:03", "remaining_time": "1 day, 17:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 17941, "loss": 2.1801, "learning_rate": 6.866666666666666e-05, "epoch": 0.01148208015160805, "percentage": 1.15, "elapsed_time": "0:29:12", "remaining_time": "1 day, 17:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 207, "total_steps": 17941, "loss": 1.7873, "learning_rate": 6.9e-05, "epoch": 0.011537818404771194, "percentage": 1.15, "elapsed_time": "0:29:20", "remaining_time": "1 day, 17:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 17941, "loss": 1.9491, "learning_rate": 6.933333333333334e-05, "epoch": 0.01159355665793434, "percentage": 1.16, "elapsed_time": "0:29:29", "remaining_time": "1 day, 17:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 209, "total_steps": 17941, "loss": 1.7532, "learning_rate": 6.966666666666668e-05, "epoch": 0.011649294911097487, "percentage": 1.16, "elapsed_time": "0:29:37", "remaining_time": "1 day, 17:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 17941, "loss": 1.7694, "learning_rate": 7e-05, "epoch": 0.011705033164260631, "percentage": 1.17, "elapsed_time": "0:29:46", "remaining_time": "1 day, 17:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 211, "total_steps": 17941, "loss": 2.2063, "learning_rate": 7.033333333333334e-05, "epoch": 0.011760771417423778, "percentage": 1.18, "elapsed_time": "0:29:54", "remaining_time": "1 day, 17:53:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 17941, "loss": 1.8842, "learning_rate": 7.066666666666667e-05, "epoch": 0.011816509670586924, "percentage": 1.18, "elapsed_time": "0:30:03", "remaining_time": "1 day, 17:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 213, "total_steps": 17941, "loss": 1.7411, "learning_rate": 7.1e-05, "epoch": 0.01187224792375007, "percentage": 1.19, "elapsed_time": "0:30:11", "remaining_time": "1 day, 17:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 17941, "loss": 1.8457, "learning_rate": 7.133333333333334e-05, "epoch": 0.011927986176913215, "percentage": 1.19, "elapsed_time": "0:30:20", "remaining_time": "1 day, 17:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 17941, "loss": 1.8425, "learning_rate": 7.166666666666667e-05, "epoch": 0.011983724430076361, "percentage": 1.2, "elapsed_time": "0:30:28", "remaining_time": "1 day, 17:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 17941, "loss": 1.9535, "learning_rate": 7.2e-05, "epoch": 0.012039462683239507, "percentage": 1.2, "elapsed_time": "0:30:37", "remaining_time": "1 day, 17:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 217, "total_steps": 17941, "loss": 1.8465, "learning_rate": 7.233333333333335e-05, "epoch": 0.012095200936402654, "percentage": 1.21, "elapsed_time": "0:30:45", "remaining_time": "1 day, 17:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 17941, "loss": 2.1711, "learning_rate": 7.266666666666667e-05, "epoch": 0.012150939189565798, "percentage": 1.22, "elapsed_time": "0:30:54", "remaining_time": "1 day, 17:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 219, "total_steps": 17941, "loss": 1.7793, "learning_rate": 7.3e-05, "epoch": 0.012206677442728945, "percentage": 1.22, "elapsed_time": "0:31:02", "remaining_time": "1 day, 17:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 17941, "loss": 1.9454, "learning_rate": 7.333333333333333e-05, "epoch": 0.012262415695892091, "percentage": 1.23, "elapsed_time": "0:31:11", "remaining_time": "1 day, 17:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 221, "total_steps": 17941, "loss": 1.8544, "learning_rate": 7.366666666666668e-05, "epoch": 0.012318153949055237, "percentage": 1.23, "elapsed_time": "0:31:19", "remaining_time": "1 day, 17:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 17941, "loss": 1.8335, "learning_rate": 7.4e-05, "epoch": 0.012373892202218382, "percentage": 1.24, "elapsed_time": "0:31:28", "remaining_time": "1 day, 17:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 223, "total_steps": 17941, "loss": 1.6647, "learning_rate": 7.433333333333333e-05, "epoch": 0.012429630455381528, "percentage": 1.24, "elapsed_time": "0:31:36", "remaining_time": "1 day, 17:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 17941, "loss": 1.9092, "learning_rate": 7.466666666666667e-05, "epoch": 0.012485368708544674, "percentage": 1.25, "elapsed_time": "0:31:45", "remaining_time": "1 day, 17:51:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 17941, "loss": 1.7344, "learning_rate": 7.500000000000001e-05, "epoch": 0.01254110696170782, "percentage": 1.25, "elapsed_time": "0:31:53", "remaining_time": "1 day, 17:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 17941, "loss": 1.6805, "learning_rate": 7.533333333333334e-05, "epoch": 0.012596845214870965, "percentage": 1.26, "elapsed_time": "0:32:02", "remaining_time": "1 day, 17:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 227, "total_steps": 17941, "loss": 1.6711, "learning_rate": 7.566666666666667e-05, "epoch": 0.012652583468034112, "percentage": 1.27, "elapsed_time": "0:32:10", "remaining_time": "1 day, 17:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 17941, "loss": 1.9194, "learning_rate": 7.6e-05, "epoch": 0.012708321721197258, "percentage": 1.27, "elapsed_time": "0:32:19", "remaining_time": "1 day, 17:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 229, "total_steps": 17941, "loss": 1.9374, "learning_rate": 7.633333333333334e-05, "epoch": 0.012764059974360404, "percentage": 1.28, "elapsed_time": "0:32:28", "remaining_time": "1 day, 17:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 17941, "loss": 1.605, "learning_rate": 7.666666666666667e-05, "epoch": 0.012819798227523549, "percentage": 1.28, "elapsed_time": "0:32:36", "remaining_time": "1 day, 17:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 231, "total_steps": 17941, "loss": 1.804, "learning_rate": 7.7e-05, "epoch": 0.012875536480686695, "percentage": 1.29, "elapsed_time": "0:32:45", "remaining_time": "1 day, 17:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 17941, "loss": 1.796, "learning_rate": 7.733333333333333e-05, "epoch": 0.012931274733849842, "percentage": 1.29, "elapsed_time": "0:32:53", "remaining_time": "1 day, 17:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 233, "total_steps": 17941, "loss": 1.704, "learning_rate": 7.766666666666667e-05, "epoch": 0.012987012987012988, "percentage": 1.3, "elapsed_time": "0:33:02", "remaining_time": "1 day, 17:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 17941, "loss": 2.0598, "learning_rate": 7.800000000000001e-05, "epoch": 0.013042751240176132, "percentage": 1.3, "elapsed_time": "0:33:10", "remaining_time": "1 day, 17:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 17941, "loss": 1.9391, "learning_rate": 7.833333333333333e-05, "epoch": 0.013098489493339279, "percentage": 1.31, "elapsed_time": "0:33:19", "remaining_time": "1 day, 17:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 17941, "loss": 1.851, "learning_rate": 7.866666666666666e-05, "epoch": 0.013154227746502425, "percentage": 1.32, "elapsed_time": "0:33:27", "remaining_time": "1 day, 17:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 237, "total_steps": 17941, "loss": 1.9757, "learning_rate": 7.900000000000001e-05, "epoch": 0.01320996599966557, "percentage": 1.32, "elapsed_time": "0:33:36", "remaining_time": "1 day, 17:50:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 17941, "loss": 2.2063, "learning_rate": 7.933333333333334e-05, "epoch": 0.013265704252828716, "percentage": 1.33, "elapsed_time": "0:33:45", "remaining_time": "1 day, 17:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 239, "total_steps": 17941, "loss": 1.8813, "learning_rate": 7.966666666666666e-05, "epoch": 0.013321442505991862, "percentage": 1.33, "elapsed_time": "0:33:53", "remaining_time": "1 day, 17:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 17941, "loss": 1.928, "learning_rate": 8e-05, "epoch": 0.013377180759155009, "percentage": 1.34, "elapsed_time": "0:34:02", "remaining_time": "1 day, 17:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 241, "total_steps": 17941, "loss": 1.5582, "learning_rate": 8.033333333333334e-05, "epoch": 0.013432919012318153, "percentage": 1.34, "elapsed_time": "0:34:10", "remaining_time": "1 day, 17:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 17941, "loss": 2.1044, "learning_rate": 8.066666666666667e-05, "epoch": 0.0134886572654813, "percentage": 1.35, "elapsed_time": "0:34:19", "remaining_time": "1 day, 17:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 243, "total_steps": 17941, "loss": 1.7521, "learning_rate": 8.1e-05, "epoch": 0.013544395518644446, "percentage": 1.35, "elapsed_time": "0:34:27", "remaining_time": "1 day, 17:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 17941, "loss": 1.9605, "learning_rate": 8.133333333333334e-05, "epoch": 0.013600133771807592, "percentage": 1.36, "elapsed_time": "0:34:36", "remaining_time": "1 day, 17:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 17941, "loss": 1.8198, "learning_rate": 8.166666666666667e-05, "epoch": 0.013655872024970737, "percentage": 1.37, "elapsed_time": "0:34:44", "remaining_time": "1 day, 17:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 17941, "loss": 2.0001, "learning_rate": 8.2e-05, "epoch": 0.013711610278133883, "percentage": 1.37, "elapsed_time": "0:34:53", "remaining_time": "1 day, 17:49:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 247, "total_steps": 17941, "loss": 1.9317, "learning_rate": 8.233333333333333e-05, "epoch": 0.01376734853129703, "percentage": 1.38, "elapsed_time": "0:35:01", "remaining_time": "1 day, 17:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 17941, "loss": 1.7716, "learning_rate": 8.266666666666667e-05, "epoch": 0.013823086784460176, "percentage": 1.38, "elapsed_time": "0:35:10", "remaining_time": "1 day, 17:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 249, "total_steps": 17941, "loss": 1.82, "learning_rate": 8.3e-05, "epoch": 0.01387882503762332, "percentage": 1.39, "elapsed_time": "0:35:18", "remaining_time": "1 day, 17:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 17941, "loss": 1.8309, "learning_rate": 8.333333333333334e-05, "epoch": 0.013934563290786467, "percentage": 1.39, "elapsed_time": "0:35:27", "remaining_time": "1 day, 17:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 251, "total_steps": 17941, "loss": 1.682, "learning_rate": 8.366666666666668e-05, "epoch": 0.013990301543949613, "percentage": 1.4, "elapsed_time": "0:35:36", "remaining_time": "1 day, 17:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 17941, "loss": 2.001, "learning_rate": 8.4e-05, "epoch": 0.01404603979711276, "percentage": 1.4, "elapsed_time": "0:35:44", "remaining_time": "1 day, 17:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 253, "total_steps": 17941, "loss": 1.7766, "learning_rate": 8.433333333333334e-05, "epoch": 0.014101778050275904, "percentage": 1.41, "elapsed_time": "0:35:52", "remaining_time": "1 day, 17:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 17941, "loss": 1.6948, "learning_rate": 8.466666666666667e-05, "epoch": 0.01415751630343905, "percentage": 1.42, "elapsed_time": "0:36:01", "remaining_time": "1 day, 17:48:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 17941, "loss": 1.8978, "learning_rate": 8.5e-05, "epoch": 0.014213254556602196, "percentage": 1.42, "elapsed_time": "0:36:09", "remaining_time": "1 day, 17:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 17941, "loss": 1.7381, "learning_rate": 8.533333333333334e-05, "epoch": 0.014268992809765343, "percentage": 1.43, "elapsed_time": "0:36:18", "remaining_time": "1 day, 17:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 257, "total_steps": 17941, "loss": 1.7016, "learning_rate": 8.566666666666667e-05, "epoch": 0.014324731062928487, "percentage": 1.43, "elapsed_time": "0:36:26", "remaining_time": "1 day, 17:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 17941, "loss": 1.8649, "learning_rate": 8.6e-05, "epoch": 0.014380469316091634, "percentage": 1.44, "elapsed_time": "0:36:35", "remaining_time": "1 day, 17:47:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 259, "total_steps": 17941, "loss": 1.7844, "learning_rate": 8.633333333333334e-05, "epoch": 0.01443620756925478, "percentage": 1.44, "elapsed_time": "0:36:43", "remaining_time": "1 day, 17:47:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 17941, "loss": 2.0572, "learning_rate": 8.666666666666667e-05, "epoch": 0.014491945822417925, "percentage": 1.45, "elapsed_time": "0:36:52", "remaining_time": "1 day, 17:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 261, "total_steps": 17941, "loss": 1.8073, "learning_rate": 8.7e-05, "epoch": 0.014547684075581071, "percentage": 1.45, "elapsed_time": "0:37:01", "remaining_time": "1 day, 17:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 17941, "loss": 1.9706, "learning_rate": 8.733333333333333e-05, "epoch": 0.014603422328744217, "percentage": 1.46, "elapsed_time": "0:37:10", "remaining_time": "1 day, 17:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 263, "total_steps": 17941, "loss": 1.7742, "learning_rate": 8.766666666666668e-05, "epoch": 0.014659160581907364, "percentage": 1.47, "elapsed_time": "0:37:18", "remaining_time": "1 day, 17:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 17941, "loss": 1.6763, "learning_rate": 8.800000000000001e-05, "epoch": 0.014714898835070508, "percentage": 1.47, "elapsed_time": "0:37:26", "remaining_time": "1 day, 17:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 17941, "loss": 1.5731, "learning_rate": 8.833333333333333e-05, "epoch": 0.014770637088233654, "percentage": 1.48, "elapsed_time": "0:37:35", "remaining_time": "1 day, 17:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 17941, "loss": 1.9837, "learning_rate": 8.866666666666668e-05, "epoch": 0.0148263753413968, "percentage": 1.48, "elapsed_time": "0:37:43", "remaining_time": "1 day, 17:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 267, "total_steps": 17941, "loss": 1.8844, "learning_rate": 8.900000000000001e-05, "epoch": 0.014882113594559947, "percentage": 1.49, "elapsed_time": "0:37:52", "remaining_time": "1 day, 17:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 17941, "loss": 1.9141, "learning_rate": 8.933333333333334e-05, "epoch": 0.014937851847723092, "percentage": 1.49, "elapsed_time": "0:38:01", "remaining_time": "1 day, 17:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 269, "total_steps": 17941, "loss": 2.1101, "learning_rate": 8.966666666666666e-05, "epoch": 0.014993590100886238, "percentage": 1.5, "elapsed_time": "0:38:09", "remaining_time": "1 day, 17:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 17941, "loss": 1.8388, "learning_rate": 9e-05, "epoch": 0.015049328354049384, "percentage": 1.5, "elapsed_time": "0:38:18", "remaining_time": "1 day, 17:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 271, "total_steps": 17941, "loss": 1.8648, "learning_rate": 9.033333333333334e-05, "epoch": 0.01510506660721253, "percentage": 1.51, "elapsed_time": "0:38:26", "remaining_time": "1 day, 17:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 17941, "loss": 1.7059, "learning_rate": 9.066666666666667e-05, "epoch": 0.015160804860375675, "percentage": 1.52, "elapsed_time": "0:38:34", "remaining_time": "1 day, 17:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 273, "total_steps": 17941, "loss": 1.8659, "learning_rate": 9.1e-05, "epoch": 0.015216543113538821, "percentage": 1.52, "elapsed_time": "0:38:43", "remaining_time": "1 day, 17:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 17941, "loss": 1.6187, "learning_rate": 9.133333333333334e-05, "epoch": 0.015272281366701968, "percentage": 1.53, "elapsed_time": "0:38:51", "remaining_time": "1 day, 17:45:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 17941, "loss": 1.8554, "learning_rate": 9.166666666666667e-05, "epoch": 0.015328019619865114, "percentage": 1.53, "elapsed_time": "0:39:00", "remaining_time": "1 day, 17:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 17941, "loss": 1.8108, "learning_rate": 9.200000000000001e-05, "epoch": 0.015383757873028259, "percentage": 1.54, "elapsed_time": "0:39:08", "remaining_time": "1 day, 17:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 277, "total_steps": 17941, "loss": 1.7369, "learning_rate": 9.233333333333333e-05, "epoch": 0.015439496126191405, "percentage": 1.54, "elapsed_time": "0:39:17", "remaining_time": "1 day, 17:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 17941, "loss": 1.7879, "learning_rate": 9.266666666666666e-05, "epoch": 0.015495234379354551, "percentage": 1.55, "elapsed_time": "0:39:25", "remaining_time": "1 day, 17:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 279, "total_steps": 17941, "loss": 1.8687, "learning_rate": 9.300000000000001e-05, "epoch": 0.015550972632517698, "percentage": 1.56, "elapsed_time": "0:39:34", "remaining_time": "1 day, 17:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 17941, "loss": 2.0486, "learning_rate": 9.333333333333334e-05, "epoch": 0.015606710885680842, "percentage": 1.56, "elapsed_time": "0:39:42", "remaining_time": "1 day, 17:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 281, "total_steps": 17941, "loss": 1.8764, "learning_rate": 9.366666666666668e-05, "epoch": 0.01566244913884399, "percentage": 1.57, "elapsed_time": "0:39:51", "remaining_time": "1 day, 17:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 17941, "loss": 1.8098, "learning_rate": 9.4e-05, "epoch": 0.015718187392007133, "percentage": 1.57, "elapsed_time": "0:39:59", "remaining_time": "1 day, 17:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 283, "total_steps": 17941, "loss": 1.8023, "learning_rate": 9.433333333333334e-05, "epoch": 0.01577392564517028, "percentage": 1.58, "elapsed_time": "0:40:08", "remaining_time": "1 day, 17:44:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 17941, "loss": 1.9003, "learning_rate": 9.466666666666667e-05, "epoch": 0.015829663898333426, "percentage": 1.58, "elapsed_time": "0:40:16", "remaining_time": "1 day, 17:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 17941, "loss": 1.6793, "learning_rate": 9.5e-05, "epoch": 0.015885402151496572, "percentage": 1.59, "elapsed_time": "0:40:25", "remaining_time": "1 day, 17:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 17941, "loss": 1.7691, "learning_rate": 9.533333333333334e-05, "epoch": 0.01594114040465972, "percentage": 1.59, "elapsed_time": "0:40:33", "remaining_time": "1 day, 17:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 287, "total_steps": 17941, "loss": 1.8312, "learning_rate": 9.566666666666667e-05, "epoch": 0.015996878657822865, "percentage": 1.6, "elapsed_time": "0:40:42", "remaining_time": "1 day, 17:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 17941, "loss": 1.9652, "learning_rate": 9.6e-05, "epoch": 0.01605261691098601, "percentage": 1.61, "elapsed_time": "0:40:50", "remaining_time": "1 day, 17:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 289, "total_steps": 17941, "loss": 1.8264, "learning_rate": 9.633333333333335e-05, "epoch": 0.016108355164149154, "percentage": 1.61, "elapsed_time": "0:40:58", "remaining_time": "1 day, 17:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 17941, "loss": 1.9074, "learning_rate": 9.666666666666667e-05, "epoch": 0.0161640934173123, "percentage": 1.62, "elapsed_time": "0:41:07", "remaining_time": "1 day, 17:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 291, "total_steps": 17941, "loss": 1.9993, "learning_rate": 9.7e-05, "epoch": 0.016219831670475447, "percentage": 1.62, "elapsed_time": "0:41:15", "remaining_time": "1 day, 17:42:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 17941, "loss": 1.6385, "learning_rate": 9.733333333333335e-05, "epoch": 0.016275569923638593, "percentage": 1.63, "elapsed_time": "0:41:24", "remaining_time": "1 day, 17:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 293, "total_steps": 17941, "loss": 1.8513, "learning_rate": 9.766666666666668e-05, "epoch": 0.01633130817680174, "percentage": 1.63, "elapsed_time": "0:41:32", "remaining_time": "1 day, 17:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 17941, "loss": 1.7628, "learning_rate": 9.8e-05, "epoch": 0.016387046429964885, "percentage": 1.64, "elapsed_time": "0:41:41", "remaining_time": "1 day, 17:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 17941, "loss": 1.8406, "learning_rate": 9.833333333333333e-05, "epoch": 0.016442784683128032, "percentage": 1.64, "elapsed_time": "0:41:49", "remaining_time": "1 day, 17:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 17941, "loss": 1.9504, "learning_rate": 9.866666666666668e-05, "epoch": 0.016498522936291178, "percentage": 1.65, "elapsed_time": "0:41:59", "remaining_time": "1 day, 17:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 297, "total_steps": 17941, "loss": 1.9845, "learning_rate": 9.900000000000001e-05, "epoch": 0.01655426118945432, "percentage": 1.66, "elapsed_time": "0:42:07", "remaining_time": "1 day, 17:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 17941, "loss": 1.8234, "learning_rate": 9.933333333333334e-05, "epoch": 0.016609999442617467, "percentage": 1.66, "elapsed_time": "0:42:15", "remaining_time": "1 day, 17:42:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 299, "total_steps": 17941, "loss": 1.6132, "learning_rate": 9.966666666666667e-05, "epoch": 0.016665737695780614, "percentage": 1.67, "elapsed_time": "0:42:24", "remaining_time": "1 day, 17:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 17941, "loss": 2.0395, "learning_rate": 0.0001, "epoch": 0.01672147594894376, "percentage": 1.67, "elapsed_time": "0:42:32", "remaining_time": "1 day, 17:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 301, "total_steps": 17941, "loss": 1.6945, "learning_rate": 9.999999920714576e-05, "epoch": 0.016777214202106906, "percentage": 1.68, "elapsed_time": "0:42:41", "remaining_time": "1 day, 17:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 17941, "loss": 1.6877, "learning_rate": 9.999999682858307e-05, "epoch": 0.016832952455270053, "percentage": 1.68, "elapsed_time": "0:42:49", "remaining_time": "1 day, 17:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 303, "total_steps": 17941, "loss": 1.6779, "learning_rate": 9.9999992864312e-05, "epoch": 0.0168886907084332, "percentage": 1.69, "elapsed_time": "0:42:58", "remaining_time": "1 day, 17:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 17941, "loss": 1.64, "learning_rate": 9.999998731433267e-05, "epoch": 0.016944428961596345, "percentage": 1.69, "elapsed_time": "0:43:06", "remaining_time": "1 day, 17:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 17941, "loss": 1.66, "learning_rate": 9.999998017864527e-05, "epoch": 0.017000167214759488, "percentage": 1.7, "elapsed_time": "0:43:15", "remaining_time": "1 day, 17:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 17941, "loss": 1.8884, "learning_rate": 9.999997145725001e-05, "epoch": 0.017055905467922634, "percentage": 1.71, "elapsed_time": "0:43:24", "remaining_time": "1 day, 17:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 307, "total_steps": 17941, "loss": 1.6844, "learning_rate": 9.999996115014719e-05, "epoch": 0.01711164372108578, "percentage": 1.71, "elapsed_time": "0:43:32", "remaining_time": "1 day, 17:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 17941, "loss": 1.7733, "learning_rate": 9.99999492573371e-05, "epoch": 0.017167381974248927, "percentage": 1.72, "elapsed_time": "0:43:41", "remaining_time": "1 day, 17:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 309, "total_steps": 17941, "loss": 1.6295, "learning_rate": 9.999993577882016e-05, "epoch": 0.017223120227412073, "percentage": 1.72, "elapsed_time": "0:43:49", "remaining_time": "1 day, 17:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 17941, "loss": 1.6118, "learning_rate": 9.999992071459676e-05, "epoch": 0.01727885848057522, "percentage": 1.73, "elapsed_time": "0:43:57", "remaining_time": "1 day, 17:40:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 311, "total_steps": 17941, "loss": 1.594, "learning_rate": 9.999990406466741e-05, "epoch": 0.017334596733738366, "percentage": 1.73, "elapsed_time": "0:44:06", "remaining_time": "1 day, 17:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 17941, "loss": 1.6829, "learning_rate": 9.999988582903262e-05, "epoch": 0.01739033498690151, "percentage": 1.74, "elapsed_time": "0:44:14", "remaining_time": "1 day, 17:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 313, "total_steps": 17941, "loss": 1.662, "learning_rate": 9.999986600769295e-05, "epoch": 0.017446073240064655, "percentage": 1.74, "elapsed_time": "0:44:23", "remaining_time": "1 day, 17:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 17941, "loss": 1.7087, "learning_rate": 9.999984460064908e-05, "epoch": 0.0175018114932278, "percentage": 1.75, "elapsed_time": "0:44:31", "remaining_time": "1 day, 17:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 17941, "loss": 1.8628, "learning_rate": 9.999982160790164e-05, "epoch": 0.017557549746390948, "percentage": 1.76, "elapsed_time": "0:44:40", "remaining_time": "1 day, 17:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 17941, "loss": 2.143, "learning_rate": 9.999979702945138e-05, "epoch": 0.017613287999554094, "percentage": 1.76, "elapsed_time": "0:44:48", "remaining_time": "1 day, 17:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 317, "total_steps": 17941, "loss": 1.6862, "learning_rate": 9.999977086529909e-05, "epoch": 0.01766902625271724, "percentage": 1.77, "elapsed_time": "0:44:57", "remaining_time": "1 day, 17:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 17941, "loss": 1.8495, "learning_rate": 9.999974311544556e-05, "epoch": 0.017724764505880387, "percentage": 1.77, "elapsed_time": "0:45:05", "remaining_time": "1 day, 17:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 319, "total_steps": 17941, "loss": 1.9501, "learning_rate": 9.999971377989172e-05, "epoch": 0.017780502759043533, "percentage": 1.78, "elapsed_time": "0:45:14", "remaining_time": "1 day, 17:38:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 17941, "loss": 1.981, "learning_rate": 9.999968285863848e-05, "epoch": 0.017836241012206676, "percentage": 1.78, "elapsed_time": "0:45:22", "remaining_time": "1 day, 17:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 321, "total_steps": 17941, "loss": 1.9126, "learning_rate": 9.99996503516868e-05, "epoch": 0.017891979265369822, "percentage": 1.79, "elapsed_time": "0:45:30", "remaining_time": "1 day, 17:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 17941, "loss": 1.7568, "learning_rate": 9.999961625903774e-05, "epoch": 0.01794771751853297, "percentage": 1.79, "elapsed_time": "0:45:39", "remaining_time": "1 day, 17:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 323, "total_steps": 17941, "loss": 1.9625, "learning_rate": 9.999958058069237e-05, "epoch": 0.018003455771696115, "percentage": 1.8, "elapsed_time": "0:45:47", "remaining_time": "1 day, 17:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 17941, "loss": 1.6326, "learning_rate": 9.999954331665182e-05, "epoch": 0.01805919402485926, "percentage": 1.81, "elapsed_time": "0:45:56", "remaining_time": "1 day, 17:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 17941, "loss": 1.8484, "learning_rate": 9.999950446691728e-05, "epoch": 0.018114932278022407, "percentage": 1.81, "elapsed_time": "0:46:04", "remaining_time": "1 day, 17:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 17941, "loss": 1.8855, "learning_rate": 9.999946403148997e-05, "epoch": 0.018170670531185554, "percentage": 1.82, "elapsed_time": "0:46:13", "remaining_time": "1 day, 17:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 327, "total_steps": 17941, "loss": 1.8222, "learning_rate": 9.999942201037118e-05, "epoch": 0.0182264087843487, "percentage": 1.82, "elapsed_time": "0:46:21", "remaining_time": "1 day, 17:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 17941, "loss": 1.4395, "learning_rate": 9.999937840356224e-05, "epoch": 0.018282147037511843, "percentage": 1.83, "elapsed_time": "0:46:30", "remaining_time": "1 day, 17:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 329, "total_steps": 17941, "loss": 1.7122, "learning_rate": 9.999933321106452e-05, "epoch": 0.01833788529067499, "percentage": 1.83, "elapsed_time": "0:46:38", "remaining_time": "1 day, 17:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 17941, "loss": 1.8863, "learning_rate": 9.999928643287948e-05, "epoch": 0.018393623543838136, "percentage": 1.84, "elapsed_time": "0:46:47", "remaining_time": "1 day, 17:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 331, "total_steps": 17941, "loss": 1.8184, "learning_rate": 9.999923806900859e-05, "epoch": 0.018449361797001282, "percentage": 1.84, "elapsed_time": "0:46:56", "remaining_time": "1 day, 17:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 17941, "loss": 1.843, "learning_rate": 9.99991881194534e-05, "epoch": 0.018505100050164428, "percentage": 1.85, "elapsed_time": "0:47:04", "remaining_time": "1 day, 17:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 333, "total_steps": 17941, "loss": 1.7728, "learning_rate": 9.999913658421544e-05, "epoch": 0.018560838303327575, "percentage": 1.86, "elapsed_time": "0:47:13", "remaining_time": "1 day, 17:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 17941, "loss": 1.9225, "learning_rate": 9.999908346329642e-05, "epoch": 0.01861657655649072, "percentage": 1.86, "elapsed_time": "0:47:21", "remaining_time": "1 day, 17:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 17941, "loss": 1.7579, "learning_rate": 9.999902875669797e-05, "epoch": 0.018672314809653867, "percentage": 1.87, "elapsed_time": "0:47:30", "remaining_time": "1 day, 17:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 17941, "loss": 1.8859, "learning_rate": 9.999897246442184e-05, "epoch": 0.01872805306281701, "percentage": 1.87, "elapsed_time": "0:47:38", "remaining_time": "1 day, 17:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 337, "total_steps": 17941, "loss": 1.6809, "learning_rate": 9.999891458646983e-05, "epoch": 0.018783791315980156, "percentage": 1.88, "elapsed_time": "0:47:46", "remaining_time": "1 day, 17:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 17941, "loss": 1.7961, "learning_rate": 9.999885512284375e-05, "epoch": 0.018839529569143303, "percentage": 1.88, "elapsed_time": "0:47:55", "remaining_time": "1 day, 17:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 339, "total_steps": 17941, "loss": 1.6943, "learning_rate": 9.999879407354551e-05, "epoch": 0.01889526782230645, "percentage": 1.89, "elapsed_time": "0:48:03", "remaining_time": "1 day, 17:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 17941, "loss": 1.7652, "learning_rate": 9.999873143857704e-05, "epoch": 0.018951006075469595, "percentage": 1.9, "elapsed_time": "0:48:13", "remaining_time": "1 day, 17:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 341, "total_steps": 17941, "loss": 1.7483, "learning_rate": 9.99986672179403e-05, "epoch": 0.01900674432863274, "percentage": 1.9, "elapsed_time": "0:48:22", "remaining_time": "1 day, 17:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 17941, "loss": 1.8883, "learning_rate": 9.999860141163736e-05, "epoch": 0.019062482581795888, "percentage": 1.91, "elapsed_time": "0:48:30", "remaining_time": "1 day, 17:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 343, "total_steps": 17941, "loss": 2.1536, "learning_rate": 9.99985340196703e-05, "epoch": 0.01911822083495903, "percentage": 1.91, "elapsed_time": "0:48:38", "remaining_time": "1 day, 17:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 17941, "loss": 1.9443, "learning_rate": 9.999846504204124e-05, "epoch": 0.019173959088122177, "percentage": 1.92, "elapsed_time": "0:48:47", "remaining_time": "1 day, 17:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 17941, "loss": 1.7273, "learning_rate": 9.999839447875238e-05, "epoch": 0.019229697341285323, "percentage": 1.92, "elapsed_time": "0:48:55", "remaining_time": "1 day, 17:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 17941, "loss": 1.8024, "learning_rate": 9.999832232980597e-05, "epoch": 0.01928543559444847, "percentage": 1.93, "elapsed_time": "0:49:04", "remaining_time": "1 day, 17:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 347, "total_steps": 17941, "loss": 1.6531, "learning_rate": 9.999824859520428e-05, "epoch": 0.019341173847611616, "percentage": 1.93, "elapsed_time": "0:49:12", "remaining_time": "1 day, 17:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 17941, "loss": 2.1477, "learning_rate": 9.999817327494967e-05, "epoch": 0.019396912100774762, "percentage": 1.94, "elapsed_time": "0:49:21", "remaining_time": "1 day, 17:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 349, "total_steps": 17941, "loss": 2.0333, "learning_rate": 9.999809636904449e-05, "epoch": 0.01945265035393791, "percentage": 1.95, "elapsed_time": "0:49:29", "remaining_time": "1 day, 17:34:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 17941, "loss": 1.7542, "learning_rate": 9.999801787749121e-05, "epoch": 0.019508388607101055, "percentage": 1.95, "elapsed_time": "0:49:39", "remaining_time": "1 day, 17:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 351, "total_steps": 17941, "loss": 1.9207, "learning_rate": 9.999793780029232e-05, "epoch": 0.019564126860264198, "percentage": 1.96, "elapsed_time": "0:49:47", "remaining_time": "1 day, 17:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 17941, "loss": 1.8293, "learning_rate": 9.999785613745035e-05, "epoch": 0.019619865113427344, "percentage": 1.96, "elapsed_time": "0:49:55", "remaining_time": "1 day, 17:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 353, "total_steps": 17941, "loss": 1.8176, "learning_rate": 9.999777288896787e-05, "epoch": 0.01967560336659049, "percentage": 1.97, "elapsed_time": "0:50:04", "remaining_time": "1 day, 17:34:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 17941, "loss": 1.961, "learning_rate": 9.999768805484757e-05, "epoch": 0.019731341619753637, "percentage": 1.97, "elapsed_time": "0:50:12", "remaining_time": "1 day, 17:34:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 355, "total_steps": 17941, "loss": 1.6902, "learning_rate": 9.999760163509209e-05, "epoch": 0.019787079872916783, "percentage": 1.98, "elapsed_time": "0:50:21", "remaining_time": "1 day, 17:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 17941, "loss": 1.352, "learning_rate": 9.99975136297042e-05, "epoch": 0.01984281812607993, "percentage": 1.98, "elapsed_time": "0:50:29", "remaining_time": "1 day, 17:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 357, "total_steps": 17941, "loss": 1.952, "learning_rate": 9.999742403868668e-05, "epoch": 0.019898556379243076, "percentage": 1.99, "elapsed_time": "0:50:38", "remaining_time": "1 day, 17:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 17941, "loss": 1.8768, "learning_rate": 9.999733286204238e-05, "epoch": 0.019954294632406222, "percentage": 2.0, "elapsed_time": "0:50:46", "remaining_time": "1 day, 17:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 359, "total_steps": 17941, "loss": 1.8014, "learning_rate": 9.99972400997742e-05, "epoch": 0.020010032885569365, "percentage": 2.0, "elapsed_time": "0:50:55", "remaining_time": "1 day, 17:33:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 17941, "loss": 1.9884, "learning_rate": 9.999714575188505e-05, "epoch": 0.02006577113873251, "percentage": 2.01, "elapsed_time": "0:51:03", "remaining_time": "1 day, 17:33:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 361, "total_steps": 17941, "loss": 1.9038, "learning_rate": 9.999704981837794e-05, "epoch": 0.020121509391895658, "percentage": 2.01, "elapsed_time": "0:51:12", "remaining_time": "1 day, 17:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 17941, "loss": 1.9049, "learning_rate": 9.999695229925591e-05, "epoch": 0.020177247645058804, "percentage": 2.02, "elapsed_time": "0:51:20", "remaining_time": "1 day, 17:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 363, "total_steps": 17941, "loss": 1.7111, "learning_rate": 9.999685319452208e-05, "epoch": 0.02023298589822195, "percentage": 2.02, "elapsed_time": "0:51:28", "remaining_time": "1 day, 17:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 17941, "loss": 1.6416, "learning_rate": 9.999675250417954e-05, "epoch": 0.020288724151385096, "percentage": 2.03, "elapsed_time": "0:51:37", "remaining_time": "1 day, 17:32:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 365, "total_steps": 17941, "loss": 1.7197, "learning_rate": 9.999665022823152e-05, "epoch": 0.020344462404548243, "percentage": 2.03, "elapsed_time": "0:51:45", "remaining_time": "1 day, 17:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 17941, "loss": 1.8762, "learning_rate": 9.999654636668125e-05, "epoch": 0.020400200657711386, "percentage": 2.04, "elapsed_time": "0:51:54", "remaining_time": "1 day, 17:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 367, "total_steps": 17941, "loss": 2.4684, "learning_rate": 9.999644091953204e-05, "epoch": 0.020455938910874532, "percentage": 2.05, "elapsed_time": "0:52:03", "remaining_time": "1 day, 17:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 17941, "loss": 1.8079, "learning_rate": 9.999633388678723e-05, "epoch": 0.02051167716403768, "percentage": 2.05, "elapsed_time": "0:52:11", "remaining_time": "1 day, 17:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 369, "total_steps": 17941, "loss": 1.6885, "learning_rate": 9.999622526845021e-05, "epoch": 0.020567415417200825, "percentage": 2.06, "elapsed_time": "0:52:20", "remaining_time": "1 day, 17:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 17941, "loss": 1.8686, "learning_rate": 9.999611506452439e-05, "epoch": 0.02062315367036397, "percentage": 2.06, "elapsed_time": "0:52:28", "remaining_time": "1 day, 17:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 371, "total_steps": 17941, "loss": 1.8592, "learning_rate": 9.999600327501333e-05, "epoch": 0.020678891923527117, "percentage": 2.07, "elapsed_time": "0:52:36", "remaining_time": "1 day, 17:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 17941, "loss": 1.8752, "learning_rate": 9.999588989992052e-05, "epoch": 0.020734630176690264, "percentage": 2.07, "elapsed_time": "0:52:45", "remaining_time": "1 day, 17:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 373, "total_steps": 17941, "loss": 1.7596, "learning_rate": 9.99957749392496e-05, "epoch": 0.02079036842985341, "percentage": 2.08, "elapsed_time": "0:52:53", "remaining_time": "1 day, 17:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 17941, "loss": 1.7573, "learning_rate": 9.999565839300419e-05, "epoch": 0.020846106683016553, "percentage": 2.08, "elapsed_time": "0:53:02", "remaining_time": "1 day, 17:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 375, "total_steps": 17941, "loss": 1.9692, "learning_rate": 9.999554026118798e-05, "epoch": 0.0209018449361797, "percentage": 2.09, "elapsed_time": "0:53:10", "remaining_time": "1 day, 17:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 17941, "loss": 1.8881, "learning_rate": 9.999542054380473e-05, "epoch": 0.020957583189342845, "percentage": 2.1, "elapsed_time": "0:53:19", "remaining_time": "1 day, 17:30:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 377, "total_steps": 17941, "loss": 1.8369, "learning_rate": 9.999529924085824e-05, "epoch": 0.02101332144250599, "percentage": 2.1, "elapsed_time": "0:53:28", "remaining_time": "1 day, 17:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 17941, "loss": 1.3352, "learning_rate": 9.999517635235237e-05, "epoch": 0.021069059695669138, "percentage": 2.11, "elapsed_time": "0:53:36", "remaining_time": "1 day, 17:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 379, "total_steps": 17941, "loss": 1.763, "learning_rate": 9.999505187829096e-05, "epoch": 0.021124797948832284, "percentage": 2.11, "elapsed_time": "0:53:44", "remaining_time": "1 day, 17:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 17941, "loss": 1.7431, "learning_rate": 9.9994925818678e-05, "epoch": 0.02118053620199543, "percentage": 2.12, "elapsed_time": "0:53:53", "remaining_time": "1 day, 17:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 381, "total_steps": 17941, "loss": 1.7356, "learning_rate": 9.99947981735175e-05, "epoch": 0.021236274455158577, "percentage": 2.12, "elapsed_time": "0:54:01", "remaining_time": "1 day, 17:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 17941, "loss": 1.861, "learning_rate": 9.99946689428135e-05, "epoch": 0.02129201270832172, "percentage": 2.13, "elapsed_time": "0:54:10", "remaining_time": "1 day, 17:30:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 383, "total_steps": 17941, "loss": 1.9594, "learning_rate": 9.999453812657007e-05, "epoch": 0.021347750961484866, "percentage": 2.13, "elapsed_time": "0:54:18", "remaining_time": "1 day, 17:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 17941, "loss": 2.0073, "learning_rate": 9.99944057247914e-05, "epoch": 0.021403489214648012, "percentage": 2.14, "elapsed_time": "0:54:27", "remaining_time": "1 day, 17:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 385, "total_steps": 17941, "loss": 1.6862, "learning_rate": 9.999427173748164e-05, "epoch": 0.02145922746781116, "percentage": 2.15, "elapsed_time": "0:54:36", "remaining_time": "1 day, 17:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 17941, "loss": 1.8631, "learning_rate": 9.999413616464508e-05, "epoch": 0.021514965720974305, "percentage": 2.15, "elapsed_time": "0:54:44", "remaining_time": "1 day, 17:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 387, "total_steps": 17941, "loss": 1.8636, "learning_rate": 9.999399900628601e-05, "epoch": 0.02157070397413745, "percentage": 2.16, "elapsed_time": "0:54:53", "remaining_time": "1 day, 17:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 17941, "loss": 1.7465, "learning_rate": 9.999386026240878e-05, "epoch": 0.021626442227300598, "percentage": 2.16, "elapsed_time": "0:55:01", "remaining_time": "1 day, 17:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 389, "total_steps": 17941, "loss": 1.6336, "learning_rate": 9.999371993301779e-05, "epoch": 0.021682180480463744, "percentage": 2.17, "elapsed_time": "0:55:10", "remaining_time": "1 day, 17:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 17941, "loss": 1.6755, "learning_rate": 9.999357801811748e-05, "epoch": 0.021737918733626887, "percentage": 2.17, "elapsed_time": "0:55:18", "remaining_time": "1 day, 17:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 391, "total_steps": 17941, "loss": 1.9477, "learning_rate": 9.999343451771234e-05, "epoch": 0.021793656986790033, "percentage": 2.18, "elapsed_time": "0:55:27", "remaining_time": "1 day, 17:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 17941, "loss": 1.7902, "learning_rate": 9.999328943180697e-05, "epoch": 0.02184939523995318, "percentage": 2.18, "elapsed_time": "0:55:35", "remaining_time": "1 day, 17:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 393, "total_steps": 17941, "loss": 1.6744, "learning_rate": 9.999314276040592e-05, "epoch": 0.021905133493116326, "percentage": 2.19, "elapsed_time": "0:55:43", "remaining_time": "1 day, 17:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 17941, "loss": 1.8258, "learning_rate": 9.999299450351387e-05, "epoch": 0.021960871746279472, "percentage": 2.2, "elapsed_time": "0:55:52", "remaining_time": "1 day, 17:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 395, "total_steps": 17941, "loss": 1.8488, "learning_rate": 9.999284466113552e-05, "epoch": 0.02201660999944262, "percentage": 2.2, "elapsed_time": "0:56:01", "remaining_time": "1 day, 17:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 17941, "loss": 2.1775, "learning_rate": 9.999269323327561e-05, "epoch": 0.022072348252605765, "percentage": 2.21, "elapsed_time": "0:56:09", "remaining_time": "1 day, 17:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 397, "total_steps": 17941, "loss": 1.6503, "learning_rate": 9.999254021993895e-05, "epoch": 0.022128086505768908, "percentage": 2.21, "elapsed_time": "0:56:18", "remaining_time": "1 day, 17:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 17941, "loss": 1.8169, "learning_rate": 9.999238562113038e-05, "epoch": 0.022183824758932054, "percentage": 2.22, "elapsed_time": "0:56:27", "remaining_time": "1 day, 17:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 399, "total_steps": 17941, "loss": 1.647, "learning_rate": 9.999222943685482e-05, "epoch": 0.0222395630120952, "percentage": 2.22, "elapsed_time": "0:56:36", "remaining_time": "1 day, 17:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 17941, "loss": 1.6712, "learning_rate": 9.999207166711723e-05, "epoch": 0.022295301265258347, "percentage": 2.23, "elapsed_time": "0:56:44", "remaining_time": "1 day, 17:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 401, "total_steps": 17941, "loss": 1.8125, "learning_rate": 9.999191231192258e-05, "epoch": 0.022351039518421493, "percentage": 2.24, "elapsed_time": "0:56:53", "remaining_time": "1 day, 17:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 17941, "loss": 1.8486, "learning_rate": 9.999175137127596e-05, "epoch": 0.02240677777158464, "percentage": 2.24, "elapsed_time": "0:57:01", "remaining_time": "1 day, 17:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 403, "total_steps": 17941, "loss": 1.6692, "learning_rate": 9.999158884518245e-05, "epoch": 0.022462516024747785, "percentage": 2.25, "elapsed_time": "0:57:10", "remaining_time": "1 day, 17:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 17941, "loss": 1.5916, "learning_rate": 9.999142473364722e-05, "epoch": 0.022518254277910932, "percentage": 2.25, "elapsed_time": "0:57:18", "remaining_time": "1 day, 17:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 405, "total_steps": 17941, "loss": 1.646, "learning_rate": 9.999125903667545e-05, "epoch": 0.022573992531074075, "percentage": 2.26, "elapsed_time": "0:57:27", "remaining_time": "1 day, 17:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 17941, "loss": 1.6874, "learning_rate": 9.999109175427243e-05, "epoch": 0.02262973078423722, "percentage": 2.26, "elapsed_time": "0:57:35", "remaining_time": "1 day, 17:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 407, "total_steps": 17941, "loss": 1.9116, "learning_rate": 9.999092288644345e-05, "epoch": 0.022685469037400367, "percentage": 2.27, "elapsed_time": "0:57:44", "remaining_time": "1 day, 17:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 17941, "loss": 1.4898, "learning_rate": 9.999075243319386e-05, "epoch": 0.022741207290563514, "percentage": 2.27, "elapsed_time": "0:57:52", "remaining_time": "1 day, 17:27:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 409, "total_steps": 17941, "loss": 1.7671, "learning_rate": 9.999058039452906e-05, "epoch": 0.02279694554372666, "percentage": 2.28, "elapsed_time": "0:58:01", "remaining_time": "1 day, 17:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 17941, "loss": 1.7068, "learning_rate": 9.999040677045453e-05, "epoch": 0.022852683796889806, "percentage": 2.29, "elapsed_time": "0:58:09", "remaining_time": "1 day, 17:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 411, "total_steps": 17941, "loss": 1.912, "learning_rate": 9.999023156097575e-05, "epoch": 0.022908422050052953, "percentage": 2.29, "elapsed_time": "0:58:17", "remaining_time": "1 day, 17:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 412, "total_steps": 17941, "loss": 1.7907, "learning_rate": 9.99900547660983e-05, "epoch": 0.0229641603032161, "percentage": 2.3, "elapsed_time": "0:58:26", "remaining_time": "1 day, 17:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 413, "total_steps": 17941, "loss": 1.8333, "learning_rate": 9.998987638582775e-05, "epoch": 0.02301989855637924, "percentage": 2.3, "elapsed_time": "0:58:34", "remaining_time": "1 day, 17:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 414, "total_steps": 17941, "loss": 2.0069, "learning_rate": 9.99896964201698e-05, "epoch": 0.023075636809542388, "percentage": 2.31, "elapsed_time": "0:58:43", "remaining_time": "1 day, 17:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 415, "total_steps": 17941, "loss": 1.8571, "learning_rate": 9.998951486913015e-05, "epoch": 0.023131375062705534, "percentage": 2.31, "elapsed_time": "0:58:52", "remaining_time": "1 day, 17:26:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 416, "total_steps": 17941, "loss": 1.6536, "learning_rate": 9.998933173271453e-05, "epoch": 0.02318711331586868, "percentage": 2.32, "elapsed_time": "0:59:01", "remaining_time": "1 day, 17:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 417, "total_steps": 17941, "loss": 1.8969, "learning_rate": 9.998914701092877e-05, "epoch": 0.023242851569031827, "percentage": 2.32, "elapsed_time": "0:59:09", "remaining_time": "1 day, 17:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 418, "total_steps": 17941, "loss": 1.9305, "learning_rate": 9.998896070377873e-05, "epoch": 0.023298589822194973, "percentage": 2.33, "elapsed_time": "0:59:17", "remaining_time": "1 day, 17:25:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 419, "total_steps": 17941, "loss": 1.9801, "learning_rate": 9.99887728112703e-05, "epoch": 0.02335432807535812, "percentage": 2.34, "elapsed_time": "0:59:26", "remaining_time": "1 day, 17:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 17941, "loss": 1.879, "learning_rate": 9.998858333340945e-05, "epoch": 0.023410066328521262, "percentage": 2.34, "elapsed_time": "0:59:34", "remaining_time": "1 day, 17:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 421, "total_steps": 17941, "loss": 1.6029, "learning_rate": 9.998839227020221e-05, "epoch": 0.02346580458168441, "percentage": 2.35, "elapsed_time": "0:59:43", "remaining_time": "1 day, 17:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 422, "total_steps": 17941, "loss": 1.9165, "learning_rate": 9.998819962165462e-05, "epoch": 0.023521542834847555, "percentage": 2.35, "elapsed_time": "0:59:51", "remaining_time": "1 day, 17:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 423, "total_steps": 17941, "loss": 1.6276, "learning_rate": 9.998800538777278e-05, "epoch": 0.0235772810880107, "percentage": 2.36, "elapsed_time": "1:00:00", "remaining_time": "1 day, 17:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 424, "total_steps": 17941, "loss": 1.5287, "learning_rate": 9.998780956856285e-05, "epoch": 0.023633019341173848, "percentage": 2.36, "elapsed_time": "1:00:08", "remaining_time": "1 day, 17:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 425, "total_steps": 17941, "loss": 1.8008, "learning_rate": 9.998761216403106e-05, "epoch": 0.023688757594336994, "percentage": 2.37, "elapsed_time": "1:00:17", "remaining_time": "1 day, 17:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 426, "total_steps": 17941, "loss": 2.0055, "learning_rate": 9.998741317418366e-05, "epoch": 0.02374449584750014, "percentage": 2.37, "elapsed_time": "1:00:25", "remaining_time": "1 day, 17:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 427, "total_steps": 17941, "loss": 1.6324, "learning_rate": 9.998721259902694e-05, "epoch": 0.023800234100663287, "percentage": 2.38, "elapsed_time": "1:00:34", "remaining_time": "1 day, 17:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 428, "total_steps": 17941, "loss": 1.6075, "learning_rate": 9.99870104385673e-05, "epoch": 0.02385597235382643, "percentage": 2.39, "elapsed_time": "1:00:42", "remaining_time": "1 day, 17:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 429, "total_steps": 17941, "loss": 1.6517, "learning_rate": 9.998680669281116e-05, "epoch": 0.023911710606989576, "percentage": 2.39, "elapsed_time": "1:00:51", "remaining_time": "1 day, 17:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 17941, "loss": 1.6884, "learning_rate": 9.998660136176492e-05, "epoch": 0.023967448860152722, "percentage": 2.4, "elapsed_time": "1:00:59", "remaining_time": "1 day, 17:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 431, "total_steps": 17941, "loss": 1.7113, "learning_rate": 9.998639444543514e-05, "epoch": 0.02402318711331587, "percentage": 2.4, "elapsed_time": "1:01:08", "remaining_time": "1 day, 17:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 432, "total_steps": 17941, "loss": 1.5067, "learning_rate": 9.998618594382836e-05, "epoch": 0.024078925366479015, "percentage": 2.41, "elapsed_time": "1:01:17", "remaining_time": "1 day, 17:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 433, "total_steps": 17941, "loss": 1.6967, "learning_rate": 9.99859758569512e-05, "epoch": 0.02413466361964216, "percentage": 2.41, "elapsed_time": "1:01:25", "remaining_time": "1 day, 17:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 434, "total_steps": 17941, "loss": 2.0151, "learning_rate": 9.998576418481033e-05, "epoch": 0.024190401872805307, "percentage": 2.42, "elapsed_time": "1:01:34", "remaining_time": "1 day, 17:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 435, "total_steps": 17941, "loss": 1.6199, "learning_rate": 9.998555092741247e-05, "epoch": 0.024246140125968454, "percentage": 2.42, "elapsed_time": "1:01:42", "remaining_time": "1 day, 17:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 436, "total_steps": 17941, "loss": 1.8874, "learning_rate": 9.998533608476435e-05, "epoch": 0.024301878379131597, "percentage": 2.43, "elapsed_time": "1:01:50", "remaining_time": "1 day, 17:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 437, "total_steps": 17941, "loss": 1.8761, "learning_rate": 9.99851196568728e-05, "epoch": 0.024357616632294743, "percentage": 2.44, "elapsed_time": "1:01:59", "remaining_time": "1 day, 17:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 438, "total_steps": 17941, "loss": 1.6399, "learning_rate": 9.998490164374472e-05, "epoch": 0.02441335488545789, "percentage": 2.44, "elapsed_time": "1:02:07", "remaining_time": "1 day, 17:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 439, "total_steps": 17941, "loss": 1.8343, "learning_rate": 9.998468204538696e-05, "epoch": 0.024469093138621036, "percentage": 2.45, "elapsed_time": "1:02:16", "remaining_time": "1 day, 17:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 17941, "loss": 2.0423, "learning_rate": 9.998446086180653e-05, "epoch": 0.024524831391784182, "percentage": 2.45, "elapsed_time": "1:02:24", "remaining_time": "1 day, 17:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 441, "total_steps": 17941, "loss": 1.5796, "learning_rate": 9.998423809301043e-05, "epoch": 0.024580569644947328, "percentage": 2.46, "elapsed_time": "1:02:33", "remaining_time": "1 day, 17:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 442, "total_steps": 17941, "loss": 1.661, "learning_rate": 9.998401373900573e-05, "epoch": 0.024636307898110475, "percentage": 2.46, "elapsed_time": "1:02:41", "remaining_time": "1 day, 17:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 443, "total_steps": 17941, "loss": 1.9646, "learning_rate": 9.998378779979954e-05, "epoch": 0.024692046151273617, "percentage": 2.47, "elapsed_time": "1:02:50", "remaining_time": "1 day, 17:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 444, "total_steps": 17941, "loss": 1.7896, "learning_rate": 9.998356027539901e-05, "epoch": 0.024747784404436764, "percentage": 2.47, "elapsed_time": "1:02:58", "remaining_time": "1 day, 17:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 445, "total_steps": 17941, "loss": 1.7329, "learning_rate": 9.99833311658114e-05, "epoch": 0.02480352265759991, "percentage": 2.48, "elapsed_time": "1:03:07", "remaining_time": "1 day, 17:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 446, "total_steps": 17941, "loss": 2.0303, "learning_rate": 9.998310047104393e-05, "epoch": 0.024859260910763056, "percentage": 2.49, "elapsed_time": "1:03:15", "remaining_time": "1 day, 17:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 447, "total_steps": 17941, "loss": 1.6114, "learning_rate": 9.998286819110394e-05, "epoch": 0.024914999163926203, "percentage": 2.49, "elapsed_time": "1:03:24", "remaining_time": "1 day, 17:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 448, "total_steps": 17941, "loss": 1.8658, "learning_rate": 9.99826343259988e-05, "epoch": 0.02497073741708935, "percentage": 2.5, "elapsed_time": "1:03:32", "remaining_time": "1 day, 17:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 449, "total_steps": 17941, "loss": 1.8958, "learning_rate": 9.99823988757359e-05, "epoch": 0.025026475670252495, "percentage": 2.5, "elapsed_time": "1:03:40", "remaining_time": "1 day, 17:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 17941, "loss": 1.7768, "learning_rate": 9.998216184032274e-05, "epoch": 0.02508221392341564, "percentage": 2.51, "elapsed_time": "1:03:49", "remaining_time": "1 day, 17:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 451, "total_steps": 17941, "loss": 1.7367, "learning_rate": 9.99819232197668e-05, "epoch": 0.025137952176578784, "percentage": 2.51, "elapsed_time": "1:03:57", "remaining_time": "1 day, 17:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 452, "total_steps": 17941, "loss": 1.6027, "learning_rate": 9.99816830140757e-05, "epoch": 0.02519369042974193, "percentage": 2.52, "elapsed_time": "1:04:06", "remaining_time": "1 day, 17:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 453, "total_steps": 17941, "loss": 1.8879, "learning_rate": 9.998144122325702e-05, "epoch": 0.025249428682905077, "percentage": 2.52, "elapsed_time": "1:04:14", "remaining_time": "1 day, 17:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 454, "total_steps": 17941, "loss": 1.954, "learning_rate": 9.998119784731843e-05, "epoch": 0.025305166936068223, "percentage": 2.53, "elapsed_time": "1:04:23", "remaining_time": "1 day, 17:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 455, "total_steps": 17941, "loss": 1.6971, "learning_rate": 9.998095288626765e-05, "epoch": 0.02536090518923137, "percentage": 2.54, "elapsed_time": "1:04:31", "remaining_time": "1 day, 17:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 456, "total_steps": 17941, "loss": 1.8801, "learning_rate": 9.998070634011246e-05, "epoch": 0.025416643442394516, "percentage": 2.54, "elapsed_time": "1:04:39", "remaining_time": "1 day, 17:19:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 457, "total_steps": 17941, "loss": 1.8882, "learning_rate": 9.998045820886068e-05, "epoch": 0.025472381695557662, "percentage": 2.55, "elapsed_time": "1:04:48", "remaining_time": "1 day, 17:19:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 458, "total_steps": 17941, "loss": 1.7204, "learning_rate": 9.998020849252017e-05, "epoch": 0.02552811994872081, "percentage": 2.55, "elapsed_time": "1:04:56", "remaining_time": "1 day, 17:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 459, "total_steps": 17941, "loss": 1.6934, "learning_rate": 9.997995719109884e-05, "epoch": 0.02558385820188395, "percentage": 2.56, "elapsed_time": "1:05:05", "remaining_time": "1 day, 17:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 17941, "loss": 1.5534, "learning_rate": 9.997970430460468e-05, "epoch": 0.025639596455047098, "percentage": 2.56, "elapsed_time": "1:05:13", "remaining_time": "1 day, 17:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 461, "total_steps": 17941, "loss": 1.7817, "learning_rate": 9.99794498330457e-05, "epoch": 0.025695334708210244, "percentage": 2.57, "elapsed_time": "1:05:22", "remaining_time": "1 day, 17:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 462, "total_steps": 17941, "loss": 1.759, "learning_rate": 9.997919377642997e-05, "epoch": 0.02575107296137339, "percentage": 2.58, "elapsed_time": "1:05:30", "remaining_time": "1 day, 17:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 463, "total_steps": 17941, "loss": 1.6342, "learning_rate": 9.997893613476561e-05, "epoch": 0.025806811214536537, "percentage": 2.58, "elapsed_time": "1:05:39", "remaining_time": "1 day, 17:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 464, "total_steps": 17941, "loss": 1.7754, "learning_rate": 9.99786769080608e-05, "epoch": 0.025862549467699683, "percentage": 2.59, "elapsed_time": "1:05:47", "remaining_time": "1 day, 17:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 465, "total_steps": 17941, "loss": 1.9323, "learning_rate": 9.997841609632375e-05, "epoch": 0.02591828772086283, "percentage": 2.59, "elapsed_time": "1:05:56", "remaining_time": "1 day, 17:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 466, "total_steps": 17941, "loss": 1.945, "learning_rate": 9.997815369956273e-05, "epoch": 0.025974025974025976, "percentage": 2.6, "elapsed_time": "1:06:04", "remaining_time": "1 day, 17:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 467, "total_steps": 17941, "loss": 1.5908, "learning_rate": 9.997788971778608e-05, "epoch": 0.02602976422718912, "percentage": 2.6, "elapsed_time": "1:06:13", "remaining_time": "1 day, 17:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 468, "total_steps": 17941, "loss": 1.449, "learning_rate": 9.997762415100214e-05, "epoch": 0.026085502480352265, "percentage": 2.61, "elapsed_time": "1:06:21", "remaining_time": "1 day, 17:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 469, "total_steps": 17941, "loss": 1.7667, "learning_rate": 9.997735699921938e-05, "epoch": 0.02614124073351541, "percentage": 2.61, "elapsed_time": "1:06:30", "remaining_time": "1 day, 17:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 17941, "loss": 2.0801, "learning_rate": 9.997708826244623e-05, "epoch": 0.026196978986678558, "percentage": 2.62, "elapsed_time": "1:06:38", "remaining_time": "1 day, 17:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 471, "total_steps": 17941, "loss": 1.9385, "learning_rate": 9.997681794069123e-05, "epoch": 0.026252717239841704, "percentage": 2.63, "elapsed_time": "1:06:47", "remaining_time": "1 day, 17:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 472, "total_steps": 17941, "loss": 1.9021, "learning_rate": 9.997654603396294e-05, "epoch": 0.02630845549300485, "percentage": 2.63, "elapsed_time": "1:06:55", "remaining_time": "1 day, 17:16:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 473, "total_steps": 17941, "loss": 1.7698, "learning_rate": 9.997627254227e-05, "epoch": 0.026364193746167996, "percentage": 2.64, "elapsed_time": "1:07:03", "remaining_time": "1 day, 17:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 474, "total_steps": 17941, "loss": 1.6786, "learning_rate": 9.997599746562108e-05, "epoch": 0.02641993199933114, "percentage": 2.64, "elapsed_time": "1:07:12", "remaining_time": "1 day, 17:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 475, "total_steps": 17941, "loss": 1.8663, "learning_rate": 9.997572080402488e-05, "epoch": 0.026475670252494286, "percentage": 2.65, "elapsed_time": "1:07:20", "remaining_time": "1 day, 17:16:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 476, "total_steps": 17941, "loss": 1.6064, "learning_rate": 9.997544255749021e-05, "epoch": 0.026531408505657432, "percentage": 2.65, "elapsed_time": "1:07:29", "remaining_time": "1 day, 17:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 477, "total_steps": 17941, "loss": 2.035, "learning_rate": 9.99751627260259e-05, "epoch": 0.02658714675882058, "percentage": 2.66, "elapsed_time": "1:07:37", "remaining_time": "1 day, 17:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 478, "total_steps": 17941, "loss": 1.7838, "learning_rate": 9.997488130964077e-05, "epoch": 0.026642885011983725, "percentage": 2.66, "elapsed_time": "1:07:46", "remaining_time": "1 day, 17:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 479, "total_steps": 17941, "loss": 1.7242, "learning_rate": 9.997459830834379e-05, "epoch": 0.02669862326514687, "percentage": 2.67, "elapsed_time": "1:07:54", "remaining_time": "1 day, 17:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 17941, "loss": 1.8634, "learning_rate": 9.997431372214394e-05, "epoch": 0.026754361518310017, "percentage": 2.68, "elapsed_time": "1:08:03", "remaining_time": "1 day, 17:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 481, "total_steps": 17941, "loss": 1.678, "learning_rate": 9.997402755105022e-05, "epoch": 0.026810099771473164, "percentage": 2.68, "elapsed_time": "1:08:12", "remaining_time": "1 day, 17:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 482, "total_steps": 17941, "loss": 1.6952, "learning_rate": 9.997373979507169e-05, "epoch": 0.026865838024636306, "percentage": 2.69, "elapsed_time": "1:08:20", "remaining_time": "1 day, 17:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 483, "total_steps": 17941, "loss": 1.6948, "learning_rate": 9.997345045421753e-05, "epoch": 0.026921576277799453, "percentage": 2.69, "elapsed_time": "1:08:29", "remaining_time": "1 day, 17:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 484, "total_steps": 17941, "loss": 1.9746, "learning_rate": 9.997315952849688e-05, "epoch": 0.0269773145309626, "percentage": 2.7, "elapsed_time": "1:08:37", "remaining_time": "1 day, 17:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 485, "total_steps": 17941, "loss": 1.9413, "learning_rate": 9.997286701791896e-05, "epoch": 0.027033052784125745, "percentage": 2.7, "elapsed_time": "1:08:46", "remaining_time": "1 day, 17:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 486, "total_steps": 17941, "loss": 1.7646, "learning_rate": 9.99725729224931e-05, "epoch": 0.02708879103728889, "percentage": 2.71, "elapsed_time": "1:08:54", "remaining_time": "1 day, 17:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 487, "total_steps": 17941, "loss": 1.6941, "learning_rate": 9.997227724222855e-05, "epoch": 0.027144529290452038, "percentage": 2.71, "elapsed_time": "1:09:03", "remaining_time": "1 day, 17:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 488, "total_steps": 17941, "loss": 1.6994, "learning_rate": 9.997197997713473e-05, "epoch": 0.027200267543615184, "percentage": 2.72, "elapsed_time": "1:09:11", "remaining_time": "1 day, 17:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 489, "total_steps": 17941, "loss": 1.8408, "learning_rate": 9.997168112722107e-05, "epoch": 0.02725600579677833, "percentage": 2.73, "elapsed_time": "1:09:19", "remaining_time": "1 day, 17:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 17941, "loss": 1.636, "learning_rate": 9.997138069249703e-05, "epoch": 0.027311744049941473, "percentage": 2.73, "elapsed_time": "1:09:28", "remaining_time": "1 day, 17:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 491, "total_steps": 17941, "loss": 1.5011, "learning_rate": 9.997107867297216e-05, "epoch": 0.02736748230310462, "percentage": 2.74, "elapsed_time": "1:09:36", "remaining_time": "1 day, 17:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 492, "total_steps": 17941, "loss": 2.0265, "learning_rate": 9.997077506865602e-05, "epoch": 0.027423220556267766, "percentage": 2.74, "elapsed_time": "1:09:45", "remaining_time": "1 day, 17:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 493, "total_steps": 17941, "loss": 2.0372, "learning_rate": 9.997046987955824e-05, "epoch": 0.027478958809430912, "percentage": 2.75, "elapsed_time": "1:09:53", "remaining_time": "1 day, 17:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 494, "total_steps": 17941, "loss": 1.8226, "learning_rate": 9.997016310568851e-05, "epoch": 0.02753469706259406, "percentage": 2.75, "elapsed_time": "1:10:02", "remaining_time": "1 day, 17:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 495, "total_steps": 17941, "loss": 1.7598, "learning_rate": 9.996985474705654e-05, "epoch": 0.027590435315757205, "percentage": 2.76, "elapsed_time": "1:10:10", "remaining_time": "1 day, 17:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 496, "total_steps": 17941, "loss": 1.9021, "learning_rate": 9.996954480367214e-05, "epoch": 0.02764617356892035, "percentage": 2.76, "elapsed_time": "1:10:19", "remaining_time": "1 day, 17:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 497, "total_steps": 17941, "loss": 1.7989, "learning_rate": 9.996923327554511e-05, "epoch": 0.027701911822083494, "percentage": 2.77, "elapsed_time": "1:10:27", "remaining_time": "1 day, 17:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 498, "total_steps": 17941, "loss": 1.7904, "learning_rate": 9.996892016268535e-05, "epoch": 0.02775765007524664, "percentage": 2.78, "elapsed_time": "1:10:35", "remaining_time": "1 day, 17:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 499, "total_steps": 17941, "loss": 1.5494, "learning_rate": 9.996860546510278e-05, "epoch": 0.027813388328409787, "percentage": 2.78, "elapsed_time": "1:10:44", "remaining_time": "1 day, 17:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 17941, "loss": 1.6759, "learning_rate": 9.996828918280737e-05, "epoch": 0.027869126581572933, "percentage": 2.79, "elapsed_time": "1:10:52", "remaining_time": "1 day, 17:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 501, "total_steps": 17941, "loss": 1.7032, "learning_rate": 9.996797131580917e-05, "epoch": 0.02792486483473608, "percentage": 2.79, "elapsed_time": "1:11:01", "remaining_time": "1 day, 17:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 502, "total_steps": 17941, "loss": 1.7786, "learning_rate": 9.996765186411827e-05, "epoch": 0.027980603087899226, "percentage": 2.8, "elapsed_time": "1:11:09", "remaining_time": "1 day, 17:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 503, "total_steps": 17941, "loss": 1.9493, "learning_rate": 9.996733082774477e-05, "epoch": 0.028036341341062372, "percentage": 2.8, "elapsed_time": "1:11:18", "remaining_time": "1 day, 17:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 504, "total_steps": 17941, "loss": 2.0257, "learning_rate": 9.996700820669886e-05, "epoch": 0.02809207959422552, "percentage": 2.81, "elapsed_time": "1:11:26", "remaining_time": "1 day, 17:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 505, "total_steps": 17941, "loss": 1.8291, "learning_rate": 9.996668400099077e-05, "epoch": 0.02814781784738866, "percentage": 2.81, "elapsed_time": "1:11:35", "remaining_time": "1 day, 17:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 506, "total_steps": 17941, "loss": 1.6841, "learning_rate": 9.99663582106308e-05, "epoch": 0.028203556100551808, "percentage": 2.82, "elapsed_time": "1:11:43", "remaining_time": "1 day, 17:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 507, "total_steps": 17941, "loss": 2.1915, "learning_rate": 9.996603083562928e-05, "epoch": 0.028259294353714954, "percentage": 2.83, "elapsed_time": "1:11:52", "remaining_time": "1 day, 17:11:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 508, "total_steps": 17941, "loss": 1.6893, "learning_rate": 9.996570187599658e-05, "epoch": 0.0283150326068781, "percentage": 2.83, "elapsed_time": "1:12:00", "remaining_time": "1 day, 17:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 509, "total_steps": 17941, "loss": 1.5927, "learning_rate": 9.996537133174313e-05, "epoch": 0.028370770860041247, "percentage": 2.84, "elapsed_time": "1:12:09", "remaining_time": "1 day, 17:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 17941, "loss": 1.6685, "learning_rate": 9.996503920287942e-05, "epoch": 0.028426509113204393, "percentage": 2.84, "elapsed_time": "1:12:18", "remaining_time": "1 day, 17:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 511, "total_steps": 17941, "loss": 1.8294, "learning_rate": 9.996470548941598e-05, "epoch": 0.02848224736636754, "percentage": 2.85, "elapsed_time": "1:12:26", "remaining_time": "1 day, 17:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 512, "total_steps": 17941, "loss": 1.6819, "learning_rate": 9.996437019136342e-05, "epoch": 0.028537985619530686, "percentage": 2.85, "elapsed_time": "1:12:35", "remaining_time": "1 day, 17:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 513, "total_steps": 17941, "loss": 1.8129, "learning_rate": 9.996403330873233e-05, "epoch": 0.02859372387269383, "percentage": 2.86, "elapsed_time": "1:12:43", "remaining_time": "1 day, 17:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 514, "total_steps": 17941, "loss": 1.8961, "learning_rate": 9.996369484153342e-05, "epoch": 0.028649462125856975, "percentage": 2.86, "elapsed_time": "1:12:51", "remaining_time": "1 day, 17:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 515, "total_steps": 17941, "loss": 1.7716, "learning_rate": 9.996335478977741e-05, "epoch": 0.02870520037902012, "percentage": 2.87, "elapsed_time": "1:13:00", "remaining_time": "1 day, 17:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 516, "total_steps": 17941, "loss": 1.7395, "learning_rate": 9.99630131534751e-05, "epoch": 0.028760938632183267, "percentage": 2.88, "elapsed_time": "1:13:08", "remaining_time": "1 day, 17:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 517, "total_steps": 17941, "loss": 0.9524, "learning_rate": 9.996266993263732e-05, "epoch": 0.028816676885346414, "percentage": 2.88, "elapsed_time": "1:13:17", "remaining_time": "1 day, 17:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 518, "total_steps": 17941, "loss": 1.5957, "learning_rate": 9.996232512727495e-05, "epoch": 0.02887241513850956, "percentage": 2.89, "elapsed_time": "1:13:26", "remaining_time": "1 day, 17:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 519, "total_steps": 17941, "loss": 1.8356, "learning_rate": 9.996197873739892e-05, "epoch": 0.028928153391672706, "percentage": 2.89, "elapsed_time": "1:13:35", "remaining_time": "1 day, 17:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 17941, "loss": 1.7832, "learning_rate": 9.996163076302023e-05, "epoch": 0.02898389164483585, "percentage": 2.9, "elapsed_time": "1:13:43", "remaining_time": "1 day, 17:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 521, "total_steps": 17941, "loss": 1.696, "learning_rate": 9.996128120414989e-05, "epoch": 0.029039629897998995, "percentage": 2.9, "elapsed_time": "1:13:52", "remaining_time": "1 day, 17:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 522, "total_steps": 17941, "loss": 1.8185, "learning_rate": 9.996093006079903e-05, "epoch": 0.029095368151162142, "percentage": 2.91, "elapsed_time": "1:14:00", "remaining_time": "1 day, 17:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 523, "total_steps": 17941, "loss": 2.0013, "learning_rate": 9.996057733297876e-05, "epoch": 0.029151106404325288, "percentage": 2.92, "elapsed_time": "1:14:08", "remaining_time": "1 day, 17:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 524, "total_steps": 17941, "loss": 1.7923, "learning_rate": 9.996022302070025e-05, "epoch": 0.029206844657488434, "percentage": 2.92, "elapsed_time": "1:14:17", "remaining_time": "1 day, 17:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 525, "total_steps": 17941, "loss": 1.674, "learning_rate": 9.995986712397477e-05, "epoch": 0.02926258291065158, "percentage": 2.93, "elapsed_time": "1:14:25", "remaining_time": "1 day, 17:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 526, "total_steps": 17941, "loss": 2.041, "learning_rate": 9.995950964281357e-05, "epoch": 0.029318321163814727, "percentage": 2.93, "elapsed_time": "1:14:34", "remaining_time": "1 day, 17:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 527, "total_steps": 17941, "loss": 1.9253, "learning_rate": 9.995915057722804e-05, "epoch": 0.029374059416977873, "percentage": 2.94, "elapsed_time": "1:14:43", "remaining_time": "1 day, 17:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 528, "total_steps": 17941, "loss": 1.5032, "learning_rate": 9.995878992722951e-05, "epoch": 0.029429797670141016, "percentage": 2.94, "elapsed_time": "1:14:52", "remaining_time": "1 day, 17:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 529, "total_steps": 17941, "loss": 1.8901, "learning_rate": 9.995842769282946e-05, "epoch": 0.029485535923304163, "percentage": 2.95, "elapsed_time": "1:15:01", "remaining_time": "1 day, 17:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 17941, "loss": 2.1208, "learning_rate": 9.995806387403934e-05, "epoch": 0.02954127417646731, "percentage": 2.95, "elapsed_time": "1:15:09", "remaining_time": "1 day, 17:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 531, "total_steps": 17941, "loss": 1.9563, "learning_rate": 9.995769847087073e-05, "epoch": 0.029597012429630455, "percentage": 2.96, "elapsed_time": "1:15:18", "remaining_time": "1 day, 17:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 532, "total_steps": 17941, "loss": 2.0126, "learning_rate": 9.99573314833352e-05, "epoch": 0.0296527506827936, "percentage": 2.97, "elapsed_time": "1:15:26", "remaining_time": "1 day, 17:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 533, "total_steps": 17941, "loss": 1.92, "learning_rate": 9.995696291144438e-05, "epoch": 0.029708488935956748, "percentage": 2.97, "elapsed_time": "1:15:34", "remaining_time": "1 day, 17:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 534, "total_steps": 17941, "loss": 1.5072, "learning_rate": 9.995659275520995e-05, "epoch": 0.029764227189119894, "percentage": 2.98, "elapsed_time": "1:15:43", "remaining_time": "1 day, 17:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 535, "total_steps": 17941, "loss": 2.0751, "learning_rate": 9.995622101464368e-05, "epoch": 0.02981996544228304, "percentage": 2.98, "elapsed_time": "1:15:51", "remaining_time": "1 day, 17:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 536, "total_steps": 17941, "loss": 2.0538, "learning_rate": 9.995584768975734e-05, "epoch": 0.029875703695446183, "percentage": 2.99, "elapsed_time": "1:16:00", "remaining_time": "1 day, 17:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 537, "total_steps": 17941, "loss": 1.6813, "learning_rate": 9.995547278056279e-05, "epoch": 0.02993144194860933, "percentage": 2.99, "elapsed_time": "1:16:08", "remaining_time": "1 day, 17:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 538, "total_steps": 17941, "loss": 1.9213, "learning_rate": 9.995509628707189e-05, "epoch": 0.029987180201772476, "percentage": 3.0, "elapsed_time": "1:16:17", "remaining_time": "1 day, 17:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 539, "total_steps": 17941, "loss": 1.7977, "learning_rate": 9.99547182092966e-05, "epoch": 0.030042918454935622, "percentage": 3.0, "elapsed_time": "1:16:25", "remaining_time": "1 day, 17:07:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 17941, "loss": 1.9346, "learning_rate": 9.99543385472489e-05, "epoch": 0.03009865670809877, "percentage": 3.01, "elapsed_time": "1:16:34", "remaining_time": "1 day, 17:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 541, "total_steps": 17941, "loss": 1.7214, "learning_rate": 9.995395730094083e-05, "epoch": 0.030154394961261915, "percentage": 3.02, "elapsed_time": "1:16:43", "remaining_time": "1 day, 17:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 542, "total_steps": 17941, "loss": 1.6459, "learning_rate": 9.99535744703845e-05, "epoch": 0.03021013321442506, "percentage": 3.02, "elapsed_time": "1:16:51", "remaining_time": "1 day, 17:07:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 543, "total_steps": 17941, "loss": 1.7781, "learning_rate": 9.995319005559202e-05, "epoch": 0.030265871467588207, "percentage": 3.03, "elapsed_time": "1:16:59", "remaining_time": "1 day, 17:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 544, "total_steps": 17941, "loss": 1.8662, "learning_rate": 9.995280405657561e-05, "epoch": 0.03032160972075135, "percentage": 3.03, "elapsed_time": "1:17:08", "remaining_time": "1 day, 17:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 545, "total_steps": 17941, "loss": 1.7803, "learning_rate": 9.99524164733475e-05, "epoch": 0.030377347973914497, "percentage": 3.04, "elapsed_time": "1:17:16", "remaining_time": "1 day, 17:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 546, "total_steps": 17941, "loss": 1.7344, "learning_rate": 9.995202730591997e-05, "epoch": 0.030433086227077643, "percentage": 3.04, "elapsed_time": "1:17:25", "remaining_time": "1 day, 17:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 547, "total_steps": 17941, "loss": 1.864, "learning_rate": 9.995163655430539e-05, "epoch": 0.03048882448024079, "percentage": 3.05, "elapsed_time": "1:17:33", "remaining_time": "1 day, 17:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 548, "total_steps": 17941, "loss": 1.711, "learning_rate": 9.995124421851614e-05, "epoch": 0.030544562733403936, "percentage": 3.05, "elapsed_time": "1:17:42", "remaining_time": "1 day, 17:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 549, "total_steps": 17941, "loss": 1.4136, "learning_rate": 9.995085029856464e-05, "epoch": 0.030600300986567082, "percentage": 3.06, "elapsed_time": "1:17:50", "remaining_time": "1 day, 17:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 17941, "loss": 1.8524, "learning_rate": 9.99504547944634e-05, "epoch": 0.030656039239730228, "percentage": 3.07, "elapsed_time": "1:17:59", "remaining_time": "1 day, 17:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 551, "total_steps": 17941, "loss": 1.5452, "learning_rate": 9.995005770622499e-05, "epoch": 0.03071177749289337, "percentage": 3.07, "elapsed_time": "1:18:07", "remaining_time": "1 day, 17:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 552, "total_steps": 17941, "loss": 1.8935, "learning_rate": 9.994965903386198e-05, "epoch": 0.030767515746056517, "percentage": 3.08, "elapsed_time": "1:18:16", "remaining_time": "1 day, 17:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 553, "total_steps": 17941, "loss": 1.9558, "learning_rate": 9.994925877738698e-05, "epoch": 0.030823253999219664, "percentage": 3.08, "elapsed_time": "1:18:24", "remaining_time": "1 day, 17:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 554, "total_steps": 17941, "loss": 1.6339, "learning_rate": 9.994885693681274e-05, "epoch": 0.03087899225238281, "percentage": 3.09, "elapsed_time": "1:18:33", "remaining_time": "1 day, 17:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 555, "total_steps": 17941, "loss": 1.6943, "learning_rate": 9.994845351215199e-05, "epoch": 0.030934730505545956, "percentage": 3.09, "elapsed_time": "1:18:41", "remaining_time": "1 day, 17:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 556, "total_steps": 17941, "loss": 1.9641, "learning_rate": 9.994804850341748e-05, "epoch": 0.030990468758709103, "percentage": 3.1, "elapsed_time": "1:18:50", "remaining_time": "1 day, 17:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 557, "total_steps": 17941, "loss": 1.9041, "learning_rate": 9.994764191062212e-05, "epoch": 0.03104620701187225, "percentage": 3.1, "elapsed_time": "1:18:58", "remaining_time": "1 day, 17:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 558, "total_steps": 17941, "loss": 1.6671, "learning_rate": 9.994723373377876e-05, "epoch": 0.031101945265035395, "percentage": 3.11, "elapsed_time": "1:19:06", "remaining_time": "1 day, 17:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 559, "total_steps": 17941, "loss": 1.6415, "learning_rate": 9.994682397290036e-05, "epoch": 0.031157683518198538, "percentage": 3.12, "elapsed_time": "1:19:15", "remaining_time": "1 day, 17:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 17941, "loss": 1.9253, "learning_rate": 9.99464126279999e-05, "epoch": 0.031213421771361684, "percentage": 3.12, "elapsed_time": "1:19:23", "remaining_time": "1 day, 17:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 561, "total_steps": 17941, "loss": 1.5449, "learning_rate": 9.994599969909047e-05, "epoch": 0.03126916002452483, "percentage": 3.13, "elapsed_time": "1:19:32", "remaining_time": "1 day, 17:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 562, "total_steps": 17941, "loss": 1.8665, "learning_rate": 9.99455851861851e-05, "epoch": 0.03132489827768798, "percentage": 3.13, "elapsed_time": "1:19:40", "remaining_time": "1 day, 17:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 563, "total_steps": 17941, "loss": 1.8442, "learning_rate": 9.9945169089297e-05, "epoch": 0.03138063653085112, "percentage": 3.14, "elapsed_time": "1:19:49", "remaining_time": "1 day, 17:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 564, "total_steps": 17941, "loss": 1.8436, "learning_rate": 9.994475140843933e-05, "epoch": 0.031436374784014266, "percentage": 3.14, "elapsed_time": "1:19:58", "remaining_time": "1 day, 17:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 565, "total_steps": 17941, "loss": 1.7172, "learning_rate": 9.994433214362532e-05, "epoch": 0.031492113037177416, "percentage": 3.15, "elapsed_time": "1:20:06", "remaining_time": "1 day, 17:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 566, "total_steps": 17941, "loss": 1.6919, "learning_rate": 9.994391129486833e-05, "epoch": 0.03154785129034056, "percentage": 3.15, "elapsed_time": "1:20:15", "remaining_time": "1 day, 17:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 567, "total_steps": 17941, "loss": 2.1026, "learning_rate": 9.994348886218163e-05, "epoch": 0.03160358954350371, "percentage": 3.16, "elapsed_time": "1:20:23", "remaining_time": "1 day, 17:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 568, "total_steps": 17941, "loss": 1.9232, "learning_rate": 9.994306484557868e-05, "epoch": 0.03165932779666685, "percentage": 3.17, "elapsed_time": "1:20:32", "remaining_time": "1 day, 17:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 569, "total_steps": 17941, "loss": 1.6408, "learning_rate": 9.99426392450729e-05, "epoch": 0.03171506604983, "percentage": 3.17, "elapsed_time": "1:20:40", "remaining_time": "1 day, 17:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 17941, "loss": 1.8562, "learning_rate": 9.994221206067777e-05, "epoch": 0.031770804302993144, "percentage": 3.18, "elapsed_time": "1:20:49", "remaining_time": "1 day, 17:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 571, "total_steps": 17941, "loss": 1.7045, "learning_rate": 9.994178329240686e-05, "epoch": 0.03182654255615629, "percentage": 3.18, "elapsed_time": "1:20:57", "remaining_time": "1 day, 17:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 572, "total_steps": 17941, "loss": 1.8015, "learning_rate": 9.994135294027378e-05, "epoch": 0.03188228080931944, "percentage": 3.19, "elapsed_time": "1:21:05", "remaining_time": "1 day, 17:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 573, "total_steps": 17941, "loss": 2.1681, "learning_rate": 9.994092100429215e-05, "epoch": 0.03193801906248258, "percentage": 3.19, "elapsed_time": "1:21:14", "remaining_time": "1 day, 17:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 574, "total_steps": 17941, "loss": 1.6771, "learning_rate": 9.994048748447569e-05, "epoch": 0.03199375731564573, "percentage": 3.2, "elapsed_time": "1:21:23", "remaining_time": "1 day, 17:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 575, "total_steps": 17941, "loss": 1.7157, "learning_rate": 9.994005238083815e-05, "epoch": 0.03204949556880887, "percentage": 3.2, "elapsed_time": "1:21:32", "remaining_time": "1 day, 17:02:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 576, "total_steps": 17941, "loss": 1.8095, "learning_rate": 9.99396156933933e-05, "epoch": 0.03210523382197202, "percentage": 3.21, "elapsed_time": "1:21:40", "remaining_time": "1 day, 17:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 577, "total_steps": 17941, "loss": 2.2013, "learning_rate": 9.993917742215502e-05, "epoch": 0.032160972075135165, "percentage": 3.22, "elapsed_time": "1:21:49", "remaining_time": "1 day, 17:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 578, "total_steps": 17941, "loss": 1.9967, "learning_rate": 9.993873756713719e-05, "epoch": 0.03221671032829831, "percentage": 3.22, "elapsed_time": "1:21:57", "remaining_time": "1 day, 17:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 579, "total_steps": 17941, "loss": 1.6328, "learning_rate": 9.993829612835378e-05, "epoch": 0.03227244858146146, "percentage": 3.23, "elapsed_time": "1:22:06", "remaining_time": "1 day, 17:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 17941, "loss": 1.9793, "learning_rate": 9.993785310581875e-05, "epoch": 0.0323281868346246, "percentage": 3.23, "elapsed_time": "1:22:14", "remaining_time": "1 day, 17:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 581, "total_steps": 17941, "loss": 1.7687, "learning_rate": 9.993740849954619e-05, "epoch": 0.03238392508778775, "percentage": 3.24, "elapsed_time": "1:22:23", "remaining_time": "1 day, 17:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 582, "total_steps": 17941, "loss": 1.8983, "learning_rate": 9.99369623095502e-05, "epoch": 0.03243966334095089, "percentage": 3.24, "elapsed_time": "1:22:31", "remaining_time": "1 day, 17:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 583, "total_steps": 17941, "loss": 1.6625, "learning_rate": 9.993651453584491e-05, "epoch": 0.03249540159411404, "percentage": 3.25, "elapsed_time": "1:22:39", "remaining_time": "1 day, 17:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 584, "total_steps": 17941, "loss": 1.7413, "learning_rate": 9.993606517844452e-05, "epoch": 0.032551139847277186, "percentage": 3.26, "elapsed_time": "1:22:49", "remaining_time": "1 day, 17:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 585, "total_steps": 17941, "loss": 1.875, "learning_rate": 9.993561423736331e-05, "epoch": 0.032606878100440335, "percentage": 3.26, "elapsed_time": "1:22:57", "remaining_time": "1 day, 17:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 586, "total_steps": 17941, "loss": 1.9669, "learning_rate": 9.993516171261555e-05, "epoch": 0.03266261635360348, "percentage": 3.27, "elapsed_time": "1:23:06", "remaining_time": "1 day, 17:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 587, "total_steps": 17941, "loss": 1.808, "learning_rate": 9.993470760421559e-05, "epoch": 0.03271835460676662, "percentage": 3.27, "elapsed_time": "1:23:14", "remaining_time": "1 day, 17:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 588, "total_steps": 17941, "loss": 1.7654, "learning_rate": 9.993425191217787e-05, "epoch": 0.03277409285992977, "percentage": 3.28, "elapsed_time": "1:23:23", "remaining_time": "1 day, 17:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 589, "total_steps": 17941, "loss": 1.8282, "learning_rate": 9.993379463651679e-05, "epoch": 0.032829831113092914, "percentage": 3.28, "elapsed_time": "1:23:31", "remaining_time": "1 day, 17:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 17941, "loss": 1.6477, "learning_rate": 9.99333357772469e-05, "epoch": 0.032885569366256064, "percentage": 3.29, "elapsed_time": "1:23:40", "remaining_time": "1 day, 17:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 591, "total_steps": 17941, "loss": 1.6518, "learning_rate": 9.993287533438273e-05, "epoch": 0.032941307619419206, "percentage": 3.29, "elapsed_time": "1:23:48", "remaining_time": "1 day, 17:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 592, "total_steps": 17941, "loss": 1.6485, "learning_rate": 9.993241330793888e-05, "epoch": 0.032997045872582356, "percentage": 3.3, "elapsed_time": "1:23:56", "remaining_time": "1 day, 17:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 593, "total_steps": 17941, "loss": 2.0397, "learning_rate": 9.993194969792999e-05, "epoch": 0.0330527841257455, "percentage": 3.31, "elapsed_time": "1:24:05", "remaining_time": "1 day, 16:59:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 594, "total_steps": 17941, "loss": 1.6368, "learning_rate": 9.99314845043708e-05, "epoch": 0.03310852237890864, "percentage": 3.31, "elapsed_time": "1:24:13", "remaining_time": "1 day, 16:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 595, "total_steps": 17941, "loss": 1.6886, "learning_rate": 9.993101772727602e-05, "epoch": 0.03316426063207179, "percentage": 3.32, "elapsed_time": "1:24:22", "remaining_time": "1 day, 16:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 596, "total_steps": 17941, "loss": 1.7587, "learning_rate": 9.993054936666048e-05, "epoch": 0.033219998885234935, "percentage": 3.32, "elapsed_time": "1:24:30", "remaining_time": "1 day, 16:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 597, "total_steps": 17941, "loss": 1.8861, "learning_rate": 9.993007942253905e-05, "epoch": 0.033275737138398084, "percentage": 3.33, "elapsed_time": "1:24:39", "remaining_time": "1 day, 16:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 598, "total_steps": 17941, "loss": 1.6563, "learning_rate": 9.99296078949266e-05, "epoch": 0.03333147539156123, "percentage": 3.33, "elapsed_time": "1:24:47", "remaining_time": "1 day, 16:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 599, "total_steps": 17941, "loss": 1.5493, "learning_rate": 9.99291347838381e-05, "epoch": 0.03338721364472438, "percentage": 3.34, "elapsed_time": "1:24:56", "remaining_time": "1 day, 16:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 17941, "loss": 2.1359, "learning_rate": 9.992866008928855e-05, "epoch": 0.03344295189788752, "percentage": 3.34, "elapsed_time": "1:25:04", "remaining_time": "1 day, 16:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 601, "total_steps": 17941, "loss": 2.0139, "learning_rate": 9.9928183811293e-05, "epoch": 0.03349869015105066, "percentage": 3.35, "elapsed_time": "1:25:13", "remaining_time": "1 day, 16:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 602, "total_steps": 17941, "loss": 1.6594, "learning_rate": 9.992770594986658e-05, "epoch": 0.03355442840421381, "percentage": 3.36, "elapsed_time": "1:25:21", "remaining_time": "1 day, 16:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 603, "total_steps": 17941, "loss": 1.8432, "learning_rate": 9.992722650502442e-05, "epoch": 0.033610166657376955, "percentage": 3.36, "elapsed_time": "1:25:29", "remaining_time": "1 day, 16:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 604, "total_steps": 17941, "loss": 1.8071, "learning_rate": 9.992674547678171e-05, "epoch": 0.033665904910540105, "percentage": 3.37, "elapsed_time": "1:25:38", "remaining_time": "1 day, 16:58:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 605, "total_steps": 17941, "loss": 1.6391, "learning_rate": 9.992626286515373e-05, "epoch": 0.03372164316370325, "percentage": 3.37, "elapsed_time": "1:25:46", "remaining_time": "1 day, 16:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 606, "total_steps": 17941, "loss": 2.0711, "learning_rate": 9.992577867015581e-05, "epoch": 0.0337773814168664, "percentage": 3.38, "elapsed_time": "1:25:55", "remaining_time": "1 day, 16:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 607, "total_steps": 17941, "loss": 1.5886, "learning_rate": 9.992529289180326e-05, "epoch": 0.03383311967002954, "percentage": 3.38, "elapsed_time": "1:26:03", "remaining_time": "1 day, 16:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 608, "total_steps": 17941, "loss": 1.9211, "learning_rate": 9.992480553011151e-05, "epoch": 0.03388885792319269, "percentage": 3.39, "elapsed_time": "1:26:12", "remaining_time": "1 day, 16:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 609, "total_steps": 17941, "loss": 1.819, "learning_rate": 9.9924316585096e-05, "epoch": 0.03394459617635583, "percentage": 3.39, "elapsed_time": "1:26:21", "remaining_time": "1 day, 16:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 17941, "loss": 1.6631, "learning_rate": 9.992382605677226e-05, "epoch": 0.034000334429518976, "percentage": 3.4, "elapsed_time": "1:26:30", "remaining_time": "1 day, 16:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 611, "total_steps": 17941, "loss": 2.0759, "learning_rate": 9.992333394515583e-05, "epoch": 0.034056072682682126, "percentage": 3.41, "elapsed_time": "1:26:38", "remaining_time": "1 day, 16:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 612, "total_steps": 17941, "loss": 1.6721, "learning_rate": 9.992284025026231e-05, "epoch": 0.03411181093584527, "percentage": 3.41, "elapsed_time": "1:26:46", "remaining_time": "1 day, 16:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 613, "total_steps": 17941, "loss": 1.807, "learning_rate": 9.992234497210737e-05, "epoch": 0.03416754918900842, "percentage": 3.42, "elapsed_time": "1:26:55", "remaining_time": "1 day, 16:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 614, "total_steps": 17941, "loss": 1.9095, "learning_rate": 9.992184811070673e-05, "epoch": 0.03422328744217156, "percentage": 3.42, "elapsed_time": "1:27:03", "remaining_time": "1 day, 16:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 615, "total_steps": 17941, "loss": 1.7303, "learning_rate": 9.992134966607612e-05, "epoch": 0.03427902569533471, "percentage": 3.43, "elapsed_time": "1:27:12", "remaining_time": "1 day, 16:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 616, "total_steps": 17941, "loss": 1.6339, "learning_rate": 9.992084963823136e-05, "epoch": 0.034334763948497854, "percentage": 3.43, "elapsed_time": "1:27:20", "remaining_time": "1 day, 16:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 617, "total_steps": 17941, "loss": 1.8881, "learning_rate": 9.992034802718832e-05, "epoch": 0.034390502201661, "percentage": 3.44, "elapsed_time": "1:27:29", "remaining_time": "1 day, 16:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 618, "total_steps": 17941, "loss": 1.9386, "learning_rate": 9.991984483296288e-05, "epoch": 0.03444624045482415, "percentage": 3.44, "elapsed_time": "1:27:37", "remaining_time": "1 day, 16:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 619, "total_steps": 17941, "loss": 2.0836, "learning_rate": 9.991934005557103e-05, "epoch": 0.03450197870798729, "percentage": 3.45, "elapsed_time": "1:27:45", "remaining_time": "1 day, 16:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 17941, "loss": 1.6526, "learning_rate": 9.991883369502874e-05, "epoch": 0.03455771696115044, "percentage": 3.46, "elapsed_time": "1:27:54", "remaining_time": "1 day, 16:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 621, "total_steps": 17941, "loss": 1.7326, "learning_rate": 9.991832575135211e-05, "epoch": 0.03461345521431358, "percentage": 3.46, "elapsed_time": "1:28:02", "remaining_time": "1 day, 16:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 622, "total_steps": 17941, "loss": 1.6398, "learning_rate": 9.991781622455723e-05, "epoch": 0.03466919346747673, "percentage": 3.47, "elapsed_time": "1:28:11", "remaining_time": "1 day, 16:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 623, "total_steps": 17941, "loss": 1.7927, "learning_rate": 9.991730511466026e-05, "epoch": 0.034724931720639875, "percentage": 3.47, "elapsed_time": "1:28:20", "remaining_time": "1 day, 16:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 624, "total_steps": 17941, "loss": 1.8047, "learning_rate": 9.991679242167741e-05, "epoch": 0.03478066997380302, "percentage": 3.48, "elapsed_time": "1:28:28", "remaining_time": "1 day, 16:55:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 625, "total_steps": 17941, "loss": 1.9146, "learning_rate": 9.991627814562494e-05, "epoch": 0.03483640822696617, "percentage": 3.48, "elapsed_time": "1:28:37", "remaining_time": "1 day, 16:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 626, "total_steps": 17941, "loss": 1.9453, "learning_rate": 9.991576228651915e-05, "epoch": 0.03489214648012931, "percentage": 3.49, "elapsed_time": "1:28:45", "remaining_time": "1 day, 16:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 627, "total_steps": 17941, "loss": 1.7143, "learning_rate": 9.991524484437642e-05, "epoch": 0.03494788473329246, "percentage": 3.49, "elapsed_time": "1:28:54", "remaining_time": "1 day, 16:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 628, "total_steps": 17941, "loss": 1.7371, "learning_rate": 9.991472581921316e-05, "epoch": 0.0350036229864556, "percentage": 3.5, "elapsed_time": "1:29:02", "remaining_time": "1 day, 16:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 629, "total_steps": 17941, "loss": 1.9569, "learning_rate": 9.99142052110458e-05, "epoch": 0.03505936123961875, "percentage": 3.51, "elapsed_time": "1:29:11", "remaining_time": "1 day, 16:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 17941, "loss": 1.4609, "learning_rate": 9.991368301989088e-05, "epoch": 0.035115099492781895, "percentage": 3.51, "elapsed_time": "1:29:19", "remaining_time": "1 day, 16:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 631, "total_steps": 17941, "loss": 1.7577, "learning_rate": 9.991315924576495e-05, "epoch": 0.035170837745945045, "percentage": 3.52, "elapsed_time": "1:29:28", "remaining_time": "1 day, 16:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 632, "total_steps": 17941, "loss": 1.8534, "learning_rate": 9.991263388868461e-05, "epoch": 0.03522657599910819, "percentage": 3.52, "elapsed_time": "1:29:36", "remaining_time": "1 day, 16:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 633, "total_steps": 17941, "loss": 1.6853, "learning_rate": 9.991210694866654e-05, "epoch": 0.03528231425227133, "percentage": 3.53, "elapsed_time": "1:29:44", "remaining_time": "1 day, 16:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 634, "total_steps": 17941, "loss": 1.8088, "learning_rate": 9.991157842572747e-05, "epoch": 0.03533805250543448, "percentage": 3.53, "elapsed_time": "1:29:53", "remaining_time": "1 day, 16:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 635, "total_steps": 17941, "loss": 1.9148, "learning_rate": 9.991104831988412e-05, "epoch": 0.035393790758597624, "percentage": 3.54, "elapsed_time": "1:30:01", "remaining_time": "1 day, 16:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 636, "total_steps": 17941, "loss": 1.7816, "learning_rate": 9.991051663115331e-05, "epoch": 0.03544952901176077, "percentage": 3.54, "elapsed_time": "1:30:10", "remaining_time": "1 day, 16:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 637, "total_steps": 17941, "loss": 1.8764, "learning_rate": 9.990998335955193e-05, "epoch": 0.035505267264923916, "percentage": 3.55, "elapsed_time": "1:30:18", "remaining_time": "1 day, 16:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 638, "total_steps": 17941, "loss": 1.6103, "learning_rate": 9.990944850509685e-05, "epoch": 0.035561005518087066, "percentage": 3.56, "elapsed_time": "1:30:28", "remaining_time": "1 day, 16:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 639, "total_steps": 17941, "loss": 1.7798, "learning_rate": 9.990891206780506e-05, "epoch": 0.03561674377125021, "percentage": 3.56, "elapsed_time": "1:30:36", "remaining_time": "1 day, 16:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 17941, "loss": 1.8771, "learning_rate": 9.990837404769358e-05, "epoch": 0.03567248202441335, "percentage": 3.57, "elapsed_time": "1:30:44", "remaining_time": "1 day, 16:53:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 641, "total_steps": 17941, "loss": 2.0712, "learning_rate": 9.990783444477946e-05, "epoch": 0.0357282202775765, "percentage": 3.57, "elapsed_time": "1:30:54", "remaining_time": "1 day, 16:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 642, "total_steps": 17941, "loss": 1.7693, "learning_rate": 9.990729325907981e-05, "epoch": 0.035783958530739644, "percentage": 3.58, "elapsed_time": "1:31:02", "remaining_time": "1 day, 16:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 643, "total_steps": 17941, "loss": 1.8675, "learning_rate": 9.99067504906118e-05, "epoch": 0.035839696783902794, "percentage": 3.58, "elapsed_time": "1:31:12", "remaining_time": "1 day, 16:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 644, "total_steps": 17941, "loss": 1.7557, "learning_rate": 9.990620613939263e-05, "epoch": 0.03589543503706594, "percentage": 3.59, "elapsed_time": "1:31:20", "remaining_time": "1 day, 16:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 645, "total_steps": 17941, "loss": 1.7199, "learning_rate": 9.990566020543959e-05, "epoch": 0.03595117329022909, "percentage": 3.6, "elapsed_time": "1:31:29", "remaining_time": "1 day, 16:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 646, "total_steps": 17941, "loss": 1.9156, "learning_rate": 9.990511268876998e-05, "epoch": 0.03600691154339223, "percentage": 3.6, "elapsed_time": "1:31:37", "remaining_time": "1 day, 16:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 647, "total_steps": 17941, "loss": 1.6183, "learning_rate": 9.990456358940115e-05, "epoch": 0.03606264979655538, "percentage": 3.61, "elapsed_time": "1:31:45", "remaining_time": "1 day, 16:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 648, "total_steps": 17941, "loss": 1.8159, "learning_rate": 9.990401290735053e-05, "epoch": 0.03611838804971852, "percentage": 3.61, "elapsed_time": "1:31:54", "remaining_time": "1 day, 16:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 649, "total_steps": 17941, "loss": 1.9306, "learning_rate": 9.990346064263558e-05, "epoch": 0.036174126302881665, "percentage": 3.62, "elapsed_time": "1:32:02", "remaining_time": "1 day, 16:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 17941, "loss": 1.4257, "learning_rate": 9.990290679527382e-05, "epoch": 0.036229864556044815, "percentage": 3.62, "elapsed_time": "1:32:11", "remaining_time": "1 day, 16:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 651, "total_steps": 17941, "loss": 1.6587, "learning_rate": 9.990235136528281e-05, "epoch": 0.03628560280920796, "percentage": 3.63, "elapsed_time": "1:32:19", "remaining_time": "1 day, 16:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 652, "total_steps": 17941, "loss": 1.9138, "learning_rate": 9.990179435268017e-05, "epoch": 0.03634134106237111, "percentage": 3.63, "elapsed_time": "1:32:28", "remaining_time": "1 day, 16:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 653, "total_steps": 17941, "loss": 2.0153, "learning_rate": 9.990123575748355e-05, "epoch": 0.03639707931553425, "percentage": 3.64, "elapsed_time": "1:32:36", "remaining_time": "1 day, 16:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 654, "total_steps": 17941, "loss": 1.9489, "learning_rate": 9.990067557971068e-05, "epoch": 0.0364528175686974, "percentage": 3.65, "elapsed_time": "1:32:45", "remaining_time": "1 day, 16:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 655, "total_steps": 17941, "loss": 1.6926, "learning_rate": 9.990011381937933e-05, "epoch": 0.03650855582186054, "percentage": 3.65, "elapsed_time": "1:32:53", "remaining_time": "1 day, 16:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 656, "total_steps": 17941, "loss": 1.7961, "learning_rate": 9.98995504765073e-05, "epoch": 0.036564294075023686, "percentage": 3.66, "elapsed_time": "1:33:02", "remaining_time": "1 day, 16:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 657, "total_steps": 17941, "loss": 1.8846, "learning_rate": 9.989898555111245e-05, "epoch": 0.036620032328186836, "percentage": 3.66, "elapsed_time": "1:33:10", "remaining_time": "1 day, 16:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 658, "total_steps": 17941, "loss": 1.7094, "learning_rate": 9.989841904321274e-05, "epoch": 0.03667577058134998, "percentage": 3.67, "elapsed_time": "1:33:18", "remaining_time": "1 day, 16:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 659, "total_steps": 17941, "loss": 1.8777, "learning_rate": 9.989785095282609e-05, "epoch": 0.03673150883451313, "percentage": 3.67, "elapsed_time": "1:33:27", "remaining_time": "1 day, 16:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 17941, "loss": 1.8686, "learning_rate": 9.989728127997052e-05, "epoch": 0.03678724708767627, "percentage": 3.68, "elapsed_time": "1:33:35", "remaining_time": "1 day, 16:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 661, "total_steps": 17941, "loss": 1.7542, "learning_rate": 9.989671002466412e-05, "epoch": 0.03684298534083942, "percentage": 3.68, "elapsed_time": "1:33:45", "remaining_time": "1 day, 16:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 662, "total_steps": 17941, "loss": 1.4741, "learning_rate": 9.989613718692501e-05, "epoch": 0.036898723594002564, "percentage": 3.69, "elapsed_time": "1:33:53", "remaining_time": "1 day, 16:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 663, "total_steps": 17941, "loss": 1.6816, "learning_rate": 9.989556276677133e-05, "epoch": 0.03695446184716571, "percentage": 3.7, "elapsed_time": "1:34:01", "remaining_time": "1 day, 16:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 664, "total_steps": 17941, "loss": 1.8716, "learning_rate": 9.989498676422131e-05, "epoch": 0.037010200100328856, "percentage": 3.7, "elapsed_time": "1:34:10", "remaining_time": "1 day, 16:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 665, "total_steps": 17941, "loss": 1.7686, "learning_rate": 9.989440917929321e-05, "epoch": 0.037065938353492, "percentage": 3.71, "elapsed_time": "1:34:18", "remaining_time": "1 day, 16:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 666, "total_steps": 17941, "loss": 2.116, "learning_rate": 9.989383001200536e-05, "epoch": 0.03712167660665515, "percentage": 3.71, "elapsed_time": "1:34:27", "remaining_time": "1 day, 16:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 667, "total_steps": 17941, "loss": 1.8245, "learning_rate": 9.989324926237613e-05, "epoch": 0.03717741485981829, "percentage": 3.72, "elapsed_time": "1:34:35", "remaining_time": "1 day, 16:49:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 668, "total_steps": 17941, "loss": 1.661, "learning_rate": 9.989266693042394e-05, "epoch": 0.03723315311298144, "percentage": 3.72, "elapsed_time": "1:34:44", "remaining_time": "1 day, 16:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 669, "total_steps": 17941, "loss": 1.6531, "learning_rate": 9.989208301616724e-05, "epoch": 0.037288891366144584, "percentage": 3.73, "elapsed_time": "1:34:52", "remaining_time": "1 day, 16:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 17941, "loss": 1.8691, "learning_rate": 9.989149751962455e-05, "epoch": 0.037344629619307734, "percentage": 3.73, "elapsed_time": "1:35:01", "remaining_time": "1 day, 16:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 671, "total_steps": 17941, "loss": 1.7718, "learning_rate": 9.989091044081445e-05, "epoch": 0.03740036787247088, "percentage": 3.74, "elapsed_time": "1:35:09", "remaining_time": "1 day, 16:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 672, "total_steps": 17941, "loss": 2.2129, "learning_rate": 9.989032177975554e-05, "epoch": 0.03745610612563402, "percentage": 3.75, "elapsed_time": "1:35:18", "remaining_time": "1 day, 16:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 673, "total_steps": 17941, "loss": 1.9084, "learning_rate": 9.988973153646654e-05, "epoch": 0.03751184437879717, "percentage": 3.75, "elapsed_time": "1:35:26", "remaining_time": "1 day, 16:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 674, "total_steps": 17941, "loss": 1.9491, "learning_rate": 9.988913971096611e-05, "epoch": 0.03756758263196031, "percentage": 3.76, "elapsed_time": "1:35:34", "remaining_time": "1 day, 16:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 675, "total_steps": 17941, "loss": 1.7176, "learning_rate": 9.988854630327305e-05, "epoch": 0.03762332088512346, "percentage": 3.76, "elapsed_time": "1:35:43", "remaining_time": "1 day, 16:48:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 676, "total_steps": 17941, "loss": 1.5625, "learning_rate": 9.988795131340616e-05, "epoch": 0.037679059138286605, "percentage": 3.77, "elapsed_time": "1:35:51", "remaining_time": "1 day, 16:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 677, "total_steps": 17941, "loss": 1.7208, "learning_rate": 9.988735474138433e-05, "epoch": 0.037734797391449755, "percentage": 3.77, "elapsed_time": "1:36:00", "remaining_time": "1 day, 16:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 678, "total_steps": 17941, "loss": 1.9678, "learning_rate": 9.988675658722648e-05, "epoch": 0.0377905356446129, "percentage": 3.78, "elapsed_time": "1:36:08", "remaining_time": "1 day, 16:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 679, "total_steps": 17941, "loss": 2.2239, "learning_rate": 9.988615685095155e-05, "epoch": 0.03784627389777604, "percentage": 3.78, "elapsed_time": "1:36:17", "remaining_time": "1 day, 16:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 17941, "loss": 1.6574, "learning_rate": 9.98855555325786e-05, "epoch": 0.03790201215093919, "percentage": 3.79, "elapsed_time": "1:36:25", "remaining_time": "1 day, 16:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 681, "total_steps": 17941, "loss": 1.6185, "learning_rate": 9.988495263212667e-05, "epoch": 0.03795775040410233, "percentage": 3.8, "elapsed_time": "1:36:34", "remaining_time": "1 day, 16:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 682, "total_steps": 17941, "loss": 2.0788, "learning_rate": 9.98843481496149e-05, "epoch": 0.03801348865726548, "percentage": 3.8, "elapsed_time": "1:36:42", "remaining_time": "1 day, 16:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 683, "total_steps": 17941, "loss": 1.7213, "learning_rate": 9.988374208506243e-05, "epoch": 0.038069226910428626, "percentage": 3.81, "elapsed_time": "1:36:51", "remaining_time": "1 day, 16:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 684, "total_steps": 17941, "loss": 1.9524, "learning_rate": 9.988313443848853e-05, "epoch": 0.038124965163591776, "percentage": 3.81, "elapsed_time": "1:36:59", "remaining_time": "1 day, 16:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 685, "total_steps": 17941, "loss": 1.9489, "learning_rate": 9.988252520991244e-05, "epoch": 0.03818070341675492, "percentage": 3.82, "elapsed_time": "1:37:08", "remaining_time": "1 day, 16:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 686, "total_steps": 17941, "loss": 1.8805, "learning_rate": 9.988191439935348e-05, "epoch": 0.03823644166991806, "percentage": 3.82, "elapsed_time": "1:37:16", "remaining_time": "1 day, 16:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 687, "total_steps": 17941, "loss": 1.916, "learning_rate": 9.988130200683103e-05, "epoch": 0.03829217992308121, "percentage": 3.83, "elapsed_time": "1:37:24", "remaining_time": "1 day, 16:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 688, "total_steps": 17941, "loss": 1.3248, "learning_rate": 9.98806880323645e-05, "epoch": 0.038347918176244354, "percentage": 3.83, "elapsed_time": "1:37:33", "remaining_time": "1 day, 16:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 689, "total_steps": 17941, "loss": 1.945, "learning_rate": 9.988007247597337e-05, "epoch": 0.038403656429407504, "percentage": 3.84, "elapsed_time": "1:37:41", "remaining_time": "1 day, 16:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 17941, "loss": 1.9159, "learning_rate": 9.987945533767717e-05, "epoch": 0.03845939468257065, "percentage": 3.85, "elapsed_time": "1:37:50", "remaining_time": "1 day, 16:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 691, "total_steps": 17941, "loss": 1.7105, "learning_rate": 9.987883661749548e-05, "epoch": 0.0385151329357338, "percentage": 3.85, "elapsed_time": "1:37:59", "remaining_time": "1 day, 16:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 692, "total_steps": 17941, "loss": 1.6607, "learning_rate": 9.987821631544789e-05, "epoch": 0.03857087118889694, "percentage": 3.86, "elapsed_time": "1:38:07", "remaining_time": "1 day, 16:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 693, "total_steps": 17941, "loss": 1.8422, "learning_rate": 9.987759443155409e-05, "epoch": 0.03862660944206009, "percentage": 3.86, "elapsed_time": "1:38:16", "remaining_time": "1 day, 16:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 694, "total_steps": 17941, "loss": 1.8393, "learning_rate": 9.98769709658338e-05, "epoch": 0.03868234769522323, "percentage": 3.87, "elapsed_time": "1:38:24", "remaining_time": "1 day, 16:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 695, "total_steps": 17941, "loss": 1.8819, "learning_rate": 9.987634591830679e-05, "epoch": 0.038738085948386375, "percentage": 3.87, "elapsed_time": "1:38:33", "remaining_time": "1 day, 16:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 696, "total_steps": 17941, "loss": 1.7872, "learning_rate": 9.987571928899288e-05, "epoch": 0.038793824201549525, "percentage": 3.88, "elapsed_time": "1:38:41", "remaining_time": "1 day, 16:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 697, "total_steps": 17941, "loss": 1.8078, "learning_rate": 9.987509107791196e-05, "epoch": 0.03884956245471267, "percentage": 3.88, "elapsed_time": "1:38:51", "remaining_time": "1 day, 16:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 698, "total_steps": 17941, "loss": 1.7838, "learning_rate": 9.987446128508396e-05, "epoch": 0.03890530070787582, "percentage": 3.89, "elapsed_time": "1:38:59", "remaining_time": "1 day, 16:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 699, "total_steps": 17941, "loss": 1.7299, "learning_rate": 9.98738299105288e-05, "epoch": 0.03896103896103896, "percentage": 3.9, "elapsed_time": "1:39:07", "remaining_time": "1 day, 16:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 17941, "loss": 1.7414, "learning_rate": 9.987319695426657e-05, "epoch": 0.03901677721420211, "percentage": 3.9, "elapsed_time": "1:39:16", "remaining_time": "1 day, 16:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 701, "total_steps": 17941, "loss": 1.8223, "learning_rate": 9.98725624163173e-05, "epoch": 0.03907251546736525, "percentage": 3.91, "elapsed_time": "1:39:24", "remaining_time": "1 day, 16:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 702, "total_steps": 17941, "loss": 1.791, "learning_rate": 9.987192629670112e-05, "epoch": 0.039128253720528396, "percentage": 3.91, "elapsed_time": "1:39:33", "remaining_time": "1 day, 16:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 703, "total_steps": 17941, "loss": 1.7428, "learning_rate": 9.987128859543824e-05, "epoch": 0.039183991973691545, "percentage": 3.92, "elapsed_time": "1:39:42", "remaining_time": "1 day, 16:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 704, "total_steps": 17941, "loss": 1.6701, "learning_rate": 9.987064931254884e-05, "epoch": 0.03923973022685469, "percentage": 3.92, "elapsed_time": "1:39:50", "remaining_time": "1 day, 16:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 705, "total_steps": 17941, "loss": 1.9592, "learning_rate": 9.987000844805319e-05, "epoch": 0.03929546848001784, "percentage": 3.93, "elapsed_time": "1:39:59", "remaining_time": "1 day, 16:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 706, "total_steps": 17941, "loss": 1.786, "learning_rate": 9.986936600197165e-05, "epoch": 0.03935120673318098, "percentage": 3.94, "elapsed_time": "1:40:07", "remaining_time": "1 day, 16:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 707, "total_steps": 17941, "loss": 1.7937, "learning_rate": 9.986872197432459e-05, "epoch": 0.03940694498634413, "percentage": 3.94, "elapsed_time": "1:40:16", "remaining_time": "1 day, 16:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 708, "total_steps": 17941, "loss": 1.8019, "learning_rate": 9.986807636513241e-05, "epoch": 0.039462683239507274, "percentage": 3.95, "elapsed_time": "1:40:25", "remaining_time": "1 day, 16:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 709, "total_steps": 17941, "loss": 1.9214, "learning_rate": 9.986742917441561e-05, "epoch": 0.039518421492670416, "percentage": 3.95, "elapsed_time": "1:40:33", "remaining_time": "1 day, 16:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 17941, "loss": 1.7621, "learning_rate": 9.986678040219469e-05, "epoch": 0.039574159745833566, "percentage": 3.96, "elapsed_time": "1:40:41", "remaining_time": "1 day, 16:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 711, "total_steps": 17941, "loss": 1.7435, "learning_rate": 9.986613004849024e-05, "epoch": 0.03962989799899671, "percentage": 3.96, "elapsed_time": "1:40:50", "remaining_time": "1 day, 16:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 712, "total_steps": 17941, "loss": 1.7199, "learning_rate": 9.986547811332289e-05, "epoch": 0.03968563625215986, "percentage": 3.97, "elapsed_time": "1:40:58", "remaining_time": "1 day, 16:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 713, "total_steps": 17941, "loss": 1.9435, "learning_rate": 9.986482459671332e-05, "epoch": 0.039741374505323, "percentage": 3.97, "elapsed_time": "1:41:07", "remaining_time": "1 day, 16:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 714, "total_steps": 17941, "loss": 1.799, "learning_rate": 9.986416949868223e-05, "epoch": 0.03979711275848615, "percentage": 3.98, "elapsed_time": "1:41:15", "remaining_time": "1 day, 16:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 715, "total_steps": 17941, "loss": 1.8455, "learning_rate": 9.986351281925042e-05, "epoch": 0.039852851011649294, "percentage": 3.99, "elapsed_time": "1:41:24", "remaining_time": "1 day, 16:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 716, "total_steps": 17941, "loss": 1.5848, "learning_rate": 9.986285455843872e-05, "epoch": 0.039908589264812444, "percentage": 3.99, "elapsed_time": "1:41:32", "remaining_time": "1 day, 16:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 717, "total_steps": 17941, "loss": 1.6527, "learning_rate": 9.986219471626797e-05, "epoch": 0.03996432751797559, "percentage": 4.0, "elapsed_time": "1:41:41", "remaining_time": "1 day, 16:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 718, "total_steps": 17941, "loss": 1.8773, "learning_rate": 9.986153329275913e-05, "epoch": 0.04002006577113873, "percentage": 4.0, "elapsed_time": "1:41:49", "remaining_time": "1 day, 16:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 719, "total_steps": 17941, "loss": 1.8737, "learning_rate": 9.986087028793316e-05, "epoch": 0.04007580402430188, "percentage": 4.01, "elapsed_time": "1:41:58", "remaining_time": "1 day, 16:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 17941, "loss": 1.9581, "learning_rate": 9.98602057018111e-05, "epoch": 0.04013154227746502, "percentage": 4.01, "elapsed_time": "1:42:06", "remaining_time": "1 day, 16:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 721, "total_steps": 17941, "loss": 1.887, "learning_rate": 9.985953953441402e-05, "epoch": 0.04018728053062817, "percentage": 4.02, "elapsed_time": "1:42:15", "remaining_time": "1 day, 16:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 722, "total_steps": 17941, "loss": 1.9981, "learning_rate": 9.985887178576305e-05, "epoch": 0.040243018783791315, "percentage": 4.02, "elapsed_time": "1:42:23", "remaining_time": "1 day, 16:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 723, "total_steps": 17941, "loss": 2.0195, "learning_rate": 9.985820245587936e-05, "epoch": 0.040298757036954465, "percentage": 4.03, "elapsed_time": "1:42:32", "remaining_time": "1 day, 16:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 724, "total_steps": 17941, "loss": 1.6134, "learning_rate": 9.985753154478418e-05, "epoch": 0.04035449529011761, "percentage": 4.04, "elapsed_time": "1:42:40", "remaining_time": "1 day, 16:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 725, "total_steps": 17941, "loss": 1.7501, "learning_rate": 9.98568590524988e-05, "epoch": 0.04041023354328075, "percentage": 4.04, "elapsed_time": "1:42:49", "remaining_time": "1 day, 16:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 726, "total_steps": 17941, "loss": 1.9164, "learning_rate": 9.985618497904453e-05, "epoch": 0.0404659717964439, "percentage": 4.05, "elapsed_time": "1:42:57", "remaining_time": "1 day, 16:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 727, "total_steps": 17941, "loss": 1.8159, "learning_rate": 9.985550932444275e-05, "epoch": 0.04052171004960704, "percentage": 4.05, "elapsed_time": "1:43:06", "remaining_time": "1 day, 16:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 728, "total_steps": 17941, "loss": 1.6184, "learning_rate": 9.98548320887149e-05, "epoch": 0.04057744830277019, "percentage": 4.06, "elapsed_time": "1:43:15", "remaining_time": "1 day, 16:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 729, "total_steps": 17941, "loss": 1.8383, "learning_rate": 9.985415327188245e-05, "epoch": 0.040633186555933336, "percentage": 4.06, "elapsed_time": "1:43:23", "remaining_time": "1 day, 16:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 17941, "loss": 1.67, "learning_rate": 9.985347287396692e-05, "epoch": 0.040688924809096486, "percentage": 4.07, "elapsed_time": "1:43:31", "remaining_time": "1 day, 16:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 731, "total_steps": 17941, "loss": 1.8185, "learning_rate": 9.98527908949899e-05, "epoch": 0.04074466306225963, "percentage": 4.07, "elapsed_time": "1:43:40", "remaining_time": "1 day, 16:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 732, "total_steps": 17941, "loss": 1.7909, "learning_rate": 9.985210733497301e-05, "epoch": 0.04080040131542277, "percentage": 4.08, "elapsed_time": "1:43:48", "remaining_time": "1 day, 16:40:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 733, "total_steps": 17941, "loss": 1.8615, "learning_rate": 9.985142219393795e-05, "epoch": 0.04085613956858592, "percentage": 4.09, "elapsed_time": "1:43:57", "remaining_time": "1 day, 16:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 734, "total_steps": 17941, "loss": 1.9337, "learning_rate": 9.985073547190641e-05, "epoch": 0.040911877821749064, "percentage": 4.09, "elapsed_time": "1:44:05", "remaining_time": "1 day, 16:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 735, "total_steps": 17941, "loss": 1.8345, "learning_rate": 9.98500471689002e-05, "epoch": 0.040967616074912214, "percentage": 4.1, "elapsed_time": "1:44:14", "remaining_time": "1 day, 16:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 736, "total_steps": 17941, "loss": 1.843, "learning_rate": 9.984935728494113e-05, "epoch": 0.04102335432807536, "percentage": 4.1, "elapsed_time": "1:44:22", "remaining_time": "1 day, 16:40:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 737, "total_steps": 17941, "loss": 1.9642, "learning_rate": 9.984866582005111e-05, "epoch": 0.041079092581238506, "percentage": 4.11, "elapsed_time": "1:44:31", "remaining_time": "1 day, 16:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 738, "total_steps": 17941, "loss": 1.8874, "learning_rate": 9.984797277425204e-05, "epoch": 0.04113483083440165, "percentage": 4.11, "elapsed_time": "1:44:39", "remaining_time": "1 day, 16:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 739, "total_steps": 17941, "loss": 1.9269, "learning_rate": 9.98472781475659e-05, "epoch": 0.0411905690875648, "percentage": 4.12, "elapsed_time": "1:44:48", "remaining_time": "1 day, 16:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 17941, "loss": 1.5059, "learning_rate": 9.984658194001474e-05, "epoch": 0.04124630734072794, "percentage": 4.12, "elapsed_time": "1:44:56", "remaining_time": "1 day, 16:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 741, "total_steps": 17941, "loss": 1.7386, "learning_rate": 9.984588415162061e-05, "epoch": 0.041302045593891085, "percentage": 4.13, "elapsed_time": "1:45:05", "remaining_time": "1 day, 16:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 742, "total_steps": 17941, "loss": 1.9075, "learning_rate": 9.984518478240568e-05, "epoch": 0.041357783847054234, "percentage": 4.14, "elapsed_time": "1:45:13", "remaining_time": "1 day, 16:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 743, "total_steps": 17941, "loss": 1.7812, "learning_rate": 9.98444838323921e-05, "epoch": 0.04141352210021738, "percentage": 4.14, "elapsed_time": "1:45:22", "remaining_time": "1 day, 16:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 744, "total_steps": 17941, "loss": 1.9155, "learning_rate": 9.984378130160208e-05, "epoch": 0.04146926035338053, "percentage": 4.15, "elapsed_time": "1:45:30", "remaining_time": "1 day, 16:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 745, "total_steps": 17941, "loss": 1.6661, "learning_rate": 9.984307719005795e-05, "epoch": 0.04152499860654367, "percentage": 4.15, "elapsed_time": "1:45:38", "remaining_time": "1 day, 16:38:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 746, "total_steps": 17941, "loss": 1.8456, "learning_rate": 9.984237149778201e-05, "epoch": 0.04158073685970682, "percentage": 4.16, "elapsed_time": "1:45:47", "remaining_time": "1 day, 16:38:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 747, "total_steps": 17941, "loss": 1.9118, "learning_rate": 9.984166422479663e-05, "epoch": 0.04163647511286996, "percentage": 4.16, "elapsed_time": "1:45:55", "remaining_time": "1 day, 16:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 748, "total_steps": 17941, "loss": 1.7721, "learning_rate": 9.984095537112429e-05, "epoch": 0.041692213366033105, "percentage": 4.17, "elapsed_time": "1:46:04", "remaining_time": "1 day, 16:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 749, "total_steps": 17941, "loss": 1.7968, "learning_rate": 9.984024493678743e-05, "epoch": 0.041747951619196255, "percentage": 4.17, "elapsed_time": "1:46:13", "remaining_time": "1 day, 16:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 17941, "loss": 1.858, "learning_rate": 9.983953292180857e-05, "epoch": 0.0418036898723594, "percentage": 4.18, "elapsed_time": "1:46:21", "remaining_time": "1 day, 16:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 751, "total_steps": 17941, "loss": 1.751, "learning_rate": 9.983881932621033e-05, "epoch": 0.04185942812552255, "percentage": 4.19, "elapsed_time": "1:46:29", "remaining_time": "1 day, 16:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 752, "total_steps": 17941, "loss": 1.5998, "learning_rate": 9.983810415001531e-05, "epoch": 0.04191516637868569, "percentage": 4.19, "elapsed_time": "1:46:38", "remaining_time": "1 day, 16:37:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 753, "total_steps": 17941, "loss": 1.7263, "learning_rate": 9.983738739324621e-05, "epoch": 0.04197090463184884, "percentage": 4.2, "elapsed_time": "1:46:47", "remaining_time": "1 day, 16:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 754, "total_steps": 17941, "loss": 1.9334, "learning_rate": 9.983666905592576e-05, "epoch": 0.04202664288501198, "percentage": 4.2, "elapsed_time": "1:46:55", "remaining_time": "1 day, 16:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 755, "total_steps": 17941, "loss": 1.6944, "learning_rate": 9.983594913807672e-05, "epoch": 0.042082381138175126, "percentage": 4.21, "elapsed_time": "1:47:03", "remaining_time": "1 day, 16:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 756, "total_steps": 17941, "loss": 2.042, "learning_rate": 9.983522763972196e-05, "epoch": 0.042138119391338276, "percentage": 4.21, "elapsed_time": "1:47:12", "remaining_time": "1 day, 16:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 757, "total_steps": 17941, "loss": 1.6733, "learning_rate": 9.983450456088432e-05, "epoch": 0.04219385764450142, "percentage": 4.22, "elapsed_time": "1:47:20", "remaining_time": "1 day, 16:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 758, "total_steps": 17941, "loss": 1.8463, "learning_rate": 9.983377990158676e-05, "epoch": 0.04224959589766457, "percentage": 4.22, "elapsed_time": "1:47:29", "remaining_time": "1 day, 16:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 759, "total_steps": 17941, "loss": 1.7602, "learning_rate": 9.983305366185223e-05, "epoch": 0.04230533415082771, "percentage": 4.23, "elapsed_time": "1:47:37", "remaining_time": "1 day, 16:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 17941, "loss": 1.8644, "learning_rate": 9.983232584170381e-05, "epoch": 0.04236107240399086, "percentage": 4.24, "elapsed_time": "1:47:46", "remaining_time": "1 day, 16:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 761, "total_steps": 17941, "loss": 1.6919, "learning_rate": 9.983159644116454e-05, "epoch": 0.042416810657154004, "percentage": 4.24, "elapsed_time": "1:47:54", "remaining_time": "1 day, 16:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 762, "total_steps": 17941, "loss": 1.9491, "learning_rate": 9.983086546025759e-05, "epoch": 0.042472548910317154, "percentage": 4.25, "elapsed_time": "1:48:03", "remaining_time": "1 day, 16:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 763, "total_steps": 17941, "loss": 1.9184, "learning_rate": 9.98301328990061e-05, "epoch": 0.0425282871634803, "percentage": 4.25, "elapsed_time": "1:48:11", "remaining_time": "1 day, 16:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 764, "total_steps": 17941, "loss": 1.826, "learning_rate": 9.982939875743333e-05, "epoch": 0.04258402541664344, "percentage": 4.26, "elapsed_time": "1:48:20", "remaining_time": "1 day, 16:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 765, "total_steps": 17941, "loss": 1.7675, "learning_rate": 9.982866303556258e-05, "epoch": 0.04263976366980659, "percentage": 4.26, "elapsed_time": "1:48:29", "remaining_time": "1 day, 16:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 766, "total_steps": 17941, "loss": 1.8539, "learning_rate": 9.982792573341713e-05, "epoch": 0.04269550192296973, "percentage": 4.27, "elapsed_time": "1:48:38", "remaining_time": "1 day, 16:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 767, "total_steps": 17941, "loss": 1.9196, "learning_rate": 9.982718685102039e-05, "epoch": 0.04275124017613288, "percentage": 4.28, "elapsed_time": "1:48:46", "remaining_time": "1 day, 16:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 768, "total_steps": 17941, "loss": 1.8719, "learning_rate": 9.982644638839583e-05, "epoch": 0.042806978429296025, "percentage": 4.28, "elapsed_time": "1:48:55", "remaining_time": "1 day, 16:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 769, "total_steps": 17941, "loss": 1.9678, "learning_rate": 9.982570434556686e-05, "epoch": 0.042862716682459175, "percentage": 4.29, "elapsed_time": "1:49:03", "remaining_time": "1 day, 16:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 17941, "loss": 1.7078, "learning_rate": 9.982496072255708e-05, "epoch": 0.04291845493562232, "percentage": 4.29, "elapsed_time": "1:49:12", "remaining_time": "1 day, 16:35:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 771, "total_steps": 17941, "loss": 1.8064, "learning_rate": 9.982421551939003e-05, "epoch": 0.04297419318878546, "percentage": 4.3, "elapsed_time": "1:49:20", "remaining_time": "1 day, 16:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 772, "total_steps": 17941, "loss": 1.6427, "learning_rate": 9.982346873608937e-05, "epoch": 0.04302993144194861, "percentage": 4.3, "elapsed_time": "1:49:29", "remaining_time": "1 day, 16:35:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 773, "total_steps": 17941, "loss": 1.7367, "learning_rate": 9.982272037267877e-05, "epoch": 0.04308566969511175, "percentage": 4.31, "elapsed_time": "1:49:38", "remaining_time": "1 day, 16:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 774, "total_steps": 17941, "loss": 1.6834, "learning_rate": 9.982197042918195e-05, "epoch": 0.0431414079482749, "percentage": 4.31, "elapsed_time": "1:49:46", "remaining_time": "1 day, 16:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 775, "total_steps": 17941, "loss": 1.7545, "learning_rate": 9.982121890562273e-05, "epoch": 0.043197146201438046, "percentage": 4.32, "elapsed_time": "1:49:55", "remaining_time": "1 day, 16:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 776, "total_steps": 17941, "loss": 1.784, "learning_rate": 9.982046580202493e-05, "epoch": 0.043252884454601195, "percentage": 4.33, "elapsed_time": "1:50:03", "remaining_time": "1 day, 16:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 777, "total_steps": 17941, "loss": 1.8328, "learning_rate": 9.98197111184124e-05, "epoch": 0.04330862270776434, "percentage": 4.33, "elapsed_time": "1:50:12", "remaining_time": "1 day, 16:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 778, "total_steps": 17941, "loss": 1.8808, "learning_rate": 9.981895485480912e-05, "epoch": 0.04336436096092749, "percentage": 4.34, "elapsed_time": "1:50:20", "remaining_time": "1 day, 16:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 779, "total_steps": 17941, "loss": 1.577, "learning_rate": 9.981819701123907e-05, "epoch": 0.04342009921409063, "percentage": 4.34, "elapsed_time": "1:50:29", "remaining_time": "1 day, 16:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 17941, "loss": 1.6959, "learning_rate": 9.981743758772625e-05, "epoch": 0.043475837467253774, "percentage": 4.35, "elapsed_time": "1:50:37", "remaining_time": "1 day, 16:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 781, "total_steps": 17941, "loss": 1.6635, "learning_rate": 9.981667658429477e-05, "epoch": 0.043531575720416923, "percentage": 4.35, "elapsed_time": "1:50:46", "remaining_time": "1 day, 16:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 782, "total_steps": 17941, "loss": 1.854, "learning_rate": 9.981591400096877e-05, "epoch": 0.043587313973580066, "percentage": 4.36, "elapsed_time": "1:50:55", "remaining_time": "1 day, 16:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 783, "total_steps": 17941, "loss": 1.781, "learning_rate": 9.98151498377724e-05, "epoch": 0.043643052226743216, "percentage": 4.36, "elapsed_time": "1:51:03", "remaining_time": "1 day, 16:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 784, "total_steps": 17941, "loss": 1.6629, "learning_rate": 9.981438409472994e-05, "epoch": 0.04369879047990636, "percentage": 4.37, "elapsed_time": "1:51:12", "remaining_time": "1 day, 16:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 785, "total_steps": 17941, "loss": 1.7694, "learning_rate": 9.981361677186566e-05, "epoch": 0.04375452873306951, "percentage": 4.38, "elapsed_time": "1:51:20", "remaining_time": "1 day, 16:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 786, "total_steps": 17941, "loss": 1.7242, "learning_rate": 9.981284786920388e-05, "epoch": 0.04381026698623265, "percentage": 4.38, "elapsed_time": "1:51:29", "remaining_time": "1 day, 16:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 787, "total_steps": 17941, "loss": 1.6032, "learning_rate": 9.981207738676899e-05, "epoch": 0.043866005239395794, "percentage": 4.39, "elapsed_time": "1:51:37", "remaining_time": "1 day, 16:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 788, "total_steps": 17941, "loss": 1.8624, "learning_rate": 9.981130532458544e-05, "epoch": 0.043921743492558944, "percentage": 4.39, "elapsed_time": "1:51:46", "remaining_time": "1 day, 16:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 789, "total_steps": 17941, "loss": 1.6831, "learning_rate": 9.98105316826777e-05, "epoch": 0.04397748174572209, "percentage": 4.4, "elapsed_time": "1:51:54", "remaining_time": "1 day, 16:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 17941, "loss": 1.7933, "learning_rate": 9.980975646107032e-05, "epoch": 0.04403321999888524, "percentage": 4.4, "elapsed_time": "1:52:03", "remaining_time": "1 day, 16:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 791, "total_steps": 17941, "loss": 1.6383, "learning_rate": 9.980897965978787e-05, "epoch": 0.04408895825204838, "percentage": 4.41, "elapsed_time": "1:52:11", "remaining_time": "1 day, 16:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 792, "total_steps": 17941, "loss": 1.8771, "learning_rate": 9.980820127885497e-05, "epoch": 0.04414469650521153, "percentage": 4.41, "elapsed_time": "1:52:20", "remaining_time": "1 day, 16:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 793, "total_steps": 17941, "loss": 2.0977, "learning_rate": 9.980742131829635e-05, "epoch": 0.04420043475837467, "percentage": 4.42, "elapsed_time": "1:52:28", "remaining_time": "1 day, 16:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 794, "total_steps": 17941, "loss": 1.9813, "learning_rate": 9.980663977813672e-05, "epoch": 0.044256173011537815, "percentage": 4.43, "elapsed_time": "1:52:36", "remaining_time": "1 day, 16:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 795, "total_steps": 17941, "loss": 1.7362, "learning_rate": 9.980585665840087e-05, "epoch": 0.044311911264700965, "percentage": 4.43, "elapsed_time": "1:52:45", "remaining_time": "1 day, 16:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 796, "total_steps": 17941, "loss": 1.5489, "learning_rate": 9.980507195911363e-05, "epoch": 0.04436764951786411, "percentage": 4.44, "elapsed_time": "1:52:54", "remaining_time": "1 day, 16:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 797, "total_steps": 17941, "loss": 1.9545, "learning_rate": 9.980428568029989e-05, "epoch": 0.04442338777102726, "percentage": 4.44, "elapsed_time": "1:53:02", "remaining_time": "1 day, 16:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 798, "total_steps": 17941, "loss": 1.6321, "learning_rate": 9.98034978219846e-05, "epoch": 0.0444791260241904, "percentage": 4.45, "elapsed_time": "1:53:10", "remaining_time": "1 day, 16:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 799, "total_steps": 17941, "loss": 1.7045, "learning_rate": 9.980270838419273e-05, "epoch": 0.04453486427735355, "percentage": 4.45, "elapsed_time": "1:53:19", "remaining_time": "1 day, 16:31:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 17941, "loss": 1.6414, "learning_rate": 9.98019173669493e-05, "epoch": 0.04459060253051669, "percentage": 4.46, "elapsed_time": "1:53:27", "remaining_time": "1 day, 16:31:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 801, "total_steps": 17941, "loss": 1.8683, "learning_rate": 9.980112477027942e-05, "epoch": 0.04464634078367984, "percentage": 4.46, "elapsed_time": "1:53:36", "remaining_time": "1 day, 16:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 802, "total_steps": 17941, "loss": 1.7773, "learning_rate": 9.980033059420826e-05, "epoch": 0.044702079036842986, "percentage": 4.47, "elapsed_time": "1:53:44", "remaining_time": "1 day, 16:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 803, "total_steps": 17941, "loss": 2.0631, "learning_rate": 9.979953483876095e-05, "epoch": 0.04475781729000613, "percentage": 4.48, "elapsed_time": "1:53:53", "remaining_time": "1 day, 16:30:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 804, "total_steps": 17941, "loss": 2.0601, "learning_rate": 9.979873750396273e-05, "epoch": 0.04481355554316928, "percentage": 4.48, "elapsed_time": "1:54:02", "remaining_time": "1 day, 16:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 805, "total_steps": 17941, "loss": 1.7687, "learning_rate": 9.979793858983891e-05, "epoch": 0.04486929379633242, "percentage": 4.49, "elapsed_time": "1:54:11", "remaining_time": "1 day, 16:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 806, "total_steps": 17941, "loss": 1.9662, "learning_rate": 9.979713809641482e-05, "epoch": 0.04492503204949557, "percentage": 4.49, "elapsed_time": "1:54:19", "remaining_time": "1 day, 16:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 807, "total_steps": 17941, "loss": 1.7011, "learning_rate": 9.979633602371586e-05, "epoch": 0.044980770302658714, "percentage": 4.5, "elapsed_time": "1:54:28", "remaining_time": "1 day, 16:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 808, "total_steps": 17941, "loss": 1.7632, "learning_rate": 9.979553237176744e-05, "epoch": 0.045036508555821864, "percentage": 4.5, "elapsed_time": "1:54:36", "remaining_time": "1 day, 16:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 809, "total_steps": 17941, "loss": 1.917, "learning_rate": 9.979472714059506e-05, "epoch": 0.045092246808985006, "percentage": 4.51, "elapsed_time": "1:54:45", "remaining_time": "1 day, 16:30:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 17941, "loss": 1.946, "learning_rate": 9.979392033022427e-05, "epoch": 0.04514798506214815, "percentage": 4.51, "elapsed_time": "1:54:53", "remaining_time": "1 day, 16:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 811, "total_steps": 17941, "loss": 1.8072, "learning_rate": 9.979311194068064e-05, "epoch": 0.0452037233153113, "percentage": 4.52, "elapsed_time": "1:55:02", "remaining_time": "1 day, 16:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 812, "total_steps": 17941, "loss": 1.6243, "learning_rate": 9.979230197198981e-05, "epoch": 0.04525946156847444, "percentage": 4.53, "elapsed_time": "1:55:10", "remaining_time": "1 day, 16:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 813, "total_steps": 17941, "loss": 1.7733, "learning_rate": 9.979149042417749e-05, "epoch": 0.04531519982163759, "percentage": 4.53, "elapsed_time": "1:55:19", "remaining_time": "1 day, 16:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 814, "total_steps": 17941, "loss": 1.821, "learning_rate": 9.979067729726938e-05, "epoch": 0.045370938074800735, "percentage": 4.54, "elapsed_time": "1:55:27", "remaining_time": "1 day, 16:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 815, "total_steps": 17941, "loss": 1.8286, "learning_rate": 9.978986259129129e-05, "epoch": 0.045426676327963884, "percentage": 4.54, "elapsed_time": "1:55:35", "remaining_time": "1 day, 16:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 816, "total_steps": 17941, "loss": 1.7967, "learning_rate": 9.978904630626904e-05, "epoch": 0.04548241458112703, "percentage": 4.55, "elapsed_time": "1:55:44", "remaining_time": "1 day, 16:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 817, "total_steps": 17941, "loss": 1.9883, "learning_rate": 9.978822844222855e-05, "epoch": 0.04553815283429017, "percentage": 4.55, "elapsed_time": "1:55:53", "remaining_time": "1 day, 16:29:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 818, "total_steps": 17941, "loss": 1.8694, "learning_rate": 9.978740899919574e-05, "epoch": 0.04559389108745332, "percentage": 4.56, "elapsed_time": "1:56:01", "remaining_time": "1 day, 16:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 819, "total_steps": 17941, "loss": 1.714, "learning_rate": 9.978658797719658e-05, "epoch": 0.04564962934061646, "percentage": 4.56, "elapsed_time": "1:56:10", "remaining_time": "1 day, 16:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 17941, "loss": 1.8288, "learning_rate": 9.978576537625714e-05, "epoch": 0.04570536759377961, "percentage": 4.57, "elapsed_time": "1:56:19", "remaining_time": "1 day, 16:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 821, "total_steps": 17941, "loss": 2.093, "learning_rate": 9.97849411964035e-05, "epoch": 0.045761105846942755, "percentage": 4.58, "elapsed_time": "1:56:27", "remaining_time": "1 day, 16:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 822, "total_steps": 17941, "loss": 1.6607, "learning_rate": 9.978411543766177e-05, "epoch": 0.045816844100105905, "percentage": 4.58, "elapsed_time": "1:56:36", "remaining_time": "1 day, 16:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 823, "total_steps": 17941, "loss": 1.9762, "learning_rate": 9.978328810005816e-05, "epoch": 0.04587258235326905, "percentage": 4.59, "elapsed_time": "1:56:45", "remaining_time": "1 day, 16:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 824, "total_steps": 17941, "loss": 1.6018, "learning_rate": 9.978245918361893e-05, "epoch": 0.0459283206064322, "percentage": 4.59, "elapsed_time": "1:56:54", "remaining_time": "1 day, 16:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 825, "total_steps": 17941, "loss": 1.8532, "learning_rate": 9.978162868837034e-05, "epoch": 0.04598405885959534, "percentage": 4.6, "elapsed_time": "1:57:02", "remaining_time": "1 day, 16:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 826, "total_steps": 17941, "loss": 1.7551, "learning_rate": 9.978079661433873e-05, "epoch": 0.04603979711275848, "percentage": 4.6, "elapsed_time": "1:57:11", "remaining_time": "1 day, 16:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 827, "total_steps": 17941, "loss": 1.7463, "learning_rate": 9.977996296155049e-05, "epoch": 0.04609553536592163, "percentage": 4.61, "elapsed_time": "1:57:19", "remaining_time": "1 day, 16:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 828, "total_steps": 17941, "loss": 1.6216, "learning_rate": 9.977912773003206e-05, "epoch": 0.046151273619084776, "percentage": 4.62, "elapsed_time": "1:57:28", "remaining_time": "1 day, 16:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 829, "total_steps": 17941, "loss": 1.9011, "learning_rate": 9.977829091980995e-05, "epoch": 0.046207011872247926, "percentage": 4.62, "elapsed_time": "1:57:36", "remaining_time": "1 day, 16:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 17941, "loss": 1.3583, "learning_rate": 9.977745253091067e-05, "epoch": 0.04626275012541107, "percentage": 4.63, "elapsed_time": "1:57:45", "remaining_time": "1 day, 16:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 831, "total_steps": 17941, "loss": 1.7256, "learning_rate": 9.977661256336081e-05, "epoch": 0.04631848837857422, "percentage": 4.63, "elapsed_time": "1:57:53", "remaining_time": "1 day, 16:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 832, "total_steps": 17941, "loss": 1.8484, "learning_rate": 9.977577101718701e-05, "epoch": 0.04637422663173736, "percentage": 4.64, "elapsed_time": "1:58:01", "remaining_time": "1 day, 16:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 833, "total_steps": 17941, "loss": 1.6564, "learning_rate": 9.977492789241598e-05, "epoch": 0.046429964884900504, "percentage": 4.64, "elapsed_time": "1:58:10", "remaining_time": "1 day, 16:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 834, "total_steps": 17941, "loss": 1.721, "learning_rate": 9.977408318907444e-05, "epoch": 0.046485703138063654, "percentage": 4.65, "elapsed_time": "1:58:19", "remaining_time": "1 day, 16:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 835, "total_steps": 17941, "loss": 2.0474, "learning_rate": 9.97732369071892e-05, "epoch": 0.0465414413912268, "percentage": 4.65, "elapsed_time": "1:58:28", "remaining_time": "1 day, 16:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 836, "total_steps": 17941, "loss": 1.4078, "learning_rate": 9.977238904678707e-05, "epoch": 0.04659717964438995, "percentage": 4.66, "elapsed_time": "1:58:36", "remaining_time": "1 day, 16:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 837, "total_steps": 17941, "loss": 1.5402, "learning_rate": 9.977153960789497e-05, "epoch": 0.04665291789755309, "percentage": 4.67, "elapsed_time": "1:58:45", "remaining_time": "1 day, 16:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 838, "total_steps": 17941, "loss": 1.8641, "learning_rate": 9.97706885905398e-05, "epoch": 0.04670865615071624, "percentage": 4.67, "elapsed_time": "1:58:53", "remaining_time": "1 day, 16:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 839, "total_steps": 17941, "loss": 1.8055, "learning_rate": 9.976983599474857e-05, "epoch": 0.04676439440387938, "percentage": 4.68, "elapsed_time": "1:59:02", "remaining_time": "1 day, 16:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 17941, "loss": 1.5263, "learning_rate": 9.976898182054832e-05, "epoch": 0.046820132657042525, "percentage": 4.68, "elapsed_time": "1:59:10", "remaining_time": "1 day, 16:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 841, "total_steps": 17941, "loss": 1.7926, "learning_rate": 9.976812606796615e-05, "epoch": 0.046875870910205675, "percentage": 4.69, "elapsed_time": "1:59:18", "remaining_time": "1 day, 16:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 842, "total_steps": 17941, "loss": 1.6341, "learning_rate": 9.976726873702918e-05, "epoch": 0.04693160916336882, "percentage": 4.69, "elapsed_time": "1:59:27", "remaining_time": "1 day, 16:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 843, "total_steps": 17941, "loss": 1.882, "learning_rate": 9.976640982776461e-05, "epoch": 0.04698734741653197, "percentage": 4.7, "elapsed_time": "1:59:36", "remaining_time": "1 day, 16:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 844, "total_steps": 17941, "loss": 1.6004, "learning_rate": 9.97655493401997e-05, "epoch": 0.04704308566969511, "percentage": 4.7, "elapsed_time": "1:59:44", "remaining_time": "1 day, 16:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 845, "total_steps": 17941, "loss": 1.7355, "learning_rate": 9.97646872743617e-05, "epoch": 0.04709882392285826, "percentage": 4.71, "elapsed_time": "1:59:52", "remaining_time": "1 day, 16:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 846, "total_steps": 17941, "loss": 1.9073, "learning_rate": 9.976382363027797e-05, "epoch": 0.0471545621760214, "percentage": 4.72, "elapsed_time": "2:00:01", "remaining_time": "1 day, 16:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 847, "total_steps": 17941, "loss": 1.6875, "learning_rate": 9.976295840797589e-05, "epoch": 0.04721030042918455, "percentage": 4.72, "elapsed_time": "2:00:09", "remaining_time": "1 day, 16:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 848, "total_steps": 17941, "loss": 1.6172, "learning_rate": 9.976209160748292e-05, "epoch": 0.047266038682347696, "percentage": 4.73, "elapsed_time": "2:00:18", "remaining_time": "1 day, 16:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 849, "total_steps": 17941, "loss": 1.6371, "learning_rate": 9.976122322882653e-05, "epoch": 0.04732177693551084, "percentage": 4.73, "elapsed_time": "2:00:26", "remaining_time": "1 day, 16:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 17941, "loss": 1.9283, "learning_rate": 9.976035327203427e-05, "epoch": 0.04737751518867399, "percentage": 4.74, "elapsed_time": "2:00:35", "remaining_time": "1 day, 16:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 851, "total_steps": 17941, "loss": 2.0407, "learning_rate": 9.975948173713374e-05, "epoch": 0.04743325344183713, "percentage": 4.74, "elapsed_time": "2:00:43", "remaining_time": "1 day, 16:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 852, "total_steps": 17941, "loss": 1.7475, "learning_rate": 9.975860862415254e-05, "epoch": 0.04748899169500028, "percentage": 4.75, "elapsed_time": "2:00:52", "remaining_time": "1 day, 16:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 853, "total_steps": 17941, "loss": 1.7922, "learning_rate": 9.975773393311841e-05, "epoch": 0.047544729948163424, "percentage": 4.75, "elapsed_time": "2:01:00", "remaining_time": "1 day, 16:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 854, "total_steps": 17941, "loss": 1.7012, "learning_rate": 9.975685766405906e-05, "epoch": 0.04760046820132657, "percentage": 4.76, "elapsed_time": "2:01:09", "remaining_time": "1 day, 16:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 855, "total_steps": 17941, "loss": 1.6647, "learning_rate": 9.975597981700228e-05, "epoch": 0.047656206454489716, "percentage": 4.77, "elapsed_time": "2:01:17", "remaining_time": "1 day, 16:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 856, "total_steps": 17941, "loss": 1.5522, "learning_rate": 9.975510039197592e-05, "epoch": 0.04771194470765286, "percentage": 4.77, "elapsed_time": "2:01:26", "remaining_time": "1 day, 16:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 857, "total_steps": 17941, "loss": 1.5235, "learning_rate": 9.975421938900789e-05, "epoch": 0.04776768296081601, "percentage": 4.78, "elapsed_time": "2:01:34", "remaining_time": "1 day, 16:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 858, "total_steps": 17941, "loss": 1.8876, "learning_rate": 9.975333680812609e-05, "epoch": 0.04782342121397915, "percentage": 4.78, "elapsed_time": "2:01:43", "remaining_time": "1 day, 16:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 859, "total_steps": 17941, "loss": 1.8422, "learning_rate": 9.975245264935852e-05, "epoch": 0.0478791594671423, "percentage": 4.79, "elapsed_time": "2:01:51", "remaining_time": "1 day, 16:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 17941, "loss": 1.7702, "learning_rate": 9.975156691273324e-05, "epoch": 0.047934897720305444, "percentage": 4.79, "elapsed_time": "2:02:00", "remaining_time": "1 day, 16:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 861, "total_steps": 17941, "loss": 1.9332, "learning_rate": 9.975067959827833e-05, "epoch": 0.047990635973468594, "percentage": 4.8, "elapsed_time": "2:02:08", "remaining_time": "1 day, 16:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 862, "total_steps": 17941, "loss": 1.7497, "learning_rate": 9.974979070602192e-05, "epoch": 0.04804637422663174, "percentage": 4.8, "elapsed_time": "2:02:17", "remaining_time": "1 day, 16:22:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 863, "total_steps": 17941, "loss": 2.0405, "learning_rate": 9.974890023599222e-05, "epoch": 0.04810211247979488, "percentage": 4.81, "elapsed_time": "2:02:26", "remaining_time": "1 day, 16:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 864, "total_steps": 17941, "loss": 1.7609, "learning_rate": 9.974800818821746e-05, "epoch": 0.04815785073295803, "percentage": 4.82, "elapsed_time": "2:02:34", "remaining_time": "1 day, 16:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 865, "total_steps": 17941, "loss": 1.9515, "learning_rate": 9.974711456272593e-05, "epoch": 0.04821358898612117, "percentage": 4.82, "elapsed_time": "2:02:43", "remaining_time": "1 day, 16:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 866, "total_steps": 17941, "loss": 1.645, "learning_rate": 9.974621935954597e-05, "epoch": 0.04826932723928432, "percentage": 4.83, "elapsed_time": "2:02:52", "remaining_time": "1 day, 16:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 867, "total_steps": 17941, "loss": 1.7104, "learning_rate": 9.974532257870596e-05, "epoch": 0.048325065492447465, "percentage": 4.83, "elapsed_time": "2:03:01", "remaining_time": "1 day, 16:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 868, "total_steps": 17941, "loss": 1.8043, "learning_rate": 9.974442422023438e-05, "epoch": 0.048380803745610615, "percentage": 4.84, "elapsed_time": "2:03:09", "remaining_time": "1 day, 16:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 869, "total_steps": 17941, "loss": 1.9662, "learning_rate": 9.974352428415968e-05, "epoch": 0.04843654199877376, "percentage": 4.84, "elapsed_time": "2:03:18", "remaining_time": "1 day, 16:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 17941, "loss": 1.8876, "learning_rate": 9.974262277051041e-05, "epoch": 0.04849228025193691, "percentage": 4.85, "elapsed_time": "2:03:26", "remaining_time": "1 day, 16:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 871, "total_steps": 17941, "loss": 1.5996, "learning_rate": 9.974171967931519e-05, "epoch": 0.04854801850510005, "percentage": 4.85, "elapsed_time": "2:03:35", "remaining_time": "1 day, 16:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 872, "total_steps": 17941, "loss": 1.6907, "learning_rate": 9.974081501060259e-05, "epoch": 0.04860375675826319, "percentage": 4.86, "elapsed_time": "2:03:43", "remaining_time": "1 day, 16:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 873, "total_steps": 17941, "loss": 1.7377, "learning_rate": 9.973990876440138e-05, "epoch": 0.04865949501142634, "percentage": 4.87, "elapsed_time": "2:03:52", "remaining_time": "1 day, 16:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 874, "total_steps": 17941, "loss": 1.8001, "learning_rate": 9.973900094074027e-05, "epoch": 0.048715233264589486, "percentage": 4.87, "elapsed_time": "2:04:01", "remaining_time": "1 day, 16:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 875, "total_steps": 17941, "loss": 1.8128, "learning_rate": 9.973809153964804e-05, "epoch": 0.048770971517752636, "percentage": 4.88, "elapsed_time": "2:04:09", "remaining_time": "1 day, 16:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 876, "total_steps": 17941, "loss": 2.0648, "learning_rate": 9.973718056115354e-05, "epoch": 0.04882670977091578, "percentage": 4.88, "elapsed_time": "2:04:17", "remaining_time": "1 day, 16:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 877, "total_steps": 17941, "loss": 1.8552, "learning_rate": 9.973626800528566e-05, "epoch": 0.04888244802407893, "percentage": 4.89, "elapsed_time": "2:04:26", "remaining_time": "1 day, 16:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 878, "total_steps": 17941, "loss": 1.577, "learning_rate": 9.973535387207333e-05, "epoch": 0.04893818627724207, "percentage": 4.89, "elapsed_time": "2:04:34", "remaining_time": "1 day, 16:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 879, "total_steps": 17941, "loss": 1.66, "learning_rate": 9.973443816154557e-05, "epoch": 0.048993924530405214, "percentage": 4.9, "elapsed_time": "2:04:43", "remaining_time": "1 day, 16:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 17941, "loss": 1.7623, "learning_rate": 9.97335208737314e-05, "epoch": 0.049049662783568364, "percentage": 4.9, "elapsed_time": "2:04:51", "remaining_time": "1 day, 16:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 881, "total_steps": 17941, "loss": 1.8681, "learning_rate": 9.973260200865991e-05, "epoch": 0.04910540103673151, "percentage": 4.91, "elapsed_time": "2:05:00", "remaining_time": "1 day, 16:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 882, "total_steps": 17941, "loss": 1.9225, "learning_rate": 9.973168156636025e-05, "epoch": 0.049161139289894656, "percentage": 4.92, "elapsed_time": "2:05:08", "remaining_time": "1 day, 16:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 883, "total_steps": 17941, "loss": 1.8308, "learning_rate": 9.97307595468616e-05, "epoch": 0.0492168775430578, "percentage": 4.92, "elapsed_time": "2:05:17", "remaining_time": "1 day, 16:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 884, "total_steps": 17941, "loss": 1.5791, "learning_rate": 9.97298359501932e-05, "epoch": 0.04927261579622095, "percentage": 4.93, "elapsed_time": "2:05:25", "remaining_time": "1 day, 16:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 885, "total_steps": 17941, "loss": 1.7279, "learning_rate": 9.972891077638438e-05, "epoch": 0.04932835404938409, "percentage": 4.93, "elapsed_time": "2:05:34", "remaining_time": "1 day, 16:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 886, "total_steps": 17941, "loss": 1.5131, "learning_rate": 9.972798402546441e-05, "epoch": 0.049384092302547235, "percentage": 4.94, "elapsed_time": "2:05:42", "remaining_time": "1 day, 16:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 887, "total_steps": 17941, "loss": 1.6591, "learning_rate": 9.972705569746274e-05, "epoch": 0.049439830555710385, "percentage": 4.94, "elapsed_time": "2:05:51", "remaining_time": "1 day, 16:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 888, "total_steps": 17941, "loss": 1.7141, "learning_rate": 9.972612579240881e-05, "epoch": 0.04949556880887353, "percentage": 4.95, "elapsed_time": "2:05:59", "remaining_time": "1 day, 16:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 889, "total_steps": 17941, "loss": 1.8636, "learning_rate": 9.972519431033206e-05, "epoch": 0.04955130706203668, "percentage": 4.96, "elapsed_time": "2:06:08", "remaining_time": "1 day, 16:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 17941, "loss": 1.7943, "learning_rate": 9.972426125126209e-05, "epoch": 0.04960704531519982, "percentage": 4.96, "elapsed_time": "2:06:16", "remaining_time": "1 day, 16:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 891, "total_steps": 17941, "loss": 1.6949, "learning_rate": 9.972332661522845e-05, "epoch": 0.04966278356836297, "percentage": 4.97, "elapsed_time": "2:06:25", "remaining_time": "1 day, 16:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 892, "total_steps": 17941, "loss": 1.9313, "learning_rate": 9.972239040226082e-05, "epoch": 0.04971852182152611, "percentage": 4.97, "elapsed_time": "2:06:33", "remaining_time": "1 day, 16:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 893, "total_steps": 17941, "loss": 1.8589, "learning_rate": 9.972145261238884e-05, "epoch": 0.04977426007468926, "percentage": 4.98, "elapsed_time": "2:06:42", "remaining_time": "1 day, 16:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 894, "total_steps": 17941, "loss": 1.9736, "learning_rate": 9.972051324564229e-05, "epoch": 0.049829998327852405, "percentage": 4.98, "elapsed_time": "2:06:50", "remaining_time": "1 day, 16:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 895, "total_steps": 17941, "loss": 2.1093, "learning_rate": 9.971957230205096e-05, "epoch": 0.04988573658101555, "percentage": 4.99, "elapsed_time": "2:06:59", "remaining_time": "1 day, 16:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 896, "total_steps": 17941, "loss": 1.6786, "learning_rate": 9.971862978164466e-05, "epoch": 0.0499414748341787, "percentage": 4.99, "elapsed_time": "2:07:07", "remaining_time": "1 day, 16:18:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 897, "total_steps": 17941, "loss": 1.8162, "learning_rate": 9.971768568445332e-05, "epoch": 0.04999721308734184, "percentage": 5.0, "elapsed_time": "2:07:16", "remaining_time": "1 day, 16:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 898, "total_steps": 17941, "loss": 1.3044, "learning_rate": 9.971674001050686e-05, "epoch": 0.05005295134050499, "percentage": 5.01, "elapsed_time": "2:07:24", "remaining_time": "1 day, 16:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 899, "total_steps": 17941, "loss": 1.7169, "learning_rate": 9.971579275983527e-05, "epoch": 0.05010868959366813, "percentage": 5.01, "elapsed_time": "2:07:32", "remaining_time": "1 day, 16:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 17941, "loss": 1.4898, "learning_rate": 9.971484393246861e-05, "epoch": 0.05016442784683128, "percentage": 5.02, "elapsed_time": "2:07:41", "remaining_time": "1 day, 16:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 901, "total_steps": 17941, "loss": 1.6325, "learning_rate": 9.971389352843695e-05, "epoch": 0.050220166099994426, "percentage": 5.02, "elapsed_time": "2:07:49", "remaining_time": "1 day, 16:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 902, "total_steps": 17941, "loss": 1.5962, "learning_rate": 9.971294154777044e-05, "epoch": 0.05027590435315757, "percentage": 5.03, "elapsed_time": "2:07:58", "remaining_time": "1 day, 16:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 903, "total_steps": 17941, "loss": 1.8215, "learning_rate": 9.971198799049928e-05, "epoch": 0.05033164260632072, "percentage": 5.03, "elapsed_time": "2:08:06", "remaining_time": "1 day, 16:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 904, "total_steps": 17941, "loss": 1.9647, "learning_rate": 9.971103285665369e-05, "epoch": 0.05038738085948386, "percentage": 5.04, "elapsed_time": "2:08:15", "remaining_time": "1 day, 16:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 905, "total_steps": 17941, "loss": 1.6109, "learning_rate": 9.971007614626397e-05, "epoch": 0.05044311911264701, "percentage": 5.04, "elapsed_time": "2:08:23", "remaining_time": "1 day, 16:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 906, "total_steps": 17941, "loss": 1.6419, "learning_rate": 9.970911785936047e-05, "epoch": 0.050498857365810154, "percentage": 5.05, "elapsed_time": "2:08:32", "remaining_time": "1 day, 16:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 907, "total_steps": 17941, "loss": 1.6144, "learning_rate": 9.970815799597358e-05, "epoch": 0.050554595618973304, "percentage": 5.06, "elapsed_time": "2:08:41", "remaining_time": "1 day, 16:16:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 908, "total_steps": 17941, "loss": 1.7978, "learning_rate": 9.970719655613373e-05, "epoch": 0.05061033387213645, "percentage": 5.06, "elapsed_time": "2:08:49", "remaining_time": "1 day, 16:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 909, "total_steps": 17941, "loss": 1.8175, "learning_rate": 9.970623353987141e-05, "epoch": 0.05066607212529959, "percentage": 5.07, "elapsed_time": "2:08:58", "remaining_time": "1 day, 16:16:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 17941, "loss": 2.043, "learning_rate": 9.97052689472172e-05, "epoch": 0.05072181037846274, "percentage": 5.07, "elapsed_time": "2:09:06", "remaining_time": "1 day, 16:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 911, "total_steps": 17941, "loss": 1.9165, "learning_rate": 9.970430277820165e-05, "epoch": 0.05077754863162588, "percentage": 5.08, "elapsed_time": "2:09:15", "remaining_time": "1 day, 16:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 912, "total_steps": 17941, "loss": 1.8203, "learning_rate": 9.970333503285539e-05, "epoch": 0.05083328688478903, "percentage": 5.08, "elapsed_time": "2:09:23", "remaining_time": "1 day, 16:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 913, "total_steps": 17941, "loss": 1.9429, "learning_rate": 9.970236571120915e-05, "epoch": 0.050889025137952175, "percentage": 5.09, "elapsed_time": "2:09:32", "remaining_time": "1 day, 16:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 914, "total_steps": 17941, "loss": 2.0989, "learning_rate": 9.970139481329364e-05, "epoch": 0.050944763391115325, "percentage": 5.09, "elapsed_time": "2:09:40", "remaining_time": "1 day, 16:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 915, "total_steps": 17941, "loss": 1.7213, "learning_rate": 9.970042233913968e-05, "epoch": 0.05100050164427847, "percentage": 5.1, "elapsed_time": "2:09:49", "remaining_time": "1 day, 16:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 916, "total_steps": 17941, "loss": 1.6979, "learning_rate": 9.96994482887781e-05, "epoch": 0.05105623989744162, "percentage": 5.11, "elapsed_time": "2:09:57", "remaining_time": "1 day, 16:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 917, "total_steps": 17941, "loss": 1.7629, "learning_rate": 9.969847266223979e-05, "epoch": 0.05111197815060476, "percentage": 5.11, "elapsed_time": "2:10:06", "remaining_time": "1 day, 16:15:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 918, "total_steps": 17941, "loss": 1.7208, "learning_rate": 9.969749545955567e-05, "epoch": 0.0511677164037679, "percentage": 5.12, "elapsed_time": "2:10:14", "remaining_time": "1 day, 16:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 919, "total_steps": 17941, "loss": 1.952, "learning_rate": 9.969651668075678e-05, "epoch": 0.05122345465693105, "percentage": 5.12, "elapsed_time": "2:10:22", "remaining_time": "1 day, 16:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 17941, "loss": 1.6574, "learning_rate": 9.969553632587409e-05, "epoch": 0.051279192910094196, "percentage": 5.13, "elapsed_time": "2:10:31", "remaining_time": "1 day, 16:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 921, "total_steps": 17941, "loss": 1.6173, "learning_rate": 9.969455439493877e-05, "epoch": 0.051334931163257345, "percentage": 5.13, "elapsed_time": "2:10:39", "remaining_time": "1 day, 16:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 922, "total_steps": 17941, "loss": 1.6471, "learning_rate": 9.96935708879819e-05, "epoch": 0.05139066941642049, "percentage": 5.14, "elapsed_time": "2:10:48", "remaining_time": "1 day, 16:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 923, "total_steps": 17941, "loss": 2.0134, "learning_rate": 9.969258580503471e-05, "epoch": 0.05144640766958364, "percentage": 5.14, "elapsed_time": "2:10:56", "remaining_time": "1 day, 16:14:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 924, "total_steps": 17941, "loss": 2.1658, "learning_rate": 9.969159914612843e-05, "epoch": 0.05150214592274678, "percentage": 5.15, "elapsed_time": "2:11:05", "remaining_time": "1 day, 16:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 925, "total_steps": 17941, "loss": 1.9766, "learning_rate": 9.969061091129433e-05, "epoch": 0.051557884175909924, "percentage": 5.16, "elapsed_time": "2:11:13", "remaining_time": "1 day, 16:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 926, "total_steps": 17941, "loss": 1.678, "learning_rate": 9.968962110056379e-05, "epoch": 0.051613622429073074, "percentage": 5.16, "elapsed_time": "2:11:22", "remaining_time": "1 day, 16:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 927, "total_steps": 17941, "loss": 1.8249, "learning_rate": 9.968862971396816e-05, "epoch": 0.051669360682236216, "percentage": 5.17, "elapsed_time": "2:11:30", "remaining_time": "1 day, 16:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 928, "total_steps": 17941, "loss": 1.7606, "learning_rate": 9.96876367515389e-05, "epoch": 0.051725098935399366, "percentage": 5.17, "elapsed_time": "2:11:39", "remaining_time": "1 day, 16:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 929, "total_steps": 17941, "loss": 1.8612, "learning_rate": 9.968664221330751e-05, "epoch": 0.05178083718856251, "percentage": 5.18, "elapsed_time": "2:11:47", "remaining_time": "1 day, 16:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 17941, "loss": 1.8672, "learning_rate": 9.968564609930553e-05, "epoch": 0.05183657544172566, "percentage": 5.18, "elapsed_time": "2:11:56", "remaining_time": "1 day, 16:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 931, "total_steps": 17941, "loss": 1.766, "learning_rate": 9.968464840956453e-05, "epoch": 0.0518923136948888, "percentage": 5.19, "elapsed_time": "2:12:04", "remaining_time": "1 day, 16:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 932, "total_steps": 17941, "loss": 1.8631, "learning_rate": 9.968364914411616e-05, "epoch": 0.05194805194805195, "percentage": 5.19, "elapsed_time": "2:12:13", "remaining_time": "1 day, 16:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 933, "total_steps": 17941, "loss": 1.5441, "learning_rate": 9.968264830299213e-05, "epoch": 0.052003790201215094, "percentage": 5.2, "elapsed_time": "2:12:21", "remaining_time": "1 day, 16:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 934, "total_steps": 17941, "loss": 1.7751, "learning_rate": 9.968164588622415e-05, "epoch": 0.05205952845437824, "percentage": 5.21, "elapsed_time": "2:12:30", "remaining_time": "1 day, 16:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 935, "total_steps": 17941, "loss": 1.662, "learning_rate": 9.968064189384403e-05, "epoch": 0.05211526670754139, "percentage": 5.21, "elapsed_time": "2:12:38", "remaining_time": "1 day, 16:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 936, "total_steps": 17941, "loss": 1.7384, "learning_rate": 9.967963632588362e-05, "epoch": 0.05217100496070453, "percentage": 5.22, "elapsed_time": "2:12:47", "remaining_time": "1 day, 16:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 937, "total_steps": 17941, "loss": 1.8133, "learning_rate": 9.96786291823748e-05, "epoch": 0.05222674321386768, "percentage": 5.22, "elapsed_time": "2:12:55", "remaining_time": "1 day, 16:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 938, "total_steps": 17941, "loss": 1.8851, "learning_rate": 9.96776204633495e-05, "epoch": 0.05228248146703082, "percentage": 5.23, "elapsed_time": "2:13:04", "remaining_time": "1 day, 16:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 939, "total_steps": 17941, "loss": 1.6583, "learning_rate": 9.967661016883972e-05, "epoch": 0.05233821972019397, "percentage": 5.23, "elapsed_time": "2:13:12", "remaining_time": "1 day, 16:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 17941, "loss": 1.6385, "learning_rate": 9.967559829887749e-05, "epoch": 0.052393957973357115, "percentage": 5.24, "elapsed_time": "2:13:21", "remaining_time": "1 day, 16:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 941, "total_steps": 17941, "loss": 1.6901, "learning_rate": 9.967458485349492e-05, "epoch": 0.05244969622652026, "percentage": 5.24, "elapsed_time": "2:13:29", "remaining_time": "1 day, 16:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 942, "total_steps": 17941, "loss": 1.9757, "learning_rate": 9.967356983272414e-05, "epoch": 0.05250543447968341, "percentage": 5.25, "elapsed_time": "2:13:39", "remaining_time": "1 day, 16:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 943, "total_steps": 17941, "loss": 1.6266, "learning_rate": 9.967255323659734e-05, "epoch": 0.05256117273284655, "percentage": 5.26, "elapsed_time": "2:13:47", "remaining_time": "1 day, 16:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 944, "total_steps": 17941, "loss": 1.6938, "learning_rate": 9.967153506514677e-05, "epoch": 0.0526169109860097, "percentage": 5.26, "elapsed_time": "2:13:56", "remaining_time": "1 day, 16:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 945, "total_steps": 17941, "loss": 1.8448, "learning_rate": 9.967051531840471e-05, "epoch": 0.05267264923917284, "percentage": 5.27, "elapsed_time": "2:14:04", "remaining_time": "1 day, 16:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 946, "total_steps": 17941, "loss": 1.5313, "learning_rate": 9.96694939964035e-05, "epoch": 0.05272838749233599, "percentage": 5.27, "elapsed_time": "2:14:13", "remaining_time": "1 day, 16:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 947, "total_steps": 17941, "loss": 1.9398, "learning_rate": 9.966847109917555e-05, "epoch": 0.052784125745499136, "percentage": 5.28, "elapsed_time": "2:14:21", "remaining_time": "1 day, 16:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 948, "total_steps": 17941, "loss": 1.8052, "learning_rate": 9.966744662675326e-05, "epoch": 0.05283986399866228, "percentage": 5.28, "elapsed_time": "2:14:30", "remaining_time": "1 day, 16:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 949, "total_steps": 17941, "loss": 1.7875, "learning_rate": 9.966642057916915e-05, "epoch": 0.05289560225182543, "percentage": 5.29, "elapsed_time": "2:14:38", "remaining_time": "1 day, 16:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 17941, "loss": 1.6786, "learning_rate": 9.966539295645576e-05, "epoch": 0.05295134050498857, "percentage": 5.3, "elapsed_time": "2:14:47", "remaining_time": "1 day, 16:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 951, "total_steps": 17941, "loss": 1.473, "learning_rate": 9.966436375864567e-05, "epoch": 0.05300707875815172, "percentage": 5.3, "elapsed_time": "2:14:55", "remaining_time": "1 day, 16:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 952, "total_steps": 17941, "loss": 1.7648, "learning_rate": 9.966333298577154e-05, "epoch": 0.053062817011314864, "percentage": 5.31, "elapsed_time": "2:15:03", "remaining_time": "1 day, 16:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 953, "total_steps": 17941, "loss": 1.6435, "learning_rate": 9.966230063786602e-05, "epoch": 0.053118555264478014, "percentage": 5.31, "elapsed_time": "2:15:12", "remaining_time": "1 day, 16:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 954, "total_steps": 17941, "loss": 1.762, "learning_rate": 9.96612667149619e-05, "epoch": 0.05317429351764116, "percentage": 5.32, "elapsed_time": "2:15:21", "remaining_time": "1 day, 16:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 955, "total_steps": 17941, "loss": 1.8957, "learning_rate": 9.966023121709192e-05, "epoch": 0.053230031770804306, "percentage": 5.32, "elapsed_time": "2:15:30", "remaining_time": "1 day, 16:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 956, "total_steps": 17941, "loss": 1.8783, "learning_rate": 9.965919414428896e-05, "epoch": 0.05328577002396745, "percentage": 5.33, "elapsed_time": "2:15:39", "remaining_time": "1 day, 16:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 957, "total_steps": 17941, "loss": 1.8575, "learning_rate": 9.965815549658589e-05, "epoch": 0.05334150827713059, "percentage": 5.33, "elapsed_time": "2:15:48", "remaining_time": "1 day, 16:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 958, "total_steps": 17941, "loss": 1.7704, "learning_rate": 9.965711527401567e-05, "epoch": 0.05339724653029374, "percentage": 5.34, "elapsed_time": "2:15:56", "remaining_time": "1 day, 16:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 959, "total_steps": 17941, "loss": 1.6103, "learning_rate": 9.965607347661125e-05, "epoch": 0.053452984783456885, "percentage": 5.35, "elapsed_time": "2:16:04", "remaining_time": "1 day, 16:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 17941, "loss": 1.9864, "learning_rate": 9.965503010440571e-05, "epoch": 0.053508723036620034, "percentage": 5.35, "elapsed_time": "2:16:13", "remaining_time": "1 day, 16:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 961, "total_steps": 17941, "loss": 1.7264, "learning_rate": 9.965398515743212e-05, "epoch": 0.05356446128978318, "percentage": 5.36, "elapsed_time": "2:16:21", "remaining_time": "1 day, 16:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 962, "total_steps": 17941, "loss": 2.2176, "learning_rate": 9.965293863572363e-05, "epoch": 0.05362019954294633, "percentage": 5.36, "elapsed_time": "2:16:30", "remaining_time": "1 day, 16:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 963, "total_steps": 17941, "loss": 2.0434, "learning_rate": 9.96518905393134e-05, "epoch": 0.05367593779610947, "percentage": 5.37, "elapsed_time": "2:16:38", "remaining_time": "1 day, 16:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 964, "total_steps": 17941, "loss": 1.4151, "learning_rate": 9.965084086823472e-05, "epoch": 0.05373167604927261, "percentage": 5.37, "elapsed_time": "2:16:47", "remaining_time": "1 day, 16:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 965, "total_steps": 17941, "loss": 1.7144, "learning_rate": 9.964978962252085e-05, "epoch": 0.05378741430243576, "percentage": 5.38, "elapsed_time": "2:16:55", "remaining_time": "1 day, 16:08:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 966, "total_steps": 17941, "loss": 1.6531, "learning_rate": 9.964873680220512e-05, "epoch": 0.053843152555598905, "percentage": 5.38, "elapsed_time": "2:17:04", "remaining_time": "1 day, 16:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 967, "total_steps": 17941, "loss": 1.9851, "learning_rate": 9.964768240732093e-05, "epoch": 0.053898890808762055, "percentage": 5.39, "elapsed_time": "2:17:13", "remaining_time": "1 day, 16:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 968, "total_steps": 17941, "loss": 1.9137, "learning_rate": 9.964662643790173e-05, "epoch": 0.0539546290619252, "percentage": 5.4, "elapsed_time": "2:17:21", "remaining_time": "1 day, 16:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 969, "total_steps": 17941, "loss": 1.8972, "learning_rate": 9.9645568893981e-05, "epoch": 0.05401036731508835, "percentage": 5.4, "elapsed_time": "2:17:30", "remaining_time": "1 day, 16:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 17941, "loss": 1.5612, "learning_rate": 9.964450977559226e-05, "epoch": 0.05406610556825149, "percentage": 5.41, "elapsed_time": "2:17:38", "remaining_time": "1 day, 16:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 971, "total_steps": 17941, "loss": 2.0708, "learning_rate": 9.964344908276914e-05, "epoch": 0.054121843821414634, "percentage": 5.41, "elapsed_time": "2:17:47", "remaining_time": "1 day, 16:08:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 972, "total_steps": 17941, "loss": 1.6573, "learning_rate": 9.964238681554524e-05, "epoch": 0.05417758207457778, "percentage": 5.42, "elapsed_time": "2:17:55", "remaining_time": "1 day, 16:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 973, "total_steps": 17941, "loss": 1.918, "learning_rate": 9.964132297395428e-05, "epoch": 0.054233320327740926, "percentage": 5.42, "elapsed_time": "2:18:04", "remaining_time": "1 day, 16:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 974, "total_steps": 17941, "loss": 1.721, "learning_rate": 9.964025755802997e-05, "epoch": 0.054289058580904076, "percentage": 5.43, "elapsed_time": "2:18:12", "remaining_time": "1 day, 16:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 975, "total_steps": 17941, "loss": 1.9453, "learning_rate": 9.963919056780612e-05, "epoch": 0.05434479683406722, "percentage": 5.43, "elapsed_time": "2:18:21", "remaining_time": "1 day, 16:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 976, "total_steps": 17941, "loss": 1.9271, "learning_rate": 9.963812200331656e-05, "epoch": 0.05440053508723037, "percentage": 5.44, "elapsed_time": "2:18:30", "remaining_time": "1 day, 16:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 977, "total_steps": 17941, "loss": 1.5766, "learning_rate": 9.963705186459517e-05, "epoch": 0.05445627334039351, "percentage": 5.45, "elapsed_time": "2:18:38", "remaining_time": "1 day, 16:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 978, "total_steps": 17941, "loss": 1.7721, "learning_rate": 9.963598015167592e-05, "epoch": 0.05451201159355666, "percentage": 5.45, "elapsed_time": "2:18:46", "remaining_time": "1 day, 16:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 979, "total_steps": 17941, "loss": 1.6293, "learning_rate": 9.963490686459277e-05, "epoch": 0.054567749846719804, "percentage": 5.46, "elapsed_time": "2:18:55", "remaining_time": "1 day, 16:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 17941, "loss": 1.8723, "learning_rate": 9.963383200337977e-05, "epoch": 0.05462348809988295, "percentage": 5.46, "elapsed_time": "2:19:03", "remaining_time": "1 day, 16:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 981, "total_steps": 17941, "loss": 1.7368, "learning_rate": 9.963275556807098e-05, "epoch": 0.0546792263530461, "percentage": 5.47, "elapsed_time": "2:19:12", "remaining_time": "1 day, 16:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 982, "total_steps": 17941, "loss": 1.4994, "learning_rate": 9.963167755870059e-05, "epoch": 0.05473496460620924, "percentage": 5.47, "elapsed_time": "2:19:20", "remaining_time": "1 day, 16:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 983, "total_steps": 17941, "loss": 1.8058, "learning_rate": 9.963059797530274e-05, "epoch": 0.05479070285937239, "percentage": 5.48, "elapsed_time": "2:19:29", "remaining_time": "1 day, 16:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 984, "total_steps": 17941, "loss": 1.7393, "learning_rate": 9.96295168179117e-05, "epoch": 0.05484644111253553, "percentage": 5.48, "elapsed_time": "2:19:37", "remaining_time": "1 day, 16:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 985, "total_steps": 17941, "loss": 2.149, "learning_rate": 9.962843408656176e-05, "epoch": 0.05490217936569868, "percentage": 5.49, "elapsed_time": "2:19:46", "remaining_time": "1 day, 16:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 986, "total_steps": 17941, "loss": 2.1734, "learning_rate": 9.962734978128723e-05, "epoch": 0.054957917618861825, "percentage": 5.5, "elapsed_time": "2:19:55", "remaining_time": "1 day, 16:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 987, "total_steps": 17941, "loss": 1.8782, "learning_rate": 9.962626390212251e-05, "epoch": 0.05501365587202497, "percentage": 5.5, "elapsed_time": "2:20:03", "remaining_time": "1 day, 16:05:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 988, "total_steps": 17941, "loss": 1.7033, "learning_rate": 9.962517644910204e-05, "epoch": 0.05506939412518812, "percentage": 5.51, "elapsed_time": "2:20:12", "remaining_time": "1 day, 16:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 989, "total_steps": 17941, "loss": 1.969, "learning_rate": 9.962408742226032e-05, "epoch": 0.05512513237835126, "percentage": 5.51, "elapsed_time": "2:20:20", "remaining_time": "1 day, 16:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 17941, "loss": 1.8229, "learning_rate": 9.962299682163186e-05, "epoch": 0.05518087063151441, "percentage": 5.52, "elapsed_time": "2:20:29", "remaining_time": "1 day, 16:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 991, "total_steps": 17941, "loss": 1.8161, "learning_rate": 9.962190464725128e-05, "epoch": 0.05523660888467755, "percentage": 5.52, "elapsed_time": "2:20:38", "remaining_time": "1 day, 16:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 992, "total_steps": 17941, "loss": 1.938, "learning_rate": 9.962081089915319e-05, "epoch": 0.0552923471378407, "percentage": 5.53, "elapsed_time": "2:20:46", "remaining_time": "1 day, 16:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 993, "total_steps": 17941, "loss": 1.7414, "learning_rate": 9.961971557737227e-05, "epoch": 0.055348085391003846, "percentage": 5.53, "elapsed_time": "2:20:55", "remaining_time": "1 day, 16:05:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 994, "total_steps": 17941, "loss": 1.8595, "learning_rate": 9.96186186819433e-05, "epoch": 0.05540382364416699, "percentage": 5.54, "elapsed_time": "2:21:03", "remaining_time": "1 day, 16:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 995, "total_steps": 17941, "loss": 1.8233, "learning_rate": 9.961752021290103e-05, "epoch": 0.05545956189733014, "percentage": 5.55, "elapsed_time": "2:21:12", "remaining_time": "1 day, 16:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 996, "total_steps": 17941, "loss": 1.6666, "learning_rate": 9.961642017028033e-05, "epoch": 0.05551530015049328, "percentage": 5.55, "elapsed_time": "2:21:21", "remaining_time": "1 day, 16:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 997, "total_steps": 17941, "loss": 2.0589, "learning_rate": 9.961531855411603e-05, "epoch": 0.05557103840365643, "percentage": 5.56, "elapsed_time": "2:21:29", "remaining_time": "1 day, 16:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 998, "total_steps": 17941, "loss": 2.0774, "learning_rate": 9.961421536444313e-05, "epoch": 0.055626776656819574, "percentage": 5.56, "elapsed_time": "2:21:38", "remaining_time": "1 day, 16:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 999, "total_steps": 17941, "loss": 1.5936, "learning_rate": 9.961311060129659e-05, "epoch": 0.055682514909982724, "percentage": 5.57, "elapsed_time": "2:21:46", "remaining_time": "1 day, 16:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 17941, "loss": 1.8414, "learning_rate": 9.961200426471142e-05, "epoch": 0.055738253163145866, "percentage": 5.57, "elapsed_time": "2:21:55", "remaining_time": "1 day, 16:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1001, "total_steps": 17941, "loss": 1.6496, "learning_rate": 9.961089635472276e-05, "epoch": 0.055793991416309016, "percentage": 5.58, "elapsed_time": "2:22:03", "remaining_time": "1 day, 16:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1002, "total_steps": 17941, "loss": 1.3193, "learning_rate": 9.96097868713657e-05, "epoch": 0.05584972966947216, "percentage": 5.58, "elapsed_time": "2:22:12", "remaining_time": "1 day, 16:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1003, "total_steps": 17941, "loss": 1.6453, "learning_rate": 9.960867581467546e-05, "epoch": 0.0559054679226353, "percentage": 5.59, "elapsed_time": "2:22:20", "remaining_time": "1 day, 16:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1004, "total_steps": 17941, "loss": 1.8798, "learning_rate": 9.960756318468726e-05, "epoch": 0.05596120617579845, "percentage": 5.6, "elapsed_time": "2:22:28", "remaining_time": "1 day, 16:03:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1005, "total_steps": 17941, "loss": 1.9322, "learning_rate": 9.960644898143639e-05, "epoch": 0.056016944428961594, "percentage": 5.6, "elapsed_time": "2:22:37", "remaining_time": "1 day, 16:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1006, "total_steps": 17941, "loss": 1.5659, "learning_rate": 9.960533320495818e-05, "epoch": 0.056072682682124744, "percentage": 5.61, "elapsed_time": "2:22:45", "remaining_time": "1 day, 16:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1007, "total_steps": 17941, "loss": 1.8482, "learning_rate": 9.960421585528802e-05, "epoch": 0.05612842093528789, "percentage": 5.61, "elapsed_time": "2:22:54", "remaining_time": "1 day, 16:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1008, "total_steps": 17941, "loss": 1.9905, "learning_rate": 9.960309693246135e-05, "epoch": 0.05618415918845104, "percentage": 5.62, "elapsed_time": "2:23:02", "remaining_time": "1 day, 16:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1009, "total_steps": 17941, "loss": 1.722, "learning_rate": 9.960197643651363e-05, "epoch": 0.05623989744161418, "percentage": 5.62, "elapsed_time": "2:23:11", "remaining_time": "1 day, 16:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 17941, "loss": 1.8293, "learning_rate": 9.960085436748044e-05, "epoch": 0.05629563569477732, "percentage": 5.63, "elapsed_time": "2:23:20", "remaining_time": "1 day, 16:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1011, "total_steps": 17941, "loss": 1.8081, "learning_rate": 9.959973072539734e-05, "epoch": 0.05635137394794047, "percentage": 5.64, "elapsed_time": "2:23:28", "remaining_time": "1 day, 16:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1012, "total_steps": 17941, "loss": 1.5834, "learning_rate": 9.959860551029996e-05, "epoch": 0.056407112201103615, "percentage": 5.64, "elapsed_time": "2:23:37", "remaining_time": "1 day, 16:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1013, "total_steps": 17941, "loss": 1.8318, "learning_rate": 9.9597478722224e-05, "epoch": 0.056462850454266765, "percentage": 5.65, "elapsed_time": "2:23:46", "remaining_time": "1 day, 16:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1014, "total_steps": 17941, "loss": 1.7475, "learning_rate": 9.959635036120518e-05, "epoch": 0.05651858870742991, "percentage": 5.65, "elapsed_time": "2:23:54", "remaining_time": "1 day, 16:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1015, "total_steps": 17941, "loss": 1.6809, "learning_rate": 9.959522042727932e-05, "epoch": 0.05657432696059306, "percentage": 5.66, "elapsed_time": "2:24:02", "remaining_time": "1 day, 16:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1016, "total_steps": 17941, "loss": 1.7024, "learning_rate": 9.959408892048219e-05, "epoch": 0.0566300652137562, "percentage": 5.66, "elapsed_time": "2:24:11", "remaining_time": "1 day, 16:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1017, "total_steps": 17941, "loss": 1.9791, "learning_rate": 9.959295584084974e-05, "epoch": 0.05668580346691934, "percentage": 5.67, "elapsed_time": "2:24:20", "remaining_time": "1 day, 16:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1018, "total_steps": 17941, "loss": 1.5592, "learning_rate": 9.959182118841786e-05, "epoch": 0.05674154172008249, "percentage": 5.67, "elapsed_time": "2:24:28", "remaining_time": "1 day, 16:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1019, "total_steps": 17941, "loss": 2.012, "learning_rate": 9.959068496322256e-05, "epoch": 0.056797279973245636, "percentage": 5.68, "elapsed_time": "2:24:38", "remaining_time": "1 day, 16:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 17941, "loss": 1.6301, "learning_rate": 9.958954716529987e-05, "epoch": 0.056853018226408786, "percentage": 5.69, "elapsed_time": "2:24:46", "remaining_time": "1 day, 16:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1021, "total_steps": 17941, "loss": 1.8351, "learning_rate": 9.958840779468586e-05, "epoch": 0.05690875647957193, "percentage": 5.69, "elapsed_time": "2:24:55", "remaining_time": "1 day, 16:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1022, "total_steps": 17941, "loss": 1.8221, "learning_rate": 9.958726685141668e-05, "epoch": 0.05696449473273508, "percentage": 5.7, "elapsed_time": "2:25:03", "remaining_time": "1 day, 16:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1023, "total_steps": 17941, "loss": 1.8575, "learning_rate": 9.958612433552852e-05, "epoch": 0.05702023298589822, "percentage": 5.7, "elapsed_time": "2:25:12", "remaining_time": "1 day, 16:01:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1024, "total_steps": 17941, "loss": 1.7646, "learning_rate": 9.95849802470576e-05, "epoch": 0.05707597123906137, "percentage": 5.71, "elapsed_time": "2:25:21", "remaining_time": "1 day, 16:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1025, "total_steps": 17941, "loss": 1.6789, "learning_rate": 9.95838345860402e-05, "epoch": 0.057131709492224514, "percentage": 5.71, "elapsed_time": "2:25:29", "remaining_time": "1 day, 16:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1026, "total_steps": 17941, "loss": 1.8542, "learning_rate": 9.958268735251266e-05, "epoch": 0.05718744774538766, "percentage": 5.72, "elapsed_time": "2:25:37", "remaining_time": "1 day, 16:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1027, "total_steps": 17941, "loss": 1.819, "learning_rate": 9.958153854651136e-05, "epoch": 0.057243185998550807, "percentage": 5.72, "elapsed_time": "2:25:46", "remaining_time": "1 day, 16:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1028, "total_steps": 17941, "loss": 1.7872, "learning_rate": 9.958038816807276e-05, "epoch": 0.05729892425171395, "percentage": 5.73, "elapsed_time": "2:25:55", "remaining_time": "1 day, 16:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1029, "total_steps": 17941, "loss": 1.8243, "learning_rate": 9.957923621723329e-05, "epoch": 0.0573546625048771, "percentage": 5.74, "elapsed_time": "2:26:03", "remaining_time": "1 day, 16:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 17941, "loss": 1.7316, "learning_rate": 9.957808269402954e-05, "epoch": 0.05741040075804024, "percentage": 5.74, "elapsed_time": "2:26:12", "remaining_time": "1 day, 16:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1031, "total_steps": 17941, "loss": 2.0758, "learning_rate": 9.957692759849806e-05, "epoch": 0.05746613901120339, "percentage": 5.75, "elapsed_time": "2:26:21", "remaining_time": "1 day, 16:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1032, "total_steps": 17941, "loss": 1.6588, "learning_rate": 9.957577093067548e-05, "epoch": 0.057521877264366535, "percentage": 5.75, "elapsed_time": "2:26:30", "remaining_time": "1 day, 16:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1033, "total_steps": 17941, "loss": 1.8477, "learning_rate": 9.957461269059851e-05, "epoch": 0.05757761551752968, "percentage": 5.76, "elapsed_time": "2:26:38", "remaining_time": "1 day, 16:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1034, "total_steps": 17941, "loss": 1.7541, "learning_rate": 9.957345287830386e-05, "epoch": 0.05763335377069283, "percentage": 5.76, "elapsed_time": "2:26:46", "remaining_time": "1 day, 16:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1035, "total_steps": 17941, "loss": 1.8738, "learning_rate": 9.95722914938283e-05, "epoch": 0.05768909202385597, "percentage": 5.77, "elapsed_time": "2:26:55", "remaining_time": "1 day, 15:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1036, "total_steps": 17941, "loss": 1.6668, "learning_rate": 9.957112853720871e-05, "epoch": 0.05774483027701912, "percentage": 5.77, "elapsed_time": "2:27:03", "remaining_time": "1 day, 15:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1037, "total_steps": 17941, "loss": 1.5023, "learning_rate": 9.956996400848191e-05, "epoch": 0.05780056853018226, "percentage": 5.78, "elapsed_time": "2:27:12", "remaining_time": "1 day, 15:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1038, "total_steps": 17941, "loss": 1.7614, "learning_rate": 9.956879790768489e-05, "epoch": 0.05785630678334541, "percentage": 5.79, "elapsed_time": "2:27:20", "remaining_time": "1 day, 15:59:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1039, "total_steps": 17941, "loss": 1.7874, "learning_rate": 9.95676302348546e-05, "epoch": 0.057912045036508555, "percentage": 5.79, "elapsed_time": "2:27:30", "remaining_time": "1 day, 15:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 17941, "loss": 1.7864, "learning_rate": 9.956646099002807e-05, "epoch": 0.0579677832896717, "percentage": 5.8, "elapsed_time": "2:27:38", "remaining_time": "1 day, 15:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1041, "total_steps": 17941, "loss": 1.9396, "learning_rate": 9.95652901732424e-05, "epoch": 0.05802352154283485, "percentage": 5.8, "elapsed_time": "2:27:47", "remaining_time": "1 day, 15:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1042, "total_steps": 17941, "loss": 1.8373, "learning_rate": 9.95641177845347e-05, "epoch": 0.05807925979599799, "percentage": 5.81, "elapsed_time": "2:27:56", "remaining_time": "1 day, 15:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1043, "total_steps": 17941, "loss": 2.0565, "learning_rate": 9.956294382394218e-05, "epoch": 0.05813499804916114, "percentage": 5.81, "elapsed_time": "2:28:04", "remaining_time": "1 day, 15:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1044, "total_steps": 17941, "loss": 1.837, "learning_rate": 9.956176829150204e-05, "epoch": 0.058190736302324284, "percentage": 5.82, "elapsed_time": "2:28:13", "remaining_time": "1 day, 15:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1045, "total_steps": 17941, "loss": 1.736, "learning_rate": 9.956059118725158e-05, "epoch": 0.05824647455548743, "percentage": 5.82, "elapsed_time": "2:28:21", "remaining_time": "1 day, 15:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1046, "total_steps": 17941, "loss": 1.9561, "learning_rate": 9.955941251122812e-05, "epoch": 0.058302212808650576, "percentage": 5.83, "elapsed_time": "2:28:30", "remaining_time": "1 day, 15:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1047, "total_steps": 17941, "loss": 1.723, "learning_rate": 9.955823226346905e-05, "epoch": 0.058357951061813726, "percentage": 5.84, "elapsed_time": "2:28:38", "remaining_time": "1 day, 15:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1048, "total_steps": 17941, "loss": 1.6632, "learning_rate": 9.95570504440118e-05, "epoch": 0.05841368931497687, "percentage": 5.84, "elapsed_time": "2:28:47", "remaining_time": "1 day, 15:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1049, "total_steps": 17941, "loss": 1.5877, "learning_rate": 9.955586705289386e-05, "epoch": 0.05846942756814001, "percentage": 5.85, "elapsed_time": "2:28:55", "remaining_time": "1 day, 15:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 17941, "loss": 2.0043, "learning_rate": 9.955468209015273e-05, "epoch": 0.05852516582130316, "percentage": 5.85, "elapsed_time": "2:29:04", "remaining_time": "1 day, 15:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1051, "total_steps": 17941, "loss": 1.7604, "learning_rate": 9.9553495555826e-05, "epoch": 0.058580904074466304, "percentage": 5.86, "elapsed_time": "2:29:12", "remaining_time": "1 day, 15:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1052, "total_steps": 17941, "loss": 1.8945, "learning_rate": 9.955230744995132e-05, "epoch": 0.058636642327629454, "percentage": 5.86, "elapsed_time": "2:29:21", "remaining_time": "1 day, 15:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1053, "total_steps": 17941, "loss": 1.9154, "learning_rate": 9.955111777256635e-05, "epoch": 0.0586923805807926, "percentage": 5.87, "elapsed_time": "2:29:30", "remaining_time": "1 day, 15:57:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1054, "total_steps": 17941, "loss": 1.6888, "learning_rate": 9.954992652370885e-05, "epoch": 0.05874811883395575, "percentage": 5.87, "elapsed_time": "2:29:38", "remaining_time": "1 day, 15:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1055, "total_steps": 17941, "loss": 1.7544, "learning_rate": 9.954873370341656e-05, "epoch": 0.05880385708711889, "percentage": 5.88, "elapsed_time": "2:29:46", "remaining_time": "1 day, 15:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1056, "total_steps": 17941, "loss": 1.9448, "learning_rate": 9.954753931172733e-05, "epoch": 0.05885959534028203, "percentage": 5.89, "elapsed_time": "2:29:55", "remaining_time": "1 day, 15:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1057, "total_steps": 17941, "loss": 2.0281, "learning_rate": 9.954634334867902e-05, "epoch": 0.05891533359344518, "percentage": 5.89, "elapsed_time": "2:30:03", "remaining_time": "1 day, 15:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1058, "total_steps": 17941, "loss": 1.7383, "learning_rate": 9.95451458143096e-05, "epoch": 0.058971071846608325, "percentage": 5.9, "elapsed_time": "2:30:12", "remaining_time": "1 day, 15:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1059, "total_steps": 17941, "loss": 1.9047, "learning_rate": 9.9543946708657e-05, "epoch": 0.059026810099771475, "percentage": 5.9, "elapsed_time": "2:30:20", "remaining_time": "1 day, 15:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 17941, "loss": 2.1998, "learning_rate": 9.95427460317593e-05, "epoch": 0.05908254835293462, "percentage": 5.91, "elapsed_time": "2:30:29", "remaining_time": "1 day, 15:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1061, "total_steps": 17941, "loss": 1.9788, "learning_rate": 9.954154378365453e-05, "epoch": 0.05913828660609777, "percentage": 5.91, "elapsed_time": "2:30:37", "remaining_time": "1 day, 15:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1062, "total_steps": 17941, "loss": 1.7906, "learning_rate": 9.954033996438084e-05, "epoch": 0.05919402485926091, "percentage": 5.92, "elapsed_time": "2:30:46", "remaining_time": "1 day, 15:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1063, "total_steps": 17941, "loss": 1.9644, "learning_rate": 9.95391345739764e-05, "epoch": 0.05924976311242406, "percentage": 5.92, "elapsed_time": "2:30:54", "remaining_time": "1 day, 15:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1064, "total_steps": 17941, "loss": 1.7528, "learning_rate": 9.953792761247946e-05, "epoch": 0.0593055013655872, "percentage": 5.93, "elapsed_time": "2:31:03", "remaining_time": "1 day, 15:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1065, "total_steps": 17941, "loss": 1.7198, "learning_rate": 9.953671907992827e-05, "epoch": 0.059361239618750346, "percentage": 5.94, "elapsed_time": "2:31:11", "remaining_time": "1 day, 15:55:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1066, "total_steps": 17941, "loss": 1.8502, "learning_rate": 9.953550897636117e-05, "epoch": 0.059416977871913496, "percentage": 5.94, "elapsed_time": "2:31:20", "remaining_time": "1 day, 15:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1067, "total_steps": 17941, "loss": 1.8859, "learning_rate": 9.953429730181653e-05, "epoch": 0.05947271612507664, "percentage": 5.95, "elapsed_time": "2:31:29", "remaining_time": "1 day, 15:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1068, "total_steps": 17941, "loss": 1.9667, "learning_rate": 9.953308405633281e-05, "epoch": 0.05952845437823979, "percentage": 5.95, "elapsed_time": "2:31:37", "remaining_time": "1 day, 15:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1069, "total_steps": 17941, "loss": 1.9502, "learning_rate": 9.953186923994845e-05, "epoch": 0.05958419263140293, "percentage": 5.96, "elapsed_time": "2:31:45", "remaining_time": "1 day, 15:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 17941, "loss": 1.7872, "learning_rate": 9.953065285270198e-05, "epoch": 0.05963993088456608, "percentage": 5.96, "elapsed_time": "2:31:54", "remaining_time": "1 day, 15:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1071, "total_steps": 17941, "loss": 1.4861, "learning_rate": 9.952943489463199e-05, "epoch": 0.059695669137729224, "percentage": 5.97, "elapsed_time": "2:32:02", "remaining_time": "1 day, 15:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1072, "total_steps": 17941, "loss": 1.8046, "learning_rate": 9.95282153657771e-05, "epoch": 0.059751407390892367, "percentage": 5.98, "elapsed_time": "2:32:11", "remaining_time": "1 day, 15:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1073, "total_steps": 17941, "loss": 2.0209, "learning_rate": 9.9526994266176e-05, "epoch": 0.059807145644055516, "percentage": 5.98, "elapsed_time": "2:32:19", "remaining_time": "1 day, 15:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1074, "total_steps": 17941, "loss": 2.0277, "learning_rate": 9.952577159586739e-05, "epoch": 0.05986288389721866, "percentage": 5.99, "elapsed_time": "2:32:28", "remaining_time": "1 day, 15:54:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1075, "total_steps": 17941, "loss": 1.9108, "learning_rate": 9.952454735489007e-05, "epoch": 0.05991862215038181, "percentage": 5.99, "elapsed_time": "2:32:37", "remaining_time": "1 day, 15:54:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1076, "total_steps": 17941, "loss": 2.0656, "learning_rate": 9.952332154328286e-05, "epoch": 0.05997436040354495, "percentage": 6.0, "elapsed_time": "2:32:45", "remaining_time": "1 day, 15:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1077, "total_steps": 17941, "loss": 1.757, "learning_rate": 9.952209416108461e-05, "epoch": 0.0600300986567081, "percentage": 6.0, "elapsed_time": "2:32:53", "remaining_time": "1 day, 15:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1078, "total_steps": 17941, "loss": 1.7967, "learning_rate": 9.952086520833428e-05, "epoch": 0.060085836909871244, "percentage": 6.01, "elapsed_time": "2:33:02", "remaining_time": "1 day, 15:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1079, "total_steps": 17941, "loss": 1.705, "learning_rate": 9.951963468507084e-05, "epoch": 0.06014157516303439, "percentage": 6.01, "elapsed_time": "2:33:10", "remaining_time": "1 day, 15:53:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 17941, "loss": 1.6394, "learning_rate": 9.95184025913333e-05, "epoch": 0.06019731341619754, "percentage": 6.02, "elapsed_time": "2:33:19", "remaining_time": "1 day, 15:53:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1081, "total_steps": 17941, "loss": 1.5622, "learning_rate": 9.951716892716074e-05, "epoch": 0.06025305166936068, "percentage": 6.03, "elapsed_time": "2:33:27", "remaining_time": "1 day, 15:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1082, "total_steps": 17941, "loss": 1.943, "learning_rate": 9.951593369259229e-05, "epoch": 0.06030878992252383, "percentage": 6.03, "elapsed_time": "2:33:36", "remaining_time": "1 day, 15:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1083, "total_steps": 17941, "loss": 1.7855, "learning_rate": 9.951469688766712e-05, "epoch": 0.06036452817568697, "percentage": 6.04, "elapsed_time": "2:33:45", "remaining_time": "1 day, 15:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1084, "total_steps": 17941, "loss": 1.8589, "learning_rate": 9.951345851242445e-05, "epoch": 0.06042026642885012, "percentage": 6.04, "elapsed_time": "2:33:53", "remaining_time": "1 day, 15:53:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1085, "total_steps": 17941, "loss": 1.8431, "learning_rate": 9.951221856690355e-05, "epoch": 0.060476004682013265, "percentage": 6.05, "elapsed_time": "2:34:02", "remaining_time": "1 day, 15:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1086, "total_steps": 17941, "loss": 1.8495, "learning_rate": 9.951097705114378e-05, "epoch": 0.060531742935176415, "percentage": 6.05, "elapsed_time": "2:34:11", "remaining_time": "1 day, 15:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1087, "total_steps": 17941, "loss": 1.6244, "learning_rate": 9.950973396518449e-05, "epoch": 0.06058748118833956, "percentage": 6.06, "elapsed_time": "2:34:19", "remaining_time": "1 day, 15:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1088, "total_steps": 17941, "loss": 1.569, "learning_rate": 9.950848930906506e-05, "epoch": 0.0606432194415027, "percentage": 6.06, "elapsed_time": "2:34:28", "remaining_time": "1 day, 15:52:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1089, "total_steps": 17941, "loss": 1.8739, "learning_rate": 9.950724308282504e-05, "epoch": 0.06069895769466585, "percentage": 6.07, "elapsed_time": "2:34:36", "remaining_time": "1 day, 15:52:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 17941, "loss": 1.5985, "learning_rate": 9.95059952865039e-05, "epoch": 0.06075469594782899, "percentage": 6.08, "elapsed_time": "2:34:45", "remaining_time": "1 day, 15:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1091, "total_steps": 17941, "loss": 1.9313, "learning_rate": 9.950474592014123e-05, "epoch": 0.06081043420099214, "percentage": 6.08, "elapsed_time": "2:34:53", "remaining_time": "1 day, 15:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1092, "total_steps": 17941, "loss": 1.5846, "learning_rate": 9.950349498377666e-05, "epoch": 0.060866172454155286, "percentage": 6.09, "elapsed_time": "2:35:02", "remaining_time": "1 day, 15:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1093, "total_steps": 17941, "loss": 1.7246, "learning_rate": 9.950224247744986e-05, "epoch": 0.060921910707318436, "percentage": 6.09, "elapsed_time": "2:35:10", "remaining_time": "1 day, 15:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1094, "total_steps": 17941, "loss": 1.3499, "learning_rate": 9.950098840120055e-05, "epoch": 0.06097764896048158, "percentage": 6.1, "elapsed_time": "2:35:19", "remaining_time": "1 day, 15:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1095, "total_steps": 17941, "loss": 1.7099, "learning_rate": 9.949973275506847e-05, "epoch": 0.06103338721364472, "percentage": 6.1, "elapsed_time": "2:35:27", "remaining_time": "1 day, 15:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1096, "total_steps": 17941, "loss": 2.0376, "learning_rate": 9.94984755390935e-05, "epoch": 0.06108912546680787, "percentage": 6.11, "elapsed_time": "2:35:36", "remaining_time": "1 day, 15:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1097, "total_steps": 17941, "loss": 1.8721, "learning_rate": 9.949721675331546e-05, "epoch": 0.061144863719971014, "percentage": 6.11, "elapsed_time": "2:35:44", "remaining_time": "1 day, 15:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1098, "total_steps": 17941, "loss": 1.8502, "learning_rate": 9.94959563977743e-05, "epoch": 0.061200601973134164, "percentage": 6.12, "elapsed_time": "2:35:53", "remaining_time": "1 day, 15:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1099, "total_steps": 17941, "loss": 1.762, "learning_rate": 9.949469447250998e-05, "epoch": 0.06125634022629731, "percentage": 6.13, "elapsed_time": "2:36:01", "remaining_time": "1 day, 15:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 17941, "loss": 1.779, "learning_rate": 9.949343097756253e-05, "epoch": 0.061312078479460456, "percentage": 6.13, "elapsed_time": "2:36:10", "remaining_time": "1 day, 15:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1101, "total_steps": 17941, "loss": 1.6705, "learning_rate": 9.949216591297203e-05, "epoch": 0.0613678167326236, "percentage": 6.14, "elapsed_time": "2:36:18", "remaining_time": "1 day, 15:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1102, "total_steps": 17941, "loss": 1.6734, "learning_rate": 9.949089927877858e-05, "epoch": 0.06142355498578674, "percentage": 6.14, "elapsed_time": "2:36:27", "remaining_time": "1 day, 15:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1103, "total_steps": 17941, "loss": 2.0193, "learning_rate": 9.948963107502235e-05, "epoch": 0.06147929323894989, "percentage": 6.15, "elapsed_time": "2:36:36", "remaining_time": "1 day, 15:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1104, "total_steps": 17941, "loss": 1.9377, "learning_rate": 9.948836130174358e-05, "epoch": 0.061535031492113035, "percentage": 6.15, "elapsed_time": "2:36:44", "remaining_time": "1 day, 15:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1105, "total_steps": 17941, "loss": 1.6455, "learning_rate": 9.94870899589825e-05, "epoch": 0.061590769745276185, "percentage": 6.16, "elapsed_time": "2:36:53", "remaining_time": "1 day, 15:50:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1106, "total_steps": 17941, "loss": 1.9186, "learning_rate": 9.948581704677949e-05, "epoch": 0.06164650799843933, "percentage": 6.16, "elapsed_time": "2:37:01", "remaining_time": "1 day, 15:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1107, "total_steps": 17941, "loss": 1.9353, "learning_rate": 9.948454256517486e-05, "epoch": 0.06170224625160248, "percentage": 6.17, "elapsed_time": "2:37:10", "remaining_time": "1 day, 15:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1108, "total_steps": 17941, "loss": 1.6834, "learning_rate": 9.948326651420907e-05, "epoch": 0.06175798450476562, "percentage": 6.18, "elapsed_time": "2:37:18", "remaining_time": "1 day, 15:49:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1109, "total_steps": 17941, "loss": 1.8998, "learning_rate": 9.948198889392255e-05, "epoch": 0.06181372275792877, "percentage": 6.18, "elapsed_time": "2:37:27", "remaining_time": "1 day, 15:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 17941, "loss": 2.1707, "learning_rate": 9.948070970435587e-05, "epoch": 0.06186946101109191, "percentage": 6.19, "elapsed_time": "2:37:35", "remaining_time": "1 day, 15:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1111, "total_steps": 17941, "loss": 1.9854, "learning_rate": 9.947942894554956e-05, "epoch": 0.061925199264255056, "percentage": 6.19, "elapsed_time": "2:37:44", "remaining_time": "1 day, 15:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1112, "total_steps": 17941, "loss": 1.6627, "learning_rate": 9.947814661754425e-05, "epoch": 0.061980937517418205, "percentage": 6.2, "elapsed_time": "2:37:52", "remaining_time": "1 day, 15:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1113, "total_steps": 17941, "loss": 2.0686, "learning_rate": 9.947686272038059e-05, "epoch": 0.06203667577058135, "percentage": 6.2, "elapsed_time": "2:38:01", "remaining_time": "1 day, 15:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1114, "total_steps": 17941, "loss": 1.7178, "learning_rate": 9.947557725409934e-05, "epoch": 0.0620924140237445, "percentage": 6.21, "elapsed_time": "2:38:09", "remaining_time": "1 day, 15:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1115, "total_steps": 17941, "loss": 1.9185, "learning_rate": 9.947429021874123e-05, "epoch": 0.06214815227690764, "percentage": 6.21, "elapsed_time": "2:38:18", "remaining_time": "1 day, 15:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1116, "total_steps": 17941, "loss": 1.7684, "learning_rate": 9.94730016143471e-05, "epoch": 0.06220389053007079, "percentage": 6.22, "elapsed_time": "2:38:26", "remaining_time": "1 day, 15:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1117, "total_steps": 17941, "loss": 1.8471, "learning_rate": 9.947171144095779e-05, "epoch": 0.06225962878323393, "percentage": 6.23, "elapsed_time": "2:38:35", "remaining_time": "1 day, 15:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1118, "total_steps": 17941, "loss": 2.0452, "learning_rate": 9.947041969861424e-05, "epoch": 0.062315367036397076, "percentage": 6.23, "elapsed_time": "2:38:43", "remaining_time": "1 day, 15:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1119, "total_steps": 17941, "loss": 1.6376, "learning_rate": 9.946912638735741e-05, "epoch": 0.062371105289560226, "percentage": 6.24, "elapsed_time": "2:38:52", "remaining_time": "1 day, 15:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 17941, "loss": 1.7909, "learning_rate": 9.946783150722832e-05, "epoch": 0.06242684354272337, "percentage": 6.24, "elapsed_time": "2:39:00", "remaining_time": "1 day, 15:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1121, "total_steps": 17941, "loss": 2.3971, "learning_rate": 9.946653505826802e-05, "epoch": 0.06248258179588652, "percentage": 6.25, "elapsed_time": "2:39:09", "remaining_time": "1 day, 15:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1122, "total_steps": 17941, "loss": 1.6772, "learning_rate": 9.946523704051765e-05, "epoch": 0.06253832004904966, "percentage": 6.25, "elapsed_time": "2:39:18", "remaining_time": "1 day, 15:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1123, "total_steps": 17941, "loss": 1.5496, "learning_rate": 9.946393745401836e-05, "epoch": 0.0625940583022128, "percentage": 6.26, "elapsed_time": "2:39:26", "remaining_time": "1 day, 15:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1124, "total_steps": 17941, "loss": 1.926, "learning_rate": 9.946263629881137e-05, "epoch": 0.06264979655537596, "percentage": 6.26, "elapsed_time": "2:39:35", "remaining_time": "1 day, 15:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1125, "total_steps": 17941, "loss": 1.8916, "learning_rate": 9.946133357493794e-05, "epoch": 0.0627055348085391, "percentage": 6.27, "elapsed_time": "2:39:43", "remaining_time": "1 day, 15:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1126, "total_steps": 17941, "loss": 1.7043, "learning_rate": 9.946002928243939e-05, "epoch": 0.06276127306170225, "percentage": 6.28, "elapsed_time": "2:39:52", "remaining_time": "1 day, 15:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1127, "total_steps": 17941, "loss": 2.0595, "learning_rate": 9.945872342135709e-05, "epoch": 0.06281701131486539, "percentage": 6.28, "elapsed_time": "2:40:00", "remaining_time": "1 day, 15:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1128, "total_steps": 17941, "loss": 1.7227, "learning_rate": 9.945741599173244e-05, "epoch": 0.06287274956802853, "percentage": 6.29, "elapsed_time": "2:40:09", "remaining_time": "1 day, 15:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1129, "total_steps": 17941, "loss": 1.7466, "learning_rate": 9.945610699360692e-05, "epoch": 0.06292848782119169, "percentage": 6.29, "elapsed_time": "2:40:18", "remaining_time": "1 day, 15:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 17941, "loss": 1.9668, "learning_rate": 9.945479642702203e-05, "epoch": 0.06298422607435483, "percentage": 6.3, "elapsed_time": "2:40:27", "remaining_time": "1 day, 15:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1131, "total_steps": 17941, "loss": 1.664, "learning_rate": 9.945348429201933e-05, "epoch": 0.06303996432751797, "percentage": 6.3, "elapsed_time": "2:40:35", "remaining_time": "1 day, 15:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1132, "total_steps": 17941, "loss": 1.7043, "learning_rate": 9.945217058864045e-05, "epoch": 0.06309570258068112, "percentage": 6.31, "elapsed_time": "2:40:44", "remaining_time": "1 day, 15:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1133, "total_steps": 17941, "loss": 1.6095, "learning_rate": 9.945085531692704e-05, "epoch": 0.06315144083384426, "percentage": 6.32, "elapsed_time": "2:40:52", "remaining_time": "1 day, 15:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1134, "total_steps": 17941, "loss": 1.6696, "learning_rate": 9.944953847692082e-05, "epoch": 0.06320717908700742, "percentage": 6.32, "elapsed_time": "2:41:01", "remaining_time": "1 day, 15:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1135, "total_steps": 17941, "loss": 1.8795, "learning_rate": 9.944822006866356e-05, "epoch": 0.06326291734017056, "percentage": 6.33, "elapsed_time": "2:41:10", "remaining_time": "1 day, 15:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1136, "total_steps": 17941, "loss": 1.6658, "learning_rate": 9.944690009219705e-05, "epoch": 0.0633186555933337, "percentage": 6.33, "elapsed_time": "2:41:18", "remaining_time": "1 day, 15:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1137, "total_steps": 17941, "loss": 1.5768, "learning_rate": 9.944557854756316e-05, "epoch": 0.06337439384649685, "percentage": 6.34, "elapsed_time": "2:41:27", "remaining_time": "1 day, 15:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1138, "total_steps": 17941, "loss": 1.9228, "learning_rate": 9.944425543480382e-05, "epoch": 0.06343013209966, "percentage": 6.34, "elapsed_time": "2:41:36", "remaining_time": "1 day, 15:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1139, "total_steps": 17941, "loss": 1.5889, "learning_rate": 9.944293075396098e-05, "epoch": 0.06348587035282315, "percentage": 6.35, "elapsed_time": "2:41:44", "remaining_time": "1 day, 15:45:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 17941, "loss": 1.7821, "learning_rate": 9.944160450507665e-05, "epoch": 0.06354160860598629, "percentage": 6.35, "elapsed_time": "2:41:52", "remaining_time": "1 day, 15:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1141, "total_steps": 17941, "loss": 1.6987, "learning_rate": 9.944027668819286e-05, "epoch": 0.06359734685914943, "percentage": 6.36, "elapsed_time": "2:42:01", "remaining_time": "1 day, 15:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1142, "total_steps": 17941, "loss": 1.4687, "learning_rate": 9.943894730335179e-05, "epoch": 0.06365308511231257, "percentage": 6.37, "elapsed_time": "2:42:10", "remaining_time": "1 day, 15:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1143, "total_steps": 17941, "loss": 1.6539, "learning_rate": 9.943761635059554e-05, "epoch": 0.06370882336547573, "percentage": 6.37, "elapsed_time": "2:42:18", "remaining_time": "1 day, 15:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1144, "total_steps": 17941, "loss": 1.9439, "learning_rate": 9.943628382996634e-05, "epoch": 0.06376456161863887, "percentage": 6.38, "elapsed_time": "2:42:26", "remaining_time": "1 day, 15:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1145, "total_steps": 17941, "loss": 1.6248, "learning_rate": 9.943494974150644e-05, "epoch": 0.06382029987180202, "percentage": 6.38, "elapsed_time": "2:42:35", "remaining_time": "1 day, 15:45:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1146, "total_steps": 17941, "loss": 1.8027, "learning_rate": 9.943361408525818e-05, "epoch": 0.06387603812496516, "percentage": 6.39, "elapsed_time": "2:42:43", "remaining_time": "1 day, 15:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1147, "total_steps": 17941, "loss": 2.1447, "learning_rate": 9.94322768612639e-05, "epoch": 0.06393177637812832, "percentage": 6.39, "elapsed_time": "2:42:52", "remaining_time": "1 day, 15:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1148, "total_steps": 17941, "loss": 1.8147, "learning_rate": 9.943093806956601e-05, "epoch": 0.06398751463129146, "percentage": 6.4, "elapsed_time": "2:43:01", "remaining_time": "1 day, 15:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1149, "total_steps": 17941, "loss": 1.9251, "learning_rate": 9.942959771020694e-05, "epoch": 0.0640432528844546, "percentage": 6.4, "elapsed_time": "2:43:09", "remaining_time": "1 day, 15:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 17941, "loss": 1.9842, "learning_rate": 9.942825578322926e-05, "epoch": 0.06409899113761774, "percentage": 6.41, "elapsed_time": "2:43:18", "remaining_time": "1 day, 15:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1151, "total_steps": 17941, "loss": 1.7163, "learning_rate": 9.942691228867546e-05, "epoch": 0.06415472939078089, "percentage": 6.42, "elapsed_time": "2:43:27", "remaining_time": "1 day, 15:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1152, "total_steps": 17941, "loss": 1.8273, "learning_rate": 9.94255672265882e-05, "epoch": 0.06421046764394404, "percentage": 6.42, "elapsed_time": "2:43:35", "remaining_time": "1 day, 15:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1153, "total_steps": 17941, "loss": 1.8914, "learning_rate": 9.942422059701012e-05, "epoch": 0.06426620589710719, "percentage": 6.43, "elapsed_time": "2:43:44", "remaining_time": "1 day, 15:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1154, "total_steps": 17941, "loss": 1.7668, "learning_rate": 9.942287239998392e-05, "epoch": 0.06432194415027033, "percentage": 6.43, "elapsed_time": "2:43:52", "remaining_time": "1 day, 15:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1155, "total_steps": 17941, "loss": 1.5809, "learning_rate": 9.942152263555237e-05, "epoch": 0.06437768240343347, "percentage": 6.44, "elapsed_time": "2:44:01", "remaining_time": "1 day, 15:43:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1156, "total_steps": 17941, "loss": 1.8543, "learning_rate": 9.942017130375825e-05, "epoch": 0.06443342065659662, "percentage": 6.44, "elapsed_time": "2:44:09", "remaining_time": "1 day, 15:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1157, "total_steps": 17941, "loss": 1.7744, "learning_rate": 9.941881840464447e-05, "epoch": 0.06448915890975977, "percentage": 6.45, "elapsed_time": "2:44:18", "remaining_time": "1 day, 15:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1158, "total_steps": 17941, "loss": 1.5802, "learning_rate": 9.941746393825386e-05, "epoch": 0.06454489716292292, "percentage": 6.45, "elapsed_time": "2:44:28", "remaining_time": "1 day, 15:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1159, "total_steps": 17941, "loss": 1.8704, "learning_rate": 9.941610790462946e-05, "epoch": 0.06460063541608606, "percentage": 6.46, "elapsed_time": "2:44:36", "remaining_time": "1 day, 15:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 17941, "loss": 1.7503, "learning_rate": 9.94147503038142e-05, "epoch": 0.0646563736692492, "percentage": 6.47, "elapsed_time": "2:44:45", "remaining_time": "1 day, 15:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1161, "total_steps": 17941, "loss": 1.7069, "learning_rate": 9.941339113585117e-05, "epoch": 0.06471211192241236, "percentage": 6.47, "elapsed_time": "2:44:53", "remaining_time": "1 day, 15:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1162, "total_steps": 17941, "loss": 1.6529, "learning_rate": 9.94120304007835e-05, "epoch": 0.0647678501755755, "percentage": 6.48, "elapsed_time": "2:45:02", "remaining_time": "1 day, 15:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1163, "total_steps": 17941, "loss": 1.8965, "learning_rate": 9.941066809865429e-05, "epoch": 0.06482358842873864, "percentage": 6.48, "elapsed_time": "2:45:10", "remaining_time": "1 day, 15:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1164, "total_steps": 17941, "loss": 1.797, "learning_rate": 9.940930422950679e-05, "epoch": 0.06487932668190179, "percentage": 6.49, "elapsed_time": "2:45:19", "remaining_time": "1 day, 15:42:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1165, "total_steps": 17941, "loss": 1.9707, "learning_rate": 9.940793879338424e-05, "epoch": 0.06493506493506493, "percentage": 6.49, "elapsed_time": "2:45:27", "remaining_time": "1 day, 15:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1166, "total_steps": 17941, "loss": 1.8563, "learning_rate": 9.940657179032993e-05, "epoch": 0.06499080318822809, "percentage": 6.5, "elapsed_time": "2:45:36", "remaining_time": "1 day, 15:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1167, "total_steps": 17941, "loss": 1.6063, "learning_rate": 9.940520322038722e-05, "epoch": 0.06504654144139123, "percentage": 6.5, "elapsed_time": "2:45:45", "remaining_time": "1 day, 15:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1168, "total_steps": 17941, "loss": 1.8387, "learning_rate": 9.940383308359951e-05, "epoch": 0.06510227969455437, "percentage": 6.51, "elapsed_time": "2:45:53", "remaining_time": "1 day, 15:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1169, "total_steps": 17941, "loss": 1.4808, "learning_rate": 9.940246138001027e-05, "epoch": 0.06515801794771751, "percentage": 6.52, "elapsed_time": "2:46:02", "remaining_time": "1 day, 15:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 17941, "loss": 1.9234, "learning_rate": 9.9401088109663e-05, "epoch": 0.06521375620088067, "percentage": 6.52, "elapsed_time": "2:46:10", "remaining_time": "1 day, 15:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1171, "total_steps": 17941, "loss": 2.1587, "learning_rate": 9.939971327260122e-05, "epoch": 0.06526949445404381, "percentage": 6.53, "elapsed_time": "2:46:19", "remaining_time": "1 day, 15:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1172, "total_steps": 17941, "loss": 1.8453, "learning_rate": 9.939833686886857e-05, "epoch": 0.06532523270720696, "percentage": 6.53, "elapsed_time": "2:46:27", "remaining_time": "1 day, 15:41:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1173, "total_steps": 17941, "loss": 1.7421, "learning_rate": 9.939695889850869e-05, "epoch": 0.0653809709603701, "percentage": 6.54, "elapsed_time": "2:46:36", "remaining_time": "1 day, 15:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1174, "total_steps": 17941, "loss": 1.7447, "learning_rate": 9.939557936156527e-05, "epoch": 0.06543670921353324, "percentage": 6.54, "elapsed_time": "2:46:44", "remaining_time": "1 day, 15:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1175, "total_steps": 17941, "loss": 1.5579, "learning_rate": 9.939419825808207e-05, "epoch": 0.0654924474666964, "percentage": 6.55, "elapsed_time": "2:46:53", "remaining_time": "1 day, 15:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1176, "total_steps": 17941, "loss": 2.1224, "learning_rate": 9.93928155881029e-05, "epoch": 0.06554818571985954, "percentage": 6.55, "elapsed_time": "2:47:02", "remaining_time": "1 day, 15:41:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1177, "total_steps": 17941, "loss": 1.8331, "learning_rate": 9.939143135167158e-05, "epoch": 0.06560392397302268, "percentage": 6.56, "elapsed_time": "2:47:10", "remaining_time": "1 day, 15:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1178, "total_steps": 17941, "loss": 1.7895, "learning_rate": 9.939004554883205e-05, "epoch": 0.06565966222618583, "percentage": 6.57, "elapsed_time": "2:47:19", "remaining_time": "1 day, 15:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1179, "total_steps": 17941, "loss": 1.7342, "learning_rate": 9.938865817962822e-05, "epoch": 0.06571540047934897, "percentage": 6.57, "elapsed_time": "2:47:28", "remaining_time": "1 day, 15:40:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 17941, "loss": 1.5657, "learning_rate": 9.938726924410412e-05, "epoch": 0.06577113873251213, "percentage": 6.58, "elapsed_time": "2:47:36", "remaining_time": "1 day, 15:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1181, "total_steps": 17941, "loss": 1.7487, "learning_rate": 9.938587874230379e-05, "epoch": 0.06582687698567527, "percentage": 6.58, "elapsed_time": "2:47:45", "remaining_time": "1 day, 15:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1182, "total_steps": 17941, "loss": 1.8534, "learning_rate": 9.938448667427131e-05, "epoch": 0.06588261523883841, "percentage": 6.59, "elapsed_time": "2:47:54", "remaining_time": "1 day, 15:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1183, "total_steps": 17941, "loss": 1.6074, "learning_rate": 9.938309304005086e-05, "epoch": 0.06593835349200156, "percentage": 6.59, "elapsed_time": "2:48:03", "remaining_time": "1 day, 15:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1184, "total_steps": 17941, "loss": 1.7358, "learning_rate": 9.938169783968663e-05, "epoch": 0.06599409174516471, "percentage": 6.6, "elapsed_time": "2:48:13", "remaining_time": "1 day, 15:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1185, "total_steps": 17941, "loss": 1.5923, "learning_rate": 9.938030107322283e-05, "epoch": 0.06604982999832786, "percentage": 6.6, "elapsed_time": "2:48:22", "remaining_time": "1 day, 15:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1186, "total_steps": 17941, "loss": 1.8394, "learning_rate": 9.93789027407038e-05, "epoch": 0.066105568251491, "percentage": 6.61, "elapsed_time": "2:48:30", "remaining_time": "1 day, 15:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1187, "total_steps": 17941, "loss": 1.6385, "learning_rate": 9.937750284217389e-05, "epoch": 0.06616130650465414, "percentage": 6.62, "elapsed_time": "2:48:39", "remaining_time": "1 day, 15:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1188, "total_steps": 17941, "loss": 1.6236, "learning_rate": 9.937610137767747e-05, "epoch": 0.06621704475781728, "percentage": 6.62, "elapsed_time": "2:48:47", "remaining_time": "1 day, 15:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1189, "total_steps": 17941, "loss": 1.6139, "learning_rate": 9.937469834725898e-05, "epoch": 0.06627278301098044, "percentage": 6.63, "elapsed_time": "2:48:56", "remaining_time": "1 day, 15:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 17941, "loss": 1.62, "learning_rate": 9.937329375096297e-05, "epoch": 0.06632852126414358, "percentage": 6.63, "elapsed_time": "2:49:04", "remaining_time": "1 day, 15:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1191, "total_steps": 17941, "loss": 1.8803, "learning_rate": 9.937188758883393e-05, "epoch": 0.06638425951730673, "percentage": 6.64, "elapsed_time": "2:49:13", "remaining_time": "1 day, 15:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1192, "total_steps": 17941, "loss": 1.9219, "learning_rate": 9.937047986091646e-05, "epoch": 0.06643999777046987, "percentage": 6.64, "elapsed_time": "2:49:22", "remaining_time": "1 day, 15:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1193, "total_steps": 17941, "loss": 1.7777, "learning_rate": 9.936907056725524e-05, "epoch": 0.06649573602363303, "percentage": 6.65, "elapsed_time": "2:49:30", "remaining_time": "1 day, 15:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1194, "total_steps": 17941, "loss": 1.9888, "learning_rate": 9.936765970789492e-05, "epoch": 0.06655147427679617, "percentage": 6.66, "elapsed_time": "2:49:39", "remaining_time": "1 day, 15:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1195, "total_steps": 17941, "loss": 1.6308, "learning_rate": 9.936624728288029e-05, "epoch": 0.06660721252995931, "percentage": 6.66, "elapsed_time": "2:49:47", "remaining_time": "1 day, 15:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1196, "total_steps": 17941, "loss": 1.6621, "learning_rate": 9.93648332922561e-05, "epoch": 0.06666295078312245, "percentage": 6.67, "elapsed_time": "2:49:56", "remaining_time": "1 day, 15:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1197, "total_steps": 17941, "loss": 1.6883, "learning_rate": 9.936341773606723e-05, "epoch": 0.0667186890362856, "percentage": 6.67, "elapsed_time": "2:50:05", "remaining_time": "1 day, 15:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1198, "total_steps": 17941, "loss": 1.6099, "learning_rate": 9.936200061435857e-05, "epoch": 0.06677442728944875, "percentage": 6.68, "elapsed_time": "2:50:14", "remaining_time": "1 day, 15:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1199, "total_steps": 17941, "loss": 1.725, "learning_rate": 9.936058192717502e-05, "epoch": 0.0668301655426119, "percentage": 6.68, "elapsed_time": "2:50:22", "remaining_time": "1 day, 15:38:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 17941, "loss": 1.5314, "learning_rate": 9.935916167456163e-05, "epoch": 0.06688590379577504, "percentage": 6.69, "elapsed_time": "2:50:30", "remaining_time": "1 day, 15:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1201, "total_steps": 17941, "loss": 1.094, "learning_rate": 9.93577398565634e-05, "epoch": 0.06694164204893818, "percentage": 6.69, "elapsed_time": "2:50:39", "remaining_time": "1 day, 15:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1202, "total_steps": 17941, "loss": 1.9806, "learning_rate": 9.935631647322544e-05, "epoch": 0.06699738030210133, "percentage": 6.7, "elapsed_time": "2:50:48", "remaining_time": "1 day, 15:38:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1203, "total_steps": 17941, "loss": 1.7586, "learning_rate": 9.93548915245929e-05, "epoch": 0.06705311855526448, "percentage": 6.71, "elapsed_time": "2:50:56", "remaining_time": "1 day, 15:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1204, "total_steps": 17941, "loss": 1.6344, "learning_rate": 9.935346501071095e-05, "epoch": 0.06710885680842762, "percentage": 6.71, "elapsed_time": "2:51:05", "remaining_time": "1 day, 15:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1205, "total_steps": 17941, "loss": 1.7792, "learning_rate": 9.935203693162483e-05, "epoch": 0.06716459506159077, "percentage": 6.72, "elapsed_time": "2:51:13", "remaining_time": "1 day, 15:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1206, "total_steps": 17941, "loss": 1.8226, "learning_rate": 9.935060728737986e-05, "epoch": 0.06722033331475391, "percentage": 6.72, "elapsed_time": "2:51:21", "remaining_time": "1 day, 15:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1207, "total_steps": 17941, "loss": 1.65, "learning_rate": 9.934917607802135e-05, "epoch": 0.06727607156791707, "percentage": 6.73, "elapsed_time": "2:51:30", "remaining_time": "1 day, 15:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1208, "total_steps": 17941, "loss": 1.5889, "learning_rate": 9.934774330359471e-05, "epoch": 0.06733180982108021, "percentage": 6.73, "elapsed_time": "2:51:38", "remaining_time": "1 day, 15:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1209, "total_steps": 17941, "loss": 1.6367, "learning_rate": 9.934630896414536e-05, "epoch": 0.06738754807424335, "percentage": 6.74, "elapsed_time": "2:51:47", "remaining_time": "1 day, 15:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 17941, "loss": 1.6565, "learning_rate": 9.93448730597188e-05, "epoch": 0.0674432863274065, "percentage": 6.74, "elapsed_time": "2:51:55", "remaining_time": "1 day, 15:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1211, "total_steps": 17941, "loss": 1.7874, "learning_rate": 9.934343559036056e-05, "epoch": 0.06749902458056964, "percentage": 6.75, "elapsed_time": "2:52:04", "remaining_time": "1 day, 15:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1212, "total_steps": 17941, "loss": 1.4178, "learning_rate": 9.934199655611624e-05, "epoch": 0.0675547628337328, "percentage": 6.76, "elapsed_time": "2:52:12", "remaining_time": "1 day, 15:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1213, "total_steps": 17941, "loss": 1.8371, "learning_rate": 9.934055595703149e-05, "epoch": 0.06761050108689594, "percentage": 6.76, "elapsed_time": "2:52:21", "remaining_time": "1 day, 15:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1214, "total_steps": 17941, "loss": 1.77, "learning_rate": 9.933911379315198e-05, "epoch": 0.06766623934005908, "percentage": 6.77, "elapsed_time": "2:52:29", "remaining_time": "1 day, 15:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1215, "total_steps": 17941, "loss": 1.7457, "learning_rate": 9.933767006452341e-05, "epoch": 0.06772197759322222, "percentage": 6.77, "elapsed_time": "2:52:37", "remaining_time": "1 day, 15:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1216, "total_steps": 17941, "loss": 1.4759, "learning_rate": 9.933622477119165e-05, "epoch": 0.06777771584638538, "percentage": 6.78, "elapsed_time": "2:52:46", "remaining_time": "1 day, 15:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1217, "total_steps": 17941, "loss": 1.5853, "learning_rate": 9.933477791320246e-05, "epoch": 0.06783345409954852, "percentage": 6.78, "elapsed_time": "2:52:54", "remaining_time": "1 day, 15:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1218, "total_steps": 17941, "loss": 1.624, "learning_rate": 9.933332949060177e-05, "epoch": 0.06788919235271167, "percentage": 6.79, "elapsed_time": "2:53:03", "remaining_time": "1 day, 15:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1219, "total_steps": 17941, "loss": 1.9126, "learning_rate": 9.93318795034355e-05, "epoch": 0.06794493060587481, "percentage": 6.79, "elapsed_time": "2:53:11", "remaining_time": "1 day, 15:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 17941, "loss": 1.7807, "learning_rate": 9.933042795174963e-05, "epoch": 0.06800066885903795, "percentage": 6.8, "elapsed_time": "2:53:20", "remaining_time": "1 day, 15:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1221, "total_steps": 17941, "loss": 1.8777, "learning_rate": 9.93289748355902e-05, "epoch": 0.06805640711220111, "percentage": 6.81, "elapsed_time": "2:53:28", "remaining_time": "1 day, 15:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1222, "total_steps": 17941, "loss": 1.7479, "learning_rate": 9.93275201550033e-05, "epoch": 0.06811214536536425, "percentage": 6.81, "elapsed_time": "2:53:37", "remaining_time": "1 day, 15:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1223, "total_steps": 17941, "loss": 1.9158, "learning_rate": 9.932606391003508e-05, "epoch": 0.0681678836185274, "percentage": 6.82, "elapsed_time": "2:53:45", "remaining_time": "1 day, 15:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1224, "total_steps": 17941, "loss": 1.7554, "learning_rate": 9.932460610073167e-05, "epoch": 0.06822362187169054, "percentage": 6.82, "elapsed_time": "2:53:54", "remaining_time": "1 day, 15:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1225, "total_steps": 17941, "loss": 1.7927, "learning_rate": 9.932314672713936e-05, "epoch": 0.06827936012485368, "percentage": 6.83, "elapsed_time": "2:54:02", "remaining_time": "1 day, 15:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1226, "total_steps": 17941, "loss": 1.7221, "learning_rate": 9.932168578930439e-05, "epoch": 0.06833509837801684, "percentage": 6.83, "elapsed_time": "2:54:11", "remaining_time": "1 day, 15:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1227, "total_steps": 17941, "loss": 2.0262, "learning_rate": 9.932022328727313e-05, "epoch": 0.06839083663117998, "percentage": 6.84, "elapsed_time": "2:54:19", "remaining_time": "1 day, 15:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1228, "total_steps": 17941, "loss": 1.7353, "learning_rate": 9.931875922109195e-05, "epoch": 0.06844657488434312, "percentage": 6.84, "elapsed_time": "2:54:28", "remaining_time": "1 day, 15:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1229, "total_steps": 17941, "loss": 1.8789, "learning_rate": 9.931729359080726e-05, "epoch": 0.06850231313750627, "percentage": 6.85, "elapsed_time": "2:54:37", "remaining_time": "1 day, 15:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 17941, "loss": 1.9549, "learning_rate": 9.931582639646556e-05, "epoch": 0.06855805139066942, "percentage": 6.86, "elapsed_time": "2:54:45", "remaining_time": "1 day, 15:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1231, "total_steps": 17941, "loss": 1.7371, "learning_rate": 9.931435763811338e-05, "epoch": 0.06861378964383257, "percentage": 6.86, "elapsed_time": "2:54:54", "remaining_time": "1 day, 15:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1232, "total_steps": 17941, "loss": 1.8187, "learning_rate": 9.93128873157973e-05, "epoch": 0.06866952789699571, "percentage": 6.87, "elapsed_time": "2:55:02", "remaining_time": "1 day, 15:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1233, "total_steps": 17941, "loss": 1.6269, "learning_rate": 9.931141542956394e-05, "epoch": 0.06872526615015885, "percentage": 6.87, "elapsed_time": "2:55:10", "remaining_time": "1 day, 15:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1234, "total_steps": 17941, "loss": 1.9831, "learning_rate": 9.930994197945999e-05, "epoch": 0.068781004403322, "percentage": 6.88, "elapsed_time": "2:55:19", "remaining_time": "1 day, 15:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1235, "total_steps": 17941, "loss": 1.9577, "learning_rate": 9.930846696553219e-05, "epoch": 0.06883674265648515, "percentage": 6.88, "elapsed_time": "2:55:27", "remaining_time": "1 day, 15:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1236, "total_steps": 17941, "loss": 1.7921, "learning_rate": 9.930699038782729e-05, "epoch": 0.0688924809096483, "percentage": 6.89, "elapsed_time": "2:55:36", "remaining_time": "1 day, 15:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1237, "total_steps": 17941, "loss": 1.921, "learning_rate": 9.930551224639215e-05, "epoch": 0.06894821916281144, "percentage": 6.89, "elapsed_time": "2:55:44", "remaining_time": "1 day, 15:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1238, "total_steps": 17941, "loss": 1.8209, "learning_rate": 9.930403254127363e-05, "epoch": 0.06900395741597458, "percentage": 6.9, "elapsed_time": "2:55:53", "remaining_time": "1 day, 15:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1239, "total_steps": 17941, "loss": 1.9209, "learning_rate": 9.930255127251866e-05, "epoch": 0.06905969566913774, "percentage": 6.91, "elapsed_time": "2:56:02", "remaining_time": "1 day, 15:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 17941, "loss": 1.9073, "learning_rate": 9.93010684401742e-05, "epoch": 0.06911543392230088, "percentage": 6.91, "elapsed_time": "2:56:10", "remaining_time": "1 day, 15:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1241, "total_steps": 17941, "loss": 1.6648, "learning_rate": 9.929958404428732e-05, "epoch": 0.06917117217546402, "percentage": 6.92, "elapsed_time": "2:56:19", "remaining_time": "1 day, 15:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1242, "total_steps": 17941, "loss": 1.6878, "learning_rate": 9.929809808490505e-05, "epoch": 0.06922691042862716, "percentage": 6.92, "elapsed_time": "2:56:28", "remaining_time": "1 day, 15:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1243, "total_steps": 17941, "loss": 1.8051, "learning_rate": 9.929661056207455e-05, "epoch": 0.06928264868179031, "percentage": 6.93, "elapsed_time": "2:56:36", "remaining_time": "1 day, 15:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1244, "total_steps": 17941, "loss": 1.7016, "learning_rate": 9.929512147584297e-05, "epoch": 0.06933838693495346, "percentage": 6.93, "elapsed_time": "2:56:45", "remaining_time": "1 day, 15:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1245, "total_steps": 17941, "loss": 1.7512, "learning_rate": 9.929363082625755e-05, "epoch": 0.0693941251881166, "percentage": 6.94, "elapsed_time": "2:56:53", "remaining_time": "1 day, 15:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1246, "total_steps": 17941, "loss": 1.7578, "learning_rate": 9.929213861336557e-05, "epoch": 0.06944986344127975, "percentage": 6.94, "elapsed_time": "2:57:02", "remaining_time": "1 day, 15:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1247, "total_steps": 17941, "loss": 1.7655, "learning_rate": 9.929064483721435e-05, "epoch": 0.06950560169444289, "percentage": 6.95, "elapsed_time": "2:57:11", "remaining_time": "1 day, 15:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1248, "total_steps": 17941, "loss": 1.8085, "learning_rate": 9.928914949785124e-05, "epoch": 0.06956133994760604, "percentage": 6.96, "elapsed_time": "2:57:19", "remaining_time": "1 day, 15:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1249, "total_steps": 17941, "loss": 1.4068, "learning_rate": 9.928765259532371e-05, "epoch": 0.06961707820076919, "percentage": 6.96, "elapsed_time": "2:57:28", "remaining_time": "1 day, 15:31:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 17941, "loss": 1.9137, "learning_rate": 9.928615412967919e-05, "epoch": 0.06967281645393233, "percentage": 6.97, "elapsed_time": "2:57:36", "remaining_time": "1 day, 15:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1251, "total_steps": 17941, "loss": 1.6562, "learning_rate": 9.928465410096521e-05, "epoch": 0.06972855470709548, "percentage": 6.97, "elapsed_time": "2:57:44", "remaining_time": "1 day, 15:31:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1252, "total_steps": 17941, "loss": 1.7661, "learning_rate": 9.928315250922937e-05, "epoch": 0.06978429296025862, "percentage": 6.98, "elapsed_time": "2:57:53", "remaining_time": "1 day, 15:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1253, "total_steps": 17941, "loss": 1.9336, "learning_rate": 9.928164935451927e-05, "epoch": 0.06984003121342178, "percentage": 6.98, "elapsed_time": "2:58:01", "remaining_time": "1 day, 15:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1254, "total_steps": 17941, "loss": 1.8955, "learning_rate": 9.928014463688257e-05, "epoch": 0.06989576946658492, "percentage": 6.99, "elapsed_time": "2:58:10", "remaining_time": "1 day, 15:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1255, "total_steps": 17941, "loss": 1.7892, "learning_rate": 9.927863835636703e-05, "epoch": 0.06995150771974806, "percentage": 7.0, "elapsed_time": "2:58:18", "remaining_time": "1 day, 15:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1256, "total_steps": 17941, "loss": 1.8628, "learning_rate": 9.927713051302037e-05, "epoch": 0.0700072459729112, "percentage": 7.0, "elapsed_time": "2:58:27", "remaining_time": "1 day, 15:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1257, "total_steps": 17941, "loss": 1.9999, "learning_rate": 9.927562110689046e-05, "epoch": 0.07006298422607435, "percentage": 7.01, "elapsed_time": "2:58:35", "remaining_time": "1 day, 15:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1258, "total_steps": 17941, "loss": 1.6341, "learning_rate": 9.927411013802512e-05, "epoch": 0.0701187224792375, "percentage": 7.01, "elapsed_time": "2:58:44", "remaining_time": "1 day, 15:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1259, "total_steps": 17941, "loss": 1.8801, "learning_rate": 9.927259760647232e-05, "epoch": 0.07017446073240065, "percentage": 7.02, "elapsed_time": "2:58:52", "remaining_time": "1 day, 15:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 17941, "loss": 1.6122, "learning_rate": 9.927108351227998e-05, "epoch": 0.07023019898556379, "percentage": 7.02, "elapsed_time": "2:59:01", "remaining_time": "1 day, 15:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1261, "total_steps": 17941, "loss": 2.0343, "learning_rate": 9.926956785549616e-05, "epoch": 0.07028593723872693, "percentage": 7.03, "elapsed_time": "2:59:09", "remaining_time": "1 day, 15:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1262, "total_steps": 17941, "loss": 1.9449, "learning_rate": 9.92680506361689e-05, "epoch": 0.07034167549189009, "percentage": 7.03, "elapsed_time": "2:59:17", "remaining_time": "1 day, 15:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1263, "total_steps": 17941, "loss": 1.7354, "learning_rate": 9.926653185434634e-05, "epoch": 0.07039741374505323, "percentage": 7.04, "elapsed_time": "2:59:26", "remaining_time": "1 day, 15:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1264, "total_steps": 17941, "loss": 1.8347, "learning_rate": 9.926501151007662e-05, "epoch": 0.07045315199821638, "percentage": 7.05, "elapsed_time": "2:59:34", "remaining_time": "1 day, 15:29:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1265, "total_steps": 17941, "loss": 1.887, "learning_rate": 9.926348960340796e-05, "epoch": 0.07050889025137952, "percentage": 7.05, "elapsed_time": "2:59:43", "remaining_time": "1 day, 15:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1266, "total_steps": 17941, "loss": 1.8267, "learning_rate": 9.926196613438865e-05, "epoch": 0.07056462850454266, "percentage": 7.06, "elapsed_time": "2:59:51", "remaining_time": "1 day, 15:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1267, "total_steps": 17941, "loss": 1.4021, "learning_rate": 9.926044110306698e-05, "epoch": 0.07062036675770582, "percentage": 7.06, "elapsed_time": "3:00:00", "remaining_time": "1 day, 15:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1268, "total_steps": 17941, "loss": 2.1346, "learning_rate": 9.925891450949135e-05, "epoch": 0.07067610501086896, "percentage": 7.07, "elapsed_time": "3:00:08", "remaining_time": "1 day, 15:28:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1269, "total_steps": 17941, "loss": 1.7458, "learning_rate": 9.925738635371011e-05, "epoch": 0.0707318432640321, "percentage": 7.07, "elapsed_time": "3:00:17", "remaining_time": "1 day, 15:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 17941, "loss": 1.9184, "learning_rate": 9.925585663577181e-05, "epoch": 0.07078758151719525, "percentage": 7.08, "elapsed_time": "3:00:25", "remaining_time": "1 day, 15:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1271, "total_steps": 17941, "loss": 1.7406, "learning_rate": 9.92543253557249e-05, "epoch": 0.0708433197703584, "percentage": 7.08, "elapsed_time": "3:00:34", "remaining_time": "1 day, 15:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1272, "total_steps": 17941, "loss": 1.6771, "learning_rate": 9.925279251361795e-05, "epoch": 0.07089905802352155, "percentage": 7.09, "elapsed_time": "3:00:42", "remaining_time": "1 day, 15:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1273, "total_steps": 17941, "loss": 1.534, "learning_rate": 9.92512581094996e-05, "epoch": 0.07095479627668469, "percentage": 7.1, "elapsed_time": "3:00:51", "remaining_time": "1 day, 15:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1274, "total_steps": 17941, "loss": 1.6932, "learning_rate": 9.92497221434185e-05, "epoch": 0.07101053452984783, "percentage": 7.1, "elapsed_time": "3:00:59", "remaining_time": "1 day, 15:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1275, "total_steps": 17941, "loss": 1.7863, "learning_rate": 9.924818461542335e-05, "epoch": 0.07106627278301098, "percentage": 7.11, "elapsed_time": "3:01:08", "remaining_time": "1 day, 15:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1276, "total_steps": 17941, "loss": 1.5134, "learning_rate": 9.924664552556293e-05, "epoch": 0.07112201103617413, "percentage": 7.11, "elapsed_time": "3:01:16", "remaining_time": "1 day, 15:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1277, "total_steps": 17941, "loss": 1.7264, "learning_rate": 9.924510487388603e-05, "epoch": 0.07117774928933727, "percentage": 7.12, "elapsed_time": "3:01:25", "remaining_time": "1 day, 15:27:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1278, "total_steps": 17941, "loss": 2.0642, "learning_rate": 9.924356266044153e-05, "epoch": 0.07123348754250042, "percentage": 7.12, "elapsed_time": "3:01:33", "remaining_time": "1 day, 15:27:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1279, "total_steps": 17941, "loss": 1.5962, "learning_rate": 9.924201888527833e-05, "epoch": 0.07128922579566356, "percentage": 7.13, "elapsed_time": "3:01:42", "remaining_time": "1 day, 15:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 17941, "loss": 1.657, "learning_rate": 9.924047354844539e-05, "epoch": 0.0713449640488267, "percentage": 7.13, "elapsed_time": "3:01:50", "remaining_time": "1 day, 15:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1281, "total_steps": 17941, "loss": 1.8447, "learning_rate": 9.923892664999173e-05, "epoch": 0.07140070230198986, "percentage": 7.14, "elapsed_time": "3:01:59", "remaining_time": "1 day, 15:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1282, "total_steps": 17941, "loss": 1.7732, "learning_rate": 9.923737818996639e-05, "epoch": 0.071456440555153, "percentage": 7.15, "elapsed_time": "3:02:07", "remaining_time": "1 day, 15:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1283, "total_steps": 17941, "loss": 1.5262, "learning_rate": 9.92358281684185e-05, "epoch": 0.07151217880831615, "percentage": 7.15, "elapsed_time": "3:02:16", "remaining_time": "1 day, 15:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1284, "total_steps": 17941, "loss": 2.0328, "learning_rate": 9.92342765853972e-05, "epoch": 0.07156791706147929, "percentage": 7.16, "elapsed_time": "3:02:25", "remaining_time": "1 day, 15:26:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1285, "total_steps": 17941, "loss": 1.7766, "learning_rate": 9.923272344095169e-05, "epoch": 0.07162365531464245, "percentage": 7.16, "elapsed_time": "3:02:33", "remaining_time": "1 day, 15:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1286, "total_steps": 17941, "loss": 1.9544, "learning_rate": 9.923116873513125e-05, "epoch": 0.07167939356780559, "percentage": 7.17, "elapsed_time": "3:02:42", "remaining_time": "1 day, 15:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1287, "total_steps": 17941, "loss": 1.6245, "learning_rate": 9.922961246798516e-05, "epoch": 0.07173513182096873, "percentage": 7.17, "elapsed_time": "3:02:50", "remaining_time": "1 day, 15:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1288, "total_steps": 17941, "loss": 1.8113, "learning_rate": 9.922805463956282e-05, "epoch": 0.07179087007413187, "percentage": 7.18, "elapsed_time": "3:02:58", "remaining_time": "1 day, 15:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1289, "total_steps": 17941, "loss": 1.5682, "learning_rate": 9.922649524991359e-05, "epoch": 0.07184660832729502, "percentage": 7.18, "elapsed_time": "3:03:07", "remaining_time": "1 day, 15:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 17941, "loss": 1.7724, "learning_rate": 9.922493429908695e-05, "epoch": 0.07190234658045817, "percentage": 7.19, "elapsed_time": "3:03:15", "remaining_time": "1 day, 15:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1291, "total_steps": 17941, "loss": 1.8775, "learning_rate": 9.922337178713238e-05, "epoch": 0.07195808483362132, "percentage": 7.2, "elapsed_time": "3:03:24", "remaining_time": "1 day, 15:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1292, "total_steps": 17941, "loss": 1.6585, "learning_rate": 9.922180771409945e-05, "epoch": 0.07201382308678446, "percentage": 7.2, "elapsed_time": "3:03:33", "remaining_time": "1 day, 15:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1293, "total_steps": 17941, "loss": 1.7811, "learning_rate": 9.922024208003777e-05, "epoch": 0.0720695613399476, "percentage": 7.21, "elapsed_time": "3:03:41", "remaining_time": "1 day, 15:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1294, "total_steps": 17941, "loss": 1.5123, "learning_rate": 9.921867488499699e-05, "epoch": 0.07212529959311076, "percentage": 7.21, "elapsed_time": "3:03:50", "remaining_time": "1 day, 15:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1295, "total_steps": 17941, "loss": 1.798, "learning_rate": 9.92171061290268e-05, "epoch": 0.0721810378462739, "percentage": 7.22, "elapsed_time": "3:03:58", "remaining_time": "1 day, 15:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1296, "total_steps": 17941, "loss": 1.8681, "learning_rate": 9.921553581217697e-05, "epoch": 0.07223677609943704, "percentage": 7.22, "elapsed_time": "3:04:07", "remaining_time": "1 day, 15:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1297, "total_steps": 17941, "loss": 1.5803, "learning_rate": 9.921396393449727e-05, "epoch": 0.07229251435260019, "percentage": 7.23, "elapsed_time": "3:04:15", "remaining_time": "1 day, 15:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1298, "total_steps": 17941, "loss": 1.8512, "learning_rate": 9.921239049603759e-05, "epoch": 0.07234825260576333, "percentage": 7.23, "elapsed_time": "3:04:24", "remaining_time": "1 day, 15:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1299, "total_steps": 17941, "loss": 1.9001, "learning_rate": 9.921081549684779e-05, "epoch": 0.07240399085892649, "percentage": 7.24, "elapsed_time": "3:04:32", "remaining_time": "1 day, 15:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 17941, "loss": 1.718, "learning_rate": 9.920923893697786e-05, "epoch": 0.07245972911208963, "percentage": 7.25, "elapsed_time": "3:04:41", "remaining_time": "1 day, 15:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1301, "total_steps": 17941, "loss": 1.6531, "learning_rate": 9.920766081647779e-05, "epoch": 0.07251546736525277, "percentage": 7.25, "elapsed_time": "3:04:49", "remaining_time": "1 day, 15:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1302, "total_steps": 17941, "loss": 1.6522, "learning_rate": 9.92060811353976e-05, "epoch": 0.07257120561841592, "percentage": 7.26, "elapsed_time": "3:04:58", "remaining_time": "1 day, 15:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1303, "total_steps": 17941, "loss": 1.5131, "learning_rate": 9.920449989378742e-05, "epoch": 0.07262694387157906, "percentage": 7.26, "elapsed_time": "3:05:07", "remaining_time": "1 day, 15:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1304, "total_steps": 17941, "loss": 1.5922, "learning_rate": 9.920291709169737e-05, "epoch": 0.07268268212474222, "percentage": 7.27, "elapsed_time": "3:05:15", "remaining_time": "1 day, 15:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1305, "total_steps": 17941, "loss": 1.83, "learning_rate": 9.920133272917767e-05, "epoch": 0.07273842037790536, "percentage": 7.27, "elapsed_time": "3:05:24", "remaining_time": "1 day, 15:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1306, "total_steps": 17941, "loss": 1.8742, "learning_rate": 9.919974680627856e-05, "epoch": 0.0727941586310685, "percentage": 7.28, "elapsed_time": "3:05:33", "remaining_time": "1 day, 15:23:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1307, "total_steps": 17941, "loss": 1.8706, "learning_rate": 9.919815932305034e-05, "epoch": 0.07284989688423164, "percentage": 7.28, "elapsed_time": "3:05:42", "remaining_time": "1 day, 15:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1308, "total_steps": 17941, "loss": 1.6827, "learning_rate": 9.919657027954335e-05, "epoch": 0.0729056351373948, "percentage": 7.29, "elapsed_time": "3:05:51", "remaining_time": "1 day, 15:23:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1309, "total_steps": 17941, "loss": 1.7064, "learning_rate": 9.919497967580798e-05, "epoch": 0.07296137339055794, "percentage": 7.3, "elapsed_time": "3:05:59", "remaining_time": "1 day, 15:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 17941, "loss": 1.7643, "learning_rate": 9.919338751189468e-05, "epoch": 0.07301711164372109, "percentage": 7.3, "elapsed_time": "3:06:08", "remaining_time": "1 day, 15:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1311, "total_steps": 17941, "loss": 1.928, "learning_rate": 9.919179378785396e-05, "epoch": 0.07307284989688423, "percentage": 7.31, "elapsed_time": "3:06:16", "remaining_time": "1 day, 15:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1312, "total_steps": 17941, "loss": 2.0754, "learning_rate": 9.919019850373635e-05, "epoch": 0.07312858815004737, "percentage": 7.31, "elapsed_time": "3:06:25", "remaining_time": "1 day, 15:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1313, "total_steps": 17941, "loss": 1.652, "learning_rate": 9.918860165959243e-05, "epoch": 0.07318432640321053, "percentage": 7.32, "elapsed_time": "3:06:33", "remaining_time": "1 day, 15:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1314, "total_steps": 17941, "loss": 1.9413, "learning_rate": 9.918700325547286e-05, "epoch": 0.07324006465637367, "percentage": 7.32, "elapsed_time": "3:06:42", "remaining_time": "1 day, 15:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1315, "total_steps": 17941, "loss": 1.7279, "learning_rate": 9.918540329142831e-05, "epoch": 0.07329580290953681, "percentage": 7.33, "elapsed_time": "3:06:51", "remaining_time": "1 day, 15:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1316, "total_steps": 17941, "loss": 1.7546, "learning_rate": 9.918380176750955e-05, "epoch": 0.07335154116269996, "percentage": 7.34, "elapsed_time": "3:07:00", "remaining_time": "1 day, 15:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1317, "total_steps": 17941, "loss": 1.657, "learning_rate": 9.918219868376737e-05, "epoch": 0.07340727941586311, "percentage": 7.34, "elapsed_time": "3:07:08", "remaining_time": "1 day, 15:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1318, "total_steps": 17941, "loss": 1.8728, "learning_rate": 9.91805940402526e-05, "epoch": 0.07346301766902626, "percentage": 7.35, "elapsed_time": "3:07:16", "remaining_time": "1 day, 15:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1319, "total_steps": 17941, "loss": 2.008, "learning_rate": 9.917898783701612e-05, "epoch": 0.0735187559221894, "percentage": 7.35, "elapsed_time": "3:07:25", "remaining_time": "1 day, 15:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 17941, "loss": 1.6254, "learning_rate": 9.917738007410888e-05, "epoch": 0.07357449417535254, "percentage": 7.36, "elapsed_time": "3:07:33", "remaining_time": "1 day, 15:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1321, "total_steps": 17941, "loss": 2.0478, "learning_rate": 9.917577075158186e-05, "epoch": 0.07363023242851569, "percentage": 7.36, "elapsed_time": "3:07:42", "remaining_time": "1 day, 15:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1322, "total_steps": 17941, "loss": 1.8852, "learning_rate": 9.917415986948612e-05, "epoch": 0.07368597068167884, "percentage": 7.37, "elapsed_time": "3:07:50", "remaining_time": "1 day, 15:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1323, "total_steps": 17941, "loss": 1.5704, "learning_rate": 9.917254742787273e-05, "epoch": 0.07374170893484198, "percentage": 7.37, "elapsed_time": "3:07:59", "remaining_time": "1 day, 15:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1324, "total_steps": 17941, "loss": 1.6683, "learning_rate": 9.917093342679284e-05, "epoch": 0.07379744718800513, "percentage": 7.38, "elapsed_time": "3:08:07", "remaining_time": "1 day, 15:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1325, "total_steps": 17941, "loss": 1.6127, "learning_rate": 9.916931786629761e-05, "epoch": 0.07385318544116827, "percentage": 7.39, "elapsed_time": "3:08:16", "remaining_time": "1 day, 15:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1326, "total_steps": 17941, "loss": 1.8274, "learning_rate": 9.916770074643831e-05, "epoch": 0.07390892369433141, "percentage": 7.39, "elapsed_time": "3:08:24", "remaining_time": "1 day, 15:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1327, "total_steps": 17941, "loss": 1.7747, "learning_rate": 9.91660820672662e-05, "epoch": 0.07396466194749457, "percentage": 7.4, "elapsed_time": "3:08:32", "remaining_time": "1 day, 15:20:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1328, "total_steps": 17941, "loss": 1.8716, "learning_rate": 9.916446182883264e-05, "epoch": 0.07402040020065771, "percentage": 7.4, "elapsed_time": "3:08:41", "remaining_time": "1 day, 15:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1329, "total_steps": 17941, "loss": 1.572, "learning_rate": 9.916284003118897e-05, "epoch": 0.07407613845382086, "percentage": 7.41, "elapsed_time": "3:08:49", "remaining_time": "1 day, 15:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 17941, "loss": 1.852, "learning_rate": 9.916121667438667e-05, "epoch": 0.074131876706984, "percentage": 7.41, "elapsed_time": "3:08:58", "remaining_time": "1 day, 15:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1331, "total_steps": 17941, "loss": 1.8053, "learning_rate": 9.915959175847723e-05, "epoch": 0.07418761496014716, "percentage": 7.42, "elapsed_time": "3:09:07", "remaining_time": "1 day, 15:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1332, "total_steps": 17941, "loss": 1.9061, "learning_rate": 9.915796528351212e-05, "epoch": 0.0742433532133103, "percentage": 7.42, "elapsed_time": "3:09:15", "remaining_time": "1 day, 15:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1333, "total_steps": 17941, "loss": 1.8031, "learning_rate": 9.915633724954299e-05, "epoch": 0.07429909146647344, "percentage": 7.43, "elapsed_time": "3:09:24", "remaining_time": "1 day, 15:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1334, "total_steps": 17941, "loss": 1.7918, "learning_rate": 9.915470765662143e-05, "epoch": 0.07435482971963658, "percentage": 7.44, "elapsed_time": "3:09:32", "remaining_time": "1 day, 15:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1335, "total_steps": 17941, "loss": 1.7687, "learning_rate": 9.915307650479914e-05, "epoch": 0.07441056797279973, "percentage": 7.44, "elapsed_time": "3:09:41", "remaining_time": "1 day, 15:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1336, "total_steps": 17941, "loss": 1.6509, "learning_rate": 9.915144379412784e-05, "epoch": 0.07446630622596288, "percentage": 7.45, "elapsed_time": "3:09:49", "remaining_time": "1 day, 15:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1337, "total_steps": 17941, "loss": 1.7922, "learning_rate": 9.914980952465932e-05, "epoch": 0.07452204447912603, "percentage": 7.45, "elapsed_time": "3:09:58", "remaining_time": "1 day, 15:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1338, "total_steps": 17941, "loss": 1.6475, "learning_rate": 9.91481736964454e-05, "epoch": 0.07457778273228917, "percentage": 7.46, "elapsed_time": "3:10:07", "remaining_time": "1 day, 15:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1339, "total_steps": 17941, "loss": 1.9451, "learning_rate": 9.914653630953797e-05, "epoch": 0.07463352098545231, "percentage": 7.46, "elapsed_time": "3:10:15", "remaining_time": "1 day, 15:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 17941, "loss": 1.6014, "learning_rate": 9.914489736398895e-05, "epoch": 0.07468925923861547, "percentage": 7.47, "elapsed_time": "3:10:24", "remaining_time": "1 day, 15:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1341, "total_steps": 17941, "loss": 1.7206, "learning_rate": 9.914325685985033e-05, "epoch": 0.07474499749177861, "percentage": 7.47, "elapsed_time": "3:10:32", "remaining_time": "1 day, 15:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1342, "total_steps": 17941, "loss": 1.984, "learning_rate": 9.914161479717413e-05, "epoch": 0.07480073574494175, "percentage": 7.48, "elapsed_time": "3:10:40", "remaining_time": "1 day, 15:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1343, "total_steps": 17941, "loss": 1.8535, "learning_rate": 9.91399711760124e-05, "epoch": 0.0748564739981049, "percentage": 7.49, "elapsed_time": "3:10:49", "remaining_time": "1 day, 15:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1344, "total_steps": 17941, "loss": 1.7632, "learning_rate": 9.91383259964173e-05, "epoch": 0.07491221225126804, "percentage": 7.49, "elapsed_time": "3:10:58", "remaining_time": "1 day, 15:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1345, "total_steps": 17941, "loss": 2.0607, "learning_rate": 9.9136679258441e-05, "epoch": 0.0749679505044312, "percentage": 7.5, "elapsed_time": "3:11:07", "remaining_time": "1 day, 15:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1346, "total_steps": 17941, "loss": 1.914, "learning_rate": 9.913503096213572e-05, "epoch": 0.07502368875759434, "percentage": 7.5, "elapsed_time": "3:11:16", "remaining_time": "1 day, 15:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1347, "total_steps": 17941, "loss": 1.8349, "learning_rate": 9.913338110755375e-05, "epoch": 0.07507942701075748, "percentage": 7.51, "elapsed_time": "3:11:25", "remaining_time": "1 day, 15:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1348, "total_steps": 17941, "loss": 1.5673, "learning_rate": 9.913172969474737e-05, "epoch": 0.07513516526392063, "percentage": 7.51, "elapsed_time": "3:11:33", "remaining_time": "1 day, 15:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1349, "total_steps": 17941, "loss": 2.1014, "learning_rate": 9.913007672376899e-05, "epoch": 0.07519090351708377, "percentage": 7.52, "elapsed_time": "3:11:42", "remaining_time": "1 day, 15:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 17941, "loss": 1.6999, "learning_rate": 9.912842219467105e-05, "epoch": 0.07524664177024692, "percentage": 7.52, "elapsed_time": "3:11:50", "remaining_time": "1 day, 15:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1351, "total_steps": 17941, "loss": 1.9367, "learning_rate": 9.912676610750598e-05, "epoch": 0.07530238002341007, "percentage": 7.53, "elapsed_time": "3:11:59", "remaining_time": "1 day, 15:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1352, "total_steps": 17941, "loss": 1.8136, "learning_rate": 9.91251084623263e-05, "epoch": 0.07535811827657321, "percentage": 7.54, "elapsed_time": "3:12:08", "remaining_time": "1 day, 15:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1353, "total_steps": 17941, "loss": 1.7309, "learning_rate": 9.912344925918462e-05, "epoch": 0.07541385652973635, "percentage": 7.54, "elapsed_time": "3:12:16", "remaining_time": "1 day, 15:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1354, "total_steps": 17941, "loss": 1.2918, "learning_rate": 9.912178849813353e-05, "epoch": 0.07546959478289951, "percentage": 7.55, "elapsed_time": "3:12:25", "remaining_time": "1 day, 15:17:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1355, "total_steps": 17941, "loss": 1.8673, "learning_rate": 9.91201261792257e-05, "epoch": 0.07552533303606265, "percentage": 7.55, "elapsed_time": "3:12:33", "remaining_time": "1 day, 15:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1356, "total_steps": 17941, "loss": 1.6275, "learning_rate": 9.911846230251388e-05, "epoch": 0.0755810712892258, "percentage": 7.56, "elapsed_time": "3:12:42", "remaining_time": "1 day, 15:16:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1357, "total_steps": 17941, "loss": 1.7718, "learning_rate": 9.91167968680508e-05, "epoch": 0.07563680954238894, "percentage": 7.56, "elapsed_time": "3:12:50", "remaining_time": "1 day, 15:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1358, "total_steps": 17941, "loss": 1.7842, "learning_rate": 9.911512987588932e-05, "epoch": 0.07569254779555208, "percentage": 7.57, "elapsed_time": "3:12:59", "remaining_time": "1 day, 15:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1359, "total_steps": 17941, "loss": 1.5556, "learning_rate": 9.911346132608225e-05, "epoch": 0.07574828604871524, "percentage": 7.57, "elapsed_time": "3:13:08", "remaining_time": "1 day, 15:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 17941, "loss": 1.853, "learning_rate": 9.911179121868255e-05, "epoch": 0.07580402430187838, "percentage": 7.58, "elapsed_time": "3:13:16", "remaining_time": "1 day, 15:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1361, "total_steps": 17941, "loss": 1.646, "learning_rate": 9.911011955374316e-05, "epoch": 0.07585976255504152, "percentage": 7.59, "elapsed_time": "3:13:25", "remaining_time": "1 day, 15:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1362, "total_steps": 17941, "loss": 1.6188, "learning_rate": 9.910844633131713e-05, "epoch": 0.07591550080820467, "percentage": 7.59, "elapsed_time": "3:13:33", "remaining_time": "1 day, 15:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1363, "total_steps": 17941, "loss": 1.9164, "learning_rate": 9.91067715514575e-05, "epoch": 0.07597123906136782, "percentage": 7.6, "elapsed_time": "3:13:42", "remaining_time": "1 day, 15:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1364, "total_steps": 17941, "loss": 1.9139, "learning_rate": 9.910509521421738e-05, "epoch": 0.07602697731453097, "percentage": 7.6, "elapsed_time": "3:13:50", "remaining_time": "1 day, 15:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1365, "total_steps": 17941, "loss": 1.8488, "learning_rate": 9.910341731964996e-05, "epoch": 0.07608271556769411, "percentage": 7.61, "elapsed_time": "3:13:58", "remaining_time": "1 day, 15:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1366, "total_steps": 17941, "loss": 1.8503, "learning_rate": 9.910173786780842e-05, "epoch": 0.07613845382085725, "percentage": 7.61, "elapsed_time": "3:14:07", "remaining_time": "1 day, 15:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1367, "total_steps": 17941, "loss": 1.7051, "learning_rate": 9.910005685874603e-05, "epoch": 0.0761941920740204, "percentage": 7.62, "elapsed_time": "3:14:15", "remaining_time": "1 day, 15:15:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1368, "total_steps": 17941, "loss": 1.4925, "learning_rate": 9.909837429251614e-05, "epoch": 0.07624993032718355, "percentage": 7.62, "elapsed_time": "3:14:24", "remaining_time": "1 day, 15:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1369, "total_steps": 17941, "loss": 1.5833, "learning_rate": 9.909669016917204e-05, "epoch": 0.0763056685803467, "percentage": 7.63, "elapsed_time": "3:14:32", "remaining_time": "1 day, 15:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 17941, "loss": 2.1295, "learning_rate": 9.909500448876721e-05, "epoch": 0.07636140683350984, "percentage": 7.64, "elapsed_time": "3:14:41", "remaining_time": "1 day, 15:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1371, "total_steps": 17941, "loss": 1.862, "learning_rate": 9.909331725135509e-05, "epoch": 0.07641714508667298, "percentage": 7.64, "elapsed_time": "3:14:49", "remaining_time": "1 day, 15:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1372, "total_steps": 17941, "loss": 1.7541, "learning_rate": 9.909162845698916e-05, "epoch": 0.07647288333983612, "percentage": 7.65, "elapsed_time": "3:14:58", "remaining_time": "1 day, 15:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1373, "total_steps": 17941, "loss": 1.7944, "learning_rate": 9.9089938105723e-05, "epoch": 0.07652862159299928, "percentage": 7.65, "elapsed_time": "3:15:06", "remaining_time": "1 day, 15:14:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1374, "total_steps": 17941, "loss": 1.8207, "learning_rate": 9.908824619761023e-05, "epoch": 0.07658435984616242, "percentage": 7.66, "elapsed_time": "3:15:15", "remaining_time": "1 day, 15:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1375, "total_steps": 17941, "loss": 1.8224, "learning_rate": 9.908655273270449e-05, "epoch": 0.07664009809932557, "percentage": 7.66, "elapsed_time": "3:15:23", "remaining_time": "1 day, 15:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1376, "total_steps": 17941, "loss": 1.856, "learning_rate": 9.908485771105949e-05, "epoch": 0.07669583635248871, "percentage": 7.67, "elapsed_time": "3:15:32", "remaining_time": "1 day, 15:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1377, "total_steps": 17941, "loss": 1.7791, "learning_rate": 9.908316113272897e-05, "epoch": 0.07675157460565186, "percentage": 7.68, "elapsed_time": "3:15:41", "remaining_time": "1 day, 15:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1378, "total_steps": 17941, "loss": 1.7608, "learning_rate": 9.908146299776678e-05, "epoch": 0.07680731285881501, "percentage": 7.68, "elapsed_time": "3:15:49", "remaining_time": "1 day, 15:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1379, "total_steps": 17941, "loss": 1.772, "learning_rate": 9.907976330622674e-05, "epoch": 0.07686305111197815, "percentage": 7.69, "elapsed_time": "3:15:58", "remaining_time": "1 day, 15:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 17941, "loss": 1.2319, "learning_rate": 9.907806205816277e-05, "epoch": 0.0769187893651413, "percentage": 7.69, "elapsed_time": "3:16:06", "remaining_time": "1 day, 15:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1381, "total_steps": 17941, "loss": 1.676, "learning_rate": 9.90763592536288e-05, "epoch": 0.07697452761830444, "percentage": 7.7, "elapsed_time": "3:16:15", "remaining_time": "1 day, 15:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1382, "total_steps": 17941, "loss": 1.7612, "learning_rate": 9.907465489267886e-05, "epoch": 0.0770302658714676, "percentage": 7.7, "elapsed_time": "3:16:24", "remaining_time": "1 day, 15:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1383, "total_steps": 17941, "loss": 1.8883, "learning_rate": 9.907294897536699e-05, "epoch": 0.07708600412463074, "percentage": 7.71, "elapsed_time": "3:16:33", "remaining_time": "1 day, 15:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1384, "total_steps": 17941, "loss": 1.8195, "learning_rate": 9.90712415017473e-05, "epoch": 0.07714174237779388, "percentage": 7.71, "elapsed_time": "3:16:42", "remaining_time": "1 day, 15:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1385, "total_steps": 17941, "loss": 1.765, "learning_rate": 9.906953247187392e-05, "epoch": 0.07719748063095702, "percentage": 7.72, "elapsed_time": "3:16:50", "remaining_time": "1 day, 15:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1386, "total_steps": 17941, "loss": 1.5199, "learning_rate": 9.906782188580107e-05, "epoch": 0.07725321888412018, "percentage": 7.73, "elapsed_time": "3:16:59", "remaining_time": "1 day, 15:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1387, "total_steps": 17941, "loss": 2.1369, "learning_rate": 9.9066109743583e-05, "epoch": 0.07730895713728332, "percentage": 7.73, "elapsed_time": "3:17:07", "remaining_time": "1 day, 15:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1388, "total_steps": 17941, "loss": 1.6941, "learning_rate": 9.9064396045274e-05, "epoch": 0.07736469539044646, "percentage": 7.74, "elapsed_time": "3:17:16", "remaining_time": "1 day, 15:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1389, "total_steps": 17941, "loss": 1.7395, "learning_rate": 9.906268079092843e-05, "epoch": 0.0774204336436096, "percentage": 7.74, "elapsed_time": "3:17:24", "remaining_time": "1 day, 15:12:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 17941, "loss": 1.7771, "learning_rate": 9.906096398060067e-05, "epoch": 0.07747617189677275, "percentage": 7.75, "elapsed_time": "3:17:33", "remaining_time": "1 day, 15:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1391, "total_steps": 17941, "loss": 1.8375, "learning_rate": 9.905924561434519e-05, "epoch": 0.0775319101499359, "percentage": 7.75, "elapsed_time": "3:17:41", "remaining_time": "1 day, 15:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1392, "total_steps": 17941, "loss": 1.4259, "learning_rate": 9.905752569221647e-05, "epoch": 0.07758764840309905, "percentage": 7.76, "elapsed_time": "3:17:49", "remaining_time": "1 day, 15:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1393, "total_steps": 17941, "loss": 1.7302, "learning_rate": 9.905580421426905e-05, "epoch": 0.07764338665626219, "percentage": 7.76, "elapsed_time": "3:17:58", "remaining_time": "1 day, 15:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1394, "total_steps": 17941, "loss": 1.665, "learning_rate": 9.905408118055755e-05, "epoch": 0.07769912490942534, "percentage": 7.77, "elapsed_time": "3:18:06", "remaining_time": "1 day, 15:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1395, "total_steps": 17941, "loss": 1.7589, "learning_rate": 9.905235659113658e-05, "epoch": 0.07775486316258848, "percentage": 7.78, "elapsed_time": "3:18:15", "remaining_time": "1 day, 15:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1396, "total_steps": 17941, "loss": 1.9677, "learning_rate": 9.905063044606088e-05, "epoch": 0.07781060141575163, "percentage": 7.78, "elapsed_time": "3:18:23", "remaining_time": "1 day, 15:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1397, "total_steps": 17941, "loss": 1.6438, "learning_rate": 9.904890274538516e-05, "epoch": 0.07786633966891478, "percentage": 7.79, "elapsed_time": "3:18:32", "remaining_time": "1 day, 15:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1398, "total_steps": 17941, "loss": 1.8672, "learning_rate": 9.904717348916421e-05, "epoch": 0.07792207792207792, "percentage": 7.79, "elapsed_time": "3:18:40", "remaining_time": "1 day, 15:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1399, "total_steps": 17941, "loss": 1.6942, "learning_rate": 9.904544267745288e-05, "epoch": 0.07797781617524106, "percentage": 7.8, "elapsed_time": "3:18:49", "remaining_time": "1 day, 15:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 17941, "loss": 2.0127, "learning_rate": 9.904371031030608e-05, "epoch": 0.07803355442840422, "percentage": 7.8, "elapsed_time": "3:18:57", "remaining_time": "1 day, 15:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1401, "total_steps": 17941, "loss": 1.6781, "learning_rate": 9.904197638777872e-05, "epoch": 0.07808929268156736, "percentage": 7.81, "elapsed_time": "3:19:06", "remaining_time": "1 day, 15:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1402, "total_steps": 17941, "loss": 1.7314, "learning_rate": 9.904024090992581e-05, "epoch": 0.0781450309347305, "percentage": 7.81, "elapsed_time": "3:19:14", "remaining_time": "1 day, 15:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1403, "total_steps": 17941, "loss": 1.8782, "learning_rate": 9.903850387680238e-05, "epoch": 0.07820076918789365, "percentage": 7.82, "elapsed_time": "3:19:23", "remaining_time": "1 day, 15:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1404, "total_steps": 17941, "loss": 1.9028, "learning_rate": 9.903676528846352e-05, "epoch": 0.07825650744105679, "percentage": 7.83, "elapsed_time": "3:19:31", "remaining_time": "1 day, 15:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1405, "total_steps": 17941, "loss": 1.6501, "learning_rate": 9.903502514496436e-05, "epoch": 0.07831224569421995, "percentage": 7.83, "elapsed_time": "3:19:39", "remaining_time": "1 day, 15:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1406, "total_steps": 17941, "loss": 1.7873, "learning_rate": 9.903328344636012e-05, "epoch": 0.07836798394738309, "percentage": 7.84, "elapsed_time": "3:19:48", "remaining_time": "1 day, 15:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1407, "total_steps": 17941, "loss": 1.6404, "learning_rate": 9.903154019270599e-05, "epoch": 0.07842372220054623, "percentage": 7.84, "elapsed_time": "3:19:56", "remaining_time": "1 day, 15:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1408, "total_steps": 17941, "loss": 1.8049, "learning_rate": 9.90297953840573e-05, "epoch": 0.07847946045370938, "percentage": 7.85, "elapsed_time": "3:20:05", "remaining_time": "1 day, 15:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1409, "total_steps": 17941, "loss": 1.8979, "learning_rate": 9.902804902046935e-05, "epoch": 0.07853519870687253, "percentage": 7.85, "elapsed_time": "3:20:14", "remaining_time": "1 day, 15:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 17941, "loss": 1.5322, "learning_rate": 9.902630110199753e-05, "epoch": 0.07859093696003568, "percentage": 7.86, "elapsed_time": "3:20:23", "remaining_time": "1 day, 15:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1411, "total_steps": 17941, "loss": 1.8126, "learning_rate": 9.90245516286973e-05, "epoch": 0.07864667521319882, "percentage": 7.86, "elapsed_time": "3:20:31", "remaining_time": "1 day, 15:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1412, "total_steps": 17941, "loss": 1.9197, "learning_rate": 9.902280060062413e-05, "epoch": 0.07870241346636196, "percentage": 7.87, "elapsed_time": "3:20:40", "remaining_time": "1 day, 15:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1413, "total_steps": 17941, "loss": 2.0767, "learning_rate": 9.902104801783352e-05, "epoch": 0.0787581517195251, "percentage": 7.88, "elapsed_time": "3:20:49", "remaining_time": "1 day, 15:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1414, "total_steps": 17941, "loss": 1.4594, "learning_rate": 9.90192938803811e-05, "epoch": 0.07881388997268826, "percentage": 7.88, "elapsed_time": "3:20:57", "remaining_time": "1 day, 15:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1415, "total_steps": 17941, "loss": 1.6394, "learning_rate": 9.901753818832248e-05, "epoch": 0.0788696282258514, "percentage": 7.89, "elapsed_time": "3:21:06", "remaining_time": "1 day, 15:08:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1416, "total_steps": 17941, "loss": 1.6963, "learning_rate": 9.901578094171333e-05, "epoch": 0.07892536647901455, "percentage": 7.89, "elapsed_time": "3:21:14", "remaining_time": "1 day, 15:08:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1417, "total_steps": 17941, "loss": 1.5721, "learning_rate": 9.90140221406094e-05, "epoch": 0.07898110473217769, "percentage": 7.9, "elapsed_time": "3:21:23", "remaining_time": "1 day, 15:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1418, "total_steps": 17941, "loss": 1.7414, "learning_rate": 9.901226178506646e-05, "epoch": 0.07903684298534083, "percentage": 7.9, "elapsed_time": "3:21:31", "remaining_time": "1 day, 15:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1419, "total_steps": 17941, "loss": 1.7728, "learning_rate": 9.901049987514033e-05, "epoch": 0.07909258123850399, "percentage": 7.91, "elapsed_time": "3:21:40", "remaining_time": "1 day, 15:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 17941, "loss": 1.8569, "learning_rate": 9.90087364108869e-05, "epoch": 0.07914831949166713, "percentage": 7.91, "elapsed_time": "3:21:48", "remaining_time": "1 day, 15:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1421, "total_steps": 17941, "loss": 1.7734, "learning_rate": 9.900697139236209e-05, "epoch": 0.07920405774483028, "percentage": 7.92, "elapsed_time": "3:21:57", "remaining_time": "1 day, 15:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1422, "total_steps": 17941, "loss": 1.6859, "learning_rate": 9.900520481962188e-05, "epoch": 0.07925979599799342, "percentage": 7.93, "elapsed_time": "3:22:05", "remaining_time": "1 day, 15:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1423, "total_steps": 17941, "loss": 1.7148, "learning_rate": 9.90034366927223e-05, "epoch": 0.07931553425115657, "percentage": 7.93, "elapsed_time": "3:22:14", "remaining_time": "1 day, 15:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1424, "total_steps": 17941, "loss": 1.7605, "learning_rate": 9.90016670117194e-05, "epoch": 0.07937127250431972, "percentage": 7.94, "elapsed_time": "3:22:22", "remaining_time": "1 day, 15:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1425, "total_steps": 17941, "loss": 1.7824, "learning_rate": 9.899989577666933e-05, "epoch": 0.07942701075748286, "percentage": 7.94, "elapsed_time": "3:22:30", "remaining_time": "1 day, 15:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1426, "total_steps": 17941, "loss": 1.8003, "learning_rate": 9.899812298762826e-05, "epoch": 0.079482749010646, "percentage": 7.95, "elapsed_time": "3:22:39", "remaining_time": "1 day, 15:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1427, "total_steps": 17941, "loss": 1.7588, "learning_rate": 9.899634864465241e-05, "epoch": 0.07953848726380915, "percentage": 7.95, "elapsed_time": "3:22:48", "remaining_time": "1 day, 15:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1428, "total_steps": 17941, "loss": 1.7284, "learning_rate": 9.899457274779804e-05, "epoch": 0.0795942255169723, "percentage": 7.96, "elapsed_time": "3:22:56", "remaining_time": "1 day, 15:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1429, "total_steps": 17941, "loss": 1.9947, "learning_rate": 9.899279529712148e-05, "epoch": 0.07964996377013545, "percentage": 7.96, "elapsed_time": "3:23:05", "remaining_time": "1 day, 15:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 17941, "loss": 1.5956, "learning_rate": 9.899101629267911e-05, "epoch": 0.07970570202329859, "percentage": 7.97, "elapsed_time": "3:23:13", "remaining_time": "1 day, 15:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1431, "total_steps": 17941, "loss": 2.0396, "learning_rate": 9.898923573452734e-05, "epoch": 0.07976144027646173, "percentage": 7.98, "elapsed_time": "3:23:22", "remaining_time": "1 day, 15:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1432, "total_steps": 17941, "loss": 1.5054, "learning_rate": 9.898745362272264e-05, "epoch": 0.07981717852962489, "percentage": 7.98, "elapsed_time": "3:23:30", "remaining_time": "1 day, 15:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1433, "total_steps": 17941, "loss": 1.6304, "learning_rate": 9.898566995732153e-05, "epoch": 0.07987291678278803, "percentage": 7.99, "elapsed_time": "3:23:39", "remaining_time": "1 day, 15:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1434, "total_steps": 17941, "loss": 1.8177, "learning_rate": 9.898388473838056e-05, "epoch": 0.07992865503595117, "percentage": 7.99, "elapsed_time": "3:23:47", "remaining_time": "1 day, 15:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1435, "total_steps": 17941, "loss": 1.7325, "learning_rate": 9.898209796595636e-05, "epoch": 0.07998439328911432, "percentage": 8.0, "elapsed_time": "3:23:55", "remaining_time": "1 day, 15:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1436, "total_steps": 17941, "loss": 1.5905, "learning_rate": 9.898030964010562e-05, "epoch": 0.08004013154227746, "percentage": 8.0, "elapsed_time": "3:24:04", "remaining_time": "1 day, 15:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1437, "total_steps": 17941, "loss": 1.672, "learning_rate": 9.897851976088501e-05, "epoch": 0.08009586979544062, "percentage": 8.01, "elapsed_time": "3:24:12", "remaining_time": "1 day, 15:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1438, "total_steps": 17941, "loss": 1.9549, "learning_rate": 9.897672832835135e-05, "epoch": 0.08015160804860376, "percentage": 8.02, "elapsed_time": "3:24:21", "remaining_time": "1 day, 15:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1439, "total_steps": 17941, "loss": 1.7438, "learning_rate": 9.89749353425614e-05, "epoch": 0.0802073463017669, "percentage": 8.02, "elapsed_time": "3:24:29", "remaining_time": "1 day, 15:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 17941, "loss": 1.6437, "learning_rate": 9.897314080357202e-05, "epoch": 0.08026308455493004, "percentage": 8.03, "elapsed_time": "3:24:38", "remaining_time": "1 day, 15:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1441, "total_steps": 17941, "loss": 1.742, "learning_rate": 9.897134471144019e-05, "epoch": 0.08031882280809319, "percentage": 8.03, "elapsed_time": "3:24:47", "remaining_time": "1 day, 15:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1442, "total_steps": 17941, "loss": 1.5031, "learning_rate": 9.896954706622281e-05, "epoch": 0.08037456106125634, "percentage": 8.04, "elapsed_time": "3:24:56", "remaining_time": "1 day, 15:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1443, "total_steps": 17941, "loss": 1.533, "learning_rate": 9.896774786797691e-05, "epoch": 0.08043029931441949, "percentage": 8.04, "elapsed_time": "3:25:04", "remaining_time": "1 day, 15:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1444, "total_steps": 17941, "loss": 2.0242, "learning_rate": 9.896594711675954e-05, "epoch": 0.08048603756758263, "percentage": 8.05, "elapsed_time": "3:25:13", "remaining_time": "1 day, 15:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1445, "total_steps": 17941, "loss": 1.815, "learning_rate": 9.896414481262784e-05, "epoch": 0.08054177582074577, "percentage": 8.05, "elapsed_time": "3:25:21", "remaining_time": "1 day, 15:04:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1446, "total_steps": 17941, "loss": 1.5458, "learning_rate": 9.896234095563893e-05, "epoch": 0.08059751407390893, "percentage": 8.06, "elapsed_time": "3:25:30", "remaining_time": "1 day, 15:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1447, "total_steps": 17941, "loss": 2.1062, "learning_rate": 9.896053554585006e-05, "epoch": 0.08065325232707207, "percentage": 8.07, "elapsed_time": "3:25:38", "remaining_time": "1 day, 15:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1448, "total_steps": 17941, "loss": 1.7228, "learning_rate": 9.895872858331843e-05, "epoch": 0.08070899058023522, "percentage": 8.07, "elapsed_time": "3:25:47", "remaining_time": "1 day, 15:03:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1449, "total_steps": 17941, "loss": 1.8915, "learning_rate": 9.89569200681014e-05, "epoch": 0.08076472883339836, "percentage": 8.08, "elapsed_time": "3:25:55", "remaining_time": "1 day, 15:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 17941, "loss": 1.857, "learning_rate": 9.895511000025629e-05, "epoch": 0.0808204670865615, "percentage": 8.08, "elapsed_time": "3:26:04", "remaining_time": "1 day, 15:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1451, "total_steps": 17941, "loss": 1.7033, "learning_rate": 9.895329837984053e-05, "epoch": 0.08087620533972466, "percentage": 8.09, "elapsed_time": "3:26:12", "remaining_time": "1 day, 15:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1452, "total_steps": 17941, "loss": 1.9076, "learning_rate": 9.895148520691155e-05, "epoch": 0.0809319435928878, "percentage": 8.09, "elapsed_time": "3:26:22", "remaining_time": "1 day, 15:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1453, "total_steps": 17941, "loss": 1.4164, "learning_rate": 9.894967048152688e-05, "epoch": 0.08098768184605094, "percentage": 8.1, "elapsed_time": "3:26:30", "remaining_time": "1 day, 15:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1454, "total_steps": 17941, "loss": 1.9833, "learning_rate": 9.894785420374405e-05, "epoch": 0.08104342009921409, "percentage": 8.1, "elapsed_time": "3:26:39", "remaining_time": "1 day, 15:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1455, "total_steps": 17941, "loss": 1.8342, "learning_rate": 9.894603637362068e-05, "epoch": 0.08109915835237724, "percentage": 8.11, "elapsed_time": "3:26:47", "remaining_time": "1 day, 15:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1456, "total_steps": 17941, "loss": 2.1415, "learning_rate": 9.894421699121439e-05, "epoch": 0.08115489660554039, "percentage": 8.12, "elapsed_time": "3:26:56", "remaining_time": "1 day, 15:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1457, "total_steps": 17941, "loss": 1.8387, "learning_rate": 9.894239605658292e-05, "epoch": 0.08121063485870353, "percentage": 8.12, "elapsed_time": "3:27:04", "remaining_time": "1 day, 15:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1458, "total_steps": 17941, "loss": 1.9307, "learning_rate": 9.8940573569784e-05, "epoch": 0.08126637311186667, "percentage": 8.13, "elapsed_time": "3:27:13", "remaining_time": "1 day, 15:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1459, "total_steps": 17941, "loss": 1.7991, "learning_rate": 9.893874953087543e-05, "epoch": 0.08132211136502981, "percentage": 8.13, "elapsed_time": "3:27:21", "remaining_time": "1 day, 15:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 17941, "loss": 1.7898, "learning_rate": 9.893692393991504e-05, "epoch": 0.08137784961819297, "percentage": 8.14, "elapsed_time": "3:27:29", "remaining_time": "1 day, 15:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1461, "total_steps": 17941, "loss": 1.8955, "learning_rate": 9.893509679696077e-05, "epoch": 0.08143358787135611, "percentage": 8.14, "elapsed_time": "3:27:38", "remaining_time": "1 day, 15:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1462, "total_steps": 17941, "loss": 1.6774, "learning_rate": 9.893326810207053e-05, "epoch": 0.08148932612451926, "percentage": 8.15, "elapsed_time": "3:27:46", "remaining_time": "1 day, 15:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1463, "total_steps": 17941, "loss": 1.5989, "learning_rate": 9.893143785530233e-05, "epoch": 0.0815450643776824, "percentage": 8.15, "elapsed_time": "3:27:55", "remaining_time": "1 day, 15:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1464, "total_steps": 17941, "loss": 1.6129, "learning_rate": 9.892960605671421e-05, "epoch": 0.08160080263084554, "percentage": 8.16, "elapsed_time": "3:28:04", "remaining_time": "1 day, 15:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1465, "total_steps": 17941, "loss": 1.7568, "learning_rate": 9.892777270636426e-05, "epoch": 0.0816565408840087, "percentage": 8.17, "elapsed_time": "3:28:12", "remaining_time": "1 day, 15:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1466, "total_steps": 17941, "loss": 1.5785, "learning_rate": 9.892593780431063e-05, "epoch": 0.08171227913717184, "percentage": 8.17, "elapsed_time": "3:28:21", "remaining_time": "1 day, 15:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1467, "total_steps": 17941, "loss": 1.6021, "learning_rate": 9.892410135061151e-05, "epoch": 0.08176801739033498, "percentage": 8.18, "elapsed_time": "3:28:29", "remaining_time": "1 day, 15:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1468, "total_steps": 17941, "loss": 1.7185, "learning_rate": 9.892226334532515e-05, "epoch": 0.08182375564349813, "percentage": 8.18, "elapsed_time": "3:28:37", "remaining_time": "1 day, 15:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1469, "total_steps": 17941, "loss": 1.7729, "learning_rate": 9.892042378850983e-05, "epoch": 0.08187949389666128, "percentage": 8.19, "elapsed_time": "3:28:46", "remaining_time": "1 day, 15:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 17941, "loss": 1.7497, "learning_rate": 9.89185826802239e-05, "epoch": 0.08193523214982443, "percentage": 8.19, "elapsed_time": "3:28:54", "remaining_time": "1 day, 15:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1471, "total_steps": 17941, "loss": 1.7032, "learning_rate": 9.891674002052572e-05, "epoch": 0.08199097040298757, "percentage": 8.2, "elapsed_time": "3:29:04", "remaining_time": "1 day, 15:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1472, "total_steps": 17941, "loss": 1.697, "learning_rate": 9.891489580947377e-05, "epoch": 0.08204670865615071, "percentage": 8.2, "elapsed_time": "3:29:12", "remaining_time": "1 day, 15:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1473, "total_steps": 17941, "loss": 1.676, "learning_rate": 9.891305004712652e-05, "epoch": 0.08210244690931386, "percentage": 8.21, "elapsed_time": "3:29:21", "remaining_time": "1 day, 15:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1474, "total_steps": 17941, "loss": 1.7862, "learning_rate": 9.891120273354248e-05, "epoch": 0.08215818516247701, "percentage": 8.22, "elapsed_time": "3:29:29", "remaining_time": "1 day, 15:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1475, "total_steps": 17941, "loss": 1.7835, "learning_rate": 9.890935386878029e-05, "epoch": 0.08221392341564016, "percentage": 8.22, "elapsed_time": "3:29:38", "remaining_time": "1 day, 15:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1476, "total_steps": 17941, "loss": 1.9147, "learning_rate": 9.890750345289855e-05, "epoch": 0.0822696616688033, "percentage": 8.23, "elapsed_time": "3:29:46", "remaining_time": "1 day, 15:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1477, "total_steps": 17941, "loss": 1.9944, "learning_rate": 9.890565148595594e-05, "epoch": 0.08232539992196644, "percentage": 8.23, "elapsed_time": "3:29:55", "remaining_time": "1 day, 15:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1478, "total_steps": 17941, "loss": 1.7003, "learning_rate": 9.890379796801122e-05, "epoch": 0.0823811381751296, "percentage": 8.24, "elapsed_time": "3:30:04", "remaining_time": "1 day, 14:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1479, "total_steps": 17941, "loss": 1.5901, "learning_rate": 9.890194289912315e-05, "epoch": 0.08243687642829274, "percentage": 8.24, "elapsed_time": "3:30:12", "remaining_time": "1 day, 14:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 17941, "loss": 1.4628, "learning_rate": 9.890008627935057e-05, "epoch": 0.08249261468145588, "percentage": 8.25, "elapsed_time": "3:30:21", "remaining_time": "1 day, 14:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1481, "total_steps": 17941, "loss": 1.797, "learning_rate": 9.889822810875236e-05, "epoch": 0.08254835293461903, "percentage": 8.25, "elapsed_time": "3:30:29", "remaining_time": "1 day, 14:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1482, "total_steps": 17941, "loss": 1.7715, "learning_rate": 9.889636838738745e-05, "epoch": 0.08260409118778217, "percentage": 8.26, "elapsed_time": "3:30:38", "remaining_time": "1 day, 14:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1483, "total_steps": 17941, "loss": 1.7935, "learning_rate": 9.889450711531482e-05, "epoch": 0.08265982944094533, "percentage": 8.27, "elapsed_time": "3:30:46", "remaining_time": "1 day, 14:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1484, "total_steps": 17941, "loss": 1.7009, "learning_rate": 9.889264429259351e-05, "epoch": 0.08271556769410847, "percentage": 8.27, "elapsed_time": "3:30:54", "remaining_time": "1 day, 14:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1485, "total_steps": 17941, "loss": 1.9159, "learning_rate": 9.889077991928257e-05, "epoch": 0.08277130594727161, "percentage": 8.28, "elapsed_time": "3:31:03", "remaining_time": "1 day, 14:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1486, "total_steps": 17941, "loss": 1.8089, "learning_rate": 9.888891399544116e-05, "epoch": 0.08282704420043475, "percentage": 8.28, "elapsed_time": "3:31:11", "remaining_time": "1 day, 14:58:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1487, "total_steps": 17941, "loss": 1.81, "learning_rate": 9.888704652112841e-05, "epoch": 0.0828827824535979, "percentage": 8.29, "elapsed_time": "3:31:20", "remaining_time": "1 day, 14:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1488, "total_steps": 17941, "loss": 1.8359, "learning_rate": 9.88851774964036e-05, "epoch": 0.08293852070676105, "percentage": 8.29, "elapsed_time": "3:31:28", "remaining_time": "1 day, 14:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1489, "total_steps": 17941, "loss": 1.7542, "learning_rate": 9.8883306921326e-05, "epoch": 0.0829942589599242, "percentage": 8.3, "elapsed_time": "3:31:37", "remaining_time": "1 day, 14:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 17941, "loss": 1.761, "learning_rate": 9.888143479595487e-05, "epoch": 0.08304999721308734, "percentage": 8.3, "elapsed_time": "3:31:45", "remaining_time": "1 day, 14:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1491, "total_steps": 17941, "loss": 1.961, "learning_rate": 9.887956112034965e-05, "epoch": 0.08310573546625048, "percentage": 8.31, "elapsed_time": "3:31:54", "remaining_time": "1 day, 14:57:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1492, "total_steps": 17941, "loss": 1.6075, "learning_rate": 9.887768589456973e-05, "epoch": 0.08316147371941364, "percentage": 8.32, "elapsed_time": "3:32:02", "remaining_time": "1 day, 14:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1493, "total_steps": 17941, "loss": 1.7721, "learning_rate": 9.88758091186746e-05, "epoch": 0.08321721197257678, "percentage": 8.32, "elapsed_time": "3:32:11", "remaining_time": "1 day, 14:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1494, "total_steps": 17941, "loss": 2.0317, "learning_rate": 9.887393079272378e-05, "epoch": 0.08327295022573993, "percentage": 8.33, "elapsed_time": "3:32:20", "remaining_time": "1 day, 14:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1495, "total_steps": 17941, "loss": 1.614, "learning_rate": 9.88720509167768e-05, "epoch": 0.08332868847890307, "percentage": 8.33, "elapsed_time": "3:32:28", "remaining_time": "1 day, 14:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1496, "total_steps": 17941, "loss": 1.7988, "learning_rate": 9.887016949089333e-05, "epoch": 0.08338442673206621, "percentage": 8.34, "elapsed_time": "3:32:37", "remaining_time": "1 day, 14:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1497, "total_steps": 17941, "loss": 1.6694, "learning_rate": 9.886828651513302e-05, "epoch": 0.08344016498522937, "percentage": 8.34, "elapsed_time": "3:32:45", "remaining_time": "1 day, 14:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1498, "total_steps": 17941, "loss": 1.9023, "learning_rate": 9.886640198955557e-05, "epoch": 0.08349590323839251, "percentage": 8.35, "elapsed_time": "3:32:53", "remaining_time": "1 day, 14:56:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1499, "total_steps": 17941, "loss": 1.8974, "learning_rate": 9.886451591422076e-05, "epoch": 0.08355164149155565, "percentage": 8.36, "elapsed_time": "3:33:02", "remaining_time": "1 day, 14:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 17941, "loss": 2.011, "learning_rate": 9.886262828918842e-05, "epoch": 0.0836073797447188, "percentage": 8.36, "elapsed_time": "3:33:10", "remaining_time": "1 day, 14:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1501, "total_steps": 17941, "loss": 1.853, "learning_rate": 9.886073911451838e-05, "epoch": 0.08366311799788195, "percentage": 8.37, "elapsed_time": "3:33:20", "remaining_time": "1 day, 14:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1502, "total_steps": 17941, "loss": 2.0279, "learning_rate": 9.88588483902706e-05, "epoch": 0.0837188562510451, "percentage": 8.37, "elapsed_time": "3:33:28", "remaining_time": "1 day, 14:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1503, "total_steps": 17941, "loss": 1.9006, "learning_rate": 9.8856956116505e-05, "epoch": 0.08377459450420824, "percentage": 8.38, "elapsed_time": "3:33:37", "remaining_time": "1 day, 14:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1504, "total_steps": 17941, "loss": 1.8549, "learning_rate": 9.88550622932816e-05, "epoch": 0.08383033275737138, "percentage": 8.38, "elapsed_time": "3:33:45", "remaining_time": "1 day, 14:56:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1505, "total_steps": 17941, "loss": 1.6991, "learning_rate": 9.885316692066048e-05, "epoch": 0.08388607101053452, "percentage": 8.39, "elapsed_time": "3:33:53", "remaining_time": "1 day, 14:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1506, "total_steps": 17941, "loss": 1.7942, "learning_rate": 9.885126999870173e-05, "epoch": 0.08394180926369768, "percentage": 8.39, "elapsed_time": "3:34:02", "remaining_time": "1 day, 14:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1507, "total_steps": 17941, "loss": 1.7333, "learning_rate": 9.884937152746553e-05, "epoch": 0.08399754751686082, "percentage": 8.4, "elapsed_time": "3:34:10", "remaining_time": "1 day, 14:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1508, "total_steps": 17941, "loss": 1.8288, "learning_rate": 9.884747150701207e-05, "epoch": 0.08405328577002397, "percentage": 8.41, "elapsed_time": "3:34:19", "remaining_time": "1 day, 14:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1509, "total_steps": 17941, "loss": 1.7986, "learning_rate": 9.884556993740161e-05, "epoch": 0.08410902402318711, "percentage": 8.41, "elapsed_time": "3:34:27", "remaining_time": "1 day, 14:55:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 17941, "loss": 1.9335, "learning_rate": 9.884366681869447e-05, "epoch": 0.08416476227635025, "percentage": 8.42, "elapsed_time": "3:34:36", "remaining_time": "1 day, 14:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1511, "total_steps": 17941, "loss": 1.952, "learning_rate": 9.8841762150951e-05, "epoch": 0.08422050052951341, "percentage": 8.42, "elapsed_time": "3:34:44", "remaining_time": "1 day, 14:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1512, "total_steps": 17941, "loss": 1.6983, "learning_rate": 9.883985593423158e-05, "epoch": 0.08427623878267655, "percentage": 8.43, "elapsed_time": "3:34:53", "remaining_time": "1 day, 14:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1513, "total_steps": 17941, "loss": 1.9128, "learning_rate": 9.88379481685967e-05, "epoch": 0.0843319770358397, "percentage": 8.43, "elapsed_time": "3:35:01", "remaining_time": "1 day, 14:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1514, "total_steps": 17941, "loss": 1.8798, "learning_rate": 9.883603885410686e-05, "epoch": 0.08438771528900284, "percentage": 8.44, "elapsed_time": "3:35:11", "remaining_time": "1 day, 14:54:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1515, "total_steps": 17941, "loss": 1.987, "learning_rate": 9.88341279908226e-05, "epoch": 0.084443453542166, "percentage": 8.44, "elapsed_time": "3:35:19", "remaining_time": "1 day, 14:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1516, "total_steps": 17941, "loss": 1.9272, "learning_rate": 9.88322155788045e-05, "epoch": 0.08449919179532914, "percentage": 8.45, "elapsed_time": "3:35:28", "remaining_time": "1 day, 14:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1517, "total_steps": 17941, "loss": 1.747, "learning_rate": 9.883030161811324e-05, "epoch": 0.08455493004849228, "percentage": 8.46, "elapsed_time": "3:35:36", "remaining_time": "1 day, 14:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1518, "total_steps": 17941, "loss": 1.7361, "learning_rate": 9.882838610880954e-05, "epoch": 0.08461066830165542, "percentage": 8.46, "elapsed_time": "3:35:45", "remaining_time": "1 day, 14:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1519, "total_steps": 17941, "loss": 1.7197, "learning_rate": 9.88264690509541e-05, "epoch": 0.08466640655481857, "percentage": 8.47, "elapsed_time": "3:35:53", "remaining_time": "1 day, 14:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 17941, "loss": 1.6553, "learning_rate": 9.882455044460773e-05, "epoch": 0.08472214480798172, "percentage": 8.47, "elapsed_time": "3:36:02", "remaining_time": "1 day, 14:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1521, "total_steps": 17941, "loss": 1.9354, "learning_rate": 9.88226302898313e-05, "epoch": 0.08477788306114487, "percentage": 8.48, "elapsed_time": "3:36:10", "remaining_time": "1 day, 14:53:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1522, "total_steps": 17941, "loss": 1.7173, "learning_rate": 9.882070858668568e-05, "epoch": 0.08483362131430801, "percentage": 8.48, "elapsed_time": "3:36:18", "remaining_time": "1 day, 14:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1523, "total_steps": 17941, "loss": 1.5161, "learning_rate": 9.881878533523185e-05, "epoch": 0.08488935956747115, "percentage": 8.49, "elapsed_time": "3:36:27", "remaining_time": "1 day, 14:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1524, "total_steps": 17941, "loss": 1.4486, "learning_rate": 9.881686053553077e-05, "epoch": 0.08494509782063431, "percentage": 8.49, "elapsed_time": "3:36:35", "remaining_time": "1 day, 14:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1525, "total_steps": 17941, "loss": 1.7378, "learning_rate": 9.88149341876435e-05, "epoch": 0.08500083607379745, "percentage": 8.5, "elapsed_time": "3:36:44", "remaining_time": "1 day, 14:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1526, "total_steps": 17941, "loss": 1.7466, "learning_rate": 9.881300629163113e-05, "epoch": 0.0850565743269606, "percentage": 8.51, "elapsed_time": "3:36:52", "remaining_time": "1 day, 14:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1527, "total_steps": 17941, "loss": 2.05, "learning_rate": 9.88110768475548e-05, "epoch": 0.08511231258012374, "percentage": 8.51, "elapsed_time": "3:37:01", "remaining_time": "1 day, 14:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1528, "total_steps": 17941, "loss": 1.9213, "learning_rate": 9.88091458554757e-05, "epoch": 0.08516805083328688, "percentage": 8.52, "elapsed_time": "3:37:09", "remaining_time": "1 day, 14:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1529, "total_steps": 17941, "loss": 1.7725, "learning_rate": 9.880721331545507e-05, "epoch": 0.08522378908645004, "percentage": 8.52, "elapsed_time": "3:37:18", "remaining_time": "1 day, 14:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 17941, "loss": 1.7671, "learning_rate": 9.880527922755418e-05, "epoch": 0.08527952733961318, "percentage": 8.53, "elapsed_time": "3:37:26", "remaining_time": "1 day, 14:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1531, "total_steps": 17941, "loss": 1.5094, "learning_rate": 9.880334359183441e-05, "epoch": 0.08533526559277632, "percentage": 8.53, "elapsed_time": "3:37:35", "remaining_time": "1 day, 14:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1532, "total_steps": 17941, "loss": 1.8291, "learning_rate": 9.880140640835711e-05, "epoch": 0.08539100384593946, "percentage": 8.54, "elapsed_time": "3:37:43", "remaining_time": "1 day, 14:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1533, "total_steps": 17941, "loss": 1.6669, "learning_rate": 9.879946767718374e-05, "epoch": 0.08544674209910261, "percentage": 8.54, "elapsed_time": "3:37:52", "remaining_time": "1 day, 14:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1534, "total_steps": 17941, "loss": 2.1902, "learning_rate": 9.879752739837578e-05, "epoch": 0.08550248035226576, "percentage": 8.55, "elapsed_time": "3:38:01", "remaining_time": "1 day, 14:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1535, "total_steps": 17941, "loss": 1.5727, "learning_rate": 9.879558557199475e-05, "epoch": 0.0855582186054289, "percentage": 8.56, "elapsed_time": "3:38:09", "remaining_time": "1 day, 14:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1536, "total_steps": 17941, "loss": 1.6102, "learning_rate": 9.879364219810226e-05, "epoch": 0.08561395685859205, "percentage": 8.56, "elapsed_time": "3:38:18", "remaining_time": "1 day, 14:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1537, "total_steps": 17941, "loss": 1.7124, "learning_rate": 9.879169727675991e-05, "epoch": 0.08566969511175519, "percentage": 8.57, "elapsed_time": "3:38:26", "remaining_time": "1 day, 14:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1538, "total_steps": 17941, "loss": 1.7585, "learning_rate": 9.87897508080294e-05, "epoch": 0.08572543336491835, "percentage": 8.57, "elapsed_time": "3:38:35", "remaining_time": "1 day, 14:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1539, "total_steps": 17941, "loss": 1.7857, "learning_rate": 9.878780279197247e-05, "epoch": 0.08578117161808149, "percentage": 8.58, "elapsed_time": "3:38:43", "remaining_time": "1 day, 14:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 17941, "loss": 1.865, "learning_rate": 9.878585322865087e-05, "epoch": 0.08583690987124463, "percentage": 8.58, "elapsed_time": "3:38:52", "remaining_time": "1 day, 14:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1541, "total_steps": 17941, "loss": 1.627, "learning_rate": 9.878390211812646e-05, "epoch": 0.08589264812440778, "percentage": 8.59, "elapsed_time": "3:39:00", "remaining_time": "1 day, 14:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1542, "total_steps": 17941, "loss": 1.7221, "learning_rate": 9.87819494604611e-05, "epoch": 0.08594838637757092, "percentage": 8.59, "elapsed_time": "3:39:08", "remaining_time": "1 day, 14:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1543, "total_steps": 17941, "loss": 1.7696, "learning_rate": 9.877999525571673e-05, "epoch": 0.08600412463073408, "percentage": 8.6, "elapsed_time": "3:39:18", "remaining_time": "1 day, 14:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1544, "total_steps": 17941, "loss": 1.6928, "learning_rate": 9.87780395039553e-05, "epoch": 0.08605986288389722, "percentage": 8.61, "elapsed_time": "3:39:26", "remaining_time": "1 day, 14:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1545, "total_steps": 17941, "loss": 1.8461, "learning_rate": 9.877608220523886e-05, "epoch": 0.08611560113706036, "percentage": 8.61, "elapsed_time": "3:39:34", "remaining_time": "1 day, 14:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1546, "total_steps": 17941, "loss": 1.6598, "learning_rate": 9.877412335962948e-05, "epoch": 0.0861713393902235, "percentage": 8.62, "elapsed_time": "3:39:43", "remaining_time": "1 day, 14:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1547, "total_steps": 17941, "loss": 1.8449, "learning_rate": 9.877216296718929e-05, "epoch": 0.08622707764338666, "percentage": 8.62, "elapsed_time": "3:39:51", "remaining_time": "1 day, 14:49:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1548, "total_steps": 17941, "loss": 2.0521, "learning_rate": 9.877020102798044e-05, "epoch": 0.0862828158965498, "percentage": 8.63, "elapsed_time": "3:40:00", "remaining_time": "1 day, 14:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1549, "total_steps": 17941, "loss": 1.8019, "learning_rate": 9.876823754206517e-05, "epoch": 0.08633855414971295, "percentage": 8.63, "elapsed_time": "3:40:08", "remaining_time": "1 day, 14:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 17941, "loss": 1.9138, "learning_rate": 9.876627250950573e-05, "epoch": 0.08639429240287609, "percentage": 8.64, "elapsed_time": "3:40:17", "remaining_time": "1 day, 14:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1551, "total_steps": 17941, "loss": 1.6576, "learning_rate": 9.876430593036445e-05, "epoch": 0.08645003065603923, "percentage": 8.65, "elapsed_time": "3:40:26", "remaining_time": "1 day, 14:49:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1552, "total_steps": 17941, "loss": 1.9165, "learning_rate": 9.876233780470373e-05, "epoch": 0.08650576890920239, "percentage": 8.65, "elapsed_time": "3:40:34", "remaining_time": "1 day, 14:49:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1553, "total_steps": 17941, "loss": 1.7924, "learning_rate": 9.876036813258593e-05, "epoch": 0.08656150716236553, "percentage": 8.66, "elapsed_time": "3:40:43", "remaining_time": "1 day, 14:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1554, "total_steps": 17941, "loss": 1.7025, "learning_rate": 9.875839691407355e-05, "epoch": 0.08661724541552868, "percentage": 8.66, "elapsed_time": "3:40:51", "remaining_time": "1 day, 14:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1555, "total_steps": 17941, "loss": 1.7742, "learning_rate": 9.875642414922913e-05, "epoch": 0.08667298366869182, "percentage": 8.67, "elapsed_time": "3:41:00", "remaining_time": "1 day, 14:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1556, "total_steps": 17941, "loss": 1.7676, "learning_rate": 9.875444983811517e-05, "epoch": 0.08672872192185498, "percentage": 8.67, "elapsed_time": "3:41:08", "remaining_time": "1 day, 14:48:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1557, "total_steps": 17941, "loss": 1.7824, "learning_rate": 9.875247398079434e-05, "epoch": 0.08678446017501812, "percentage": 8.68, "elapsed_time": "3:41:17", "remaining_time": "1 day, 14:48:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1558, "total_steps": 17941, "loss": 1.5643, "learning_rate": 9.875049657732928e-05, "epoch": 0.08684019842818126, "percentage": 8.68, "elapsed_time": "3:41:25", "remaining_time": "1 day, 14:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1559, "total_steps": 17941, "loss": 1.7751, "learning_rate": 9.87485176277827e-05, "epoch": 0.0868959366813444, "percentage": 8.69, "elapsed_time": "3:41:33", "remaining_time": "1 day, 14:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 17941, "loss": 1.6758, "learning_rate": 9.874653713221736e-05, "epoch": 0.08695167493450755, "percentage": 8.7, "elapsed_time": "3:41:42", "remaining_time": "1 day, 14:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1561, "total_steps": 17941, "loss": 1.9237, "learning_rate": 9.874455509069608e-05, "epoch": 0.0870074131876707, "percentage": 8.7, "elapsed_time": "3:41:50", "remaining_time": "1 day, 14:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1562, "total_steps": 17941, "loss": 1.8882, "learning_rate": 9.874257150328171e-05, "epoch": 0.08706315144083385, "percentage": 8.71, "elapsed_time": "3:41:59", "remaining_time": "1 day, 14:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1563, "total_steps": 17941, "loss": 2.0451, "learning_rate": 9.874058637003715e-05, "epoch": 0.08711888969399699, "percentage": 8.71, "elapsed_time": "3:42:08", "remaining_time": "1 day, 14:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1564, "total_steps": 17941, "loss": 1.924, "learning_rate": 9.87385996910254e-05, "epoch": 0.08717462794716013, "percentage": 8.72, "elapsed_time": "3:42:16", "remaining_time": "1 day, 14:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1565, "total_steps": 17941, "loss": 1.58, "learning_rate": 9.87366114663094e-05, "epoch": 0.08723036620032328, "percentage": 8.72, "elapsed_time": "3:42:25", "remaining_time": "1 day, 14:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1566, "total_steps": 17941, "loss": 1.7895, "learning_rate": 9.873462169595225e-05, "epoch": 0.08728610445348643, "percentage": 8.73, "elapsed_time": "3:42:33", "remaining_time": "1 day, 14:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1567, "total_steps": 17941, "loss": 1.6593, "learning_rate": 9.873263038001706e-05, "epoch": 0.08734184270664958, "percentage": 8.73, "elapsed_time": "3:42:42", "remaining_time": "1 day, 14:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1568, "total_steps": 17941, "loss": 1.8271, "learning_rate": 9.873063751856693e-05, "epoch": 0.08739758095981272, "percentage": 8.74, "elapsed_time": "3:42:51", "remaining_time": "1 day, 14:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1569, "total_steps": 17941, "loss": 1.6083, "learning_rate": 9.872864311166513e-05, "epoch": 0.08745331921297586, "percentage": 8.75, "elapsed_time": "3:42:59", "remaining_time": "1 day, 14:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 17941, "loss": 1.4434, "learning_rate": 9.872664715937485e-05, "epoch": 0.08750905746613902, "percentage": 8.75, "elapsed_time": "3:43:09", "remaining_time": "1 day, 14:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1571, "total_steps": 17941, "loss": 1.7666, "learning_rate": 9.872464966175943e-05, "epoch": 0.08756479571930216, "percentage": 8.76, "elapsed_time": "3:43:17", "remaining_time": "1 day, 14:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1572, "total_steps": 17941, "loss": 2.129, "learning_rate": 9.872265061888222e-05, "epoch": 0.0876205339724653, "percentage": 8.76, "elapsed_time": "3:43:26", "remaining_time": "1 day, 14:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1573, "total_steps": 17941, "loss": 1.757, "learning_rate": 9.87206500308066e-05, "epoch": 0.08767627222562845, "percentage": 8.77, "elapsed_time": "3:43:34", "remaining_time": "1 day, 14:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1574, "total_steps": 17941, "loss": 1.8953, "learning_rate": 9.871864789759602e-05, "epoch": 0.08773201047879159, "percentage": 8.77, "elapsed_time": "3:43:43", "remaining_time": "1 day, 14:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1575, "total_steps": 17941, "loss": 1.5125, "learning_rate": 9.871664421931397e-05, "epoch": 0.08778774873195475, "percentage": 8.78, "elapsed_time": "3:43:51", "remaining_time": "1 day, 14:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1576, "total_steps": 17941, "loss": 1.9326, "learning_rate": 9.8714638996024e-05, "epoch": 0.08784348698511789, "percentage": 8.78, "elapsed_time": "3:43:59", "remaining_time": "1 day, 14:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1577, "total_steps": 17941, "loss": 1.4956, "learning_rate": 9.871263222778972e-05, "epoch": 0.08789922523828103, "percentage": 8.79, "elapsed_time": "3:44:08", "remaining_time": "1 day, 14:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1578, "total_steps": 17941, "loss": 2.0481, "learning_rate": 9.871062391467476e-05, "epoch": 0.08795496349144417, "percentage": 8.8, "elapsed_time": "3:44:16", "remaining_time": "1 day, 14:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1579, "total_steps": 17941, "loss": 1.6748, "learning_rate": 9.870861405674281e-05, "epoch": 0.08801070174460733, "percentage": 8.8, "elapsed_time": "3:44:25", "remaining_time": "1 day, 14:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 17941, "loss": 1.5146, "learning_rate": 9.87066026540576e-05, "epoch": 0.08806643999777047, "percentage": 8.81, "elapsed_time": "3:44:33", "remaining_time": "1 day, 14:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1581, "total_steps": 17941, "loss": 1.9752, "learning_rate": 9.870458970668295e-05, "epoch": 0.08812217825093362, "percentage": 8.81, "elapsed_time": "3:44:42", "remaining_time": "1 day, 14:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1582, "total_steps": 17941, "loss": 1.8943, "learning_rate": 9.870257521468267e-05, "epoch": 0.08817791650409676, "percentage": 8.82, "elapsed_time": "3:44:50", "remaining_time": "1 day, 14:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1583, "total_steps": 17941, "loss": 1.7243, "learning_rate": 9.870055917812066e-05, "epoch": 0.0882336547572599, "percentage": 8.82, "elapsed_time": "3:44:59", "remaining_time": "1 day, 14:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1584, "total_steps": 17941, "loss": 1.608, "learning_rate": 9.869854159706087e-05, "epoch": 0.08828939301042306, "percentage": 8.83, "elapsed_time": "3:45:07", "remaining_time": "1 day, 14:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1585, "total_steps": 17941, "loss": 1.8326, "learning_rate": 9.869652247156726e-05, "epoch": 0.0883451312635862, "percentage": 8.83, "elapsed_time": "3:45:16", "remaining_time": "1 day, 14:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1586, "total_steps": 17941, "loss": 1.5715, "learning_rate": 9.869450180170388e-05, "epoch": 0.08840086951674934, "percentage": 8.84, "elapsed_time": "3:45:24", "remaining_time": "1 day, 14:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1587, "total_steps": 17941, "loss": 1.9452, "learning_rate": 9.869247958753483e-05, "epoch": 0.08845660776991249, "percentage": 8.85, "elapsed_time": "3:45:33", "remaining_time": "1 day, 14:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1588, "total_steps": 17941, "loss": 1.7894, "learning_rate": 9.86904558291242e-05, "epoch": 0.08851234602307563, "percentage": 8.85, "elapsed_time": "3:45:41", "remaining_time": "1 day, 14:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1589, "total_steps": 17941, "loss": 1.8428, "learning_rate": 9.86884305265362e-05, "epoch": 0.08856808427623879, "percentage": 8.86, "elapsed_time": "3:45:49", "remaining_time": "1 day, 14:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 17941, "loss": 1.9602, "learning_rate": 9.868640367983507e-05, "epoch": 0.08862382252940193, "percentage": 8.86, "elapsed_time": "3:45:58", "remaining_time": "1 day, 14:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1591, "total_steps": 17941, "loss": 1.8967, "learning_rate": 9.868437528908507e-05, "epoch": 0.08867956078256507, "percentage": 8.87, "elapsed_time": "3:46:06", "remaining_time": "1 day, 14:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1592, "total_steps": 17941, "loss": 1.5939, "learning_rate": 9.868234535435052e-05, "epoch": 0.08873529903572822, "percentage": 8.87, "elapsed_time": "3:46:15", "remaining_time": "1 day, 14:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1593, "total_steps": 17941, "loss": 1.7461, "learning_rate": 9.868031387569583e-05, "epoch": 0.08879103728889137, "percentage": 8.88, "elapsed_time": "3:46:23", "remaining_time": "1 day, 14:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1594, "total_steps": 17941, "loss": 1.7843, "learning_rate": 9.867828085318541e-05, "epoch": 0.08884677554205452, "percentage": 8.88, "elapsed_time": "3:46:32", "remaining_time": "1 day, 14:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1595, "total_steps": 17941, "loss": 1.981, "learning_rate": 9.867624628688374e-05, "epoch": 0.08890251379521766, "percentage": 8.89, "elapsed_time": "3:46:40", "remaining_time": "1 day, 14:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1596, "total_steps": 17941, "loss": 1.3437, "learning_rate": 9.867421017685531e-05, "epoch": 0.0889582520483808, "percentage": 8.9, "elapsed_time": "3:46:49", "remaining_time": "1 day, 14:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1597, "total_steps": 17941, "loss": 1.6426, "learning_rate": 9.867217252316476e-05, "epoch": 0.08901399030154394, "percentage": 8.9, "elapsed_time": "3:46:57", "remaining_time": "1 day, 14:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1598, "total_steps": 17941, "loss": 1.5808, "learning_rate": 9.867013332587667e-05, "epoch": 0.0890697285547071, "percentage": 8.91, "elapsed_time": "3:47:06", "remaining_time": "1 day, 14:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1599, "total_steps": 17941, "loss": 1.8197, "learning_rate": 9.86680925850557e-05, "epoch": 0.08912546680787024, "percentage": 8.91, "elapsed_time": "3:47:14", "remaining_time": "1 day, 14:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 17941, "loss": 1.6238, "learning_rate": 9.86660503007666e-05, "epoch": 0.08918120506103339, "percentage": 8.92, "elapsed_time": "3:47:22", "remaining_time": "1 day, 14:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1601, "total_steps": 17941, "loss": 1.8063, "learning_rate": 9.866400647307413e-05, "epoch": 0.08923694331419653, "percentage": 8.92, "elapsed_time": "3:47:31", "remaining_time": "1 day, 14:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1602, "total_steps": 17941, "loss": 1.8849, "learning_rate": 9.86619611020431e-05, "epoch": 0.08929268156735969, "percentage": 8.93, "elapsed_time": "3:47:39", "remaining_time": "1 day, 14:41:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1603, "total_steps": 17941, "loss": 1.5961, "learning_rate": 9.865991418773837e-05, "epoch": 0.08934841982052283, "percentage": 8.93, "elapsed_time": "3:47:48", "remaining_time": "1 day, 14:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1604, "total_steps": 17941, "loss": 1.782, "learning_rate": 9.865786573022488e-05, "epoch": 0.08940415807368597, "percentage": 8.94, "elapsed_time": "3:47:56", "remaining_time": "1 day, 14:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1605, "total_steps": 17941, "loss": 1.9102, "learning_rate": 9.865581572956759e-05, "epoch": 0.08945989632684911, "percentage": 8.95, "elapsed_time": "3:48:05", "remaining_time": "1 day, 14:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1606, "total_steps": 17941, "loss": 1.8494, "learning_rate": 9.86537641858315e-05, "epoch": 0.08951563458001226, "percentage": 8.95, "elapsed_time": "3:48:13", "remaining_time": "1 day, 14:41:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1607, "total_steps": 17941, "loss": 1.7515, "learning_rate": 9.865171109908169e-05, "epoch": 0.08957137283317541, "percentage": 8.96, "elapsed_time": "3:48:22", "remaining_time": "1 day, 14:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1608, "total_steps": 17941, "loss": 1.6874, "learning_rate": 9.864965646938326e-05, "epoch": 0.08962711108633856, "percentage": 8.96, "elapsed_time": "3:48:30", "remaining_time": "1 day, 14:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1609, "total_steps": 17941, "loss": 1.7417, "learning_rate": 9.864760029680137e-05, "epoch": 0.0896828493395017, "percentage": 8.97, "elapsed_time": "3:48:39", "remaining_time": "1 day, 14:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 17941, "loss": 1.7553, "learning_rate": 9.864554258140124e-05, "epoch": 0.08973858759266484, "percentage": 8.97, "elapsed_time": "3:48:47", "remaining_time": "1 day, 14:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1611, "total_steps": 17941, "loss": 1.7663, "learning_rate": 9.864348332324811e-05, "epoch": 0.08979432584582799, "percentage": 8.98, "elapsed_time": "3:48:55", "remaining_time": "1 day, 14:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1612, "total_steps": 17941, "loss": 1.6, "learning_rate": 9.864142252240731e-05, "epoch": 0.08985006409899114, "percentage": 8.99, "elapsed_time": "3:49:04", "remaining_time": "1 day, 14:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1613, "total_steps": 17941, "loss": 1.8076, "learning_rate": 9.863936017894418e-05, "epoch": 0.08990580235215428, "percentage": 8.99, "elapsed_time": "3:49:12", "remaining_time": "1 day, 14:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1614, "total_steps": 17941, "loss": 1.7864, "learning_rate": 9.863729629292414e-05, "epoch": 0.08996154060531743, "percentage": 9.0, "elapsed_time": "3:49:21", "remaining_time": "1 day, 14:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1615, "total_steps": 17941, "loss": 1.931, "learning_rate": 9.863523086441264e-05, "epoch": 0.09001727885848057, "percentage": 9.0, "elapsed_time": "3:49:29", "remaining_time": "1 day, 14:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1616, "total_steps": 17941, "loss": 1.7562, "learning_rate": 9.863316389347517e-05, "epoch": 0.09007301711164373, "percentage": 9.01, "elapsed_time": "3:49:38", "remaining_time": "1 day, 14:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1617, "total_steps": 17941, "loss": 1.6973, "learning_rate": 9.863109538017729e-05, "epoch": 0.09012875536480687, "percentage": 9.01, "elapsed_time": "3:49:46", "remaining_time": "1 day, 14:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1618, "total_steps": 17941, "loss": 2.0494, "learning_rate": 9.862902532458461e-05, "epoch": 0.09018449361797001, "percentage": 9.02, "elapsed_time": "3:49:55", "remaining_time": "1 day, 14:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1619, "total_steps": 17941, "loss": 1.6505, "learning_rate": 9.862695372676278e-05, "epoch": 0.09024023187113316, "percentage": 9.02, "elapsed_time": "3:50:03", "remaining_time": "1 day, 14:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1620, "total_steps": 17941, "loss": 1.734, "learning_rate": 9.862488058677748e-05, "epoch": 0.0902959701242963, "percentage": 9.03, "elapsed_time": "3:50:12", "remaining_time": "1 day, 14:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1621, "total_steps": 17941, "loss": 1.8098, "learning_rate": 9.862280590469448e-05, "epoch": 0.09035170837745946, "percentage": 9.04, "elapsed_time": "3:50:20", "remaining_time": "1 day, 14:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1622, "total_steps": 17941, "loss": 1.8394, "learning_rate": 9.862072968057956e-05, "epoch": 0.0904074466306226, "percentage": 9.04, "elapsed_time": "3:50:28", "remaining_time": "1 day, 14:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1623, "total_steps": 17941, "loss": 1.6742, "learning_rate": 9.861865191449858e-05, "epoch": 0.09046318488378574, "percentage": 9.05, "elapsed_time": "3:50:37", "remaining_time": "1 day, 14:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1624, "total_steps": 17941, "loss": 1.6425, "learning_rate": 9.861657260651742e-05, "epoch": 0.09051892313694888, "percentage": 9.05, "elapsed_time": "3:50:45", "remaining_time": "1 day, 14:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1625, "total_steps": 17941, "loss": 1.5693, "learning_rate": 9.861449175670204e-05, "epoch": 0.09057466139011204, "percentage": 9.06, "elapsed_time": "3:50:54", "remaining_time": "1 day, 14:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1626, "total_steps": 17941, "loss": 1.6782, "learning_rate": 9.861240936511842e-05, "epoch": 0.09063039964327518, "percentage": 9.06, "elapsed_time": "3:51:02", "remaining_time": "1 day, 14:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1627, "total_steps": 17941, "loss": 1.9775, "learning_rate": 9.86103254318326e-05, "epoch": 0.09068613789643833, "percentage": 9.07, "elapsed_time": "3:51:11", "remaining_time": "1 day, 14:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1628, "total_steps": 17941, "loss": 1.9425, "learning_rate": 9.860823995691068e-05, "epoch": 0.09074187614960147, "percentage": 9.07, "elapsed_time": "3:51:19", "remaining_time": "1 day, 14:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1629, "total_steps": 17941, "loss": 1.6473, "learning_rate": 9.860615294041879e-05, "epoch": 0.09079761440276461, "percentage": 9.08, "elapsed_time": "3:51:27", "remaining_time": "1 day, 14:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1630, "total_steps": 17941, "loss": 1.6367, "learning_rate": 9.860406438242313e-05, "epoch": 0.09085335265592777, "percentage": 9.09, "elapsed_time": "3:51:36", "remaining_time": "1 day, 14:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1631, "total_steps": 17941, "loss": 1.7602, "learning_rate": 9.860197428298991e-05, "epoch": 0.09090909090909091, "percentage": 9.09, "elapsed_time": "3:51:44", "remaining_time": "1 day, 14:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1632, "total_steps": 17941, "loss": 1.546, "learning_rate": 9.859988264218546e-05, "epoch": 0.09096482916225405, "percentage": 9.1, "elapsed_time": "3:51:53", "remaining_time": "1 day, 14:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1633, "total_steps": 17941, "loss": 1.5578, "learning_rate": 9.859778946007608e-05, "epoch": 0.0910205674154172, "percentage": 9.1, "elapsed_time": "3:52:02", "remaining_time": "1 day, 14:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1634, "total_steps": 17941, "loss": 1.3888, "learning_rate": 9.859569473672816e-05, "epoch": 0.09107630566858034, "percentage": 9.11, "elapsed_time": "3:52:10", "remaining_time": "1 day, 14:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1635, "total_steps": 17941, "loss": 1.7516, "learning_rate": 9.859359847220815e-05, "epoch": 0.0911320439217435, "percentage": 9.11, "elapsed_time": "3:52:18", "remaining_time": "1 day, 14:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1636, "total_steps": 17941, "loss": 1.7055, "learning_rate": 9.85915006665825e-05, "epoch": 0.09118778217490664, "percentage": 9.12, "elapsed_time": "3:52:27", "remaining_time": "1 day, 14:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1637, "total_steps": 17941, "loss": 1.8203, "learning_rate": 9.858940131991777e-05, "epoch": 0.09124352042806978, "percentage": 9.12, "elapsed_time": "3:52:35", "remaining_time": "1 day, 14:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1638, "total_steps": 17941, "loss": 1.5783, "learning_rate": 9.85873004322805e-05, "epoch": 0.09129925868123293, "percentage": 9.13, "elapsed_time": "3:52:44", "remaining_time": "1 day, 14:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1639, "total_steps": 17941, "loss": 1.7707, "learning_rate": 9.858519800373738e-05, "epoch": 0.09135499693439608, "percentage": 9.14, "elapsed_time": "3:52:53", "remaining_time": "1 day, 14:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1640, "total_steps": 17941, "loss": 1.6027, "learning_rate": 9.858309403435501e-05, "epoch": 0.09141073518755923, "percentage": 9.14, "elapsed_time": "3:53:01", "remaining_time": "1 day, 14:36:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1641, "total_steps": 17941, "loss": 1.7874, "learning_rate": 9.85809885242002e-05, "epoch": 0.09146647344072237, "percentage": 9.15, "elapsed_time": "3:53:10", "remaining_time": "1 day, 14:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1642, "total_steps": 17941, "loss": 1.7223, "learning_rate": 9.857888147333965e-05, "epoch": 0.09152221169388551, "percentage": 9.15, "elapsed_time": "3:53:18", "remaining_time": "1 day, 14:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1643, "total_steps": 17941, "loss": 1.8618, "learning_rate": 9.857677288184022e-05, "epoch": 0.09157794994704865, "percentage": 9.16, "elapsed_time": "3:53:27", "remaining_time": "1 day, 14:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1644, "total_steps": 17941, "loss": 1.761, "learning_rate": 9.857466274976878e-05, "epoch": 0.09163368820021181, "percentage": 9.16, "elapsed_time": "3:53:35", "remaining_time": "1 day, 14:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1645, "total_steps": 17941, "loss": 1.7272, "learning_rate": 9.857255107719225e-05, "epoch": 0.09168942645337495, "percentage": 9.17, "elapsed_time": "3:53:44", "remaining_time": "1 day, 14:35:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1646, "total_steps": 17941, "loss": 1.7532, "learning_rate": 9.857043786417759e-05, "epoch": 0.0917451647065381, "percentage": 9.17, "elapsed_time": "3:53:52", "remaining_time": "1 day, 14:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1647, "total_steps": 17941, "loss": 1.9235, "learning_rate": 9.856832311079183e-05, "epoch": 0.09180090295970124, "percentage": 9.18, "elapsed_time": "3:54:00", "remaining_time": "1 day, 14:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1648, "total_steps": 17941, "loss": 1.8481, "learning_rate": 9.856620681710205e-05, "epoch": 0.0918566412128644, "percentage": 9.19, "elapsed_time": "3:54:09", "remaining_time": "1 day, 14:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1649, "total_steps": 17941, "loss": 1.7273, "learning_rate": 9.856408898317533e-05, "epoch": 0.09191237946602754, "percentage": 9.19, "elapsed_time": "3:54:17", "remaining_time": "1 day, 14:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 17941, "loss": 1.8292, "learning_rate": 9.856196960907887e-05, "epoch": 0.09196811771919068, "percentage": 9.2, "elapsed_time": "3:54:26", "remaining_time": "1 day, 14:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1651, "total_steps": 17941, "loss": 1.7672, "learning_rate": 9.855984869487985e-05, "epoch": 0.09202385597235382, "percentage": 9.2, "elapsed_time": "3:54:34", "remaining_time": "1 day, 14:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1652, "total_steps": 17941, "loss": 1.7338, "learning_rate": 9.855772624064557e-05, "epoch": 0.09207959422551697, "percentage": 9.21, "elapsed_time": "3:54:43", "remaining_time": "1 day, 14:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1653, "total_steps": 17941, "loss": 1.8558, "learning_rate": 9.855560224644332e-05, "epoch": 0.09213533247868012, "percentage": 9.21, "elapsed_time": "3:54:51", "remaining_time": "1 day, 14:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1654, "total_steps": 17941, "loss": 1.7338, "learning_rate": 9.855347671234045e-05, "epoch": 0.09219107073184327, "percentage": 9.22, "elapsed_time": "3:55:00", "remaining_time": "1 day, 14:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1655, "total_steps": 17941, "loss": 1.9314, "learning_rate": 9.855134963840441e-05, "epoch": 0.09224680898500641, "percentage": 9.22, "elapsed_time": "3:55:08", "remaining_time": "1 day, 14:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1656, "total_steps": 17941, "loss": 1.7196, "learning_rate": 9.854922102470262e-05, "epoch": 0.09230254723816955, "percentage": 9.23, "elapsed_time": "3:55:18", "remaining_time": "1 day, 14:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1657, "total_steps": 17941, "loss": 1.7249, "learning_rate": 9.85470908713026e-05, "epoch": 0.0923582854913327, "percentage": 9.24, "elapsed_time": "3:55:26", "remaining_time": "1 day, 14:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1658, "total_steps": 17941, "loss": 1.7368, "learning_rate": 9.854495917827191e-05, "epoch": 0.09241402374449585, "percentage": 9.24, "elapsed_time": "3:55:34", "remaining_time": "1 day, 14:33:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1659, "total_steps": 17941, "loss": 1.8287, "learning_rate": 9.854282594567816e-05, "epoch": 0.092469761997659, "percentage": 9.25, "elapsed_time": "3:55:43", "remaining_time": "1 day, 14:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1660, "total_steps": 17941, "loss": 1.743, "learning_rate": 9.854069117358899e-05, "epoch": 0.09252550025082214, "percentage": 9.25, "elapsed_time": "3:55:51", "remaining_time": "1 day, 14:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1661, "total_steps": 17941, "loss": 1.7903, "learning_rate": 9.853855486207211e-05, "epoch": 0.09258123850398528, "percentage": 9.26, "elapsed_time": "3:56:00", "remaining_time": "1 day, 14:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1662, "total_steps": 17941, "loss": 1.6038, "learning_rate": 9.853641701119525e-05, "epoch": 0.09263697675714844, "percentage": 9.26, "elapsed_time": "3:56:09", "remaining_time": "1 day, 14:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1663, "total_steps": 17941, "loss": 1.7459, "learning_rate": 9.853427762102625e-05, "epoch": 0.09269271501031158, "percentage": 9.27, "elapsed_time": "3:56:17", "remaining_time": "1 day, 14:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1664, "total_steps": 17941, "loss": 1.7409, "learning_rate": 9.853213669163293e-05, "epoch": 0.09274845326347472, "percentage": 9.27, "elapsed_time": "3:56:25", "remaining_time": "1 day, 14:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1665, "total_steps": 17941, "loss": 1.8207, "learning_rate": 9.852999422308319e-05, "epoch": 0.09280419151663787, "percentage": 9.28, "elapsed_time": "3:56:34", "remaining_time": "1 day, 14:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1666, "total_steps": 17941, "loss": 1.9794, "learning_rate": 9.852785021544499e-05, "epoch": 0.09285992976980101, "percentage": 9.29, "elapsed_time": "3:56:43", "remaining_time": "1 day, 14:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1667, "total_steps": 17941, "loss": 1.8052, "learning_rate": 9.852570466878632e-05, "epoch": 0.09291566802296417, "percentage": 9.29, "elapsed_time": "3:56:51", "remaining_time": "1 day, 14:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1668, "total_steps": 17941, "loss": 1.6414, "learning_rate": 9.852355758317523e-05, "epoch": 0.09297140627612731, "percentage": 9.3, "elapsed_time": "3:57:00", "remaining_time": "1 day, 14:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1669, "total_steps": 17941, "loss": 1.561, "learning_rate": 9.85214089586798e-05, "epoch": 0.09302714452929045, "percentage": 9.3, "elapsed_time": "3:57:08", "remaining_time": "1 day, 14:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1670, "total_steps": 17941, "loss": 1.7192, "learning_rate": 9.851925879536817e-05, "epoch": 0.0930828827824536, "percentage": 9.31, "elapsed_time": "3:57:17", "remaining_time": "1 day, 14:31:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1671, "total_steps": 17941, "loss": 1.6869, "learning_rate": 9.851710709330855e-05, "epoch": 0.09313862103561675, "percentage": 9.31, "elapsed_time": "3:57:25", "remaining_time": "1 day, 14:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1672, "total_steps": 17941, "loss": 1.7307, "learning_rate": 9.851495385256915e-05, "epoch": 0.0931943592887799, "percentage": 9.32, "elapsed_time": "3:57:33", "remaining_time": "1 day, 14:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1673, "total_steps": 17941, "loss": 1.8593, "learning_rate": 9.851279907321829e-05, "epoch": 0.09325009754194304, "percentage": 9.33, "elapsed_time": "3:57:42", "remaining_time": "1 day, 14:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1674, "total_steps": 17941, "loss": 1.7155, "learning_rate": 9.851064275532428e-05, "epoch": 0.09330583579510618, "percentage": 9.33, "elapsed_time": "3:57:51", "remaining_time": "1 day, 14:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1675, "total_steps": 17941, "loss": 1.7011, "learning_rate": 9.850848489895553e-05, "epoch": 0.09336157404826932, "percentage": 9.34, "elapsed_time": "3:57:59", "remaining_time": "1 day, 14:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1676, "total_steps": 17941, "loss": 1.8851, "learning_rate": 9.850632550418046e-05, "epoch": 0.09341731230143248, "percentage": 9.34, "elapsed_time": "3:58:08", "remaining_time": "1 day, 14:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1677, "total_steps": 17941, "loss": 1.7392, "learning_rate": 9.850416457106755e-05, "epoch": 0.09347305055459562, "percentage": 9.35, "elapsed_time": "3:58:16", "remaining_time": "1 day, 14:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1678, "total_steps": 17941, "loss": 1.8583, "learning_rate": 9.850200209968535e-05, "epoch": 0.09352878880775876, "percentage": 9.35, "elapsed_time": "3:58:25", "remaining_time": "1 day, 14:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1679, "total_steps": 17941, "loss": 1.9008, "learning_rate": 9.849983809010242e-05, "epoch": 0.09358452706092191, "percentage": 9.36, "elapsed_time": "3:58:33", "remaining_time": "1 day, 14:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 17941, "loss": 1.8536, "learning_rate": 9.849767254238741e-05, "epoch": 0.09364026531408505, "percentage": 9.36, "elapsed_time": "3:58:42", "remaining_time": "1 day, 14:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1681, "total_steps": 17941, "loss": 1.6492, "learning_rate": 9.849550545660898e-05, "epoch": 0.0936960035672482, "percentage": 9.37, "elapsed_time": "3:58:50", "remaining_time": "1 day, 14:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1682, "total_steps": 17941, "loss": 1.8646, "learning_rate": 9.849333683283587e-05, "epoch": 0.09375174182041135, "percentage": 9.38, "elapsed_time": "3:58:59", "remaining_time": "1 day, 14:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1683, "total_steps": 17941, "loss": 1.6978, "learning_rate": 9.849116667113684e-05, "epoch": 0.09380748007357449, "percentage": 9.38, "elapsed_time": "3:59:07", "remaining_time": "1 day, 14:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1684, "total_steps": 17941, "loss": 1.7446, "learning_rate": 9.848899497158075e-05, "epoch": 0.09386321832673764, "percentage": 9.39, "elapsed_time": "3:59:15", "remaining_time": "1 day, 14:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1685, "total_steps": 17941, "loss": 1.9409, "learning_rate": 9.848682173423642e-05, "epoch": 0.09391895657990079, "percentage": 9.39, "elapsed_time": "3:59:24", "remaining_time": "1 day, 14:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1686, "total_steps": 17941, "loss": 1.9023, "learning_rate": 9.848464695917283e-05, "epoch": 0.09397469483306393, "percentage": 9.4, "elapsed_time": "3:59:33", "remaining_time": "1 day, 14:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1687, "total_steps": 17941, "loss": 1.8456, "learning_rate": 9.84824706464589e-05, "epoch": 0.09403043308622708, "percentage": 9.4, "elapsed_time": "3:59:41", "remaining_time": "1 day, 14:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1688, "total_steps": 17941, "loss": 1.6156, "learning_rate": 9.848029279616369e-05, "epoch": 0.09408617133939022, "percentage": 9.41, "elapsed_time": "3:59:50", "remaining_time": "1 day, 14:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1689, "total_steps": 17941, "loss": 1.8053, "learning_rate": 9.847811340835625e-05, "epoch": 0.09414190959255336, "percentage": 9.41, "elapsed_time": "3:59:58", "remaining_time": "1 day, 14:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1690, "total_steps": 17941, "loss": 1.8396, "learning_rate": 9.847593248310569e-05, "epoch": 0.09419764784571652, "percentage": 9.42, "elapsed_time": "4:00:06", "remaining_time": "1 day, 14:28:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1691, "total_steps": 17941, "loss": 1.702, "learning_rate": 9.847375002048119e-05, "epoch": 0.09425338609887966, "percentage": 9.43, "elapsed_time": "4:00:15", "remaining_time": "1 day, 14:28:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1692, "total_steps": 17941, "loss": 1.7258, "learning_rate": 9.847156602055196e-05, "epoch": 0.0943091243520428, "percentage": 9.43, "elapsed_time": "4:00:23", "remaining_time": "1 day, 14:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1693, "total_steps": 17941, "loss": 1.9521, "learning_rate": 9.846938048338728e-05, "epoch": 0.09436486260520595, "percentage": 9.44, "elapsed_time": "4:00:32", "remaining_time": "1 day, 14:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1694, "total_steps": 17941, "loss": 1.7358, "learning_rate": 9.846719340905643e-05, "epoch": 0.0944206008583691, "percentage": 9.44, "elapsed_time": "4:00:40", "remaining_time": "1 day, 14:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1695, "total_steps": 17941, "loss": 1.9847, "learning_rate": 9.846500479762879e-05, "epoch": 0.09447633911153225, "percentage": 9.45, "elapsed_time": "4:00:49", "remaining_time": "1 day, 14:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1696, "total_steps": 17941, "loss": 1.777, "learning_rate": 9.846281464917377e-05, "epoch": 0.09453207736469539, "percentage": 9.45, "elapsed_time": "4:00:58", "remaining_time": "1 day, 14:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1697, "total_steps": 17941, "loss": 1.6861, "learning_rate": 9.846062296376083e-05, "epoch": 0.09458781561785853, "percentage": 9.46, "elapsed_time": "4:01:06", "remaining_time": "1 day, 14:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1698, "total_steps": 17941, "loss": 1.8176, "learning_rate": 9.845842974145947e-05, "epoch": 0.09464355387102168, "percentage": 9.46, "elapsed_time": "4:01:15", "remaining_time": "1 day, 14:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1699, "total_steps": 17941, "loss": 1.6658, "learning_rate": 9.845623498233926e-05, "epoch": 0.09469929212418483, "percentage": 9.47, "elapsed_time": "4:01:23", "remaining_time": "1 day, 14:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 17941, "loss": 1.7287, "learning_rate": 9.845403868646979e-05, "epoch": 0.09475503037734798, "percentage": 9.48, "elapsed_time": "4:01:31", "remaining_time": "1 day, 14:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1701, "total_steps": 17941, "loss": 1.6861, "learning_rate": 9.845184085392072e-05, "epoch": 0.09481076863051112, "percentage": 9.48, "elapsed_time": "4:01:40", "remaining_time": "1 day, 14:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1702, "total_steps": 17941, "loss": 1.9309, "learning_rate": 9.844964148476175e-05, "epoch": 0.09486650688367426, "percentage": 9.49, "elapsed_time": "4:01:48", "remaining_time": "1 day, 14:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1703, "total_steps": 17941, "loss": 1.738, "learning_rate": 9.844744057906263e-05, "epoch": 0.0949222451368374, "percentage": 9.49, "elapsed_time": "4:01:57", "remaining_time": "1 day, 14:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1704, "total_steps": 17941, "loss": 1.8729, "learning_rate": 9.844523813689316e-05, "epoch": 0.09497798339000056, "percentage": 9.5, "elapsed_time": "4:02:06", "remaining_time": "1 day, 14:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1705, "total_steps": 17941, "loss": 1.901, "learning_rate": 9.844303415832322e-05, "epoch": 0.0950337216431637, "percentage": 9.5, "elapsed_time": "4:02:14", "remaining_time": "1 day, 14:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1706, "total_steps": 17941, "loss": 1.7838, "learning_rate": 9.844082864342265e-05, "epoch": 0.09508945989632685, "percentage": 9.51, "elapsed_time": "4:02:23", "remaining_time": "1 day, 14:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1707, "total_steps": 17941, "loss": 1.7044, "learning_rate": 9.843862159226142e-05, "epoch": 0.09514519814948999, "percentage": 9.51, "elapsed_time": "4:02:31", "remaining_time": "1 day, 14:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1708, "total_steps": 17941, "loss": 1.6637, "learning_rate": 9.843641300490956e-05, "epoch": 0.09520093640265315, "percentage": 9.52, "elapsed_time": "4:02:40", "remaining_time": "1 day, 14:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1709, "total_steps": 17941, "loss": 1.5714, "learning_rate": 9.843420288143706e-05, "epoch": 0.09525667465581629, "percentage": 9.53, "elapsed_time": "4:02:49", "remaining_time": "1 day, 14:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1710, "total_steps": 17941, "loss": 2.0123, "learning_rate": 9.843199122191404e-05, "epoch": 0.09531241290897943, "percentage": 9.53, "elapsed_time": "4:02:57", "remaining_time": "1 day, 14:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1711, "total_steps": 17941, "loss": 1.74, "learning_rate": 9.842977802641065e-05, "epoch": 0.09536815116214258, "percentage": 9.54, "elapsed_time": "4:03:06", "remaining_time": "1 day, 14:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1712, "total_steps": 17941, "loss": 1.8003, "learning_rate": 9.842756329499704e-05, "epoch": 0.09542388941530572, "percentage": 9.54, "elapsed_time": "4:03:14", "remaining_time": "1 day, 14:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1713, "total_steps": 17941, "loss": 1.6448, "learning_rate": 9.842534702774349e-05, "epoch": 0.09547962766846887, "percentage": 9.55, "elapsed_time": "4:03:23", "remaining_time": "1 day, 14:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1714, "total_steps": 17941, "loss": 1.8862, "learning_rate": 9.842312922472028e-05, "epoch": 0.09553536592163202, "percentage": 9.55, "elapsed_time": "4:03:31", "remaining_time": "1 day, 14:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1715, "total_steps": 17941, "loss": 1.7858, "learning_rate": 9.842090988599772e-05, "epoch": 0.09559110417479516, "percentage": 9.56, "elapsed_time": "4:03:40", "remaining_time": "1 day, 14:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1716, "total_steps": 17941, "loss": 1.8487, "learning_rate": 9.841868901164622e-05, "epoch": 0.0956468424279583, "percentage": 9.56, "elapsed_time": "4:03:49", "remaining_time": "1 day, 14:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1717, "total_steps": 17941, "loss": 1.5147, "learning_rate": 9.84164666017362e-05, "epoch": 0.09570258068112146, "percentage": 9.57, "elapsed_time": "4:03:57", "remaining_time": "1 day, 14:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1718, "total_steps": 17941, "loss": 1.9583, "learning_rate": 9.841424265633816e-05, "epoch": 0.0957583189342846, "percentage": 9.58, "elapsed_time": "4:04:06", "remaining_time": "1 day, 14:25:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1719, "total_steps": 17941, "loss": 1.7111, "learning_rate": 9.84120171755226e-05, "epoch": 0.09581405718744775, "percentage": 9.58, "elapsed_time": "4:04:14", "remaining_time": "1 day, 14:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1720, "total_steps": 17941, "loss": 1.9152, "learning_rate": 9.840979015936014e-05, "epoch": 0.09586979544061089, "percentage": 9.59, "elapsed_time": "4:04:23", "remaining_time": "1 day, 14:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1721, "total_steps": 17941, "loss": 1.7902, "learning_rate": 9.840756160792138e-05, "epoch": 0.09592553369377403, "percentage": 9.59, "elapsed_time": "4:04:32", "remaining_time": "1 day, 14:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1722, "total_steps": 17941, "loss": 1.864, "learning_rate": 9.840533152127697e-05, "epoch": 0.09598127194693719, "percentage": 9.6, "elapsed_time": "4:04:40", "remaining_time": "1 day, 14:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1723, "total_steps": 17941, "loss": 1.7866, "learning_rate": 9.840309989949769e-05, "epoch": 0.09603701020010033, "percentage": 9.6, "elapsed_time": "4:04:48", "remaining_time": "1 day, 14:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1724, "total_steps": 17941, "loss": 1.8186, "learning_rate": 9.84008667426543e-05, "epoch": 0.09609274845326347, "percentage": 9.61, "elapsed_time": "4:04:57", "remaining_time": "1 day, 14:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1725, "total_steps": 17941, "loss": 1.8207, "learning_rate": 9.839863205081761e-05, "epoch": 0.09614848670642662, "percentage": 9.61, "elapsed_time": "4:05:06", "remaining_time": "1 day, 14:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1726, "total_steps": 17941, "loss": 1.8912, "learning_rate": 9.839639582405849e-05, "epoch": 0.09620422495958976, "percentage": 9.62, "elapsed_time": "4:05:14", "remaining_time": "1 day, 14:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1727, "total_steps": 17941, "loss": 1.6001, "learning_rate": 9.839415806244785e-05, "epoch": 0.09625996321275292, "percentage": 9.63, "elapsed_time": "4:05:23", "remaining_time": "1 day, 14:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1728, "total_steps": 17941, "loss": 1.6385, "learning_rate": 9.839191876605668e-05, "epoch": 0.09631570146591606, "percentage": 9.63, "elapsed_time": "4:05:32", "remaining_time": "1 day, 14:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1729, "total_steps": 17941, "loss": 1.8683, "learning_rate": 9.838967793495601e-05, "epoch": 0.0963714397190792, "percentage": 9.64, "elapsed_time": "4:05:40", "remaining_time": "1 day, 14:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1730, "total_steps": 17941, "loss": 1.7169, "learning_rate": 9.838743556921688e-05, "epoch": 0.09642717797224234, "percentage": 9.64, "elapsed_time": "4:05:49", "remaining_time": "1 day, 14:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1731, "total_steps": 17941, "loss": 1.7714, "learning_rate": 9.83851916689104e-05, "epoch": 0.0964829162254055, "percentage": 9.65, "elapsed_time": "4:05:57", "remaining_time": "1 day, 14:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1732, "total_steps": 17941, "loss": 1.961, "learning_rate": 9.838294623410776e-05, "epoch": 0.09653865447856864, "percentage": 9.65, "elapsed_time": "4:06:06", "remaining_time": "1 day, 14:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1733, "total_steps": 17941, "loss": 1.9466, "learning_rate": 9.838069926488016e-05, "epoch": 0.09659439273173179, "percentage": 9.66, "elapsed_time": "4:06:14", "remaining_time": "1 day, 14:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1734, "total_steps": 17941, "loss": 1.6369, "learning_rate": 9.837845076129885e-05, "epoch": 0.09665013098489493, "percentage": 9.67, "elapsed_time": "4:06:23", "remaining_time": "1 day, 14:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1735, "total_steps": 17941, "loss": 1.6879, "learning_rate": 9.837620072343514e-05, "epoch": 0.09670586923805807, "percentage": 9.67, "elapsed_time": "4:06:31", "remaining_time": "1 day, 14:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1736, "total_steps": 17941, "loss": 2.0888, "learning_rate": 9.83739491513604e-05, "epoch": 0.09676160749122123, "percentage": 9.68, "elapsed_time": "4:06:40", "remaining_time": "1 day, 14:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1737, "total_steps": 17941, "loss": 2.0155, "learning_rate": 9.837169604514605e-05, "epoch": 0.09681734574438437, "percentage": 9.68, "elapsed_time": "4:06:48", "remaining_time": "1 day, 14:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1738, "total_steps": 17941, "loss": 1.7143, "learning_rate": 9.83694414048635e-05, "epoch": 0.09687308399754752, "percentage": 9.69, "elapsed_time": "4:06:57", "remaining_time": "1 day, 14:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1739, "total_steps": 17941, "loss": 1.7708, "learning_rate": 9.83671852305843e-05, "epoch": 0.09692882225071066, "percentage": 9.69, "elapsed_time": "4:07:05", "remaining_time": "1 day, 14:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1740, "total_steps": 17941, "loss": 1.8367, "learning_rate": 9.836492752237998e-05, "epoch": 0.09698456050387382, "percentage": 9.7, "elapsed_time": "4:07:14", "remaining_time": "1 day, 14:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1741, "total_steps": 17941, "loss": 1.6913, "learning_rate": 9.836266828032214e-05, "epoch": 0.09704029875703696, "percentage": 9.7, "elapsed_time": "4:07:22", "remaining_time": "1 day, 14:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1742, "total_steps": 17941, "loss": 1.8108, "learning_rate": 9.836040750448246e-05, "epoch": 0.0970960370102001, "percentage": 9.71, "elapsed_time": "4:07:30", "remaining_time": "1 day, 14:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1743, "total_steps": 17941, "loss": 1.7643, "learning_rate": 9.835814519493258e-05, "epoch": 0.09715177526336324, "percentage": 9.72, "elapsed_time": "4:07:39", "remaining_time": "1 day, 14:21:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1744, "total_steps": 17941, "loss": 1.753, "learning_rate": 9.835588135174432e-05, "epoch": 0.09720751351652639, "percentage": 9.72, "elapsed_time": "4:07:48", "remaining_time": "1 day, 14:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1745, "total_steps": 17941, "loss": 1.9646, "learning_rate": 9.83536159749894e-05, "epoch": 0.09726325176968954, "percentage": 9.73, "elapsed_time": "4:07:56", "remaining_time": "1 day, 14:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1746, "total_steps": 17941, "loss": 1.8053, "learning_rate": 9.835134906473973e-05, "epoch": 0.09731899002285269, "percentage": 9.73, "elapsed_time": "4:08:04", "remaining_time": "1 day, 14:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1747, "total_steps": 17941, "loss": 1.9073, "learning_rate": 9.834908062106716e-05, "epoch": 0.09737472827601583, "percentage": 9.74, "elapsed_time": "4:08:13", "remaining_time": "1 day, 14:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1748, "total_steps": 17941, "loss": 1.8642, "learning_rate": 9.834681064404366e-05, "epoch": 0.09743046652917897, "percentage": 9.74, "elapsed_time": "4:08:21", "remaining_time": "1 day, 14:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1749, "total_steps": 17941, "loss": 1.7084, "learning_rate": 9.83445391337412e-05, "epoch": 0.09748620478234211, "percentage": 9.75, "elapsed_time": "4:08:30", "remaining_time": "1 day, 14:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1750, "total_steps": 17941, "loss": 1.7273, "learning_rate": 9.834226609023183e-05, "epoch": 0.09754194303550527, "percentage": 9.75, "elapsed_time": "4:08:38", "remaining_time": "1 day, 14:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1751, "total_steps": 17941, "loss": 2.3455, "learning_rate": 9.833999151358763e-05, "epoch": 0.09759768128866841, "percentage": 9.76, "elapsed_time": "4:08:47", "remaining_time": "1 day, 14:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1752, "total_steps": 17941, "loss": 1.5965, "learning_rate": 9.833771540388074e-05, "epoch": 0.09765341954183156, "percentage": 9.77, "elapsed_time": "4:08:55", "remaining_time": "1 day, 14:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1753, "total_steps": 17941, "loss": 1.7655, "learning_rate": 9.833543776118334e-05, "epoch": 0.0977091577949947, "percentage": 9.77, "elapsed_time": "4:09:04", "remaining_time": "1 day, 14:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1754, "total_steps": 17941, "loss": 1.6425, "learning_rate": 9.833315858556769e-05, "epoch": 0.09776489604815786, "percentage": 9.78, "elapsed_time": "4:09:12", "remaining_time": "1 day, 14:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1755, "total_steps": 17941, "loss": 1.8848, "learning_rate": 9.833087787710604e-05, "epoch": 0.097820634301321, "percentage": 9.78, "elapsed_time": "4:09:20", "remaining_time": "1 day, 14:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1756, "total_steps": 17941, "loss": 1.6713, "learning_rate": 9.832859563587073e-05, "epoch": 0.09787637255448414, "percentage": 9.79, "elapsed_time": "4:09:29", "remaining_time": "1 day, 14:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1757, "total_steps": 17941, "loss": 1.7833, "learning_rate": 9.832631186193414e-05, "epoch": 0.09793211080764729, "percentage": 9.79, "elapsed_time": "4:09:38", "remaining_time": "1 day, 14:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1758, "total_steps": 17941, "loss": 2.0934, "learning_rate": 9.832402655536869e-05, "epoch": 0.09798784906081043, "percentage": 9.8, "elapsed_time": "4:09:47", "remaining_time": "1 day, 14:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1759, "total_steps": 17941, "loss": 1.6506, "learning_rate": 9.83217397162469e-05, "epoch": 0.09804358731397358, "percentage": 9.8, "elapsed_time": "4:09:55", "remaining_time": "1 day, 14:19:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1760, "total_steps": 17941, "loss": 2.1311, "learning_rate": 9.831945134464123e-05, "epoch": 0.09809932556713673, "percentage": 9.81, "elapsed_time": "4:10:03", "remaining_time": "1 day, 14:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1761, "total_steps": 17941, "loss": 1.7606, "learning_rate": 9.831716144062431e-05, "epoch": 0.09815506382029987, "percentage": 9.82, "elapsed_time": "4:10:12", "remaining_time": "1 day, 14:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1762, "total_steps": 17941, "loss": 1.7404, "learning_rate": 9.831487000426871e-05, "epoch": 0.09821080207346301, "percentage": 9.82, "elapsed_time": "4:10:20", "remaining_time": "1 day, 14:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1763, "total_steps": 17941, "loss": 1.7232, "learning_rate": 9.831257703564715e-05, "epoch": 0.09826654032662617, "percentage": 9.83, "elapsed_time": "4:10:29", "remaining_time": "1 day, 14:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1764, "total_steps": 17941, "loss": 1.8867, "learning_rate": 9.831028253483232e-05, "epoch": 0.09832227857978931, "percentage": 9.83, "elapsed_time": "4:10:37", "remaining_time": "1 day, 14:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1765, "total_steps": 17941, "loss": 1.6442, "learning_rate": 9.8307986501897e-05, "epoch": 0.09837801683295246, "percentage": 9.84, "elapsed_time": "4:10:46", "remaining_time": "1 day, 14:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1766, "total_steps": 17941, "loss": 2.025, "learning_rate": 9.8305688936914e-05, "epoch": 0.0984337550861156, "percentage": 9.84, "elapsed_time": "4:10:54", "remaining_time": "1 day, 14:18:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1767, "total_steps": 17941, "loss": 1.683, "learning_rate": 9.83033898399562e-05, "epoch": 0.09848949333927874, "percentage": 9.85, "elapsed_time": "4:11:03", "remaining_time": "1 day, 14:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1768, "total_steps": 17941, "loss": 2.0356, "learning_rate": 9.830108921109648e-05, "epoch": 0.0985452315924419, "percentage": 9.85, "elapsed_time": "4:11:11", "remaining_time": "1 day, 14:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1769, "total_steps": 17941, "loss": 1.2685, "learning_rate": 9.829878705040784e-05, "epoch": 0.09860096984560504, "percentage": 9.86, "elapsed_time": "4:11:20", "remaining_time": "1 day, 14:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1770, "total_steps": 17941, "loss": 1.5734, "learning_rate": 9.829648335796327e-05, "epoch": 0.09865670809876818, "percentage": 9.87, "elapsed_time": "4:11:28", "remaining_time": "1 day, 14:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1771, "total_steps": 17941, "loss": 1.6253, "learning_rate": 9.829417813383584e-05, "epoch": 0.09871244635193133, "percentage": 9.87, "elapsed_time": "4:11:37", "remaining_time": "1 day, 14:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1772, "total_steps": 17941, "loss": 1.9336, "learning_rate": 9.829187137809865e-05, "epoch": 0.09876818460509447, "percentage": 9.88, "elapsed_time": "4:11:46", "remaining_time": "1 day, 14:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1773, "total_steps": 17941, "loss": 1.6934, "learning_rate": 9.828956309082487e-05, "epoch": 0.09882392285825763, "percentage": 9.88, "elapsed_time": "4:11:55", "remaining_time": "1 day, 14:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1774, "total_steps": 17941, "loss": 1.7357, "learning_rate": 9.828725327208769e-05, "epoch": 0.09887966111142077, "percentage": 9.89, "elapsed_time": "4:12:03", "remaining_time": "1 day, 14:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1775, "total_steps": 17941, "loss": 1.75, "learning_rate": 9.828494192196037e-05, "epoch": 0.09893539936458391, "percentage": 9.89, "elapsed_time": "4:12:12", "remaining_time": "1 day, 14:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1776, "total_steps": 17941, "loss": 1.8905, "learning_rate": 9.828262904051621e-05, "epoch": 0.09899113761774705, "percentage": 9.9, "elapsed_time": "4:12:20", "remaining_time": "1 day, 14:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1777, "total_steps": 17941, "loss": 1.7111, "learning_rate": 9.828031462782858e-05, "epoch": 0.09904687587091021, "percentage": 9.9, "elapsed_time": "4:12:29", "remaining_time": "1 day, 14:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1778, "total_steps": 17941, "loss": 1.7898, "learning_rate": 9.827799868397086e-05, "epoch": 0.09910261412407335, "percentage": 9.91, "elapsed_time": "4:12:37", "remaining_time": "1 day, 14:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1779, "total_steps": 17941, "loss": 1.8621, "learning_rate": 9.827568120901649e-05, "epoch": 0.0991583523772365, "percentage": 9.92, "elapsed_time": "4:12:46", "remaining_time": "1 day, 14:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1780, "total_steps": 17941, "loss": 1.5574, "learning_rate": 9.827336220303898e-05, "epoch": 0.09921409063039964, "percentage": 9.92, "elapsed_time": "4:12:54", "remaining_time": "1 day, 14:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1781, "total_steps": 17941, "loss": 1.7218, "learning_rate": 9.827104166611188e-05, "epoch": 0.09926982888356278, "percentage": 9.93, "elapsed_time": "4:13:03", "remaining_time": "1 day, 14:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1782, "total_steps": 17941, "loss": 1.6587, "learning_rate": 9.826871959830877e-05, "epoch": 0.09932556713672594, "percentage": 9.93, "elapsed_time": "4:13:11", "remaining_time": "1 day, 14:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1783, "total_steps": 17941, "loss": 1.9942, "learning_rate": 9.826639599970331e-05, "epoch": 0.09938130538988908, "percentage": 9.94, "elapsed_time": "4:13:20", "remaining_time": "1 day, 14:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1784, "total_steps": 17941, "loss": 1.7953, "learning_rate": 9.826407087036918e-05, "epoch": 0.09943704364305223, "percentage": 9.94, "elapsed_time": "4:13:29", "remaining_time": "1 day, 14:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1785, "total_steps": 17941, "loss": 1.7257, "learning_rate": 9.82617442103801e-05, "epoch": 0.09949278189621537, "percentage": 9.95, "elapsed_time": "4:13:37", "remaining_time": "1 day, 14:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1786, "total_steps": 17941, "loss": 1.6209, "learning_rate": 9.82594160198099e-05, "epoch": 0.09954852014937852, "percentage": 9.95, "elapsed_time": "4:13:46", "remaining_time": "1 day, 14:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1787, "total_steps": 17941, "loss": 1.7242, "learning_rate": 9.82570862987324e-05, "epoch": 0.09960425840254167, "percentage": 9.96, "elapsed_time": "4:13:54", "remaining_time": "1 day, 14:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1788, "total_steps": 17941, "loss": 1.8402, "learning_rate": 9.825475504722147e-05, "epoch": 0.09965999665570481, "percentage": 9.97, "elapsed_time": "4:14:03", "remaining_time": "1 day, 14:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1789, "total_steps": 17941, "loss": 1.5434, "learning_rate": 9.825242226535106e-05, "epoch": 0.09971573490886795, "percentage": 9.97, "elapsed_time": "4:14:11", "remaining_time": "1 day, 14:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1790, "total_steps": 17941, "loss": 1.8505, "learning_rate": 9.825008795319514e-05, "epoch": 0.0997714731620311, "percentage": 9.98, "elapsed_time": "4:14:20", "remaining_time": "1 day, 14:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1791, "total_steps": 17941, "loss": 1.9345, "learning_rate": 9.824775211082776e-05, "epoch": 0.09982721141519425, "percentage": 9.98, "elapsed_time": "4:14:28", "remaining_time": "1 day, 14:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1792, "total_steps": 17941, "loss": 1.6482, "learning_rate": 9.824541473832298e-05, "epoch": 0.0998829496683574, "percentage": 9.99, "elapsed_time": "4:14:37", "remaining_time": "1 day, 14:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1793, "total_steps": 17941, "loss": 1.6791, "learning_rate": 9.824307583575494e-05, "epoch": 0.09993868792152054, "percentage": 9.99, "elapsed_time": "4:14:46", "remaining_time": "1 day, 14:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1794, "total_steps": 17941, "loss": 1.6764, "learning_rate": 9.82407354031978e-05, "epoch": 0.09999442617468368, "percentage": 10.0, "elapsed_time": "4:14:54", "remaining_time": "1 day, 14:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1795, "total_steps": 17941, "loss": 1.7993, "learning_rate": 9.82383934407258e-05, "epoch": 0.10005016442784682, "percentage": 10.01, "elapsed_time": "4:15:03", "remaining_time": "1 day, 14:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1796, "total_steps": 17941, "loss": 1.9674, "learning_rate": 9.823604994841322e-05, "epoch": 0.10010590268100998, "percentage": 10.01, "elapsed_time": "4:15:11", "remaining_time": "1 day, 14:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1797, "total_steps": 17941, "loss": 1.7585, "learning_rate": 9.823370492633435e-05, "epoch": 0.10016164093417312, "percentage": 10.02, "elapsed_time": "4:15:20", "remaining_time": "1 day, 14:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1798, "total_steps": 17941, "loss": 1.7215, "learning_rate": 9.823135837456362e-05, "epoch": 0.10021737918733627, "percentage": 10.02, "elapsed_time": "4:15:28", "remaining_time": "1 day, 14:13:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1799, "total_steps": 17941, "loss": 1.7812, "learning_rate": 9.822901029317537e-05, "epoch": 0.10027311744049941, "percentage": 10.03, "elapsed_time": "4:15:37", "remaining_time": "1 day, 14:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1800, "total_steps": 17941, "loss": 1.6675, "learning_rate": 9.822666068224412e-05, "epoch": 0.10032885569366257, "percentage": 10.03, "elapsed_time": "4:15:46", "remaining_time": "1 day, 14:13:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1801, "total_steps": 17941, "loss": 1.8071, "learning_rate": 9.822430954184439e-05, "epoch": 0.10038459394682571, "percentage": 10.04, "elapsed_time": "4:15:54", "remaining_time": "1 day, 14:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1802, "total_steps": 17941, "loss": 1.7311, "learning_rate": 9.82219568720507e-05, "epoch": 0.10044033219998885, "percentage": 10.04, "elapsed_time": "4:16:03", "remaining_time": "1 day, 14:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1803, "total_steps": 17941, "loss": 1.8179, "learning_rate": 9.821960267293771e-05, "epoch": 0.100496070453152, "percentage": 10.05, "elapsed_time": "4:16:11", "remaining_time": "1 day, 14:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1804, "total_steps": 17941, "loss": 1.7443, "learning_rate": 9.821724694458006e-05, "epoch": 0.10055180870631514, "percentage": 10.06, "elapsed_time": "4:16:20", "remaining_time": "1 day, 14:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1805, "total_steps": 17941, "loss": 1.8426, "learning_rate": 9.821488968705246e-05, "epoch": 0.1006075469594783, "percentage": 10.06, "elapsed_time": "4:16:28", "remaining_time": "1 day, 14:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1806, "total_steps": 17941, "loss": 1.6857, "learning_rate": 9.821253090042967e-05, "epoch": 0.10066328521264144, "percentage": 10.07, "elapsed_time": "4:16:37", "remaining_time": "1 day, 14:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1807, "total_steps": 17941, "loss": 1.904, "learning_rate": 9.821017058478653e-05, "epoch": 0.10071902346580458, "percentage": 10.07, "elapsed_time": "4:16:45", "remaining_time": "1 day, 14:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1808, "total_steps": 17941, "loss": 1.8538, "learning_rate": 9.820780874019782e-05, "epoch": 0.10077476171896772, "percentage": 10.08, "elapsed_time": "4:16:54", "remaining_time": "1 day, 14:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1809, "total_steps": 17941, "loss": 1.9318, "learning_rate": 9.82054453667385e-05, "epoch": 0.10083049997213088, "percentage": 10.08, "elapsed_time": "4:17:02", "remaining_time": "1 day, 14:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1810, "total_steps": 17941, "loss": 1.6044, "learning_rate": 9.820308046448353e-05, "epoch": 0.10088623822529402, "percentage": 10.09, "elapsed_time": "4:17:10", "remaining_time": "1 day, 14:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1811, "total_steps": 17941, "loss": 1.7234, "learning_rate": 9.820071403350787e-05, "epoch": 0.10094197647845717, "percentage": 10.09, "elapsed_time": "4:17:19", "remaining_time": "1 day, 14:11:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1812, "total_steps": 17941, "loss": 1.7911, "learning_rate": 9.81983460738866e-05, "epoch": 0.10099771473162031, "percentage": 10.1, "elapsed_time": "4:17:27", "remaining_time": "1 day, 14:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1813, "total_steps": 17941, "loss": 1.8147, "learning_rate": 9.819597658569479e-05, "epoch": 0.10105345298478345, "percentage": 10.11, "elapsed_time": "4:17:36", "remaining_time": "1 day, 14:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1814, "total_steps": 17941, "loss": 1.8057, "learning_rate": 9.819360556900763e-05, "epoch": 0.10110919123794661, "percentage": 10.11, "elapsed_time": "4:17:44", "remaining_time": "1 day, 14:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1815, "total_steps": 17941, "loss": 1.7813, "learning_rate": 9.819123302390027e-05, "epoch": 0.10116492949110975, "percentage": 10.12, "elapsed_time": "4:17:53", "remaining_time": "1 day, 14:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1816, "total_steps": 17941, "loss": 1.7398, "learning_rate": 9.818885895044799e-05, "epoch": 0.1012206677442729, "percentage": 10.12, "elapsed_time": "4:18:01", "remaining_time": "1 day, 14:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1817, "total_steps": 17941, "loss": 1.985, "learning_rate": 9.818648334872607e-05, "epoch": 0.10127640599743604, "percentage": 10.13, "elapsed_time": "4:18:09", "remaining_time": "1 day, 14:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1818, "total_steps": 17941, "loss": 1.7932, "learning_rate": 9.818410621880982e-05, "epoch": 0.10133214425059918, "percentage": 10.13, "elapsed_time": "4:18:18", "remaining_time": "1 day, 14:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1819, "total_steps": 17941, "loss": 1.8672, "learning_rate": 9.818172756077466e-05, "epoch": 0.10138788250376234, "percentage": 10.14, "elapsed_time": "4:18:26", "remaining_time": "1 day, 14:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1820, "total_steps": 17941, "loss": 1.4847, "learning_rate": 9.817934737469603e-05, "epoch": 0.10144362075692548, "percentage": 10.14, "elapsed_time": "4:18:35", "remaining_time": "1 day, 14:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1821, "total_steps": 17941, "loss": 1.6301, "learning_rate": 9.81769656606494e-05, "epoch": 0.10149935901008862, "percentage": 10.15, "elapsed_time": "4:18:43", "remaining_time": "1 day, 14:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1822, "total_steps": 17941, "loss": 1.8199, "learning_rate": 9.817458241871032e-05, "epoch": 0.10155509726325176, "percentage": 10.16, "elapsed_time": "4:18:52", "remaining_time": "1 day, 14:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1823, "total_steps": 17941, "loss": 1.7238, "learning_rate": 9.817219764895435e-05, "epoch": 0.10161083551641492, "percentage": 10.16, "elapsed_time": "4:19:00", "remaining_time": "1 day, 14:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1824, "total_steps": 17941, "loss": 1.7099, "learning_rate": 9.816981135145714e-05, "epoch": 0.10166657376957806, "percentage": 10.17, "elapsed_time": "4:19:09", "remaining_time": "1 day, 14:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1825, "total_steps": 17941, "loss": 1.7679, "learning_rate": 9.816742352629437e-05, "epoch": 0.10172231202274121, "percentage": 10.17, "elapsed_time": "4:19:17", "remaining_time": "1 day, 14:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1826, "total_steps": 17941, "loss": 2.0049, "learning_rate": 9.816503417354174e-05, "epoch": 0.10177805027590435, "percentage": 10.18, "elapsed_time": "4:19:26", "remaining_time": "1 day, 14:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1827, "total_steps": 17941, "loss": 1.7042, "learning_rate": 9.816264329327507e-05, "epoch": 0.10183378852906749, "percentage": 10.18, "elapsed_time": "4:19:34", "remaining_time": "1 day, 14:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1828, "total_steps": 17941, "loss": 1.7472, "learning_rate": 9.816025088557015e-05, "epoch": 0.10188952678223065, "percentage": 10.19, "elapsed_time": "4:19:43", "remaining_time": "1 day, 14:09:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1829, "total_steps": 17941, "loss": 1.6525, "learning_rate": 9.815785695050288e-05, "epoch": 0.10194526503539379, "percentage": 10.19, "elapsed_time": "4:19:51", "remaining_time": "1 day, 14:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1830, "total_steps": 17941, "loss": 1.6744, "learning_rate": 9.815546148814915e-05, "epoch": 0.10200100328855694, "percentage": 10.2, "elapsed_time": "4:20:00", "remaining_time": "1 day, 14:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1831, "total_steps": 17941, "loss": 1.6183, "learning_rate": 9.815306449858497e-05, "epoch": 0.10205674154172008, "percentage": 10.21, "elapsed_time": "4:20:08", "remaining_time": "1 day, 14:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1832, "total_steps": 17941, "loss": 1.842, "learning_rate": 9.815066598188631e-05, "epoch": 0.10211247979488323, "percentage": 10.21, "elapsed_time": "4:20:17", "remaining_time": "1 day, 14:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1833, "total_steps": 17941, "loss": 1.6504, "learning_rate": 9.814826593812928e-05, "epoch": 0.10216821804804638, "percentage": 10.22, "elapsed_time": "4:20:25", "remaining_time": "1 day, 14:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1834, "total_steps": 17941, "loss": 1.8817, "learning_rate": 9.814586436738998e-05, "epoch": 0.10222395630120952, "percentage": 10.22, "elapsed_time": "4:20:34", "remaining_time": "1 day, 14:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1835, "total_steps": 17941, "loss": 1.8143, "learning_rate": 9.814346126974455e-05, "epoch": 0.10227969455437266, "percentage": 10.23, "elapsed_time": "4:20:42", "remaining_time": "1 day, 14:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1836, "total_steps": 17941, "loss": 1.8255, "learning_rate": 9.814105664526925e-05, "epoch": 0.1023354328075358, "percentage": 10.23, "elapsed_time": "4:20:51", "remaining_time": "1 day, 14:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1837, "total_steps": 17941, "loss": 1.5754, "learning_rate": 9.81386504940403e-05, "epoch": 0.10239117106069896, "percentage": 10.24, "elapsed_time": "4:20:59", "remaining_time": "1 day, 14:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1838, "total_steps": 17941, "loss": 1.7516, "learning_rate": 9.813624281613403e-05, "epoch": 0.1024469093138621, "percentage": 10.24, "elapsed_time": "4:21:08", "remaining_time": "1 day, 14:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1839, "total_steps": 17941, "loss": 1.7164, "learning_rate": 9.813383361162678e-05, "epoch": 0.10250264756702525, "percentage": 10.25, "elapsed_time": "4:21:17", "remaining_time": "1 day, 14:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1840, "total_steps": 17941, "loss": 1.4974, "learning_rate": 9.813142288059497e-05, "epoch": 0.10255838582018839, "percentage": 10.26, "elapsed_time": "4:21:25", "remaining_time": "1 day, 14:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1841, "total_steps": 17941, "loss": 1.6087, "learning_rate": 9.812901062311507e-05, "epoch": 0.10261412407335155, "percentage": 10.26, "elapsed_time": "4:21:34", "remaining_time": "1 day, 14:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1842, "total_steps": 17941, "loss": 1.734, "learning_rate": 9.812659683926355e-05, "epoch": 0.10266986232651469, "percentage": 10.27, "elapsed_time": "4:21:42", "remaining_time": "1 day, 14:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1843, "total_steps": 17941, "loss": 1.7643, "learning_rate": 9.812418152911697e-05, "epoch": 0.10272560057967783, "percentage": 10.27, "elapsed_time": "4:21:50", "remaining_time": "1 day, 14:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1844, "total_steps": 17941, "loss": 1.7052, "learning_rate": 9.812176469275196e-05, "epoch": 0.10278133883284098, "percentage": 10.28, "elapsed_time": "4:21:59", "remaining_time": "1 day, 14:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1845, "total_steps": 17941, "loss": 1.8478, "learning_rate": 9.811934633024514e-05, "epoch": 0.10283707708600412, "percentage": 10.28, "elapsed_time": "4:22:07", "remaining_time": "1 day, 14:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1846, "total_steps": 17941, "loss": 1.7884, "learning_rate": 9.811692644167318e-05, "epoch": 0.10289281533916728, "percentage": 10.29, "elapsed_time": "4:22:16", "remaining_time": "1 day, 14:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1847, "total_steps": 17941, "loss": 1.7511, "learning_rate": 9.811450502711288e-05, "epoch": 0.10294855359233042, "percentage": 10.29, "elapsed_time": "4:22:24", "remaining_time": "1 day, 14:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1848, "total_steps": 17941, "loss": 1.7348, "learning_rate": 9.8112082086641e-05, "epoch": 0.10300429184549356, "percentage": 10.3, "elapsed_time": "4:22:33", "remaining_time": "1 day, 14:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1849, "total_steps": 17941, "loss": 1.8117, "learning_rate": 9.810965762033439e-05, "epoch": 0.1030600300986567, "percentage": 10.31, "elapsed_time": "4:22:41", "remaining_time": "1 day, 14:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1850, "total_steps": 17941, "loss": 1.6535, "learning_rate": 9.810723162826994e-05, "epoch": 0.10311576835181985, "percentage": 10.31, "elapsed_time": "4:22:50", "remaining_time": "1 day, 14:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1851, "total_steps": 17941, "loss": 1.8094, "learning_rate": 9.810480411052458e-05, "epoch": 0.103171506604983, "percentage": 10.32, "elapsed_time": "4:22:58", "remaining_time": "1 day, 14:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1852, "total_steps": 17941, "loss": 1.8347, "learning_rate": 9.81023750671753e-05, "epoch": 0.10322724485814615, "percentage": 10.32, "elapsed_time": "4:23:07", "remaining_time": "1 day, 14:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1853, "total_steps": 17941, "loss": 1.8038, "learning_rate": 9.809994449829916e-05, "epoch": 0.10328298311130929, "percentage": 10.33, "elapsed_time": "4:23:15", "remaining_time": "1 day, 14:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1854, "total_steps": 17941, "loss": 1.5616, "learning_rate": 9.809751240397321e-05, "epoch": 0.10333872136447243, "percentage": 10.33, "elapsed_time": "4:23:24", "remaining_time": "1 day, 14:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1855, "total_steps": 17941, "loss": 2.0217, "learning_rate": 9.80950787842746e-05, "epoch": 0.10339445961763559, "percentage": 10.34, "elapsed_time": "4:23:32", "remaining_time": "1 day, 14:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1856, "total_steps": 17941, "loss": 1.6151, "learning_rate": 9.809264363928049e-05, "epoch": 0.10345019787079873, "percentage": 10.35, "elapsed_time": "4:23:40", "remaining_time": "1 day, 14:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1857, "total_steps": 17941, "loss": 1.5242, "learning_rate": 9.809020696906815e-05, "epoch": 0.10350593612396188, "percentage": 10.35, "elapsed_time": "4:23:49", "remaining_time": "1 day, 14:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1858, "total_steps": 17941, "loss": 1.6917, "learning_rate": 9.80877687737148e-05, "epoch": 0.10356167437712502, "percentage": 10.36, "elapsed_time": "4:23:57", "remaining_time": "1 day, 14:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1859, "total_steps": 17941, "loss": 1.785, "learning_rate": 9.808532905329781e-05, "epoch": 0.10361741263028816, "percentage": 10.36, "elapsed_time": "4:24:06", "remaining_time": "1 day, 14:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1860, "total_steps": 17941, "loss": 1.8857, "learning_rate": 9.808288780789454e-05, "epoch": 0.10367315088345132, "percentage": 10.37, "elapsed_time": "4:24:14", "remaining_time": "1 day, 14:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1861, "total_steps": 17941, "loss": 1.5768, "learning_rate": 9.80804450375824e-05, "epoch": 0.10372888913661446, "percentage": 10.37, "elapsed_time": "4:24:23", "remaining_time": "1 day, 14:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1862, "total_steps": 17941, "loss": 2.1482, "learning_rate": 9.807800074243888e-05, "epoch": 0.1037846273897776, "percentage": 10.38, "elapsed_time": "4:24:31", "remaining_time": "1 day, 14:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1863, "total_steps": 17941, "loss": 1.6884, "learning_rate": 9.80755549225415e-05, "epoch": 0.10384036564294075, "percentage": 10.38, "elapsed_time": "4:24:39", "remaining_time": "1 day, 14:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1864, "total_steps": 17941, "loss": 1.9665, "learning_rate": 9.807310757796781e-05, "epoch": 0.1038961038961039, "percentage": 10.39, "elapsed_time": "4:24:48", "remaining_time": "1 day, 14:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1865, "total_steps": 17941, "loss": 1.9696, "learning_rate": 9.807065870879544e-05, "epoch": 0.10395184214926705, "percentage": 10.4, "elapsed_time": "4:24:56", "remaining_time": "1 day, 14:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1866, "total_steps": 17941, "loss": 1.6848, "learning_rate": 9.806820831510204e-05, "epoch": 0.10400758040243019, "percentage": 10.4, "elapsed_time": "4:25:05", "remaining_time": "1 day, 14:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1867, "total_steps": 17941, "loss": 1.6808, "learning_rate": 9.806575639696533e-05, "epoch": 0.10406331865559333, "percentage": 10.41, "elapsed_time": "4:25:13", "remaining_time": "1 day, 14:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1868, "total_steps": 17941, "loss": 1.8179, "learning_rate": 9.806330295446307e-05, "epoch": 0.10411905690875647, "percentage": 10.41, "elapsed_time": "4:25:22", "remaining_time": "1 day, 14:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1869, "total_steps": 17941, "loss": 1.5517, "learning_rate": 9.806084798767307e-05, "epoch": 0.10417479516191963, "percentage": 10.42, "elapsed_time": "4:25:30", "remaining_time": "1 day, 14:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1870, "total_steps": 17941, "loss": 1.7125, "learning_rate": 9.805839149667319e-05, "epoch": 0.10423053341508277, "percentage": 10.42, "elapsed_time": "4:25:39", "remaining_time": "1 day, 14:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1871, "total_steps": 17941, "loss": 1.9891, "learning_rate": 9.805593348154131e-05, "epoch": 0.10428627166824592, "percentage": 10.43, "elapsed_time": "4:25:48", "remaining_time": "1 day, 14:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1872, "total_steps": 17941, "loss": 1.779, "learning_rate": 9.805347394235543e-05, "epoch": 0.10434200992140906, "percentage": 10.43, "elapsed_time": "4:25:56", "remaining_time": "1 day, 14:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1873, "total_steps": 17941, "loss": 1.898, "learning_rate": 9.805101287919352e-05, "epoch": 0.1043977481745722, "percentage": 10.44, "elapsed_time": "4:26:04", "remaining_time": "1 day, 14:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1874, "total_steps": 17941, "loss": 1.9422, "learning_rate": 9.804855029213365e-05, "epoch": 0.10445348642773536, "percentage": 10.45, "elapsed_time": "4:26:14", "remaining_time": "1 day, 14:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1875, "total_steps": 17941, "loss": 1.776, "learning_rate": 9.804608618125388e-05, "epoch": 0.1045092246808985, "percentage": 10.45, "elapsed_time": "4:26:22", "remaining_time": "1 day, 14:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1876, "total_steps": 17941, "loss": 1.7196, "learning_rate": 9.804362054663241e-05, "epoch": 0.10456496293406164, "percentage": 10.46, "elapsed_time": "4:26:31", "remaining_time": "1 day, 14:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1877, "total_steps": 17941, "loss": 1.6667, "learning_rate": 9.80411533883474e-05, "epoch": 0.10462070118722479, "percentage": 10.46, "elapsed_time": "4:26:39", "remaining_time": "1 day, 14:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1878, "total_steps": 17941, "loss": 1.8897, "learning_rate": 9.80386847064771e-05, "epoch": 0.10467643944038794, "percentage": 10.47, "elapsed_time": "4:26:48", "remaining_time": "1 day, 14:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1879, "total_steps": 17941, "loss": 1.868, "learning_rate": 9.80362145010998e-05, "epoch": 0.10473217769355109, "percentage": 10.47, "elapsed_time": "4:26:56", "remaining_time": "1 day, 14:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1880, "total_steps": 17941, "loss": 1.7449, "learning_rate": 9.803374277229387e-05, "epoch": 0.10478791594671423, "percentage": 10.48, "elapsed_time": "4:27:05", "remaining_time": "1 day, 14:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1881, "total_steps": 17941, "loss": 1.7454, "learning_rate": 9.803126952013766e-05, "epoch": 0.10484365419987737, "percentage": 10.48, "elapsed_time": "4:27:13", "remaining_time": "1 day, 14:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1882, "total_steps": 17941, "loss": 1.5892, "learning_rate": 9.802879474470964e-05, "epoch": 0.10489939245304052, "percentage": 10.49, "elapsed_time": "4:27:22", "remaining_time": "1 day, 14:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1883, "total_steps": 17941, "loss": 1.608, "learning_rate": 9.802631844608825e-05, "epoch": 0.10495513070620367, "percentage": 10.5, "elapsed_time": "4:27:30", "remaining_time": "1 day, 14:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1884, "total_steps": 17941, "loss": 1.8286, "learning_rate": 9.802384062435206e-05, "epoch": 0.10501086895936682, "percentage": 10.5, "elapsed_time": "4:27:38", "remaining_time": "1 day, 14:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1885, "total_steps": 17941, "loss": 1.7811, "learning_rate": 9.802136127957965e-05, "epoch": 0.10506660721252996, "percentage": 10.51, "elapsed_time": "4:27:47", "remaining_time": "1 day, 14:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1886, "total_steps": 17941, "loss": 2.0036, "learning_rate": 9.801888041184963e-05, "epoch": 0.1051223454656931, "percentage": 10.51, "elapsed_time": "4:27:55", "remaining_time": "1 day, 14:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1887, "total_steps": 17941, "loss": 1.6716, "learning_rate": 9.801639802124071e-05, "epoch": 0.10517808371885626, "percentage": 10.52, "elapsed_time": "4:28:04", "remaining_time": "1 day, 14:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1888, "total_steps": 17941, "loss": 1.6815, "learning_rate": 9.801391410783161e-05, "epoch": 0.1052338219720194, "percentage": 10.52, "elapsed_time": "4:28:13", "remaining_time": "1 day, 14:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1889, "total_steps": 17941, "loss": 1.7429, "learning_rate": 9.801142867170106e-05, "epoch": 0.10528956022518254, "percentage": 10.53, "elapsed_time": "4:28:21", "remaining_time": "1 day, 14:00:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1890, "total_steps": 17941, "loss": 1.8671, "learning_rate": 9.800894171292793e-05, "epoch": 0.10534529847834569, "percentage": 10.53, "elapsed_time": "4:28:30", "remaining_time": "1 day, 14:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1891, "total_steps": 17941, "loss": 1.6347, "learning_rate": 9.80064532315911e-05, "epoch": 0.10540103673150883, "percentage": 10.54, "elapsed_time": "4:28:38", "remaining_time": "1 day, 14:00:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1892, "total_steps": 17941, "loss": 1.601, "learning_rate": 9.800396322776945e-05, "epoch": 0.10545677498467199, "percentage": 10.55, "elapsed_time": "4:28:46", "remaining_time": "1 day, 13:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1893, "total_steps": 17941, "loss": 1.7157, "learning_rate": 9.800147170154199e-05, "epoch": 0.10551251323783513, "percentage": 10.55, "elapsed_time": "4:28:55", "remaining_time": "1 day, 13:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1894, "total_steps": 17941, "loss": 1.7322, "learning_rate": 9.79989786529877e-05, "epoch": 0.10556825149099827, "percentage": 10.56, "elapsed_time": "4:29:04", "remaining_time": "1 day, 13:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1895, "total_steps": 17941, "loss": 2.0407, "learning_rate": 9.799648408218567e-05, "epoch": 0.10562398974416141, "percentage": 10.56, "elapsed_time": "4:29:12", "remaining_time": "1 day, 13:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1896, "total_steps": 17941, "loss": 1.6443, "learning_rate": 9.7993987989215e-05, "epoch": 0.10567972799732456, "percentage": 10.57, "elapsed_time": "4:29:21", "remaining_time": "1 day, 13:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1897, "total_steps": 17941, "loss": 1.6341, "learning_rate": 9.799149037415485e-05, "epoch": 0.10573546625048771, "percentage": 10.57, "elapsed_time": "4:29:30", "remaining_time": "1 day, 13:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1898, "total_steps": 17941, "loss": 1.7532, "learning_rate": 9.798899123708444e-05, "epoch": 0.10579120450365086, "percentage": 10.58, "elapsed_time": "4:29:38", "remaining_time": "1 day, 13:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1899, "total_steps": 17941, "loss": 1.7511, "learning_rate": 9.798649057808302e-05, "epoch": 0.105846942756814, "percentage": 10.58, "elapsed_time": "4:29:47", "remaining_time": "1 day, 13:59:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1900, "total_steps": 17941, "loss": 1.8548, "learning_rate": 9.798398839722991e-05, "epoch": 0.10590268100997714, "percentage": 10.59, "elapsed_time": "4:29:55", "remaining_time": "1 day, 13:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1901, "total_steps": 17941, "loss": 1.7457, "learning_rate": 9.798148469460444e-05, "epoch": 0.1059584192631403, "percentage": 10.6, "elapsed_time": "4:30:03", "remaining_time": "1 day, 13:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1902, "total_steps": 17941, "loss": 1.6342, "learning_rate": 9.797897947028602e-05, "epoch": 0.10601415751630344, "percentage": 10.6, "elapsed_time": "4:30:12", "remaining_time": "1 day, 13:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1903, "total_steps": 17941, "loss": 1.6272, "learning_rate": 9.797647272435413e-05, "epoch": 0.10606989576946659, "percentage": 10.61, "elapsed_time": "4:30:20", "remaining_time": "1 day, 13:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1904, "total_steps": 17941, "loss": 1.6666, "learning_rate": 9.797396445688825e-05, "epoch": 0.10612563402262973, "percentage": 10.61, "elapsed_time": "4:30:29", "remaining_time": "1 day, 13:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1905, "total_steps": 17941, "loss": 1.7214, "learning_rate": 9.797145466796791e-05, "epoch": 0.10618137227579287, "percentage": 10.62, "elapsed_time": "4:30:37", "remaining_time": "1 day, 13:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1906, "total_steps": 17941, "loss": 1.7156, "learning_rate": 9.796894335767272e-05, "epoch": 0.10623711052895603, "percentage": 10.62, "elapsed_time": "4:30:46", "remaining_time": "1 day, 13:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1907, "total_steps": 17941, "loss": 1.7284, "learning_rate": 9.796643052608232e-05, "epoch": 0.10629284878211917, "percentage": 10.63, "elapsed_time": "4:30:54", "remaining_time": "1 day, 13:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1908, "total_steps": 17941, "loss": 1.514, "learning_rate": 9.796391617327643e-05, "epoch": 0.10634858703528231, "percentage": 10.63, "elapsed_time": "4:31:03", "remaining_time": "1 day, 13:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1909, "total_steps": 17941, "loss": 1.9562, "learning_rate": 9.796140029933474e-05, "epoch": 0.10640432528844546, "percentage": 10.64, "elapsed_time": "4:31:12", "remaining_time": "1 day, 13:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1910, "total_steps": 17941, "loss": 1.8475, "learning_rate": 9.795888290433708e-05, "epoch": 0.10646006354160861, "percentage": 10.65, "elapsed_time": "4:31:20", "remaining_time": "1 day, 13:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1911, "total_steps": 17941, "loss": 1.4198, "learning_rate": 9.795636398836328e-05, "epoch": 0.10651580179477176, "percentage": 10.65, "elapsed_time": "4:31:29", "remaining_time": "1 day, 13:57:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1912, "total_steps": 17941, "loss": 1.7098, "learning_rate": 9.795384355149321e-05, "epoch": 0.1065715400479349, "percentage": 10.66, "elapsed_time": "4:31:37", "remaining_time": "1 day, 13:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1913, "total_steps": 17941, "loss": 1.8379, "learning_rate": 9.795132159380683e-05, "epoch": 0.10662727830109804, "percentage": 10.66, "elapsed_time": "4:31:46", "remaining_time": "1 day, 13:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1914, "total_steps": 17941, "loss": 1.8069, "learning_rate": 9.794879811538409e-05, "epoch": 0.10668301655426118, "percentage": 10.67, "elapsed_time": "4:31:55", "remaining_time": "1 day, 13:56:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1915, "total_steps": 17941, "loss": 1.9336, "learning_rate": 9.794627311630503e-05, "epoch": 0.10673875480742434, "percentage": 10.67, "elapsed_time": "4:32:03", "remaining_time": "1 day, 13:56:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1916, "total_steps": 17941, "loss": 1.8024, "learning_rate": 9.794374659664975e-05, "epoch": 0.10679449306058748, "percentage": 10.68, "elapsed_time": "4:32:11", "remaining_time": "1 day, 13:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1917, "total_steps": 17941, "loss": 1.6553, "learning_rate": 9.794121855649834e-05, "epoch": 0.10685023131375063, "percentage": 10.69, "elapsed_time": "4:32:20", "remaining_time": "1 day, 13:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1918, "total_steps": 17941, "loss": 1.6452, "learning_rate": 9.793868899593101e-05, "epoch": 0.10690596956691377, "percentage": 10.69, "elapsed_time": "4:32:28", "remaining_time": "1 day, 13:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1919, "total_steps": 17941, "loss": 1.5787, "learning_rate": 9.793615791502794e-05, "epoch": 0.10696170782007691, "percentage": 10.7, "elapsed_time": "4:32:37", "remaining_time": "1 day, 13:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1920, "total_steps": 17941, "loss": 1.7273, "learning_rate": 9.793362531386946e-05, "epoch": 0.10701744607324007, "percentage": 10.7, "elapsed_time": "4:32:45", "remaining_time": "1 day, 13:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1921, "total_steps": 17941, "loss": 1.7061, "learning_rate": 9.793109119253584e-05, "epoch": 0.10707318432640321, "percentage": 10.71, "elapsed_time": "4:32:54", "remaining_time": "1 day, 13:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1922, "total_steps": 17941, "loss": 1.6418, "learning_rate": 9.792855555110747e-05, "epoch": 0.10712892257956635, "percentage": 10.71, "elapsed_time": "4:33:02", "remaining_time": "1 day, 13:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1923, "total_steps": 17941, "loss": 1.8774, "learning_rate": 9.792601838966477e-05, "epoch": 0.1071846608327295, "percentage": 10.72, "elapsed_time": "4:33:11", "remaining_time": "1 day, 13:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1924, "total_steps": 17941, "loss": 1.8705, "learning_rate": 9.792347970828819e-05, "epoch": 0.10724039908589265, "percentage": 10.72, "elapsed_time": "4:33:19", "remaining_time": "1 day, 13:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1925, "total_steps": 17941, "loss": 1.6882, "learning_rate": 9.792093950705824e-05, "epoch": 0.1072961373390558, "percentage": 10.73, "elapsed_time": "4:33:28", "remaining_time": "1 day, 13:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1926, "total_steps": 17941, "loss": 1.993, "learning_rate": 9.79183977860555e-05, "epoch": 0.10735187559221894, "percentage": 10.74, "elapsed_time": "4:33:36", "remaining_time": "1 day, 13:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1927, "total_steps": 17941, "loss": 1.7984, "learning_rate": 9.791585454536054e-05, "epoch": 0.10740761384538208, "percentage": 10.74, "elapsed_time": "4:33:44", "remaining_time": "1 day, 13:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1928, "total_steps": 17941, "loss": 1.781, "learning_rate": 9.791330978505406e-05, "epoch": 0.10746335209854523, "percentage": 10.75, "elapsed_time": "4:33:53", "remaining_time": "1 day, 13:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1929, "total_steps": 17941, "loss": 1.8367, "learning_rate": 9.791076350521675e-05, "epoch": 0.10751909035170838, "percentage": 10.75, "elapsed_time": "4:34:01", "remaining_time": "1 day, 13:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1930, "total_steps": 17941, "loss": 1.9812, "learning_rate": 9.790821570592937e-05, "epoch": 0.10757482860487153, "percentage": 10.76, "elapsed_time": "4:34:10", "remaining_time": "1 day, 13:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1931, "total_steps": 17941, "loss": 1.9631, "learning_rate": 9.790566638727268e-05, "epoch": 0.10763056685803467, "percentage": 10.76, "elapsed_time": "4:34:18", "remaining_time": "1 day, 13:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1932, "total_steps": 17941, "loss": 1.6961, "learning_rate": 9.790311554932758e-05, "epoch": 0.10768630511119781, "percentage": 10.77, "elapsed_time": "4:34:27", "remaining_time": "1 day, 13:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1933, "total_steps": 17941, "loss": 1.4829, "learning_rate": 9.790056319217495e-05, "epoch": 0.10774204336436097, "percentage": 10.77, "elapsed_time": "4:34:35", "remaining_time": "1 day, 13:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1934, "total_steps": 17941, "loss": 1.7646, "learning_rate": 9.789800931589574e-05, "epoch": 0.10779778161752411, "percentage": 10.78, "elapsed_time": "4:34:44", "remaining_time": "1 day, 13:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1935, "total_steps": 17941, "loss": 1.6985, "learning_rate": 9.789545392057093e-05, "epoch": 0.10785351987068725, "percentage": 10.79, "elapsed_time": "4:34:52", "remaining_time": "1 day, 13:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1936, "total_steps": 17941, "loss": 1.6734, "learning_rate": 9.789289700628158e-05, "epoch": 0.1079092581238504, "percentage": 10.79, "elapsed_time": "4:35:02", "remaining_time": "1 day, 13:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1937, "total_steps": 17941, "loss": 1.8051, "learning_rate": 9.789033857310876e-05, "epoch": 0.10796499637701354, "percentage": 10.8, "elapsed_time": "4:35:10", "remaining_time": "1 day, 13:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1938, "total_steps": 17941, "loss": 1.7073, "learning_rate": 9.788777862113363e-05, "epoch": 0.1080207346301767, "percentage": 10.8, "elapsed_time": "4:35:19", "remaining_time": "1 day, 13:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1939, "total_steps": 17941, "loss": 1.6106, "learning_rate": 9.788521715043736e-05, "epoch": 0.10807647288333984, "percentage": 10.81, "elapsed_time": "4:35:27", "remaining_time": "1 day, 13:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1940, "total_steps": 17941, "loss": 1.9005, "learning_rate": 9.78826541611012e-05, "epoch": 0.10813221113650298, "percentage": 10.81, "elapsed_time": "4:35:36", "remaining_time": "1 day, 13:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1941, "total_steps": 17941, "loss": 1.6169, "learning_rate": 9.788008965320643e-05, "epoch": 0.10818794938966612, "percentage": 10.82, "elapsed_time": "4:35:44", "remaining_time": "1 day, 13:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1942, "total_steps": 17941, "loss": 1.6712, "learning_rate": 9.787752362683438e-05, "epoch": 0.10824368764282927, "percentage": 10.82, "elapsed_time": "4:35:52", "remaining_time": "1 day, 13:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1943, "total_steps": 17941, "loss": 1.6697, "learning_rate": 9.78749560820664e-05, "epoch": 0.10829942589599242, "percentage": 10.83, "elapsed_time": "4:36:02", "remaining_time": "1 day, 13:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1944, "total_steps": 17941, "loss": 1.6955, "learning_rate": 9.787238701898397e-05, "epoch": 0.10835516414915557, "percentage": 10.84, "elapsed_time": "4:36:10", "remaining_time": "1 day, 13:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1945, "total_steps": 17941, "loss": 1.695, "learning_rate": 9.786981643766852e-05, "epoch": 0.10841090240231871, "percentage": 10.84, "elapsed_time": "4:36:19", "remaining_time": "1 day, 13:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1946, "total_steps": 17941, "loss": 1.8205, "learning_rate": 9.78672443382016e-05, "epoch": 0.10846664065548185, "percentage": 10.85, "elapsed_time": "4:36:27", "remaining_time": "1 day, 13:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1947, "total_steps": 17941, "loss": 1.7815, "learning_rate": 9.786467072066478e-05, "epoch": 0.10852237890864501, "percentage": 10.85, "elapsed_time": "4:36:35", "remaining_time": "1 day, 13:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1948, "total_steps": 17941, "loss": 2.0612, "learning_rate": 9.786209558513968e-05, "epoch": 0.10857811716180815, "percentage": 10.86, "elapsed_time": "4:36:44", "remaining_time": "1 day, 13:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1949, "total_steps": 17941, "loss": 1.8648, "learning_rate": 9.785951893170795e-05, "epoch": 0.1086338554149713, "percentage": 10.86, "elapsed_time": "4:36:52", "remaining_time": "1 day, 13:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1950, "total_steps": 17941, "loss": 1.7291, "learning_rate": 9.785694076045133e-05, "epoch": 0.10868959366813444, "percentage": 10.87, "elapsed_time": "4:37:01", "remaining_time": "1 day, 13:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1951, "total_steps": 17941, "loss": 1.9079, "learning_rate": 9.785436107145156e-05, "epoch": 0.10874533192129758, "percentage": 10.87, "elapsed_time": "4:37:09", "remaining_time": "1 day, 13:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1952, "total_steps": 17941, "loss": 1.888, "learning_rate": 9.785177986479048e-05, "epoch": 0.10880107017446074, "percentage": 10.88, "elapsed_time": "4:37:18", "remaining_time": "1 day, 13:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1953, "total_steps": 17941, "loss": 1.7309, "learning_rate": 9.784919714054993e-05, "epoch": 0.10885680842762388, "percentage": 10.89, "elapsed_time": "4:37:26", "remaining_time": "1 day, 13:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1954, "total_steps": 17941, "loss": 1.7366, "learning_rate": 9.784661289881183e-05, "epoch": 0.10891254668078702, "percentage": 10.89, "elapsed_time": "4:37:35", "remaining_time": "1 day, 13:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1955, "total_steps": 17941, "loss": 1.6749, "learning_rate": 9.784402713965815e-05, "epoch": 0.10896828493395017, "percentage": 10.9, "elapsed_time": "4:37:43", "remaining_time": "1 day, 13:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1956, "total_steps": 17941, "loss": 1.8123, "learning_rate": 9.784143986317084e-05, "epoch": 0.10902402318711332, "percentage": 10.9, "elapsed_time": "4:37:52", "remaining_time": "1 day, 13:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1957, "total_steps": 17941, "loss": 1.5919, "learning_rate": 9.783885106943203e-05, "epoch": 0.10907976144027647, "percentage": 10.91, "elapsed_time": "4:38:00", "remaining_time": "1 day, 13:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1958, "total_steps": 17941, "loss": 1.8938, "learning_rate": 9.783626075852377e-05, "epoch": 0.10913549969343961, "percentage": 10.91, "elapsed_time": "4:38:09", "remaining_time": "1 day, 13:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1959, "total_steps": 17941, "loss": 1.6972, "learning_rate": 9.783366893052822e-05, "epoch": 0.10919123794660275, "percentage": 10.92, "elapsed_time": "4:38:17", "remaining_time": "1 day, 13:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1960, "total_steps": 17941, "loss": 1.5967, "learning_rate": 9.783107558552759e-05, "epoch": 0.1092469761997659, "percentage": 10.92, "elapsed_time": "4:38:25", "remaining_time": "1 day, 13:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1961, "total_steps": 17941, "loss": 1.4359, "learning_rate": 9.782848072360411e-05, "epoch": 0.10930271445292905, "percentage": 10.93, "elapsed_time": "4:38:34", "remaining_time": "1 day, 13:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1962, "total_steps": 17941, "loss": 1.8727, "learning_rate": 9.782588434484008e-05, "epoch": 0.1093584527060922, "percentage": 10.94, "elapsed_time": "4:38:43", "remaining_time": "1 day, 13:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1963, "total_steps": 17941, "loss": 1.6863, "learning_rate": 9.782328644931784e-05, "epoch": 0.10941419095925534, "percentage": 10.94, "elapsed_time": "4:38:51", "remaining_time": "1 day, 13:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1964, "total_steps": 17941, "loss": 1.8686, "learning_rate": 9.782068703711979e-05, "epoch": 0.10946992921241848, "percentage": 10.95, "elapsed_time": "4:38:59", "remaining_time": "1 day, 13:49:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1965, "total_steps": 17941, "loss": 1.8671, "learning_rate": 9.781808610832837e-05, "epoch": 0.10952566746558162, "percentage": 10.95, "elapsed_time": "4:39:08", "remaining_time": "1 day, 13:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1966, "total_steps": 17941, "loss": 1.855, "learning_rate": 9.781548366302604e-05, "epoch": 0.10958140571874478, "percentage": 10.96, "elapsed_time": "4:39:16", "remaining_time": "1 day, 13:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1967, "total_steps": 17941, "loss": 1.8296, "learning_rate": 9.781287970129536e-05, "epoch": 0.10963714397190792, "percentage": 10.96, "elapsed_time": "4:39:25", "remaining_time": "1 day, 13:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1968, "total_steps": 17941, "loss": 1.6181, "learning_rate": 9.781027422321891e-05, "epoch": 0.10969288222507106, "percentage": 10.97, "elapsed_time": "4:39:33", "remaining_time": "1 day, 13:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1969, "total_steps": 17941, "loss": 1.8194, "learning_rate": 9.78076672288793e-05, "epoch": 0.10974862047823421, "percentage": 10.97, "elapsed_time": "4:39:43", "remaining_time": "1 day, 13:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1970, "total_steps": 17941, "loss": 1.857, "learning_rate": 9.780505871835924e-05, "epoch": 0.10980435873139736, "percentage": 10.98, "elapsed_time": "4:39:51", "remaining_time": "1 day, 13:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1971, "total_steps": 17941, "loss": 1.5722, "learning_rate": 9.780244869174142e-05, "epoch": 0.1098600969845605, "percentage": 10.99, "elapsed_time": "4:39:59", "remaining_time": "1 day, 13:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1972, "total_steps": 17941, "loss": 1.7926, "learning_rate": 9.779983714910865e-05, "epoch": 0.10991583523772365, "percentage": 10.99, "elapsed_time": "4:40:08", "remaining_time": "1 day, 13:48:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1973, "total_steps": 17941, "loss": 1.9054, "learning_rate": 9.779722409054374e-05, "epoch": 0.10997157349088679, "percentage": 11.0, "elapsed_time": "4:40:16", "remaining_time": "1 day, 13:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1974, "total_steps": 17941, "loss": 1.5573, "learning_rate": 9.779460951612955e-05, "epoch": 0.11002731174404994, "percentage": 11.0, "elapsed_time": "4:40:25", "remaining_time": "1 day, 13:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1975, "total_steps": 17941, "loss": 2.0516, "learning_rate": 9.779199342594902e-05, "epoch": 0.11008304999721309, "percentage": 11.01, "elapsed_time": "4:40:33", "remaining_time": "1 day, 13:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1976, "total_steps": 17941, "loss": 1.7119, "learning_rate": 9.778937582008509e-05, "epoch": 0.11013878825037623, "percentage": 11.01, "elapsed_time": "4:40:42", "remaining_time": "1 day, 13:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1977, "total_steps": 17941, "loss": 1.6784, "learning_rate": 9.77867566986208e-05, "epoch": 0.11019452650353938, "percentage": 11.02, "elapsed_time": "4:40:50", "remaining_time": "1 day, 13:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1978, "total_steps": 17941, "loss": 1.4993, "learning_rate": 9.77841360616392e-05, "epoch": 0.11025026475670252, "percentage": 11.03, "elapsed_time": "4:40:59", "remaining_time": "1 day, 13:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1979, "total_steps": 17941, "loss": 1.8278, "learning_rate": 9.778151390922341e-05, "epoch": 0.11030600300986568, "percentage": 11.03, "elapsed_time": "4:41:07", "remaining_time": "1 day, 13:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1980, "total_steps": 17941, "loss": 1.9032, "learning_rate": 9.777889024145657e-05, "epoch": 0.11036174126302882, "percentage": 11.04, "elapsed_time": "4:41:16", "remaining_time": "1 day, 13:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1981, "total_steps": 17941, "loss": 1.8758, "learning_rate": 9.777626505842193e-05, "epoch": 0.11041747951619196, "percentage": 11.04, "elapsed_time": "4:41:24", "remaining_time": "1 day, 13:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1982, "total_steps": 17941, "loss": 1.8698, "learning_rate": 9.777363836020268e-05, "epoch": 0.1104732177693551, "percentage": 11.05, "elapsed_time": "4:41:33", "remaining_time": "1 day, 13:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1983, "total_steps": 17941, "loss": 1.87, "learning_rate": 9.777101014688219e-05, "epoch": 0.11052895602251825, "percentage": 11.05, "elapsed_time": "4:41:41", "remaining_time": "1 day, 13:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1984, "total_steps": 17941, "loss": 1.9022, "learning_rate": 9.776838041854377e-05, "epoch": 0.1105846942756814, "percentage": 11.06, "elapsed_time": "4:41:50", "remaining_time": "1 day, 13:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1985, "total_steps": 17941, "loss": 2.0603, "learning_rate": 9.776574917527083e-05, "epoch": 0.11064043252884455, "percentage": 11.06, "elapsed_time": "4:41:58", "remaining_time": "1 day, 13:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1986, "total_steps": 17941, "loss": 1.7887, "learning_rate": 9.776311641714683e-05, "epoch": 0.11069617078200769, "percentage": 11.07, "elapsed_time": "4:42:07", "remaining_time": "1 day, 13:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1987, "total_steps": 17941, "loss": 1.7294, "learning_rate": 9.776048214425525e-05, "epoch": 0.11075190903517083, "percentage": 11.08, "elapsed_time": "4:42:15", "remaining_time": "1 day, 13:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1988, "total_steps": 17941, "loss": 1.7357, "learning_rate": 9.775784635667964e-05, "epoch": 0.11080764728833398, "percentage": 11.08, "elapsed_time": "4:42:24", "remaining_time": "1 day, 13:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1989, "total_steps": 17941, "loss": 1.7027, "learning_rate": 9.77552090545036e-05, "epoch": 0.11086338554149713, "percentage": 11.09, "elapsed_time": "4:42:32", "remaining_time": "1 day, 13:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1990, "total_steps": 17941, "loss": 1.9082, "learning_rate": 9.775257023781074e-05, "epoch": 0.11091912379466028, "percentage": 11.09, "elapsed_time": "4:42:41", "remaining_time": "1 day, 13:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1991, "total_steps": 17941, "loss": 1.8572, "learning_rate": 9.774992990668479e-05, "epoch": 0.11097486204782342, "percentage": 11.1, "elapsed_time": "4:42:50", "remaining_time": "1 day, 13:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1992, "total_steps": 17941, "loss": 1.9287, "learning_rate": 9.774728806120945e-05, "epoch": 0.11103060030098656, "percentage": 11.1, "elapsed_time": "4:42:58", "remaining_time": "1 day, 13:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1993, "total_steps": 17941, "loss": 1.6721, "learning_rate": 9.774464470146851e-05, "epoch": 0.11108633855414972, "percentage": 11.11, "elapsed_time": "4:43:06", "remaining_time": "1 day, 13:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1994, "total_steps": 17941, "loss": 1.6999, "learning_rate": 9.774199982754584e-05, "epoch": 0.11114207680731286, "percentage": 11.11, "elapsed_time": "4:43:15", "remaining_time": "1 day, 13:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1995, "total_steps": 17941, "loss": 1.6968, "learning_rate": 9.773935343952527e-05, "epoch": 0.111197815060476, "percentage": 11.12, "elapsed_time": "4:43:24", "remaining_time": "1 day, 13:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1996, "total_steps": 17941, "loss": 1.8122, "learning_rate": 9.773670553749075e-05, "epoch": 0.11125355331363915, "percentage": 11.13, "elapsed_time": "4:43:32", "remaining_time": "1 day, 13:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1997, "total_steps": 17941, "loss": 1.6712, "learning_rate": 9.773405612152626e-05, "epoch": 0.11130929156680229, "percentage": 11.13, "elapsed_time": "4:43:41", "remaining_time": "1 day, 13:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1998, "total_steps": 17941, "loss": 1.8872, "learning_rate": 9.773140519171582e-05, "epoch": 0.11136502981996545, "percentage": 11.14, "elapsed_time": "4:43:49", "remaining_time": "1 day, 13:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1999, "total_steps": 17941, "loss": 1.7659, "learning_rate": 9.77287527481435e-05, "epoch": 0.11142076807312859, "percentage": 11.14, "elapsed_time": "4:43:58", "remaining_time": "1 day, 13:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 17941, "loss": 1.9805, "learning_rate": 9.772609879089341e-05, "epoch": 0.11147650632629173, "percentage": 11.15, "elapsed_time": "4:44:06", "remaining_time": "1 day, 13:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2001, "total_steps": 17941, "loss": 1.7215, "learning_rate": 9.772344332004975e-05, "epoch": 0.11153224457945488, "percentage": 11.15, "elapsed_time": "4:44:14", "remaining_time": "1 day, 13:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2002, "total_steps": 17941, "loss": 1.8071, "learning_rate": 9.77207863356967e-05, "epoch": 0.11158798283261803, "percentage": 11.16, "elapsed_time": "4:44:23", "remaining_time": "1 day, 13:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2003, "total_steps": 17941, "loss": 1.6401, "learning_rate": 9.771812783791854e-05, "epoch": 0.11164372108578118, "percentage": 11.16, "elapsed_time": "4:44:31", "remaining_time": "1 day, 13:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2004, "total_steps": 17941, "loss": 1.7649, "learning_rate": 9.771546782679959e-05, "epoch": 0.11169945933894432, "percentage": 11.17, "elapsed_time": "4:44:40", "remaining_time": "1 day, 13:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2005, "total_steps": 17941, "loss": 1.9245, "learning_rate": 9.771280630242419e-05, "epoch": 0.11175519759210746, "percentage": 11.18, "elapsed_time": "4:44:48", "remaining_time": "1 day, 13:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2006, "total_steps": 17941, "loss": 1.6562, "learning_rate": 9.771014326487675e-05, "epoch": 0.1118109358452706, "percentage": 11.18, "elapsed_time": "4:44:57", "remaining_time": "1 day, 13:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2007, "total_steps": 17941, "loss": 1.8504, "learning_rate": 9.770747871424175e-05, "epoch": 0.11186667409843376, "percentage": 11.19, "elapsed_time": "4:45:05", "remaining_time": "1 day, 13:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2008, "total_steps": 17941, "loss": 1.5858, "learning_rate": 9.770481265060368e-05, "epoch": 0.1119224123515969, "percentage": 11.19, "elapsed_time": "4:45:14", "remaining_time": "1 day, 13:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2009, "total_steps": 17941, "loss": 1.8421, "learning_rate": 9.770214507404709e-05, "epoch": 0.11197815060476005, "percentage": 11.2, "elapsed_time": "4:45:23", "remaining_time": "1 day, 13:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2010, "total_steps": 17941, "loss": 1.7521, "learning_rate": 9.769947598465657e-05, "epoch": 0.11203388885792319, "percentage": 11.2, "elapsed_time": "4:45:31", "remaining_time": "1 day, 13:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2011, "total_steps": 17941, "loss": 1.8359, "learning_rate": 9.76968053825168e-05, "epoch": 0.11208962711108633, "percentage": 11.21, "elapsed_time": "4:45:39", "remaining_time": "1 day, 13:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2012, "total_steps": 17941, "loss": 1.7792, "learning_rate": 9.769413326771243e-05, "epoch": 0.11214536536424949, "percentage": 11.21, "elapsed_time": "4:45:48", "remaining_time": "1 day, 13:42:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2013, "total_steps": 17941, "loss": 1.8502, "learning_rate": 9.769145964032824e-05, "epoch": 0.11220110361741263, "percentage": 11.22, "elapsed_time": "4:45:56", "remaining_time": "1 day, 13:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2014, "total_steps": 17941, "loss": 1.9158, "learning_rate": 9.768878450044902e-05, "epoch": 0.11225684187057577, "percentage": 11.23, "elapsed_time": "4:46:05", "remaining_time": "1 day, 13:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2015, "total_steps": 17941, "loss": 1.5545, "learning_rate": 9.768610784815959e-05, "epoch": 0.11231258012373892, "percentage": 11.23, "elapsed_time": "4:46:13", "remaining_time": "1 day, 13:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2016, "total_steps": 17941, "loss": 1.6679, "learning_rate": 9.768342968354484e-05, "epoch": 0.11236831837690207, "percentage": 11.24, "elapsed_time": "4:46:22", "remaining_time": "1 day, 13:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2017, "total_steps": 17941, "loss": 1.7114, "learning_rate": 9.768075000668974e-05, "epoch": 0.11242405663006522, "percentage": 11.24, "elapsed_time": "4:46:30", "remaining_time": "1 day, 13:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2018, "total_steps": 17941, "loss": 1.8553, "learning_rate": 9.767806881767923e-05, "epoch": 0.11247979488322836, "percentage": 11.25, "elapsed_time": "4:46:38", "remaining_time": "1 day, 13:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2019, "total_steps": 17941, "loss": 1.9799, "learning_rate": 9.767538611659837e-05, "epoch": 0.1125355331363915, "percentage": 11.25, "elapsed_time": "4:46:47", "remaining_time": "1 day, 13:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2020, "total_steps": 17941, "loss": 2.0631, "learning_rate": 9.767270190353221e-05, "epoch": 0.11259127138955465, "percentage": 11.26, "elapsed_time": "4:46:55", "remaining_time": "1 day, 13:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2021, "total_steps": 17941, "loss": 1.8081, "learning_rate": 9.767001617856591e-05, "epoch": 0.1126470096427178, "percentage": 11.26, "elapsed_time": "4:47:04", "remaining_time": "1 day, 13:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2022, "total_steps": 17941, "loss": 1.6224, "learning_rate": 9.766732894178463e-05, "epoch": 0.11270274789588094, "percentage": 11.27, "elapsed_time": "4:47:12", "remaining_time": "1 day, 13:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2023, "total_steps": 17941, "loss": 1.8425, "learning_rate": 9.766464019327359e-05, "epoch": 0.11275848614904409, "percentage": 11.28, "elapsed_time": "4:47:21", "remaining_time": "1 day, 13:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2024, "total_steps": 17941, "loss": 1.8101, "learning_rate": 9.766194993311809e-05, "epoch": 0.11281422440220723, "percentage": 11.28, "elapsed_time": "4:47:29", "remaining_time": "1 day, 13:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2025, "total_steps": 17941, "loss": 1.7461, "learning_rate": 9.76592581614034e-05, "epoch": 0.11286996265537039, "percentage": 11.29, "elapsed_time": "4:47:38", "remaining_time": "1 day, 13:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2026, "total_steps": 17941, "loss": 1.9905, "learning_rate": 9.765656487821492e-05, "epoch": 0.11292570090853353, "percentage": 11.29, "elapsed_time": "4:47:46", "remaining_time": "1 day, 13:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2027, "total_steps": 17941, "loss": 1.7689, "learning_rate": 9.765387008363807e-05, "epoch": 0.11298143916169667, "percentage": 11.3, "elapsed_time": "4:47:54", "remaining_time": "1 day, 13:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2028, "total_steps": 17941, "loss": 1.7994, "learning_rate": 9.76511737777583e-05, "epoch": 0.11303717741485982, "percentage": 11.3, "elapsed_time": "4:48:03", "remaining_time": "1 day, 13:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2029, "total_steps": 17941, "loss": 1.5192, "learning_rate": 9.764847596066111e-05, "epoch": 0.11309291566802296, "percentage": 11.31, "elapsed_time": "4:48:11", "remaining_time": "1 day, 13:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2030, "total_steps": 17941, "loss": 1.5906, "learning_rate": 9.764577663243209e-05, "epoch": 0.11314865392118612, "percentage": 11.31, "elapsed_time": "4:48:20", "remaining_time": "1 day, 13:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2031, "total_steps": 17941, "loss": 1.4503, "learning_rate": 9.764307579315681e-05, "epoch": 0.11320439217434926, "percentage": 11.32, "elapsed_time": "4:48:28", "remaining_time": "1 day, 13:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2032, "total_steps": 17941, "loss": 1.7865, "learning_rate": 9.764037344292096e-05, "epoch": 0.1132601304275124, "percentage": 11.33, "elapsed_time": "4:48:37", "remaining_time": "1 day, 13:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2033, "total_steps": 17941, "loss": 1.6803, "learning_rate": 9.763766958181022e-05, "epoch": 0.11331586868067554, "percentage": 11.33, "elapsed_time": "4:48:45", "remaining_time": "1 day, 13:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2034, "total_steps": 17941, "loss": 1.902, "learning_rate": 9.763496420991037e-05, "epoch": 0.11337160693383869, "percentage": 11.34, "elapsed_time": "4:48:54", "remaining_time": "1 day, 13:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2035, "total_steps": 17941, "loss": 1.7774, "learning_rate": 9.763225732730716e-05, "epoch": 0.11342734518700184, "percentage": 11.34, "elapsed_time": "4:49:02", "remaining_time": "1 day, 13:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2036, "total_steps": 17941, "loss": 1.7369, "learning_rate": 9.762954893408646e-05, "epoch": 0.11348308344016499, "percentage": 11.35, "elapsed_time": "4:49:11", "remaining_time": "1 day, 13:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2037, "total_steps": 17941, "loss": 1.914, "learning_rate": 9.762683903033419e-05, "epoch": 0.11353882169332813, "percentage": 11.35, "elapsed_time": "4:49:19", "remaining_time": "1 day, 13:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2038, "total_steps": 17941, "loss": 1.8155, "learning_rate": 9.762412761613624e-05, "epoch": 0.11359455994649127, "percentage": 11.36, "elapsed_time": "4:49:28", "remaining_time": "1 day, 13:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2039, "total_steps": 17941, "loss": 1.6183, "learning_rate": 9.762141469157865e-05, "epoch": 0.11365029819965443, "percentage": 11.37, "elapsed_time": "4:49:36", "remaining_time": "1 day, 13:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2040, "total_steps": 17941, "loss": 1.887, "learning_rate": 9.761870025674743e-05, "epoch": 0.11370603645281757, "percentage": 11.37, "elapsed_time": "4:49:45", "remaining_time": "1 day, 13:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2041, "total_steps": 17941, "loss": 1.7928, "learning_rate": 9.761598431172868e-05, "epoch": 0.11376177470598071, "percentage": 11.38, "elapsed_time": "4:49:53", "remaining_time": "1 day, 13:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2042, "total_steps": 17941, "loss": 1.6132, "learning_rate": 9.761326685660852e-05, "epoch": 0.11381751295914386, "percentage": 11.38, "elapsed_time": "4:50:02", "remaining_time": "1 day, 13:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2043, "total_steps": 17941, "loss": 1.4053, "learning_rate": 9.761054789147315e-05, "epoch": 0.113873251212307, "percentage": 11.39, "elapsed_time": "4:50:10", "remaining_time": "1 day, 13:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2044, "total_steps": 17941, "loss": 1.649, "learning_rate": 9.760782741640879e-05, "epoch": 0.11392898946547016, "percentage": 11.39, "elapsed_time": "4:50:19", "remaining_time": "1 day, 13:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2045, "total_steps": 17941, "loss": 1.7286, "learning_rate": 9.76051054315017e-05, "epoch": 0.1139847277186333, "percentage": 11.4, "elapsed_time": "4:50:27", "remaining_time": "1 day, 13:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2046, "total_steps": 17941, "loss": 1.7911, "learning_rate": 9.760238193683824e-05, "epoch": 0.11404046597179644, "percentage": 11.4, "elapsed_time": "4:50:36", "remaining_time": "1 day, 13:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2047, "total_steps": 17941, "loss": 1.7731, "learning_rate": 9.759965693250477e-05, "epoch": 0.11409620422495959, "percentage": 11.41, "elapsed_time": "4:50:44", "remaining_time": "1 day, 13:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2048, "total_steps": 17941, "loss": 1.7917, "learning_rate": 9.75969304185877e-05, "epoch": 0.11415194247812274, "percentage": 11.42, "elapsed_time": "4:50:53", "remaining_time": "1 day, 13:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2049, "total_steps": 17941, "loss": 1.7298, "learning_rate": 9.75942023951735e-05, "epoch": 0.11420768073128588, "percentage": 11.42, "elapsed_time": "4:51:01", "remaining_time": "1 day, 13:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2050, "total_steps": 17941, "loss": 1.8422, "learning_rate": 9.75914728623487e-05, "epoch": 0.11426341898444903, "percentage": 11.43, "elapsed_time": "4:51:10", "remaining_time": "1 day, 13:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2051, "total_steps": 17941, "loss": 1.7194, "learning_rate": 9.758874182019986e-05, "epoch": 0.11431915723761217, "percentage": 11.43, "elapsed_time": "4:51:18", "remaining_time": "1 day, 13:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2052, "total_steps": 17941, "loss": 1.782, "learning_rate": 9.758600926881358e-05, "epoch": 0.11437489549077531, "percentage": 11.44, "elapsed_time": "4:51:26", "remaining_time": "1 day, 13:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2053, "total_steps": 17941, "loss": 1.8925, "learning_rate": 9.758327520827654e-05, "epoch": 0.11443063374393847, "percentage": 11.44, "elapsed_time": "4:51:35", "remaining_time": "1 day, 13:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2054, "total_steps": 17941, "loss": 1.5632, "learning_rate": 9.758053963867544e-05, "epoch": 0.11448637199710161, "percentage": 11.45, "elapsed_time": "4:51:43", "remaining_time": "1 day, 13:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2055, "total_steps": 17941, "loss": 2.0612, "learning_rate": 9.757780256009704e-05, "epoch": 0.11454211025026476, "percentage": 11.45, "elapsed_time": "4:51:52", "remaining_time": "1 day, 13:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2056, "total_steps": 17941, "loss": 1.4963, "learning_rate": 9.757506397262814e-05, "epoch": 0.1145978485034279, "percentage": 11.46, "elapsed_time": "4:52:00", "remaining_time": "1 day, 13:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2057, "total_steps": 17941, "loss": 1.7024, "learning_rate": 9.757232387635559e-05, "epoch": 0.11465358675659104, "percentage": 11.47, "elapsed_time": "4:52:09", "remaining_time": "1 day, 13:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2058, "total_steps": 17941, "loss": 1.7356, "learning_rate": 9.75695822713663e-05, "epoch": 0.1147093250097542, "percentage": 11.47, "elapsed_time": "4:52:17", "remaining_time": "1 day, 13:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2059, "total_steps": 17941, "loss": 1.9454, "learning_rate": 9.75668391577472e-05, "epoch": 0.11476506326291734, "percentage": 11.48, "elapsed_time": "4:52:25", "remaining_time": "1 day, 13:35:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2060, "total_steps": 17941, "loss": 1.7741, "learning_rate": 9.756409453558531e-05, "epoch": 0.11482080151608048, "percentage": 11.48, "elapsed_time": "4:52:34", "remaining_time": "1 day, 13:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2061, "total_steps": 17941, "loss": 1.6877, "learning_rate": 9.756134840496763e-05, "epoch": 0.11487653976924363, "percentage": 11.49, "elapsed_time": "4:52:43", "remaining_time": "1 day, 13:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2062, "total_steps": 17941, "loss": 1.8947, "learning_rate": 9.75586007659813e-05, "epoch": 0.11493227802240678, "percentage": 11.49, "elapsed_time": "4:52:51", "remaining_time": "1 day, 13:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2063, "total_steps": 17941, "loss": 1.632, "learning_rate": 9.755585161871344e-05, "epoch": 0.11498801627556993, "percentage": 11.5, "elapsed_time": "4:53:00", "remaining_time": "1 day, 13:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2064, "total_steps": 17941, "loss": 1.8176, "learning_rate": 9.755310096325123e-05, "epoch": 0.11504375452873307, "percentage": 11.5, "elapsed_time": "4:53:09", "remaining_time": "1 day, 13:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2065, "total_steps": 17941, "loss": 1.9844, "learning_rate": 9.755034879968193e-05, "epoch": 0.11509949278189621, "percentage": 11.51, "elapsed_time": "4:53:17", "remaining_time": "1 day, 13:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2066, "total_steps": 17941, "loss": 2.0891, "learning_rate": 9.754759512809277e-05, "epoch": 0.11515523103505935, "percentage": 11.52, "elapsed_time": "4:53:26", "remaining_time": "1 day, 13:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2067, "total_steps": 17941, "loss": 1.7906, "learning_rate": 9.754483994857115e-05, "epoch": 0.11521096928822251, "percentage": 11.52, "elapsed_time": "4:53:34", "remaining_time": "1 day, 13:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2068, "total_steps": 17941, "loss": 1.9245, "learning_rate": 9.75420832612044e-05, "epoch": 0.11526670754138565, "percentage": 11.53, "elapsed_time": "4:53:42", "remaining_time": "1 day, 13:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2069, "total_steps": 17941, "loss": 1.5529, "learning_rate": 9.753932506607995e-05, "epoch": 0.1153224457945488, "percentage": 11.53, "elapsed_time": "4:53:51", "remaining_time": "1 day, 13:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2070, "total_steps": 17941, "loss": 1.7138, "learning_rate": 9.753656536328528e-05, "epoch": 0.11537818404771194, "percentage": 11.54, "elapsed_time": "4:53:59", "remaining_time": "1 day, 13:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2071, "total_steps": 17941, "loss": 1.7991, "learning_rate": 9.753380415290792e-05, "epoch": 0.1154339223008751, "percentage": 11.54, "elapsed_time": "4:54:08", "remaining_time": "1 day, 13:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2072, "total_steps": 17941, "loss": 1.6249, "learning_rate": 9.753104143503544e-05, "epoch": 0.11548966055403824, "percentage": 11.55, "elapsed_time": "4:54:16", "remaining_time": "1 day, 13:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2073, "total_steps": 17941, "loss": 1.7194, "learning_rate": 9.752827720975544e-05, "epoch": 0.11554539880720138, "percentage": 11.55, "elapsed_time": "4:54:25", "remaining_time": "1 day, 13:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2074, "total_steps": 17941, "loss": 1.6221, "learning_rate": 9.75255114771556e-05, "epoch": 0.11560113706036453, "percentage": 11.56, "elapsed_time": "4:54:33", "remaining_time": "1 day, 13:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2075, "total_steps": 17941, "loss": 1.5454, "learning_rate": 9.752274423732364e-05, "epoch": 0.11565687531352767, "percentage": 11.57, "elapsed_time": "4:54:42", "remaining_time": "1 day, 13:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2076, "total_steps": 17941, "loss": 1.8162, "learning_rate": 9.75199754903473e-05, "epoch": 0.11571261356669083, "percentage": 11.57, "elapsed_time": "4:54:50", "remaining_time": "1 day, 13:33:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2077, "total_steps": 17941, "loss": 1.8913, "learning_rate": 9.75172052363144e-05, "epoch": 0.11576835181985397, "percentage": 11.58, "elapsed_time": "4:54:59", "remaining_time": "1 day, 13:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2078, "total_steps": 17941, "loss": 1.6392, "learning_rate": 9.751443347531279e-05, "epoch": 0.11582409007301711, "percentage": 11.58, "elapsed_time": "4:55:07", "remaining_time": "1 day, 13:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2079, "total_steps": 17941, "loss": 1.6481, "learning_rate": 9.751166020743037e-05, "epoch": 0.11587982832618025, "percentage": 11.59, "elapsed_time": "4:55:16", "remaining_time": "1 day, 13:32:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2080, "total_steps": 17941, "loss": 1.7507, "learning_rate": 9.750888543275511e-05, "epoch": 0.1159355665793434, "percentage": 11.59, "elapsed_time": "4:55:24", "remaining_time": "1 day, 13:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2081, "total_steps": 17941, "loss": 1.7667, "learning_rate": 9.750610915137502e-05, "epoch": 0.11599130483250655, "percentage": 11.6, "elapsed_time": "4:55:33", "remaining_time": "1 day, 13:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2082, "total_steps": 17941, "loss": 1.7303, "learning_rate": 9.750333136337811e-05, "epoch": 0.1160470430856697, "percentage": 11.6, "elapsed_time": "4:55:41", "remaining_time": "1 day, 13:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2083, "total_steps": 17941, "loss": 1.9936, "learning_rate": 9.750055206885249e-05, "epoch": 0.11610278133883284, "percentage": 11.61, "elapsed_time": "4:55:50", "remaining_time": "1 day, 13:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2084, "total_steps": 17941, "loss": 1.8642, "learning_rate": 9.74977712678863e-05, "epoch": 0.11615851959199598, "percentage": 11.62, "elapsed_time": "4:55:58", "remaining_time": "1 day, 13:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2085, "total_steps": 17941, "loss": 1.8, "learning_rate": 9.749498896056775e-05, "epoch": 0.11621425784515914, "percentage": 11.62, "elapsed_time": "4:56:06", "remaining_time": "1 day, 13:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2086, "total_steps": 17941, "loss": 1.8553, "learning_rate": 9.749220514698505e-05, "epoch": 0.11626999609832228, "percentage": 11.63, "elapsed_time": "4:56:15", "remaining_time": "1 day, 13:31:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2087, "total_steps": 17941, "loss": 1.5635, "learning_rate": 9.748941982722652e-05, "epoch": 0.11632573435148542, "percentage": 11.63, "elapsed_time": "4:56:23", "remaining_time": "1 day, 13:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2088, "total_steps": 17941, "loss": 2.0887, "learning_rate": 9.748663300138046e-05, "epoch": 0.11638147260464857, "percentage": 11.64, "elapsed_time": "4:56:32", "remaining_time": "1 day, 13:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2089, "total_steps": 17941, "loss": 1.7254, "learning_rate": 9.748384466953529e-05, "epoch": 0.11643721085781171, "percentage": 11.64, "elapsed_time": "4:56:40", "remaining_time": "1 day, 13:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2090, "total_steps": 17941, "loss": 2.0895, "learning_rate": 9.748105483177939e-05, "epoch": 0.11649294911097487, "percentage": 11.65, "elapsed_time": "4:56:49", "remaining_time": "1 day, 13:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2091, "total_steps": 17941, "loss": 1.6339, "learning_rate": 9.747826348820129e-05, "epoch": 0.11654868736413801, "percentage": 11.65, "elapsed_time": "4:56:57", "remaining_time": "1 day, 13:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2092, "total_steps": 17941, "loss": 1.8714, "learning_rate": 9.747547063888947e-05, "epoch": 0.11660442561730115, "percentage": 11.66, "elapsed_time": "4:57:06", "remaining_time": "1 day, 13:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2093, "total_steps": 17941, "loss": 1.8269, "learning_rate": 9.747267628393252e-05, "epoch": 0.1166601638704643, "percentage": 11.67, "elapsed_time": "4:57:14", "remaining_time": "1 day, 13:30:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2094, "total_steps": 17941, "loss": 1.7604, "learning_rate": 9.746988042341906e-05, "epoch": 0.11671590212362745, "percentage": 11.67, "elapsed_time": "4:57:23", "remaining_time": "1 day, 13:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2095, "total_steps": 17941, "loss": 2.2348, "learning_rate": 9.746708305743778e-05, "epoch": 0.1167716403767906, "percentage": 11.68, "elapsed_time": "4:57:31", "remaining_time": "1 day, 13:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2096, "total_steps": 17941, "loss": 1.811, "learning_rate": 9.746428418607737e-05, "epoch": 0.11682737862995374, "percentage": 11.68, "elapsed_time": "4:57:40", "remaining_time": "1 day, 13:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2097, "total_steps": 17941, "loss": 1.7822, "learning_rate": 9.746148380942661e-05, "epoch": 0.11688311688311688, "percentage": 11.69, "elapsed_time": "4:57:48", "remaining_time": "1 day, 13:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2098, "total_steps": 17941, "loss": 1.815, "learning_rate": 9.745868192757429e-05, "epoch": 0.11693885513628002, "percentage": 11.69, "elapsed_time": "4:57:56", "remaining_time": "1 day, 13:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2099, "total_steps": 17941, "loss": 1.6799, "learning_rate": 9.745587854060929e-05, "epoch": 0.11699459338944318, "percentage": 11.7, "elapsed_time": "4:58:05", "remaining_time": "1 day, 13:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2100, "total_steps": 17941, "loss": 1.3444, "learning_rate": 9.74530736486205e-05, "epoch": 0.11705033164260632, "percentage": 11.71, "elapsed_time": "4:58:13", "remaining_time": "1 day, 13:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2101, "total_steps": 17941, "loss": 1.6343, "learning_rate": 9.74502672516969e-05, "epoch": 0.11710606989576947, "percentage": 11.71, "elapsed_time": "4:58:22", "remaining_time": "1 day, 13:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2102, "total_steps": 17941, "loss": 1.8732, "learning_rate": 9.744745934992747e-05, "epoch": 0.11716180814893261, "percentage": 11.72, "elapsed_time": "4:58:31", "remaining_time": "1 day, 13:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2103, "total_steps": 17941, "loss": 1.823, "learning_rate": 9.744464994340126e-05, "epoch": 0.11721754640209577, "percentage": 11.72, "elapsed_time": "4:58:40", "remaining_time": "1 day, 13:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2104, "total_steps": 17941, "loss": 1.6152, "learning_rate": 9.744183903220738e-05, "epoch": 0.11727328465525891, "percentage": 11.73, "elapsed_time": "4:58:48", "remaining_time": "1 day, 13:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2105, "total_steps": 17941, "loss": 1.8159, "learning_rate": 9.743902661643498e-05, "epoch": 0.11732902290842205, "percentage": 11.73, "elapsed_time": "4:58:57", "remaining_time": "1 day, 13:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2106, "total_steps": 17941, "loss": 2.0891, "learning_rate": 9.743621269617324e-05, "epoch": 0.1173847611615852, "percentage": 11.74, "elapsed_time": "4:59:05", "remaining_time": "1 day, 13:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2107, "total_steps": 17941, "loss": 1.6851, "learning_rate": 9.74333972715114e-05, "epoch": 0.11744049941474834, "percentage": 11.74, "elapsed_time": "4:59:13", "remaining_time": "1 day, 13:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2108, "total_steps": 17941, "loss": 1.7487, "learning_rate": 9.743058034253876e-05, "epoch": 0.1174962376679115, "percentage": 11.75, "elapsed_time": "4:59:22", "remaining_time": "1 day, 13:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2109, "total_steps": 17941, "loss": 1.7077, "learning_rate": 9.742776190934464e-05, "epoch": 0.11755197592107464, "percentage": 11.76, "elapsed_time": "4:59:30", "remaining_time": "1 day, 13:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2110, "total_steps": 17941, "loss": 1.7193, "learning_rate": 9.742494197201845e-05, "epoch": 0.11760771417423778, "percentage": 11.76, "elapsed_time": "4:59:39", "remaining_time": "1 day, 13:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2111, "total_steps": 17941, "loss": 1.8341, "learning_rate": 9.742212053064959e-05, "epoch": 0.11766345242740092, "percentage": 11.77, "elapsed_time": "4:59:47", "remaining_time": "1 day, 13:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2112, "total_steps": 17941, "loss": 1.7452, "learning_rate": 9.741929758532758e-05, "epoch": 0.11771919068056406, "percentage": 11.77, "elapsed_time": "4:59:56", "remaining_time": "1 day, 13:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2113, "total_steps": 17941, "loss": 1.7242, "learning_rate": 9.741647313614191e-05, "epoch": 0.11777492893372722, "percentage": 11.78, "elapsed_time": "5:00:04", "remaining_time": "1 day, 13:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2114, "total_steps": 17941, "loss": 1.7484, "learning_rate": 9.741364718318216e-05, "epoch": 0.11783066718689036, "percentage": 11.78, "elapsed_time": "5:00:13", "remaining_time": "1 day, 13:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2115, "total_steps": 17941, "loss": 1.8975, "learning_rate": 9.741081972653798e-05, "epoch": 0.11788640544005351, "percentage": 11.79, "elapsed_time": "5:00:21", "remaining_time": "1 day, 13:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2116, "total_steps": 17941, "loss": 1.7848, "learning_rate": 9.740799076629902e-05, "epoch": 0.11794214369321665, "percentage": 11.79, "elapsed_time": "5:00:30", "remaining_time": "1 day, 13:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2117, "total_steps": 17941, "loss": 1.7087, "learning_rate": 9.7405160302555e-05, "epoch": 0.1179978819463798, "percentage": 11.8, "elapsed_time": "5:00:38", "remaining_time": "1 day, 13:27:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2118, "total_steps": 17941, "loss": 1.712, "learning_rate": 9.740232833539567e-05, "epoch": 0.11805362019954295, "percentage": 11.81, "elapsed_time": "5:00:47", "remaining_time": "1 day, 13:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2119, "total_steps": 17941, "loss": 1.6682, "learning_rate": 9.739949486491088e-05, "epoch": 0.11810935845270609, "percentage": 11.81, "elapsed_time": "5:00:56", "remaining_time": "1 day, 13:27:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2120, "total_steps": 17941, "loss": 1.7035, "learning_rate": 9.739665989119047e-05, "epoch": 0.11816509670586924, "percentage": 11.82, "elapsed_time": "5:01:04", "remaining_time": "1 day, 13:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2121, "total_steps": 17941, "loss": 1.6535, "learning_rate": 9.739382341432434e-05, "epoch": 0.11822083495903238, "percentage": 11.82, "elapsed_time": "5:01:13", "remaining_time": "1 day, 13:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2122, "total_steps": 17941, "loss": 1.9483, "learning_rate": 9.739098543440246e-05, "epoch": 0.11827657321219553, "percentage": 11.83, "elapsed_time": "5:01:21", "remaining_time": "1 day, 13:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2123, "total_steps": 17941, "loss": 1.6287, "learning_rate": 9.738814595151481e-05, "epoch": 0.11833231146535868, "percentage": 11.83, "elapsed_time": "5:01:29", "remaining_time": "1 day, 13:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2124, "total_steps": 17941, "loss": 1.8991, "learning_rate": 9.73853049657515e-05, "epoch": 0.11838804971852182, "percentage": 11.84, "elapsed_time": "5:01:38", "remaining_time": "1 day, 13:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2125, "total_steps": 17941, "loss": 1.7004, "learning_rate": 9.738246247720257e-05, "epoch": 0.11844378797168496, "percentage": 11.84, "elapsed_time": "5:01:46", "remaining_time": "1 day, 13:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2126, "total_steps": 17941, "loss": 1.8126, "learning_rate": 9.73796184859582e-05, "epoch": 0.11849952622484812, "percentage": 11.85, "elapsed_time": "5:01:55", "remaining_time": "1 day, 13:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2127, "total_steps": 17941, "loss": 1.6761, "learning_rate": 9.737677299210857e-05, "epoch": 0.11855526447801126, "percentage": 11.86, "elapsed_time": "5:02:03", "remaining_time": "1 day, 13:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2128, "total_steps": 17941, "loss": 1.6405, "learning_rate": 9.737392599574391e-05, "epoch": 0.1186110027311744, "percentage": 11.86, "elapsed_time": "5:02:12", "remaining_time": "1 day, 13:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2129, "total_steps": 17941, "loss": 1.8458, "learning_rate": 9.737107749695456e-05, "epoch": 0.11866674098433755, "percentage": 11.87, "elapsed_time": "5:02:21", "remaining_time": "1 day, 13:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2130, "total_steps": 17941, "loss": 1.9419, "learning_rate": 9.73682274958308e-05, "epoch": 0.11872247923750069, "percentage": 11.87, "elapsed_time": "5:02:29", "remaining_time": "1 day, 13:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2131, "total_steps": 17941, "loss": 2.0495, "learning_rate": 9.736537599246305e-05, "epoch": 0.11877821749066385, "percentage": 11.88, "elapsed_time": "5:02:38", "remaining_time": "1 day, 13:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2132, "total_steps": 17941, "loss": 1.7997, "learning_rate": 9.736252298694172e-05, "epoch": 0.11883395574382699, "percentage": 11.88, "elapsed_time": "5:02:46", "remaining_time": "1 day, 13:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2133, "total_steps": 17941, "loss": 2.0086, "learning_rate": 9.735966847935732e-05, "epoch": 0.11888969399699013, "percentage": 11.89, "elapsed_time": "5:02:55", "remaining_time": "1 day, 13:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2134, "total_steps": 17941, "loss": 1.8669, "learning_rate": 9.735681246980035e-05, "epoch": 0.11894543225015328, "percentage": 11.89, "elapsed_time": "5:03:04", "remaining_time": "1 day, 13:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2135, "total_steps": 17941, "loss": 1.4678, "learning_rate": 9.73539549583614e-05, "epoch": 0.11900117050331642, "percentage": 11.9, "elapsed_time": "5:03:13", "remaining_time": "1 day, 13:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2136, "total_steps": 17941, "loss": 1.758, "learning_rate": 9.73510959451311e-05, "epoch": 0.11905690875647958, "percentage": 11.91, "elapsed_time": "5:03:21", "remaining_time": "1 day, 13:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2137, "total_steps": 17941, "loss": 1.6377, "learning_rate": 9.734823543020009e-05, "epoch": 0.11911264700964272, "percentage": 11.91, "elapsed_time": "5:03:30", "remaining_time": "1 day, 13:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2138, "total_steps": 17941, "loss": 1.8973, "learning_rate": 9.734537341365914e-05, "epoch": 0.11916838526280586, "percentage": 11.92, "elapsed_time": "5:03:38", "remaining_time": "1 day, 13:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2139, "total_steps": 17941, "loss": 1.8316, "learning_rate": 9.734250989559896e-05, "epoch": 0.119224123515969, "percentage": 11.92, "elapsed_time": "5:03:47", "remaining_time": "1 day, 13:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2140, "total_steps": 17941, "loss": 1.9231, "learning_rate": 9.733964487611042e-05, "epoch": 0.11927986176913216, "percentage": 11.93, "elapsed_time": "5:03:55", "remaining_time": "1 day, 13:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2141, "total_steps": 17941, "loss": 1.7316, "learning_rate": 9.733677835528434e-05, "epoch": 0.1193356000222953, "percentage": 11.93, "elapsed_time": "5:04:04", "remaining_time": "1 day, 13:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2142, "total_steps": 17941, "loss": 1.7328, "learning_rate": 9.733391033321164e-05, "epoch": 0.11939133827545845, "percentage": 11.94, "elapsed_time": "5:04:12", "remaining_time": "1 day, 13:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2143, "total_steps": 17941, "loss": 1.9832, "learning_rate": 9.733104080998329e-05, "epoch": 0.11944707652862159, "percentage": 11.94, "elapsed_time": "5:04:21", "remaining_time": "1 day, 13:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2144, "total_steps": 17941, "loss": 1.6102, "learning_rate": 9.732816978569028e-05, "epoch": 0.11950281478178473, "percentage": 11.95, "elapsed_time": "5:04:30", "remaining_time": "1 day, 13:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2145, "total_steps": 17941, "loss": 1.6543, "learning_rate": 9.732529726042365e-05, "epoch": 0.11955855303494789, "percentage": 11.96, "elapsed_time": "5:04:38", "remaining_time": "1 day, 13:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2146, "total_steps": 17941, "loss": 1.8017, "learning_rate": 9.732242323427455e-05, "epoch": 0.11961429128811103, "percentage": 11.96, "elapsed_time": "5:04:47", "remaining_time": "1 day, 13:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2147, "total_steps": 17941, "loss": 2.0041, "learning_rate": 9.731954770733407e-05, "epoch": 0.11967002954127418, "percentage": 11.97, "elapsed_time": "5:04:55", "remaining_time": "1 day, 13:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2148, "total_steps": 17941, "loss": 1.716, "learning_rate": 9.731667067969344e-05, "epoch": 0.11972576779443732, "percentage": 11.97, "elapsed_time": "5:05:04", "remaining_time": "1 day, 13:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2149, "total_steps": 17941, "loss": 1.8201, "learning_rate": 9.731379215144388e-05, "epoch": 0.11978150604760048, "percentage": 11.98, "elapsed_time": "5:05:12", "remaining_time": "1 day, 13:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2150, "total_steps": 17941, "loss": 1.51, "learning_rate": 9.73109121226767e-05, "epoch": 0.11983724430076362, "percentage": 11.98, "elapsed_time": "5:05:21", "remaining_time": "1 day, 13:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2151, "total_steps": 17941, "loss": 2.0817, "learning_rate": 9.730803059348323e-05, "epoch": 0.11989298255392676, "percentage": 11.99, "elapsed_time": "5:05:29", "remaining_time": "1 day, 13:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2152, "total_steps": 17941, "loss": 1.854, "learning_rate": 9.730514756395485e-05, "epoch": 0.1199487208070899, "percentage": 11.99, "elapsed_time": "5:05:37", "remaining_time": "1 day, 13:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2153, "total_steps": 17941, "loss": 1.4719, "learning_rate": 9.7302263034183e-05, "epoch": 0.12000445906025305, "percentage": 12.0, "elapsed_time": "5:05:46", "remaining_time": "1 day, 13:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2154, "total_steps": 17941, "loss": 1.8686, "learning_rate": 9.729937700425916e-05, "epoch": 0.1200601973134162, "percentage": 12.01, "elapsed_time": "5:05:55", "remaining_time": "1 day, 13:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2155, "total_steps": 17941, "loss": 1.8232, "learning_rate": 9.729648947427484e-05, "epoch": 0.12011593556657935, "percentage": 12.01, "elapsed_time": "5:06:03", "remaining_time": "1 day, 13:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2156, "total_steps": 17941, "loss": 1.7735, "learning_rate": 9.729360044432166e-05, "epoch": 0.12017167381974249, "percentage": 12.02, "elapsed_time": "5:06:11", "remaining_time": "1 day, 13:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2157, "total_steps": 17941, "loss": 1.9485, "learning_rate": 9.729070991449119e-05, "epoch": 0.12022741207290563, "percentage": 12.02, "elapsed_time": "5:06:20", "remaining_time": "1 day, 13:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2158, "total_steps": 17941, "loss": 1.6713, "learning_rate": 9.728781788487513e-05, "epoch": 0.12028315032606877, "percentage": 12.03, "elapsed_time": "5:06:29", "remaining_time": "1 day, 13:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2159, "total_steps": 17941, "loss": 1.6913, "learning_rate": 9.72849243555652e-05, "epoch": 0.12033888857923193, "percentage": 12.03, "elapsed_time": "5:06:37", "remaining_time": "1 day, 13:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2160, "total_steps": 17941, "loss": 1.6557, "learning_rate": 9.728202932665316e-05, "epoch": 0.12039462683239507, "percentage": 12.04, "elapsed_time": "5:06:46", "remaining_time": "1 day, 13:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2161, "total_steps": 17941, "loss": 1.6087, "learning_rate": 9.727913279823081e-05, "epoch": 0.12045036508555822, "percentage": 12.05, "elapsed_time": "5:06:54", "remaining_time": "1 day, 13:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2162, "total_steps": 17941, "loss": 1.8017, "learning_rate": 9.727623477039005e-05, "epoch": 0.12050610333872136, "percentage": 12.05, "elapsed_time": "5:07:03", "remaining_time": "1 day, 13:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2163, "total_steps": 17941, "loss": 1.7577, "learning_rate": 9.727333524322274e-05, "epoch": 0.12056184159188452, "percentage": 12.06, "elapsed_time": "5:07:12", "remaining_time": "1 day, 13:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2164, "total_steps": 17941, "loss": 1.7025, "learning_rate": 9.727043421682087e-05, "epoch": 0.12061757984504766, "percentage": 12.06, "elapsed_time": "5:07:20", "remaining_time": "1 day, 13:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2165, "total_steps": 17941, "loss": 1.8185, "learning_rate": 9.726753169127643e-05, "epoch": 0.1206733180982108, "percentage": 12.07, "elapsed_time": "5:07:29", "remaining_time": "1 day, 13:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2166, "total_steps": 17941, "loss": 1.5869, "learning_rate": 9.726462766668147e-05, "epoch": 0.12072905635137395, "percentage": 12.07, "elapsed_time": "5:07:37", "remaining_time": "1 day, 13:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2167, "total_steps": 17941, "loss": 1.6207, "learning_rate": 9.72617221431281e-05, "epoch": 0.12078479460453709, "percentage": 12.08, "elapsed_time": "5:07:46", "remaining_time": "1 day, 13:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2168, "total_steps": 17941, "loss": 1.5611, "learning_rate": 9.725881512070845e-05, "epoch": 0.12084053285770024, "percentage": 12.08, "elapsed_time": "5:07:54", "remaining_time": "1 day, 13:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2169, "total_steps": 17941, "loss": 1.7524, "learning_rate": 9.725590659951473e-05, "epoch": 0.12089627111086339, "percentage": 12.09, "elapsed_time": "5:08:03", "remaining_time": "1 day, 13:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2170, "total_steps": 17941, "loss": 1.9093, "learning_rate": 9.725299657963916e-05, "epoch": 0.12095200936402653, "percentage": 12.1, "elapsed_time": "5:08:11", "remaining_time": "1 day, 13:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2171, "total_steps": 17941, "loss": 1.6196, "learning_rate": 9.725008506117405e-05, "epoch": 0.12100774761718967, "percentage": 12.1, "elapsed_time": "5:08:19", "remaining_time": "1 day, 13:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2172, "total_steps": 17941, "loss": 1.5592, "learning_rate": 9.724717204421175e-05, "epoch": 0.12106348587035283, "percentage": 12.11, "elapsed_time": "5:08:28", "remaining_time": "1 day, 13:19:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2173, "total_steps": 17941, "loss": 1.7796, "learning_rate": 9.724425752884458e-05, "epoch": 0.12111922412351597, "percentage": 12.11, "elapsed_time": "5:08:36", "remaining_time": "1 day, 13:19:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2174, "total_steps": 17941, "loss": 1.5684, "learning_rate": 9.724134151516504e-05, "epoch": 0.12117496237667912, "percentage": 12.12, "elapsed_time": "5:08:45", "remaining_time": "1 day, 13:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2175, "total_steps": 17941, "loss": 1.9183, "learning_rate": 9.72384240032656e-05, "epoch": 0.12123070062984226, "percentage": 12.12, "elapsed_time": "5:08:53", "remaining_time": "1 day, 13:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2176, "total_steps": 17941, "loss": 1.5609, "learning_rate": 9.723550499323874e-05, "epoch": 0.1212864388830054, "percentage": 12.13, "elapsed_time": "5:09:02", "remaining_time": "1 day, 13:18:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2177, "total_steps": 17941, "loss": 1.8593, "learning_rate": 9.723258448517707e-05, "epoch": 0.12134217713616856, "percentage": 12.13, "elapsed_time": "5:09:10", "remaining_time": "1 day, 13:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2178, "total_steps": 17941, "loss": 1.8673, "learning_rate": 9.722966247917322e-05, "epoch": 0.1213979153893317, "percentage": 12.14, "elapsed_time": "5:09:19", "remaining_time": "1 day, 13:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2179, "total_steps": 17941, "loss": 1.6219, "learning_rate": 9.722673897531983e-05, "epoch": 0.12145365364249484, "percentage": 12.15, "elapsed_time": "5:09:27", "remaining_time": "1 day, 13:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2180, "total_steps": 17941, "loss": 1.9298, "learning_rate": 9.722381397370963e-05, "epoch": 0.12150939189565799, "percentage": 12.15, "elapsed_time": "5:09:36", "remaining_time": "1 day, 13:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2181, "total_steps": 17941, "loss": 1.4028, "learning_rate": 9.722088747443539e-05, "epoch": 0.12156513014882113, "percentage": 12.16, "elapsed_time": "5:09:44", "remaining_time": "1 day, 13:18:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2182, "total_steps": 17941, "loss": 1.6988, "learning_rate": 9.721795947758991e-05, "epoch": 0.12162086840198429, "percentage": 12.16, "elapsed_time": "5:09:53", "remaining_time": "1 day, 13:18:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2183, "total_steps": 17941, "loss": 1.6624, "learning_rate": 9.721502998326607e-05, "epoch": 0.12167660665514743, "percentage": 12.17, "elapsed_time": "5:10:02", "remaining_time": "1 day, 13:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2184, "total_steps": 17941, "loss": 1.5275, "learning_rate": 9.721209899155675e-05, "epoch": 0.12173234490831057, "percentage": 12.17, "elapsed_time": "5:10:10", "remaining_time": "1 day, 13:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2185, "total_steps": 17941, "loss": 1.7458, "learning_rate": 9.720916650255492e-05, "epoch": 0.12178808316147371, "percentage": 12.18, "elapsed_time": "5:10:19", "remaining_time": "1 day, 13:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2186, "total_steps": 17941, "loss": 1.7205, "learning_rate": 9.720623251635357e-05, "epoch": 0.12184382141463687, "percentage": 12.18, "elapsed_time": "5:10:27", "remaining_time": "1 day, 13:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2187, "total_steps": 17941, "loss": 1.6508, "learning_rate": 9.720329703304577e-05, "epoch": 0.12189955966780001, "percentage": 12.19, "elapsed_time": "5:10:36", "remaining_time": "1 day, 13:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2188, "total_steps": 17941, "loss": 1.7847, "learning_rate": 9.720036005272459e-05, "epoch": 0.12195529792096316, "percentage": 12.2, "elapsed_time": "5:10:44", "remaining_time": "1 day, 13:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2189, "total_steps": 17941, "loss": 1.578, "learning_rate": 9.719742157548319e-05, "epoch": 0.1220110361741263, "percentage": 12.2, "elapsed_time": "5:10:53", "remaining_time": "1 day, 13:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2190, "total_steps": 17941, "loss": 1.7526, "learning_rate": 9.719448160141476e-05, "epoch": 0.12206677442728944, "percentage": 12.21, "elapsed_time": "5:11:02", "remaining_time": "1 day, 13:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2191, "total_steps": 17941, "loss": 1.369, "learning_rate": 9.719154013061253e-05, "epoch": 0.1221225126804526, "percentage": 12.21, "elapsed_time": "5:11:11", "remaining_time": "1 day, 13:16:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2192, "total_steps": 17941, "loss": 1.9266, "learning_rate": 9.71885971631698e-05, "epoch": 0.12217825093361574, "percentage": 12.22, "elapsed_time": "5:11:19", "remaining_time": "1 day, 13:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2193, "total_steps": 17941, "loss": 1.8049, "learning_rate": 9.71856526991799e-05, "epoch": 0.12223398918677889, "percentage": 12.22, "elapsed_time": "5:11:28", "remaining_time": "1 day, 13:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2194, "total_steps": 17941, "loss": 1.6141, "learning_rate": 9.71827067387362e-05, "epoch": 0.12228972743994203, "percentage": 12.23, "elapsed_time": "5:11:36", "remaining_time": "1 day, 13:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2195, "total_steps": 17941, "loss": 1.4462, "learning_rate": 9.717975928193214e-05, "epoch": 0.12234546569310518, "percentage": 12.23, "elapsed_time": "5:11:45", "remaining_time": "1 day, 13:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2196, "total_steps": 17941, "loss": 1.7872, "learning_rate": 9.717681032886119e-05, "epoch": 0.12240120394626833, "percentage": 12.24, "elapsed_time": "5:11:53", "remaining_time": "1 day, 13:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2197, "total_steps": 17941, "loss": 1.7539, "learning_rate": 9.717385987961686e-05, "epoch": 0.12245694219943147, "percentage": 12.25, "elapsed_time": "5:12:02", "remaining_time": "1 day, 13:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2198, "total_steps": 17941, "loss": 1.8575, "learning_rate": 9.717090793429276e-05, "epoch": 0.12251268045259461, "percentage": 12.25, "elapsed_time": "5:12:10", "remaining_time": "1 day, 13:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2199, "total_steps": 17941, "loss": 1.9104, "learning_rate": 9.716795449298248e-05, "epoch": 0.12256841870575776, "percentage": 12.26, "elapsed_time": "5:12:19", "remaining_time": "1 day, 13:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2200, "total_steps": 17941, "loss": 1.6201, "learning_rate": 9.71649995557797e-05, "epoch": 0.12262415695892091, "percentage": 12.26, "elapsed_time": "5:12:27", "remaining_time": "1 day, 13:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2201, "total_steps": 17941, "loss": 1.928, "learning_rate": 9.716204312277812e-05, "epoch": 0.12267989521208406, "percentage": 12.27, "elapsed_time": "5:12:36", "remaining_time": "1 day, 13:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2202, "total_steps": 17941, "loss": 1.6348, "learning_rate": 9.715908519407149e-05, "epoch": 0.1227356334652472, "percentage": 12.27, "elapsed_time": "5:12:44", "remaining_time": "1 day, 13:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2203, "total_steps": 17941, "loss": 1.8211, "learning_rate": 9.715612576975366e-05, "epoch": 0.12279137171841034, "percentage": 12.28, "elapsed_time": "5:12:53", "remaining_time": "1 day, 13:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2204, "total_steps": 17941, "loss": 1.8334, "learning_rate": 9.715316484991845e-05, "epoch": 0.12284710997157348, "percentage": 12.28, "elapsed_time": "5:13:01", "remaining_time": "1 day, 13:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2205, "total_steps": 17941, "loss": 1.8001, "learning_rate": 9.715020243465976e-05, "epoch": 0.12290284822473664, "percentage": 12.29, "elapsed_time": "5:13:10", "remaining_time": "1 day, 13:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2206, "total_steps": 17941, "loss": 1.4173, "learning_rate": 9.714723852407157e-05, "epoch": 0.12295858647789978, "percentage": 12.3, "elapsed_time": "5:13:18", "remaining_time": "1 day, 13:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2207, "total_steps": 17941, "loss": 1.7186, "learning_rate": 9.714427311824786e-05, "epoch": 0.12301432473106293, "percentage": 12.3, "elapsed_time": "5:13:27", "remaining_time": "1 day, 13:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2208, "total_steps": 17941, "loss": 1.6884, "learning_rate": 9.714130621728266e-05, "epoch": 0.12307006298422607, "percentage": 12.31, "elapsed_time": "5:13:35", "remaining_time": "1 day, 13:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2209, "total_steps": 17941, "loss": 1.8707, "learning_rate": 9.713833782127008e-05, "epoch": 0.12312580123738923, "percentage": 12.31, "elapsed_time": "5:13:44", "remaining_time": "1 day, 13:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2210, "total_steps": 17941, "loss": 1.555, "learning_rate": 9.713536793030429e-05, "epoch": 0.12318153949055237, "percentage": 12.32, "elapsed_time": "5:13:53", "remaining_time": "1 day, 13:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2211, "total_steps": 17941, "loss": 1.8188, "learning_rate": 9.713239654447943e-05, "epoch": 0.12323727774371551, "percentage": 12.32, "elapsed_time": "5:14:01", "remaining_time": "1 day, 13:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2212, "total_steps": 17941, "loss": 1.8096, "learning_rate": 9.712942366388975e-05, "epoch": 0.12329301599687865, "percentage": 12.33, "elapsed_time": "5:14:10", "remaining_time": "1 day, 13:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2213, "total_steps": 17941, "loss": 1.8329, "learning_rate": 9.712644928862953e-05, "epoch": 0.1233487542500418, "percentage": 12.33, "elapsed_time": "5:14:18", "remaining_time": "1 day, 13:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2214, "total_steps": 17941, "loss": 1.8994, "learning_rate": 9.712347341879311e-05, "epoch": 0.12340449250320495, "percentage": 12.34, "elapsed_time": "5:14:27", "remaining_time": "1 day, 13:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2215, "total_steps": 17941, "loss": 1.8856, "learning_rate": 9.712049605447486e-05, "epoch": 0.1234602307563681, "percentage": 12.35, "elapsed_time": "5:14:35", "remaining_time": "1 day, 13:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2216, "total_steps": 17941, "loss": 1.7319, "learning_rate": 9.711751719576922e-05, "epoch": 0.12351596900953124, "percentage": 12.35, "elapsed_time": "5:14:44", "remaining_time": "1 day, 13:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2217, "total_steps": 17941, "loss": 1.9889, "learning_rate": 9.711453684277063e-05, "epoch": 0.12357170726269438, "percentage": 12.36, "elapsed_time": "5:14:53", "remaining_time": "1 day, 13:13:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2218, "total_steps": 17941, "loss": 1.5177, "learning_rate": 9.711155499557364e-05, "epoch": 0.12362744551585754, "percentage": 12.36, "elapsed_time": "5:15:01", "remaining_time": "1 day, 13:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2219, "total_steps": 17941, "loss": 1.5376, "learning_rate": 9.710857165427281e-05, "epoch": 0.12368318376902068, "percentage": 12.37, "elapsed_time": "5:15:10", "remaining_time": "1 day, 13:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2220, "total_steps": 17941, "loss": 1.7389, "learning_rate": 9.710558681896274e-05, "epoch": 0.12373892202218383, "percentage": 12.37, "elapsed_time": "5:15:19", "remaining_time": "1 day, 13:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2221, "total_steps": 17941, "loss": 1.7281, "learning_rate": 9.71026004897381e-05, "epoch": 0.12379466027534697, "percentage": 12.38, "elapsed_time": "5:15:27", "remaining_time": "1 day, 13:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2222, "total_steps": 17941, "loss": 1.6421, "learning_rate": 9.70996126666936e-05, "epoch": 0.12385039852851011, "percentage": 12.39, "elapsed_time": "5:15:36", "remaining_time": "1 day, 13:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2223, "total_steps": 17941, "loss": 2.0405, "learning_rate": 9.7096623349924e-05, "epoch": 0.12390613678167327, "percentage": 12.39, "elapsed_time": "5:15:44", "remaining_time": "1 day, 13:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2224, "total_steps": 17941, "loss": 1.7629, "learning_rate": 9.70936325395241e-05, "epoch": 0.12396187503483641, "percentage": 12.4, "elapsed_time": "5:15:53", "remaining_time": "1 day, 13:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2225, "total_steps": 17941, "loss": 1.7357, "learning_rate": 9.709064023558874e-05, "epoch": 0.12401761328799955, "percentage": 12.4, "elapsed_time": "5:16:01", "remaining_time": "1 day, 13:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2226, "total_steps": 17941, "loss": 1.905, "learning_rate": 9.708764643821284e-05, "epoch": 0.1240733515411627, "percentage": 12.41, "elapsed_time": "5:16:10", "remaining_time": "1 day, 13:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2227, "total_steps": 17941, "loss": 1.7439, "learning_rate": 9.708465114749132e-05, "epoch": 0.12412908979432584, "percentage": 12.41, "elapsed_time": "5:16:18", "remaining_time": "1 day, 13:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2228, "total_steps": 17941, "loss": 1.7851, "learning_rate": 9.708165436351921e-05, "epoch": 0.124184828047489, "percentage": 12.42, "elapsed_time": "5:16:27", "remaining_time": "1 day, 13:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2229, "total_steps": 17941, "loss": 1.494, "learning_rate": 9.707865608639152e-05, "epoch": 0.12424056630065214, "percentage": 12.42, "elapsed_time": "5:16:35", "remaining_time": "1 day, 13:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2230, "total_steps": 17941, "loss": 1.973, "learning_rate": 9.707565631620334e-05, "epoch": 0.12429630455381528, "percentage": 12.43, "elapsed_time": "5:16:44", "remaining_time": "1 day, 13:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2231, "total_steps": 17941, "loss": 1.9693, "learning_rate": 9.707265505304982e-05, "epoch": 0.12435204280697842, "percentage": 12.44, "elapsed_time": "5:16:52", "remaining_time": "1 day, 13:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2232, "total_steps": 17941, "loss": 1.8978, "learning_rate": 9.706965229702614e-05, "epoch": 0.12440778106014158, "percentage": 12.44, "elapsed_time": "5:17:01", "remaining_time": "1 day, 13:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2233, "total_steps": 17941, "loss": 2.0298, "learning_rate": 9.70666480482275e-05, "epoch": 0.12446351931330472, "percentage": 12.45, "elapsed_time": "5:17:10", "remaining_time": "1 day, 13:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2234, "total_steps": 17941, "loss": 1.5383, "learning_rate": 9.706364230674923e-05, "epoch": 0.12451925756646787, "percentage": 12.45, "elapsed_time": "5:17:18", "remaining_time": "1 day, 13:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2235, "total_steps": 17941, "loss": 1.6472, "learning_rate": 9.706063507268661e-05, "epoch": 0.12457499581963101, "percentage": 12.46, "elapsed_time": "5:17:27", "remaining_time": "1 day, 13:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2236, "total_steps": 17941, "loss": 1.7692, "learning_rate": 9.705762634613502e-05, "epoch": 0.12463073407279415, "percentage": 12.46, "elapsed_time": "5:17:35", "remaining_time": "1 day, 13:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2237, "total_steps": 17941, "loss": 1.5998, "learning_rate": 9.705461612718991e-05, "epoch": 0.12468647232595731, "percentage": 12.47, "elapsed_time": "5:17:44", "remaining_time": "1 day, 13:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2238, "total_steps": 17941, "loss": 1.6545, "learning_rate": 9.705160441594671e-05, "epoch": 0.12474221057912045, "percentage": 12.47, "elapsed_time": "5:17:53", "remaining_time": "1 day, 13:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2239, "total_steps": 17941, "loss": 1.8984, "learning_rate": 9.704859121250095e-05, "epoch": 0.1247979488322836, "percentage": 12.48, "elapsed_time": "5:18:01", "remaining_time": "1 day, 13:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2240, "total_steps": 17941, "loss": 1.7794, "learning_rate": 9.704557651694818e-05, "epoch": 0.12485368708544674, "percentage": 12.49, "elapsed_time": "5:18:09", "remaining_time": "1 day, 13:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2241, "total_steps": 17941, "loss": 1.4191, "learning_rate": 9.704256032938403e-05, "epoch": 0.1249094253386099, "percentage": 12.49, "elapsed_time": "5:18:18", "remaining_time": "1 day, 13:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2242, "total_steps": 17941, "loss": 1.7634, "learning_rate": 9.703954264990414e-05, "epoch": 0.12496516359177304, "percentage": 12.5, "elapsed_time": "5:18:27", "remaining_time": "1 day, 13:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2243, "total_steps": 17941, "loss": 1.9257, "learning_rate": 9.703652347860422e-05, "epoch": 0.12502090184493617, "percentage": 12.5, "elapsed_time": "5:18:35", "remaining_time": "1 day, 13:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2244, "total_steps": 17941, "loss": 1.8102, "learning_rate": 9.703350281558002e-05, "epoch": 0.12507664009809932, "percentage": 12.51, "elapsed_time": "5:18:43", "remaining_time": "1 day, 13:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2245, "total_steps": 17941, "loss": 2.1658, "learning_rate": 9.703048066092733e-05, "epoch": 0.12513237835126248, "percentage": 12.51, "elapsed_time": "5:18:52", "remaining_time": "1 day, 13:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2246, "total_steps": 17941, "loss": 1.6586, "learning_rate": 9.7027457014742e-05, "epoch": 0.1251881166044256, "percentage": 12.52, "elapsed_time": "5:19:00", "remaining_time": "1 day, 13:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2247, "total_steps": 17941, "loss": 1.7678, "learning_rate": 9.702443187711992e-05, "epoch": 0.12524385485758877, "percentage": 12.52, "elapsed_time": "5:19:09", "remaining_time": "1 day, 13:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2248, "total_steps": 17941, "loss": 1.848, "learning_rate": 9.702140524815704e-05, "epoch": 0.12529959311075192, "percentage": 12.53, "elapsed_time": "5:19:17", "remaining_time": "1 day, 13:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2249, "total_steps": 17941, "loss": 1.8369, "learning_rate": 9.701837712794932e-05, "epoch": 0.12535533136391505, "percentage": 12.54, "elapsed_time": "5:19:26", "remaining_time": "1 day, 13:08:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2250, "total_steps": 17941, "loss": 1.8621, "learning_rate": 9.701534751659283e-05, "epoch": 0.1254110696170782, "percentage": 12.54, "elapsed_time": "5:19:34", "remaining_time": "1 day, 13:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2251, "total_steps": 17941, "loss": 1.7069, "learning_rate": 9.701231641418363e-05, "epoch": 0.12546680787024134, "percentage": 12.55, "elapsed_time": "5:19:43", "remaining_time": "1 day, 13:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2252, "total_steps": 17941, "loss": 1.7311, "learning_rate": 9.700928382081786e-05, "epoch": 0.1255225461234045, "percentage": 12.55, "elapsed_time": "5:19:51", "remaining_time": "1 day, 13:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2253, "total_steps": 17941, "loss": 1.6022, "learning_rate": 9.700624973659169e-05, "epoch": 0.12557828437656765, "percentage": 12.56, "elapsed_time": "5:20:00", "remaining_time": "1 day, 13:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2254, "total_steps": 17941, "loss": 1.6004, "learning_rate": 9.700321416160134e-05, "epoch": 0.12563402262973078, "percentage": 12.56, "elapsed_time": "5:20:08", "remaining_time": "1 day, 13:08:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2255, "total_steps": 17941, "loss": 1.627, "learning_rate": 9.70001770959431e-05, "epoch": 0.12568976088289394, "percentage": 12.57, "elapsed_time": "5:20:17", "remaining_time": "1 day, 13:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2256, "total_steps": 17941, "loss": 1.9893, "learning_rate": 9.699713853971324e-05, "epoch": 0.12574549913605707, "percentage": 12.57, "elapsed_time": "5:20:25", "remaining_time": "1 day, 13:07:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2257, "total_steps": 17941, "loss": 1.6269, "learning_rate": 9.699409849300818e-05, "epoch": 0.12580123738922022, "percentage": 12.58, "elapsed_time": "5:20:34", "remaining_time": "1 day, 13:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2258, "total_steps": 17941, "loss": 1.6803, "learning_rate": 9.69910569559243e-05, "epoch": 0.12585697564238338, "percentage": 12.59, "elapsed_time": "5:20:42", "remaining_time": "1 day, 13:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2259, "total_steps": 17941, "loss": 1.7217, "learning_rate": 9.698801392855808e-05, "epoch": 0.1259127138955465, "percentage": 12.59, "elapsed_time": "5:20:51", "remaining_time": "1 day, 13:07:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2260, "total_steps": 17941, "loss": 1.6904, "learning_rate": 9.698496941100601e-05, "epoch": 0.12596845214870966, "percentage": 12.6, "elapsed_time": "5:20:59", "remaining_time": "1 day, 13:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2261, "total_steps": 17941, "loss": 1.5411, "learning_rate": 9.698192340336468e-05, "epoch": 0.1260241904018728, "percentage": 12.6, "elapsed_time": "5:21:07", "remaining_time": "1 day, 13:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2262, "total_steps": 17941, "loss": 1.6144, "learning_rate": 9.697887590573063e-05, "epoch": 0.12607992865503595, "percentage": 12.61, "elapsed_time": "5:21:16", "remaining_time": "1 day, 13:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2263, "total_steps": 17941, "loss": 1.605, "learning_rate": 9.697582691820054e-05, "epoch": 0.1261356669081991, "percentage": 12.61, "elapsed_time": "5:21:24", "remaining_time": "1 day, 13:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2264, "total_steps": 17941, "loss": 1.0444, "learning_rate": 9.697277644087113e-05, "epoch": 0.12619140516136224, "percentage": 12.62, "elapsed_time": "5:21:34", "remaining_time": "1 day, 13:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2265, "total_steps": 17941, "loss": 1.7319, "learning_rate": 9.69697244738391e-05, "epoch": 0.1262471434145254, "percentage": 12.62, "elapsed_time": "5:21:42", "remaining_time": "1 day, 13:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2266, "total_steps": 17941, "loss": 1.9173, "learning_rate": 9.696667101720127e-05, "epoch": 0.12630288166768852, "percentage": 12.63, "elapsed_time": "5:21:51", "remaining_time": "1 day, 13:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2267, "total_steps": 17941, "loss": 1.6603, "learning_rate": 9.696361607105448e-05, "epoch": 0.12635861992085168, "percentage": 12.64, "elapsed_time": "5:21:59", "remaining_time": "1 day, 13:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2268, "total_steps": 17941, "loss": 1.7048, "learning_rate": 9.69605596354956e-05, "epoch": 0.12641435817401483, "percentage": 12.64, "elapsed_time": "5:22:08", "remaining_time": "1 day, 13:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2269, "total_steps": 17941, "loss": 1.669, "learning_rate": 9.695750171062156e-05, "epoch": 0.12647009642717796, "percentage": 12.65, "elapsed_time": "5:22:16", "remaining_time": "1 day, 13:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2270, "total_steps": 17941, "loss": 1.6744, "learning_rate": 9.695444229652935e-05, "epoch": 0.12652583468034112, "percentage": 12.65, "elapsed_time": "5:22:25", "remaining_time": "1 day, 13:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2271, "total_steps": 17941, "loss": 1.6182, "learning_rate": 9.6951381393316e-05, "epoch": 0.12658157293350428, "percentage": 12.66, "elapsed_time": "5:22:33", "remaining_time": "1 day, 13:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2272, "total_steps": 17941, "loss": 1.7818, "learning_rate": 9.694831900107857e-05, "epoch": 0.1266373111866674, "percentage": 12.66, "elapsed_time": "5:22:42", "remaining_time": "1 day, 13:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2273, "total_steps": 17941, "loss": 1.9646, "learning_rate": 9.69452551199142e-05, "epoch": 0.12669304943983056, "percentage": 12.67, "elapsed_time": "5:22:51", "remaining_time": "1 day, 13:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2274, "total_steps": 17941, "loss": 1.6862, "learning_rate": 9.694218974992005e-05, "epoch": 0.1267487876929937, "percentage": 12.67, "elapsed_time": "5:22:59", "remaining_time": "1 day, 13:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2275, "total_steps": 17941, "loss": 1.7259, "learning_rate": 9.693912289119332e-05, "epoch": 0.12680452594615685, "percentage": 12.68, "elapsed_time": "5:23:08", "remaining_time": "1 day, 13:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2276, "total_steps": 17941, "loss": 1.8426, "learning_rate": 9.693605454383128e-05, "epoch": 0.12686026419932, "percentage": 12.69, "elapsed_time": "5:23:16", "remaining_time": "1 day, 13:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2277, "total_steps": 17941, "loss": 1.9999, "learning_rate": 9.693298470793126e-05, "epoch": 0.12691600245248313, "percentage": 12.69, "elapsed_time": "5:23:25", "remaining_time": "1 day, 13:04:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2278, "total_steps": 17941, "loss": 1.736, "learning_rate": 9.69299133835906e-05, "epoch": 0.1269717407056463, "percentage": 12.7, "elapsed_time": "5:23:33", "remaining_time": "1 day, 13:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2279, "total_steps": 17941, "loss": 1.4284, "learning_rate": 9.69268405709067e-05, "epoch": 0.12702747895880942, "percentage": 12.7, "elapsed_time": "5:23:42", "remaining_time": "1 day, 13:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2280, "total_steps": 17941, "loss": 1.8972, "learning_rate": 9.692376626997703e-05, "epoch": 0.12708321721197258, "percentage": 12.71, "elapsed_time": "5:23:51", "remaining_time": "1 day, 13:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2281, "total_steps": 17941, "loss": 1.6173, "learning_rate": 9.692069048089907e-05, "epoch": 0.12713895546513573, "percentage": 12.71, "elapsed_time": "5:23:59", "remaining_time": "1 day, 13:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2282, "total_steps": 17941, "loss": 1.5599, "learning_rate": 9.691761320377037e-05, "epoch": 0.12719469371829886, "percentage": 12.72, "elapsed_time": "5:24:08", "remaining_time": "1 day, 13:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2283, "total_steps": 17941, "loss": 1.7705, "learning_rate": 9.691453443868854e-05, "epoch": 0.12725043197146202, "percentage": 12.73, "elapsed_time": "5:24:16", "remaining_time": "1 day, 13:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2284, "total_steps": 17941, "loss": 1.9065, "learning_rate": 9.691145418575122e-05, "epoch": 0.12730617022462515, "percentage": 12.73, "elapsed_time": "5:24:25", "remaining_time": "1 day, 13:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2285, "total_steps": 17941, "loss": 1.7623, "learning_rate": 9.690837244505607e-05, "epoch": 0.1273619084777883, "percentage": 12.74, "elapsed_time": "5:24:33", "remaining_time": "1 day, 13:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2286, "total_steps": 17941, "loss": 1.7758, "learning_rate": 9.690528921670084e-05, "epoch": 0.12741764673095146, "percentage": 12.74, "elapsed_time": "5:24:42", "remaining_time": "1 day, 13:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2287, "total_steps": 17941, "loss": 1.6409, "learning_rate": 9.69022045007833e-05, "epoch": 0.1274733849841146, "percentage": 12.75, "elapsed_time": "5:24:50", "remaining_time": "1 day, 13:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2288, "total_steps": 17941, "loss": 1.6144, "learning_rate": 9.689911829740133e-05, "epoch": 0.12752912323727775, "percentage": 12.75, "elapsed_time": "5:24:59", "remaining_time": "1 day, 13:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2289, "total_steps": 17941, "loss": 1.8711, "learning_rate": 9.689603060665273e-05, "epoch": 0.12758486149044088, "percentage": 12.76, "elapsed_time": "5:25:07", "remaining_time": "1 day, 13:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2290, "total_steps": 17941, "loss": 1.8228, "learning_rate": 9.689294142863548e-05, "epoch": 0.12764059974360403, "percentage": 12.76, "elapsed_time": "5:25:16", "remaining_time": "1 day, 13:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2291, "total_steps": 17941, "loss": 1.696, "learning_rate": 9.688985076344754e-05, "epoch": 0.1276963379967672, "percentage": 12.77, "elapsed_time": "5:25:24", "remaining_time": "1 day, 13:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2292, "total_steps": 17941, "loss": 1.6989, "learning_rate": 9.68867586111869e-05, "epoch": 0.12775207624993032, "percentage": 12.78, "elapsed_time": "5:25:33", "remaining_time": "1 day, 13:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2293, "total_steps": 17941, "loss": 1.6764, "learning_rate": 9.688366497195166e-05, "epoch": 0.12780781450309348, "percentage": 12.78, "elapsed_time": "5:25:41", "remaining_time": "1 day, 13:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2294, "total_steps": 17941, "loss": 1.4595, "learning_rate": 9.68805698458399e-05, "epoch": 0.12786355275625663, "percentage": 12.79, "elapsed_time": "5:25:49", "remaining_time": "1 day, 13:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2295, "total_steps": 17941, "loss": 1.4642, "learning_rate": 9.687747323294982e-05, "epoch": 0.12791929100941976, "percentage": 12.79, "elapsed_time": "5:25:58", "remaining_time": "1 day, 13:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2296, "total_steps": 17941, "loss": 1.7116, "learning_rate": 9.687437513337961e-05, "epoch": 0.12797502926258292, "percentage": 12.8, "elapsed_time": "5:26:07", "remaining_time": "1 day, 13:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2297, "total_steps": 17941, "loss": 1.637, "learning_rate": 9.687127554722749e-05, "epoch": 0.12803076751574605, "percentage": 12.8, "elapsed_time": "5:26:15", "remaining_time": "1 day, 13:02:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2298, "total_steps": 17941, "loss": 1.7629, "learning_rate": 9.68681744745918e-05, "epoch": 0.1280865057689092, "percentage": 12.81, "elapsed_time": "5:26:24", "remaining_time": "1 day, 13:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2299, "total_steps": 17941, "loss": 1.827, "learning_rate": 9.686507191557089e-05, "epoch": 0.12814224402207236, "percentage": 12.81, "elapsed_time": "5:26:33", "remaining_time": "1 day, 13:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2300, "total_steps": 17941, "loss": 1.9385, "learning_rate": 9.686196787026311e-05, "epoch": 0.1281979822752355, "percentage": 12.82, "elapsed_time": "5:26:41", "remaining_time": "1 day, 13:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2301, "total_steps": 17941, "loss": 1.8378, "learning_rate": 9.685886233876695e-05, "epoch": 0.12825372052839865, "percentage": 12.83, "elapsed_time": "5:26:50", "remaining_time": "1 day, 13:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2302, "total_steps": 17941, "loss": 1.6812, "learning_rate": 9.685575532118089e-05, "epoch": 0.12830945878156177, "percentage": 12.83, "elapsed_time": "5:26:58", "remaining_time": "1 day, 13:01:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2303, "total_steps": 17941, "loss": 1.9602, "learning_rate": 9.685264681760345e-05, "epoch": 0.12836519703472493, "percentage": 12.84, "elapsed_time": "5:27:07", "remaining_time": "1 day, 13:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2304, "total_steps": 17941, "loss": 1.8125, "learning_rate": 9.684953682813322e-05, "epoch": 0.1284209352878881, "percentage": 12.84, "elapsed_time": "5:27:15", "remaining_time": "1 day, 13:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2305, "total_steps": 17941, "loss": 1.5566, "learning_rate": 9.684642535286885e-05, "epoch": 0.12847667354105122, "percentage": 12.85, "elapsed_time": "5:27:24", "remaining_time": "1 day, 13:01:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2306, "total_steps": 17941, "loss": 1.5688, "learning_rate": 9.684331239190899e-05, "epoch": 0.12853241179421437, "percentage": 12.85, "elapsed_time": "5:27:33", "remaining_time": "1 day, 13:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2307, "total_steps": 17941, "loss": 1.7452, "learning_rate": 9.684019794535237e-05, "epoch": 0.1285881500473775, "percentage": 12.86, "elapsed_time": "5:27:41", "remaining_time": "1 day, 13:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2308, "total_steps": 17941, "loss": 1.6624, "learning_rate": 9.683708201329777e-05, "epoch": 0.12864388830054066, "percentage": 12.86, "elapsed_time": "5:27:50", "remaining_time": "1 day, 13:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2309, "total_steps": 17941, "loss": 1.7721, "learning_rate": 9.683396459584404e-05, "epoch": 0.12869962655370382, "percentage": 12.87, "elapsed_time": "5:27:58", "remaining_time": "1 day, 13:00:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2310, "total_steps": 17941, "loss": 2.1623, "learning_rate": 9.683084569308997e-05, "epoch": 0.12875536480686695, "percentage": 12.88, "elapsed_time": "5:28:07", "remaining_time": "1 day, 13:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2311, "total_steps": 17941, "loss": 1.7165, "learning_rate": 9.682772530513453e-05, "epoch": 0.1288111030600301, "percentage": 12.88, "elapsed_time": "5:28:15", "remaining_time": "1 day, 13:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2312, "total_steps": 17941, "loss": 1.6391, "learning_rate": 9.682460343207669e-05, "epoch": 0.12886684131319323, "percentage": 12.89, "elapsed_time": "5:28:24", "remaining_time": "1 day, 13:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2313, "total_steps": 17941, "loss": 1.891, "learning_rate": 9.682148007401541e-05, "epoch": 0.1289225795663564, "percentage": 12.89, "elapsed_time": "5:28:32", "remaining_time": "1 day, 12:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2314, "total_steps": 17941, "loss": 1.9901, "learning_rate": 9.681835523104978e-05, "epoch": 0.12897831781951954, "percentage": 12.9, "elapsed_time": "5:28:41", "remaining_time": "1 day, 12:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2315, "total_steps": 17941, "loss": 1.7748, "learning_rate": 9.681522890327889e-05, "epoch": 0.12903405607268267, "percentage": 12.9, "elapsed_time": "5:28:49", "remaining_time": "1 day, 12:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2316, "total_steps": 17941, "loss": 1.6, "learning_rate": 9.681210109080189e-05, "epoch": 0.12908979432584583, "percentage": 12.91, "elapsed_time": "5:28:58", "remaining_time": "1 day, 12:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2317, "total_steps": 17941, "loss": 1.6863, "learning_rate": 9.680897179371798e-05, "epoch": 0.129145532579009, "percentage": 12.91, "elapsed_time": "5:29:06", "remaining_time": "1 day, 12:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2318, "total_steps": 17941, "loss": 1.7456, "learning_rate": 9.68058410121264e-05, "epoch": 0.12920127083217212, "percentage": 12.92, "elapsed_time": "5:29:15", "remaining_time": "1 day, 12:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2319, "total_steps": 17941, "loss": 1.572, "learning_rate": 9.680270874612643e-05, "epoch": 0.12925700908533527, "percentage": 12.93, "elapsed_time": "5:29:23", "remaining_time": "1 day, 12:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2320, "total_steps": 17941, "loss": 1.7946, "learning_rate": 9.679957499581742e-05, "epoch": 0.1293127473384984, "percentage": 12.93, "elapsed_time": "5:29:32", "remaining_time": "1 day, 12:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2321, "total_steps": 17941, "loss": 1.7792, "learning_rate": 9.679643976129876e-05, "epoch": 0.12936848559166156, "percentage": 12.94, "elapsed_time": "5:29:40", "remaining_time": "1 day, 12:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2322, "total_steps": 17941, "loss": 2.0051, "learning_rate": 9.679330304266988e-05, "epoch": 0.12942422384482472, "percentage": 12.94, "elapsed_time": "5:29:49", "remaining_time": "1 day, 12:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2323, "total_steps": 17941, "loss": 1.8419, "learning_rate": 9.679016484003023e-05, "epoch": 0.12947996209798784, "percentage": 12.95, "elapsed_time": "5:29:57", "remaining_time": "1 day, 12:58:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2324, "total_steps": 17941, "loss": 1.7893, "learning_rate": 9.678702515347938e-05, "epoch": 0.129535700351151, "percentage": 12.95, "elapsed_time": "5:30:06", "remaining_time": "1 day, 12:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2325, "total_steps": 17941, "loss": 1.8868, "learning_rate": 9.678388398311686e-05, "epoch": 0.12959143860431413, "percentage": 12.96, "elapsed_time": "5:30:14", "remaining_time": "1 day, 12:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2326, "total_steps": 17941, "loss": 1.6472, "learning_rate": 9.678074132904231e-05, "epoch": 0.1296471768574773, "percentage": 12.96, "elapsed_time": "5:30:22", "remaining_time": "1 day, 12:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2327, "total_steps": 17941, "loss": 1.8353, "learning_rate": 9.677759719135542e-05, "epoch": 0.12970291511064044, "percentage": 12.97, "elapsed_time": "5:30:31", "remaining_time": "1 day, 12:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2328, "total_steps": 17941, "loss": 1.8419, "learning_rate": 9.677445157015585e-05, "epoch": 0.12975865336380357, "percentage": 12.98, "elapsed_time": "5:30:39", "remaining_time": "1 day, 12:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2329, "total_steps": 17941, "loss": 1.846, "learning_rate": 9.67713044655434e-05, "epoch": 0.12981439161696673, "percentage": 12.98, "elapsed_time": "5:30:49", "remaining_time": "1 day, 12:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2330, "total_steps": 17941, "loss": 1.734, "learning_rate": 9.676815587761787e-05, "epoch": 0.12987012987012986, "percentage": 12.99, "elapsed_time": "5:30:57", "remaining_time": "1 day, 12:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2331, "total_steps": 17941, "loss": 1.8124, "learning_rate": 9.676500580647912e-05, "epoch": 0.12992586812329301, "percentage": 12.99, "elapsed_time": "5:31:06", "remaining_time": "1 day, 12:57:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2332, "total_steps": 17941, "loss": 2.0132, "learning_rate": 9.676185425222704e-05, "epoch": 0.12998160637645617, "percentage": 13.0, "elapsed_time": "5:31:14", "remaining_time": "1 day, 12:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2333, "total_steps": 17941, "loss": 1.7686, "learning_rate": 9.675870121496158e-05, "epoch": 0.1300373446296193, "percentage": 13.0, "elapsed_time": "5:31:22", "remaining_time": "1 day, 12:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2334, "total_steps": 17941, "loss": 1.8113, "learning_rate": 9.675554669478272e-05, "epoch": 0.13009308288278246, "percentage": 13.01, "elapsed_time": "5:31:31", "remaining_time": "1 day, 12:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2335, "total_steps": 17941, "loss": 1.7593, "learning_rate": 9.675239069179056e-05, "epoch": 0.13014882113594559, "percentage": 13.01, "elapsed_time": "5:31:40", "remaining_time": "1 day, 12:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2336, "total_steps": 17941, "loss": 1.5302, "learning_rate": 9.674923320608513e-05, "epoch": 0.13020455938910874, "percentage": 13.02, "elapsed_time": "5:31:48", "remaining_time": "1 day, 12:56:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2337, "total_steps": 17941, "loss": 1.5793, "learning_rate": 9.674607423776661e-05, "epoch": 0.1302602976422719, "percentage": 13.03, "elapsed_time": "5:31:56", "remaining_time": "1 day, 12:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2338, "total_steps": 17941, "loss": 1.6392, "learning_rate": 9.674291378693515e-05, "epoch": 0.13031603589543503, "percentage": 13.03, "elapsed_time": "5:32:05", "remaining_time": "1 day, 12:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2339, "total_steps": 17941, "loss": 1.9403, "learning_rate": 9.673975185369098e-05, "epoch": 0.13037177414859819, "percentage": 13.04, "elapsed_time": "5:32:14", "remaining_time": "1 day, 12:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2340, "total_steps": 17941, "loss": 1.7093, "learning_rate": 9.673658843813442e-05, "epoch": 0.13042751240176134, "percentage": 13.04, "elapsed_time": "5:32:22", "remaining_time": "1 day, 12:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2341, "total_steps": 17941, "loss": 1.7645, "learning_rate": 9.673342354036574e-05, "epoch": 0.13048325065492447, "percentage": 13.05, "elapsed_time": "5:32:31", "remaining_time": "1 day, 12:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2342, "total_steps": 17941, "loss": 1.81, "learning_rate": 9.673025716048536e-05, "epoch": 0.13053898890808763, "percentage": 13.05, "elapsed_time": "5:32:39", "remaining_time": "1 day, 12:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2343, "total_steps": 17941, "loss": 2.0053, "learning_rate": 9.672708929859368e-05, "epoch": 0.13059472716125076, "percentage": 13.06, "elapsed_time": "5:32:48", "remaining_time": "1 day, 12:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2344, "total_steps": 17941, "loss": 1.7236, "learning_rate": 9.672391995479115e-05, "epoch": 0.1306504654144139, "percentage": 13.07, "elapsed_time": "5:32:56", "remaining_time": "1 day, 12:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2345, "total_steps": 17941, "loss": 1.7492, "learning_rate": 9.672074912917831e-05, "epoch": 0.13070620366757707, "percentage": 13.07, "elapsed_time": "5:33:05", "remaining_time": "1 day, 12:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2346, "total_steps": 17941, "loss": 1.9068, "learning_rate": 9.67175768218557e-05, "epoch": 0.1307619419207402, "percentage": 13.08, "elapsed_time": "5:33:13", "remaining_time": "1 day, 12:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2347, "total_steps": 17941, "loss": 1.7364, "learning_rate": 9.671440303292395e-05, "epoch": 0.13081768017390336, "percentage": 13.08, "elapsed_time": "5:33:22", "remaining_time": "1 day, 12:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2348, "total_steps": 17941, "loss": 1.5916, "learning_rate": 9.67112277624837e-05, "epoch": 0.13087341842706648, "percentage": 13.09, "elapsed_time": "5:33:30", "remaining_time": "1 day, 12:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2349, "total_steps": 17941, "loss": 1.7222, "learning_rate": 9.670805101063563e-05, "epoch": 0.13092915668022964, "percentage": 13.09, "elapsed_time": "5:33:39", "remaining_time": "1 day, 12:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2350, "total_steps": 17941, "loss": 1.6418, "learning_rate": 9.670487277748052e-05, "epoch": 0.1309848949333928, "percentage": 13.1, "elapsed_time": "5:33:47", "remaining_time": "1 day, 12:54:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2351, "total_steps": 17941, "loss": 1.7323, "learning_rate": 9.670169306311916e-05, "epoch": 0.13104063318655593, "percentage": 13.1, "elapsed_time": "5:33:56", "remaining_time": "1 day, 12:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2352, "total_steps": 17941, "loss": 1.4822, "learning_rate": 9.669851186765238e-05, "epoch": 0.13109637143971908, "percentage": 13.11, "elapsed_time": "5:34:04", "remaining_time": "1 day, 12:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2353, "total_steps": 17941, "loss": 1.767, "learning_rate": 9.669532919118108e-05, "epoch": 0.1311521096928822, "percentage": 13.12, "elapsed_time": "5:34:13", "remaining_time": "1 day, 12:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2354, "total_steps": 17941, "loss": 1.7228, "learning_rate": 9.669214503380617e-05, "epoch": 0.13120784794604537, "percentage": 13.12, "elapsed_time": "5:34:21", "remaining_time": "1 day, 12:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2355, "total_steps": 17941, "loss": 1.4792, "learning_rate": 9.668895939562868e-05, "epoch": 0.13126358619920853, "percentage": 13.13, "elapsed_time": "5:34:30", "remaining_time": "1 day, 12:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2356, "total_steps": 17941, "loss": 1.7285, "learning_rate": 9.66857722767496e-05, "epoch": 0.13131932445237166, "percentage": 13.13, "elapsed_time": "5:34:39", "remaining_time": "1 day, 12:53:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2357, "total_steps": 17941, "loss": 1.5942, "learning_rate": 9.668258367727002e-05, "epoch": 0.1313750627055348, "percentage": 13.14, "elapsed_time": "5:34:47", "remaining_time": "1 day, 12:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2358, "total_steps": 17941, "loss": 1.8991, "learning_rate": 9.667939359729109e-05, "epoch": 0.13143080095869794, "percentage": 13.14, "elapsed_time": "5:34:56", "remaining_time": "1 day, 12:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2359, "total_steps": 17941, "loss": 1.8247, "learning_rate": 9.667620203691393e-05, "epoch": 0.1314865392118611, "percentage": 13.15, "elapsed_time": "5:35:05", "remaining_time": "1 day, 12:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2360, "total_steps": 17941, "loss": 2.0837, "learning_rate": 9.667300899623976e-05, "epoch": 0.13154227746502425, "percentage": 13.15, "elapsed_time": "5:35:13", "remaining_time": "1 day, 12:53:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2361, "total_steps": 17941, "loss": 1.681, "learning_rate": 9.66698144753699e-05, "epoch": 0.13159801571818738, "percentage": 13.16, "elapsed_time": "5:35:21", "remaining_time": "1 day, 12:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2362, "total_steps": 17941, "loss": 1.7168, "learning_rate": 9.666661847440563e-05, "epoch": 0.13165375397135054, "percentage": 13.17, "elapsed_time": "5:35:30", "remaining_time": "1 day, 12:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2363, "total_steps": 17941, "loss": 1.8355, "learning_rate": 9.666342099344829e-05, "epoch": 0.1317094922245137, "percentage": 13.17, "elapsed_time": "5:35:39", "remaining_time": "1 day, 12:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2364, "total_steps": 17941, "loss": 1.6872, "learning_rate": 9.666022203259931e-05, "epoch": 0.13176523047767683, "percentage": 13.18, "elapsed_time": "5:35:47", "remaining_time": "1 day, 12:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2365, "total_steps": 17941, "loss": 1.6867, "learning_rate": 9.665702159196013e-05, "epoch": 0.13182096873083998, "percentage": 13.18, "elapsed_time": "5:35:56", "remaining_time": "1 day, 12:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2366, "total_steps": 17941, "loss": 1.5836, "learning_rate": 9.665381967163227e-05, "epoch": 0.1318767069840031, "percentage": 13.19, "elapsed_time": "5:36:04", "remaining_time": "1 day, 12:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2367, "total_steps": 17941, "loss": 1.6933, "learning_rate": 9.665061627171726e-05, "epoch": 0.13193244523716627, "percentage": 13.19, "elapsed_time": "5:36:13", "remaining_time": "1 day, 12:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2368, "total_steps": 17941, "loss": 2.0988, "learning_rate": 9.664741139231668e-05, "epoch": 0.13198818349032942, "percentage": 13.2, "elapsed_time": "5:36:22", "remaining_time": "1 day, 12:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2369, "total_steps": 17941, "loss": 1.7087, "learning_rate": 9.664420503353218e-05, "epoch": 0.13204392174349255, "percentage": 13.2, "elapsed_time": "5:36:31", "remaining_time": "1 day, 12:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2370, "total_steps": 17941, "loss": 1.8029, "learning_rate": 9.664099719546547e-05, "epoch": 0.1320996599966557, "percentage": 13.21, "elapsed_time": "5:36:39", "remaining_time": "1 day, 12:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2371, "total_steps": 17941, "loss": 1.7483, "learning_rate": 9.663778787821825e-05, "epoch": 0.13215539824981884, "percentage": 13.22, "elapsed_time": "5:36:48", "remaining_time": "1 day, 12:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2372, "total_steps": 17941, "loss": 1.7137, "learning_rate": 9.663457708189232e-05, "epoch": 0.132211136502982, "percentage": 13.22, "elapsed_time": "5:36:56", "remaining_time": "1 day, 12:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2373, "total_steps": 17941, "loss": 1.8748, "learning_rate": 9.66313648065895e-05, "epoch": 0.13226687475614515, "percentage": 13.23, "elapsed_time": "5:37:05", "remaining_time": "1 day, 12:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2374, "total_steps": 17941, "loss": 1.5948, "learning_rate": 9.662815105241168e-05, "epoch": 0.13232261300930828, "percentage": 13.23, "elapsed_time": "5:37:13", "remaining_time": "1 day, 12:51:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2375, "total_steps": 17941, "loss": 1.7724, "learning_rate": 9.662493581946074e-05, "epoch": 0.13237835126247144, "percentage": 13.24, "elapsed_time": "5:37:22", "remaining_time": "1 day, 12:51:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2376, "total_steps": 17941, "loss": 1.8068, "learning_rate": 9.66217191078387e-05, "epoch": 0.13243408951563457, "percentage": 13.24, "elapsed_time": "5:37:30", "remaining_time": "1 day, 12:51:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2377, "total_steps": 17941, "loss": 1.9129, "learning_rate": 9.661850091764756e-05, "epoch": 0.13248982776879772, "percentage": 13.25, "elapsed_time": "5:37:39", "remaining_time": "1 day, 12:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2378, "total_steps": 17941, "loss": 1.6931, "learning_rate": 9.661528124898937e-05, "epoch": 0.13254556602196088, "percentage": 13.25, "elapsed_time": "5:37:47", "remaining_time": "1 day, 12:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2379, "total_steps": 17941, "loss": 1.5938, "learning_rate": 9.661206010196624e-05, "epoch": 0.132601304275124, "percentage": 13.26, "elapsed_time": "5:37:56", "remaining_time": "1 day, 12:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2380, "total_steps": 17941, "loss": 2.0283, "learning_rate": 9.660883747668034e-05, "epoch": 0.13265704252828717, "percentage": 13.27, "elapsed_time": "5:38:04", "remaining_time": "1 day, 12:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2381, "total_steps": 17941, "loss": 1.8549, "learning_rate": 9.660561337323385e-05, "epoch": 0.1327127807814503, "percentage": 13.27, "elapsed_time": "5:38:13", "remaining_time": "1 day, 12:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2382, "total_steps": 17941, "loss": 2.0152, "learning_rate": 9.660238779172905e-05, "epoch": 0.13276851903461345, "percentage": 13.28, "elapsed_time": "5:38:21", "remaining_time": "1 day, 12:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2383, "total_steps": 17941, "loss": 1.7353, "learning_rate": 9.65991607322682e-05, "epoch": 0.1328242572877766, "percentage": 13.28, "elapsed_time": "5:38:30", "remaining_time": "1 day, 12:50:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2384, "total_steps": 17941, "loss": 1.6361, "learning_rate": 9.659593219495368e-05, "epoch": 0.13287999554093974, "percentage": 13.29, "elapsed_time": "5:38:38", "remaining_time": "1 day, 12:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2385, "total_steps": 17941, "loss": 1.682, "learning_rate": 9.659270217988786e-05, "epoch": 0.1329357337941029, "percentage": 13.29, "elapsed_time": "5:38:47", "remaining_time": "1 day, 12:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2386, "total_steps": 17941, "loss": 1.5736, "learning_rate": 9.658947068717316e-05, "epoch": 0.13299147204726605, "percentage": 13.3, "elapsed_time": "5:38:55", "remaining_time": "1 day, 12:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2387, "total_steps": 17941, "loss": 1.9172, "learning_rate": 9.658623771691211e-05, "epoch": 0.13304721030042918, "percentage": 13.3, "elapsed_time": "5:39:04", "remaining_time": "1 day, 12:49:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2388, "total_steps": 17941, "loss": 1.7751, "learning_rate": 9.658300326920722e-05, "epoch": 0.13310294855359234, "percentage": 13.31, "elapsed_time": "5:39:12", "remaining_time": "1 day, 12:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2389, "total_steps": 17941, "loss": 1.875, "learning_rate": 9.657976734416106e-05, "epoch": 0.13315868680675547, "percentage": 13.32, "elapsed_time": "5:39:21", "remaining_time": "1 day, 12:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2390, "total_steps": 17941, "loss": 1.7631, "learning_rate": 9.657652994187625e-05, "epoch": 0.13321442505991862, "percentage": 13.32, "elapsed_time": "5:39:30", "remaining_time": "1 day, 12:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2391, "total_steps": 17941, "loss": 1.6134, "learning_rate": 9.657329106245547e-05, "epoch": 0.13327016331308178, "percentage": 13.33, "elapsed_time": "5:39:39", "remaining_time": "1 day, 12:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2392, "total_steps": 17941, "loss": 1.7501, "learning_rate": 9.657005070600144e-05, "epoch": 0.1333259015662449, "percentage": 13.33, "elapsed_time": "5:39:47", "remaining_time": "1 day, 12:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2393, "total_steps": 17941, "loss": 1.7283, "learning_rate": 9.656680887261693e-05, "epoch": 0.13338163981940807, "percentage": 13.34, "elapsed_time": "5:39:55", "remaining_time": "1 day, 12:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2394, "total_steps": 17941, "loss": 1.7897, "learning_rate": 9.656356556240473e-05, "epoch": 0.1334373780725712, "percentage": 13.34, "elapsed_time": "5:40:04", "remaining_time": "1 day, 12:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2395, "total_steps": 17941, "loss": 1.7089, "learning_rate": 9.656032077546772e-05, "epoch": 0.13349311632573435, "percentage": 13.35, "elapsed_time": "5:40:12", "remaining_time": "1 day, 12:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2396, "total_steps": 17941, "loss": 1.8664, "learning_rate": 9.655707451190883e-05, "epoch": 0.1335488545788975, "percentage": 13.35, "elapsed_time": "5:40:21", "remaining_time": "1 day, 12:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2397, "total_steps": 17941, "loss": 1.5199, "learning_rate": 9.655382677183095e-05, "epoch": 0.13360459283206064, "percentage": 13.36, "elapsed_time": "5:40:29", "remaining_time": "1 day, 12:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2398, "total_steps": 17941, "loss": 1.9733, "learning_rate": 9.655057755533712e-05, "epoch": 0.1336603310852238, "percentage": 13.37, "elapsed_time": "5:40:38", "remaining_time": "1 day, 12:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2399, "total_steps": 17941, "loss": 1.8281, "learning_rate": 9.654732686253039e-05, "epoch": 0.13371606933838692, "percentage": 13.37, "elapsed_time": "5:40:46", "remaining_time": "1 day, 12:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2400, "total_steps": 17941, "loss": 1.592, "learning_rate": 9.654407469351383e-05, "epoch": 0.13377180759155008, "percentage": 13.38, "elapsed_time": "5:40:55", "remaining_time": "1 day, 12:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2401, "total_steps": 17941, "loss": 1.8503, "learning_rate": 9.654082104839059e-05, "epoch": 0.13382754584471324, "percentage": 13.38, "elapsed_time": "5:41:03", "remaining_time": "1 day, 12:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2402, "total_steps": 17941, "loss": 1.8579, "learning_rate": 9.653756592726386e-05, "epoch": 0.13388328409787636, "percentage": 13.39, "elapsed_time": "5:41:12", "remaining_time": "1 day, 12:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2403, "total_steps": 17941, "loss": 1.8618, "learning_rate": 9.653430933023689e-05, "epoch": 0.13393902235103952, "percentage": 13.39, "elapsed_time": "5:41:20", "remaining_time": "1 day, 12:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2404, "total_steps": 17941, "loss": 1.6213, "learning_rate": 9.653105125741292e-05, "epoch": 0.13399476060420265, "percentage": 13.4, "elapsed_time": "5:41:29", "remaining_time": "1 day, 12:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2405, "total_steps": 17941, "loss": 1.6255, "learning_rate": 9.65277917088953e-05, "epoch": 0.1340504988573658, "percentage": 13.41, "elapsed_time": "5:41:37", "remaining_time": "1 day, 12:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2406, "total_steps": 17941, "loss": 1.5653, "learning_rate": 9.652453068478741e-05, "epoch": 0.13410623711052896, "percentage": 13.41, "elapsed_time": "5:41:46", "remaining_time": "1 day, 12:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2407, "total_steps": 17941, "loss": 2.0985, "learning_rate": 9.652126818519266e-05, "epoch": 0.1341619753636921, "percentage": 13.42, "elapsed_time": "5:41:54", "remaining_time": "1 day, 12:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2408, "total_steps": 17941, "loss": 1.9636, "learning_rate": 9.651800421021453e-05, "epoch": 0.13421771361685525, "percentage": 13.42, "elapsed_time": "5:42:02", "remaining_time": "1 day, 12:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2409, "total_steps": 17941, "loss": 1.7129, "learning_rate": 9.651473875995651e-05, "epoch": 0.1342734518700184, "percentage": 13.43, "elapsed_time": "5:42:11", "remaining_time": "1 day, 12:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2410, "total_steps": 17941, "loss": 1.5304, "learning_rate": 9.651147183452219e-05, "epoch": 0.13432919012318154, "percentage": 13.43, "elapsed_time": "5:42:19", "remaining_time": "1 day, 12:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2411, "total_steps": 17941, "loss": 1.7844, "learning_rate": 9.650820343401515e-05, "epoch": 0.1343849283763447, "percentage": 13.44, "elapsed_time": "5:42:28", "remaining_time": "1 day, 12:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2412, "total_steps": 17941, "loss": 1.8585, "learning_rate": 9.650493355853906e-05, "epoch": 0.13444066662950782, "percentage": 13.44, "elapsed_time": "5:42:36", "remaining_time": "1 day, 12:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2413, "total_steps": 17941, "loss": 1.4576, "learning_rate": 9.650166220819764e-05, "epoch": 0.13449640488267098, "percentage": 13.45, "elapsed_time": "5:42:45", "remaining_time": "1 day, 12:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2414, "total_steps": 17941, "loss": 1.6994, "learning_rate": 9.64983893830946e-05, "epoch": 0.13455214313583413, "percentage": 13.46, "elapsed_time": "5:42:53", "remaining_time": "1 day, 12:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2415, "total_steps": 17941, "loss": 1.6614, "learning_rate": 9.649511508333375e-05, "epoch": 0.13460788138899726, "percentage": 13.46, "elapsed_time": "5:43:02", "remaining_time": "1 day, 12:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2416, "total_steps": 17941, "loss": 1.56, "learning_rate": 9.649183930901895e-05, "epoch": 0.13466361964216042, "percentage": 13.47, "elapsed_time": "5:43:11", "remaining_time": "1 day, 12:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2417, "total_steps": 17941, "loss": 1.7004, "learning_rate": 9.648856206025407e-05, "epoch": 0.13471935789532355, "percentage": 13.47, "elapsed_time": "5:43:19", "remaining_time": "1 day, 12:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2418, "total_steps": 17941, "loss": 1.7206, "learning_rate": 9.648528333714304e-05, "epoch": 0.1347750961484867, "percentage": 13.48, "elapsed_time": "5:43:28", "remaining_time": "1 day, 12:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2419, "total_steps": 17941, "loss": 1.757, "learning_rate": 9.648200313978986e-05, "epoch": 0.13483083440164986, "percentage": 13.48, "elapsed_time": "5:43:36", "remaining_time": "1 day, 12:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2420, "total_steps": 17941, "loss": 1.7236, "learning_rate": 9.647872146829855e-05, "epoch": 0.134886572654813, "percentage": 13.49, "elapsed_time": "5:43:45", "remaining_time": "1 day, 12:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2421, "total_steps": 17941, "loss": 1.7274, "learning_rate": 9.647543832277317e-05, "epoch": 0.13494231090797615, "percentage": 13.49, "elapsed_time": "5:43:53", "remaining_time": "1 day, 12:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2422, "total_steps": 17941, "loss": 1.9507, "learning_rate": 9.647215370331786e-05, "epoch": 0.13499804916113928, "percentage": 13.5, "elapsed_time": "5:44:02", "remaining_time": "1 day, 12:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2423, "total_steps": 17941, "loss": 1.9476, "learning_rate": 9.646886761003679e-05, "epoch": 0.13505378741430243, "percentage": 13.51, "elapsed_time": "5:44:10", "remaining_time": "1 day, 12:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2424, "total_steps": 17941, "loss": 1.7836, "learning_rate": 9.646558004303419e-05, "epoch": 0.1351095256674656, "percentage": 13.51, "elapsed_time": "5:44:19", "remaining_time": "1 day, 12:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2425, "total_steps": 17941, "loss": 1.7664, "learning_rate": 9.646229100241429e-05, "epoch": 0.13516526392062872, "percentage": 13.52, "elapsed_time": "5:44:27", "remaining_time": "1 day, 12:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2426, "total_steps": 17941, "loss": 2.0063, "learning_rate": 9.64590004882814e-05, "epoch": 0.13522100217379188, "percentage": 13.52, "elapsed_time": "5:44:36", "remaining_time": "1 day, 12:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2427, "total_steps": 17941, "loss": 1.8132, "learning_rate": 9.64557085007399e-05, "epoch": 0.135276740426955, "percentage": 13.53, "elapsed_time": "5:44:44", "remaining_time": "1 day, 12:43:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2428, "total_steps": 17941, "loss": 1.4198, "learning_rate": 9.64524150398942e-05, "epoch": 0.13533247868011816, "percentage": 13.53, "elapsed_time": "5:44:53", "remaining_time": "1 day, 12:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2429, "total_steps": 17941, "loss": 1.6062, "learning_rate": 9.64491201058487e-05, "epoch": 0.13538821693328132, "percentage": 13.54, "elapsed_time": "5:45:02", "remaining_time": "1 day, 12:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2430, "total_steps": 17941, "loss": 1.8179, "learning_rate": 9.644582369870794e-05, "epoch": 0.13544395518644445, "percentage": 13.54, "elapsed_time": "5:45:10", "remaining_time": "1 day, 12:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2431, "total_steps": 17941, "loss": 1.9697, "learning_rate": 9.644252581857647e-05, "epoch": 0.1354996934396076, "percentage": 13.55, "elapsed_time": "5:45:18", "remaining_time": "1 day, 12:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2432, "total_steps": 17941, "loss": 1.6746, "learning_rate": 9.643922646555883e-05, "epoch": 0.13555543169277076, "percentage": 13.56, "elapsed_time": "5:45:27", "remaining_time": "1 day, 12:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2433, "total_steps": 17941, "loss": 1.6561, "learning_rate": 9.64359256397597e-05, "epoch": 0.1356111699459339, "percentage": 13.56, "elapsed_time": "5:45:35", "remaining_time": "1 day, 12:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2434, "total_steps": 17941, "loss": 1.577, "learning_rate": 9.643262334128374e-05, "epoch": 0.13566690819909705, "percentage": 13.57, "elapsed_time": "5:45:44", "remaining_time": "1 day, 12:42:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2435, "total_steps": 17941, "loss": 1.6821, "learning_rate": 9.642931957023569e-05, "epoch": 0.13572264645226018, "percentage": 13.57, "elapsed_time": "5:45:53", "remaining_time": "1 day, 12:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2436, "total_steps": 17941, "loss": 1.4476, "learning_rate": 9.642601432672034e-05, "epoch": 0.13577838470542333, "percentage": 13.58, "elapsed_time": "5:46:01", "remaining_time": "1 day, 12:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2437, "total_steps": 17941, "loss": 1.9406, "learning_rate": 9.642270761084249e-05, "epoch": 0.1358341229585865, "percentage": 13.58, "elapsed_time": "5:46:10", "remaining_time": "1 day, 12:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2438, "total_steps": 17941, "loss": 1.6538, "learning_rate": 9.641939942270701e-05, "epoch": 0.13588986121174962, "percentage": 13.59, "elapsed_time": "5:46:18", "remaining_time": "1 day, 12:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2439, "total_steps": 17941, "loss": 1.8208, "learning_rate": 9.641608976241883e-05, "epoch": 0.13594559946491278, "percentage": 13.59, "elapsed_time": "5:46:27", "remaining_time": "1 day, 12:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2440, "total_steps": 17941, "loss": 1.6889, "learning_rate": 9.64127786300829e-05, "epoch": 0.1360013377180759, "percentage": 13.6, "elapsed_time": "5:46:36", "remaining_time": "1 day, 12:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2441, "total_steps": 17941, "loss": 2.0888, "learning_rate": 9.640946602580426e-05, "epoch": 0.13605707597123906, "percentage": 13.61, "elapsed_time": "5:46:44", "remaining_time": "1 day, 12:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2442, "total_steps": 17941, "loss": 1.7068, "learning_rate": 9.640615194968791e-05, "epoch": 0.13611281422440222, "percentage": 13.61, "elapsed_time": "5:46:53", "remaining_time": "1 day, 12:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2443, "total_steps": 17941, "loss": 1.7328, "learning_rate": 9.640283640183903e-05, "epoch": 0.13616855247756535, "percentage": 13.62, "elapsed_time": "5:47:01", "remaining_time": "1 day, 12:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2444, "total_steps": 17941, "loss": 1.7062, "learning_rate": 9.639951938236269e-05, "epoch": 0.1362242907307285, "percentage": 13.62, "elapsed_time": "5:47:10", "remaining_time": "1 day, 12:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2445, "total_steps": 17941, "loss": 1.8633, "learning_rate": 9.639620089136413e-05, "epoch": 0.13628002898389163, "percentage": 13.63, "elapsed_time": "5:47:18", "remaining_time": "1 day, 12:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2446, "total_steps": 17941, "loss": 1.9126, "learning_rate": 9.63928809289486e-05, "epoch": 0.1363357672370548, "percentage": 13.63, "elapsed_time": "5:47:27", "remaining_time": "1 day, 12:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2447, "total_steps": 17941, "loss": 1.6795, "learning_rate": 9.638955949522137e-05, "epoch": 0.13639150549021795, "percentage": 13.64, "elapsed_time": "5:47:35", "remaining_time": "1 day, 12:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2448, "total_steps": 17941, "loss": 1.008, "learning_rate": 9.638623659028779e-05, "epoch": 0.13644724374338107, "percentage": 13.64, "elapsed_time": "5:47:44", "remaining_time": "1 day, 12:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2449, "total_steps": 17941, "loss": 1.9597, "learning_rate": 9.63829122142532e-05, "epoch": 0.13650298199654423, "percentage": 13.65, "elapsed_time": "5:47:52", "remaining_time": "1 day, 12:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2450, "total_steps": 17941, "loss": 1.8801, "learning_rate": 9.637958636722311e-05, "epoch": 0.13655872024970736, "percentage": 13.66, "elapsed_time": "5:48:01", "remaining_time": "1 day, 12:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2451, "total_steps": 17941, "loss": 1.6802, "learning_rate": 9.637625904930292e-05, "epoch": 0.13661445850287052, "percentage": 13.66, "elapsed_time": "5:48:09", "remaining_time": "1 day, 12:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2452, "total_steps": 17941, "loss": 1.8041, "learning_rate": 9.63729302605982e-05, "epoch": 0.13667019675603367, "percentage": 13.67, "elapsed_time": "5:48:18", "remaining_time": "1 day, 12:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2453, "total_steps": 17941, "loss": 1.7381, "learning_rate": 9.636960000121451e-05, "epoch": 0.1367259350091968, "percentage": 13.67, "elapsed_time": "5:48:27", "remaining_time": "1 day, 12:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2454, "total_steps": 17941, "loss": 1.8356, "learning_rate": 9.636626827125745e-05, "epoch": 0.13678167326235996, "percentage": 13.68, "elapsed_time": "5:48:35", "remaining_time": "1 day, 12:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2455, "total_steps": 17941, "loss": 1.8636, "learning_rate": 9.63629350708327e-05, "epoch": 0.13683741151552312, "percentage": 13.68, "elapsed_time": "5:48:43", "remaining_time": "1 day, 12:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2456, "total_steps": 17941, "loss": 2.0967, "learning_rate": 9.635960040004597e-05, "epoch": 0.13689314976868625, "percentage": 13.69, "elapsed_time": "5:48:52", "remaining_time": "1 day, 12:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2457, "total_steps": 17941, "loss": 1.8931, "learning_rate": 9.635626425900301e-05, "epoch": 0.1369488880218494, "percentage": 13.69, "elapsed_time": "5:49:00", "remaining_time": "1 day, 12:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2458, "total_steps": 17941, "loss": 1.6546, "learning_rate": 9.635292664780962e-05, "epoch": 0.13700462627501253, "percentage": 13.7, "elapsed_time": "5:49:09", "remaining_time": "1 day, 12:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2459, "total_steps": 17941, "loss": 1.7135, "learning_rate": 9.634958756657165e-05, "epoch": 0.1370603645281757, "percentage": 13.71, "elapsed_time": "5:49:18", "remaining_time": "1 day, 12:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2460, "total_steps": 17941, "loss": 1.5297, "learning_rate": 9.634624701539498e-05, "epoch": 0.13711610278133884, "percentage": 13.71, "elapsed_time": "5:49:26", "remaining_time": "1 day, 12:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2461, "total_steps": 17941, "loss": 1.9089, "learning_rate": 9.63429049943856e-05, "epoch": 0.13717184103450197, "percentage": 13.72, "elapsed_time": "5:49:34", "remaining_time": "1 day, 12:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2462, "total_steps": 17941, "loss": 1.7987, "learning_rate": 9.633956150364947e-05, "epoch": 0.13722757928766513, "percentage": 13.72, "elapsed_time": "5:49:43", "remaining_time": "1 day, 12:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2463, "total_steps": 17941, "loss": 1.7035, "learning_rate": 9.633621654329261e-05, "epoch": 0.13728331754082826, "percentage": 13.73, "elapsed_time": "5:49:51", "remaining_time": "1 day, 12:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2464, "total_steps": 17941, "loss": 1.6676, "learning_rate": 9.633287011342113e-05, "epoch": 0.13733905579399142, "percentage": 13.73, "elapsed_time": "5:50:00", "remaining_time": "1 day, 12:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2465, "total_steps": 17941, "loss": 1.9683, "learning_rate": 9.632952221414116e-05, "epoch": 0.13739479404715457, "percentage": 13.74, "elapsed_time": "5:50:08", "remaining_time": "1 day, 12:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2466, "total_steps": 17941, "loss": 1.9232, "learning_rate": 9.632617284555886e-05, "epoch": 0.1374505323003177, "percentage": 13.75, "elapsed_time": "5:50:17", "remaining_time": "1 day, 12:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2467, "total_steps": 17941, "loss": 1.8352, "learning_rate": 9.632282200778045e-05, "epoch": 0.13750627055348086, "percentage": 13.75, "elapsed_time": "5:50:26", "remaining_time": "1 day, 12:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2468, "total_steps": 17941, "loss": 1.7636, "learning_rate": 9.631946970091221e-05, "epoch": 0.137562008806644, "percentage": 13.76, "elapsed_time": "5:50:34", "remaining_time": "1 day, 12:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2469, "total_steps": 17941, "loss": 1.7929, "learning_rate": 9.631611592506046e-05, "epoch": 0.13761774705980714, "percentage": 13.76, "elapsed_time": "5:50:43", "remaining_time": "1 day, 12:37:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2470, "total_steps": 17941, "loss": 1.89, "learning_rate": 9.631276068033154e-05, "epoch": 0.1376734853129703, "percentage": 13.77, "elapsed_time": "5:50:51", "remaining_time": "1 day, 12:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2471, "total_steps": 17941, "loss": 1.6766, "learning_rate": 9.630940396683188e-05, "epoch": 0.13772922356613343, "percentage": 13.77, "elapsed_time": "5:51:00", "remaining_time": "1 day, 12:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2472, "total_steps": 17941, "loss": 1.6168, "learning_rate": 9.630604578466794e-05, "epoch": 0.1377849618192966, "percentage": 13.78, "elapsed_time": "5:51:08", "remaining_time": "1 day, 12:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2473, "total_steps": 17941, "loss": 1.5592, "learning_rate": 9.63026861339462e-05, "epoch": 0.13784070007245972, "percentage": 13.78, "elapsed_time": "5:51:17", "remaining_time": "1 day, 12:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2474, "total_steps": 17941, "loss": 2.0793, "learning_rate": 9.629932501477321e-05, "epoch": 0.13789643832562287, "percentage": 13.79, "elapsed_time": "5:51:25", "remaining_time": "1 day, 12:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2475, "total_steps": 17941, "loss": 1.6693, "learning_rate": 9.629596242725558e-05, "epoch": 0.13795217657878603, "percentage": 13.8, "elapsed_time": "5:51:34", "remaining_time": "1 day, 12:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2476, "total_steps": 17941, "loss": 1.7398, "learning_rate": 9.629259837149995e-05, "epoch": 0.13800791483194916, "percentage": 13.8, "elapsed_time": "5:51:42", "remaining_time": "1 day, 12:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2477, "total_steps": 17941, "loss": 1.6665, "learning_rate": 9.6289232847613e-05, "epoch": 0.13806365308511231, "percentage": 13.81, "elapsed_time": "5:51:51", "remaining_time": "1 day, 12:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2478, "total_steps": 17941, "loss": 1.8411, "learning_rate": 9.628586585570149e-05, "epoch": 0.13811939133827547, "percentage": 13.81, "elapsed_time": "5:51:59", "remaining_time": "1 day, 12:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2479, "total_steps": 17941, "loss": 1.8821, "learning_rate": 9.628249739587217e-05, "epoch": 0.1381751295914386, "percentage": 13.82, "elapsed_time": "5:52:07", "remaining_time": "1 day, 12:36:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2480, "total_steps": 17941, "loss": 1.6075, "learning_rate": 9.627912746823187e-05, "epoch": 0.13823086784460176, "percentage": 13.82, "elapsed_time": "5:52:16", "remaining_time": "1 day, 12:36:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2481, "total_steps": 17941, "loss": 1.735, "learning_rate": 9.627575607288745e-05, "epoch": 0.13828660609776489, "percentage": 13.83, "elapsed_time": "5:52:24", "remaining_time": "1 day, 12:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2482, "total_steps": 17941, "loss": 2.0207, "learning_rate": 9.627238320994589e-05, "epoch": 0.13834234435092804, "percentage": 13.83, "elapsed_time": "5:52:33", "remaining_time": "1 day, 12:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2483, "total_steps": 17941, "loss": 1.64, "learning_rate": 9.626900887951412e-05, "epoch": 0.1383980826040912, "percentage": 13.84, "elapsed_time": "5:52:41", "remaining_time": "1 day, 12:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2484, "total_steps": 17941, "loss": 1.9062, "learning_rate": 9.626563308169914e-05, "epoch": 0.13845382085725433, "percentage": 13.85, "elapsed_time": "5:52:50", "remaining_time": "1 day, 12:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2485, "total_steps": 17941, "loss": 1.4852, "learning_rate": 9.626225581660803e-05, "epoch": 0.13850955911041749, "percentage": 13.85, "elapsed_time": "5:52:58", "remaining_time": "1 day, 12:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2486, "total_steps": 17941, "loss": 1.7517, "learning_rate": 9.625887708434788e-05, "epoch": 0.13856529736358061, "percentage": 13.86, "elapsed_time": "5:53:07", "remaining_time": "1 day, 12:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2487, "total_steps": 17941, "loss": 1.6785, "learning_rate": 9.625549688502589e-05, "epoch": 0.13862103561674377, "percentage": 13.86, "elapsed_time": "5:53:16", "remaining_time": "1 day, 12:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2488, "total_steps": 17941, "loss": 1.7213, "learning_rate": 9.62521152187492e-05, "epoch": 0.13867677386990693, "percentage": 13.87, "elapsed_time": "5:53:25", "remaining_time": "1 day, 12:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2489, "total_steps": 17941, "loss": 1.6256, "learning_rate": 9.624873208562509e-05, "epoch": 0.13873251212307006, "percentage": 13.87, "elapsed_time": "5:53:33", "remaining_time": "1 day, 12:34:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2490, "total_steps": 17941, "loss": 1.9997, "learning_rate": 9.624534748576085e-05, "epoch": 0.1387882503762332, "percentage": 13.88, "elapsed_time": "5:53:42", "remaining_time": "1 day, 12:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2491, "total_steps": 17941, "loss": 1.6544, "learning_rate": 9.624196141926381e-05, "epoch": 0.13884398862939634, "percentage": 13.88, "elapsed_time": "5:53:50", "remaining_time": "1 day, 12:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2492, "total_steps": 17941, "loss": 1.8297, "learning_rate": 9.623857388624138e-05, "epoch": 0.1388997268825595, "percentage": 13.89, "elapsed_time": "5:53:59", "remaining_time": "1 day, 12:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2493, "total_steps": 17941, "loss": 1.9136, "learning_rate": 9.623518488680095e-05, "epoch": 0.13895546513572266, "percentage": 13.9, "elapsed_time": "5:54:07", "remaining_time": "1 day, 12:34:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2494, "total_steps": 17941, "loss": 1.7471, "learning_rate": 9.623179442105004e-05, "epoch": 0.13901120338888578, "percentage": 13.9, "elapsed_time": "5:54:16", "remaining_time": "1 day, 12:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2495, "total_steps": 17941, "loss": 1.6395, "learning_rate": 9.622840248909617e-05, "epoch": 0.13906694164204894, "percentage": 13.91, "elapsed_time": "5:54:24", "remaining_time": "1 day, 12:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2496, "total_steps": 17941, "loss": 1.6751, "learning_rate": 9.622500909104689e-05, "epoch": 0.13912267989521207, "percentage": 13.91, "elapsed_time": "5:54:33", "remaining_time": "1 day, 12:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2497, "total_steps": 17941, "loss": 1.7681, "learning_rate": 9.622161422700984e-05, "epoch": 0.13917841814837523, "percentage": 13.92, "elapsed_time": "5:54:41", "remaining_time": "1 day, 12:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2498, "total_steps": 17941, "loss": 1.6317, "learning_rate": 9.621821789709267e-05, "epoch": 0.13923415640153838, "percentage": 13.92, "elapsed_time": "5:54:49", "remaining_time": "1 day, 12:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2499, "total_steps": 17941, "loss": 1.8691, "learning_rate": 9.62148201014031e-05, "epoch": 0.1392898946547015, "percentage": 13.93, "elapsed_time": "5:54:58", "remaining_time": "1 day, 12:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 17941, "loss": 1.6061, "learning_rate": 9.621142084004889e-05, "epoch": 0.13934563290786467, "percentage": 13.93, "elapsed_time": "5:55:06", "remaining_time": "1 day, 12:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2501, "total_steps": 17941, "loss": 1.9551, "learning_rate": 9.620802011313785e-05, "epoch": 0.13940137116102783, "percentage": 13.94, "elapsed_time": "5:55:15", "remaining_time": "1 day, 12:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2502, "total_steps": 17941, "loss": 1.8419, "learning_rate": 9.620461792077782e-05, "epoch": 0.13945710941419096, "percentage": 13.95, "elapsed_time": "5:55:24", "remaining_time": "1 day, 12:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2503, "total_steps": 17941, "loss": 1.9454, "learning_rate": 9.620121426307669e-05, "epoch": 0.1395128476673541, "percentage": 13.95, "elapsed_time": "5:55:32", "remaining_time": "1 day, 12:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2504, "total_steps": 17941, "loss": 1.6189, "learning_rate": 9.619780914014242e-05, "epoch": 0.13956858592051724, "percentage": 13.96, "elapsed_time": "5:55:41", "remaining_time": "1 day, 12:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2505, "total_steps": 17941, "loss": 1.7667, "learning_rate": 9.619440255208301e-05, "epoch": 0.1396243241736804, "percentage": 13.96, "elapsed_time": "5:55:50", "remaining_time": "1 day, 12:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2506, "total_steps": 17941, "loss": 1.6797, "learning_rate": 9.619099449900646e-05, "epoch": 0.13968006242684355, "percentage": 13.97, "elapsed_time": "5:55:58", "remaining_time": "1 day, 12:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2507, "total_steps": 17941, "loss": 1.9559, "learning_rate": 9.618758498102089e-05, "epoch": 0.13973580068000668, "percentage": 13.97, "elapsed_time": "5:56:07", "remaining_time": "1 day, 12:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2508, "total_steps": 17941, "loss": 1.7971, "learning_rate": 9.618417399823441e-05, "epoch": 0.13979153893316984, "percentage": 13.98, "elapsed_time": "5:56:15", "remaining_time": "1 day, 12:32:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2509, "total_steps": 17941, "loss": 1.8631, "learning_rate": 9.618076155075521e-05, "epoch": 0.13984727718633297, "percentage": 13.98, "elapsed_time": "5:56:24", "remaining_time": "1 day, 12:32:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2510, "total_steps": 17941, "loss": 1.7487, "learning_rate": 9.617734763869151e-05, "epoch": 0.13990301543949613, "percentage": 13.99, "elapsed_time": "5:56:33", "remaining_time": "1 day, 12:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2511, "total_steps": 17941, "loss": 1.6849, "learning_rate": 9.617393226215157e-05, "epoch": 0.13995875369265928, "percentage": 14.0, "elapsed_time": "5:56:41", "remaining_time": "1 day, 12:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2512, "total_steps": 17941, "loss": 1.7637, "learning_rate": 9.617051542124371e-05, "epoch": 0.1400144919458224, "percentage": 14.0, "elapsed_time": "5:56:49", "remaining_time": "1 day, 12:31:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2513, "total_steps": 17941, "loss": 1.6303, "learning_rate": 9.61670971160763e-05, "epoch": 0.14007023019898557, "percentage": 14.01, "elapsed_time": "5:56:58", "remaining_time": "1 day, 12:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2514, "total_steps": 17941, "loss": 1.5709, "learning_rate": 9.616367734675772e-05, "epoch": 0.1401259684521487, "percentage": 14.01, "elapsed_time": "5:57:06", "remaining_time": "1 day, 12:31:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2515, "total_steps": 17941, "loss": 1.8456, "learning_rate": 9.616025611339647e-05, "epoch": 0.14018170670531185, "percentage": 14.02, "elapsed_time": "5:57:15", "remaining_time": "1 day, 12:31:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2516, "total_steps": 17941, "loss": 1.7499, "learning_rate": 9.615683341610103e-05, "epoch": 0.140237444958475, "percentage": 14.02, "elapsed_time": "5:57:24", "remaining_time": "1 day, 12:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2517, "total_steps": 17941, "loss": 1.6875, "learning_rate": 9.615340925497995e-05, "epoch": 0.14029318321163814, "percentage": 14.03, "elapsed_time": "5:57:32", "remaining_time": "1 day, 12:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2518, "total_steps": 17941, "loss": 1.6336, "learning_rate": 9.61499836301418e-05, "epoch": 0.1403489214648013, "percentage": 14.03, "elapsed_time": "5:57:41", "remaining_time": "1 day, 12:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2519, "total_steps": 17941, "loss": 1.8164, "learning_rate": 9.614655654169527e-05, "epoch": 0.14040465971796443, "percentage": 14.04, "elapsed_time": "5:57:49", "remaining_time": "1 day, 12:30:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2520, "total_steps": 17941, "loss": 1.626, "learning_rate": 9.6143127989749e-05, "epoch": 0.14046039797112758, "percentage": 14.05, "elapsed_time": "5:57:58", "remaining_time": "1 day, 12:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2521, "total_steps": 17941, "loss": 2.0087, "learning_rate": 9.613969797441173e-05, "epoch": 0.14051613622429074, "percentage": 14.05, "elapsed_time": "5:58:06", "remaining_time": "1 day, 12:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2522, "total_steps": 17941, "loss": 1.74, "learning_rate": 9.613626649579229e-05, "epoch": 0.14057187447745387, "percentage": 14.06, "elapsed_time": "5:58:14", "remaining_time": "1 day, 12:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2523, "total_steps": 17941, "loss": 1.7088, "learning_rate": 9.613283355399945e-05, "epoch": 0.14062761273061702, "percentage": 14.06, "elapsed_time": "5:58:24", "remaining_time": "1 day, 12:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2524, "total_steps": 17941, "loss": 1.5665, "learning_rate": 9.61293991491421e-05, "epoch": 0.14068335098378018, "percentage": 14.07, "elapsed_time": "5:58:32", "remaining_time": "1 day, 12:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2525, "total_steps": 17941, "loss": 1.3456, "learning_rate": 9.612596328132915e-05, "epoch": 0.1407390892369433, "percentage": 14.07, "elapsed_time": "5:58:40", "remaining_time": "1 day, 12:29:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2526, "total_steps": 17941, "loss": 1.6111, "learning_rate": 9.61225259506696e-05, "epoch": 0.14079482749010647, "percentage": 14.08, "elapsed_time": "5:58:49", "remaining_time": "1 day, 12:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2527, "total_steps": 17941, "loss": 1.9546, "learning_rate": 9.611908715727244e-05, "epoch": 0.1408505657432696, "percentage": 14.09, "elapsed_time": "5:58:57", "remaining_time": "1 day, 12:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2528, "total_steps": 17941, "loss": 1.8488, "learning_rate": 9.611564690124672e-05, "epoch": 0.14090630399643275, "percentage": 14.09, "elapsed_time": "5:59:06", "remaining_time": "1 day, 12:29:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2529, "total_steps": 17941, "loss": 1.7367, "learning_rate": 9.611220518270155e-05, "epoch": 0.1409620422495959, "percentage": 14.1, "elapsed_time": "5:59:15", "remaining_time": "1 day, 12:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2530, "total_steps": 17941, "loss": 1.5207, "learning_rate": 9.61087620017461e-05, "epoch": 0.14101778050275904, "percentage": 14.1, "elapsed_time": "5:59:24", "remaining_time": "1 day, 12:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2531, "total_steps": 17941, "loss": 1.6592, "learning_rate": 9.610531735848953e-05, "epoch": 0.1410735187559222, "percentage": 14.11, "elapsed_time": "5:59:32", "remaining_time": "1 day, 12:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2532, "total_steps": 17941, "loss": 1.7567, "learning_rate": 9.610187125304111e-05, "epoch": 0.14112925700908532, "percentage": 14.11, "elapsed_time": "5:59:41", "remaining_time": "1 day, 12:28:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2533, "total_steps": 17941, "loss": 1.7151, "learning_rate": 9.609842368551014e-05, "epoch": 0.14118499526224848, "percentage": 14.12, "elapsed_time": "5:59:49", "remaining_time": "1 day, 12:28:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2534, "total_steps": 17941, "loss": 1.9591, "learning_rate": 9.609497465600595e-05, "epoch": 0.14124073351541164, "percentage": 14.12, "elapsed_time": "5:59:58", "remaining_time": "1 day, 12:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2535, "total_steps": 17941, "loss": 1.7296, "learning_rate": 9.60915241646379e-05, "epoch": 0.14129647176857477, "percentage": 14.13, "elapsed_time": "6:00:06", "remaining_time": "1 day, 12:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2536, "total_steps": 17941, "loss": 1.7645, "learning_rate": 9.608807221151543e-05, "epoch": 0.14135221002173792, "percentage": 14.14, "elapsed_time": "6:00:14", "remaining_time": "1 day, 12:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2537, "total_steps": 17941, "loss": 1.8227, "learning_rate": 9.608461879674802e-05, "epoch": 0.14140794827490105, "percentage": 14.14, "elapsed_time": "6:00:23", "remaining_time": "1 day, 12:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2538, "total_steps": 17941, "loss": 1.6495, "learning_rate": 9.608116392044521e-05, "epoch": 0.1414636865280642, "percentage": 14.15, "elapsed_time": "6:00:32", "remaining_time": "1 day, 12:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2539, "total_steps": 17941, "loss": 1.9329, "learning_rate": 9.607770758271655e-05, "epoch": 0.14151942478122737, "percentage": 14.15, "elapsed_time": "6:00:40", "remaining_time": "1 day, 12:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2540, "total_steps": 17941, "loss": 1.8535, "learning_rate": 9.607424978367165e-05, "epoch": 0.1415751630343905, "percentage": 14.16, "elapsed_time": "6:00:49", "remaining_time": "1 day, 12:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2541, "total_steps": 17941, "loss": 1.6956, "learning_rate": 9.607079052342018e-05, "epoch": 0.14163090128755365, "percentage": 14.16, "elapsed_time": "6:00:57", "remaining_time": "1 day, 12:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2542, "total_steps": 17941, "loss": 1.6842, "learning_rate": 9.606732980207184e-05, "epoch": 0.1416866395407168, "percentage": 14.17, "elapsed_time": "6:01:06", "remaining_time": "1 day, 12:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2543, "total_steps": 17941, "loss": 1.778, "learning_rate": 9.606386761973641e-05, "epoch": 0.14174237779387994, "percentage": 14.17, "elapsed_time": "6:01:14", "remaining_time": "1 day, 12:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2544, "total_steps": 17941, "loss": 1.8492, "learning_rate": 9.606040397652365e-05, "epoch": 0.1417981160470431, "percentage": 14.18, "elapsed_time": "6:01:22", "remaining_time": "1 day, 12:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2545, "total_steps": 17941, "loss": 1.8428, "learning_rate": 9.605693887254343e-05, "epoch": 0.14185385430020622, "percentage": 14.19, "elapsed_time": "6:01:31", "remaining_time": "1 day, 12:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2546, "total_steps": 17941, "loss": 1.786, "learning_rate": 9.605347230790565e-05, "epoch": 0.14190959255336938, "percentage": 14.19, "elapsed_time": "6:01:39", "remaining_time": "1 day, 12:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2547, "total_steps": 17941, "loss": 1.5936, "learning_rate": 9.605000428272023e-05, "epoch": 0.14196533080653254, "percentage": 14.2, "elapsed_time": "6:01:48", "remaining_time": "1 day, 12:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2548, "total_steps": 17941, "loss": 1.8033, "learning_rate": 9.604653479709717e-05, "epoch": 0.14202106905969566, "percentage": 14.2, "elapsed_time": "6:01:56", "remaining_time": "1 day, 12:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2549, "total_steps": 17941, "loss": 1.5892, "learning_rate": 9.60430638511465e-05, "epoch": 0.14207680731285882, "percentage": 14.21, "elapsed_time": "6:02:05", "remaining_time": "1 day, 12:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2550, "total_steps": 17941, "loss": 1.6489, "learning_rate": 9.603959144497827e-05, "epoch": 0.14213254556602195, "percentage": 14.21, "elapsed_time": "6:02:14", "remaining_time": "1 day, 12:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2551, "total_steps": 17941, "loss": 1.4806, "learning_rate": 9.603611757870266e-05, "epoch": 0.1421882838191851, "percentage": 14.22, "elapsed_time": "6:02:22", "remaining_time": "1 day, 12:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2552, "total_steps": 17941, "loss": 1.7944, "learning_rate": 9.603264225242978e-05, "epoch": 0.14224402207234826, "percentage": 14.22, "elapsed_time": "6:02:31", "remaining_time": "1 day, 12:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2553, "total_steps": 17941, "loss": 1.828, "learning_rate": 9.60291654662699e-05, "epoch": 0.1422997603255114, "percentage": 14.23, "elapsed_time": "6:02:39", "remaining_time": "1 day, 12:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2554, "total_steps": 17941, "loss": 1.8621, "learning_rate": 9.602568722033326e-05, "epoch": 0.14235549857867455, "percentage": 14.24, "elapsed_time": "6:02:48", "remaining_time": "1 day, 12:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2555, "total_steps": 17941, "loss": 1.8829, "learning_rate": 9.602220751473015e-05, "epoch": 0.14241123683183768, "percentage": 14.24, "elapsed_time": "6:02:57", "remaining_time": "1 day, 12:25:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2556, "total_steps": 17941, "loss": 1.6547, "learning_rate": 9.601872634957096e-05, "epoch": 0.14246697508500084, "percentage": 14.25, "elapsed_time": "6:03:05", "remaining_time": "1 day, 12:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2557, "total_steps": 17941, "loss": 1.6629, "learning_rate": 9.601524372496608e-05, "epoch": 0.142522713338164, "percentage": 14.25, "elapsed_time": "6:03:13", "remaining_time": "1 day, 12:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2558, "total_steps": 17941, "loss": 1.8285, "learning_rate": 9.601175964102596e-05, "epoch": 0.14257845159132712, "percentage": 14.26, "elapsed_time": "6:03:22", "remaining_time": "1 day, 12:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2559, "total_steps": 17941, "loss": 1.9544, "learning_rate": 9.600827409786107e-05, "epoch": 0.14263418984449028, "percentage": 14.26, "elapsed_time": "6:03:30", "remaining_time": "1 day, 12:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2560, "total_steps": 17941, "loss": 1.5243, "learning_rate": 9.600478709558199e-05, "epoch": 0.1426899280976534, "percentage": 14.27, "elapsed_time": "6:03:39", "remaining_time": "1 day, 12:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2561, "total_steps": 17941, "loss": 1.6888, "learning_rate": 9.600129863429929e-05, "epoch": 0.14274566635081656, "percentage": 14.27, "elapsed_time": "6:03:48", "remaining_time": "1 day, 12:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2562, "total_steps": 17941, "loss": 1.8205, "learning_rate": 9.599780871412359e-05, "epoch": 0.14280140460397972, "percentage": 14.28, "elapsed_time": "6:03:56", "remaining_time": "1 day, 12:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2563, "total_steps": 17941, "loss": 1.69, "learning_rate": 9.59943173351656e-05, "epoch": 0.14285714285714285, "percentage": 14.29, "elapsed_time": "6:04:05", "remaining_time": "1 day, 12:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2564, "total_steps": 17941, "loss": 1.918, "learning_rate": 9.599082449753602e-05, "epoch": 0.142912881110306, "percentage": 14.29, "elapsed_time": "6:04:13", "remaining_time": "1 day, 12:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2565, "total_steps": 17941, "loss": 1.7039, "learning_rate": 9.598733020134562e-05, "epoch": 0.14296861936346916, "percentage": 14.3, "elapsed_time": "6:04:22", "remaining_time": "1 day, 12:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2566, "total_steps": 17941, "loss": 1.6948, "learning_rate": 9.598383444670526e-05, "epoch": 0.1430243576166323, "percentage": 14.3, "elapsed_time": "6:04:30", "remaining_time": "1 day, 12:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2567, "total_steps": 17941, "loss": 1.6666, "learning_rate": 9.598033723372575e-05, "epoch": 0.14308009586979545, "percentage": 14.31, "elapsed_time": "6:04:39", "remaining_time": "1 day, 12:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2568, "total_steps": 17941, "loss": 1.9023, "learning_rate": 9.597683856251804e-05, "epoch": 0.14313583412295858, "percentage": 14.31, "elapsed_time": "6:04:47", "remaining_time": "1 day, 12:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2569, "total_steps": 17941, "loss": 1.6297, "learning_rate": 9.597333843319309e-05, "epoch": 0.14319157237612173, "percentage": 14.32, "elapsed_time": "6:04:55", "remaining_time": "1 day, 12:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2570, "total_steps": 17941, "loss": 1.6558, "learning_rate": 9.596983684586186e-05, "epoch": 0.1432473106292849, "percentage": 14.32, "elapsed_time": "6:05:04", "remaining_time": "1 day, 12:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2571, "total_steps": 17941, "loss": 1.78, "learning_rate": 9.596633380063544e-05, "epoch": 0.14330304888244802, "percentage": 14.33, "elapsed_time": "6:05:12", "remaining_time": "1 day, 12:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2572, "total_steps": 17941, "loss": 1.848, "learning_rate": 9.596282929762492e-05, "epoch": 0.14335878713561118, "percentage": 14.34, "elapsed_time": "6:05:21", "remaining_time": "1 day, 12:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2573, "total_steps": 17941, "loss": 1.847, "learning_rate": 9.595932333694142e-05, "epoch": 0.1434145253887743, "percentage": 14.34, "elapsed_time": "6:05:29", "remaining_time": "1 day, 12:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2574, "total_steps": 17941, "loss": 1.713, "learning_rate": 9.595581591869616e-05, "epoch": 0.14347026364193746, "percentage": 14.35, "elapsed_time": "6:05:38", "remaining_time": "1 day, 12:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2575, "total_steps": 17941, "loss": 1.9647, "learning_rate": 9.595230704300035e-05, "epoch": 0.14352600189510062, "percentage": 14.35, "elapsed_time": "6:05:46", "remaining_time": "1 day, 12:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2576, "total_steps": 17941, "loss": 1.7378, "learning_rate": 9.594879670996528e-05, "epoch": 0.14358174014826375, "percentage": 14.36, "elapsed_time": "6:05:55", "remaining_time": "1 day, 12:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2577, "total_steps": 17941, "loss": 1.7663, "learning_rate": 9.594528491970228e-05, "epoch": 0.1436374784014269, "percentage": 14.36, "elapsed_time": "6:06:03", "remaining_time": "1 day, 12:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2578, "total_steps": 17941, "loss": 1.6068, "learning_rate": 9.594177167232273e-05, "epoch": 0.14369321665459003, "percentage": 14.37, "elapsed_time": "6:06:11", "remaining_time": "1 day, 12:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2579, "total_steps": 17941, "loss": 1.6527, "learning_rate": 9.593825696793803e-05, "epoch": 0.1437489549077532, "percentage": 14.37, "elapsed_time": "6:06:20", "remaining_time": "1 day, 12:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2580, "total_steps": 17941, "loss": 1.5839, "learning_rate": 9.593474080665968e-05, "epoch": 0.14380469316091635, "percentage": 14.38, "elapsed_time": "6:06:28", "remaining_time": "1 day, 12:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2581, "total_steps": 17941, "loss": 1.8217, "learning_rate": 9.593122318859915e-05, "epoch": 0.14386043141407948, "percentage": 14.39, "elapsed_time": "6:06:37", "remaining_time": "1 day, 12:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2582, "total_steps": 17941, "loss": 1.8395, "learning_rate": 9.592770411386802e-05, "epoch": 0.14391616966724263, "percentage": 14.39, "elapsed_time": "6:06:45", "remaining_time": "1 day, 12:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2583, "total_steps": 17941, "loss": 1.8477, "learning_rate": 9.592418358257789e-05, "epoch": 0.14397190792040576, "percentage": 14.4, "elapsed_time": "6:06:54", "remaining_time": "1 day, 12:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2584, "total_steps": 17941, "loss": 1.6152, "learning_rate": 9.592066159484043e-05, "epoch": 0.14402764617356892, "percentage": 14.4, "elapsed_time": "6:07:02", "remaining_time": "1 day, 12:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2585, "total_steps": 17941, "loss": 1.8558, "learning_rate": 9.59171381507673e-05, "epoch": 0.14408338442673208, "percentage": 14.41, "elapsed_time": "6:07:11", "remaining_time": "1 day, 12:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2586, "total_steps": 17941, "loss": 1.8752, "learning_rate": 9.591361325047028e-05, "epoch": 0.1441391226798952, "percentage": 14.41, "elapsed_time": "6:07:20", "remaining_time": "1 day, 12:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2587, "total_steps": 17941, "loss": 1.6977, "learning_rate": 9.591008689406114e-05, "epoch": 0.14419486093305836, "percentage": 14.42, "elapsed_time": "6:07:28", "remaining_time": "1 day, 12:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2588, "total_steps": 17941, "loss": 1.8379, "learning_rate": 9.59065590816517e-05, "epoch": 0.14425059918622152, "percentage": 14.43, "elapsed_time": "6:07:37", "remaining_time": "1 day, 12:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2589, "total_steps": 17941, "loss": 1.98, "learning_rate": 9.590302981335387e-05, "epoch": 0.14430633743938465, "percentage": 14.43, "elapsed_time": "6:07:46", "remaining_time": "1 day, 12:20:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2590, "total_steps": 17941, "loss": 1.7123, "learning_rate": 9.589949908927957e-05, "epoch": 0.1443620756925478, "percentage": 14.44, "elapsed_time": "6:07:54", "remaining_time": "1 day, 12:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2591, "total_steps": 17941, "loss": 1.8578, "learning_rate": 9.589596690954077e-05, "epoch": 0.14441781394571093, "percentage": 14.44, "elapsed_time": "6:08:02", "remaining_time": "1 day, 12:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2592, "total_steps": 17941, "loss": 1.7641, "learning_rate": 9.589243327424951e-05, "epoch": 0.1444735521988741, "percentage": 14.45, "elapsed_time": "6:08:11", "remaining_time": "1 day, 12:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2593, "total_steps": 17941, "loss": 1.6991, "learning_rate": 9.588889818351781e-05, "epoch": 0.14452929045203725, "percentage": 14.45, "elapsed_time": "6:08:19", "remaining_time": "1 day, 12:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2594, "total_steps": 17941, "loss": 1.7019, "learning_rate": 9.588536163745782e-05, "epoch": 0.14458502870520037, "percentage": 14.46, "elapsed_time": "6:08:28", "remaining_time": "1 day, 12:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2595, "total_steps": 17941, "loss": 1.6645, "learning_rate": 9.58818236361817e-05, "epoch": 0.14464076695836353, "percentage": 14.46, "elapsed_time": "6:08:36", "remaining_time": "1 day, 12:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2596, "total_steps": 17941, "loss": 2.0606, "learning_rate": 9.587828417980163e-05, "epoch": 0.14469650521152666, "percentage": 14.47, "elapsed_time": "6:08:45", "remaining_time": "1 day, 12:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2597, "total_steps": 17941, "loss": 1.8879, "learning_rate": 9.587474326842987e-05, "epoch": 0.14475224346468982, "percentage": 14.48, "elapsed_time": "6:08:54", "remaining_time": "1 day, 12:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2598, "total_steps": 17941, "loss": 1.6668, "learning_rate": 9.587120090217874e-05, "epoch": 0.14480798171785297, "percentage": 14.48, "elapsed_time": "6:09:02", "remaining_time": "1 day, 12:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2599, "total_steps": 17941, "loss": 1.6322, "learning_rate": 9.586765708116056e-05, "epoch": 0.1448637199710161, "percentage": 14.49, "elapsed_time": "6:09:10", "remaining_time": "1 day, 12:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2600, "total_steps": 17941, "loss": 1.7002, "learning_rate": 9.586411180548771e-05, "epoch": 0.14491945822417926, "percentage": 14.49, "elapsed_time": "6:09:19", "remaining_time": "1 day, 12:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2601, "total_steps": 17941, "loss": 1.8232, "learning_rate": 9.586056507527266e-05, "epoch": 0.1449751964773424, "percentage": 14.5, "elapsed_time": "6:09:27", "remaining_time": "1 day, 12:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2602, "total_steps": 17941, "loss": 1.7799, "learning_rate": 9.585701689062785e-05, "epoch": 0.14503093473050555, "percentage": 14.5, "elapsed_time": "6:09:36", "remaining_time": "1 day, 12:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2603, "total_steps": 17941, "loss": 1.5724, "learning_rate": 9.585346725166584e-05, "epoch": 0.1450866729836687, "percentage": 14.51, "elapsed_time": "6:09:44", "remaining_time": "1 day, 12:18:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2604, "total_steps": 17941, "loss": 1.898, "learning_rate": 9.584991615849921e-05, "epoch": 0.14514241123683183, "percentage": 14.51, "elapsed_time": "6:09:53", "remaining_time": "1 day, 12:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2605, "total_steps": 17941, "loss": 1.5643, "learning_rate": 9.584636361124054e-05, "epoch": 0.145198149489995, "percentage": 14.52, "elapsed_time": "6:10:02", "remaining_time": "1 day, 12:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2606, "total_steps": 17941, "loss": 1.575, "learning_rate": 9.584280961000253e-05, "epoch": 0.14525388774315812, "percentage": 14.53, "elapsed_time": "6:10:10", "remaining_time": "1 day, 12:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2607, "total_steps": 17941, "loss": 1.7932, "learning_rate": 9.583925415489787e-05, "epoch": 0.14530962599632127, "percentage": 14.53, "elapsed_time": "6:10:19", "remaining_time": "1 day, 12:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2608, "total_steps": 17941, "loss": 2.0627, "learning_rate": 9.583569724603934e-05, "epoch": 0.14536536424948443, "percentage": 14.54, "elapsed_time": "6:10:27", "remaining_time": "1 day, 12:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2609, "total_steps": 17941, "loss": 1.7767, "learning_rate": 9.583213888353972e-05, "epoch": 0.14542110250264756, "percentage": 14.54, "elapsed_time": "6:10:36", "remaining_time": "1 day, 12:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2610, "total_steps": 17941, "loss": 2.05, "learning_rate": 9.582857906751191e-05, "epoch": 0.14547684075581072, "percentage": 14.55, "elapsed_time": "6:10:44", "remaining_time": "1 day, 12:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2611, "total_steps": 17941, "loss": 1.7722, "learning_rate": 9.582501779806874e-05, "epoch": 0.14553257900897387, "percentage": 14.55, "elapsed_time": "6:10:53", "remaining_time": "1 day, 12:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2612, "total_steps": 17941, "loss": 1.6958, "learning_rate": 9.582145507532319e-05, "epoch": 0.145588317262137, "percentage": 14.56, "elapsed_time": "6:11:01", "remaining_time": "1 day, 12:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2613, "total_steps": 17941, "loss": 1.8401, "learning_rate": 9.581789089938825e-05, "epoch": 0.14564405551530016, "percentage": 14.56, "elapsed_time": "6:11:09", "remaining_time": "1 day, 12:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2614, "total_steps": 17941, "loss": 1.7684, "learning_rate": 9.581432527037693e-05, "epoch": 0.1456997937684633, "percentage": 14.57, "elapsed_time": "6:11:18", "remaining_time": "1 day, 12:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2615, "total_steps": 17941, "loss": 1.7435, "learning_rate": 9.581075818840234e-05, "epoch": 0.14575553202162644, "percentage": 14.58, "elapsed_time": "6:11:27", "remaining_time": "1 day, 12:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2616, "total_steps": 17941, "loss": 1.8191, "learning_rate": 9.58071896535776e-05, "epoch": 0.1458112702747896, "percentage": 14.58, "elapsed_time": "6:11:35", "remaining_time": "1 day, 12:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2617, "total_steps": 17941, "loss": 1.877, "learning_rate": 9.580361966601588e-05, "epoch": 0.14586700852795273, "percentage": 14.59, "elapsed_time": "6:11:44", "remaining_time": "1 day, 12:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2618, "total_steps": 17941, "loss": 1.6282, "learning_rate": 9.580004822583038e-05, "epoch": 0.1459227467811159, "percentage": 14.59, "elapsed_time": "6:11:52", "remaining_time": "1 day, 12:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2619, "total_steps": 17941, "loss": 1.7076, "learning_rate": 9.579647533313439e-05, "epoch": 0.14597848503427902, "percentage": 14.6, "elapsed_time": "6:12:01", "remaining_time": "1 day, 12:16:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2620, "total_steps": 17941, "loss": 1.6271, "learning_rate": 9.579290098804122e-05, "epoch": 0.14603422328744217, "percentage": 14.6, "elapsed_time": "6:12:09", "remaining_time": "1 day, 12:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2621, "total_steps": 17941, "loss": 1.8687, "learning_rate": 9.578932519066422e-05, "epoch": 0.14608996154060533, "percentage": 14.61, "elapsed_time": "6:12:17", "remaining_time": "1 day, 12:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2622, "total_steps": 17941, "loss": 1.6985, "learning_rate": 9.57857479411168e-05, "epoch": 0.14614569979376846, "percentage": 14.61, "elapsed_time": "6:12:26", "remaining_time": "1 day, 12:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2623, "total_steps": 17941, "loss": 1.7291, "learning_rate": 9.57821692395124e-05, "epoch": 0.14620143804693161, "percentage": 14.62, "elapsed_time": "6:12:34", "remaining_time": "1 day, 12:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2624, "total_steps": 17941, "loss": 1.729, "learning_rate": 9.577858908596451e-05, "epoch": 0.14625717630009474, "percentage": 14.63, "elapsed_time": "6:12:43", "remaining_time": "1 day, 12:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2625, "total_steps": 17941, "loss": 1.4164, "learning_rate": 9.57750074805867e-05, "epoch": 0.1463129145532579, "percentage": 14.63, "elapsed_time": "6:12:51", "remaining_time": "1 day, 12:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2626, "total_steps": 17941, "loss": 1.7282, "learning_rate": 9.577142442349254e-05, "epoch": 0.14636865280642106, "percentage": 14.64, "elapsed_time": "6:13:00", "remaining_time": "1 day, 12:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2627, "total_steps": 17941, "loss": 1.8092, "learning_rate": 9.576783991479565e-05, "epoch": 0.14642439105958419, "percentage": 14.64, "elapsed_time": "6:13:08", "remaining_time": "1 day, 12:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2628, "total_steps": 17941, "loss": 1.8241, "learning_rate": 9.576425395460973e-05, "epoch": 0.14648012931274734, "percentage": 14.65, "elapsed_time": "6:13:17", "remaining_time": "1 day, 12:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2629, "total_steps": 17941, "loss": 1.9425, "learning_rate": 9.576066654304849e-05, "epoch": 0.14653586756591047, "percentage": 14.65, "elapsed_time": "6:13:25", "remaining_time": "1 day, 12:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2630, "total_steps": 17941, "loss": 1.4287, "learning_rate": 9.575707768022572e-05, "epoch": 0.14659160581907363, "percentage": 14.66, "elapsed_time": "6:13:34", "remaining_time": "1 day, 12:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2631, "total_steps": 17941, "loss": 1.9308, "learning_rate": 9.575348736625523e-05, "epoch": 0.14664734407223678, "percentage": 14.66, "elapsed_time": "6:13:42", "remaining_time": "1 day, 12:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2632, "total_steps": 17941, "loss": 1.8831, "learning_rate": 9.574989560125087e-05, "epoch": 0.14670308232539991, "percentage": 14.67, "elapsed_time": "6:13:51", "remaining_time": "1 day, 12:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2633, "total_steps": 17941, "loss": 1.5871, "learning_rate": 9.574630238532658e-05, "epoch": 0.14675882057856307, "percentage": 14.68, "elapsed_time": "6:14:00", "remaining_time": "1 day, 12:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2634, "total_steps": 17941, "loss": 1.8394, "learning_rate": 9.574270771859628e-05, "epoch": 0.14681455883172623, "percentage": 14.68, "elapsed_time": "6:14:08", "remaining_time": "1 day, 12:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2635, "total_steps": 17941, "loss": 1.8598, "learning_rate": 9.5739111601174e-05, "epoch": 0.14687029708488936, "percentage": 14.69, "elapsed_time": "6:14:17", "remaining_time": "1 day, 12:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2636, "total_steps": 17941, "loss": 1.5862, "learning_rate": 9.573551403317378e-05, "epoch": 0.1469260353380525, "percentage": 14.69, "elapsed_time": "6:14:25", "remaining_time": "1 day, 12:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2637, "total_steps": 17941, "loss": 1.8026, "learning_rate": 9.573191501470971e-05, "epoch": 0.14698177359121564, "percentage": 14.7, "elapsed_time": "6:14:33", "remaining_time": "1 day, 12:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2638, "total_steps": 17941, "loss": 1.7529, "learning_rate": 9.572831454589592e-05, "epoch": 0.1470375118443788, "percentage": 14.7, "elapsed_time": "6:14:42", "remaining_time": "1 day, 12:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2639, "total_steps": 17941, "loss": 1.7851, "learning_rate": 9.572471262684662e-05, "epoch": 0.14709325009754196, "percentage": 14.71, "elapsed_time": "6:14:50", "remaining_time": "1 day, 12:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2640, "total_steps": 17941, "loss": 1.7617, "learning_rate": 9.572110925767601e-05, "epoch": 0.14714898835070508, "percentage": 14.71, "elapsed_time": "6:14:59", "remaining_time": "1 day, 12:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2641, "total_steps": 17941, "loss": 1.6418, "learning_rate": 9.571750443849841e-05, "epoch": 0.14720472660386824, "percentage": 14.72, "elapsed_time": "6:15:07", "remaining_time": "1 day, 12:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2642, "total_steps": 17941, "loss": 2.0309, "learning_rate": 9.571389816942811e-05, "epoch": 0.14726046485703137, "percentage": 14.73, "elapsed_time": "6:15:16", "remaining_time": "1 day, 12:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2643, "total_steps": 17941, "loss": 1.8764, "learning_rate": 9.571029045057948e-05, "epoch": 0.14731620311019453, "percentage": 14.73, "elapsed_time": "6:15:25", "remaining_time": "1 day, 12:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2644, "total_steps": 17941, "loss": 1.6183, "learning_rate": 9.570668128206697e-05, "epoch": 0.14737194136335768, "percentage": 14.74, "elapsed_time": "6:15:33", "remaining_time": "1 day, 12:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2645, "total_steps": 17941, "loss": 1.738, "learning_rate": 9.5703070664005e-05, "epoch": 0.1474276796165208, "percentage": 14.74, "elapsed_time": "6:15:42", "remaining_time": "1 day, 12:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2646, "total_steps": 17941, "loss": 1.7379, "learning_rate": 9.56994585965081e-05, "epoch": 0.14748341786968397, "percentage": 14.75, "elapsed_time": "6:15:50", "remaining_time": "1 day, 12:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2647, "total_steps": 17941, "loss": 1.6596, "learning_rate": 9.569584507969082e-05, "epoch": 0.1475391561228471, "percentage": 14.75, "elapsed_time": "6:15:59", "remaining_time": "1 day, 12:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2648, "total_steps": 17941, "loss": 1.7998, "learning_rate": 9.569223011366776e-05, "epoch": 0.14759489437601025, "percentage": 14.76, "elapsed_time": "6:16:07", "remaining_time": "1 day, 12:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2649, "total_steps": 17941, "loss": 1.5843, "learning_rate": 9.568861369855357e-05, "epoch": 0.1476506326291734, "percentage": 14.77, "elapsed_time": "6:16:16", "remaining_time": "1 day, 12:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2650, "total_steps": 17941, "loss": 1.6966, "learning_rate": 9.568499583446293e-05, "epoch": 0.14770637088233654, "percentage": 14.77, "elapsed_time": "6:16:24", "remaining_time": "1 day, 12:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2651, "total_steps": 17941, "loss": 1.7318, "learning_rate": 9.568137652151059e-05, "epoch": 0.1477621091354997, "percentage": 14.78, "elapsed_time": "6:16:33", "remaining_time": "1 day, 12:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2652, "total_steps": 17941, "loss": 1.8252, "learning_rate": 9.567775575981133e-05, "epoch": 0.14781784738866283, "percentage": 14.78, "elapsed_time": "6:16:42", "remaining_time": "1 day, 12:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2653, "total_steps": 17941, "loss": 1.8455, "learning_rate": 9.567413354947997e-05, "epoch": 0.14787358564182598, "percentage": 14.79, "elapsed_time": "6:16:50", "remaining_time": "1 day, 12:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2654, "total_steps": 17941, "loss": 1.8003, "learning_rate": 9.56705098906314e-05, "epoch": 0.14792932389498914, "percentage": 14.79, "elapsed_time": "6:16:59", "remaining_time": "1 day, 12:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2655, "total_steps": 17941, "loss": 1.765, "learning_rate": 9.566688478338053e-05, "epoch": 0.14798506214815227, "percentage": 14.8, "elapsed_time": "6:17:07", "remaining_time": "1 day, 12:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2656, "total_steps": 17941, "loss": 1.686, "learning_rate": 9.566325822784232e-05, "epoch": 0.14804080040131543, "percentage": 14.8, "elapsed_time": "6:17:15", "remaining_time": "1 day, 12:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2657, "total_steps": 17941, "loss": 1.9386, "learning_rate": 9.56596302241318e-05, "epoch": 0.14809653865447858, "percentage": 14.81, "elapsed_time": "6:17:24", "remaining_time": "1 day, 12:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2658, "total_steps": 17941, "loss": 1.6464, "learning_rate": 9.565600077236403e-05, "epoch": 0.1481522769076417, "percentage": 14.82, "elapsed_time": "6:17:32", "remaining_time": "1 day, 12:10:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2659, "total_steps": 17941, "loss": 2.0237, "learning_rate": 9.565236987265411e-05, "epoch": 0.14820801516080487, "percentage": 14.82, "elapsed_time": "6:17:41", "remaining_time": "1 day, 12:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2660, "total_steps": 17941, "loss": 1.9181, "learning_rate": 9.564873752511718e-05, "epoch": 0.148263753413968, "percentage": 14.83, "elapsed_time": "6:17:49", "remaining_time": "1 day, 12:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2661, "total_steps": 17941, "loss": 1.9004, "learning_rate": 9.564510372986845e-05, "epoch": 0.14831949166713115, "percentage": 14.83, "elapsed_time": "6:17:58", "remaining_time": "1 day, 12:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2662, "total_steps": 17941, "loss": 1.4634, "learning_rate": 9.564146848702316e-05, "epoch": 0.1483752299202943, "percentage": 14.84, "elapsed_time": "6:18:06", "remaining_time": "1 day, 12:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2663, "total_steps": 17941, "loss": 1.7994, "learning_rate": 9.56378317966966e-05, "epoch": 0.14843096817345744, "percentage": 14.84, "elapsed_time": "6:18:15", "remaining_time": "1 day, 12:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2664, "total_steps": 17941, "loss": 1.493, "learning_rate": 9.56341936590041e-05, "epoch": 0.1484867064266206, "percentage": 14.85, "elapsed_time": "6:18:23", "remaining_time": "1 day, 12:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2665, "total_steps": 17941, "loss": 1.747, "learning_rate": 9.563055407406104e-05, "epoch": 0.14854244467978373, "percentage": 14.85, "elapsed_time": "6:18:32", "remaining_time": "1 day, 12:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2666, "total_steps": 17941, "loss": 1.7043, "learning_rate": 9.562691304198286e-05, "epoch": 0.14859818293294688, "percentage": 14.86, "elapsed_time": "6:18:40", "remaining_time": "1 day, 12:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2667, "total_steps": 17941, "loss": 1.8348, "learning_rate": 9.5623270562885e-05, "epoch": 0.14865392118611004, "percentage": 14.87, "elapsed_time": "6:18:49", "remaining_time": "1 day, 12:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2668, "total_steps": 17941, "loss": 1.5255, "learning_rate": 9.561962663688302e-05, "epoch": 0.14870965943927317, "percentage": 14.87, "elapsed_time": "6:18:58", "remaining_time": "1 day, 12:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2669, "total_steps": 17941, "loss": 1.5113, "learning_rate": 9.561598126409245e-05, "epoch": 0.14876539769243632, "percentage": 14.88, "elapsed_time": "6:19:06", "remaining_time": "1 day, 12:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2670, "total_steps": 17941, "loss": 1.5927, "learning_rate": 9.561233444462894e-05, "epoch": 0.14882113594559945, "percentage": 14.88, "elapsed_time": "6:19:14", "remaining_time": "1 day, 12:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2671, "total_steps": 17941, "loss": 1.9007, "learning_rate": 9.56086861786081e-05, "epoch": 0.1488768741987626, "percentage": 14.89, "elapsed_time": "6:19:23", "remaining_time": "1 day, 12:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2672, "total_steps": 17941, "loss": 1.5592, "learning_rate": 9.560503646614564e-05, "epoch": 0.14893261245192577, "percentage": 14.89, "elapsed_time": "6:19:31", "remaining_time": "1 day, 12:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2673, "total_steps": 17941, "loss": 1.5822, "learning_rate": 9.560138530735734e-05, "epoch": 0.1489883507050889, "percentage": 14.9, "elapsed_time": "6:19:40", "remaining_time": "1 day, 12:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2674, "total_steps": 17941, "loss": 1.703, "learning_rate": 9.559773270235896e-05, "epoch": 0.14904408895825205, "percentage": 14.9, "elapsed_time": "6:19:48", "remaining_time": "1 day, 12:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2675, "total_steps": 17941, "loss": 1.7473, "learning_rate": 9.559407865126636e-05, "epoch": 0.14909982721141518, "percentage": 14.91, "elapsed_time": "6:19:57", "remaining_time": "1 day, 12:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2676, "total_steps": 17941, "loss": 1.6382, "learning_rate": 9.559042315419542e-05, "epoch": 0.14915556546457834, "percentage": 14.92, "elapsed_time": "6:20:05", "remaining_time": "1 day, 12:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2677, "total_steps": 17941, "loss": 1.7602, "learning_rate": 9.558676621126206e-05, "epoch": 0.1492113037177415, "percentage": 14.92, "elapsed_time": "6:20:14", "remaining_time": "1 day, 12:08:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2678, "total_steps": 17941, "loss": 1.7686, "learning_rate": 9.558310782258227e-05, "epoch": 0.14926704197090462, "percentage": 14.93, "elapsed_time": "6:20:22", "remaining_time": "1 day, 12:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2679, "total_steps": 17941, "loss": 1.6661, "learning_rate": 9.557944798827205e-05, "epoch": 0.14932278022406778, "percentage": 14.93, "elapsed_time": "6:20:30", "remaining_time": "1 day, 12:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2680, "total_steps": 17941, "loss": 1.6757, "learning_rate": 9.557578670844751e-05, "epoch": 0.14937851847723094, "percentage": 14.94, "elapsed_time": "6:20:39", "remaining_time": "1 day, 12:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2681, "total_steps": 17941, "loss": 1.8146, "learning_rate": 9.557212398322473e-05, "epoch": 0.14943425673039407, "percentage": 14.94, "elapsed_time": "6:20:47", "remaining_time": "1 day, 12:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2682, "total_steps": 17941, "loss": 1.7437, "learning_rate": 9.556845981271989e-05, "epoch": 0.14948999498355722, "percentage": 14.95, "elapsed_time": "6:20:56", "remaining_time": "1 day, 12:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2683, "total_steps": 17941, "loss": 2.0424, "learning_rate": 9.556479419704918e-05, "epoch": 0.14954573323672035, "percentage": 14.95, "elapsed_time": "6:21:04", "remaining_time": "1 day, 12:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2684, "total_steps": 17941, "loss": 1.6523, "learning_rate": 9.556112713632885e-05, "epoch": 0.1496014714898835, "percentage": 14.96, "elapsed_time": "6:21:13", "remaining_time": "1 day, 12:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2685, "total_steps": 17941, "loss": 1.8348, "learning_rate": 9.555745863067522e-05, "epoch": 0.14965720974304667, "percentage": 14.97, "elapsed_time": "6:21:21", "remaining_time": "1 day, 12:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2686, "total_steps": 17941, "loss": 1.6003, "learning_rate": 9.555378868020461e-05, "epoch": 0.1497129479962098, "percentage": 14.97, "elapsed_time": "6:21:30", "remaining_time": "1 day, 12:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2687, "total_steps": 17941, "loss": 1.6412, "learning_rate": 9.555011728503343e-05, "epoch": 0.14976868624937295, "percentage": 14.98, "elapsed_time": "6:21:38", "remaining_time": "1 day, 12:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2688, "total_steps": 17941, "loss": 1.6397, "learning_rate": 9.554644444527812e-05, "epoch": 0.14982442450253608, "percentage": 14.98, "elapsed_time": "6:21:47", "remaining_time": "1 day, 12:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2689, "total_steps": 17941, "loss": 2.0408, "learning_rate": 9.554277016105512e-05, "epoch": 0.14988016275569924, "percentage": 14.99, "elapsed_time": "6:21:55", "remaining_time": "1 day, 12:06:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2690, "total_steps": 17941, "loss": 1.7599, "learning_rate": 9.5539094432481e-05, "epoch": 0.1499359010088624, "percentage": 14.99, "elapsed_time": "6:22:03", "remaining_time": "1 day, 12:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2691, "total_steps": 17941, "loss": 1.6704, "learning_rate": 9.55354172596723e-05, "epoch": 0.14999163926202552, "percentage": 15.0, "elapsed_time": "6:22:12", "remaining_time": "1 day, 12:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2692, "total_steps": 17941, "loss": 1.7792, "learning_rate": 9.553173864274567e-05, "epoch": 0.15004737751518868, "percentage": 15.0, "elapsed_time": "6:22:20", "remaining_time": "1 day, 12:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2693, "total_steps": 17941, "loss": 1.7461, "learning_rate": 9.552805858181775e-05, "epoch": 0.1501031157683518, "percentage": 15.01, "elapsed_time": "6:22:29", "remaining_time": "1 day, 12:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2694, "total_steps": 17941, "loss": 1.7735, "learning_rate": 9.552437707700526e-05, "epoch": 0.15015885402151496, "percentage": 15.02, "elapsed_time": "6:22:37", "remaining_time": "1 day, 12:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2695, "total_steps": 17941, "loss": 1.6318, "learning_rate": 9.552069412842495e-05, "epoch": 0.15021459227467812, "percentage": 15.02, "elapsed_time": "6:22:46", "remaining_time": "1 day, 12:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2696, "total_steps": 17941, "loss": 1.665, "learning_rate": 9.551700973619364e-05, "epoch": 0.15027033052784125, "percentage": 15.03, "elapsed_time": "6:22:54", "remaining_time": "1 day, 12:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2697, "total_steps": 17941, "loss": 1.743, "learning_rate": 9.551332390042816e-05, "epoch": 0.1503260687810044, "percentage": 15.03, "elapsed_time": "6:23:03", "remaining_time": "1 day, 12:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2698, "total_steps": 17941, "loss": 1.9245, "learning_rate": 9.55096366212454e-05, "epoch": 0.15038180703416754, "percentage": 15.04, "elapsed_time": "6:23:11", "remaining_time": "1 day, 12:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2699, "total_steps": 17941, "loss": 1.5553, "learning_rate": 9.55059478987623e-05, "epoch": 0.1504375452873307, "percentage": 15.04, "elapsed_time": "6:23:19", "remaining_time": "1 day, 12:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2700, "total_steps": 17941, "loss": 1.4489, "learning_rate": 9.550225773309586e-05, "epoch": 0.15049328354049385, "percentage": 15.05, "elapsed_time": "6:23:28", "remaining_time": "1 day, 12:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2701, "total_steps": 17941, "loss": 1.9052, "learning_rate": 9.54985661243631e-05, "epoch": 0.15054902179365698, "percentage": 15.05, "elapsed_time": "6:23:36", "remaining_time": "1 day, 12:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2702, "total_steps": 17941, "loss": 1.5049, "learning_rate": 9.54948730726811e-05, "epoch": 0.15060476004682014, "percentage": 15.06, "elapsed_time": "6:23:45", "remaining_time": "1 day, 12:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2703, "total_steps": 17941, "loss": 1.8818, "learning_rate": 9.549117857816697e-05, "epoch": 0.1506604982999833, "percentage": 15.07, "elapsed_time": "6:23:53", "remaining_time": "1 day, 12:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2704, "total_steps": 17941, "loss": 1.6683, "learning_rate": 9.548748264093789e-05, "epoch": 0.15071623655314642, "percentage": 15.07, "elapsed_time": "6:24:02", "remaining_time": "1 day, 12:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2705, "total_steps": 17941, "loss": 1.6966, "learning_rate": 9.548378526111108e-05, "epoch": 0.15077197480630958, "percentage": 15.08, "elapsed_time": "6:24:10", "remaining_time": "1 day, 12:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2706, "total_steps": 17941, "loss": 1.8303, "learning_rate": 9.54800864388038e-05, "epoch": 0.1508277130594727, "percentage": 15.08, "elapsed_time": "6:24:19", "remaining_time": "1 day, 12:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2707, "total_steps": 17941, "loss": 1.8624, "learning_rate": 9.547638617413333e-05, "epoch": 0.15088345131263586, "percentage": 15.09, "elapsed_time": "6:24:27", "remaining_time": "1 day, 12:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2708, "total_steps": 17941, "loss": 1.5654, "learning_rate": 9.547268446721702e-05, "epoch": 0.15093918956579902, "percentage": 15.09, "elapsed_time": "6:24:35", "remaining_time": "1 day, 12:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2709, "total_steps": 17941, "loss": 1.6074, "learning_rate": 9.54689813181723e-05, "epoch": 0.15099492781896215, "percentage": 15.1, "elapsed_time": "6:24:44", "remaining_time": "1 day, 12:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2710, "total_steps": 17941, "loss": 1.8095, "learning_rate": 9.54652767271166e-05, "epoch": 0.1510506660721253, "percentage": 15.11, "elapsed_time": "6:24:53", "remaining_time": "1 day, 12:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2711, "total_steps": 17941, "loss": 1.8065, "learning_rate": 9.54615706941674e-05, "epoch": 0.15110640432528843, "percentage": 15.11, "elapsed_time": "6:25:01", "remaining_time": "1 day, 12:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2712, "total_steps": 17941, "loss": 1.5857, "learning_rate": 9.545786321944223e-05, "epoch": 0.1511621425784516, "percentage": 15.12, "elapsed_time": "6:25:10", "remaining_time": "1 day, 12:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2713, "total_steps": 17941, "loss": 1.5847, "learning_rate": 9.545415430305869e-05, "epoch": 0.15121788083161475, "percentage": 15.12, "elapsed_time": "6:25:18", "remaining_time": "1 day, 12:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2714, "total_steps": 17941, "loss": 1.7911, "learning_rate": 9.545044394513439e-05, "epoch": 0.15127361908477788, "percentage": 15.13, "elapsed_time": "6:25:26", "remaining_time": "1 day, 12:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2715, "total_steps": 17941, "loss": 1.7341, "learning_rate": 9.544673214578698e-05, "epoch": 0.15132935733794103, "percentage": 15.13, "elapsed_time": "6:25:35", "remaining_time": "1 day, 12:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2716, "total_steps": 17941, "loss": 1.6531, "learning_rate": 9.544301890513423e-05, "epoch": 0.15138509559110416, "percentage": 15.14, "elapsed_time": "6:25:44", "remaining_time": "1 day, 12:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2717, "total_steps": 17941, "loss": 1.7704, "learning_rate": 9.543930422329386e-05, "epoch": 0.15144083384426732, "percentage": 15.14, "elapsed_time": "6:25:53", "remaining_time": "1 day, 12:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2718, "total_steps": 17941, "loss": 1.6427, "learning_rate": 9.543558810038368e-05, "epoch": 0.15149657209743048, "percentage": 15.15, "elapsed_time": "6:26:01", "remaining_time": "1 day, 12:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2719, "total_steps": 17941, "loss": 1.9572, "learning_rate": 9.543187053652156e-05, "epoch": 0.1515523103505936, "percentage": 15.16, "elapsed_time": "6:26:09", "remaining_time": "1 day, 12:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2720, "total_steps": 17941, "loss": 1.6761, "learning_rate": 9.54281515318254e-05, "epoch": 0.15160804860375676, "percentage": 15.16, "elapsed_time": "6:26:18", "remaining_time": "1 day, 12:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2721, "total_steps": 17941, "loss": 1.8216, "learning_rate": 9.542443108641312e-05, "epoch": 0.1516637868569199, "percentage": 15.17, "elapsed_time": "6:26:26", "remaining_time": "1 day, 12:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2722, "total_steps": 17941, "loss": 1.5411, "learning_rate": 9.542070920040274e-05, "epoch": 0.15171952511008305, "percentage": 15.17, "elapsed_time": "6:26:35", "remaining_time": "1 day, 12:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2723, "total_steps": 17941, "loss": 1.848, "learning_rate": 9.541698587391229e-05, "epoch": 0.1517752633632462, "percentage": 15.18, "elapsed_time": "6:26:43", "remaining_time": "1 day, 12:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2724, "total_steps": 17941, "loss": 1.7717, "learning_rate": 9.541326110705983e-05, "epoch": 0.15183100161640933, "percentage": 15.18, "elapsed_time": "6:26:52", "remaining_time": "1 day, 12:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2725, "total_steps": 17941, "loss": 1.6865, "learning_rate": 9.540953489996354e-05, "epoch": 0.1518867398695725, "percentage": 15.19, "elapsed_time": "6:27:01", "remaining_time": "1 day, 12:01:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2726, "total_steps": 17941, "loss": 1.7526, "learning_rate": 9.540580725274153e-05, "epoch": 0.15194247812273565, "percentage": 15.19, "elapsed_time": "6:27:09", "remaining_time": "1 day, 12:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2727, "total_steps": 17941, "loss": 1.7543, "learning_rate": 9.540207816551206e-05, "epoch": 0.15199821637589878, "percentage": 15.2, "elapsed_time": "6:27:18", "remaining_time": "1 day, 12:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2728, "total_steps": 17941, "loss": 1.4261, "learning_rate": 9.539834763839337e-05, "epoch": 0.15205395462906193, "percentage": 15.21, "elapsed_time": "6:27:26", "remaining_time": "1 day, 12:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2729, "total_steps": 17941, "loss": 1.9545, "learning_rate": 9.539461567150378e-05, "epoch": 0.15210969288222506, "percentage": 15.21, "elapsed_time": "6:27:35", "remaining_time": "1 day, 12:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2730, "total_steps": 17941, "loss": 1.7021, "learning_rate": 9.539088226496167e-05, "epoch": 0.15216543113538822, "percentage": 15.22, "elapsed_time": "6:27:43", "remaining_time": "1 day, 12:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2731, "total_steps": 17941, "loss": 1.7132, "learning_rate": 9.538714741888541e-05, "epoch": 0.15222116938855138, "percentage": 15.22, "elapsed_time": "6:27:52", "remaining_time": "1 day, 12:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2732, "total_steps": 17941, "loss": 1.6896, "learning_rate": 9.538341113339346e-05, "epoch": 0.1522769076417145, "percentage": 15.23, "elapsed_time": "6:28:00", "remaining_time": "1 day, 12:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2733, "total_steps": 17941, "loss": 1.7815, "learning_rate": 9.537967340860432e-05, "epoch": 0.15233264589487766, "percentage": 15.23, "elapsed_time": "6:28:09", "remaining_time": "1 day, 11:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2734, "total_steps": 17941, "loss": 1.8918, "learning_rate": 9.537593424463651e-05, "epoch": 0.1523883841480408, "percentage": 15.24, "elapsed_time": "6:28:17", "remaining_time": "1 day, 11:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2735, "total_steps": 17941, "loss": 1.7225, "learning_rate": 9.537219364160863e-05, "epoch": 0.15244412240120395, "percentage": 15.24, "elapsed_time": "6:28:26", "remaining_time": "1 day, 11:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2736, "total_steps": 17941, "loss": 1.5232, "learning_rate": 9.536845159963932e-05, "epoch": 0.1524998606543671, "percentage": 15.25, "elapsed_time": "6:28:34", "remaining_time": "1 day, 11:59:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2737, "total_steps": 17941, "loss": 1.8193, "learning_rate": 9.536470811884723e-05, "epoch": 0.15255559890753023, "percentage": 15.26, "elapsed_time": "6:28:43", "remaining_time": "1 day, 11:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2738, "total_steps": 17941, "loss": 1.9167, "learning_rate": 9.536096319935108e-05, "epoch": 0.1526113371606934, "percentage": 15.26, "elapsed_time": "6:28:52", "remaining_time": "1 day, 11:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2739, "total_steps": 17941, "loss": 1.8613, "learning_rate": 9.535721684126967e-05, "epoch": 0.15266707541385652, "percentage": 15.27, "elapsed_time": "6:29:00", "remaining_time": "1 day, 11:59:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2740, "total_steps": 17941, "loss": 1.6646, "learning_rate": 9.535346904472177e-05, "epoch": 0.15272281366701967, "percentage": 15.27, "elapsed_time": "6:29:09", "remaining_time": "1 day, 11:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2741, "total_steps": 17941, "loss": 1.7495, "learning_rate": 9.53497198098263e-05, "epoch": 0.15277855192018283, "percentage": 15.28, "elapsed_time": "6:29:17", "remaining_time": "1 day, 11:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2742, "total_steps": 17941, "loss": 1.9952, "learning_rate": 9.53459691367021e-05, "epoch": 0.15283429017334596, "percentage": 15.28, "elapsed_time": "6:29:26", "remaining_time": "1 day, 11:58:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2743, "total_steps": 17941, "loss": 1.9164, "learning_rate": 9.534221702546814e-05, "epoch": 0.15289002842650912, "percentage": 15.29, "elapsed_time": "6:29:34", "remaining_time": "1 day, 11:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2744, "total_steps": 17941, "loss": 1.7106, "learning_rate": 9.533846347624343e-05, "epoch": 0.15294576667967225, "percentage": 15.29, "elapsed_time": "6:29:43", "remaining_time": "1 day, 11:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2745, "total_steps": 17941, "loss": 1.6197, "learning_rate": 9.533470848914698e-05, "epoch": 0.1530015049328354, "percentage": 15.3, "elapsed_time": "6:29:51", "remaining_time": "1 day, 11:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2746, "total_steps": 17941, "loss": 1.7638, "learning_rate": 9.533095206429792e-05, "epoch": 0.15305724318599856, "percentage": 15.31, "elapsed_time": "6:30:00", "remaining_time": "1 day, 11:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2747, "total_steps": 17941, "loss": 1.5744, "learning_rate": 9.532719420181535e-05, "epoch": 0.1531129814391617, "percentage": 15.31, "elapsed_time": "6:30:08", "remaining_time": "1 day, 11:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2748, "total_steps": 17941, "loss": 1.748, "learning_rate": 9.532343490181845e-05, "epoch": 0.15316871969232485, "percentage": 15.32, "elapsed_time": "6:30:17", "remaining_time": "1 day, 11:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2749, "total_steps": 17941, "loss": 1.8845, "learning_rate": 9.531967416442646e-05, "epoch": 0.153224457945488, "percentage": 15.32, "elapsed_time": "6:30:25", "remaining_time": "1 day, 11:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2750, "total_steps": 17941, "loss": 1.7691, "learning_rate": 9.531591198975863e-05, "epoch": 0.15328019619865113, "percentage": 15.33, "elapsed_time": "6:30:34", "remaining_time": "1 day, 11:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2751, "total_steps": 17941, "loss": 1.6964, "learning_rate": 9.531214837793429e-05, "epoch": 0.1533359344518143, "percentage": 15.33, "elapsed_time": "6:30:42", "remaining_time": "1 day, 11:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2752, "total_steps": 17941, "loss": 1.6693, "learning_rate": 9.530838332907278e-05, "epoch": 0.15339167270497742, "percentage": 15.34, "elapsed_time": "6:30:51", "remaining_time": "1 day, 11:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2753, "total_steps": 17941, "loss": 1.932, "learning_rate": 9.530461684329352e-05, "epoch": 0.15344741095814057, "percentage": 15.34, "elapsed_time": "6:30:59", "remaining_time": "1 day, 11:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2754, "total_steps": 17941, "loss": 1.6084, "learning_rate": 9.530084892071596e-05, "epoch": 0.15350314921130373, "percentage": 15.35, "elapsed_time": "6:31:08", "remaining_time": "1 day, 11:56:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2755, "total_steps": 17941, "loss": 1.8431, "learning_rate": 9.52970795614596e-05, "epoch": 0.15355888746446686, "percentage": 15.36, "elapsed_time": "6:31:16", "remaining_time": "1 day, 11:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2756, "total_steps": 17941, "loss": 1.7747, "learning_rate": 9.529330876564398e-05, "epoch": 0.15361462571763002, "percentage": 15.36, "elapsed_time": "6:31:25", "remaining_time": "1 day, 11:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2757, "total_steps": 17941, "loss": 1.7633, "learning_rate": 9.528953653338867e-05, "epoch": 0.15367036397079314, "percentage": 15.37, "elapsed_time": "6:31:33", "remaining_time": "1 day, 11:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2758, "total_steps": 17941, "loss": 1.7155, "learning_rate": 9.528576286481332e-05, "epoch": 0.1537261022239563, "percentage": 15.37, "elapsed_time": "6:31:41", "remaining_time": "1 day, 11:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2759, "total_steps": 17941, "loss": 1.7427, "learning_rate": 9.52819877600376e-05, "epoch": 0.15378184047711946, "percentage": 15.38, "elapsed_time": "6:31:50", "remaining_time": "1 day, 11:56:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2760, "total_steps": 17941, "loss": 1.9338, "learning_rate": 9.527821121918126e-05, "epoch": 0.1538375787302826, "percentage": 15.38, "elapsed_time": "6:31:58", "remaining_time": "1 day, 11:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2761, "total_steps": 17941, "loss": 1.6865, "learning_rate": 9.527443324236403e-05, "epoch": 0.15389331698344574, "percentage": 15.39, "elapsed_time": "6:32:07", "remaining_time": "1 day, 11:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2762, "total_steps": 17941, "loss": 1.4843, "learning_rate": 9.527065382970576e-05, "epoch": 0.15394905523660887, "percentage": 15.39, "elapsed_time": "6:32:15", "remaining_time": "1 day, 11:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2763, "total_steps": 17941, "loss": 1.7174, "learning_rate": 9.52668729813263e-05, "epoch": 0.15400479348977203, "percentage": 15.4, "elapsed_time": "6:32:24", "remaining_time": "1 day, 11:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2764, "total_steps": 17941, "loss": 1.8855, "learning_rate": 9.526309069734553e-05, "epoch": 0.1540605317429352, "percentage": 15.41, "elapsed_time": "6:32:32", "remaining_time": "1 day, 11:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2765, "total_steps": 17941, "loss": 1.7095, "learning_rate": 9.525930697788345e-05, "epoch": 0.15411626999609832, "percentage": 15.41, "elapsed_time": "6:32:41", "remaining_time": "1 day, 11:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2766, "total_steps": 17941, "loss": 1.5436, "learning_rate": 9.525552182306003e-05, "epoch": 0.15417200824926147, "percentage": 15.42, "elapsed_time": "6:32:49", "remaining_time": "1 day, 11:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2767, "total_steps": 17941, "loss": 1.8488, "learning_rate": 9.525173523299531e-05, "epoch": 0.1542277465024246, "percentage": 15.42, "elapsed_time": "6:32:58", "remaining_time": "1 day, 11:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2768, "total_steps": 17941, "loss": 1.6764, "learning_rate": 9.524794720780938e-05, "epoch": 0.15428348475558776, "percentage": 15.43, "elapsed_time": "6:33:06", "remaining_time": "1 day, 11:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2769, "total_steps": 17941, "loss": 1.7393, "learning_rate": 9.524415774762239e-05, "epoch": 0.15433922300875091, "percentage": 15.43, "elapsed_time": "6:33:15", "remaining_time": "1 day, 11:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2770, "total_steps": 17941, "loss": 1.6587, "learning_rate": 9.52403668525545e-05, "epoch": 0.15439496126191404, "percentage": 15.44, "elapsed_time": "6:33:23", "remaining_time": "1 day, 11:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2771, "total_steps": 17941, "loss": 1.5704, "learning_rate": 9.523657452272594e-05, "epoch": 0.1544506995150772, "percentage": 15.45, "elapsed_time": "6:33:32", "remaining_time": "1 day, 11:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2772, "total_steps": 17941, "loss": 1.6701, "learning_rate": 9.5232780758257e-05, "epoch": 0.15450643776824036, "percentage": 15.45, "elapsed_time": "6:33:40", "remaining_time": "1 day, 11:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2773, "total_steps": 17941, "loss": 1.7997, "learning_rate": 9.522898555926796e-05, "epoch": 0.15456217602140349, "percentage": 15.46, "elapsed_time": "6:33:49", "remaining_time": "1 day, 11:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2774, "total_steps": 17941, "loss": 1.4629, "learning_rate": 9.52251889258792e-05, "epoch": 0.15461791427456664, "percentage": 15.46, "elapsed_time": "6:33:57", "remaining_time": "1 day, 11:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2775, "total_steps": 17941, "loss": 1.7481, "learning_rate": 9.522139085821113e-05, "epoch": 0.15467365252772977, "percentage": 15.47, "elapsed_time": "6:34:06", "remaining_time": "1 day, 11:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2776, "total_steps": 17941, "loss": 1.781, "learning_rate": 9.521759135638422e-05, "epoch": 0.15472939078089293, "percentage": 15.47, "elapsed_time": "6:34:14", "remaining_time": "1 day, 11:53:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2777, "total_steps": 17941, "loss": 1.5232, "learning_rate": 9.521379042051894e-05, "epoch": 0.15478512903405608, "percentage": 15.48, "elapsed_time": "6:34:22", "remaining_time": "1 day, 11:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2778, "total_steps": 17941, "loss": 1.663, "learning_rate": 9.520998805073584e-05, "epoch": 0.1548408672872192, "percentage": 15.48, "elapsed_time": "6:34:31", "remaining_time": "1 day, 11:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2779, "total_steps": 17941, "loss": 1.632, "learning_rate": 9.52061842471555e-05, "epoch": 0.15489660554038237, "percentage": 15.49, "elapsed_time": "6:34:39", "remaining_time": "1 day, 11:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2780, "total_steps": 17941, "loss": 1.7983, "learning_rate": 9.520237900989858e-05, "epoch": 0.1549523437935455, "percentage": 15.5, "elapsed_time": "6:34:48", "remaining_time": "1 day, 11:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2781, "total_steps": 17941, "loss": 2.0205, "learning_rate": 9.519857233908574e-05, "epoch": 0.15500808204670866, "percentage": 15.5, "elapsed_time": "6:34:56", "remaining_time": "1 day, 11:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2782, "total_steps": 17941, "loss": 1.9992, "learning_rate": 9.519476423483771e-05, "epoch": 0.1550638202998718, "percentage": 15.51, "elapsed_time": "6:35:05", "remaining_time": "1 day, 11:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2783, "total_steps": 17941, "loss": 1.8583, "learning_rate": 9.519095469727527e-05, "epoch": 0.15511955855303494, "percentage": 15.51, "elapsed_time": "6:35:14", "remaining_time": "1 day, 11:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2784, "total_steps": 17941, "loss": 1.9257, "learning_rate": 9.518714372651922e-05, "epoch": 0.1551752968061981, "percentage": 15.52, "elapsed_time": "6:35:23", "remaining_time": "1 day, 11:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2785, "total_steps": 17941, "loss": 1.8291, "learning_rate": 9.518333132269043e-05, "epoch": 0.15523103505936123, "percentage": 15.52, "elapsed_time": "6:35:31", "remaining_time": "1 day, 11:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2786, "total_steps": 17941, "loss": 1.5859, "learning_rate": 9.517951748590983e-05, "epoch": 0.15528677331252438, "percentage": 15.53, "elapsed_time": "6:35:40", "remaining_time": "1 day, 11:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2787, "total_steps": 17941, "loss": 1.7556, "learning_rate": 9.517570221629833e-05, "epoch": 0.15534251156568754, "percentage": 15.53, "elapsed_time": "6:35:48", "remaining_time": "1 day, 11:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2788, "total_steps": 17941, "loss": 1.8201, "learning_rate": 9.517188551397695e-05, "epoch": 0.15539824981885067, "percentage": 15.54, "elapsed_time": "6:35:57", "remaining_time": "1 day, 11:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2789, "total_steps": 17941, "loss": 1.7392, "learning_rate": 9.516806737906674e-05, "epoch": 0.15545398807201383, "percentage": 15.55, "elapsed_time": "6:36:05", "remaining_time": "1 day, 11:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2790, "total_steps": 17941, "loss": 1.7216, "learning_rate": 9.516424781168877e-05, "epoch": 0.15550972632517696, "percentage": 15.55, "elapsed_time": "6:36:14", "remaining_time": "1 day, 11:51:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2791, "total_steps": 17941, "loss": 1.561, "learning_rate": 9.516042681196419e-05, "epoch": 0.1555654645783401, "percentage": 15.56, "elapsed_time": "6:36:22", "remaining_time": "1 day, 11:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2792, "total_steps": 17941, "loss": 2.061, "learning_rate": 9.515660438001417e-05, "epoch": 0.15562120283150327, "percentage": 15.56, "elapsed_time": "6:36:31", "remaining_time": "1 day, 11:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2793, "total_steps": 17941, "loss": 1.5716, "learning_rate": 9.515278051595996e-05, "epoch": 0.1556769410846664, "percentage": 15.57, "elapsed_time": "6:36:39", "remaining_time": "1 day, 11:51:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2794, "total_steps": 17941, "loss": 1.5369, "learning_rate": 9.514895521992278e-05, "epoch": 0.15573267933782955, "percentage": 15.57, "elapsed_time": "6:36:48", "remaining_time": "1 day, 11:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2795, "total_steps": 17941, "loss": 1.9497, "learning_rate": 9.5145128492024e-05, "epoch": 0.1557884175909927, "percentage": 15.58, "elapsed_time": "6:36:56", "remaining_time": "1 day, 11:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2796, "total_steps": 17941, "loss": 1.7145, "learning_rate": 9.514130033238494e-05, "epoch": 0.15584415584415584, "percentage": 15.58, "elapsed_time": "6:37:05", "remaining_time": "1 day, 11:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2797, "total_steps": 17941, "loss": 1.599, "learning_rate": 9.513747074112705e-05, "epoch": 0.155899894097319, "percentage": 15.59, "elapsed_time": "6:37:13", "remaining_time": "1 day, 11:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2798, "total_steps": 17941, "loss": 1.6787, "learning_rate": 9.513363971837174e-05, "epoch": 0.15595563235048213, "percentage": 15.6, "elapsed_time": "6:37:21", "remaining_time": "1 day, 11:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2799, "total_steps": 17941, "loss": 1.6852, "learning_rate": 9.512980726424052e-05, "epoch": 0.15601137060364528, "percentage": 15.6, "elapsed_time": "6:37:30", "remaining_time": "1 day, 11:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2800, "total_steps": 17941, "loss": 1.6972, "learning_rate": 9.512597337885496e-05, "epoch": 0.15606710885680844, "percentage": 15.61, "elapsed_time": "6:37:39", "remaining_time": "1 day, 11:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2801, "total_steps": 17941, "loss": 1.6794, "learning_rate": 9.51221380623366e-05, "epoch": 0.15612284710997157, "percentage": 15.61, "elapsed_time": "6:37:47", "remaining_time": "1 day, 11:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2802, "total_steps": 17941, "loss": 1.6826, "learning_rate": 9.511830131480712e-05, "epoch": 0.15617858536313473, "percentage": 15.62, "elapsed_time": "6:37:55", "remaining_time": "1 day, 11:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2803, "total_steps": 17941, "loss": 1.6276, "learning_rate": 9.511446313638819e-05, "epoch": 0.15623432361629785, "percentage": 15.62, "elapsed_time": "6:38:04", "remaining_time": "1 day, 11:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2804, "total_steps": 17941, "loss": 1.7685, "learning_rate": 9.51106235272015e-05, "epoch": 0.156290061869461, "percentage": 15.63, "elapsed_time": "6:38:12", "remaining_time": "1 day, 11:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2805, "total_steps": 17941, "loss": 1.6194, "learning_rate": 9.510678248736887e-05, "epoch": 0.15634580012262417, "percentage": 15.63, "elapsed_time": "6:38:21", "remaining_time": "1 day, 11:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2806, "total_steps": 17941, "loss": 1.8121, "learning_rate": 9.510294001701208e-05, "epoch": 0.1564015383757873, "percentage": 15.64, "elapsed_time": "6:38:29", "remaining_time": "1 day, 11:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2807, "total_steps": 17941, "loss": 1.7674, "learning_rate": 9.509909611625298e-05, "epoch": 0.15645727662895045, "percentage": 15.65, "elapsed_time": "6:38:38", "remaining_time": "1 day, 11:49:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2808, "total_steps": 17941, "loss": 1.5738, "learning_rate": 9.509525078521353e-05, "epoch": 0.15651301488211358, "percentage": 15.65, "elapsed_time": "6:38:46", "remaining_time": "1 day, 11:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2809, "total_steps": 17941, "loss": 1.7126, "learning_rate": 9.509140402401563e-05, "epoch": 0.15656875313527674, "percentage": 15.66, "elapsed_time": "6:38:55", "remaining_time": "1 day, 11:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2810, "total_steps": 17941, "loss": 1.8056, "learning_rate": 9.508755583278131e-05, "epoch": 0.1566244913884399, "percentage": 15.66, "elapsed_time": "6:39:03", "remaining_time": "1 day, 11:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2811, "total_steps": 17941, "loss": 1.7569, "learning_rate": 9.508370621163259e-05, "epoch": 0.15668022964160302, "percentage": 15.67, "elapsed_time": "6:39:11", "remaining_time": "1 day, 11:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2812, "total_steps": 17941, "loss": 2.0115, "learning_rate": 9.507985516069154e-05, "epoch": 0.15673596789476618, "percentage": 15.67, "elapsed_time": "6:39:20", "remaining_time": "1 day, 11:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2813, "total_steps": 17941, "loss": 2.0173, "learning_rate": 9.507600268008034e-05, "epoch": 0.1567917061479293, "percentage": 15.68, "elapsed_time": "6:39:28", "remaining_time": "1 day, 11:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2814, "total_steps": 17941, "loss": 1.711, "learning_rate": 9.507214876992116e-05, "epoch": 0.15684744440109247, "percentage": 15.68, "elapsed_time": "6:39:38", "remaining_time": "1 day, 11:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2815, "total_steps": 17941, "loss": 1.7613, "learning_rate": 9.506829343033619e-05, "epoch": 0.15690318265425562, "percentage": 15.69, "elapsed_time": "6:39:46", "remaining_time": "1 day, 11:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2816, "total_steps": 17941, "loss": 1.9146, "learning_rate": 9.506443666144773e-05, "epoch": 0.15695892090741875, "percentage": 15.7, "elapsed_time": "6:39:55", "remaining_time": "1 day, 11:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2817, "total_steps": 17941, "loss": 1.5925, "learning_rate": 9.506057846337808e-05, "epoch": 0.1570146591605819, "percentage": 15.7, "elapsed_time": "6:40:04", "remaining_time": "1 day, 11:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2818, "total_steps": 17941, "loss": 1.7269, "learning_rate": 9.505671883624959e-05, "epoch": 0.15707039741374507, "percentage": 15.71, "elapsed_time": "6:40:12", "remaining_time": "1 day, 11:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2819, "total_steps": 17941, "loss": 1.9239, "learning_rate": 9.505285778018469e-05, "epoch": 0.1571261356669082, "percentage": 15.71, "elapsed_time": "6:40:21", "remaining_time": "1 day, 11:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2820, "total_steps": 17941, "loss": 1.4883, "learning_rate": 9.504899529530582e-05, "epoch": 0.15718187392007135, "percentage": 15.72, "elapsed_time": "6:40:29", "remaining_time": "1 day, 11:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2821, "total_steps": 17941, "loss": 1.5673, "learning_rate": 9.504513138173547e-05, "epoch": 0.15723761217323448, "percentage": 15.72, "elapsed_time": "6:40:38", "remaining_time": "1 day, 11:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2822, "total_steps": 17941, "loss": 1.492, "learning_rate": 9.504126603959618e-05, "epoch": 0.15729335042639764, "percentage": 15.73, "elapsed_time": "6:40:46", "remaining_time": "1 day, 11:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2823, "total_steps": 17941, "loss": 1.916, "learning_rate": 9.503739926901055e-05, "epoch": 0.1573490886795608, "percentage": 15.73, "elapsed_time": "6:40:55", "remaining_time": "1 day, 11:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2824, "total_steps": 17941, "loss": 1.8255, "learning_rate": 9.50335310701012e-05, "epoch": 0.15740482693272392, "percentage": 15.74, "elapsed_time": "6:41:03", "remaining_time": "1 day, 11:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2825, "total_steps": 17941, "loss": 1.9614, "learning_rate": 9.50296614429908e-05, "epoch": 0.15746056518588708, "percentage": 15.75, "elapsed_time": "6:41:12", "remaining_time": "1 day, 11:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2826, "total_steps": 17941, "loss": 1.5858, "learning_rate": 9.502579038780207e-05, "epoch": 0.1575163034390502, "percentage": 15.75, "elapsed_time": "6:41:20", "remaining_time": "1 day, 11:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2827, "total_steps": 17941, "loss": 1.6746, "learning_rate": 9.50219179046578e-05, "epoch": 0.15757204169221337, "percentage": 15.76, "elapsed_time": "6:41:29", "remaining_time": "1 day, 11:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2828, "total_steps": 17941, "loss": 1.5768, "learning_rate": 9.50180439936808e-05, "epoch": 0.15762777994537652, "percentage": 15.76, "elapsed_time": "6:41:37", "remaining_time": "1 day, 11:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2829, "total_steps": 17941, "loss": 2.0199, "learning_rate": 9.501416865499391e-05, "epoch": 0.15768351819853965, "percentage": 15.77, "elapsed_time": "6:41:46", "remaining_time": "1 day, 11:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2830, "total_steps": 17941, "loss": 1.6215, "learning_rate": 9.501029188872004e-05, "epoch": 0.1577392564517028, "percentage": 15.77, "elapsed_time": "6:41:54", "remaining_time": "1 day, 11:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2831, "total_steps": 17941, "loss": 1.6355, "learning_rate": 9.500641369498214e-05, "epoch": 0.15779499470486594, "percentage": 15.78, "elapsed_time": "6:42:02", "remaining_time": "1 day, 11:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2832, "total_steps": 17941, "loss": 2.107, "learning_rate": 9.50025340739032e-05, "epoch": 0.1578507329580291, "percentage": 15.79, "elapsed_time": "6:42:11", "remaining_time": "1 day, 11:45:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2833, "total_steps": 17941, "loss": 1.5787, "learning_rate": 9.499865302560626e-05, "epoch": 0.15790647121119225, "percentage": 15.79, "elapsed_time": "6:42:19", "remaining_time": "1 day, 11:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2834, "total_steps": 17941, "loss": 1.6343, "learning_rate": 9.49947705502144e-05, "epoch": 0.15796220946435538, "percentage": 15.8, "elapsed_time": "6:42:28", "remaining_time": "1 day, 11:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2835, "total_steps": 17941, "loss": 1.8281, "learning_rate": 9.499088664785077e-05, "epoch": 0.15801794771751854, "percentage": 15.8, "elapsed_time": "6:42:36", "remaining_time": "1 day, 11:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2836, "total_steps": 17941, "loss": 1.7294, "learning_rate": 9.498700131863853e-05, "epoch": 0.15807368597068167, "percentage": 15.81, "elapsed_time": "6:42:45", "remaining_time": "1 day, 11:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2837, "total_steps": 17941, "loss": 1.6611, "learning_rate": 9.49831145627009e-05, "epoch": 0.15812942422384482, "percentage": 15.81, "elapsed_time": "6:42:53", "remaining_time": "1 day, 11:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2838, "total_steps": 17941, "loss": 1.4057, "learning_rate": 9.497922638016114e-05, "epoch": 0.15818516247700798, "percentage": 15.82, "elapsed_time": "6:43:02", "remaining_time": "1 day, 11:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2839, "total_steps": 17941, "loss": 1.7803, "learning_rate": 9.497533677114257e-05, "epoch": 0.1582409007301711, "percentage": 15.82, "elapsed_time": "6:43:10", "remaining_time": "1 day, 11:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2840, "total_steps": 17941, "loss": 1.7828, "learning_rate": 9.497144573576855e-05, "epoch": 0.15829663898333426, "percentage": 15.83, "elapsed_time": "6:43:19", "remaining_time": "1 day, 11:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2841, "total_steps": 17941, "loss": 1.9224, "learning_rate": 9.496755327416245e-05, "epoch": 0.15835237723649742, "percentage": 15.84, "elapsed_time": "6:43:27", "remaining_time": "1 day, 11:44:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2842, "total_steps": 17941, "loss": 1.6932, "learning_rate": 9.496365938644775e-05, "epoch": 0.15840811548966055, "percentage": 15.84, "elapsed_time": "6:43:35", "remaining_time": "1 day, 11:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2843, "total_steps": 17941, "loss": 1.7235, "learning_rate": 9.495976407274794e-05, "epoch": 0.1584638537428237, "percentage": 15.85, "elapsed_time": "6:43:44", "remaining_time": "1 day, 11:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2844, "total_steps": 17941, "loss": 1.7368, "learning_rate": 9.495586733318654e-05, "epoch": 0.15851959199598684, "percentage": 15.85, "elapsed_time": "6:43:52", "remaining_time": "1 day, 11:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2845, "total_steps": 17941, "loss": 1.5822, "learning_rate": 9.495196916788714e-05, "epoch": 0.15857533024915, "percentage": 15.86, "elapsed_time": "6:44:01", "remaining_time": "1 day, 11:43:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2846, "total_steps": 17941, "loss": 1.7119, "learning_rate": 9.494806957697337e-05, "epoch": 0.15863106850231315, "percentage": 15.86, "elapsed_time": "6:44:09", "remaining_time": "1 day, 11:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2847, "total_steps": 17941, "loss": 1.7597, "learning_rate": 9.49441685605689e-05, "epoch": 0.15868680675547628, "percentage": 15.87, "elapsed_time": "6:44:18", "remaining_time": "1 day, 11:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2848, "total_steps": 17941, "loss": 2.1445, "learning_rate": 9.494026611879744e-05, "epoch": 0.15874254500863944, "percentage": 15.87, "elapsed_time": "6:44:27", "remaining_time": "1 day, 11:43:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2849, "total_steps": 17941, "loss": 1.5885, "learning_rate": 9.493636225178276e-05, "epoch": 0.15879828326180256, "percentage": 15.88, "elapsed_time": "6:44:35", "remaining_time": "1 day, 11:43:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2850, "total_steps": 17941, "loss": 1.7934, "learning_rate": 9.493245695964866e-05, "epoch": 0.15885402151496572, "percentage": 15.89, "elapsed_time": "6:44:44", "remaining_time": "1 day, 11:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2851, "total_steps": 17941, "loss": 1.7025, "learning_rate": 9.492855024251901e-05, "epoch": 0.15890975976812888, "percentage": 15.89, "elapsed_time": "6:44:52", "remaining_time": "1 day, 11:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2852, "total_steps": 17941, "loss": 1.6258, "learning_rate": 9.492464210051771e-05, "epoch": 0.158965498021292, "percentage": 15.9, "elapsed_time": "6:45:01", "remaining_time": "1 day, 11:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2853, "total_steps": 17941, "loss": 1.9171, "learning_rate": 9.492073253376865e-05, "epoch": 0.15902123627445516, "percentage": 15.9, "elapsed_time": "6:45:09", "remaining_time": "1 day, 11:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2854, "total_steps": 17941, "loss": 1.9891, "learning_rate": 9.491682154239589e-05, "epoch": 0.1590769745276183, "percentage": 15.91, "elapsed_time": "6:45:18", "remaining_time": "1 day, 11:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2855, "total_steps": 17941, "loss": 1.9522, "learning_rate": 9.491290912652344e-05, "epoch": 0.15913271278078145, "percentage": 15.91, "elapsed_time": "6:45:26", "remaining_time": "1 day, 11:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2856, "total_steps": 17941, "loss": 2.0334, "learning_rate": 9.490899528627536e-05, "epoch": 0.1591884510339446, "percentage": 15.92, "elapsed_time": "6:45:34", "remaining_time": "1 day, 11:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2857, "total_steps": 17941, "loss": 1.8532, "learning_rate": 9.490508002177579e-05, "epoch": 0.15924418928710773, "percentage": 15.92, "elapsed_time": "6:45:43", "remaining_time": "1 day, 11:42:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2858, "total_steps": 17941, "loss": 1.6041, "learning_rate": 9.490116333314889e-05, "epoch": 0.1592999275402709, "percentage": 15.93, "elapsed_time": "6:45:51", "remaining_time": "1 day, 11:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2859, "total_steps": 17941, "loss": 1.9383, "learning_rate": 9.489724522051888e-05, "epoch": 0.15935566579343402, "percentage": 15.94, "elapsed_time": "6:46:00", "remaining_time": "1 day, 11:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2860, "total_steps": 17941, "loss": 1.8919, "learning_rate": 9.489332568401004e-05, "epoch": 0.15941140404659718, "percentage": 15.94, "elapsed_time": "6:46:08", "remaining_time": "1 day, 11:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2861, "total_steps": 17941, "loss": 1.8347, "learning_rate": 9.488940472374663e-05, "epoch": 0.15946714229976033, "percentage": 15.95, "elapsed_time": "6:46:17", "remaining_time": "1 day, 11:41:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2862, "total_steps": 17941, "loss": 1.697, "learning_rate": 9.488548233985305e-05, "epoch": 0.15952288055292346, "percentage": 15.95, "elapsed_time": "6:46:25", "remaining_time": "1 day, 11:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2863, "total_steps": 17941, "loss": 1.9557, "learning_rate": 9.488155853245366e-05, "epoch": 0.15957861880608662, "percentage": 15.96, "elapsed_time": "6:46:34", "remaining_time": "1 day, 11:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2864, "total_steps": 17941, "loss": 1.6364, "learning_rate": 9.487763330167291e-05, "epoch": 0.15963435705924978, "percentage": 15.96, "elapsed_time": "6:46:42", "remaining_time": "1 day, 11:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2865, "total_steps": 17941, "loss": 1.7917, "learning_rate": 9.487370664763529e-05, "epoch": 0.1596900953124129, "percentage": 15.97, "elapsed_time": "6:46:51", "remaining_time": "1 day, 11:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2866, "total_steps": 17941, "loss": 1.8552, "learning_rate": 9.486977857046532e-05, "epoch": 0.15974583356557606, "percentage": 15.97, "elapsed_time": "6:46:59", "remaining_time": "1 day, 11:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2867, "total_steps": 17941, "loss": 1.6089, "learning_rate": 9.486584907028758e-05, "epoch": 0.1598015718187392, "percentage": 15.98, "elapsed_time": "6:47:08", "remaining_time": "1 day, 11:40:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2868, "total_steps": 17941, "loss": 1.5357, "learning_rate": 9.48619181472267e-05, "epoch": 0.15985731007190235, "percentage": 15.99, "elapsed_time": "6:47:16", "remaining_time": "1 day, 11:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2869, "total_steps": 17941, "loss": 1.7628, "learning_rate": 9.485798580140735e-05, "epoch": 0.1599130483250655, "percentage": 15.99, "elapsed_time": "6:47:24", "remaining_time": "1 day, 11:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2870, "total_steps": 17941, "loss": 1.6318, "learning_rate": 9.485405203295421e-05, "epoch": 0.15996878657822863, "percentage": 16.0, "elapsed_time": "6:47:33", "remaining_time": "1 day, 11:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2871, "total_steps": 17941, "loss": 1.6422, "learning_rate": 9.485011684199207e-05, "epoch": 0.1600245248313918, "percentage": 16.0, "elapsed_time": "6:47:41", "remaining_time": "1 day, 11:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2872, "total_steps": 17941, "loss": 1.5466, "learning_rate": 9.484618022864571e-05, "epoch": 0.16008026308455492, "percentage": 16.01, "elapsed_time": "6:47:50", "remaining_time": "1 day, 11:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2873, "total_steps": 17941, "loss": 2.0925, "learning_rate": 9.484224219304e-05, "epoch": 0.16013600133771808, "percentage": 16.01, "elapsed_time": "6:47:58", "remaining_time": "1 day, 11:39:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2874, "total_steps": 17941, "loss": 1.6183, "learning_rate": 9.48383027352998e-05, "epoch": 0.16019173959088123, "percentage": 16.02, "elapsed_time": "6:48:07", "remaining_time": "1 day, 11:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2875, "total_steps": 17941, "loss": 1.5593, "learning_rate": 9.483436185555007e-05, "epoch": 0.16024747784404436, "percentage": 16.02, "elapsed_time": "6:48:15", "remaining_time": "1 day, 11:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2876, "total_steps": 17941, "loss": 1.7093, "learning_rate": 9.483041955391578e-05, "epoch": 0.16030321609720752, "percentage": 16.03, "elapsed_time": "6:48:24", "remaining_time": "1 day, 11:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2877, "total_steps": 17941, "loss": 1.7555, "learning_rate": 9.482647583052196e-05, "epoch": 0.16035895435037065, "percentage": 16.04, "elapsed_time": "6:48:33", "remaining_time": "1 day, 11:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2878, "total_steps": 17941, "loss": 1.7709, "learning_rate": 9.48225306854937e-05, "epoch": 0.1604146926035338, "percentage": 16.04, "elapsed_time": "6:48:41", "remaining_time": "1 day, 11:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2879, "total_steps": 17941, "loss": 1.7296, "learning_rate": 9.481858411895608e-05, "epoch": 0.16047043085669696, "percentage": 16.05, "elapsed_time": "6:48:49", "remaining_time": "1 day, 11:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2880, "total_steps": 17941, "loss": 1.7808, "learning_rate": 9.481463613103429e-05, "epoch": 0.1605261691098601, "percentage": 16.05, "elapsed_time": "6:48:58", "remaining_time": "1 day, 11:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2881, "total_steps": 17941, "loss": 1.6362, "learning_rate": 9.481068672185353e-05, "epoch": 0.16058190736302325, "percentage": 16.06, "elapsed_time": "6:49:06", "remaining_time": "1 day, 11:38:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2882, "total_steps": 17941, "loss": 1.5913, "learning_rate": 9.480673589153904e-05, "epoch": 0.16063764561618638, "percentage": 16.06, "elapsed_time": "6:49:15", "remaining_time": "1 day, 11:38:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2883, "total_steps": 17941, "loss": 1.6744, "learning_rate": 9.480278364021614e-05, "epoch": 0.16069338386934953, "percentage": 16.07, "elapsed_time": "6:49:24", "remaining_time": "1 day, 11:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2884, "total_steps": 17941, "loss": 1.5185, "learning_rate": 9.479882996801017e-05, "epoch": 0.1607491221225127, "percentage": 16.07, "elapsed_time": "6:49:32", "remaining_time": "1 day, 11:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2885, "total_steps": 17941, "loss": 1.5259, "learning_rate": 9.479487487504649e-05, "epoch": 0.16080486037567582, "percentage": 16.08, "elapsed_time": "6:49:41", "remaining_time": "1 day, 11:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2886, "total_steps": 17941, "loss": 1.7626, "learning_rate": 9.479091836145057e-05, "epoch": 0.16086059862883897, "percentage": 16.09, "elapsed_time": "6:49:49", "remaining_time": "1 day, 11:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2887, "total_steps": 17941, "loss": 1.6936, "learning_rate": 9.478696042734785e-05, "epoch": 0.16091633688200213, "percentage": 16.09, "elapsed_time": "6:49:57", "remaining_time": "1 day, 11:37:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2888, "total_steps": 17941, "loss": 1.4811, "learning_rate": 9.478300107286389e-05, "epoch": 0.16097207513516526, "percentage": 16.1, "elapsed_time": "6:50:06", "remaining_time": "1 day, 11:37:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2889, "total_steps": 17941, "loss": 1.7184, "learning_rate": 9.477904029812422e-05, "epoch": 0.16102781338832842, "percentage": 16.1, "elapsed_time": "6:50:14", "remaining_time": "1 day, 11:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2890, "total_steps": 17941, "loss": 1.4053, "learning_rate": 9.477507810325448e-05, "epoch": 0.16108355164149155, "percentage": 16.11, "elapsed_time": "6:50:23", "remaining_time": "1 day, 11:37:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2891, "total_steps": 17941, "loss": 2.0827, "learning_rate": 9.477111448838031e-05, "epoch": 0.1611392898946547, "percentage": 16.11, "elapsed_time": "6:50:31", "remaining_time": "1 day, 11:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2892, "total_steps": 17941, "loss": 1.8864, "learning_rate": 9.476714945362745e-05, "epoch": 0.16119502814781786, "percentage": 16.12, "elapsed_time": "6:50:40", "remaining_time": "1 day, 11:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2893, "total_steps": 17941, "loss": 1.9475, "learning_rate": 9.47631829991216e-05, "epoch": 0.161250766400981, "percentage": 16.13, "elapsed_time": "6:50:48", "remaining_time": "1 day, 11:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2894, "total_steps": 17941, "loss": 1.9044, "learning_rate": 9.475921512498857e-05, "epoch": 0.16130650465414414, "percentage": 16.13, "elapsed_time": "6:50:57", "remaining_time": "1 day, 11:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2895, "total_steps": 17941, "loss": 1.5211, "learning_rate": 9.475524583135421e-05, "epoch": 0.16136224290730727, "percentage": 16.14, "elapsed_time": "6:51:05", "remaining_time": "1 day, 11:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2896, "total_steps": 17941, "loss": 1.7724, "learning_rate": 9.475127511834438e-05, "epoch": 0.16141798116047043, "percentage": 16.14, "elapsed_time": "6:51:13", "remaining_time": "1 day, 11:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2897, "total_steps": 17941, "loss": 1.8392, "learning_rate": 9.474730298608504e-05, "epoch": 0.1614737194136336, "percentage": 16.15, "elapsed_time": "6:51:22", "remaining_time": "1 day, 11:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2898, "total_steps": 17941, "loss": 1.7909, "learning_rate": 9.474332943470213e-05, "epoch": 0.16152945766679672, "percentage": 16.15, "elapsed_time": "6:51:30", "remaining_time": "1 day, 11:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2899, "total_steps": 17941, "loss": 1.9106, "learning_rate": 9.47393544643217e-05, "epoch": 0.16158519591995987, "percentage": 16.16, "elapsed_time": "6:51:39", "remaining_time": "1 day, 11:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2900, "total_steps": 17941, "loss": 1.922, "learning_rate": 9.473537807506977e-05, "epoch": 0.161640934173123, "percentage": 16.16, "elapsed_time": "6:51:47", "remaining_time": "1 day, 11:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2901, "total_steps": 17941, "loss": 1.5719, "learning_rate": 9.47314002670725e-05, "epoch": 0.16169667242628616, "percentage": 16.17, "elapsed_time": "6:51:56", "remaining_time": "1 day, 11:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2902, "total_steps": 17941, "loss": 1.6517, "learning_rate": 9.472742104045599e-05, "epoch": 0.16175241067944932, "percentage": 16.18, "elapsed_time": "6:52:04", "remaining_time": "1 day, 11:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2903, "total_steps": 17941, "loss": 1.7661, "learning_rate": 9.472344039534646e-05, "epoch": 0.16180814893261244, "percentage": 16.18, "elapsed_time": "6:52:13", "remaining_time": "1 day, 11:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2904, "total_steps": 17941, "loss": 1.6874, "learning_rate": 9.471945833187018e-05, "epoch": 0.1618638871857756, "percentage": 16.19, "elapsed_time": "6:52:21", "remaining_time": "1 day, 11:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2905, "total_steps": 17941, "loss": 1.6745, "learning_rate": 9.471547485015341e-05, "epoch": 0.16191962543893873, "percentage": 16.19, "elapsed_time": "6:52:29", "remaining_time": "1 day, 11:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2906, "total_steps": 17941, "loss": 1.7141, "learning_rate": 9.471148995032247e-05, "epoch": 0.1619753636921019, "percentage": 16.2, "elapsed_time": "6:52:38", "remaining_time": "1 day, 11:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2907, "total_steps": 17941, "loss": 1.595, "learning_rate": 9.470750363250378e-05, "epoch": 0.16203110194526504, "percentage": 16.2, "elapsed_time": "6:52:46", "remaining_time": "1 day, 11:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2908, "total_steps": 17941, "loss": 1.8687, "learning_rate": 9.470351589682372e-05, "epoch": 0.16208684019842817, "percentage": 16.21, "elapsed_time": "6:52:55", "remaining_time": "1 day, 11:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2909, "total_steps": 17941, "loss": 1.8964, "learning_rate": 9.469952674340877e-05, "epoch": 0.16214257845159133, "percentage": 16.21, "elapsed_time": "6:53:03", "remaining_time": "1 day, 11:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2910, "total_steps": 17941, "loss": 1.6171, "learning_rate": 9.469553617238546e-05, "epoch": 0.16219831670475449, "percentage": 16.22, "elapsed_time": "6:53:12", "remaining_time": "1 day, 11:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2911, "total_steps": 17941, "loss": 1.7592, "learning_rate": 9.469154418388034e-05, "epoch": 0.16225405495791762, "percentage": 16.23, "elapsed_time": "6:53:20", "remaining_time": "1 day, 11:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2912, "total_steps": 17941, "loss": 1.6709, "learning_rate": 9.468755077801999e-05, "epoch": 0.16230979321108077, "percentage": 16.23, "elapsed_time": "6:53:29", "remaining_time": "1 day, 11:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2913, "total_steps": 17941, "loss": 1.7304, "learning_rate": 9.468355595493109e-05, "epoch": 0.1623655314642439, "percentage": 16.24, "elapsed_time": "6:53:37", "remaining_time": "1 day, 11:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2914, "total_steps": 17941, "loss": 1.7252, "learning_rate": 9.467955971474031e-05, "epoch": 0.16242126971740706, "percentage": 16.24, "elapsed_time": "6:53:46", "remaining_time": "1 day, 11:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2915, "total_steps": 17941, "loss": 1.7643, "learning_rate": 9.46755620575744e-05, "epoch": 0.16247700797057021, "percentage": 16.25, "elapsed_time": "6:53:54", "remaining_time": "1 day, 11:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2916, "total_steps": 17941, "loss": 1.7263, "learning_rate": 9.467156298356015e-05, "epoch": 0.16253274622373334, "percentage": 16.25, "elapsed_time": "6:54:02", "remaining_time": "1 day, 11:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2917, "total_steps": 17941, "loss": 1.7771, "learning_rate": 9.466756249282435e-05, "epoch": 0.1625884844768965, "percentage": 16.26, "elapsed_time": "6:54:11", "remaining_time": "1 day, 11:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2918, "total_steps": 17941, "loss": 1.7372, "learning_rate": 9.466356058549393e-05, "epoch": 0.16264422273005963, "percentage": 16.26, "elapsed_time": "6:54:19", "remaining_time": "1 day, 11:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2919, "total_steps": 17941, "loss": 1.7296, "learning_rate": 9.465955726169575e-05, "epoch": 0.16269996098322279, "percentage": 16.27, "elapsed_time": "6:54:28", "remaining_time": "1 day, 11:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2920, "total_steps": 17941, "loss": 1.7907, "learning_rate": 9.46555525215568e-05, "epoch": 0.16275569923638594, "percentage": 16.28, "elapsed_time": "6:54:36", "remaining_time": "1 day, 11:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2921, "total_steps": 17941, "loss": 1.8558, "learning_rate": 9.46515463652041e-05, "epoch": 0.16281143748954907, "percentage": 16.28, "elapsed_time": "6:54:45", "remaining_time": "1 day, 11:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2922, "total_steps": 17941, "loss": 1.8673, "learning_rate": 9.464753879276467e-05, "epoch": 0.16286717574271223, "percentage": 16.29, "elapsed_time": "6:54:53", "remaining_time": "1 day, 11:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2923, "total_steps": 17941, "loss": 1.8252, "learning_rate": 9.464352980436562e-05, "epoch": 0.16292291399587536, "percentage": 16.29, "elapsed_time": "6:55:02", "remaining_time": "1 day, 11:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2924, "total_steps": 17941, "loss": 1.564, "learning_rate": 9.463951940013411e-05, "epoch": 0.1629786522490385, "percentage": 16.3, "elapsed_time": "6:55:10", "remaining_time": "1 day, 11:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2925, "total_steps": 17941, "loss": 1.731, "learning_rate": 9.46355075801973e-05, "epoch": 0.16303439050220167, "percentage": 16.3, "elapsed_time": "6:55:18", "remaining_time": "1 day, 11:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2926, "total_steps": 17941, "loss": 1.7954, "learning_rate": 9.463149434468244e-05, "epoch": 0.1630901287553648, "percentage": 16.31, "elapsed_time": "6:55:27", "remaining_time": "1 day, 11:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2927, "total_steps": 17941, "loss": 1.6639, "learning_rate": 9.46274796937168e-05, "epoch": 0.16314586700852796, "percentage": 16.31, "elapsed_time": "6:55:35", "remaining_time": "1 day, 11:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2928, "total_steps": 17941, "loss": 1.5104, "learning_rate": 9.462346362742767e-05, "epoch": 0.16320160526169109, "percentage": 16.32, "elapsed_time": "6:55:45", "remaining_time": "1 day, 11:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2929, "total_steps": 17941, "loss": 1.7081, "learning_rate": 9.461944614594248e-05, "epoch": 0.16325734351485424, "percentage": 16.33, "elapsed_time": "6:55:53", "remaining_time": "1 day, 11:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2930, "total_steps": 17941, "loss": 1.8709, "learning_rate": 9.461542724938859e-05, "epoch": 0.1633130817680174, "percentage": 16.33, "elapsed_time": "6:56:02", "remaining_time": "1 day, 11:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2931, "total_steps": 17941, "loss": 1.7861, "learning_rate": 9.461140693789349e-05, "epoch": 0.16336882002118053, "percentage": 16.34, "elapsed_time": "6:56:10", "remaining_time": "1 day, 11:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2932, "total_steps": 17941, "loss": 1.745, "learning_rate": 9.460738521158466e-05, "epoch": 0.16342455827434368, "percentage": 16.34, "elapsed_time": "6:56:19", "remaining_time": "1 day, 11:31:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2933, "total_steps": 17941, "loss": 1.8071, "learning_rate": 9.460336207058964e-05, "epoch": 0.16348029652750684, "percentage": 16.35, "elapsed_time": "6:56:27", "remaining_time": "1 day, 11:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2934, "total_steps": 17941, "loss": 1.7359, "learning_rate": 9.459933751503604e-05, "epoch": 0.16353603478066997, "percentage": 16.35, "elapsed_time": "6:56:35", "remaining_time": "1 day, 11:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2935, "total_steps": 17941, "loss": 1.6545, "learning_rate": 9.459531154505147e-05, "epoch": 0.16359177303383313, "percentage": 16.36, "elapsed_time": "6:56:44", "remaining_time": "1 day, 11:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2936, "total_steps": 17941, "loss": 1.5666, "learning_rate": 9.459128416076365e-05, "epoch": 0.16364751128699626, "percentage": 16.36, "elapsed_time": "6:56:52", "remaining_time": "1 day, 11:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2937, "total_steps": 17941, "loss": 1.8546, "learning_rate": 9.458725536230027e-05, "epoch": 0.1637032495401594, "percentage": 16.37, "elapsed_time": "6:57:01", "remaining_time": "1 day, 11:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2938, "total_steps": 17941, "loss": 1.6707, "learning_rate": 9.458322514978912e-05, "epoch": 0.16375898779332257, "percentage": 16.38, "elapsed_time": "6:57:09", "remaining_time": "1 day, 11:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2939, "total_steps": 17941, "loss": 1.6807, "learning_rate": 9.4579193523358e-05, "epoch": 0.1638147260464857, "percentage": 16.38, "elapsed_time": "6:57:18", "remaining_time": "1 day, 11:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2940, "total_steps": 17941, "loss": 1.7966, "learning_rate": 9.457516048313478e-05, "epoch": 0.16387046429964885, "percentage": 16.39, "elapsed_time": "6:57:26", "remaining_time": "1 day, 11:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2941, "total_steps": 17941, "loss": 1.8103, "learning_rate": 9.457112602924735e-05, "epoch": 0.16392620255281198, "percentage": 16.39, "elapsed_time": "6:57:35", "remaining_time": "1 day, 11:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2942, "total_steps": 17941, "loss": 1.7992, "learning_rate": 9.456709016182368e-05, "epoch": 0.16398194080597514, "percentage": 16.4, "elapsed_time": "6:57:43", "remaining_time": "1 day, 11:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2943, "total_steps": 17941, "loss": 1.8232, "learning_rate": 9.456305288099174e-05, "epoch": 0.1640376790591383, "percentage": 16.4, "elapsed_time": "6:57:52", "remaining_time": "1 day, 11:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2944, "total_steps": 17941, "loss": 1.8106, "learning_rate": 9.45590141868796e-05, "epoch": 0.16409341731230143, "percentage": 16.41, "elapsed_time": "6:58:00", "remaining_time": "1 day, 11:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2945, "total_steps": 17941, "loss": 1.6316, "learning_rate": 9.455497407961532e-05, "epoch": 0.16414915556546458, "percentage": 16.41, "elapsed_time": "6:58:09", "remaining_time": "1 day, 11:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2946, "total_steps": 17941, "loss": 1.4846, "learning_rate": 9.455093255932704e-05, "epoch": 0.1642048938186277, "percentage": 16.42, "elapsed_time": "6:58:18", "remaining_time": "1 day, 11:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2947, "total_steps": 17941, "loss": 1.7717, "learning_rate": 9.454688962614293e-05, "epoch": 0.16426063207179087, "percentage": 16.43, "elapsed_time": "6:58:26", "remaining_time": "1 day, 11:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2948, "total_steps": 17941, "loss": 1.8829, "learning_rate": 9.45428452801912e-05, "epoch": 0.16431637032495403, "percentage": 16.43, "elapsed_time": "6:58:34", "remaining_time": "1 day, 11:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2949, "total_steps": 17941, "loss": 1.8933, "learning_rate": 9.453879952160013e-05, "epoch": 0.16437210857811715, "percentage": 16.44, "elapsed_time": "6:58:43", "remaining_time": "1 day, 11:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2950, "total_steps": 17941, "loss": 1.6009, "learning_rate": 9.4534752350498e-05, "epoch": 0.1644278468312803, "percentage": 16.44, "elapsed_time": "6:58:51", "remaining_time": "1 day, 11:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2951, "total_steps": 17941, "loss": 1.9932, "learning_rate": 9.45307037670132e-05, "epoch": 0.16448358508444344, "percentage": 16.45, "elapsed_time": "6:59:00", "remaining_time": "1 day, 11:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2952, "total_steps": 17941, "loss": 1.9729, "learning_rate": 9.452665377127409e-05, "epoch": 0.1645393233376066, "percentage": 16.45, "elapsed_time": "6:59:08", "remaining_time": "1 day, 11:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2953, "total_steps": 17941, "loss": 1.8995, "learning_rate": 9.452260236340915e-05, "epoch": 0.16459506159076975, "percentage": 16.46, "elapsed_time": "6:59:17", "remaining_time": "1 day, 11:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2954, "total_steps": 17941, "loss": 1.8313, "learning_rate": 9.451854954354684e-05, "epoch": 0.16465079984393288, "percentage": 16.47, "elapsed_time": "6:59:25", "remaining_time": "1 day, 11:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2955, "total_steps": 17941, "loss": 1.6307, "learning_rate": 9.451449531181572e-05, "epoch": 0.16470653809709604, "percentage": 16.47, "elapsed_time": "6:59:34", "remaining_time": "1 day, 11:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2956, "total_steps": 17941, "loss": 1.7253, "learning_rate": 9.451043966834431e-05, "epoch": 0.1647622763502592, "percentage": 16.48, "elapsed_time": "6:59:42", "remaining_time": "1 day, 11:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2957, "total_steps": 17941, "loss": 1.5122, "learning_rate": 9.450638261326128e-05, "epoch": 0.16481801460342232, "percentage": 16.48, "elapsed_time": "6:59:51", "remaining_time": "1 day, 11:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2958, "total_steps": 17941, "loss": 1.7602, "learning_rate": 9.450232414669528e-05, "epoch": 0.16487375285658548, "percentage": 16.49, "elapsed_time": "6:59:59", "remaining_time": "1 day, 11:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2959, "total_steps": 17941, "loss": 1.9841, "learning_rate": 9.449826426877504e-05, "epoch": 0.1649294911097486, "percentage": 16.49, "elapsed_time": "7:00:08", "remaining_time": "1 day, 11:27:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2960, "total_steps": 17941, "loss": 1.7965, "learning_rate": 9.44942029796293e-05, "epoch": 0.16498522936291177, "percentage": 16.5, "elapsed_time": "7:00:16", "remaining_time": "1 day, 11:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2961, "total_steps": 17941, "loss": 2.1267, "learning_rate": 9.449014027938685e-05, "epoch": 0.16504096761607492, "percentage": 16.5, "elapsed_time": "7:00:25", "remaining_time": "1 day, 11:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2962, "total_steps": 17941, "loss": 1.7952, "learning_rate": 9.448607616817655e-05, "epoch": 0.16509670586923805, "percentage": 16.51, "elapsed_time": "7:00:33", "remaining_time": "1 day, 11:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2963, "total_steps": 17941, "loss": 1.8026, "learning_rate": 9.448201064612728e-05, "epoch": 0.1651524441224012, "percentage": 16.52, "elapsed_time": "7:00:42", "remaining_time": "1 day, 11:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2964, "total_steps": 17941, "loss": 2.1377, "learning_rate": 9.447794371336799e-05, "epoch": 0.16520818237556434, "percentage": 16.52, "elapsed_time": "7:00:50", "remaining_time": "1 day, 11:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2965, "total_steps": 17941, "loss": 1.9586, "learning_rate": 9.447387537002765e-05, "epoch": 0.1652639206287275, "percentage": 16.53, "elapsed_time": "7:00:58", "remaining_time": "1 day, 11:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2966, "total_steps": 17941, "loss": 1.4828, "learning_rate": 9.446980561623527e-05, "epoch": 0.16531965888189065, "percentage": 16.53, "elapsed_time": "7:01:08", "remaining_time": "1 day, 11:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2967, "total_steps": 17941, "loss": 1.789, "learning_rate": 9.446573445211994e-05, "epoch": 0.16537539713505378, "percentage": 16.54, "elapsed_time": "7:01:16", "remaining_time": "1 day, 11:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2968, "total_steps": 17941, "loss": 1.709, "learning_rate": 9.446166187781077e-05, "epoch": 0.16543113538821694, "percentage": 16.54, "elapsed_time": "7:01:24", "remaining_time": "1 day, 11:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2969, "total_steps": 17941, "loss": 1.6335, "learning_rate": 9.445758789343691e-05, "epoch": 0.16548687364138007, "percentage": 16.55, "elapsed_time": "7:01:33", "remaining_time": "1 day, 11:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2970, "total_steps": 17941, "loss": 1.6666, "learning_rate": 9.445351249912757e-05, "epoch": 0.16554261189454322, "percentage": 16.55, "elapsed_time": "7:01:41", "remaining_time": "1 day, 11:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2971, "total_steps": 17941, "loss": 1.9109, "learning_rate": 9.4449435695012e-05, "epoch": 0.16559835014770638, "percentage": 16.56, "elapsed_time": "7:01:50", "remaining_time": "1 day, 11:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2972, "total_steps": 17941, "loss": 1.781, "learning_rate": 9.444535748121949e-05, "epoch": 0.1656540884008695, "percentage": 16.57, "elapsed_time": "7:01:58", "remaining_time": "1 day, 11:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2973, "total_steps": 17941, "loss": 1.7213, "learning_rate": 9.444127785787938e-05, "epoch": 0.16570982665403267, "percentage": 16.57, "elapsed_time": "7:02:07", "remaining_time": "1 day, 11:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2974, "total_steps": 17941, "loss": 1.8224, "learning_rate": 9.443719682512102e-05, "epoch": 0.1657655649071958, "percentage": 16.58, "elapsed_time": "7:02:15", "remaining_time": "1 day, 11:25:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2975, "total_steps": 17941, "loss": 1.8449, "learning_rate": 9.443311438307389e-05, "epoch": 0.16582130316035895, "percentage": 16.58, "elapsed_time": "7:02:24", "remaining_time": "1 day, 11:24:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2976, "total_steps": 17941, "loss": 1.6679, "learning_rate": 9.442903053186743e-05, "epoch": 0.1658770414135221, "percentage": 16.59, "elapsed_time": "7:02:32", "remaining_time": "1 day, 11:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2977, "total_steps": 17941, "loss": 1.6812, "learning_rate": 9.442494527163115e-05, "epoch": 0.16593277966668524, "percentage": 16.59, "elapsed_time": "7:02:41", "remaining_time": "1 day, 11:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2978, "total_steps": 17941, "loss": 1.7849, "learning_rate": 9.442085860249461e-05, "epoch": 0.1659885179198484, "percentage": 16.6, "elapsed_time": "7:02:49", "remaining_time": "1 day, 11:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2979, "total_steps": 17941, "loss": 1.8582, "learning_rate": 9.441677052458745e-05, "epoch": 0.16604425617301155, "percentage": 16.6, "elapsed_time": "7:02:58", "remaining_time": "1 day, 11:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2980, "total_steps": 17941, "loss": 2.0226, "learning_rate": 9.441268103803928e-05, "epoch": 0.16609999442617468, "percentage": 16.61, "elapsed_time": "7:03:06", "remaining_time": "1 day, 11:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2981, "total_steps": 17941, "loss": 1.577, "learning_rate": 9.440859014297982e-05, "epoch": 0.16615573267933784, "percentage": 16.62, "elapsed_time": "7:03:14", "remaining_time": "1 day, 11:24:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2982, "total_steps": 17941, "loss": 1.7272, "learning_rate": 9.440449783953883e-05, "epoch": 0.16621147093250097, "percentage": 16.62, "elapsed_time": "7:03:23", "remaining_time": "1 day, 11:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2983, "total_steps": 17941, "loss": 1.7481, "learning_rate": 9.440040412784603e-05, "epoch": 0.16626720918566412, "percentage": 16.63, "elapsed_time": "7:03:31", "remaining_time": "1 day, 11:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2984, "total_steps": 17941, "loss": 1.9244, "learning_rate": 9.439630900803129e-05, "epoch": 0.16632294743882728, "percentage": 16.63, "elapsed_time": "7:03:40", "remaining_time": "1 day, 11:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2985, "total_steps": 17941, "loss": 1.5845, "learning_rate": 9.439221248022447e-05, "epoch": 0.1663786856919904, "percentage": 16.64, "elapsed_time": "7:03:48", "remaining_time": "1 day, 11:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2986, "total_steps": 17941, "loss": 1.8841, "learning_rate": 9.43881145445555e-05, "epoch": 0.16643442394515356, "percentage": 16.64, "elapsed_time": "7:03:57", "remaining_time": "1 day, 11:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2987, "total_steps": 17941, "loss": 1.7537, "learning_rate": 9.438401520115434e-05, "epoch": 0.1664901621983167, "percentage": 16.65, "elapsed_time": "7:04:06", "remaining_time": "1 day, 11:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2988, "total_steps": 17941, "loss": 1.9331, "learning_rate": 9.4379914450151e-05, "epoch": 0.16654590045147985, "percentage": 16.65, "elapsed_time": "7:04:14", "remaining_time": "1 day, 11:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2989, "total_steps": 17941, "loss": 1.5948, "learning_rate": 9.437581229167551e-05, "epoch": 0.166601638704643, "percentage": 16.66, "elapsed_time": "7:04:23", "remaining_time": "1 day, 11:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2990, "total_steps": 17941, "loss": 1.7629, "learning_rate": 9.4371708725858e-05, "epoch": 0.16665737695780614, "percentage": 16.67, "elapsed_time": "7:04:31", "remaining_time": "1 day, 11:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2991, "total_steps": 17941, "loss": 1.766, "learning_rate": 9.436760375282859e-05, "epoch": 0.1667131152109693, "percentage": 16.67, "elapsed_time": "7:04:40", "remaining_time": "1 day, 11:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2992, "total_steps": 17941, "loss": 1.8319, "learning_rate": 9.436349737271745e-05, "epoch": 0.16676885346413242, "percentage": 16.68, "elapsed_time": "7:04:48", "remaining_time": "1 day, 11:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2993, "total_steps": 17941, "loss": 1.7975, "learning_rate": 9.435938958565487e-05, "epoch": 0.16682459171729558, "percentage": 16.68, "elapsed_time": "7:04:56", "remaining_time": "1 day, 11:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2994, "total_steps": 17941, "loss": 1.7058, "learning_rate": 9.435528039177105e-05, "epoch": 0.16688032997045874, "percentage": 16.69, "elapsed_time": "7:05:05", "remaining_time": "1 day, 11:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2995, "total_steps": 17941, "loss": 1.7305, "learning_rate": 9.435116979119635e-05, "epoch": 0.16693606822362186, "percentage": 16.69, "elapsed_time": "7:05:14", "remaining_time": "1 day, 11:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2996, "total_steps": 17941, "loss": 1.6901, "learning_rate": 9.434705778406114e-05, "epoch": 0.16699180647678502, "percentage": 16.7, "elapsed_time": "7:05:22", "remaining_time": "1 day, 11:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2997, "total_steps": 17941, "loss": 1.7462, "learning_rate": 9.434294437049582e-05, "epoch": 0.16704754472994815, "percentage": 16.7, "elapsed_time": "7:05:30", "remaining_time": "1 day, 11:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2998, "total_steps": 17941, "loss": 1.7997, "learning_rate": 9.433882955063084e-05, "epoch": 0.1671032829831113, "percentage": 16.71, "elapsed_time": "7:05:39", "remaining_time": "1 day, 11:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2999, "total_steps": 17941, "loss": 1.923, "learning_rate": 9.43347133245967e-05, "epoch": 0.16715902123627446, "percentage": 16.72, "elapsed_time": "7:05:47", "remaining_time": "1 day, 11:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 17941, "loss": 1.7263, "learning_rate": 9.433059569252394e-05, "epoch": 0.1672147594894376, "percentage": 16.72, "elapsed_time": "7:05:56", "remaining_time": "1 day, 11:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3001, "total_steps": 17941, "loss": 1.5881, "learning_rate": 9.432647665454315e-05, "epoch": 0.16727049774260075, "percentage": 16.73, "elapsed_time": "7:06:05", "remaining_time": "1 day, 11:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3002, "total_steps": 17941, "loss": 1.9409, "learning_rate": 9.432235621078497e-05, "epoch": 0.1673262359957639, "percentage": 16.73, "elapsed_time": "7:06:14", "remaining_time": "1 day, 11:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3003, "total_steps": 17941, "loss": 1.8471, "learning_rate": 9.431823436138005e-05, "epoch": 0.16738197424892703, "percentage": 16.74, "elapsed_time": "7:06:22", "remaining_time": "1 day, 11:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3004, "total_steps": 17941, "loss": 1.6844, "learning_rate": 9.431411110645915e-05, "epoch": 0.1674377125020902, "percentage": 16.74, "elapsed_time": "7:06:31", "remaining_time": "1 day, 11:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3005, "total_steps": 17941, "loss": 1.7333, "learning_rate": 9.4309986446153e-05, "epoch": 0.16749345075525332, "percentage": 16.75, "elapsed_time": "7:06:39", "remaining_time": "1 day, 11:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3006, "total_steps": 17941, "loss": 1.9837, "learning_rate": 9.430586038059244e-05, "epoch": 0.16754918900841648, "percentage": 16.75, "elapsed_time": "7:06:47", "remaining_time": "1 day, 11:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3007, "total_steps": 17941, "loss": 1.7391, "learning_rate": 9.430173290990829e-05, "epoch": 0.16760492726157963, "percentage": 16.76, "elapsed_time": "7:06:56", "remaining_time": "1 day, 11:20:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3008, "total_steps": 17941, "loss": 1.5325, "learning_rate": 9.429760403423148e-05, "epoch": 0.16766066551474276, "percentage": 16.77, "elapsed_time": "7:07:04", "remaining_time": "1 day, 11:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3009, "total_steps": 17941, "loss": 1.5849, "learning_rate": 9.429347375369295e-05, "epoch": 0.16771640376790592, "percentage": 16.77, "elapsed_time": "7:07:13", "remaining_time": "1 day, 11:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3010, "total_steps": 17941, "loss": 1.7995, "learning_rate": 9.428934206842365e-05, "epoch": 0.16777214202106905, "percentage": 16.78, "elapsed_time": "7:07:21", "remaining_time": "1 day, 11:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3011, "total_steps": 17941, "loss": 1.7941, "learning_rate": 9.428520897855469e-05, "epoch": 0.1678278802742322, "percentage": 16.78, "elapsed_time": "7:07:30", "remaining_time": "1 day, 11:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3012, "total_steps": 17941, "loss": 1.8987, "learning_rate": 9.428107448421708e-05, "epoch": 0.16788361852739536, "percentage": 16.79, "elapsed_time": "7:07:38", "remaining_time": "1 day, 11:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3013, "total_steps": 17941, "loss": 1.2377, "learning_rate": 9.427693858554196e-05, "epoch": 0.1679393567805585, "percentage": 16.79, "elapsed_time": "7:07:47", "remaining_time": "1 day, 11:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3014, "total_steps": 17941, "loss": 1.8915, "learning_rate": 9.42728012826605e-05, "epoch": 0.16799509503372165, "percentage": 16.8, "elapsed_time": "7:07:55", "remaining_time": "1 day, 11:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3015, "total_steps": 17941, "loss": 1.9298, "learning_rate": 9.426866257570391e-05, "epoch": 0.16805083328688478, "percentage": 16.81, "elapsed_time": "7:08:04", "remaining_time": "1 day, 11:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3016, "total_steps": 17941, "loss": 1.6459, "learning_rate": 9.426452246480347e-05, "epoch": 0.16810657154004793, "percentage": 16.81, "elapsed_time": "7:08:12", "remaining_time": "1 day, 11:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3017, "total_steps": 17941, "loss": 1.8506, "learning_rate": 9.426038095009042e-05, "epoch": 0.1681623097932111, "percentage": 16.82, "elapsed_time": "7:08:21", "remaining_time": "1 day, 11:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3018, "total_steps": 17941, "loss": 1.5642, "learning_rate": 9.425623803169616e-05, "epoch": 0.16821804804637422, "percentage": 16.82, "elapsed_time": "7:08:30", "remaining_time": "1 day, 11:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3019, "total_steps": 17941, "loss": 1.7475, "learning_rate": 9.425209370975208e-05, "epoch": 0.16827378629953738, "percentage": 16.83, "elapsed_time": "7:08:38", "remaining_time": "1 day, 11:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3020, "total_steps": 17941, "loss": 1.8123, "learning_rate": 9.424794798438958e-05, "epoch": 0.1683295245527005, "percentage": 16.83, "elapsed_time": "7:08:47", "remaining_time": "1 day, 11:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3021, "total_steps": 17941, "loss": 1.9773, "learning_rate": 9.424380085574015e-05, "epoch": 0.16838526280586366, "percentage": 16.84, "elapsed_time": "7:08:55", "remaining_time": "1 day, 11:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3022, "total_steps": 17941, "loss": 1.8269, "learning_rate": 9.423965232393532e-05, "epoch": 0.16844100105902682, "percentage": 16.84, "elapsed_time": "7:09:04", "remaining_time": "1 day, 11:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3023, "total_steps": 17941, "loss": 1.7838, "learning_rate": 9.423550238910666e-05, "epoch": 0.16849673931218995, "percentage": 16.85, "elapsed_time": "7:09:12", "remaining_time": "1 day, 11:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3024, "total_steps": 17941, "loss": 1.7805, "learning_rate": 9.423135105138577e-05, "epoch": 0.1685524775653531, "percentage": 16.86, "elapsed_time": "7:09:22", "remaining_time": "1 day, 11:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3025, "total_steps": 17941, "loss": 1.8054, "learning_rate": 9.42271983109043e-05, "epoch": 0.16860821581851626, "percentage": 16.86, "elapsed_time": "7:09:30", "remaining_time": "1 day, 11:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3026, "total_steps": 17941, "loss": 1.7666, "learning_rate": 9.422304416779397e-05, "epoch": 0.1686639540716794, "percentage": 16.87, "elapsed_time": "7:09:38", "remaining_time": "1 day, 11:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3027, "total_steps": 17941, "loss": 1.8725, "learning_rate": 9.421888862218651e-05, "epoch": 0.16871969232484255, "percentage": 16.87, "elapsed_time": "7:09:47", "remaining_time": "1 day, 11:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3028, "total_steps": 17941, "loss": 1.873, "learning_rate": 9.421473167421373e-05, "epoch": 0.16877543057800568, "percentage": 16.88, "elapsed_time": "7:09:55", "remaining_time": "1 day, 11:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3029, "total_steps": 17941, "loss": 1.6385, "learning_rate": 9.421057332400744e-05, "epoch": 0.16883116883116883, "percentage": 16.88, "elapsed_time": "7:10:04", "remaining_time": "1 day, 11:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3030, "total_steps": 17941, "loss": 1.758, "learning_rate": 9.420641357169954e-05, "epoch": 0.168886907084332, "percentage": 16.89, "elapsed_time": "7:10:12", "remaining_time": "1 day, 11:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3031, "total_steps": 17941, "loss": 1.829, "learning_rate": 9.420225241742193e-05, "epoch": 0.16894264533749512, "percentage": 16.89, "elapsed_time": "7:10:21", "remaining_time": "1 day, 11:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3032, "total_steps": 17941, "loss": 1.7447, "learning_rate": 9.419808986130661e-05, "epoch": 0.16899838359065827, "percentage": 16.9, "elapsed_time": "7:10:29", "remaining_time": "1 day, 11:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3033, "total_steps": 17941, "loss": 1.7367, "learning_rate": 9.419392590348555e-05, "epoch": 0.1690541218438214, "percentage": 16.91, "elapsed_time": "7:10:38", "remaining_time": "1 day, 11:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3034, "total_steps": 17941, "loss": 1.8542, "learning_rate": 9.418976054409084e-05, "epoch": 0.16910986009698456, "percentage": 16.91, "elapsed_time": "7:10:46", "remaining_time": "1 day, 11:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3035, "total_steps": 17941, "loss": 1.5941, "learning_rate": 9.418559378325457e-05, "epoch": 0.16916559835014772, "percentage": 16.92, "elapsed_time": "7:10:54", "remaining_time": "1 day, 11:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3036, "total_steps": 17941, "loss": 1.6894, "learning_rate": 9.418142562110888e-05, "epoch": 0.16922133660331085, "percentage": 16.92, "elapsed_time": "7:11:03", "remaining_time": "1 day, 11:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3037, "total_steps": 17941, "loss": 1.5647, "learning_rate": 9.417725605778598e-05, "epoch": 0.169277074856474, "percentage": 16.93, "elapsed_time": "7:11:11", "remaining_time": "1 day, 11:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3038, "total_steps": 17941, "loss": 1.7843, "learning_rate": 9.417308509341806e-05, "epoch": 0.16933281310963713, "percentage": 16.93, "elapsed_time": "7:11:20", "remaining_time": "1 day, 11:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3039, "total_steps": 17941, "loss": 1.8156, "learning_rate": 9.416891272813747e-05, "epoch": 0.1693885513628003, "percentage": 16.94, "elapsed_time": "7:11:28", "remaining_time": "1 day, 11:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3040, "total_steps": 17941, "loss": 1.7029, "learning_rate": 9.416473896207645e-05, "epoch": 0.16944428961596344, "percentage": 16.94, "elapsed_time": "7:11:37", "remaining_time": "1 day, 11:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3041, "total_steps": 17941, "loss": 1.8892, "learning_rate": 9.416056379536744e-05, "epoch": 0.16950002786912657, "percentage": 16.95, "elapsed_time": "7:11:45", "remaining_time": "1 day, 11:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3042, "total_steps": 17941, "loss": 1.7344, "learning_rate": 9.415638722814279e-05, "epoch": 0.16955576612228973, "percentage": 16.96, "elapsed_time": "7:11:54", "remaining_time": "1 day, 11:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3043, "total_steps": 17941, "loss": 1.4281, "learning_rate": 9.415220926053501e-05, "epoch": 0.16961150437545286, "percentage": 16.96, "elapsed_time": "7:12:02", "remaining_time": "1 day, 11:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3044, "total_steps": 17941, "loss": 1.772, "learning_rate": 9.414802989267657e-05, "epoch": 0.16966724262861602, "percentage": 16.97, "elapsed_time": "7:12:11", "remaining_time": "1 day, 11:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3045, "total_steps": 17941, "loss": 1.6814, "learning_rate": 9.414384912470002e-05, "epoch": 0.16972298088177917, "percentage": 16.97, "elapsed_time": "7:12:19", "remaining_time": "1 day, 11:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3046, "total_steps": 17941, "loss": 1.7041, "learning_rate": 9.413966695673795e-05, "epoch": 0.1697787191349423, "percentage": 16.98, "elapsed_time": "7:12:28", "remaining_time": "1 day, 11:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3047, "total_steps": 17941, "loss": 1.8597, "learning_rate": 9.413548338892301e-05, "epoch": 0.16983445738810546, "percentage": 16.98, "elapsed_time": "7:12:36", "remaining_time": "1 day, 11:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3048, "total_steps": 17941, "loss": 2.115, "learning_rate": 9.413129842138786e-05, "epoch": 0.16989019564126862, "percentage": 16.99, "elapsed_time": "7:12:45", "remaining_time": "1 day, 11:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3049, "total_steps": 17941, "loss": 1.5559, "learning_rate": 9.412711205426521e-05, "epoch": 0.16994593389443174, "percentage": 16.99, "elapsed_time": "7:12:53", "remaining_time": "1 day, 11:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3050, "total_steps": 17941, "loss": 1.8423, "learning_rate": 9.412292428768787e-05, "epoch": 0.1700016721475949, "percentage": 17.0, "elapsed_time": "7:13:02", "remaining_time": "1 day, 11:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3051, "total_steps": 17941, "loss": 1.6792, "learning_rate": 9.411873512178862e-05, "epoch": 0.17005741040075803, "percentage": 17.01, "elapsed_time": "7:13:10", "remaining_time": "1 day, 11:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3052, "total_steps": 17941, "loss": 1.8432, "learning_rate": 9.41145445567003e-05, "epoch": 0.1701131486539212, "percentage": 17.01, "elapsed_time": "7:13:19", "remaining_time": "1 day, 11:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3053, "total_steps": 17941, "loss": 1.9316, "learning_rate": 9.411035259255585e-05, "epoch": 0.17016888690708434, "percentage": 17.02, "elapsed_time": "7:13:27", "remaining_time": "1 day, 11:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3054, "total_steps": 17941, "loss": 1.8668, "learning_rate": 9.41061592294882e-05, "epoch": 0.17022462516024747, "percentage": 17.02, "elapsed_time": "7:13:36", "remaining_time": "1 day, 11:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3055, "total_steps": 17941, "loss": 1.9025, "learning_rate": 9.410196446763034e-05, "epoch": 0.17028036341341063, "percentage": 17.03, "elapsed_time": "7:13:44", "remaining_time": "1 day, 11:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3056, "total_steps": 17941, "loss": 1.7351, "learning_rate": 9.409776830711528e-05, "epoch": 0.17033610166657376, "percentage": 17.03, "elapsed_time": "7:13:53", "remaining_time": "1 day, 11:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3057, "total_steps": 17941, "loss": 2.0981, "learning_rate": 9.409357074807612e-05, "epoch": 0.17039183991973691, "percentage": 17.04, "elapsed_time": "7:14:01", "remaining_time": "1 day, 11:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3058, "total_steps": 17941, "loss": 1.74, "learning_rate": 9.4089371790646e-05, "epoch": 0.17044757817290007, "percentage": 17.04, "elapsed_time": "7:14:10", "remaining_time": "1 day, 11:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3059, "total_steps": 17941, "loss": 1.7409, "learning_rate": 9.408517143495806e-05, "epoch": 0.1705033164260632, "percentage": 17.05, "elapsed_time": "7:14:18", "remaining_time": "1 day, 11:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3060, "total_steps": 17941, "loss": 1.6624, "learning_rate": 9.40809696811455e-05, "epoch": 0.17055905467922636, "percentage": 17.06, "elapsed_time": "7:14:27", "remaining_time": "1 day, 11:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3061, "total_steps": 17941, "loss": 1.7723, "learning_rate": 9.40767665293416e-05, "epoch": 0.1706147929323895, "percentage": 17.06, "elapsed_time": "7:14:35", "remaining_time": "1 day, 11:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3062, "total_steps": 17941, "loss": 1.771, "learning_rate": 9.407256197967965e-05, "epoch": 0.17067053118555264, "percentage": 17.07, "elapsed_time": "7:14:44", "remaining_time": "1 day, 11:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3063, "total_steps": 17941, "loss": 1.5427, "learning_rate": 9.4068356032293e-05, "epoch": 0.1707262694387158, "percentage": 17.07, "elapsed_time": "7:14:52", "remaining_time": "1 day, 11:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3064, "total_steps": 17941, "loss": 1.7884, "learning_rate": 9.406414868731502e-05, "epoch": 0.17078200769187893, "percentage": 17.08, "elapsed_time": "7:15:01", "remaining_time": "1 day, 11:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3065, "total_steps": 17941, "loss": 1.7756, "learning_rate": 9.405993994487917e-05, "epoch": 0.17083774594504209, "percentage": 17.08, "elapsed_time": "7:15:09", "remaining_time": "1 day, 11:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3066, "total_steps": 17941, "loss": 1.7589, "learning_rate": 9.40557298051189e-05, "epoch": 0.17089348419820521, "percentage": 17.09, "elapsed_time": "7:15:18", "remaining_time": "1 day, 11:11:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3067, "total_steps": 17941, "loss": 1.7427, "learning_rate": 9.405151826816776e-05, "epoch": 0.17094922245136837, "percentage": 17.09, "elapsed_time": "7:15:26", "remaining_time": "1 day, 11:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3068, "total_steps": 17941, "loss": 1.8757, "learning_rate": 9.404730533415929e-05, "epoch": 0.17100496070453153, "percentage": 17.1, "elapsed_time": "7:15:35", "remaining_time": "1 day, 11:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3069, "total_steps": 17941, "loss": 1.8219, "learning_rate": 9.40430910032271e-05, "epoch": 0.17106069895769466, "percentage": 17.11, "elapsed_time": "7:15:43", "remaining_time": "1 day, 11:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3070, "total_steps": 17941, "loss": 1.9808, "learning_rate": 9.403887527550486e-05, "epoch": 0.1711164372108578, "percentage": 17.11, "elapsed_time": "7:15:52", "remaining_time": "1 day, 11:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3071, "total_steps": 17941, "loss": 1.6841, "learning_rate": 9.403465815112626e-05, "epoch": 0.17117217546402097, "percentage": 17.12, "elapsed_time": "7:16:00", "remaining_time": "1 day, 11:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3072, "total_steps": 17941, "loss": 1.5559, "learning_rate": 9.403043963022505e-05, "epoch": 0.1712279137171841, "percentage": 17.12, "elapsed_time": "7:16:09", "remaining_time": "1 day, 11:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3073, "total_steps": 17941, "loss": 1.8316, "learning_rate": 9.4026219712935e-05, "epoch": 0.17128365197034726, "percentage": 17.13, "elapsed_time": "7:16:17", "remaining_time": "1 day, 11:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3074, "total_steps": 17941, "loss": 1.678, "learning_rate": 9.402199839938996e-05, "epoch": 0.17133939022351038, "percentage": 17.13, "elapsed_time": "7:16:26", "remaining_time": "1 day, 11:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3075, "total_steps": 17941, "loss": 1.5931, "learning_rate": 9.401777568972379e-05, "epoch": 0.17139512847667354, "percentage": 17.14, "elapsed_time": "7:16:34", "remaining_time": "1 day, 11:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3076, "total_steps": 17941, "loss": 1.8761, "learning_rate": 9.401355158407042e-05, "epoch": 0.1714508667298367, "percentage": 17.15, "elapsed_time": "7:16:42", "remaining_time": "1 day, 11:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3077, "total_steps": 17941, "loss": 1.6682, "learning_rate": 9.400932608256381e-05, "epoch": 0.17150660498299983, "percentage": 17.15, "elapsed_time": "7:16:51", "remaining_time": "1 day, 11:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3078, "total_steps": 17941, "loss": 1.6889, "learning_rate": 9.400509918533798e-05, "epoch": 0.17156234323616298, "percentage": 17.16, "elapsed_time": "7:16:59", "remaining_time": "1 day, 11:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3079, "total_steps": 17941, "loss": 1.6925, "learning_rate": 9.400087089252695e-05, "epoch": 0.1716180814893261, "percentage": 17.16, "elapsed_time": "7:17:08", "remaining_time": "1 day, 11:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3080, "total_steps": 17941, "loss": 1.4425, "learning_rate": 9.399664120426484e-05, "epoch": 0.17167381974248927, "percentage": 17.17, "elapsed_time": "7:17:16", "remaining_time": "1 day, 11:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3081, "total_steps": 17941, "loss": 1.6485, "learning_rate": 9.39924101206858e-05, "epoch": 0.17172955799565243, "percentage": 17.17, "elapsed_time": "7:17:25", "remaining_time": "1 day, 11:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3082, "total_steps": 17941, "loss": 1.835, "learning_rate": 9.3988177641924e-05, "epoch": 0.17178529624881556, "percentage": 17.18, "elapsed_time": "7:17:33", "remaining_time": "1 day, 11:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3083, "total_steps": 17941, "loss": 1.7104, "learning_rate": 9.398394376811368e-05, "epoch": 0.1718410345019787, "percentage": 17.18, "elapsed_time": "7:17:42", "remaining_time": "1 day, 11:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3084, "total_steps": 17941, "loss": 1.5808, "learning_rate": 9.397970849938911e-05, "epoch": 0.17189677275514184, "percentage": 17.19, "elapsed_time": "7:17:50", "remaining_time": "1 day, 11:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3085, "total_steps": 17941, "loss": 1.771, "learning_rate": 9.39754718358846e-05, "epoch": 0.171952511008305, "percentage": 17.2, "elapsed_time": "7:17:59", "remaining_time": "1 day, 11:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3086, "total_steps": 17941, "loss": 1.8713, "learning_rate": 9.397123377773451e-05, "epoch": 0.17200824926146815, "percentage": 17.2, "elapsed_time": "7:18:07", "remaining_time": "1 day, 11:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3087, "total_steps": 17941, "loss": 1.5279, "learning_rate": 9.396699432507325e-05, "epoch": 0.17206398751463128, "percentage": 17.21, "elapsed_time": "7:18:16", "remaining_time": "1 day, 11:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3088, "total_steps": 17941, "loss": 1.8924, "learning_rate": 9.396275347803529e-05, "epoch": 0.17211972576779444, "percentage": 17.21, "elapsed_time": "7:18:25", "remaining_time": "1 day, 11:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3089, "total_steps": 17941, "loss": 1.7562, "learning_rate": 9.395851123675512e-05, "epoch": 0.1721754640209576, "percentage": 17.22, "elapsed_time": "7:18:33", "remaining_time": "1 day, 11:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3090, "total_steps": 17941, "loss": 1.599, "learning_rate": 9.395426760136726e-05, "epoch": 0.17223120227412073, "percentage": 17.22, "elapsed_time": "7:18:42", "remaining_time": "1 day, 11:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3091, "total_steps": 17941, "loss": 1.7657, "learning_rate": 9.39500225720063e-05, "epoch": 0.17228694052728388, "percentage": 17.23, "elapsed_time": "7:18:50", "remaining_time": "1 day, 11:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3092, "total_steps": 17941, "loss": 1.684, "learning_rate": 9.394577614880687e-05, "epoch": 0.172342678780447, "percentage": 17.23, "elapsed_time": "7:18:58", "remaining_time": "1 day, 11:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3093, "total_steps": 17941, "loss": 1.8619, "learning_rate": 9.394152833190364e-05, "epoch": 0.17239841703361017, "percentage": 17.24, "elapsed_time": "7:19:07", "remaining_time": "1 day, 11:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3094, "total_steps": 17941, "loss": 1.6454, "learning_rate": 9.393727912143134e-05, "epoch": 0.17245415528677333, "percentage": 17.25, "elapsed_time": "7:19:16", "remaining_time": "1 day, 11:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3095, "total_steps": 17941, "loss": 1.6498, "learning_rate": 9.39330285175247e-05, "epoch": 0.17250989353993645, "percentage": 17.25, "elapsed_time": "7:19:24", "remaining_time": "1 day, 11:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3096, "total_steps": 17941, "loss": 1.8345, "learning_rate": 9.392877652031855e-05, "epoch": 0.1725656317930996, "percentage": 17.26, "elapsed_time": "7:19:33", "remaining_time": "1 day, 11:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3097, "total_steps": 17941, "loss": 1.5056, "learning_rate": 9.392452312994773e-05, "epoch": 0.17262137004626274, "percentage": 17.26, "elapsed_time": "7:19:41", "remaining_time": "1 day, 11:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3098, "total_steps": 17941, "loss": 1.5868, "learning_rate": 9.392026834654714e-05, "epoch": 0.1726771082994259, "percentage": 17.27, "elapsed_time": "7:19:50", "remaining_time": "1 day, 11:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3099, "total_steps": 17941, "loss": 1.8988, "learning_rate": 9.39160121702517e-05, "epoch": 0.17273284655258905, "percentage": 17.27, "elapsed_time": "7:19:58", "remaining_time": "1 day, 11:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3100, "total_steps": 17941, "loss": 1.7228, "learning_rate": 9.391175460119642e-05, "epoch": 0.17278858480575218, "percentage": 17.28, "elapsed_time": "7:20:07", "remaining_time": "1 day, 11:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3101, "total_steps": 17941, "loss": 1.6436, "learning_rate": 9.39074956395163e-05, "epoch": 0.17284432305891534, "percentage": 17.28, "elapsed_time": "7:20:15", "remaining_time": "1 day, 11:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3102, "total_steps": 17941, "loss": 1.498, "learning_rate": 9.390323528534641e-05, "epoch": 0.17290006131207847, "percentage": 17.29, "elapsed_time": "7:20:24", "remaining_time": "1 day, 11:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3103, "total_steps": 17941, "loss": 1.6834, "learning_rate": 9.389897353882188e-05, "epoch": 0.17295579956524162, "percentage": 17.3, "elapsed_time": "7:20:33", "remaining_time": "1 day, 11:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3104, "total_steps": 17941, "loss": 1.4012, "learning_rate": 9.389471040007784e-05, "epoch": 0.17301153781840478, "percentage": 17.3, "elapsed_time": "7:20:42", "remaining_time": "1 day, 11:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3105, "total_steps": 17941, "loss": 1.7005, "learning_rate": 9.389044586924953e-05, "epoch": 0.1730672760715679, "percentage": 17.31, "elapsed_time": "7:20:50", "remaining_time": "1 day, 11:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3106, "total_steps": 17941, "loss": 1.6934, "learning_rate": 9.388617994647218e-05, "epoch": 0.17312301432473107, "percentage": 17.31, "elapsed_time": "7:20:59", "remaining_time": "1 day, 11:06:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3107, "total_steps": 17941, "loss": 1.5041, "learning_rate": 9.388191263188107e-05, "epoch": 0.1731787525778942, "percentage": 17.32, "elapsed_time": "7:21:07", "remaining_time": "1 day, 11:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3108, "total_steps": 17941, "loss": 1.6184, "learning_rate": 9.387764392561153e-05, "epoch": 0.17323449083105735, "percentage": 17.32, "elapsed_time": "7:21:15", "remaining_time": "1 day, 11:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3109, "total_steps": 17941, "loss": 1.8302, "learning_rate": 9.387337382779894e-05, "epoch": 0.1732902290842205, "percentage": 17.33, "elapsed_time": "7:21:24", "remaining_time": "1 day, 11:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3110, "total_steps": 17941, "loss": 1.6565, "learning_rate": 9.386910233857875e-05, "epoch": 0.17334596733738364, "percentage": 17.33, "elapsed_time": "7:21:32", "remaining_time": "1 day, 11:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3111, "total_steps": 17941, "loss": 1.5957, "learning_rate": 9.386482945808641e-05, "epoch": 0.1734017055905468, "percentage": 17.34, "elapsed_time": "7:21:41", "remaining_time": "1 day, 11:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3112, "total_steps": 17941, "loss": 1.7147, "learning_rate": 9.386055518645742e-05, "epoch": 0.17345744384370995, "percentage": 17.35, "elapsed_time": "7:21:49", "remaining_time": "1 day, 11:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3113, "total_steps": 17941, "loss": 2.0401, "learning_rate": 9.385627952382736e-05, "epoch": 0.17351318209687308, "percentage": 17.35, "elapsed_time": "7:21:58", "remaining_time": "1 day, 11:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3114, "total_steps": 17941, "loss": 1.9242, "learning_rate": 9.38520024703318e-05, "epoch": 0.17356892035003624, "percentage": 17.36, "elapsed_time": "7:22:06", "remaining_time": "1 day, 11:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3115, "total_steps": 17941, "loss": 1.689, "learning_rate": 9.38477240261064e-05, "epoch": 0.17362465860319937, "percentage": 17.36, "elapsed_time": "7:22:15", "remaining_time": "1 day, 11:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3116, "total_steps": 17941, "loss": 1.7896, "learning_rate": 9.384344419128684e-05, "epoch": 0.17368039685636252, "percentage": 17.37, "elapsed_time": "7:22:23", "remaining_time": "1 day, 11:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3117, "total_steps": 17941, "loss": 1.7828, "learning_rate": 9.383916296600886e-05, "epoch": 0.17373613510952568, "percentage": 17.37, "elapsed_time": "7:22:32", "remaining_time": "1 day, 11:04:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3118, "total_steps": 17941, "loss": 1.9487, "learning_rate": 9.383488035040821e-05, "epoch": 0.1737918733626888, "percentage": 17.38, "elapsed_time": "7:22:41", "remaining_time": "1 day, 11:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3119, "total_steps": 17941, "loss": 1.6792, "learning_rate": 9.383059634462077e-05, "epoch": 0.17384761161585197, "percentage": 17.38, "elapsed_time": "7:22:49", "remaining_time": "1 day, 11:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3120, "total_steps": 17941, "loss": 1.6627, "learning_rate": 9.382631094878234e-05, "epoch": 0.1739033498690151, "percentage": 17.39, "elapsed_time": "7:22:58", "remaining_time": "1 day, 11:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3121, "total_steps": 17941, "loss": 1.7446, "learning_rate": 9.382202416302885e-05, "epoch": 0.17395908812217825, "percentage": 17.4, "elapsed_time": "7:23:06", "remaining_time": "1 day, 11:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3122, "total_steps": 17941, "loss": 1.6078, "learning_rate": 9.381773598749626e-05, "epoch": 0.1740148263753414, "percentage": 17.4, "elapsed_time": "7:23:15", "remaining_time": "1 day, 11:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3123, "total_steps": 17941, "loss": 1.792, "learning_rate": 9.381344642232056e-05, "epoch": 0.17407056462850454, "percentage": 17.41, "elapsed_time": "7:23:24", "remaining_time": "1 day, 11:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3124, "total_steps": 17941, "loss": 1.788, "learning_rate": 9.380915546763778e-05, "epoch": 0.1741263028816677, "percentage": 17.41, "elapsed_time": "7:23:32", "remaining_time": "1 day, 11:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3125, "total_steps": 17941, "loss": 1.8515, "learning_rate": 9.380486312358402e-05, "epoch": 0.17418204113483082, "percentage": 17.42, "elapsed_time": "7:23:41", "remaining_time": "1 day, 11:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3126, "total_steps": 17941, "loss": 1.5184, "learning_rate": 9.380056939029541e-05, "epoch": 0.17423777938799398, "percentage": 17.42, "elapsed_time": "7:23:50", "remaining_time": "1 day, 11:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3127, "total_steps": 17941, "loss": 1.8659, "learning_rate": 9.379627426790812e-05, "epoch": 0.17429351764115714, "percentage": 17.43, "elapsed_time": "7:23:58", "remaining_time": "1 day, 11:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3128, "total_steps": 17941, "loss": 1.7891, "learning_rate": 9.379197775655833e-05, "epoch": 0.17434925589432027, "percentage": 17.43, "elapsed_time": "7:24:07", "remaining_time": "1 day, 11:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3129, "total_steps": 17941, "loss": 1.4975, "learning_rate": 9.378767985638235e-05, "epoch": 0.17440499414748342, "percentage": 17.44, "elapsed_time": "7:24:16", "remaining_time": "1 day, 11:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3130, "total_steps": 17941, "loss": 1.9019, "learning_rate": 9.378338056751647e-05, "epoch": 0.17446073240064655, "percentage": 17.45, "elapsed_time": "7:24:24", "remaining_time": "1 day, 11:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3131, "total_steps": 17941, "loss": 1.7563, "learning_rate": 9.377907989009702e-05, "epoch": 0.1745164706538097, "percentage": 17.45, "elapsed_time": "7:24:32", "remaining_time": "1 day, 11:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3132, "total_steps": 17941, "loss": 2.009, "learning_rate": 9.37747778242604e-05, "epoch": 0.17457220890697286, "percentage": 17.46, "elapsed_time": "7:24:41", "remaining_time": "1 day, 11:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3133, "total_steps": 17941, "loss": 1.8264, "learning_rate": 9.377047437014308e-05, "epoch": 0.174627947160136, "percentage": 17.46, "elapsed_time": "7:24:49", "remaining_time": "1 day, 11:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3134, "total_steps": 17941, "loss": 1.6131, "learning_rate": 9.376616952788149e-05, "epoch": 0.17468368541329915, "percentage": 17.47, "elapsed_time": "7:24:58", "remaining_time": "1 day, 11:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3135, "total_steps": 17941, "loss": 1.7159, "learning_rate": 9.376186329761219e-05, "epoch": 0.1747394236664623, "percentage": 17.47, "elapsed_time": "7:25:06", "remaining_time": "1 day, 11:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3136, "total_steps": 17941, "loss": 1.5203, "learning_rate": 9.375755567947173e-05, "epoch": 0.17479516191962544, "percentage": 17.48, "elapsed_time": "7:25:15", "remaining_time": "1 day, 11:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3137, "total_steps": 17941, "loss": 1.7154, "learning_rate": 9.375324667359673e-05, "epoch": 0.1748509001727886, "percentage": 17.49, "elapsed_time": "7:25:23", "remaining_time": "1 day, 11:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3138, "total_steps": 17941, "loss": 1.7277, "learning_rate": 9.374893628012384e-05, "epoch": 0.17490663842595172, "percentage": 17.49, "elapsed_time": "7:25:32", "remaining_time": "1 day, 11:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3139, "total_steps": 17941, "loss": 1.7931, "learning_rate": 9.374462449918976e-05, "epoch": 0.17496237667911488, "percentage": 17.5, "elapsed_time": "7:25:40", "remaining_time": "1 day, 11:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3140, "total_steps": 17941, "loss": 1.8076, "learning_rate": 9.374031133093124e-05, "epoch": 0.17501811493227803, "percentage": 17.5, "elapsed_time": "7:25:48", "remaining_time": "1 day, 11:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3141, "total_steps": 17941, "loss": 1.7212, "learning_rate": 9.373599677548508e-05, "epoch": 0.17507385318544116, "percentage": 17.51, "elapsed_time": "7:25:57", "remaining_time": "1 day, 11:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3142, "total_steps": 17941, "loss": 1.9175, "learning_rate": 9.373168083298809e-05, "epoch": 0.17512959143860432, "percentage": 17.51, "elapsed_time": "7:26:05", "remaining_time": "1 day, 11:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3143, "total_steps": 17941, "loss": 1.842, "learning_rate": 9.372736350357717e-05, "epoch": 0.17518532969176745, "percentage": 17.52, "elapsed_time": "7:26:14", "remaining_time": "1 day, 11:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3144, "total_steps": 17941, "loss": 1.8881, "learning_rate": 9.372304478738922e-05, "epoch": 0.1752410679449306, "percentage": 17.52, "elapsed_time": "7:26:22", "remaining_time": "1 day, 11:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3145, "total_steps": 17941, "loss": 1.7381, "learning_rate": 9.371872468456122e-05, "epoch": 0.17529680619809376, "percentage": 17.53, "elapsed_time": "7:26:31", "remaining_time": "1 day, 11:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3146, "total_steps": 17941, "loss": 1.745, "learning_rate": 9.371440319523016e-05, "epoch": 0.1753525444512569, "percentage": 17.54, "elapsed_time": "7:26:39", "remaining_time": "1 day, 11:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3147, "total_steps": 17941, "loss": 1.8071, "learning_rate": 9.37100803195331e-05, "epoch": 0.17540828270442005, "percentage": 17.54, "elapsed_time": "7:26:48", "remaining_time": "1 day, 11:00:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3148, "total_steps": 17941, "loss": 1.8659, "learning_rate": 9.370575605760716e-05, "epoch": 0.17546402095758318, "percentage": 17.55, "elapsed_time": "7:26:56", "remaining_time": "1 day, 11:00:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3149, "total_steps": 17941, "loss": 1.5791, "learning_rate": 9.370143040958943e-05, "epoch": 0.17551975921074633, "percentage": 17.55, "elapsed_time": "7:27:04", "remaining_time": "1 day, 11:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3150, "total_steps": 17941, "loss": 1.7657, "learning_rate": 9.369710337561714e-05, "epoch": 0.1755754974639095, "percentage": 17.56, "elapsed_time": "7:27:13", "remaining_time": "1 day, 10:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3151, "total_steps": 17941, "loss": 2.0541, "learning_rate": 9.36927749558275e-05, "epoch": 0.17563123571707262, "percentage": 17.56, "elapsed_time": "7:27:21", "remaining_time": "1 day, 10:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3152, "total_steps": 17941, "loss": 1.762, "learning_rate": 9.368844515035779e-05, "epoch": 0.17568697397023578, "percentage": 17.57, "elapsed_time": "7:27:30", "remaining_time": "1 day, 10:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3153, "total_steps": 17941, "loss": 1.5928, "learning_rate": 9.368411395934533e-05, "epoch": 0.1757427122233989, "percentage": 17.57, "elapsed_time": "7:27:38", "remaining_time": "1 day, 10:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3154, "total_steps": 17941, "loss": 1.9292, "learning_rate": 9.367978138292747e-05, "epoch": 0.17579845047656206, "percentage": 17.58, "elapsed_time": "7:27:47", "remaining_time": "1 day, 10:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3155, "total_steps": 17941, "loss": 1.8832, "learning_rate": 9.36754474212416e-05, "epoch": 0.17585418872972522, "percentage": 17.59, "elapsed_time": "7:27:55", "remaining_time": "1 day, 10:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3156, "total_steps": 17941, "loss": 1.4679, "learning_rate": 9.36711120744252e-05, "epoch": 0.17590992698288835, "percentage": 17.59, "elapsed_time": "7:28:03", "remaining_time": "1 day, 10:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3157, "total_steps": 17941, "loss": 1.7744, "learning_rate": 9.366677534261572e-05, "epoch": 0.1759656652360515, "percentage": 17.6, "elapsed_time": "7:28:12", "remaining_time": "1 day, 10:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3158, "total_steps": 17941, "loss": 1.8169, "learning_rate": 9.366243722595074e-05, "epoch": 0.17602140348921466, "percentage": 17.6, "elapsed_time": "7:28:21", "remaining_time": "1 day, 10:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3159, "total_steps": 17941, "loss": 1.8714, "learning_rate": 9.365809772456782e-05, "epoch": 0.1760771417423778, "percentage": 17.61, "elapsed_time": "7:28:29", "remaining_time": "1 day, 10:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3160, "total_steps": 17941, "loss": 1.797, "learning_rate": 9.365375683860458e-05, "epoch": 0.17613287999554095, "percentage": 17.61, "elapsed_time": "7:28:38", "remaining_time": "1 day, 10:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3161, "total_steps": 17941, "loss": 1.8027, "learning_rate": 9.36494145681987e-05, "epoch": 0.17618861824870408, "percentage": 17.62, "elapsed_time": "7:28:47", "remaining_time": "1 day, 10:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3162, "total_steps": 17941, "loss": 1.7254, "learning_rate": 9.364507091348788e-05, "epoch": 0.17624435650186723, "percentage": 17.62, "elapsed_time": "7:28:55", "remaining_time": "1 day, 10:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3163, "total_steps": 17941, "loss": 1.7505, "learning_rate": 9.364072587460988e-05, "epoch": 0.1763000947550304, "percentage": 17.63, "elapsed_time": "7:29:04", "remaining_time": "1 day, 10:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3164, "total_steps": 17941, "loss": 1.7651, "learning_rate": 9.363637945170249e-05, "epoch": 0.17635583300819352, "percentage": 17.64, "elapsed_time": "7:29:12", "remaining_time": "1 day, 10:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3165, "total_steps": 17941, "loss": 1.7096, "learning_rate": 9.363203164490356e-05, "epoch": 0.17641157126135668, "percentage": 17.64, "elapsed_time": "7:29:21", "remaining_time": "1 day, 10:57:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3166, "total_steps": 17941, "loss": 2.0557, "learning_rate": 9.362768245435098e-05, "epoch": 0.1764673095145198, "percentage": 17.65, "elapsed_time": "7:29:30", "remaining_time": "1 day, 10:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3167, "total_steps": 17941, "loss": 1.6362, "learning_rate": 9.362333188018269e-05, "epoch": 0.17652304776768296, "percentage": 17.65, "elapsed_time": "7:29:38", "remaining_time": "1 day, 10:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3168, "total_steps": 17941, "loss": 1.6019, "learning_rate": 9.361897992253665e-05, "epoch": 0.17657878602084612, "percentage": 17.66, "elapsed_time": "7:29:47", "remaining_time": "1 day, 10:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3169, "total_steps": 17941, "loss": 1.7042, "learning_rate": 9.361462658155089e-05, "epoch": 0.17663452427400925, "percentage": 17.66, "elapsed_time": "7:29:55", "remaining_time": "1 day, 10:57:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3170, "total_steps": 17941, "loss": 1.7224, "learning_rate": 9.361027185736346e-05, "epoch": 0.1766902625271724, "percentage": 17.67, "elapsed_time": "7:30:04", "remaining_time": "1 day, 10:57:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3171, "total_steps": 17941, "loss": 1.6534, "learning_rate": 9.360591575011245e-05, "epoch": 0.17674600078033553, "percentage": 17.67, "elapsed_time": "7:30:12", "remaining_time": "1 day, 10:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3172, "total_steps": 17941, "loss": 1.8964, "learning_rate": 9.360155825993607e-05, "epoch": 0.1768017390334987, "percentage": 17.68, "elapsed_time": "7:30:21", "remaining_time": "1 day, 10:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3173, "total_steps": 17941, "loss": 1.7262, "learning_rate": 9.359719938697246e-05, "epoch": 0.17685747728666185, "percentage": 17.69, "elapsed_time": "7:30:29", "remaining_time": "1 day, 10:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3174, "total_steps": 17941, "loss": 1.7775, "learning_rate": 9.359283913135988e-05, "epoch": 0.17691321553982498, "percentage": 17.69, "elapsed_time": "7:30:38", "remaining_time": "1 day, 10:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3175, "total_steps": 17941, "loss": 1.9756, "learning_rate": 9.358847749323659e-05, "epoch": 0.17696895379298813, "percentage": 17.7, "elapsed_time": "7:30:46", "remaining_time": "1 day, 10:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3176, "total_steps": 17941, "loss": 1.7427, "learning_rate": 9.358411447274094e-05, "epoch": 0.17702469204615126, "percentage": 17.7, "elapsed_time": "7:30:54", "remaining_time": "1 day, 10:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3177, "total_steps": 17941, "loss": 1.8076, "learning_rate": 9.357975007001129e-05, "epoch": 0.17708043029931442, "percentage": 17.71, "elapsed_time": "7:31:03", "remaining_time": "1 day, 10:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3178, "total_steps": 17941, "loss": 1.6826, "learning_rate": 9.357538428518607e-05, "epoch": 0.17713616855247757, "percentage": 17.71, "elapsed_time": "7:31:11", "remaining_time": "1 day, 10:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3179, "total_steps": 17941, "loss": 1.6545, "learning_rate": 9.357101711840372e-05, "epoch": 0.1771919068056407, "percentage": 17.72, "elapsed_time": "7:31:20", "remaining_time": "1 day, 10:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3180, "total_steps": 17941, "loss": 1.4337, "learning_rate": 9.356664856980273e-05, "epoch": 0.17724764505880386, "percentage": 17.72, "elapsed_time": "7:31:28", "remaining_time": "1 day, 10:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3181, "total_steps": 17941, "loss": 1.7241, "learning_rate": 9.356227863952168e-05, "epoch": 0.17730338331196702, "percentage": 17.73, "elapsed_time": "7:31:37", "remaining_time": "1 day, 10:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3182, "total_steps": 17941, "loss": 1.5474, "learning_rate": 9.355790732769911e-05, "epoch": 0.17735912156513015, "percentage": 17.74, "elapsed_time": "7:31:45", "remaining_time": "1 day, 10:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3183, "total_steps": 17941, "loss": 1.5795, "learning_rate": 9.35535346344737e-05, "epoch": 0.1774148598182933, "percentage": 17.74, "elapsed_time": "7:31:54", "remaining_time": "1 day, 10:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3184, "total_steps": 17941, "loss": 1.8093, "learning_rate": 9.354916055998409e-05, "epoch": 0.17747059807145643, "percentage": 17.75, "elapsed_time": "7:32:02", "remaining_time": "1 day, 10:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3185, "total_steps": 17941, "loss": 2.0041, "learning_rate": 9.354478510436902e-05, "epoch": 0.1775263363246196, "percentage": 17.75, "elapsed_time": "7:32:10", "remaining_time": "1 day, 10:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3186, "total_steps": 17941, "loss": 1.7329, "learning_rate": 9.354040826776727e-05, "epoch": 0.17758207457778274, "percentage": 17.76, "elapsed_time": "7:32:19", "remaining_time": "1 day, 10:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3187, "total_steps": 17941, "loss": 1.7857, "learning_rate": 9.35360300503176e-05, "epoch": 0.17763781283094587, "percentage": 17.76, "elapsed_time": "7:32:27", "remaining_time": "1 day, 10:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3188, "total_steps": 17941, "loss": 1.7757, "learning_rate": 9.35316504521589e-05, "epoch": 0.17769355108410903, "percentage": 17.77, "elapsed_time": "7:32:36", "remaining_time": "1 day, 10:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3189, "total_steps": 17941, "loss": 1.7656, "learning_rate": 9.352726947343006e-05, "epoch": 0.17774928933727216, "percentage": 17.77, "elapsed_time": "7:32:44", "remaining_time": "1 day, 10:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3190, "total_steps": 17941, "loss": 1.7716, "learning_rate": 9.352288711427001e-05, "epoch": 0.17780502759043532, "percentage": 17.78, "elapsed_time": "7:32:53", "remaining_time": "1 day, 10:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3191, "total_steps": 17941, "loss": 1.7623, "learning_rate": 9.351850337481773e-05, "epoch": 0.17786076584359847, "percentage": 17.79, "elapsed_time": "7:33:01", "remaining_time": "1 day, 10:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3192, "total_steps": 17941, "loss": 1.7835, "learning_rate": 9.351411825521228e-05, "epoch": 0.1779165040967616, "percentage": 17.79, "elapsed_time": "7:33:10", "remaining_time": "1 day, 10:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3193, "total_steps": 17941, "loss": 1.9064, "learning_rate": 9.350973175559267e-05, "epoch": 0.17797224234992476, "percentage": 17.8, "elapsed_time": "7:33:18", "remaining_time": "1 day, 10:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3194, "total_steps": 17941, "loss": 1.7245, "learning_rate": 9.350534387609807e-05, "epoch": 0.1780279806030879, "percentage": 17.8, "elapsed_time": "7:33:26", "remaining_time": "1 day, 10:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3195, "total_steps": 17941, "loss": 1.6991, "learning_rate": 9.35009546168676e-05, "epoch": 0.17808371885625104, "percentage": 17.81, "elapsed_time": "7:33:35", "remaining_time": "1 day, 10:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3196, "total_steps": 17941, "loss": 1.747, "learning_rate": 9.34965639780405e-05, "epoch": 0.1781394571094142, "percentage": 17.81, "elapsed_time": "7:33:43", "remaining_time": "1 day, 10:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3197, "total_steps": 17941, "loss": 1.8114, "learning_rate": 9.349217195975598e-05, "epoch": 0.17819519536257733, "percentage": 17.82, "elapsed_time": "7:33:52", "remaining_time": "1 day, 10:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3198, "total_steps": 17941, "loss": 1.7719, "learning_rate": 9.348777856215334e-05, "epoch": 0.1782509336157405, "percentage": 17.83, "elapsed_time": "7:34:00", "remaining_time": "1 day, 10:53:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3199, "total_steps": 17941, "loss": 1.7989, "learning_rate": 9.348338378537192e-05, "epoch": 0.17830667186890362, "percentage": 17.83, "elapsed_time": "7:34:09", "remaining_time": "1 day, 10:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3200, "total_steps": 17941, "loss": 1.5998, "learning_rate": 9.347898762955109e-05, "epoch": 0.17836241012206677, "percentage": 17.84, "elapsed_time": "7:34:17", "remaining_time": "1 day, 10:52:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3201, "total_steps": 17941, "loss": 1.7352, "learning_rate": 9.347459009483028e-05, "epoch": 0.17841814837522993, "percentage": 17.84, "elapsed_time": "7:34:26", "remaining_time": "1 day, 10:52:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3202, "total_steps": 17941, "loss": 1.8595, "learning_rate": 9.347019118134893e-05, "epoch": 0.17847388662839306, "percentage": 17.85, "elapsed_time": "7:34:34", "remaining_time": "1 day, 10:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3203, "total_steps": 17941, "loss": 1.8312, "learning_rate": 9.346579088924658e-05, "epoch": 0.17852962488155621, "percentage": 17.85, "elapsed_time": "7:34:43", "remaining_time": "1 day, 10:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3204, "total_steps": 17941, "loss": 1.9124, "learning_rate": 9.346138921866276e-05, "epoch": 0.17858536313471937, "percentage": 17.86, "elapsed_time": "7:34:51", "remaining_time": "1 day, 10:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3205, "total_steps": 17941, "loss": 1.8279, "learning_rate": 9.345698616973707e-05, "epoch": 0.1786411013878825, "percentage": 17.86, "elapsed_time": "7:35:00", "remaining_time": "1 day, 10:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3206, "total_steps": 17941, "loss": 1.8218, "learning_rate": 9.345258174260915e-05, "epoch": 0.17869683964104566, "percentage": 17.87, "elapsed_time": "7:35:09", "remaining_time": "1 day, 10:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3207, "total_steps": 17941, "loss": 1.6772, "learning_rate": 9.344817593741868e-05, "epoch": 0.1787525778942088, "percentage": 17.88, "elapsed_time": "7:35:18", "remaining_time": "1 day, 10:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3208, "total_steps": 17941, "loss": 1.8402, "learning_rate": 9.344376875430539e-05, "epoch": 0.17880831614737194, "percentage": 17.88, "elapsed_time": "7:35:26", "remaining_time": "1 day, 10:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3209, "total_steps": 17941, "loss": 2.0245, "learning_rate": 9.343936019340906e-05, "epoch": 0.1788640544005351, "percentage": 17.89, "elapsed_time": "7:35:35", "remaining_time": "1 day, 10:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3210, "total_steps": 17941, "loss": 1.7243, "learning_rate": 9.343495025486948e-05, "epoch": 0.17891979265369823, "percentage": 17.89, "elapsed_time": "7:35:43", "remaining_time": "1 day, 10:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3211, "total_steps": 17941, "loss": 1.8062, "learning_rate": 9.343053893882654e-05, "epoch": 0.17897553090686139, "percentage": 17.9, "elapsed_time": "7:35:52", "remaining_time": "1 day, 10:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3212, "total_steps": 17941, "loss": 1.9111, "learning_rate": 9.34261262454201e-05, "epoch": 0.17903126916002451, "percentage": 17.9, "elapsed_time": "7:36:01", "remaining_time": "1 day, 10:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3213, "total_steps": 17941, "loss": 1.892, "learning_rate": 9.342171217479014e-05, "epoch": 0.17908700741318767, "percentage": 17.91, "elapsed_time": "7:36:09", "remaining_time": "1 day, 10:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3214, "total_steps": 17941, "loss": 1.7303, "learning_rate": 9.341729672707664e-05, "epoch": 0.17914274566635083, "percentage": 17.91, "elapsed_time": "7:36:18", "remaining_time": "1 day, 10:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3215, "total_steps": 17941, "loss": 1.5011, "learning_rate": 9.341287990241962e-05, "epoch": 0.17919848391951396, "percentage": 17.92, "elapsed_time": "7:36:26", "remaining_time": "1 day, 10:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3216, "total_steps": 17941, "loss": 1.8355, "learning_rate": 9.340846170095917e-05, "epoch": 0.1792542221726771, "percentage": 17.93, "elapsed_time": "7:36:34", "remaining_time": "1 day, 10:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3217, "total_steps": 17941, "loss": 1.8892, "learning_rate": 9.34040421228354e-05, "epoch": 0.17930996042584024, "percentage": 17.93, "elapsed_time": "7:36:43", "remaining_time": "1 day, 10:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3218, "total_steps": 17941, "loss": 1.6359, "learning_rate": 9.339962116818848e-05, "epoch": 0.1793656986790034, "percentage": 17.94, "elapsed_time": "7:36:52", "remaining_time": "1 day, 10:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3219, "total_steps": 17941, "loss": 1.7594, "learning_rate": 9.339519883715862e-05, "epoch": 0.17942143693216656, "percentage": 17.94, "elapsed_time": "7:37:01", "remaining_time": "1 day, 10:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3220, "total_steps": 17941, "loss": 1.5873, "learning_rate": 9.339077512988606e-05, "epoch": 0.17947717518532968, "percentage": 17.95, "elapsed_time": "7:37:09", "remaining_time": "1 day, 10:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3221, "total_steps": 17941, "loss": 1.6675, "learning_rate": 9.338635004651108e-05, "epoch": 0.17953291343849284, "percentage": 17.95, "elapsed_time": "7:37:18", "remaining_time": "1 day, 10:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3222, "total_steps": 17941, "loss": 1.8268, "learning_rate": 9.338192358717406e-05, "epoch": 0.17958865169165597, "percentage": 17.96, "elapsed_time": "7:37:27", "remaining_time": "1 day, 10:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3223, "total_steps": 17941, "loss": 1.6647, "learning_rate": 9.337749575201535e-05, "epoch": 0.17964438994481913, "percentage": 17.96, "elapsed_time": "7:37:35", "remaining_time": "1 day, 10:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3224, "total_steps": 17941, "loss": 1.7202, "learning_rate": 9.337306654117538e-05, "epoch": 0.17970012819798228, "percentage": 17.97, "elapsed_time": "7:37:44", "remaining_time": "1 day, 10:49:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3225, "total_steps": 17941, "loss": 1.4645, "learning_rate": 9.336863595479462e-05, "epoch": 0.1797558664511454, "percentage": 17.98, "elapsed_time": "7:37:52", "remaining_time": "1 day, 10:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3226, "total_steps": 17941, "loss": 1.8443, "learning_rate": 9.33642039930136e-05, "epoch": 0.17981160470430857, "percentage": 17.98, "elapsed_time": "7:38:00", "remaining_time": "1 day, 10:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3227, "total_steps": 17941, "loss": 1.98, "learning_rate": 9.335977065597285e-05, "epoch": 0.17986734295747173, "percentage": 17.99, "elapsed_time": "7:38:09", "remaining_time": "1 day, 10:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3228, "total_steps": 17941, "loss": 1.5549, "learning_rate": 9.335533594381297e-05, "epoch": 0.17992308121063486, "percentage": 17.99, "elapsed_time": "7:38:18", "remaining_time": "1 day, 10:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3229, "total_steps": 17941, "loss": 1.5479, "learning_rate": 9.335089985667463e-05, "epoch": 0.179978819463798, "percentage": 18.0, "elapsed_time": "7:38:26", "remaining_time": "1 day, 10:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3230, "total_steps": 17941, "loss": 1.7899, "learning_rate": 9.334646239469848e-05, "epoch": 0.18003455771696114, "percentage": 18.0, "elapsed_time": "7:38:34", "remaining_time": "1 day, 10:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3231, "total_steps": 17941, "loss": 1.7351, "learning_rate": 9.334202355802528e-05, "epoch": 0.1800902959701243, "percentage": 18.01, "elapsed_time": "7:38:43", "remaining_time": "1 day, 10:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3232, "total_steps": 17941, "loss": 1.6461, "learning_rate": 9.333758334679581e-05, "epoch": 0.18014603422328745, "percentage": 18.01, "elapsed_time": "7:38:52", "remaining_time": "1 day, 10:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3233, "total_steps": 17941, "loss": 1.6368, "learning_rate": 9.333314176115084e-05, "epoch": 0.18020177247645058, "percentage": 18.02, "elapsed_time": "7:39:00", "remaining_time": "1 day, 10:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3234, "total_steps": 17941, "loss": 2.0446, "learning_rate": 9.33286988012313e-05, "epoch": 0.18025751072961374, "percentage": 18.03, "elapsed_time": "7:39:08", "remaining_time": "1 day, 10:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3235, "total_steps": 17941, "loss": 1.8455, "learning_rate": 9.332425446717803e-05, "epoch": 0.18031324898277687, "percentage": 18.03, "elapsed_time": "7:39:17", "remaining_time": "1 day, 10:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3236, "total_steps": 17941, "loss": 1.4925, "learning_rate": 9.331980875913202e-05, "epoch": 0.18036898723594003, "percentage": 18.04, "elapsed_time": "7:39:25", "remaining_time": "1 day, 10:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3237, "total_steps": 17941, "loss": 1.7695, "learning_rate": 9.331536167723423e-05, "epoch": 0.18042472548910318, "percentage": 18.04, "elapsed_time": "7:39:34", "remaining_time": "1 day, 10:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3238, "total_steps": 17941, "loss": 1.8594, "learning_rate": 9.331091322162573e-05, "epoch": 0.1804804637422663, "percentage": 18.05, "elapsed_time": "7:39:42", "remaining_time": "1 day, 10:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3239, "total_steps": 17941, "loss": 1.8194, "learning_rate": 9.330646339244759e-05, "epoch": 0.18053620199542947, "percentage": 18.05, "elapsed_time": "7:39:51", "remaining_time": "1 day, 10:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3240, "total_steps": 17941, "loss": 1.6584, "learning_rate": 9.330201218984092e-05, "epoch": 0.1805919402485926, "percentage": 18.06, "elapsed_time": "7:39:59", "remaining_time": "1 day, 10:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3241, "total_steps": 17941, "loss": 1.757, "learning_rate": 9.329755961394688e-05, "epoch": 0.18064767850175575, "percentage": 18.06, "elapsed_time": "7:40:08", "remaining_time": "1 day, 10:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3242, "total_steps": 17941, "loss": 1.6786, "learning_rate": 9.32931056649067e-05, "epoch": 0.1807034167549189, "percentage": 18.07, "elapsed_time": "7:40:17", "remaining_time": "1 day, 10:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3243, "total_steps": 17941, "loss": 1.457, "learning_rate": 9.328865034286161e-05, "epoch": 0.18075915500808204, "percentage": 18.08, "elapsed_time": "7:40:25", "remaining_time": "1 day, 10:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3244, "total_steps": 17941, "loss": 1.691, "learning_rate": 9.328419364795295e-05, "epoch": 0.1808148932612452, "percentage": 18.08, "elapsed_time": "7:40:34", "remaining_time": "1 day, 10:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3245, "total_steps": 17941, "loss": 1.6702, "learning_rate": 9.327973558032201e-05, "epoch": 0.18087063151440833, "percentage": 18.09, "elapsed_time": "7:40:42", "remaining_time": "1 day, 10:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3246, "total_steps": 17941, "loss": 1.6912, "learning_rate": 9.32752761401102e-05, "epoch": 0.18092636976757148, "percentage": 18.09, "elapsed_time": "7:40:50", "remaining_time": "1 day, 10:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3247, "total_steps": 17941, "loss": 1.7894, "learning_rate": 9.327081532745896e-05, "epoch": 0.18098210802073464, "percentage": 18.1, "elapsed_time": "7:40:59", "remaining_time": "1 day, 10:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3248, "total_steps": 17941, "loss": 2.0331, "learning_rate": 9.326635314250971e-05, "epoch": 0.18103784627389777, "percentage": 18.1, "elapsed_time": "7:41:08", "remaining_time": "1 day, 10:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3249, "total_steps": 17941, "loss": 1.8261, "learning_rate": 9.326188958540403e-05, "epoch": 0.18109358452706092, "percentage": 18.11, "elapsed_time": "7:41:16", "remaining_time": "1 day, 10:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3250, "total_steps": 17941, "loss": 1.5244, "learning_rate": 9.325742465628342e-05, "epoch": 0.18114932278022408, "percentage": 18.11, "elapsed_time": "7:41:25", "remaining_time": "1 day, 10:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3251, "total_steps": 17941, "loss": 1.8512, "learning_rate": 9.325295835528953e-05, "epoch": 0.1812050610333872, "percentage": 18.12, "elapsed_time": "7:41:34", "remaining_time": "1 day, 10:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3252, "total_steps": 17941, "loss": 1.8405, "learning_rate": 9.324849068256397e-05, "epoch": 0.18126079928655037, "percentage": 18.13, "elapsed_time": "7:41:42", "remaining_time": "1 day, 10:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3253, "total_steps": 17941, "loss": 1.7193, "learning_rate": 9.324402163824846e-05, "epoch": 0.1813165375397135, "percentage": 18.13, "elapsed_time": "7:41:51", "remaining_time": "1 day, 10:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3254, "total_steps": 17941, "loss": 1.6715, "learning_rate": 9.323955122248468e-05, "epoch": 0.18137227579287665, "percentage": 18.14, "elapsed_time": "7:41:59", "remaining_time": "1 day, 10:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3255, "total_steps": 17941, "loss": 1.5796, "learning_rate": 9.323507943541447e-05, "epoch": 0.1814280140460398, "percentage": 18.14, "elapsed_time": "7:42:08", "remaining_time": "1 day, 10:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3256, "total_steps": 17941, "loss": 1.7856, "learning_rate": 9.323060627717961e-05, "epoch": 0.18148375229920294, "percentage": 18.15, "elapsed_time": "7:42:16", "remaining_time": "1 day, 10:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3257, "total_steps": 17941, "loss": 1.7715, "learning_rate": 9.322613174792197e-05, "epoch": 0.1815394905523661, "percentage": 18.15, "elapsed_time": "7:42:25", "remaining_time": "1 day, 10:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3258, "total_steps": 17941, "loss": 1.9437, "learning_rate": 9.322165584778347e-05, "epoch": 0.18159522880552922, "percentage": 18.16, "elapsed_time": "7:42:33", "remaining_time": "1 day, 10:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3259, "total_steps": 17941, "loss": 1.5789, "learning_rate": 9.321717857690601e-05, "epoch": 0.18165096705869238, "percentage": 18.17, "elapsed_time": "7:42:42", "remaining_time": "1 day, 10:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3260, "total_steps": 17941, "loss": 1.7718, "learning_rate": 9.321269993543166e-05, "epoch": 0.18170670531185554, "percentage": 18.17, "elapsed_time": "7:42:51", "remaining_time": "1 day, 10:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3261, "total_steps": 17941, "loss": 1.6088, "learning_rate": 9.320821992350239e-05, "epoch": 0.18176244356501867, "percentage": 18.18, "elapsed_time": "7:43:00", "remaining_time": "1 day, 10:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3262, "total_steps": 17941, "loss": 1.6355, "learning_rate": 9.320373854126032e-05, "epoch": 0.18181818181818182, "percentage": 18.18, "elapsed_time": "7:43:08", "remaining_time": "1 day, 10:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3263, "total_steps": 17941, "loss": 1.8282, "learning_rate": 9.319925578884754e-05, "epoch": 0.18187392007134495, "percentage": 18.19, "elapsed_time": "7:43:17", "remaining_time": "1 day, 10:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3264, "total_steps": 17941, "loss": 1.8765, "learning_rate": 9.319477166640626e-05, "epoch": 0.1819296583245081, "percentage": 18.19, "elapsed_time": "7:43:25", "remaining_time": "1 day, 10:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3265, "total_steps": 17941, "loss": 1.7684, "learning_rate": 9.319028617407865e-05, "epoch": 0.18198539657767127, "percentage": 18.2, "elapsed_time": "7:43:33", "remaining_time": "1 day, 10:43:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3266, "total_steps": 17941, "loss": 1.9083, "learning_rate": 9.318579931200697e-05, "epoch": 0.1820411348308344, "percentage": 18.2, "elapsed_time": "7:43:42", "remaining_time": "1 day, 10:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3267, "total_steps": 17941, "loss": 1.6844, "learning_rate": 9.318131108033355e-05, "epoch": 0.18209687308399755, "percentage": 18.21, "elapsed_time": "7:43:50", "remaining_time": "1 day, 10:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3268, "total_steps": 17941, "loss": 1.9451, "learning_rate": 9.31768214792007e-05, "epoch": 0.18215261133716068, "percentage": 18.22, "elapsed_time": "7:43:59", "remaining_time": "1 day, 10:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3269, "total_steps": 17941, "loss": 1.7534, "learning_rate": 9.31723305087508e-05, "epoch": 0.18220834959032384, "percentage": 18.22, "elapsed_time": "7:44:07", "remaining_time": "1 day, 10:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3270, "total_steps": 17941, "loss": 1.876, "learning_rate": 9.316783816912629e-05, "epoch": 0.182264087843487, "percentage": 18.23, "elapsed_time": "7:44:16", "remaining_time": "1 day, 10:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3271, "total_steps": 17941, "loss": 1.7254, "learning_rate": 9.316334446046966e-05, "epoch": 0.18231982609665012, "percentage": 18.23, "elapsed_time": "7:44:24", "remaining_time": "1 day, 10:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3272, "total_steps": 17941, "loss": 1.6292, "learning_rate": 9.315884938292339e-05, "epoch": 0.18237556434981328, "percentage": 18.24, "elapsed_time": "7:44:32", "remaining_time": "1 day, 10:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3273, "total_steps": 17941, "loss": 2.0649, "learning_rate": 9.315435293663005e-05, "epoch": 0.18243130260297644, "percentage": 18.24, "elapsed_time": "7:44:41", "remaining_time": "1 day, 10:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3274, "total_steps": 17941, "loss": 1.8282, "learning_rate": 9.314985512173223e-05, "epoch": 0.18248704085613957, "percentage": 18.25, "elapsed_time": "7:44:49", "remaining_time": "1 day, 10:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3275, "total_steps": 17941, "loss": 1.7501, "learning_rate": 9.31453559383726e-05, "epoch": 0.18254277910930272, "percentage": 18.25, "elapsed_time": "7:44:58", "remaining_time": "1 day, 10:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3276, "total_steps": 17941, "loss": 1.7287, "learning_rate": 9.314085538669383e-05, "epoch": 0.18259851736246585, "percentage": 18.26, "elapsed_time": "7:45:07", "remaining_time": "1 day, 10:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3277, "total_steps": 17941, "loss": 1.6779, "learning_rate": 9.313635346683865e-05, "epoch": 0.182654255615629, "percentage": 18.27, "elapsed_time": "7:45:15", "remaining_time": "1 day, 10:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3278, "total_steps": 17941, "loss": 1.7884, "learning_rate": 9.313185017894985e-05, "epoch": 0.18270999386879216, "percentage": 18.27, "elapsed_time": "7:45:24", "remaining_time": "1 day, 10:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3279, "total_steps": 17941, "loss": 1.5747, "learning_rate": 9.312734552317023e-05, "epoch": 0.1827657321219553, "percentage": 18.28, "elapsed_time": "7:45:32", "remaining_time": "1 day, 10:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3280, "total_steps": 17941, "loss": 1.4992, "learning_rate": 9.312283949964267e-05, "epoch": 0.18282147037511845, "percentage": 18.28, "elapsed_time": "7:45:41", "remaining_time": "1 day, 10:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3281, "total_steps": 17941, "loss": 1.5226, "learning_rate": 9.311833210851007e-05, "epoch": 0.18287720862828158, "percentage": 18.29, "elapsed_time": "7:45:49", "remaining_time": "1 day, 10:41:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3282, "total_steps": 17941, "loss": 1.6106, "learning_rate": 9.311382334991536e-05, "epoch": 0.18293294688144474, "percentage": 18.29, "elapsed_time": "7:45:57", "remaining_time": "1 day, 10:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3283, "total_steps": 17941, "loss": 1.9531, "learning_rate": 9.310931322400156e-05, "epoch": 0.1829886851346079, "percentage": 18.3, "elapsed_time": "7:46:06", "remaining_time": "1 day, 10:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3284, "total_steps": 17941, "loss": 1.9566, "learning_rate": 9.310480173091168e-05, "epoch": 0.18304442338777102, "percentage": 18.3, "elapsed_time": "7:46:14", "remaining_time": "1 day, 10:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3285, "total_steps": 17941, "loss": 1.8004, "learning_rate": 9.31002888707888e-05, "epoch": 0.18310016164093418, "percentage": 18.31, "elapsed_time": "7:46:23", "remaining_time": "1 day, 10:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3286, "total_steps": 17941, "loss": 1.8203, "learning_rate": 9.309577464377606e-05, "epoch": 0.1831558998940973, "percentage": 18.32, "elapsed_time": "7:46:31", "remaining_time": "1 day, 10:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3287, "total_steps": 17941, "loss": 1.8127, "learning_rate": 9.309125905001659e-05, "epoch": 0.18321163814726046, "percentage": 18.32, "elapsed_time": "7:46:40", "remaining_time": "1 day, 10:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3288, "total_steps": 17941, "loss": 1.5432, "learning_rate": 9.308674208965364e-05, "epoch": 0.18326737640042362, "percentage": 18.33, "elapsed_time": "7:46:49", "remaining_time": "1 day, 10:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3289, "total_steps": 17941, "loss": 1.853, "learning_rate": 9.308222376283045e-05, "epoch": 0.18332311465358675, "percentage": 18.33, "elapsed_time": "7:46:58", "remaining_time": "1 day, 10:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3290, "total_steps": 17941, "loss": 1.531, "learning_rate": 9.30777040696903e-05, "epoch": 0.1833788529067499, "percentage": 18.34, "elapsed_time": "7:47:06", "remaining_time": "1 day, 10:40:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3291, "total_steps": 17941, "loss": 2.0149, "learning_rate": 9.307318301037656e-05, "epoch": 0.18343459115991304, "percentage": 18.34, "elapsed_time": "7:47:15", "remaining_time": "1 day, 10:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3292, "total_steps": 17941, "loss": 1.6388, "learning_rate": 9.306866058503257e-05, "epoch": 0.1834903294130762, "percentage": 18.35, "elapsed_time": "7:47:23", "remaining_time": "1 day, 10:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3293, "total_steps": 17941, "loss": 1.8719, "learning_rate": 9.306413679380177e-05, "epoch": 0.18354606766623935, "percentage": 18.35, "elapsed_time": "7:47:32", "remaining_time": "1 day, 10:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3294, "total_steps": 17941, "loss": 1.7592, "learning_rate": 9.305961163682764e-05, "epoch": 0.18360180591940248, "percentage": 18.36, "elapsed_time": "7:47:40", "remaining_time": "1 day, 10:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3295, "total_steps": 17941, "loss": 1.834, "learning_rate": 9.305508511425367e-05, "epoch": 0.18365754417256563, "percentage": 18.37, "elapsed_time": "7:47:48", "remaining_time": "1 day, 10:39:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3296, "total_steps": 17941, "loss": 1.8606, "learning_rate": 9.305055722622344e-05, "epoch": 0.1837132824257288, "percentage": 18.37, "elapsed_time": "7:47:57", "remaining_time": "1 day, 10:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3297, "total_steps": 17941, "loss": 1.8952, "learning_rate": 9.304602797288054e-05, "epoch": 0.18376902067889192, "percentage": 18.38, "elapsed_time": "7:48:05", "remaining_time": "1 day, 10:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3298, "total_steps": 17941, "loss": 1.9215, "learning_rate": 9.30414973543686e-05, "epoch": 0.18382475893205508, "percentage": 18.38, "elapsed_time": "7:48:14", "remaining_time": "1 day, 10:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3299, "total_steps": 17941, "loss": 1.5506, "learning_rate": 9.303696537083132e-05, "epoch": 0.1838804971852182, "percentage": 18.39, "elapsed_time": "7:48:22", "remaining_time": "1 day, 10:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3300, "total_steps": 17941, "loss": 1.5003, "learning_rate": 9.303243202241242e-05, "epoch": 0.18393623543838136, "percentage": 18.39, "elapsed_time": "7:48:31", "remaining_time": "1 day, 10:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3301, "total_steps": 17941, "loss": 1.5837, "learning_rate": 9.302789730925567e-05, "epoch": 0.18399197369154452, "percentage": 18.4, "elapsed_time": "7:48:39", "remaining_time": "1 day, 10:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3302, "total_steps": 17941, "loss": 1.8285, "learning_rate": 9.30233612315049e-05, "epoch": 0.18404771194470765, "percentage": 18.4, "elapsed_time": "7:48:48", "remaining_time": "1 day, 10:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3303, "total_steps": 17941, "loss": 1.6032, "learning_rate": 9.301882378930394e-05, "epoch": 0.1841034501978708, "percentage": 18.41, "elapsed_time": "7:48:56", "remaining_time": "1 day, 10:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3304, "total_steps": 17941, "loss": 1.9998, "learning_rate": 9.301428498279671e-05, "epoch": 0.18415918845103393, "percentage": 18.42, "elapsed_time": "7:49:05", "remaining_time": "1 day, 10:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3305, "total_steps": 17941, "loss": 1.6816, "learning_rate": 9.300974481212715e-05, "epoch": 0.1842149267041971, "percentage": 18.42, "elapsed_time": "7:49:13", "remaining_time": "1 day, 10:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3306, "total_steps": 17941, "loss": 1.4649, "learning_rate": 9.300520327743924e-05, "epoch": 0.18427066495736025, "percentage": 18.43, "elapsed_time": "7:49:21", "remaining_time": "1 day, 10:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3307, "total_steps": 17941, "loss": 1.6704, "learning_rate": 9.300066037887704e-05, "epoch": 0.18432640321052338, "percentage": 18.43, "elapsed_time": "7:49:30", "remaining_time": "1 day, 10:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3308, "total_steps": 17941, "loss": 1.9368, "learning_rate": 9.29961161165846e-05, "epoch": 0.18438214146368653, "percentage": 18.44, "elapsed_time": "7:49:38", "remaining_time": "1 day, 10:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3309, "total_steps": 17941, "loss": 1.663, "learning_rate": 9.299157049070603e-05, "epoch": 0.18443787971684966, "percentage": 18.44, "elapsed_time": "7:49:47", "remaining_time": "1 day, 10:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3310, "total_steps": 17941, "loss": 1.6634, "learning_rate": 9.298702350138551e-05, "epoch": 0.18449361797001282, "percentage": 18.45, "elapsed_time": "7:49:55", "remaining_time": "1 day, 10:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3311, "total_steps": 17941, "loss": 1.7772, "learning_rate": 9.298247514876724e-05, "epoch": 0.18454935622317598, "percentage": 18.45, "elapsed_time": "7:50:04", "remaining_time": "1 day, 10:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3312, "total_steps": 17941, "loss": 1.7826, "learning_rate": 9.297792543299545e-05, "epoch": 0.1846050944763391, "percentage": 18.46, "elapsed_time": "7:50:12", "remaining_time": "1 day, 10:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3313, "total_steps": 17941, "loss": 2.0859, "learning_rate": 9.297337435421446e-05, "epoch": 0.18466083272950226, "percentage": 18.47, "elapsed_time": "7:50:21", "remaining_time": "1 day, 10:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3314, "total_steps": 17941, "loss": 1.6861, "learning_rate": 9.296882191256857e-05, "epoch": 0.1847165709826654, "percentage": 18.47, "elapsed_time": "7:50:29", "remaining_time": "1 day, 10:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3315, "total_steps": 17941, "loss": 1.6616, "learning_rate": 9.29642681082022e-05, "epoch": 0.18477230923582855, "percentage": 18.48, "elapsed_time": "7:50:37", "remaining_time": "1 day, 10:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3316, "total_steps": 17941, "loss": 1.8831, "learning_rate": 9.295971294125973e-05, "epoch": 0.1848280474889917, "percentage": 18.48, "elapsed_time": "7:50:47", "remaining_time": "1 day, 10:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3317, "total_steps": 17941, "loss": 1.6373, "learning_rate": 9.295515641188563e-05, "epoch": 0.18488378574215483, "percentage": 18.49, "elapsed_time": "7:50:55", "remaining_time": "1 day, 10:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3318, "total_steps": 17941, "loss": 1.6668, "learning_rate": 9.295059852022443e-05, "epoch": 0.184939523995318, "percentage": 18.49, "elapsed_time": "7:51:04", "remaining_time": "1 day, 10:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3319, "total_steps": 17941, "loss": 1.5566, "learning_rate": 9.294603926642064e-05, "epoch": 0.18499526224848115, "percentage": 18.5, "elapsed_time": "7:51:12", "remaining_time": "1 day, 10:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3320, "total_steps": 17941, "loss": 1.8183, "learning_rate": 9.294147865061891e-05, "epoch": 0.18505100050164427, "percentage": 18.51, "elapsed_time": "7:51:21", "remaining_time": "1 day, 10:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3321, "total_steps": 17941, "loss": 1.4792, "learning_rate": 9.293691667296382e-05, "epoch": 0.18510673875480743, "percentage": 18.51, "elapsed_time": "7:51:29", "remaining_time": "1 day, 10:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3322, "total_steps": 17941, "loss": 1.8202, "learning_rate": 9.293235333360009e-05, "epoch": 0.18516247700797056, "percentage": 18.52, "elapsed_time": "7:51:38", "remaining_time": "1 day, 10:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3323, "total_steps": 17941, "loss": 1.698, "learning_rate": 9.29277886326724e-05, "epoch": 0.18521821526113372, "percentage": 18.52, "elapsed_time": "7:51:46", "remaining_time": "1 day, 10:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3324, "total_steps": 17941, "loss": 1.8882, "learning_rate": 9.292322257032555e-05, "epoch": 0.18527395351429687, "percentage": 18.53, "elapsed_time": "7:51:55", "remaining_time": "1 day, 10:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3325, "total_steps": 17941, "loss": 1.8684, "learning_rate": 9.291865514670435e-05, "epoch": 0.18532969176746, "percentage": 18.53, "elapsed_time": "7:52:03", "remaining_time": "1 day, 10:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3326, "total_steps": 17941, "loss": 1.7726, "learning_rate": 9.291408636195364e-05, "epoch": 0.18538543002062316, "percentage": 18.54, "elapsed_time": "7:52:11", "remaining_time": "1 day, 10:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3327, "total_steps": 17941, "loss": 1.8152, "learning_rate": 9.29095162162183e-05, "epoch": 0.1854411682737863, "percentage": 18.54, "elapsed_time": "7:52:20", "remaining_time": "1 day, 10:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3328, "total_steps": 17941, "loss": 1.7364, "learning_rate": 9.290494470964332e-05, "epoch": 0.18549690652694945, "percentage": 18.55, "elapsed_time": "7:52:28", "remaining_time": "1 day, 10:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3329, "total_steps": 17941, "loss": 1.6331, "learning_rate": 9.290037184237362e-05, "epoch": 0.1855526447801126, "percentage": 18.56, "elapsed_time": "7:52:37", "remaining_time": "1 day, 10:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3330, "total_steps": 17941, "loss": 1.9186, "learning_rate": 9.289579761455426e-05, "epoch": 0.18560838303327573, "percentage": 18.56, "elapsed_time": "7:52:45", "remaining_time": "1 day, 10:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3331, "total_steps": 17941, "loss": 1.8436, "learning_rate": 9.289122202633029e-05, "epoch": 0.1856641212864389, "percentage": 18.57, "elapsed_time": "7:52:54", "remaining_time": "1 day, 10:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3332, "total_steps": 17941, "loss": 1.8193, "learning_rate": 9.288664507784686e-05, "epoch": 0.18571985953960202, "percentage": 18.57, "elapsed_time": "7:53:02", "remaining_time": "1 day, 10:34:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3333, "total_steps": 17941, "loss": 1.5945, "learning_rate": 9.288206676924906e-05, "epoch": 0.18577559779276517, "percentage": 18.58, "elapsed_time": "7:53:10", "remaining_time": "1 day, 10:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3334, "total_steps": 17941, "loss": 1.8746, "learning_rate": 9.287748710068214e-05, "epoch": 0.18583133604592833, "percentage": 18.58, "elapsed_time": "7:53:19", "remaining_time": "1 day, 10:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3335, "total_steps": 17941, "loss": 1.6635, "learning_rate": 9.287290607229131e-05, "epoch": 0.18588707429909146, "percentage": 18.59, "elapsed_time": "7:53:27", "remaining_time": "1 day, 10:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3336, "total_steps": 17941, "loss": 1.6587, "learning_rate": 9.286832368422187e-05, "epoch": 0.18594281255225462, "percentage": 18.59, "elapsed_time": "7:53:36", "remaining_time": "1 day, 10:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3337, "total_steps": 17941, "loss": 1.8244, "learning_rate": 9.286373993661916e-05, "epoch": 0.18599855080541774, "percentage": 18.6, "elapsed_time": "7:53:44", "remaining_time": "1 day, 10:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3338, "total_steps": 17941, "loss": 1.8085, "learning_rate": 9.28591548296285e-05, "epoch": 0.1860542890585809, "percentage": 18.61, "elapsed_time": "7:53:53", "remaining_time": "1 day, 10:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3339, "total_steps": 17941, "loss": 1.7652, "learning_rate": 9.285456836339537e-05, "epoch": 0.18611002731174406, "percentage": 18.61, "elapsed_time": "7:54:02", "remaining_time": "1 day, 10:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3340, "total_steps": 17941, "loss": 1.7365, "learning_rate": 9.284998053806516e-05, "epoch": 0.1861657655649072, "percentage": 18.62, "elapsed_time": "7:54:10", "remaining_time": "1 day, 10:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3341, "total_steps": 17941, "loss": 1.8217, "learning_rate": 9.284539135378341e-05, "epoch": 0.18622150381807034, "percentage": 18.62, "elapsed_time": "7:54:19", "remaining_time": "1 day, 10:32:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3342, "total_steps": 17941, "loss": 1.7073, "learning_rate": 9.284080081069565e-05, "epoch": 0.1862772420712335, "percentage": 18.63, "elapsed_time": "7:54:27", "remaining_time": "1 day, 10:32:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3343, "total_steps": 17941, "loss": 1.6885, "learning_rate": 9.283620890894749e-05, "epoch": 0.18633298032439663, "percentage": 18.63, "elapsed_time": "7:54:36", "remaining_time": "1 day, 10:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3344, "total_steps": 17941, "loss": 1.8512, "learning_rate": 9.283161564868452e-05, "epoch": 0.1863887185775598, "percentage": 18.64, "elapsed_time": "7:54:44", "remaining_time": "1 day, 10:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3345, "total_steps": 17941, "loss": 1.8003, "learning_rate": 9.282702103005243e-05, "epoch": 0.18644445683072292, "percentage": 18.64, "elapsed_time": "7:54:53", "remaining_time": "1 day, 10:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3346, "total_steps": 17941, "loss": 1.7775, "learning_rate": 9.282242505319693e-05, "epoch": 0.18650019508388607, "percentage": 18.65, "elapsed_time": "7:55:01", "remaining_time": "1 day, 10:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3347, "total_steps": 17941, "loss": 1.4253, "learning_rate": 9.281782771826378e-05, "epoch": 0.18655593333704923, "percentage": 18.66, "elapsed_time": "7:55:10", "remaining_time": "1 day, 10:31:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3348, "total_steps": 17941, "loss": 1.7682, "learning_rate": 9.281322902539878e-05, "epoch": 0.18661167159021236, "percentage": 18.66, "elapsed_time": "7:55:18", "remaining_time": "1 day, 10:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3349, "total_steps": 17941, "loss": 1.5904, "learning_rate": 9.280862897474776e-05, "epoch": 0.18666740984337551, "percentage": 18.67, "elapsed_time": "7:55:27", "remaining_time": "1 day, 10:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3350, "total_steps": 17941, "loss": 1.9147, "learning_rate": 9.280402756645663e-05, "epoch": 0.18672314809653864, "percentage": 18.67, "elapsed_time": "7:55:35", "remaining_time": "1 day, 10:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3351, "total_steps": 17941, "loss": 1.7212, "learning_rate": 9.279942480067131e-05, "epoch": 0.1867788863497018, "percentage": 18.68, "elapsed_time": "7:55:44", "remaining_time": "1 day, 10:31:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3352, "total_steps": 17941, "loss": 1.8177, "learning_rate": 9.279482067753777e-05, "epoch": 0.18683462460286496, "percentage": 18.68, "elapsed_time": "7:55:52", "remaining_time": "1 day, 10:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3353, "total_steps": 17941, "loss": 1.7726, "learning_rate": 9.279021519720203e-05, "epoch": 0.18689036285602809, "percentage": 18.69, "elapsed_time": "7:56:01", "remaining_time": "1 day, 10:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3354, "total_steps": 17941, "loss": 1.7335, "learning_rate": 9.278560835981016e-05, "epoch": 0.18694610110919124, "percentage": 18.69, "elapsed_time": "7:56:09", "remaining_time": "1 day, 10:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3355, "total_steps": 17941, "loss": 1.8071, "learning_rate": 9.278100016550825e-05, "epoch": 0.18700183936235437, "percentage": 18.7, "elapsed_time": "7:56:18", "remaining_time": "1 day, 10:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3356, "total_steps": 17941, "loss": 1.7673, "learning_rate": 9.277639061444244e-05, "epoch": 0.18705757761551753, "percentage": 18.71, "elapsed_time": "7:56:26", "remaining_time": "1 day, 10:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3357, "total_steps": 17941, "loss": 1.686, "learning_rate": 9.277177970675893e-05, "epoch": 0.18711331586868069, "percentage": 18.71, "elapsed_time": "7:56:34", "remaining_time": "1 day, 10:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3358, "total_steps": 17941, "loss": 1.8069, "learning_rate": 9.276716744260392e-05, "epoch": 0.18716905412184381, "percentage": 18.72, "elapsed_time": "7:56:43", "remaining_time": "1 day, 10:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3359, "total_steps": 17941, "loss": 1.7838, "learning_rate": 9.276255382212373e-05, "epoch": 0.18722479237500697, "percentage": 18.72, "elapsed_time": "7:56:51", "remaining_time": "1 day, 10:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3360, "total_steps": 17941, "loss": 1.6363, "learning_rate": 9.275793884546465e-05, "epoch": 0.1872805306281701, "percentage": 18.73, "elapsed_time": "7:57:00", "remaining_time": "1 day, 10:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3361, "total_steps": 17941, "loss": 1.7624, "learning_rate": 9.275332251277305e-05, "epoch": 0.18733626888133326, "percentage": 18.73, "elapsed_time": "7:57:08", "remaining_time": "1 day, 10:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3362, "total_steps": 17941, "loss": 1.785, "learning_rate": 9.274870482419533e-05, "epoch": 0.1873920071344964, "percentage": 18.74, "elapsed_time": "7:57:17", "remaining_time": "1 day, 10:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3363, "total_steps": 17941, "loss": 1.7629, "learning_rate": 9.274408577987792e-05, "epoch": 0.18744774538765954, "percentage": 18.74, "elapsed_time": "7:57:25", "remaining_time": "1 day, 10:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3364, "total_steps": 17941, "loss": 1.6675, "learning_rate": 9.273946537996734e-05, "epoch": 0.1875034836408227, "percentage": 18.75, "elapsed_time": "7:57:34", "remaining_time": "1 day, 10:29:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3365, "total_steps": 17941, "loss": 1.8703, "learning_rate": 9.273484362461011e-05, "epoch": 0.18755922189398586, "percentage": 18.76, "elapsed_time": "7:57:42", "remaining_time": "1 day, 10:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3366, "total_steps": 17941, "loss": 1.646, "learning_rate": 9.273022051395278e-05, "epoch": 0.18761496014714898, "percentage": 18.76, "elapsed_time": "7:57:51", "remaining_time": "1 day, 10:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3367, "total_steps": 17941, "loss": 1.7221, "learning_rate": 9.272559604814201e-05, "epoch": 0.18767069840031214, "percentage": 18.77, "elapsed_time": "7:57:59", "remaining_time": "1 day, 10:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3368, "total_steps": 17941, "loss": 1.5933, "learning_rate": 9.272097022732443e-05, "epoch": 0.18772643665347527, "percentage": 18.77, "elapsed_time": "7:58:07", "remaining_time": "1 day, 10:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3369, "total_steps": 17941, "loss": 1.7312, "learning_rate": 9.271634305164675e-05, "epoch": 0.18778217490663843, "percentage": 18.78, "elapsed_time": "7:58:16", "remaining_time": "1 day, 10:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3370, "total_steps": 17941, "loss": 1.7442, "learning_rate": 9.271171452125575e-05, "epoch": 0.18783791315980158, "percentage": 18.78, "elapsed_time": "7:58:24", "remaining_time": "1 day, 10:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3371, "total_steps": 17941, "loss": 1.7939, "learning_rate": 9.270708463629815e-05, "epoch": 0.1878936514129647, "percentage": 18.79, "elapsed_time": "7:58:33", "remaining_time": "1 day, 10:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3372, "total_steps": 17941, "loss": 1.8941, "learning_rate": 9.270245339692086e-05, "epoch": 0.18794938966612787, "percentage": 18.79, "elapsed_time": "7:58:41", "remaining_time": "1 day, 10:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3373, "total_steps": 17941, "loss": 1.6895, "learning_rate": 9.269782080327071e-05, "epoch": 0.188005127919291, "percentage": 18.8, "elapsed_time": "7:58:50", "remaining_time": "1 day, 10:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3374, "total_steps": 17941, "loss": 1.6734, "learning_rate": 9.269318685549463e-05, "epoch": 0.18806086617245416, "percentage": 18.81, "elapsed_time": "7:58:58", "remaining_time": "1 day, 10:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3375, "total_steps": 17941, "loss": 1.848, "learning_rate": 9.268855155373957e-05, "epoch": 0.1881166044256173, "percentage": 18.81, "elapsed_time": "7:59:07", "remaining_time": "1 day, 10:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3376, "total_steps": 17941, "loss": 1.4297, "learning_rate": 9.268391489815257e-05, "epoch": 0.18817234267878044, "percentage": 18.82, "elapsed_time": "7:59:15", "remaining_time": "1 day, 10:27:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3377, "total_steps": 17941, "loss": 1.8073, "learning_rate": 9.267927688888062e-05, "epoch": 0.1882280809319436, "percentage": 18.82, "elapsed_time": "7:59:24", "remaining_time": "1 day, 10:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3378, "total_steps": 17941, "loss": 1.751, "learning_rate": 9.267463752607089e-05, "epoch": 0.18828381918510673, "percentage": 18.83, "elapsed_time": "7:59:33", "remaining_time": "1 day, 10:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3379, "total_steps": 17941, "loss": 1.498, "learning_rate": 9.266999680987043e-05, "epoch": 0.18833955743826988, "percentage": 18.83, "elapsed_time": "7:59:41", "remaining_time": "1 day, 10:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3380, "total_steps": 17941, "loss": 1.4733, "learning_rate": 9.266535474042647e-05, "epoch": 0.18839529569143304, "percentage": 18.84, "elapsed_time": "7:59:50", "remaining_time": "1 day, 10:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3381, "total_steps": 17941, "loss": 1.904, "learning_rate": 9.266071131788621e-05, "epoch": 0.18845103394459617, "percentage": 18.85, "elapsed_time": "7:59:58", "remaining_time": "1 day, 10:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3382, "total_steps": 17941, "loss": 1.8644, "learning_rate": 9.26560665423969e-05, "epoch": 0.18850677219775933, "percentage": 18.85, "elapsed_time": "8:00:06", "remaining_time": "1 day, 10:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3383, "total_steps": 17941, "loss": 1.6917, "learning_rate": 9.265142041410589e-05, "epoch": 0.18856251045092245, "percentage": 18.86, "elapsed_time": "8:00:15", "remaining_time": "1 day, 10:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3384, "total_steps": 17941, "loss": 1.7944, "learning_rate": 9.26467729331605e-05, "epoch": 0.1886182487040856, "percentage": 18.86, "elapsed_time": "8:00:23", "remaining_time": "1 day, 10:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3385, "total_steps": 17941, "loss": 1.9372, "learning_rate": 9.26421240997081e-05, "epoch": 0.18867398695724877, "percentage": 18.87, "elapsed_time": "8:00:32", "remaining_time": "1 day, 10:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3386, "total_steps": 17941, "loss": 1.9591, "learning_rate": 9.263747391389615e-05, "epoch": 0.1887297252104119, "percentage": 18.87, "elapsed_time": "8:00:40", "remaining_time": "1 day, 10:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3387, "total_steps": 17941, "loss": 1.5718, "learning_rate": 9.263282237587213e-05, "epoch": 0.18878546346357505, "percentage": 18.88, "elapsed_time": "8:00:49", "remaining_time": "1 day, 10:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3388, "total_steps": 17941, "loss": 1.7829, "learning_rate": 9.262816948578354e-05, "epoch": 0.1888412017167382, "percentage": 18.88, "elapsed_time": "8:00:57", "remaining_time": "1 day, 10:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3389, "total_steps": 17941, "loss": 1.8848, "learning_rate": 9.262351524377797e-05, "epoch": 0.18889693996990134, "percentage": 18.89, "elapsed_time": "8:01:06", "remaining_time": "1 day, 10:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3390, "total_steps": 17941, "loss": 1.3356, "learning_rate": 9.261885965000298e-05, "epoch": 0.1889526782230645, "percentage": 18.9, "elapsed_time": "8:01:14", "remaining_time": "1 day, 10:25:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3391, "total_steps": 17941, "loss": 1.7632, "learning_rate": 9.261420270460628e-05, "epoch": 0.18900841647622763, "percentage": 18.9, "elapsed_time": "8:01:23", "remaining_time": "1 day, 10:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3392, "total_steps": 17941, "loss": 1.6608, "learning_rate": 9.26095444077355e-05, "epoch": 0.18906415472939078, "percentage": 18.91, "elapsed_time": "8:01:31", "remaining_time": "1 day, 10:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3393, "total_steps": 17941, "loss": 1.8704, "learning_rate": 9.260488475953842e-05, "epoch": 0.18911989298255394, "percentage": 18.91, "elapsed_time": "8:01:40", "remaining_time": "1 day, 10:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3394, "total_steps": 17941, "loss": 1.515, "learning_rate": 9.26002237601628e-05, "epoch": 0.18917563123571707, "percentage": 18.92, "elapsed_time": "8:01:49", "remaining_time": "1 day, 10:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3395, "total_steps": 17941, "loss": 1.448, "learning_rate": 9.259556140975644e-05, "epoch": 0.18923136948888022, "percentage": 18.92, "elapsed_time": "8:01:57", "remaining_time": "1 day, 10:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3396, "total_steps": 17941, "loss": 1.7052, "learning_rate": 9.259089770846723e-05, "epoch": 0.18928710774204335, "percentage": 18.93, "elapsed_time": "8:02:06", "remaining_time": "1 day, 10:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3397, "total_steps": 17941, "loss": 1.8782, "learning_rate": 9.258623265644309e-05, "epoch": 0.1893428459952065, "percentage": 18.93, "elapsed_time": "8:02:14", "remaining_time": "1 day, 10:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3398, "total_steps": 17941, "loss": 1.6754, "learning_rate": 9.258156625383192e-05, "epoch": 0.18939858424836967, "percentage": 18.94, "elapsed_time": "8:02:23", "remaining_time": "1 day, 10:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3399, "total_steps": 17941, "loss": 1.7709, "learning_rate": 9.257689850078174e-05, "epoch": 0.1894543225015328, "percentage": 18.95, "elapsed_time": "8:02:31", "remaining_time": "1 day, 10:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3400, "total_steps": 17941, "loss": 1.6806, "learning_rate": 9.257222939744059e-05, "epoch": 0.18951006075469595, "percentage": 18.95, "elapsed_time": "8:02:39", "remaining_time": "1 day, 10:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3401, "total_steps": 17941, "loss": 1.6614, "learning_rate": 9.256755894395652e-05, "epoch": 0.18956579900785908, "percentage": 18.96, "elapsed_time": "8:02:48", "remaining_time": "1 day, 10:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3402, "total_steps": 17941, "loss": 1.9115, "learning_rate": 9.256288714047767e-05, "epoch": 0.18962153726102224, "percentage": 18.96, "elapsed_time": "8:02:56", "remaining_time": "1 day, 10:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3403, "total_steps": 17941, "loss": 1.6686, "learning_rate": 9.255821398715221e-05, "epoch": 0.1896772755141854, "percentage": 18.97, "elapsed_time": "8:03:05", "remaining_time": "1 day, 10:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3404, "total_steps": 17941, "loss": 1.5406, "learning_rate": 9.255353948412833e-05, "epoch": 0.18973301376734852, "percentage": 18.97, "elapsed_time": "8:03:13", "remaining_time": "1 day, 10:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3405, "total_steps": 17941, "loss": 1.8979, "learning_rate": 9.254886363155429e-05, "epoch": 0.18978875202051168, "percentage": 18.98, "elapsed_time": "8:03:22", "remaining_time": "1 day, 10:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3406, "total_steps": 17941, "loss": 1.7284, "learning_rate": 9.254418642957835e-05, "epoch": 0.1898444902736748, "percentage": 18.98, "elapsed_time": "8:03:30", "remaining_time": "1 day, 10:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3407, "total_steps": 17941, "loss": 1.7517, "learning_rate": 9.253950787834889e-05, "epoch": 0.18990022852683797, "percentage": 18.99, "elapsed_time": "8:03:39", "remaining_time": "1 day, 10:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3408, "total_steps": 17941, "loss": 1.7069, "learning_rate": 9.253482797801425e-05, "epoch": 0.18995596678000112, "percentage": 19.0, "elapsed_time": "8:03:48", "remaining_time": "1 day, 10:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3409, "total_steps": 17941, "loss": 1.4309, "learning_rate": 9.253014672872285e-05, "epoch": 0.19001170503316425, "percentage": 19.0, "elapsed_time": "8:03:56", "remaining_time": "1 day, 10:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3410, "total_steps": 17941, "loss": 1.6337, "learning_rate": 9.252546413062319e-05, "epoch": 0.1900674432863274, "percentage": 19.01, "elapsed_time": "8:04:05", "remaining_time": "1 day, 10:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3411, "total_steps": 17941, "loss": 1.4486, "learning_rate": 9.252078018386374e-05, "epoch": 0.19012318153949057, "percentage": 19.01, "elapsed_time": "8:04:13", "remaining_time": "1 day, 10:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3412, "total_steps": 17941, "loss": 1.524, "learning_rate": 9.251609488859304e-05, "epoch": 0.1901789197926537, "percentage": 19.02, "elapsed_time": "8:04:22", "remaining_time": "1 day, 10:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3413, "total_steps": 17941, "loss": 1.6331, "learning_rate": 9.251140824495972e-05, "epoch": 0.19023465804581685, "percentage": 19.02, "elapsed_time": "8:04:31", "remaining_time": "1 day, 10:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3414, "total_steps": 17941, "loss": 1.6409, "learning_rate": 9.250672025311237e-05, "epoch": 0.19029039629897998, "percentage": 19.03, "elapsed_time": "8:04:39", "remaining_time": "1 day, 10:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3415, "total_steps": 17941, "loss": 1.7712, "learning_rate": 9.250203091319968e-05, "epoch": 0.19034613455214314, "percentage": 19.03, "elapsed_time": "8:04:48", "remaining_time": "1 day, 10:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3416, "total_steps": 17941, "loss": 1.888, "learning_rate": 9.24973402253704e-05, "epoch": 0.1904018728053063, "percentage": 19.04, "elapsed_time": "8:04:56", "remaining_time": "1 day, 10:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3417, "total_steps": 17941, "loss": 1.6808, "learning_rate": 9.249264818977324e-05, "epoch": 0.19045761105846942, "percentage": 19.05, "elapsed_time": "8:05:05", "remaining_time": "1 day, 10:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3418, "total_steps": 17941, "loss": 1.8398, "learning_rate": 9.248795480655704e-05, "epoch": 0.19051334931163258, "percentage": 19.05, "elapsed_time": "8:05:13", "remaining_time": "1 day, 10:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3419, "total_steps": 17941, "loss": 1.7295, "learning_rate": 9.248326007587063e-05, "epoch": 0.1905690875647957, "percentage": 19.06, "elapsed_time": "8:05:22", "remaining_time": "1 day, 10:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3420, "total_steps": 17941, "loss": 1.7717, "learning_rate": 9.247856399786292e-05, "epoch": 0.19062482581795887, "percentage": 19.06, "elapsed_time": "8:05:30", "remaining_time": "1 day, 10:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3421, "total_steps": 17941, "loss": 1.5417, "learning_rate": 9.247386657268283e-05, "epoch": 0.19068056407112202, "percentage": 19.07, "elapsed_time": "8:05:39", "remaining_time": "1 day, 10:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3422, "total_steps": 17941, "loss": 1.8882, "learning_rate": 9.24691678004793e-05, "epoch": 0.19073630232428515, "percentage": 19.07, "elapsed_time": "8:05:47", "remaining_time": "1 day, 10:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3423, "total_steps": 17941, "loss": 1.8083, "learning_rate": 9.24644676814014e-05, "epoch": 0.1907920405774483, "percentage": 19.08, "elapsed_time": "8:05:56", "remaining_time": "1 day, 10:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3424, "total_steps": 17941, "loss": 1.8532, "learning_rate": 9.245976621559817e-05, "epoch": 0.19084777883061144, "percentage": 19.08, "elapsed_time": "8:06:04", "remaining_time": "1 day, 10:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3425, "total_steps": 17941, "loss": 1.5365, "learning_rate": 9.24550634032187e-05, "epoch": 0.1909035170837746, "percentage": 19.09, "elapsed_time": "8:06:13", "remaining_time": "1 day, 10:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3426, "total_steps": 17941, "loss": 1.854, "learning_rate": 9.245035924441217e-05, "epoch": 0.19095925533693775, "percentage": 19.1, "elapsed_time": "8:06:21", "remaining_time": "1 day, 10:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3427, "total_steps": 17941, "loss": 1.7373, "learning_rate": 9.244565373932774e-05, "epoch": 0.19101499359010088, "percentage": 19.1, "elapsed_time": "8:06:29", "remaining_time": "1 day, 10:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3428, "total_steps": 17941, "loss": 1.746, "learning_rate": 9.244094688811465e-05, "epoch": 0.19107073184326404, "percentage": 19.11, "elapsed_time": "8:06:38", "remaining_time": "1 day, 10:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3429, "total_steps": 17941, "loss": 1.3836, "learning_rate": 9.243623869092218e-05, "epoch": 0.19112647009642716, "percentage": 19.11, "elapsed_time": "8:06:46", "remaining_time": "1 day, 10:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3430, "total_steps": 17941, "loss": 1.8499, "learning_rate": 9.24315291478996e-05, "epoch": 0.19118220834959032, "percentage": 19.12, "elapsed_time": "8:06:55", "remaining_time": "1 day, 10:19:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3431, "total_steps": 17941, "loss": 1.6767, "learning_rate": 9.242681825919635e-05, "epoch": 0.19123794660275348, "percentage": 19.12, "elapsed_time": "8:07:03", "remaining_time": "1 day, 10:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3432, "total_steps": 17941, "loss": 1.7963, "learning_rate": 9.242210602496178e-05, "epoch": 0.1912936848559166, "percentage": 19.13, "elapsed_time": "8:07:12", "remaining_time": "1 day, 10:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3433, "total_steps": 17941, "loss": 1.7885, "learning_rate": 9.241739244534534e-05, "epoch": 0.19134942310907976, "percentage": 19.13, "elapsed_time": "8:07:20", "remaining_time": "1 day, 10:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3434, "total_steps": 17941, "loss": 1.7971, "learning_rate": 9.241267752049653e-05, "epoch": 0.19140516136224292, "percentage": 19.14, "elapsed_time": "8:07:29", "remaining_time": "1 day, 10:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3435, "total_steps": 17941, "loss": 1.7376, "learning_rate": 9.240796125056486e-05, "epoch": 0.19146089961540605, "percentage": 19.15, "elapsed_time": "8:07:37", "remaining_time": "1 day, 10:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3436, "total_steps": 17941, "loss": 1.6705, "learning_rate": 9.240324363569992e-05, "epoch": 0.1915166378685692, "percentage": 19.15, "elapsed_time": "8:07:46", "remaining_time": "1 day, 10:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3437, "total_steps": 17941, "loss": 1.8505, "learning_rate": 9.239852467605132e-05, "epoch": 0.19157237612173234, "percentage": 19.16, "elapsed_time": "8:07:54", "remaining_time": "1 day, 10:18:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3438, "total_steps": 17941, "loss": 1.7993, "learning_rate": 9.239380437176872e-05, "epoch": 0.1916281143748955, "percentage": 19.16, "elapsed_time": "8:08:03", "remaining_time": "1 day, 10:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3439, "total_steps": 17941, "loss": 1.803, "learning_rate": 9.238908272300181e-05, "epoch": 0.19168385262805865, "percentage": 19.17, "elapsed_time": "8:08:11", "remaining_time": "1 day, 10:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3440, "total_steps": 17941, "loss": 1.6364, "learning_rate": 9.238435972990036e-05, "epoch": 0.19173959088122178, "percentage": 19.17, "elapsed_time": "8:08:20", "remaining_time": "1 day, 10:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3441, "total_steps": 17941, "loss": 1.8069, "learning_rate": 9.237963539261412e-05, "epoch": 0.19179532913438493, "percentage": 19.18, "elapsed_time": "8:08:28", "remaining_time": "1 day, 10:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3442, "total_steps": 17941, "loss": 1.6969, "learning_rate": 9.237490971129294e-05, "epoch": 0.19185106738754806, "percentage": 19.19, "elapsed_time": "8:08:37", "remaining_time": "1 day, 10:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3443, "total_steps": 17941, "loss": 1.7135, "learning_rate": 9.23701826860867e-05, "epoch": 0.19190680564071122, "percentage": 19.19, "elapsed_time": "8:08:45", "remaining_time": "1 day, 10:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3444, "total_steps": 17941, "loss": 1.8724, "learning_rate": 9.236545431714529e-05, "epoch": 0.19196254389387438, "percentage": 19.2, "elapsed_time": "8:08:54", "remaining_time": "1 day, 10:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3445, "total_steps": 17941, "loss": 1.7944, "learning_rate": 9.236072460461867e-05, "epoch": 0.1920182821470375, "percentage": 19.2, "elapsed_time": "8:09:03", "remaining_time": "1 day, 10:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3446, "total_steps": 17941, "loss": 1.5557, "learning_rate": 9.235599354865686e-05, "epoch": 0.19207402040020066, "percentage": 19.21, "elapsed_time": "8:09:11", "remaining_time": "1 day, 10:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3447, "total_steps": 17941, "loss": 1.8263, "learning_rate": 9.235126114940989e-05, "epoch": 0.1921297586533638, "percentage": 19.21, "elapsed_time": "8:09:20", "remaining_time": "1 day, 10:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3448, "total_steps": 17941, "loss": 1.7186, "learning_rate": 9.234652740702781e-05, "epoch": 0.19218549690652695, "percentage": 19.22, "elapsed_time": "8:09:29", "remaining_time": "1 day, 10:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3449, "total_steps": 17941, "loss": 1.5176, "learning_rate": 9.23417923216608e-05, "epoch": 0.1922412351596901, "percentage": 19.22, "elapsed_time": "8:09:37", "remaining_time": "1 day, 10:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3450, "total_steps": 17941, "loss": 1.8129, "learning_rate": 9.233705589345902e-05, "epoch": 0.19229697341285323, "percentage": 19.23, "elapsed_time": "8:09:45", "remaining_time": "1 day, 10:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3451, "total_steps": 17941, "loss": 1.5314, "learning_rate": 9.233231812257265e-05, "epoch": 0.1923527116660164, "percentage": 19.24, "elapsed_time": "8:09:54", "remaining_time": "1 day, 10:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3452, "total_steps": 17941, "loss": 1.6043, "learning_rate": 9.232757900915197e-05, "epoch": 0.19240844991917952, "percentage": 19.24, "elapsed_time": "8:10:02", "remaining_time": "1 day, 10:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3453, "total_steps": 17941, "loss": 1.8168, "learning_rate": 9.232283855334727e-05, "epoch": 0.19246418817234268, "percentage": 19.25, "elapsed_time": "8:10:11", "remaining_time": "1 day, 10:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3454, "total_steps": 17941, "loss": 1.7076, "learning_rate": 9.231809675530888e-05, "epoch": 0.19251992642550583, "percentage": 19.25, "elapsed_time": "8:10:20", "remaining_time": "1 day, 10:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3455, "total_steps": 17941, "loss": 1.8021, "learning_rate": 9.23133536151872e-05, "epoch": 0.19257566467866896, "percentage": 19.26, "elapsed_time": "8:10:28", "remaining_time": "1 day, 10:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3456, "total_steps": 17941, "loss": 1.659, "learning_rate": 9.230860913313266e-05, "epoch": 0.19263140293183212, "percentage": 19.26, "elapsed_time": "8:10:37", "remaining_time": "1 day, 10:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3457, "total_steps": 17941, "loss": 1.8172, "learning_rate": 9.23038633092957e-05, "epoch": 0.19268714118499528, "percentage": 19.27, "elapsed_time": "8:10:45", "remaining_time": "1 day, 10:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3458, "total_steps": 17941, "loss": 1.6086, "learning_rate": 9.229911614382685e-05, "epoch": 0.1927428794381584, "percentage": 19.27, "elapsed_time": "8:10:54", "remaining_time": "1 day, 10:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3459, "total_steps": 17941, "loss": 1.7102, "learning_rate": 9.229436763687665e-05, "epoch": 0.19279861769132156, "percentage": 19.28, "elapsed_time": "8:11:02", "remaining_time": "1 day, 10:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3460, "total_steps": 17941, "loss": 1.6291, "learning_rate": 9.228961778859572e-05, "epoch": 0.1928543559444847, "percentage": 19.29, "elapsed_time": "8:11:11", "remaining_time": "1 day, 10:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3461, "total_steps": 17941, "loss": 1.7628, "learning_rate": 9.228486659913467e-05, "epoch": 0.19291009419764785, "percentage": 19.29, "elapsed_time": "8:11:19", "remaining_time": "1 day, 10:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3462, "total_steps": 17941, "loss": 1.6604, "learning_rate": 9.228011406864417e-05, "epoch": 0.192965832450811, "percentage": 19.3, "elapsed_time": "8:11:27", "remaining_time": "1 day, 10:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3463, "total_steps": 17941, "loss": 1.6571, "learning_rate": 9.227536019727498e-05, "epoch": 0.19302157070397413, "percentage": 19.3, "elapsed_time": "8:11:36", "remaining_time": "1 day, 10:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3464, "total_steps": 17941, "loss": 1.6586, "learning_rate": 9.227060498517785e-05, "epoch": 0.1930773089571373, "percentage": 19.31, "elapsed_time": "8:11:44", "remaining_time": "1 day, 10:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3465, "total_steps": 17941, "loss": 1.6693, "learning_rate": 9.226584843250357e-05, "epoch": 0.19313304721030042, "percentage": 19.31, "elapsed_time": "8:11:53", "remaining_time": "1 day, 10:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3466, "total_steps": 17941, "loss": 1.8516, "learning_rate": 9.226109053940302e-05, "epoch": 0.19318878546346357, "percentage": 19.32, "elapsed_time": "8:12:02", "remaining_time": "1 day, 10:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3467, "total_steps": 17941, "loss": 1.8369, "learning_rate": 9.225633130602707e-05, "epoch": 0.19324452371662673, "percentage": 19.32, "elapsed_time": "8:12:10", "remaining_time": "1 day, 10:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3468, "total_steps": 17941, "loss": 1.7936, "learning_rate": 9.225157073252666e-05, "epoch": 0.19330026196978986, "percentage": 19.33, "elapsed_time": "8:12:20", "remaining_time": "1 day, 10:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3469, "total_steps": 17941, "loss": 1.8398, "learning_rate": 9.224680881905279e-05, "epoch": 0.19335600022295302, "percentage": 19.34, "elapsed_time": "8:12:28", "remaining_time": "1 day, 10:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3470, "total_steps": 17941, "loss": 1.8699, "learning_rate": 9.224204556575644e-05, "epoch": 0.19341173847611615, "percentage": 19.34, "elapsed_time": "8:12:36", "remaining_time": "1 day, 10:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3471, "total_steps": 17941, "loss": 1.6961, "learning_rate": 9.22372809727887e-05, "epoch": 0.1934674767292793, "percentage": 19.35, "elapsed_time": "8:12:45", "remaining_time": "1 day, 10:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3472, "total_steps": 17941, "loss": 1.6302, "learning_rate": 9.223251504030066e-05, "epoch": 0.19352321498244246, "percentage": 19.35, "elapsed_time": "8:12:54", "remaining_time": "1 day, 10:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3473, "total_steps": 17941, "loss": 1.765, "learning_rate": 9.222774776844349e-05, "epoch": 0.1935789532356056, "percentage": 19.36, "elapsed_time": "8:13:03", "remaining_time": "1 day, 10:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3474, "total_steps": 17941, "loss": 1.783, "learning_rate": 9.222297915736834e-05, "epoch": 0.19363469148876875, "percentage": 19.36, "elapsed_time": "8:13:11", "remaining_time": "1 day, 10:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3475, "total_steps": 17941, "loss": 1.6188, "learning_rate": 9.22182092072265e-05, "epoch": 0.19369042974193187, "percentage": 19.37, "elapsed_time": "8:13:20", "remaining_time": "1 day, 10:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3476, "total_steps": 17941, "loss": 1.7017, "learning_rate": 9.221343791816918e-05, "epoch": 0.19374616799509503, "percentage": 19.37, "elapsed_time": "8:13:28", "remaining_time": "1 day, 10:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3477, "total_steps": 17941, "loss": 1.7064, "learning_rate": 9.220866529034776e-05, "epoch": 0.1938019062482582, "percentage": 19.38, "elapsed_time": "8:13:37", "remaining_time": "1 day, 10:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3478, "total_steps": 17941, "loss": 1.7807, "learning_rate": 9.220389132391356e-05, "epoch": 0.19385764450142132, "percentage": 19.39, "elapsed_time": "8:13:45", "remaining_time": "1 day, 10:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3479, "total_steps": 17941, "loss": 1.5785, "learning_rate": 9.219911601901799e-05, "epoch": 0.19391338275458447, "percentage": 19.39, "elapsed_time": "8:13:54", "remaining_time": "1 day, 10:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3480, "total_steps": 17941, "loss": 2.0297, "learning_rate": 9.21943393758125e-05, "epoch": 0.19396912100774763, "percentage": 19.4, "elapsed_time": "8:14:02", "remaining_time": "1 day, 10:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3481, "total_steps": 17941, "loss": 1.6824, "learning_rate": 9.218956139444858e-05, "epoch": 0.19402485926091076, "percentage": 19.4, "elapsed_time": "8:14:10", "remaining_time": "1 day, 10:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3482, "total_steps": 17941, "loss": 1.7264, "learning_rate": 9.218478207507775e-05, "epoch": 0.19408059751407392, "percentage": 19.41, "elapsed_time": "8:14:19", "remaining_time": "1 day, 10:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3483, "total_steps": 17941, "loss": 1.7967, "learning_rate": 9.218000141785158e-05, "epoch": 0.19413633576723704, "percentage": 19.41, "elapsed_time": "8:14:27", "remaining_time": "1 day, 10:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3484, "total_steps": 17941, "loss": 2.0026, "learning_rate": 9.21752194229217e-05, "epoch": 0.1941920740204002, "percentage": 19.42, "elapsed_time": "8:14:36", "remaining_time": "1 day, 10:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3485, "total_steps": 17941, "loss": 1.8374, "learning_rate": 9.217043609043975e-05, "epoch": 0.19424781227356336, "percentage": 19.42, "elapsed_time": "8:14:44", "remaining_time": "1 day, 10:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3486, "total_steps": 17941, "loss": 1.6248, "learning_rate": 9.216565142055745e-05, "epoch": 0.1943035505267265, "percentage": 19.43, "elapsed_time": "8:14:53", "remaining_time": "1 day, 10:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3487, "total_steps": 17941, "loss": 1.8659, "learning_rate": 9.216086541342652e-05, "epoch": 0.19435928877988964, "percentage": 19.44, "elapsed_time": "8:15:01", "remaining_time": "1 day, 10:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3488, "total_steps": 17941, "loss": 1.7026, "learning_rate": 9.215607806919877e-05, "epoch": 0.19441502703305277, "percentage": 19.44, "elapsed_time": "8:15:10", "remaining_time": "1 day, 10:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3489, "total_steps": 17941, "loss": 1.8766, "learning_rate": 9.2151289388026e-05, "epoch": 0.19447076528621593, "percentage": 19.45, "elapsed_time": "8:15:18", "remaining_time": "1 day, 10:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3490, "total_steps": 17941, "loss": 1.372, "learning_rate": 9.214649937006008e-05, "epoch": 0.1945265035393791, "percentage": 19.45, "elapsed_time": "8:15:27", "remaining_time": "1 day, 10:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3491, "total_steps": 17941, "loss": 1.8491, "learning_rate": 9.214170801545294e-05, "epoch": 0.19458224179254222, "percentage": 19.46, "elapsed_time": "8:15:35", "remaining_time": "1 day, 10:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3492, "total_steps": 17941, "loss": 1.4738, "learning_rate": 9.213691532435654e-05, "epoch": 0.19463798004570537, "percentage": 19.46, "elapsed_time": "8:15:43", "remaining_time": "1 day, 10:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3493, "total_steps": 17941, "loss": 1.5871, "learning_rate": 9.213212129692284e-05, "epoch": 0.1946937182988685, "percentage": 19.47, "elapsed_time": "8:15:52", "remaining_time": "1 day, 10:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3494, "total_steps": 17941, "loss": 1.6355, "learning_rate": 9.212732593330389e-05, "epoch": 0.19474945655203166, "percentage": 19.47, "elapsed_time": "8:16:00", "remaining_time": "1 day, 10:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3495, "total_steps": 17941, "loss": 1.8903, "learning_rate": 9.21225292336518e-05, "epoch": 0.19480519480519481, "percentage": 19.48, "elapsed_time": "8:16:09", "remaining_time": "1 day, 10:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3496, "total_steps": 17941, "loss": 1.9006, "learning_rate": 9.211773119811867e-05, "epoch": 0.19486093305835794, "percentage": 19.49, "elapsed_time": "8:16:17", "remaining_time": "1 day, 10:10:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3497, "total_steps": 17941, "loss": 1.5601, "learning_rate": 9.211293182685667e-05, "epoch": 0.1949166713115211, "percentage": 19.49, "elapsed_time": "8:16:26", "remaining_time": "1 day, 10:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3498, "total_steps": 17941, "loss": 1.7871, "learning_rate": 9.210813112001802e-05, "epoch": 0.19497240956468423, "percentage": 19.5, "elapsed_time": "8:16:34", "remaining_time": "1 day, 10:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3499, "total_steps": 17941, "loss": 1.69, "learning_rate": 9.210332907775494e-05, "epoch": 0.19502814781784739, "percentage": 19.5, "elapsed_time": "8:16:43", "remaining_time": "1 day, 10:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 17941, "loss": 1.916, "learning_rate": 9.209852570021975e-05, "epoch": 0.19508388607101054, "percentage": 19.51, "elapsed_time": "8:16:51", "remaining_time": "1 day, 10:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3501, "total_steps": 17941, "loss": 1.6651, "learning_rate": 9.209372098756476e-05, "epoch": 0.19513962432417367, "percentage": 19.51, "elapsed_time": "8:17:00", "remaining_time": "1 day, 10:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3502, "total_steps": 17941, "loss": 1.7589, "learning_rate": 9.208891493994239e-05, "epoch": 0.19519536257733683, "percentage": 19.52, "elapsed_time": "8:17:08", "remaining_time": "1 day, 10:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3503, "total_steps": 17941, "loss": 1.5889, "learning_rate": 9.208410755750501e-05, "epoch": 0.19525110083049999, "percentage": 19.53, "elapsed_time": "8:17:17", "remaining_time": "1 day, 10:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3504, "total_steps": 17941, "loss": 1.8472, "learning_rate": 9.207929884040511e-05, "epoch": 0.19530683908366311, "percentage": 19.53, "elapsed_time": "8:17:25", "remaining_time": "1 day, 10:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3505, "total_steps": 17941, "loss": 1.6471, "learning_rate": 9.20744887887952e-05, "epoch": 0.19536257733682627, "percentage": 19.54, "elapsed_time": "8:17:33", "remaining_time": "1 day, 10:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3506, "total_steps": 17941, "loss": 1.5727, "learning_rate": 9.206967740282783e-05, "epoch": 0.1954183155899894, "percentage": 19.54, "elapsed_time": "8:17:42", "remaining_time": "1 day, 10:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3507, "total_steps": 17941, "loss": 1.635, "learning_rate": 9.206486468265555e-05, "epoch": 0.19547405384315256, "percentage": 19.55, "elapsed_time": "8:17:50", "remaining_time": "1 day, 10:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3508, "total_steps": 17941, "loss": 1.7088, "learning_rate": 9.206005062843102e-05, "epoch": 0.1955297920963157, "percentage": 19.55, "elapsed_time": "8:17:59", "remaining_time": "1 day, 10:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3509, "total_steps": 17941, "loss": 1.7032, "learning_rate": 9.205523524030693e-05, "epoch": 0.19558553034947884, "percentage": 19.56, "elapsed_time": "8:18:07", "remaining_time": "1 day, 10:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3510, "total_steps": 17941, "loss": 1.8822, "learning_rate": 9.205041851843596e-05, "epoch": 0.195641268602642, "percentage": 19.56, "elapsed_time": "8:18:16", "remaining_time": "1 day, 10:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3511, "total_steps": 17941, "loss": 1.333, "learning_rate": 9.20456004629709e-05, "epoch": 0.19569700685580513, "percentage": 19.57, "elapsed_time": "8:18:24", "remaining_time": "1 day, 10:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3512, "total_steps": 17941, "loss": 1.8277, "learning_rate": 9.204078107406454e-05, "epoch": 0.19575274510896828, "percentage": 19.58, "elapsed_time": "8:18:33", "remaining_time": "1 day, 10:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3513, "total_steps": 17941, "loss": 1.5545, "learning_rate": 9.203596035186969e-05, "epoch": 0.19580848336213144, "percentage": 19.58, "elapsed_time": "8:18:41", "remaining_time": "1 day, 10:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3514, "total_steps": 17941, "loss": 1.6811, "learning_rate": 9.203113829653927e-05, "epoch": 0.19586422161529457, "percentage": 19.59, "elapsed_time": "8:18:49", "remaining_time": "1 day, 10:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3515, "total_steps": 17941, "loss": 1.548, "learning_rate": 9.202631490822622e-05, "epoch": 0.19591995986845773, "percentage": 19.59, "elapsed_time": "8:18:58", "remaining_time": "1 day, 10:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3516, "total_steps": 17941, "loss": 1.6624, "learning_rate": 9.202149018708347e-05, "epoch": 0.19597569812162086, "percentage": 19.6, "elapsed_time": "8:19:06", "remaining_time": "1 day, 10:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3517, "total_steps": 17941, "loss": 1.8557, "learning_rate": 9.201666413326408e-05, "epoch": 0.196031436374784, "percentage": 19.6, "elapsed_time": "8:19:15", "remaining_time": "1 day, 10:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3518, "total_steps": 17941, "loss": 1.5435, "learning_rate": 9.201183674692107e-05, "epoch": 0.19608717462794717, "percentage": 19.61, "elapsed_time": "8:19:23", "remaining_time": "1 day, 10:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3519, "total_steps": 17941, "loss": 1.4683, "learning_rate": 9.200700802820754e-05, "epoch": 0.1961429128811103, "percentage": 19.61, "elapsed_time": "8:19:32", "remaining_time": "1 day, 10:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3520, "total_steps": 17941, "loss": 1.8706, "learning_rate": 9.200217797727662e-05, "epoch": 0.19619865113427346, "percentage": 19.62, "elapsed_time": "8:19:40", "remaining_time": "1 day, 10:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3521, "total_steps": 17941, "loss": 1.5608, "learning_rate": 9.199734659428152e-05, "epoch": 0.19625438938743658, "percentage": 19.63, "elapsed_time": "8:19:49", "remaining_time": "1 day, 10:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3522, "total_steps": 17941, "loss": 1.7221, "learning_rate": 9.199251387937545e-05, "epoch": 0.19631012764059974, "percentage": 19.63, "elapsed_time": "8:19:57", "remaining_time": "1 day, 10:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3523, "total_steps": 17941, "loss": 1.7989, "learning_rate": 9.198767983271166e-05, "epoch": 0.1963658658937629, "percentage": 19.64, "elapsed_time": "8:20:06", "remaining_time": "1 day, 10:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3524, "total_steps": 17941, "loss": 2.0033, "learning_rate": 9.198284445444348e-05, "epoch": 0.19642160414692603, "percentage": 19.64, "elapsed_time": "8:20:14", "remaining_time": "1 day, 10:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3525, "total_steps": 17941, "loss": 1.9705, "learning_rate": 9.197800774472426e-05, "epoch": 0.19647734240008918, "percentage": 19.65, "elapsed_time": "8:20:23", "remaining_time": "1 day, 10:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3526, "total_steps": 17941, "loss": 1.0644, "learning_rate": 9.197316970370737e-05, "epoch": 0.19653308065325234, "percentage": 19.65, "elapsed_time": "8:20:31", "remaining_time": "1 day, 10:06:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3527, "total_steps": 17941, "loss": 1.662, "learning_rate": 9.196833033154625e-05, "epoch": 0.19658881890641547, "percentage": 19.66, "elapsed_time": "8:20:39", "remaining_time": "1 day, 10:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3528, "total_steps": 17941, "loss": 1.7743, "learning_rate": 9.19634896283944e-05, "epoch": 0.19664455715957863, "percentage": 19.66, "elapsed_time": "8:20:48", "remaining_time": "1 day, 10:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3529, "total_steps": 17941, "loss": 1.7682, "learning_rate": 9.195864759440531e-05, "epoch": 0.19670029541274175, "percentage": 19.67, "elapsed_time": "8:20:56", "remaining_time": "1 day, 10:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3530, "total_steps": 17941, "loss": 1.6731, "learning_rate": 9.195380422973257e-05, "epoch": 0.1967560336659049, "percentage": 19.68, "elapsed_time": "8:21:05", "remaining_time": "1 day, 10:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3531, "total_steps": 17941, "loss": 1.4618, "learning_rate": 9.194895953452976e-05, "epoch": 0.19681177191906807, "percentage": 19.68, "elapsed_time": "8:21:13", "remaining_time": "1 day, 10:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3532, "total_steps": 17941, "loss": 1.7007, "learning_rate": 9.194411350895053e-05, "epoch": 0.1968675101722312, "percentage": 19.69, "elapsed_time": "8:21:22", "remaining_time": "1 day, 10:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3533, "total_steps": 17941, "loss": 1.8571, "learning_rate": 9.193926615314857e-05, "epoch": 0.19692324842539435, "percentage": 19.69, "elapsed_time": "8:21:31", "remaining_time": "1 day, 10:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3534, "total_steps": 17941, "loss": 1.4968, "learning_rate": 9.193441746727762e-05, "epoch": 0.19697898667855748, "percentage": 19.7, "elapsed_time": "8:21:39", "remaining_time": "1 day, 10:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3535, "total_steps": 17941, "loss": 1.8938, "learning_rate": 9.192956745149144e-05, "epoch": 0.19703472493172064, "percentage": 19.7, "elapsed_time": "8:21:47", "remaining_time": "1 day, 10:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3536, "total_steps": 17941, "loss": 2.0865, "learning_rate": 9.192471610594384e-05, "epoch": 0.1970904631848838, "percentage": 19.71, "elapsed_time": "8:21:56", "remaining_time": "1 day, 10:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3537, "total_steps": 17941, "loss": 1.7354, "learning_rate": 9.191986343078868e-05, "epoch": 0.19714620143804693, "percentage": 19.71, "elapsed_time": "8:22:04", "remaining_time": "1 day, 10:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3538, "total_steps": 17941, "loss": 1.5218, "learning_rate": 9.191500942617988e-05, "epoch": 0.19720193969121008, "percentage": 19.72, "elapsed_time": "8:22:13", "remaining_time": "1 day, 10:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3539, "total_steps": 17941, "loss": 1.6676, "learning_rate": 9.191015409227134e-05, "epoch": 0.1972576779443732, "percentage": 19.73, "elapsed_time": "8:22:21", "remaining_time": "1 day, 10:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3540, "total_steps": 17941, "loss": 1.8602, "learning_rate": 9.190529742921707e-05, "epoch": 0.19731341619753637, "percentage": 19.73, "elapsed_time": "8:22:30", "remaining_time": "1 day, 10:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3541, "total_steps": 17941, "loss": 1.7324, "learning_rate": 9.190043943717111e-05, "epoch": 0.19736915445069952, "percentage": 19.74, "elapsed_time": "8:22:39", "remaining_time": "1 day, 10:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3542, "total_steps": 17941, "loss": 1.8098, "learning_rate": 9.189558011628749e-05, "epoch": 0.19742489270386265, "percentage": 19.74, "elapsed_time": "8:22:47", "remaining_time": "1 day, 10:03:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3543, "total_steps": 17941, "loss": 1.9953, "learning_rate": 9.189071946672033e-05, "epoch": 0.1974806309570258, "percentage": 19.75, "elapsed_time": "8:22:56", "remaining_time": "1 day, 10:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3544, "total_steps": 17941, "loss": 1.6697, "learning_rate": 9.18858574886238e-05, "epoch": 0.19753636921018894, "percentage": 19.75, "elapsed_time": "8:23:04", "remaining_time": "1 day, 10:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3545, "total_steps": 17941, "loss": 1.4443, "learning_rate": 9.188099418215208e-05, "epoch": 0.1975921074633521, "percentage": 19.76, "elapsed_time": "8:23:13", "remaining_time": "1 day, 10:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3546, "total_steps": 17941, "loss": 1.738, "learning_rate": 9.187612954745942e-05, "epoch": 0.19764784571651525, "percentage": 19.76, "elapsed_time": "8:23:21", "remaining_time": "1 day, 10:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3547, "total_steps": 17941, "loss": 1.7746, "learning_rate": 9.187126358470006e-05, "epoch": 0.19770358396967838, "percentage": 19.77, "elapsed_time": "8:23:30", "remaining_time": "1 day, 10:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3548, "total_steps": 17941, "loss": 1.5869, "learning_rate": 9.186639629402836e-05, "epoch": 0.19775932222284154, "percentage": 19.78, "elapsed_time": "8:23:38", "remaining_time": "1 day, 10:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3549, "total_steps": 17941, "loss": 1.4967, "learning_rate": 9.186152767559866e-05, "epoch": 0.1978150604760047, "percentage": 19.78, "elapsed_time": "8:23:47", "remaining_time": "1 day, 10:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3550, "total_steps": 17941, "loss": 1.7457, "learning_rate": 9.185665772956539e-05, "epoch": 0.19787079872916782, "percentage": 19.79, "elapsed_time": "8:23:56", "remaining_time": "1 day, 10:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3551, "total_steps": 17941, "loss": 1.6194, "learning_rate": 9.185178645608297e-05, "epoch": 0.19792653698233098, "percentage": 19.79, "elapsed_time": "8:24:04", "remaining_time": "1 day, 10:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3552, "total_steps": 17941, "loss": 1.8616, "learning_rate": 9.184691385530588e-05, "epoch": 0.1979822752354941, "percentage": 19.8, "elapsed_time": "8:24:13", "remaining_time": "1 day, 10:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3553, "total_steps": 17941, "loss": 1.5835, "learning_rate": 9.184203992738869e-05, "epoch": 0.19803801348865727, "percentage": 19.8, "elapsed_time": "8:24:21", "remaining_time": "1 day, 10:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3554, "total_steps": 17941, "loss": 1.6874, "learning_rate": 9.183716467248593e-05, "epoch": 0.19809375174182042, "percentage": 19.81, "elapsed_time": "8:24:30", "remaining_time": "1 day, 10:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3555, "total_steps": 17941, "loss": 1.7946, "learning_rate": 9.183228809075223e-05, "epoch": 0.19814948999498355, "percentage": 19.81, "elapsed_time": "8:24:38", "remaining_time": "1 day, 10:02:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3556, "total_steps": 17941, "loss": 1.6509, "learning_rate": 9.182741018234228e-05, "epoch": 0.1982052282481467, "percentage": 19.82, "elapsed_time": "8:24:47", "remaining_time": "1 day, 10:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3557, "total_steps": 17941, "loss": 1.6885, "learning_rate": 9.182253094741073e-05, "epoch": 0.19826096650130984, "percentage": 19.83, "elapsed_time": "8:24:55", "remaining_time": "1 day, 10:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3558, "total_steps": 17941, "loss": 1.7431, "learning_rate": 9.181765038611234e-05, "epoch": 0.198316704754473, "percentage": 19.83, "elapsed_time": "8:25:04", "remaining_time": "1 day, 10:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3559, "total_steps": 17941, "loss": 1.763, "learning_rate": 9.18127684986019e-05, "epoch": 0.19837244300763615, "percentage": 19.84, "elapsed_time": "8:25:13", "remaining_time": "1 day, 10:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3560, "total_steps": 17941, "loss": 1.9388, "learning_rate": 9.180788528503423e-05, "epoch": 0.19842818126079928, "percentage": 19.84, "elapsed_time": "8:25:21", "remaining_time": "1 day, 10:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3561, "total_steps": 17941, "loss": 1.8491, "learning_rate": 9.18030007455642e-05, "epoch": 0.19848391951396244, "percentage": 19.85, "elapsed_time": "8:25:30", "remaining_time": "1 day, 10:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3562, "total_steps": 17941, "loss": 1.657, "learning_rate": 9.179811488034671e-05, "epoch": 0.19853965776712557, "percentage": 19.85, "elapsed_time": "8:25:39", "remaining_time": "1 day, 10:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3563, "total_steps": 17941, "loss": 1.8632, "learning_rate": 9.17932276895367e-05, "epoch": 0.19859539602028872, "percentage": 19.86, "elapsed_time": "8:25:47", "remaining_time": "1 day, 10:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3564, "total_steps": 17941, "loss": 2.2768, "learning_rate": 9.17883391732892e-05, "epoch": 0.19865113427345188, "percentage": 19.87, "elapsed_time": "8:25:55", "remaining_time": "1 day, 10:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3565, "total_steps": 17941, "loss": 1.7145, "learning_rate": 9.178344933175922e-05, "epoch": 0.198706872526615, "percentage": 19.87, "elapsed_time": "8:26:04", "remaining_time": "1 day, 10:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3566, "total_steps": 17941, "loss": 1.6678, "learning_rate": 9.177855816510184e-05, "epoch": 0.19876261077977816, "percentage": 19.88, "elapsed_time": "8:26:12", "remaining_time": "1 day, 10:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3567, "total_steps": 17941, "loss": 1.6745, "learning_rate": 9.177366567347216e-05, "epoch": 0.1988183490329413, "percentage": 19.88, "elapsed_time": "8:26:21", "remaining_time": "1 day, 10:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3568, "total_steps": 17941, "loss": 1.7337, "learning_rate": 9.176877185702539e-05, "epoch": 0.19887408728610445, "percentage": 19.89, "elapsed_time": "8:26:29", "remaining_time": "1 day, 10:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3569, "total_steps": 17941, "loss": 1.754, "learning_rate": 9.17638767159167e-05, "epoch": 0.1989298255392676, "percentage": 19.89, "elapsed_time": "8:26:38", "remaining_time": "1 day, 10:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3570, "total_steps": 17941, "loss": 1.6508, "learning_rate": 9.175898025030134e-05, "epoch": 0.19898556379243074, "percentage": 19.9, "elapsed_time": "8:26:47", "remaining_time": "1 day, 10:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3571, "total_steps": 17941, "loss": 1.7258, "learning_rate": 9.175408246033458e-05, "epoch": 0.1990413020455939, "percentage": 19.9, "elapsed_time": "8:26:55", "remaining_time": "1 day, 9:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3572, "total_steps": 17941, "loss": 1.5918, "learning_rate": 9.17491833461718e-05, "epoch": 0.19909704029875705, "percentage": 19.91, "elapsed_time": "8:27:03", "remaining_time": "1 day, 9:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3573, "total_steps": 17941, "loss": 1.4328, "learning_rate": 9.174428290796833e-05, "epoch": 0.19915277855192018, "percentage": 19.92, "elapsed_time": "8:27:12", "remaining_time": "1 day, 9:59:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3574, "total_steps": 17941, "loss": 1.6627, "learning_rate": 9.173938114587957e-05, "epoch": 0.19920851680508334, "percentage": 19.92, "elapsed_time": "8:27:21", "remaining_time": "1 day, 9:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3575, "total_steps": 17941, "loss": 1.6238, "learning_rate": 9.173447806006102e-05, "epoch": 0.19926425505824646, "percentage": 19.93, "elapsed_time": "8:27:29", "remaining_time": "1 day, 9:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3576, "total_steps": 17941, "loss": 1.8033, "learning_rate": 9.172957365066815e-05, "epoch": 0.19931999331140962, "percentage": 19.93, "elapsed_time": "8:27:38", "remaining_time": "1 day, 9:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3577, "total_steps": 17941, "loss": 2.0117, "learning_rate": 9.17246679178565e-05, "epoch": 0.19937573156457278, "percentage": 19.94, "elapsed_time": "8:27:46", "remaining_time": "1 day, 9:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3578, "total_steps": 17941, "loss": 1.6994, "learning_rate": 9.171976086178164e-05, "epoch": 0.1994314698177359, "percentage": 19.94, "elapsed_time": "8:27:55", "remaining_time": "1 day, 9:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3579, "total_steps": 17941, "loss": 1.555, "learning_rate": 9.171485248259924e-05, "epoch": 0.19948720807089906, "percentage": 19.95, "elapsed_time": "8:28:03", "remaining_time": "1 day, 9:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3580, "total_steps": 17941, "loss": 1.7463, "learning_rate": 9.170994278046492e-05, "epoch": 0.1995429463240622, "percentage": 19.95, "elapsed_time": "8:28:12", "remaining_time": "1 day, 9:58:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3581, "total_steps": 17941, "loss": 1.8112, "learning_rate": 9.17050317555344e-05, "epoch": 0.19959868457722535, "percentage": 19.96, "elapsed_time": "8:28:20", "remaining_time": "1 day, 9:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3582, "total_steps": 17941, "loss": 1.7906, "learning_rate": 9.170011940796341e-05, "epoch": 0.1996544228303885, "percentage": 19.97, "elapsed_time": "8:28:29", "remaining_time": "1 day, 9:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3583, "total_steps": 17941, "loss": 2.0624, "learning_rate": 9.16952057379078e-05, "epoch": 0.19971016108355163, "percentage": 19.97, "elapsed_time": "8:28:37", "remaining_time": "1 day, 9:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3584, "total_steps": 17941, "loss": 1.8233, "learning_rate": 9.169029074552333e-05, "epoch": 0.1997658993367148, "percentage": 19.98, "elapsed_time": "8:28:46", "remaining_time": "1 day, 9:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3585, "total_steps": 17941, "loss": 1.6512, "learning_rate": 9.168537443096592e-05, "epoch": 0.19982163758987792, "percentage": 19.98, "elapsed_time": "8:28:54", "remaining_time": "1 day, 9:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3586, "total_steps": 17941, "loss": 1.5675, "learning_rate": 9.168045679439149e-05, "epoch": 0.19987737584304108, "percentage": 19.99, "elapsed_time": "8:29:03", "remaining_time": "1 day, 9:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3587, "total_steps": 17941, "loss": 1.8834, "learning_rate": 9.167553783595597e-05, "epoch": 0.19993311409620423, "percentage": 19.99, "elapsed_time": "8:29:11", "remaining_time": "1 day, 9:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3588, "total_steps": 17941, "loss": 1.7663, "learning_rate": 9.167061755581539e-05, "epoch": 0.19998885234936736, "percentage": 20.0, "elapsed_time": "8:29:20", "remaining_time": "1 day, 9:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3589, "total_steps": 17941, "loss": 1.8832, "learning_rate": 9.166569595412575e-05, "epoch": 0.20004459060253052, "percentage": 20.0, "elapsed_time": "8:29:28", "remaining_time": "1 day, 9:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3590, "total_steps": 17941, "loss": 1.661, "learning_rate": 9.166077303104319e-05, "epoch": 0.20010032885569365, "percentage": 20.01, "elapsed_time": "8:29:37", "remaining_time": "1 day, 9:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3591, "total_steps": 17941, "loss": 1.6764, "learning_rate": 9.165584878672378e-05, "epoch": 0.2001560671088568, "percentage": 20.02, "elapsed_time": "8:29:46", "remaining_time": "1 day, 9:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3592, "total_steps": 17941, "loss": 1.6847, "learning_rate": 9.165092322132374e-05, "epoch": 0.20021180536201996, "percentage": 20.02, "elapsed_time": "8:29:54", "remaining_time": "1 day, 9:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3593, "total_steps": 17941, "loss": 1.7428, "learning_rate": 9.164599633499925e-05, "epoch": 0.2002675436151831, "percentage": 20.03, "elapsed_time": "8:30:03", "remaining_time": "1 day, 9:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3594, "total_steps": 17941, "loss": 1.3011, "learning_rate": 9.164106812790657e-05, "epoch": 0.20032328186834625, "percentage": 20.03, "elapsed_time": "8:30:11", "remaining_time": "1 day, 9:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3595, "total_steps": 17941, "loss": 1.8065, "learning_rate": 9.1636138600202e-05, "epoch": 0.2003790201215094, "percentage": 20.04, "elapsed_time": "8:30:19", "remaining_time": "1 day, 9:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3596, "total_steps": 17941, "loss": 1.6812, "learning_rate": 9.163120775204187e-05, "epoch": 0.20043475837467253, "percentage": 20.04, "elapsed_time": "8:30:28", "remaining_time": "1 day, 9:56:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3597, "total_steps": 17941, "loss": 1.8109, "learning_rate": 9.162627558358255e-05, "epoch": 0.2004904966278357, "percentage": 20.05, "elapsed_time": "8:30:36", "remaining_time": "1 day, 9:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3598, "total_steps": 17941, "loss": 1.8183, "learning_rate": 9.162134209498046e-05, "epoch": 0.20054623488099882, "percentage": 20.05, "elapsed_time": "8:30:45", "remaining_time": "1 day, 9:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3599, "total_steps": 17941, "loss": 1.8642, "learning_rate": 9.161640728639207e-05, "epoch": 0.20060197313416198, "percentage": 20.06, "elapsed_time": "8:30:53", "remaining_time": "1 day, 9:55:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3600, "total_steps": 17941, "loss": 1.8178, "learning_rate": 9.161147115797388e-05, "epoch": 0.20065771138732513, "percentage": 20.07, "elapsed_time": "8:31:02", "remaining_time": "1 day, 9:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3601, "total_steps": 17941, "loss": 1.7343, "learning_rate": 9.160653370988243e-05, "epoch": 0.20071344964048826, "percentage": 20.07, "elapsed_time": "8:31:10", "remaining_time": "1 day, 9:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3602, "total_steps": 17941, "loss": 1.713, "learning_rate": 9.160159494227434e-05, "epoch": 0.20076918789365142, "percentage": 20.08, "elapsed_time": "8:31:18", "remaining_time": "1 day, 9:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3603, "total_steps": 17941, "loss": 1.8839, "learning_rate": 9.15966548553062e-05, "epoch": 0.20082492614681455, "percentage": 20.08, "elapsed_time": "8:31:27", "remaining_time": "1 day, 9:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3604, "total_steps": 17941, "loss": 1.8919, "learning_rate": 9.159171344913469e-05, "epoch": 0.2008806643999777, "percentage": 20.09, "elapsed_time": "8:31:35", "remaining_time": "1 day, 9:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3605, "total_steps": 17941, "loss": 1.7236, "learning_rate": 9.158677072391653e-05, "epoch": 0.20093640265314086, "percentage": 20.09, "elapsed_time": "8:31:44", "remaining_time": "1 day, 9:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3606, "total_steps": 17941, "loss": 1.6551, "learning_rate": 9.158182667980846e-05, "epoch": 0.200992140906304, "percentage": 20.1, "elapsed_time": "8:31:52", "remaining_time": "1 day, 9:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3607, "total_steps": 17941, "loss": 1.6537, "learning_rate": 9.157688131696729e-05, "epoch": 0.20104787915946715, "percentage": 20.1, "elapsed_time": "8:32:01", "remaining_time": "1 day, 9:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3608, "total_steps": 17941, "loss": 1.6112, "learning_rate": 9.157193463554986e-05, "epoch": 0.20110361741263028, "percentage": 20.11, "elapsed_time": "8:32:10", "remaining_time": "1 day, 9:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3609, "total_steps": 17941, "loss": 1.6377, "learning_rate": 9.156698663571305e-05, "epoch": 0.20115935566579343, "percentage": 20.12, "elapsed_time": "8:32:18", "remaining_time": "1 day, 9:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3610, "total_steps": 17941, "loss": 1.7296, "learning_rate": 9.156203731761376e-05, "epoch": 0.2012150939189566, "percentage": 20.12, "elapsed_time": "8:32:27", "remaining_time": "1 day, 9:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3611, "total_steps": 17941, "loss": 1.4073, "learning_rate": 9.155708668140899e-05, "epoch": 0.20127083217211972, "percentage": 20.13, "elapsed_time": "8:32:35", "remaining_time": "1 day, 9:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3612, "total_steps": 17941, "loss": 1.5432, "learning_rate": 9.155213472725571e-05, "epoch": 0.20132657042528287, "percentage": 20.13, "elapsed_time": "8:32:44", "remaining_time": "1 day, 9:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3613, "total_steps": 17941, "loss": 1.79, "learning_rate": 9.154718145531098e-05, "epoch": 0.201382308678446, "percentage": 20.14, "elapsed_time": "8:32:53", "remaining_time": "1 day, 9:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3614, "total_steps": 17941, "loss": 1.4084, "learning_rate": 9.15422268657319e-05, "epoch": 0.20143804693160916, "percentage": 20.14, "elapsed_time": "8:33:01", "remaining_time": "1 day, 9:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3615, "total_steps": 17941, "loss": 1.9196, "learning_rate": 9.15372709586756e-05, "epoch": 0.20149378518477232, "percentage": 20.15, "elapsed_time": "8:33:10", "remaining_time": "1 day, 9:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3616, "total_steps": 17941, "loss": 1.8508, "learning_rate": 9.153231373429922e-05, "epoch": 0.20154952343793545, "percentage": 20.15, "elapsed_time": "8:33:18", "remaining_time": "1 day, 9:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3617, "total_steps": 17941, "loss": 1.8367, "learning_rate": 9.152735519276002e-05, "epoch": 0.2016052616910986, "percentage": 20.16, "elapsed_time": "8:33:27", "remaining_time": "1 day, 9:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3618, "total_steps": 17941, "loss": 1.5819, "learning_rate": 9.152239533421523e-05, "epoch": 0.20166099994426176, "percentage": 20.17, "elapsed_time": "8:33:35", "remaining_time": "1 day, 9:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3619, "total_steps": 17941, "loss": 1.8245, "learning_rate": 9.151743415882215e-05, "epoch": 0.2017167381974249, "percentage": 20.17, "elapsed_time": "8:33:44", "remaining_time": "1 day, 9:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3620, "total_steps": 17941, "loss": 1.6422, "learning_rate": 9.151247166673811e-05, "epoch": 0.20177247645058805, "percentage": 20.18, "elapsed_time": "8:33:52", "remaining_time": "1 day, 9:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3621, "total_steps": 17941, "loss": 1.5992, "learning_rate": 9.150750785812052e-05, "epoch": 0.20182821470375117, "percentage": 20.18, "elapsed_time": "8:34:01", "remaining_time": "1 day, 9:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3622, "total_steps": 17941, "loss": 1.7729, "learning_rate": 9.150254273312677e-05, "epoch": 0.20188395295691433, "percentage": 20.19, "elapsed_time": "8:34:09", "remaining_time": "1 day, 9:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3623, "total_steps": 17941, "loss": 1.8279, "learning_rate": 9.149757629191436e-05, "epoch": 0.2019396912100775, "percentage": 20.19, "elapsed_time": "8:34:18", "remaining_time": "1 day, 9:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3624, "total_steps": 17941, "loss": 1.6135, "learning_rate": 9.149260853464077e-05, "epoch": 0.20199542946324062, "percentage": 20.2, "elapsed_time": "8:34:26", "remaining_time": "1 day, 9:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3625, "total_steps": 17941, "loss": 1.6617, "learning_rate": 9.148763946146354e-05, "epoch": 0.20205116771640377, "percentage": 20.21, "elapsed_time": "8:34:34", "remaining_time": "1 day, 9:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3626, "total_steps": 17941, "loss": 1.9072, "learning_rate": 9.148266907254031e-05, "epoch": 0.2021069059695669, "percentage": 20.21, "elapsed_time": "8:34:43", "remaining_time": "1 day, 9:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3627, "total_steps": 17941, "loss": 1.7807, "learning_rate": 9.147769736802864e-05, "epoch": 0.20216264422273006, "percentage": 20.22, "elapsed_time": "8:34:52", "remaining_time": "1 day, 9:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3628, "total_steps": 17941, "loss": 1.5633, "learning_rate": 9.147272434808627e-05, "epoch": 0.20221838247589322, "percentage": 20.22, "elapsed_time": "8:35:01", "remaining_time": "1 day, 9:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3629, "total_steps": 17941, "loss": 1.579, "learning_rate": 9.146775001287088e-05, "epoch": 0.20227412072905634, "percentage": 20.23, "elapsed_time": "8:35:10", "remaining_time": "1 day, 9:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3630, "total_steps": 17941, "loss": 1.8881, "learning_rate": 9.146277436254022e-05, "epoch": 0.2023298589822195, "percentage": 20.23, "elapsed_time": "8:35:18", "remaining_time": "1 day, 9:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3631, "total_steps": 17941, "loss": 1.7915, "learning_rate": 9.145779739725213e-05, "epoch": 0.20238559723538263, "percentage": 20.24, "elapsed_time": "8:35:26", "remaining_time": "1 day, 9:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3632, "total_steps": 17941, "loss": 1.8006, "learning_rate": 9.14528191171644e-05, "epoch": 0.2024413354885458, "percentage": 20.24, "elapsed_time": "8:35:35", "remaining_time": "1 day, 9:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3633, "total_steps": 17941, "loss": 1.5753, "learning_rate": 9.144783952243493e-05, "epoch": 0.20249707374170894, "percentage": 20.25, "elapsed_time": "8:35:43", "remaining_time": "1 day, 9:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3634, "total_steps": 17941, "loss": 1.7276, "learning_rate": 9.144285861322166e-05, "epoch": 0.20255281199487207, "percentage": 20.26, "elapsed_time": "8:35:52", "remaining_time": "1 day, 9:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3635, "total_steps": 17941, "loss": 1.8898, "learning_rate": 9.143787638968254e-05, "epoch": 0.20260855024803523, "percentage": 20.26, "elapsed_time": "8:36:00", "remaining_time": "1 day, 9:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3636, "total_steps": 17941, "loss": 1.9973, "learning_rate": 9.143289285197558e-05, "epoch": 0.20266428850119836, "percentage": 20.27, "elapsed_time": "8:36:09", "remaining_time": "1 day, 9:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3637, "total_steps": 17941, "loss": 1.7459, "learning_rate": 9.142790800025883e-05, "epoch": 0.20272002675436152, "percentage": 20.27, "elapsed_time": "8:36:17", "remaining_time": "1 day, 9:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3638, "total_steps": 17941, "loss": 1.9412, "learning_rate": 9.142292183469039e-05, "epoch": 0.20277576500752467, "percentage": 20.28, "elapsed_time": "8:36:25", "remaining_time": "1 day, 9:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3639, "total_steps": 17941, "loss": 1.6073, "learning_rate": 9.141793435542836e-05, "epoch": 0.2028315032606878, "percentage": 20.28, "elapsed_time": "8:36:34", "remaining_time": "1 day, 9:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3640, "total_steps": 17941, "loss": 1.5109, "learning_rate": 9.141294556263096e-05, "epoch": 0.20288724151385096, "percentage": 20.29, "elapsed_time": "8:36:42", "remaining_time": "1 day, 9:50:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3641, "total_steps": 17941, "loss": 1.7593, "learning_rate": 9.140795545645636e-05, "epoch": 0.20294297976701411, "percentage": 20.29, "elapsed_time": "8:36:51", "remaining_time": "1 day, 9:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3642, "total_steps": 17941, "loss": 1.6055, "learning_rate": 9.140296403706284e-05, "epoch": 0.20299871802017724, "percentage": 20.3, "elapsed_time": "8:36:59", "remaining_time": "1 day, 9:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3643, "total_steps": 17941, "loss": 2.0113, "learning_rate": 9.13979713046087e-05, "epoch": 0.2030544562733404, "percentage": 20.31, "elapsed_time": "8:37:08", "remaining_time": "1 day, 9:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3644, "total_steps": 17941, "loss": 1.516, "learning_rate": 9.139297725925229e-05, "epoch": 0.20311019452650353, "percentage": 20.31, "elapsed_time": "8:37:16", "remaining_time": "1 day, 9:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3645, "total_steps": 17941, "loss": 1.9002, "learning_rate": 9.138798190115196e-05, "epoch": 0.20316593277966669, "percentage": 20.32, "elapsed_time": "8:37:25", "remaining_time": "1 day, 9:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3646, "total_steps": 17941, "loss": 1.6288, "learning_rate": 9.138298523046617e-05, "epoch": 0.20322167103282984, "percentage": 20.32, "elapsed_time": "8:37:33", "remaining_time": "1 day, 9:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3647, "total_steps": 17941, "loss": 1.4397, "learning_rate": 9.137798724735336e-05, "epoch": 0.20327740928599297, "percentage": 20.33, "elapsed_time": "8:37:42", "remaining_time": "1 day, 9:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3648, "total_steps": 17941, "loss": 2.1691, "learning_rate": 9.137298795197204e-05, "epoch": 0.20333314753915613, "percentage": 20.33, "elapsed_time": "8:37:50", "remaining_time": "1 day, 9:48:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3649, "total_steps": 17941, "loss": 1.781, "learning_rate": 9.136798734448077e-05, "epoch": 0.20338888579231926, "percentage": 20.34, "elapsed_time": "8:37:58", "remaining_time": "1 day, 9:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3650, "total_steps": 17941, "loss": 1.6205, "learning_rate": 9.136298542503814e-05, "epoch": 0.20344462404548241, "percentage": 20.34, "elapsed_time": "8:38:07", "remaining_time": "1 day, 9:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3651, "total_steps": 17941, "loss": 1.7727, "learning_rate": 9.135798219380276e-05, "epoch": 0.20350036229864557, "percentage": 20.35, "elapsed_time": "8:38:15", "remaining_time": "1 day, 9:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3652, "total_steps": 17941, "loss": 1.7057, "learning_rate": 9.135297765093333e-05, "epoch": 0.2035561005518087, "percentage": 20.36, "elapsed_time": "8:38:24", "remaining_time": "1 day, 9:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3653, "total_steps": 17941, "loss": 1.7132, "learning_rate": 9.134797179658854e-05, "epoch": 0.20361183880497186, "percentage": 20.36, "elapsed_time": "8:38:32", "remaining_time": "1 day, 9:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3654, "total_steps": 17941, "loss": 1.9128, "learning_rate": 9.134296463092717e-05, "epoch": 0.20366757705813499, "percentage": 20.37, "elapsed_time": "8:38:41", "remaining_time": "1 day, 9:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3655, "total_steps": 17941, "loss": 1.6986, "learning_rate": 9.133795615410801e-05, "epoch": 0.20372331531129814, "percentage": 20.37, "elapsed_time": "8:38:49", "remaining_time": "1 day, 9:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3656, "total_steps": 17941, "loss": 1.9381, "learning_rate": 9.13329463662899e-05, "epoch": 0.2037790535644613, "percentage": 20.38, "elapsed_time": "8:38:58", "remaining_time": "1 day, 9:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3657, "total_steps": 17941, "loss": 1.6176, "learning_rate": 9.132793526763171e-05, "epoch": 0.20383479181762443, "percentage": 20.38, "elapsed_time": "8:39:07", "remaining_time": "1 day, 9:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3658, "total_steps": 17941, "loss": 1.5035, "learning_rate": 9.132292285829237e-05, "epoch": 0.20389053007078758, "percentage": 20.39, "elapsed_time": "8:39:15", "remaining_time": "1 day, 9:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3659, "total_steps": 17941, "loss": 1.6288, "learning_rate": 9.131790913843086e-05, "epoch": 0.20394626832395074, "percentage": 20.39, "elapsed_time": "8:39:24", "remaining_time": "1 day, 9:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3660, "total_steps": 17941, "loss": 1.71, "learning_rate": 9.131289410820616e-05, "epoch": 0.20400200657711387, "percentage": 20.4, "elapsed_time": "8:39:32", "remaining_time": "1 day, 9:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3661, "total_steps": 17941, "loss": 1.9395, "learning_rate": 9.130787776777734e-05, "epoch": 0.20405774483027703, "percentage": 20.41, "elapsed_time": "8:39:41", "remaining_time": "1 day, 9:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3662, "total_steps": 17941, "loss": 1.8358, "learning_rate": 9.130286011730347e-05, "epoch": 0.20411348308344016, "percentage": 20.41, "elapsed_time": "8:39:49", "remaining_time": "1 day, 9:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3663, "total_steps": 17941, "loss": 1.602, "learning_rate": 9.129784115694369e-05, "epoch": 0.2041692213366033, "percentage": 20.42, "elapsed_time": "8:39:58", "remaining_time": "1 day, 9:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3664, "total_steps": 17941, "loss": 1.7868, "learning_rate": 9.129282088685718e-05, "epoch": 0.20422495958976647, "percentage": 20.42, "elapsed_time": "8:40:06", "remaining_time": "1 day, 9:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3665, "total_steps": 17941, "loss": 1.6943, "learning_rate": 9.128779930720313e-05, "epoch": 0.2042806978429296, "percentage": 20.43, "elapsed_time": "8:40:14", "remaining_time": "1 day, 9:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3666, "total_steps": 17941, "loss": 1.9083, "learning_rate": 9.128277641814082e-05, "epoch": 0.20433643609609276, "percentage": 20.43, "elapsed_time": "8:40:23", "remaining_time": "1 day, 9:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3667, "total_steps": 17941, "loss": 1.9183, "learning_rate": 9.127775221982954e-05, "epoch": 0.20439217434925588, "percentage": 20.44, "elapsed_time": "8:40:31", "remaining_time": "1 day, 9:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3668, "total_steps": 17941, "loss": 1.6097, "learning_rate": 9.127272671242861e-05, "epoch": 0.20444791260241904, "percentage": 20.44, "elapsed_time": "8:40:40", "remaining_time": "1 day, 9:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3669, "total_steps": 17941, "loss": 1.7121, "learning_rate": 9.126769989609745e-05, "epoch": 0.2045036508555822, "percentage": 20.45, "elapsed_time": "8:40:48", "remaining_time": "1 day, 9:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3670, "total_steps": 17941, "loss": 1.8327, "learning_rate": 9.126267177099543e-05, "epoch": 0.20455938910874533, "percentage": 20.46, "elapsed_time": "8:40:57", "remaining_time": "1 day, 9:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3671, "total_steps": 17941, "loss": 1.9047, "learning_rate": 9.125764233728206e-05, "epoch": 0.20461512736190848, "percentage": 20.46, "elapsed_time": "8:41:05", "remaining_time": "1 day, 9:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3672, "total_steps": 17941, "loss": 1.8311, "learning_rate": 9.125261159511682e-05, "epoch": 0.2046708656150716, "percentage": 20.47, "elapsed_time": "8:41:14", "remaining_time": "1 day, 9:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3673, "total_steps": 17941, "loss": 1.5241, "learning_rate": 9.124757954465925e-05, "epoch": 0.20472660386823477, "percentage": 20.47, "elapsed_time": "8:41:22", "remaining_time": "1 day, 9:45:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3674, "total_steps": 17941, "loss": 1.6949, "learning_rate": 9.124254618606897e-05, "epoch": 0.20478234212139793, "percentage": 20.48, "elapsed_time": "8:41:30", "remaining_time": "1 day, 9:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3675, "total_steps": 17941, "loss": 1.8553, "learning_rate": 9.123751151950557e-05, "epoch": 0.20483808037456105, "percentage": 20.48, "elapsed_time": "8:41:39", "remaining_time": "1 day, 9:45:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3676, "total_steps": 17941, "loss": 1.7906, "learning_rate": 9.123247554512873e-05, "epoch": 0.2048938186277242, "percentage": 20.49, "elapsed_time": "8:41:47", "remaining_time": "1 day, 9:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3677, "total_steps": 17941, "loss": 1.7721, "learning_rate": 9.122743826309819e-05, "epoch": 0.20494955688088734, "percentage": 20.49, "elapsed_time": "8:41:56", "remaining_time": "1 day, 9:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3678, "total_steps": 17941, "loss": 1.9673, "learning_rate": 9.122239967357366e-05, "epoch": 0.2050052951340505, "percentage": 20.5, "elapsed_time": "8:42:05", "remaining_time": "1 day, 9:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3679, "total_steps": 17941, "loss": 2.0516, "learning_rate": 9.121735977671495e-05, "epoch": 0.20506103338721365, "percentage": 20.51, "elapsed_time": "8:42:13", "remaining_time": "1 day, 9:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3680, "total_steps": 17941, "loss": 1.5958, "learning_rate": 9.121231857268191e-05, "epoch": 0.20511677164037678, "percentage": 20.51, "elapsed_time": "8:42:22", "remaining_time": "1 day, 9:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3681, "total_steps": 17941, "loss": 1.6989, "learning_rate": 9.120727606163442e-05, "epoch": 0.20517250989353994, "percentage": 20.52, "elapsed_time": "8:42:30", "remaining_time": "1 day, 9:44:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3682, "total_steps": 17941, "loss": 1.4492, "learning_rate": 9.120223224373238e-05, "epoch": 0.2052282481467031, "percentage": 20.52, "elapsed_time": "8:42:39", "remaining_time": "1 day, 9:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3683, "total_steps": 17941, "loss": 1.6674, "learning_rate": 9.119718711913575e-05, "epoch": 0.20528398639986623, "percentage": 20.53, "elapsed_time": "8:42:48", "remaining_time": "1 day, 9:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3684, "total_steps": 17941, "loss": 1.6326, "learning_rate": 9.119214068800456e-05, "epoch": 0.20533972465302938, "percentage": 20.53, "elapsed_time": "8:42:57", "remaining_time": "1 day, 9:43:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3685, "total_steps": 17941, "loss": 1.9069, "learning_rate": 9.118709295049883e-05, "epoch": 0.2053954629061925, "percentage": 20.54, "elapsed_time": "8:43:05", "remaining_time": "1 day, 9:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3686, "total_steps": 17941, "loss": 1.6096, "learning_rate": 9.118204390677863e-05, "epoch": 0.20545120115935567, "percentage": 20.55, "elapsed_time": "8:43:14", "remaining_time": "1 day, 9:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3687, "total_steps": 17941, "loss": 1.7118, "learning_rate": 9.117699355700412e-05, "epoch": 0.20550693941251882, "percentage": 20.55, "elapsed_time": "8:43:22", "remaining_time": "1 day, 9:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3688, "total_steps": 17941, "loss": 1.713, "learning_rate": 9.117194190133545e-05, "epoch": 0.20556267766568195, "percentage": 20.56, "elapsed_time": "8:43:31", "remaining_time": "1 day, 9:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3689, "total_steps": 17941, "loss": 1.8858, "learning_rate": 9.116688893993284e-05, "epoch": 0.2056184159188451, "percentage": 20.56, "elapsed_time": "8:43:39", "remaining_time": "1 day, 9:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3690, "total_steps": 17941, "loss": 1.5922, "learning_rate": 9.116183467295651e-05, "epoch": 0.20567415417200824, "percentage": 20.57, "elapsed_time": "8:43:48", "remaining_time": "1 day, 9:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3691, "total_steps": 17941, "loss": 1.4441, "learning_rate": 9.115677910056681e-05, "epoch": 0.2057298924251714, "percentage": 20.57, "elapsed_time": "8:43:56", "remaining_time": "1 day, 9:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3692, "total_steps": 17941, "loss": 1.9545, "learning_rate": 9.115172222292401e-05, "epoch": 0.20578563067833455, "percentage": 20.58, "elapsed_time": "8:44:05", "remaining_time": "1 day, 9:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3693, "total_steps": 17941, "loss": 2.0095, "learning_rate": 9.114666404018853e-05, "epoch": 0.20584136893149768, "percentage": 20.58, "elapsed_time": "8:44:14", "remaining_time": "1 day, 9:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3694, "total_steps": 17941, "loss": 1.7295, "learning_rate": 9.114160455252074e-05, "epoch": 0.20589710718466084, "percentage": 20.59, "elapsed_time": "8:44:22", "remaining_time": "1 day, 9:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3695, "total_steps": 17941, "loss": 1.787, "learning_rate": 9.113654376008115e-05, "epoch": 0.20595284543782397, "percentage": 20.6, "elapsed_time": "8:44:31", "remaining_time": "1 day, 9:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3696, "total_steps": 17941, "loss": 1.6167, "learning_rate": 9.113148166303023e-05, "epoch": 0.20600858369098712, "percentage": 20.6, "elapsed_time": "8:44:39", "remaining_time": "1 day, 9:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3697, "total_steps": 17941, "loss": 1.7855, "learning_rate": 9.112641826152853e-05, "epoch": 0.20606432194415028, "percentage": 20.61, "elapsed_time": "8:44:48", "remaining_time": "1 day, 9:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3698, "total_steps": 17941, "loss": 1.7013, "learning_rate": 9.11213535557366e-05, "epoch": 0.2061200601973134, "percentage": 20.61, "elapsed_time": "8:44:56", "remaining_time": "1 day, 9:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3699, "total_steps": 17941, "loss": 1.7804, "learning_rate": 9.111628754581512e-05, "epoch": 0.20617579845047657, "percentage": 20.62, "elapsed_time": "8:45:05", "remaining_time": "1 day, 9:41:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3700, "total_steps": 17941, "loss": 1.8347, "learning_rate": 9.111122023192471e-05, "epoch": 0.2062315367036397, "percentage": 20.62, "elapsed_time": "8:45:13", "remaining_time": "1 day, 9:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3701, "total_steps": 17941, "loss": 1.878, "learning_rate": 9.110615161422609e-05, "epoch": 0.20628727495680285, "percentage": 20.63, "elapsed_time": "8:45:22", "remaining_time": "1 day, 9:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3702, "total_steps": 17941, "loss": 1.7626, "learning_rate": 9.110108169288001e-05, "epoch": 0.206343013209966, "percentage": 20.63, "elapsed_time": "8:45:30", "remaining_time": "1 day, 9:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3703, "total_steps": 17941, "loss": 1.8064, "learning_rate": 9.109601046804726e-05, "epoch": 0.20639875146312914, "percentage": 20.64, "elapsed_time": "8:45:39", "remaining_time": "1 day, 9:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3704, "total_steps": 17941, "loss": 1.8228, "learning_rate": 9.109093793988865e-05, "epoch": 0.2064544897162923, "percentage": 20.65, "elapsed_time": "8:45:47", "remaining_time": "1 day, 9:40:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3705, "total_steps": 17941, "loss": 1.8011, "learning_rate": 9.108586410856508e-05, "epoch": 0.20651022796945545, "percentage": 20.65, "elapsed_time": "8:45:55", "remaining_time": "1 day, 9:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3706, "total_steps": 17941, "loss": 1.8751, "learning_rate": 9.108078897423743e-05, "epoch": 0.20656596622261858, "percentage": 20.66, "elapsed_time": "8:46:04", "remaining_time": "1 day, 9:40:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3707, "total_steps": 17941, "loss": 1.8607, "learning_rate": 9.107571253706668e-05, "epoch": 0.20662170447578174, "percentage": 20.66, "elapsed_time": "8:46:12", "remaining_time": "1 day, 9:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3708, "total_steps": 17941, "loss": 1.4375, "learning_rate": 9.107063479721383e-05, "epoch": 0.20667744272894487, "percentage": 20.67, "elapsed_time": "8:46:21", "remaining_time": "1 day, 9:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3709, "total_steps": 17941, "loss": 1.3254, "learning_rate": 9.106555575483988e-05, "epoch": 0.20673318098210802, "percentage": 20.67, "elapsed_time": "8:46:29", "remaining_time": "1 day, 9:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3710, "total_steps": 17941, "loss": 1.776, "learning_rate": 9.106047541010593e-05, "epoch": 0.20678891923527118, "percentage": 20.68, "elapsed_time": "8:46:38", "remaining_time": "1 day, 9:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3711, "total_steps": 17941, "loss": 1.7099, "learning_rate": 9.105539376317312e-05, "epoch": 0.2068446574884343, "percentage": 20.68, "elapsed_time": "8:46:46", "remaining_time": "1 day, 9:39:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3712, "total_steps": 17941, "loss": 1.6337, "learning_rate": 9.105031081420259e-05, "epoch": 0.20690039574159746, "percentage": 20.69, "elapsed_time": "8:46:55", "remaining_time": "1 day, 9:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3713, "total_steps": 17941, "loss": 1.4172, "learning_rate": 9.104522656335553e-05, "epoch": 0.2069561339947606, "percentage": 20.7, "elapsed_time": "8:47:03", "remaining_time": "1 day, 9:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3714, "total_steps": 17941, "loss": 1.6826, "learning_rate": 9.10401410107932e-05, "epoch": 0.20701187224792375, "percentage": 20.7, "elapsed_time": "8:47:12", "remaining_time": "1 day, 9:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3715, "total_steps": 17941, "loss": 1.9881, "learning_rate": 9.103505415667686e-05, "epoch": 0.2070676105010869, "percentage": 20.71, "elapsed_time": "8:47:20", "remaining_time": "1 day, 9:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3716, "total_steps": 17941, "loss": 1.8194, "learning_rate": 9.102996600116786e-05, "epoch": 0.20712334875425004, "percentage": 20.71, "elapsed_time": "8:47:28", "remaining_time": "1 day, 9:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3717, "total_steps": 17941, "loss": 1.9822, "learning_rate": 9.102487654442758e-05, "epoch": 0.2071790870074132, "percentage": 20.72, "elapsed_time": "8:47:37", "remaining_time": "1 day, 9:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3718, "total_steps": 17941, "loss": 1.8422, "learning_rate": 9.101978578661738e-05, "epoch": 0.20723482526057632, "percentage": 20.72, "elapsed_time": "8:47:45", "remaining_time": "1 day, 9:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3719, "total_steps": 17941, "loss": 1.6269, "learning_rate": 9.101469372789874e-05, "epoch": 0.20729056351373948, "percentage": 20.73, "elapsed_time": "8:47:54", "remaining_time": "1 day, 9:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3720, "total_steps": 17941, "loss": 1.6431, "learning_rate": 9.100960036843317e-05, "epoch": 0.20734630176690264, "percentage": 20.73, "elapsed_time": "8:48:02", "remaining_time": "1 day, 9:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3721, "total_steps": 17941, "loss": 1.6332, "learning_rate": 9.100450570838216e-05, "epoch": 0.20740204002006576, "percentage": 20.74, "elapsed_time": "8:48:11", "remaining_time": "1 day, 9:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3722, "total_steps": 17941, "loss": 1.4083, "learning_rate": 9.09994097479073e-05, "epoch": 0.20745777827322892, "percentage": 20.75, "elapsed_time": "8:48:19", "remaining_time": "1 day, 9:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3723, "total_steps": 17941, "loss": 1.673, "learning_rate": 9.099431248717022e-05, "epoch": 0.20751351652639205, "percentage": 20.75, "elapsed_time": "8:48:28", "remaining_time": "1 day, 9:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3724, "total_steps": 17941, "loss": 1.8618, "learning_rate": 9.098921392633255e-05, "epoch": 0.2075692547795552, "percentage": 20.76, "elapsed_time": "8:48:36", "remaining_time": "1 day, 9:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3725, "total_steps": 17941, "loss": 1.761, "learning_rate": 9.0984114065556e-05, "epoch": 0.20762499303271836, "percentage": 20.76, "elapsed_time": "8:48:45", "remaining_time": "1 day, 9:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3726, "total_steps": 17941, "loss": 1.5652, "learning_rate": 9.097901290500231e-05, "epoch": 0.2076807312858815, "percentage": 20.77, "elapsed_time": "8:48:53", "remaining_time": "1 day, 9:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3727, "total_steps": 17941, "loss": 1.6899, "learning_rate": 9.097391044483325e-05, "epoch": 0.20773646953904465, "percentage": 20.77, "elapsed_time": "8:49:01", "remaining_time": "1 day, 9:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3728, "total_steps": 17941, "loss": 2.0674, "learning_rate": 9.096880668521066e-05, "epoch": 0.2077922077922078, "percentage": 20.78, "elapsed_time": "8:49:10", "remaining_time": "1 day, 9:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3729, "total_steps": 17941, "loss": 1.8427, "learning_rate": 9.096370162629637e-05, "epoch": 0.20784794604537093, "percentage": 20.78, "elapsed_time": "8:49:18", "remaining_time": "1 day, 9:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3730, "total_steps": 17941, "loss": 1.6487, "learning_rate": 9.09585952682523e-05, "epoch": 0.2079036842985341, "percentage": 20.79, "elapsed_time": "8:49:27", "remaining_time": "1 day, 9:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3731, "total_steps": 17941, "loss": 1.7153, "learning_rate": 9.09534876112404e-05, "epoch": 0.20795942255169722, "percentage": 20.8, "elapsed_time": "8:49:35", "remaining_time": "1 day, 9:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3732, "total_steps": 17941, "loss": 1.7336, "learning_rate": 9.094837865542265e-05, "epoch": 0.20801516080486038, "percentage": 20.8, "elapsed_time": "8:49:44", "remaining_time": "1 day, 9:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3733, "total_steps": 17941, "loss": 1.4747, "learning_rate": 9.094326840096106e-05, "epoch": 0.20807089905802353, "percentage": 20.81, "elapsed_time": "8:49:52", "remaining_time": "1 day, 9:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3734, "total_steps": 17941, "loss": 1.67, "learning_rate": 9.093815684801772e-05, "epoch": 0.20812663731118666, "percentage": 20.81, "elapsed_time": "8:50:01", "remaining_time": "1 day, 9:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3735, "total_steps": 17941, "loss": 1.8801, "learning_rate": 9.093304399675474e-05, "epoch": 0.20818237556434982, "percentage": 20.82, "elapsed_time": "8:50:10", "remaining_time": "1 day, 9:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3736, "total_steps": 17941, "loss": 1.5878, "learning_rate": 9.092792984733425e-05, "epoch": 0.20823811381751295, "percentage": 20.82, "elapsed_time": "8:50:18", "remaining_time": "1 day, 9:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3737, "total_steps": 17941, "loss": 1.9247, "learning_rate": 9.092281439991846e-05, "epoch": 0.2082938520706761, "percentage": 20.83, "elapsed_time": "8:50:27", "remaining_time": "1 day, 9:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3738, "total_steps": 17941, "loss": 1.7421, "learning_rate": 9.091769765466959e-05, "epoch": 0.20834959032383926, "percentage": 20.83, "elapsed_time": "8:50:35", "remaining_time": "1 day, 9:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3739, "total_steps": 17941, "loss": 2.0567, "learning_rate": 9.091257961174991e-05, "epoch": 0.2084053285770024, "percentage": 20.84, "elapsed_time": "8:50:43", "remaining_time": "1 day, 9:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3740, "total_steps": 17941, "loss": 1.6464, "learning_rate": 9.090746027132175e-05, "epoch": 0.20846106683016555, "percentage": 20.85, "elapsed_time": "8:50:52", "remaining_time": "1 day, 9:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3741, "total_steps": 17941, "loss": 1.8313, "learning_rate": 9.090233963354746e-05, "epoch": 0.20851680508332868, "percentage": 20.85, "elapsed_time": "8:51:00", "remaining_time": "1 day, 9:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3742, "total_steps": 17941, "loss": 1.629, "learning_rate": 9.089721769858943e-05, "epoch": 0.20857254333649183, "percentage": 20.86, "elapsed_time": "8:51:10", "remaining_time": "1 day, 9:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3743, "total_steps": 17941, "loss": 1.6353, "learning_rate": 9.08920944666101e-05, "epoch": 0.208628281589655, "percentage": 20.86, "elapsed_time": "8:51:18", "remaining_time": "1 day, 9:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3744, "total_steps": 17941, "loss": 1.6882, "learning_rate": 9.088696993777194e-05, "epoch": 0.20868401984281812, "percentage": 20.87, "elapsed_time": "8:51:27", "remaining_time": "1 day, 9:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3745, "total_steps": 17941, "loss": 1.5986, "learning_rate": 9.08818441122375e-05, "epoch": 0.20873975809598128, "percentage": 20.87, "elapsed_time": "8:51:35", "remaining_time": "1 day, 9:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3746, "total_steps": 17941, "loss": 1.6445, "learning_rate": 9.08767169901693e-05, "epoch": 0.2087954963491444, "percentage": 20.88, "elapsed_time": "8:51:43", "remaining_time": "1 day, 9:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3747, "total_steps": 17941, "loss": 1.851, "learning_rate": 9.087158857172999e-05, "epoch": 0.20885123460230756, "percentage": 20.89, "elapsed_time": "8:51:52", "remaining_time": "1 day, 9:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3748, "total_steps": 17941, "loss": 1.6359, "learning_rate": 9.086645885708218e-05, "epoch": 0.20890697285547072, "percentage": 20.89, "elapsed_time": "8:52:00", "remaining_time": "1 day, 9:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3749, "total_steps": 17941, "loss": 1.7563, "learning_rate": 9.086132784638857e-05, "epoch": 0.20896271110863385, "percentage": 20.9, "elapsed_time": "8:52:09", "remaining_time": "1 day, 9:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3750, "total_steps": 17941, "loss": 1.8104, "learning_rate": 9.085619553981187e-05, "epoch": 0.209018449361797, "percentage": 20.9, "elapsed_time": "8:52:17", "remaining_time": "1 day, 9:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3751, "total_steps": 17941, "loss": 1.4561, "learning_rate": 9.085106193751485e-05, "epoch": 0.20907418761496016, "percentage": 20.91, "elapsed_time": "8:52:26", "remaining_time": "1 day, 9:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3752, "total_steps": 17941, "loss": 1.6986, "learning_rate": 9.084592703966033e-05, "epoch": 0.2091299258681233, "percentage": 20.91, "elapsed_time": "8:52:34", "remaining_time": "1 day, 9:34:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3753, "total_steps": 17941, "loss": 1.7837, "learning_rate": 9.084079084641115e-05, "epoch": 0.20918566412128645, "percentage": 20.92, "elapsed_time": "8:52:43", "remaining_time": "1 day, 9:33:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3754, "total_steps": 17941, "loss": 1.7262, "learning_rate": 9.083565335793021e-05, "epoch": 0.20924140237444958, "percentage": 20.92, "elapsed_time": "8:52:52", "remaining_time": "1 day, 9:33:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3755, "total_steps": 17941, "loss": 1.7848, "learning_rate": 9.083051457438043e-05, "epoch": 0.20929714062761273, "percentage": 20.93, "elapsed_time": "8:53:00", "remaining_time": "1 day, 9:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3756, "total_steps": 17941, "loss": 2.0356, "learning_rate": 9.082537449592479e-05, "epoch": 0.2093528788807759, "percentage": 20.94, "elapsed_time": "8:53:09", "remaining_time": "1 day, 9:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3757, "total_steps": 17941, "loss": 1.9959, "learning_rate": 9.08202331227263e-05, "epoch": 0.20940861713393902, "percentage": 20.94, "elapsed_time": "8:53:18", "remaining_time": "1 day, 9:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3758, "total_steps": 17941, "loss": 1.7899, "learning_rate": 9.0815090454948e-05, "epoch": 0.20946435538710217, "percentage": 20.95, "elapsed_time": "8:53:26", "remaining_time": "1 day, 9:33:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3759, "total_steps": 17941, "loss": 1.4062, "learning_rate": 9.0809946492753e-05, "epoch": 0.2095200936402653, "percentage": 20.95, "elapsed_time": "8:53:35", "remaining_time": "1 day, 9:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3760, "total_steps": 17941, "loss": 1.6807, "learning_rate": 9.080480123630444e-05, "epoch": 0.20957583189342846, "percentage": 20.96, "elapsed_time": "8:53:43", "remaining_time": "1 day, 9:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3761, "total_steps": 17941, "loss": 1.9714, "learning_rate": 9.07996546857655e-05, "epoch": 0.20963157014659162, "percentage": 20.96, "elapsed_time": "8:53:52", "remaining_time": "1 day, 9:32:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3762, "total_steps": 17941, "loss": 1.7811, "learning_rate": 9.07945068412994e-05, "epoch": 0.20968730839975475, "percentage": 20.97, "elapsed_time": "8:54:00", "remaining_time": "1 day, 9:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3763, "total_steps": 17941, "loss": 1.7003, "learning_rate": 9.078935770306938e-05, "epoch": 0.2097430466529179, "percentage": 20.97, "elapsed_time": "8:54:08", "remaining_time": "1 day, 9:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3764, "total_steps": 17941, "loss": 2.0188, "learning_rate": 9.078420727123874e-05, "epoch": 0.20979878490608103, "percentage": 20.98, "elapsed_time": "8:54:17", "remaining_time": "1 day, 9:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3765, "total_steps": 17941, "loss": 1.7745, "learning_rate": 9.077905554597086e-05, "epoch": 0.2098545231592442, "percentage": 20.99, "elapsed_time": "8:54:25", "remaining_time": "1 day, 9:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3766, "total_steps": 17941, "loss": 1.7723, "learning_rate": 9.077390252742907e-05, "epoch": 0.20991026141240735, "percentage": 20.99, "elapsed_time": "8:54:34", "remaining_time": "1 day, 9:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3767, "total_steps": 17941, "loss": 1.7731, "learning_rate": 9.076874821577683e-05, "epoch": 0.20996599966557047, "percentage": 21.0, "elapsed_time": "8:54:42", "remaining_time": "1 day, 9:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3768, "total_steps": 17941, "loss": 1.6495, "learning_rate": 9.07635926111776e-05, "epoch": 0.21002173791873363, "percentage": 21.0, "elapsed_time": "8:54:50", "remaining_time": "1 day, 9:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3769, "total_steps": 17941, "loss": 1.9732, "learning_rate": 9.075843571379488e-05, "epoch": 0.21007747617189676, "percentage": 21.01, "elapsed_time": "8:54:59", "remaining_time": "1 day, 9:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3770, "total_steps": 17941, "loss": 1.8381, "learning_rate": 9.075327752379221e-05, "epoch": 0.21013321442505992, "percentage": 21.01, "elapsed_time": "8:55:07", "remaining_time": "1 day, 9:31:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3771, "total_steps": 17941, "loss": 1.7662, "learning_rate": 9.074811804133318e-05, "epoch": 0.21018895267822307, "percentage": 21.02, "elapsed_time": "8:55:16", "remaining_time": "1 day, 9:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3772, "total_steps": 17941, "loss": 1.6434, "learning_rate": 9.074295726658144e-05, "epoch": 0.2102446909313862, "percentage": 21.02, "elapsed_time": "8:55:24", "remaining_time": "1 day, 9:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3773, "total_steps": 17941, "loss": 1.7831, "learning_rate": 9.073779519970065e-05, "epoch": 0.21030042918454936, "percentage": 21.03, "elapsed_time": "8:55:33", "remaining_time": "1 day, 9:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3774, "total_steps": 17941, "loss": 1.9085, "learning_rate": 9.07326318408545e-05, "epoch": 0.21035616743771252, "percentage": 21.04, "elapsed_time": "8:55:41", "remaining_time": "1 day, 9:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3775, "total_steps": 17941, "loss": 1.851, "learning_rate": 9.072746719020676e-05, "epoch": 0.21041190569087564, "percentage": 21.04, "elapsed_time": "8:55:51", "remaining_time": "1 day, 9:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3776, "total_steps": 17941, "loss": 1.9007, "learning_rate": 9.072230124792121e-05, "epoch": 0.2104676439440388, "percentage": 21.05, "elapsed_time": "8:55:59", "remaining_time": "1 day, 9:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3777, "total_steps": 17941, "loss": 1.7664, "learning_rate": 9.07171340141617e-05, "epoch": 0.21052338219720193, "percentage": 21.05, "elapsed_time": "8:56:08", "remaining_time": "1 day, 9:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3778, "total_steps": 17941, "loss": 1.5912, "learning_rate": 9.071196548909208e-05, "epoch": 0.2105791204503651, "percentage": 21.06, "elapsed_time": "8:56:16", "remaining_time": "1 day, 9:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3779, "total_steps": 17941, "loss": 1.8595, "learning_rate": 9.070679567287631e-05, "epoch": 0.21063485870352824, "percentage": 21.06, "elapsed_time": "8:56:24", "remaining_time": "1 day, 9:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3780, "total_steps": 17941, "loss": 1.5864, "learning_rate": 9.07016245656783e-05, "epoch": 0.21069059695669137, "percentage": 21.07, "elapsed_time": "8:56:33", "remaining_time": "1 day, 9:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3781, "total_steps": 17941, "loss": 1.8166, "learning_rate": 9.069645216766208e-05, "epoch": 0.21074633520985453, "percentage": 21.07, "elapsed_time": "8:56:41", "remaining_time": "1 day, 9:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3782, "total_steps": 17941, "loss": 1.7482, "learning_rate": 9.069127847899166e-05, "epoch": 0.21080207346301766, "percentage": 21.08, "elapsed_time": "8:56:50", "remaining_time": "1 day, 9:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3783, "total_steps": 17941, "loss": 1.7065, "learning_rate": 9.068610349983113e-05, "epoch": 0.21085781171618082, "percentage": 21.09, "elapsed_time": "8:56:58", "remaining_time": "1 day, 9:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3784, "total_steps": 17941, "loss": 1.7781, "learning_rate": 9.068092723034462e-05, "epoch": 0.21091354996934397, "percentage": 21.09, "elapsed_time": "8:57:07", "remaining_time": "1 day, 9:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3785, "total_steps": 17941, "loss": 1.7871, "learning_rate": 9.067574967069628e-05, "epoch": 0.2109692882225071, "percentage": 21.1, "elapsed_time": "8:57:15", "remaining_time": "1 day, 9:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3786, "total_steps": 17941, "loss": 1.9512, "learning_rate": 9.067057082105032e-05, "epoch": 0.21102502647567026, "percentage": 21.1, "elapsed_time": "8:57:23", "remaining_time": "1 day, 9:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3787, "total_steps": 17941, "loss": 1.4585, "learning_rate": 9.066539068157098e-05, "epoch": 0.2110807647288334, "percentage": 21.11, "elapsed_time": "8:57:32", "remaining_time": "1 day, 9:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3788, "total_steps": 17941, "loss": 1.9236, "learning_rate": 9.066020925242256e-05, "epoch": 0.21113650298199654, "percentage": 21.11, "elapsed_time": "8:57:40", "remaining_time": "1 day, 9:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3789, "total_steps": 17941, "loss": 1.67, "learning_rate": 9.065502653376935e-05, "epoch": 0.2111922412351597, "percentage": 21.12, "elapsed_time": "8:57:49", "remaining_time": "1 day, 9:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3790, "total_steps": 17941, "loss": 1.8769, "learning_rate": 9.064984252577573e-05, "epoch": 0.21124797948832283, "percentage": 21.12, "elapsed_time": "8:57:58", "remaining_time": "1 day, 9:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3791, "total_steps": 17941, "loss": 1.6658, "learning_rate": 9.064465722860611e-05, "epoch": 0.21130371774148599, "percentage": 21.13, "elapsed_time": "8:58:06", "remaining_time": "1 day, 9:28:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3792, "total_steps": 17941, "loss": 1.7003, "learning_rate": 9.063947064242495e-05, "epoch": 0.21135945599464911, "percentage": 21.14, "elapsed_time": "8:58:15", "remaining_time": "1 day, 9:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3793, "total_steps": 17941, "loss": 1.7658, "learning_rate": 9.063428276739671e-05, "epoch": 0.21141519424781227, "percentage": 21.14, "elapsed_time": "8:58:23", "remaining_time": "1 day, 9:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3794, "total_steps": 17941, "loss": 1.7443, "learning_rate": 9.062909360368595e-05, "epoch": 0.21147093250097543, "percentage": 21.15, "elapsed_time": "8:58:32", "remaining_time": "1 day, 9:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3795, "total_steps": 17941, "loss": 1.4051, "learning_rate": 9.062390315145723e-05, "epoch": 0.21152667075413856, "percentage": 21.15, "elapsed_time": "8:58:40", "remaining_time": "1 day, 9:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3796, "total_steps": 17941, "loss": 1.6788, "learning_rate": 9.061871141087515e-05, "epoch": 0.2115824090073017, "percentage": 21.16, "elapsed_time": "8:58:49", "remaining_time": "1 day, 9:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3797, "total_steps": 17941, "loss": 1.7306, "learning_rate": 9.061351838210434e-05, "epoch": 0.21163814726046487, "percentage": 21.16, "elapsed_time": "8:58:57", "remaining_time": "1 day, 9:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3798, "total_steps": 17941, "loss": 1.7759, "learning_rate": 9.060832406530955e-05, "epoch": 0.211693885513628, "percentage": 21.17, "elapsed_time": "8:59:06", "remaining_time": "1 day, 9:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3799, "total_steps": 17941, "loss": 1.8155, "learning_rate": 9.060312846065548e-05, "epoch": 0.21174962376679116, "percentage": 21.17, "elapsed_time": "8:59:15", "remaining_time": "1 day, 9:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3800, "total_steps": 17941, "loss": 1.9103, "learning_rate": 9.059793156830691e-05, "epoch": 0.21180536201995429, "percentage": 21.18, "elapsed_time": "8:59:23", "remaining_time": "1 day, 9:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3801, "total_steps": 17941, "loss": 1.6333, "learning_rate": 9.059273338842864e-05, "epoch": 0.21186110027311744, "percentage": 21.19, "elapsed_time": "8:59:32", "remaining_time": "1 day, 9:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3802, "total_steps": 17941, "loss": 1.9328, "learning_rate": 9.058753392118555e-05, "epoch": 0.2119168385262806, "percentage": 21.19, "elapsed_time": "8:59:40", "remaining_time": "1 day, 9:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3803, "total_steps": 17941, "loss": 1.6296, "learning_rate": 9.058233316674252e-05, "epoch": 0.21197257677944373, "percentage": 21.2, "elapsed_time": "8:59:49", "remaining_time": "1 day, 9:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3804, "total_steps": 17941, "loss": 1.6512, "learning_rate": 9.057713112526449e-05, "epoch": 0.21202831503260688, "percentage": 21.2, "elapsed_time": "8:59:57", "remaining_time": "1 day, 9:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3805, "total_steps": 17941, "loss": 1.793, "learning_rate": 9.057192779691645e-05, "epoch": 0.21208405328577, "percentage": 21.21, "elapsed_time": "9:00:06", "remaining_time": "1 day, 9:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3806, "total_steps": 17941, "loss": 1.8989, "learning_rate": 9.05667231818634e-05, "epoch": 0.21213979153893317, "percentage": 21.21, "elapsed_time": "9:00:14", "remaining_time": "1 day, 9:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3807, "total_steps": 17941, "loss": 1.7235, "learning_rate": 9.056151728027042e-05, "epoch": 0.21219552979209633, "percentage": 21.22, "elapsed_time": "9:00:22", "remaining_time": "1 day, 9:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3808, "total_steps": 17941, "loss": 1.779, "learning_rate": 9.055631009230262e-05, "epoch": 0.21225126804525946, "percentage": 21.23, "elapsed_time": "9:00:31", "remaining_time": "1 day, 9:26:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3809, "total_steps": 17941, "loss": 1.9023, "learning_rate": 9.05511016181251e-05, "epoch": 0.2123070062984226, "percentage": 21.23, "elapsed_time": "9:00:39", "remaining_time": "1 day, 9:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3810, "total_steps": 17941, "loss": 1.6484, "learning_rate": 9.054589185790305e-05, "epoch": 0.21236274455158574, "percentage": 21.24, "elapsed_time": "9:00:48", "remaining_time": "1 day, 9:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3811, "total_steps": 17941, "loss": 1.6866, "learning_rate": 9.054068081180173e-05, "epoch": 0.2124184828047489, "percentage": 21.24, "elapsed_time": "9:00:56", "remaining_time": "1 day, 9:25:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3812, "total_steps": 17941, "loss": 1.6013, "learning_rate": 9.05354684799864e-05, "epoch": 0.21247422105791205, "percentage": 21.25, "elapsed_time": "9:01:05", "remaining_time": "1 day, 9:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3813, "total_steps": 17941, "loss": 1.7741, "learning_rate": 9.053025486262231e-05, "epoch": 0.21252995931107518, "percentage": 21.25, "elapsed_time": "9:01:13", "remaining_time": "1 day, 9:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3814, "total_steps": 17941, "loss": 1.7829, "learning_rate": 9.052503995987488e-05, "epoch": 0.21258569756423834, "percentage": 21.26, "elapsed_time": "9:01:22", "remaining_time": "1 day, 9:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3815, "total_steps": 17941, "loss": 1.6395, "learning_rate": 9.051982377190944e-05, "epoch": 0.21264143581740147, "percentage": 21.26, "elapsed_time": "9:01:30", "remaining_time": "1 day, 9:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3816, "total_steps": 17941, "loss": 1.4752, "learning_rate": 9.051460629889144e-05, "epoch": 0.21269717407056463, "percentage": 21.27, "elapsed_time": "9:01:39", "remaining_time": "1 day, 9:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3817, "total_steps": 17941, "loss": 1.7896, "learning_rate": 9.050938754098635e-05, "epoch": 0.21275291232372778, "percentage": 21.28, "elapsed_time": "9:01:47", "remaining_time": "1 day, 9:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3818, "total_steps": 17941, "loss": 1.5488, "learning_rate": 9.050416749835968e-05, "epoch": 0.2128086505768909, "percentage": 21.28, "elapsed_time": "9:01:55", "remaining_time": "1 day, 9:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3819, "total_steps": 17941, "loss": 1.9669, "learning_rate": 9.049894617117696e-05, "epoch": 0.21286438883005407, "percentage": 21.29, "elapsed_time": "9:02:04", "remaining_time": "1 day, 9:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3820, "total_steps": 17941, "loss": 1.761, "learning_rate": 9.04937235596038e-05, "epoch": 0.21292012708321723, "percentage": 21.29, "elapsed_time": "9:02:12", "remaining_time": "1 day, 9:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3821, "total_steps": 17941, "loss": 1.7399, "learning_rate": 9.04884996638058e-05, "epoch": 0.21297586533638035, "percentage": 21.3, "elapsed_time": "9:02:21", "remaining_time": "1 day, 9:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3822, "total_steps": 17941, "loss": 1.863, "learning_rate": 9.048327448394868e-05, "epoch": 0.2130316035895435, "percentage": 21.3, "elapsed_time": "9:02:29", "remaining_time": "1 day, 9:24:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3823, "total_steps": 17941, "loss": 1.4662, "learning_rate": 9.047804802019813e-05, "epoch": 0.21308734184270664, "percentage": 21.31, "elapsed_time": "9:02:38", "remaining_time": "1 day, 9:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3824, "total_steps": 17941, "loss": 1.7569, "learning_rate": 9.047282027271988e-05, "epoch": 0.2131430800958698, "percentage": 21.31, "elapsed_time": "9:02:46", "remaining_time": "1 day, 9:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3825, "total_steps": 17941, "loss": 1.5647, "learning_rate": 9.046759124167976e-05, "epoch": 0.21319881834903295, "percentage": 21.32, "elapsed_time": "9:02:54", "remaining_time": "1 day, 9:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3826, "total_steps": 17941, "loss": 1.8287, "learning_rate": 9.046236092724357e-05, "epoch": 0.21325455660219608, "percentage": 21.33, "elapsed_time": "9:03:03", "remaining_time": "1 day, 9:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3827, "total_steps": 17941, "loss": 1.7175, "learning_rate": 9.045712932957722e-05, "epoch": 0.21331029485535924, "percentage": 21.33, "elapsed_time": "9:03:11", "remaining_time": "1 day, 9:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3828, "total_steps": 17941, "loss": 1.9759, "learning_rate": 9.045189644884661e-05, "epoch": 0.21336603310852237, "percentage": 21.34, "elapsed_time": "9:03:20", "remaining_time": "1 day, 9:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3829, "total_steps": 17941, "loss": 1.7102, "learning_rate": 9.04466622852177e-05, "epoch": 0.21342177136168552, "percentage": 21.34, "elapsed_time": "9:03:28", "remaining_time": "1 day, 9:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3830, "total_steps": 17941, "loss": 1.647, "learning_rate": 9.044142683885645e-05, "epoch": 0.21347750961484868, "percentage": 21.35, "elapsed_time": "9:03:37", "remaining_time": "1 day, 9:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3831, "total_steps": 17941, "loss": 2.2611, "learning_rate": 9.043619010992897e-05, "epoch": 0.2135332478680118, "percentage": 21.35, "elapsed_time": "9:03:45", "remaining_time": "1 day, 9:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3832, "total_steps": 17941, "loss": 1.7279, "learning_rate": 9.043095209860128e-05, "epoch": 0.21358898612117497, "percentage": 21.36, "elapsed_time": "9:03:54", "remaining_time": "1 day, 9:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3833, "total_steps": 17941, "loss": 1.7293, "learning_rate": 9.042571280503951e-05, "epoch": 0.2136447243743381, "percentage": 21.36, "elapsed_time": "9:04:02", "remaining_time": "1 day, 9:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3834, "total_steps": 17941, "loss": 1.8327, "learning_rate": 9.042047222940985e-05, "epoch": 0.21370046262750125, "percentage": 21.37, "elapsed_time": "9:04:11", "remaining_time": "1 day, 9:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3835, "total_steps": 17941, "loss": 1.6961, "learning_rate": 9.041523037187847e-05, "epoch": 0.2137562008806644, "percentage": 21.38, "elapsed_time": "9:04:19", "remaining_time": "1 day, 9:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3836, "total_steps": 17941, "loss": 1.8019, "learning_rate": 9.04099872326116e-05, "epoch": 0.21381193913382754, "percentage": 21.38, "elapsed_time": "9:04:27", "remaining_time": "1 day, 9:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3837, "total_steps": 17941, "loss": 1.7182, "learning_rate": 9.040474281177557e-05, "epoch": 0.2138676773869907, "percentage": 21.39, "elapsed_time": "9:04:36", "remaining_time": "1 day, 9:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3838, "total_steps": 17941, "loss": 1.903, "learning_rate": 9.039949710953665e-05, "epoch": 0.21392341564015382, "percentage": 21.39, "elapsed_time": "9:04:45", "remaining_time": "1 day, 9:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3839, "total_steps": 17941, "loss": 1.6652, "learning_rate": 9.039425012606125e-05, "epoch": 0.21397915389331698, "percentage": 21.4, "elapsed_time": "9:04:53", "remaining_time": "1 day, 9:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3840, "total_steps": 17941, "loss": 1.8062, "learning_rate": 9.038900186151575e-05, "epoch": 0.21403489214648014, "percentage": 21.4, "elapsed_time": "9:05:03", "remaining_time": "1 day, 9:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3841, "total_steps": 17941, "loss": 1.7376, "learning_rate": 9.038375231606659e-05, "epoch": 0.21409063039964327, "percentage": 21.41, "elapsed_time": "9:05:11", "remaining_time": "1 day, 9:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3842, "total_steps": 17941, "loss": 1.7724, "learning_rate": 9.037850148988026e-05, "epoch": 0.21414636865280642, "percentage": 21.41, "elapsed_time": "9:05:20", "remaining_time": "1 day, 9:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3843, "total_steps": 17941, "loss": 1.9338, "learning_rate": 9.037324938312327e-05, "epoch": 0.21420210690596958, "percentage": 21.42, "elapsed_time": "9:05:28", "remaining_time": "1 day, 9:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3844, "total_steps": 17941, "loss": 1.6685, "learning_rate": 9.036799599596222e-05, "epoch": 0.2142578451591327, "percentage": 21.43, "elapsed_time": "9:05:36", "remaining_time": "1 day, 9:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3845, "total_steps": 17941, "loss": 1.6111, "learning_rate": 9.036274132856368e-05, "epoch": 0.21431358341229587, "percentage": 21.43, "elapsed_time": "9:05:45", "remaining_time": "1 day, 9:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3846, "total_steps": 17941, "loss": 1.7406, "learning_rate": 9.035748538109433e-05, "epoch": 0.214369321665459, "percentage": 21.44, "elapsed_time": "9:05:53", "remaining_time": "1 day, 9:20:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3847, "total_steps": 17941, "loss": 2.0365, "learning_rate": 9.035222815372084e-05, "epoch": 0.21442505991862215, "percentage": 21.44, "elapsed_time": "9:06:02", "remaining_time": "1 day, 9:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3848, "total_steps": 17941, "loss": 1.7869, "learning_rate": 9.034696964660996e-05, "epoch": 0.2144807981717853, "percentage": 21.45, "elapsed_time": "9:06:10", "remaining_time": "1 day, 9:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3849, "total_steps": 17941, "loss": 1.9884, "learning_rate": 9.034170985992843e-05, "epoch": 0.21453653642494844, "percentage": 21.45, "elapsed_time": "9:06:20", "remaining_time": "1 day, 9:20:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3850, "total_steps": 17941, "loss": 1.7483, "learning_rate": 9.033644879384307e-05, "epoch": 0.2145922746781116, "percentage": 21.46, "elapsed_time": "9:06:28", "remaining_time": "1 day, 9:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3851, "total_steps": 17941, "loss": 1.7319, "learning_rate": 9.033118644852073e-05, "epoch": 0.21464801293127472, "percentage": 21.46, "elapsed_time": "9:06:36", "remaining_time": "1 day, 9:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3852, "total_steps": 17941, "loss": 1.806, "learning_rate": 9.032592282412831e-05, "epoch": 0.21470375118443788, "percentage": 21.47, "elapsed_time": "9:06:46", "remaining_time": "1 day, 9:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3853, "total_steps": 17941, "loss": 1.7784, "learning_rate": 9.032065792083271e-05, "epoch": 0.21475948943760104, "percentage": 21.48, "elapsed_time": "9:06:54", "remaining_time": "1 day, 9:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3854, "total_steps": 17941, "loss": 1.8283, "learning_rate": 9.031539173880095e-05, "epoch": 0.21481522769076417, "percentage": 21.48, "elapsed_time": "9:07:02", "remaining_time": "1 day, 9:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3855, "total_steps": 17941, "loss": 1.8088, "learning_rate": 9.031012427820003e-05, "epoch": 0.21487096594392732, "percentage": 21.49, "elapsed_time": "9:07:11", "remaining_time": "1 day, 9:19:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3856, "total_steps": 17941, "loss": 2.021, "learning_rate": 9.030485553919696e-05, "epoch": 0.21492670419709045, "percentage": 21.49, "elapsed_time": "9:07:19", "remaining_time": "1 day, 9:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3857, "total_steps": 17941, "loss": 1.7416, "learning_rate": 9.029958552195889e-05, "epoch": 0.2149824424502536, "percentage": 21.5, "elapsed_time": "9:07:28", "remaining_time": "1 day, 9:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3858, "total_steps": 17941, "loss": 1.7158, "learning_rate": 9.029431422665292e-05, "epoch": 0.21503818070341676, "percentage": 21.5, "elapsed_time": "9:07:36", "remaining_time": "1 day, 9:18:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3859, "total_steps": 17941, "loss": 1.904, "learning_rate": 9.028904165344622e-05, "epoch": 0.2150939189565799, "percentage": 21.51, "elapsed_time": "9:07:45", "remaining_time": "1 day, 9:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3860, "total_steps": 17941, "loss": 1.5227, "learning_rate": 9.028376780250605e-05, "epoch": 0.21514965720974305, "percentage": 21.51, "elapsed_time": "9:07:53", "remaining_time": "1 day, 9:18:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3861, "total_steps": 17941, "loss": 1.8613, "learning_rate": 9.027849267399962e-05, "epoch": 0.21520539546290618, "percentage": 21.52, "elapsed_time": "9:08:02", "remaining_time": "1 day, 9:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3862, "total_steps": 17941, "loss": 1.7657, "learning_rate": 9.027321626809425e-05, "epoch": 0.21526113371606934, "percentage": 21.53, "elapsed_time": "9:08:10", "remaining_time": "1 day, 9:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3863, "total_steps": 17941, "loss": 1.7117, "learning_rate": 9.026793858495727e-05, "epoch": 0.2153168719692325, "percentage": 21.53, "elapsed_time": "9:08:19", "remaining_time": "1 day, 9:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3864, "total_steps": 17941, "loss": 1.781, "learning_rate": 9.026265962475605e-05, "epoch": 0.21537261022239562, "percentage": 21.54, "elapsed_time": "9:08:27", "remaining_time": "1 day, 9:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3865, "total_steps": 17941, "loss": 1.8402, "learning_rate": 9.025737938765801e-05, "epoch": 0.21542834847555878, "percentage": 21.54, "elapsed_time": "9:08:36", "remaining_time": "1 day, 9:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3866, "total_steps": 17941, "loss": 1.637, "learning_rate": 9.025209787383062e-05, "epoch": 0.21548408672872194, "percentage": 21.55, "elapsed_time": "9:08:44", "remaining_time": "1 day, 9:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3867, "total_steps": 17941, "loss": 1.7487, "learning_rate": 9.024681508344138e-05, "epoch": 0.21553982498188506, "percentage": 21.55, "elapsed_time": "9:08:53", "remaining_time": "1 day, 9:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3868, "total_steps": 17941, "loss": 1.8556, "learning_rate": 9.024153101665782e-05, "epoch": 0.21559556323504822, "percentage": 21.56, "elapsed_time": "9:09:02", "remaining_time": "1 day, 9:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3869, "total_steps": 17941, "loss": 1.8144, "learning_rate": 9.02362456736475e-05, "epoch": 0.21565130148821135, "percentage": 21.57, "elapsed_time": "9:09:10", "remaining_time": "1 day, 9:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3870, "total_steps": 17941, "loss": 1.7709, "learning_rate": 9.023095905457807e-05, "epoch": 0.2157070397413745, "percentage": 21.57, "elapsed_time": "9:09:19", "remaining_time": "1 day, 9:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3871, "total_steps": 17941, "loss": 1.7373, "learning_rate": 9.022567115961718e-05, "epoch": 0.21576277799453766, "percentage": 21.58, "elapsed_time": "9:09:27", "remaining_time": "1 day, 9:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3872, "total_steps": 17941, "loss": 1.642, "learning_rate": 9.022038198893254e-05, "epoch": 0.2158185162477008, "percentage": 21.58, "elapsed_time": "9:09:36", "remaining_time": "1 day, 9:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3873, "total_steps": 17941, "loss": 1.7393, "learning_rate": 9.021509154269187e-05, "epoch": 0.21587425450086395, "percentage": 21.59, "elapsed_time": "9:09:44", "remaining_time": "1 day, 9:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3874, "total_steps": 17941, "loss": 1.7803, "learning_rate": 9.0209799821063e-05, "epoch": 0.21592999275402708, "percentage": 21.59, "elapsed_time": "9:09:53", "remaining_time": "1 day, 9:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3875, "total_steps": 17941, "loss": 1.6007, "learning_rate": 9.020450682421368e-05, "epoch": 0.21598573100719023, "percentage": 21.6, "elapsed_time": "9:10:02", "remaining_time": "1 day, 9:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3876, "total_steps": 17941, "loss": 1.7964, "learning_rate": 9.019921255231183e-05, "epoch": 0.2160414692603534, "percentage": 21.6, "elapsed_time": "9:10:11", "remaining_time": "1 day, 9:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3877, "total_steps": 17941, "loss": 1.7572, "learning_rate": 9.019391700552533e-05, "epoch": 0.21609720751351652, "percentage": 21.61, "elapsed_time": "9:10:19", "remaining_time": "1 day, 9:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3878, "total_steps": 17941, "loss": 1.7768, "learning_rate": 9.018862018402214e-05, "epoch": 0.21615294576667968, "percentage": 21.62, "elapsed_time": "9:10:27", "remaining_time": "1 day, 9:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3879, "total_steps": 17941, "loss": 1.8262, "learning_rate": 9.018332208797023e-05, "epoch": 0.2162086840198428, "percentage": 21.62, "elapsed_time": "9:10:36", "remaining_time": "1 day, 9:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3880, "total_steps": 17941, "loss": 1.7966, "learning_rate": 9.017802271753763e-05, "epoch": 0.21626442227300596, "percentage": 21.63, "elapsed_time": "9:10:45", "remaining_time": "1 day, 9:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3881, "total_steps": 17941, "loss": 1.7047, "learning_rate": 9.017272207289241e-05, "epoch": 0.21632016052616912, "percentage": 21.63, "elapsed_time": "9:10:53", "remaining_time": "1 day, 9:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3882, "total_steps": 17941, "loss": 1.6662, "learning_rate": 9.016742015420264e-05, "epoch": 0.21637589877933225, "percentage": 21.64, "elapsed_time": "9:11:03", "remaining_time": "1 day, 9:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3883, "total_steps": 17941, "loss": 1.6667, "learning_rate": 9.016211696163651e-05, "epoch": 0.2164316370324954, "percentage": 21.64, "elapsed_time": "9:11:11", "remaining_time": "1 day, 9:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3884, "total_steps": 17941, "loss": 1.7085, "learning_rate": 9.015681249536219e-05, "epoch": 0.21648737528565853, "percentage": 21.65, "elapsed_time": "9:11:20", "remaining_time": "1 day, 9:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3885, "total_steps": 17941, "loss": 1.7739, "learning_rate": 9.015150675554791e-05, "epoch": 0.2165431135388217, "percentage": 21.65, "elapsed_time": "9:11:28", "remaining_time": "1 day, 9:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3886, "total_steps": 17941, "loss": 1.5412, "learning_rate": 9.014619974236195e-05, "epoch": 0.21659885179198485, "percentage": 21.66, "elapsed_time": "9:11:37", "remaining_time": "1 day, 9:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3887, "total_steps": 17941, "loss": 1.6956, "learning_rate": 9.014089145597259e-05, "epoch": 0.21665459004514798, "percentage": 21.67, "elapsed_time": "9:11:46", "remaining_time": "1 day, 9:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3888, "total_steps": 17941, "loss": 1.6772, "learning_rate": 9.013558189654819e-05, "epoch": 0.21671032829831113, "percentage": 21.67, "elapsed_time": "9:11:54", "remaining_time": "1 day, 9:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3889, "total_steps": 17941, "loss": 1.7071, "learning_rate": 9.013027106425713e-05, "epoch": 0.2167660665514743, "percentage": 21.68, "elapsed_time": "9:12:03", "remaining_time": "1 day, 9:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3890, "total_steps": 17941, "loss": 1.9886, "learning_rate": 9.012495895926786e-05, "epoch": 0.21682180480463742, "percentage": 21.68, "elapsed_time": "9:12:11", "remaining_time": "1 day, 9:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3891, "total_steps": 17941, "loss": 1.6111, "learning_rate": 9.011964558174884e-05, "epoch": 0.21687754305780058, "percentage": 21.69, "elapsed_time": "9:12:20", "remaining_time": "1 day, 9:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3892, "total_steps": 17941, "loss": 1.7192, "learning_rate": 9.011433093186856e-05, "epoch": 0.2169332813109637, "percentage": 21.69, "elapsed_time": "9:12:28", "remaining_time": "1 day, 9:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3893, "total_steps": 17941, "loss": 1.727, "learning_rate": 9.01090150097956e-05, "epoch": 0.21698901956412686, "percentage": 21.7, "elapsed_time": "9:12:37", "remaining_time": "1 day, 9:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3894, "total_steps": 17941, "loss": 1.5865, "learning_rate": 9.010369781569854e-05, "epoch": 0.21704475781729002, "percentage": 21.7, "elapsed_time": "9:12:45", "remaining_time": "1 day, 9:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3895, "total_steps": 17941, "loss": 1.6708, "learning_rate": 9.009837934974598e-05, "epoch": 0.21710049607045315, "percentage": 21.71, "elapsed_time": "9:12:53", "remaining_time": "1 day, 9:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3896, "total_steps": 17941, "loss": 1.816, "learning_rate": 9.009305961210664e-05, "epoch": 0.2171562343236163, "percentage": 21.72, "elapsed_time": "9:13:02", "remaining_time": "1 day, 9:13:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3897, "total_steps": 17941, "loss": 1.6085, "learning_rate": 9.008773860294921e-05, "epoch": 0.21721197257677943, "percentage": 21.72, "elapsed_time": "9:13:10", "remaining_time": "1 day, 9:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3898, "total_steps": 17941, "loss": 2.0664, "learning_rate": 9.008241632244243e-05, "epoch": 0.2172677108299426, "percentage": 21.73, "elapsed_time": "9:13:19", "remaining_time": "1 day, 9:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3899, "total_steps": 17941, "loss": 1.6078, "learning_rate": 9.00770927707551e-05, "epoch": 0.21732344908310575, "percentage": 21.73, "elapsed_time": "9:13:27", "remaining_time": "1 day, 9:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3900, "total_steps": 17941, "loss": 1.6985, "learning_rate": 9.007176794805606e-05, "epoch": 0.21737918733626888, "percentage": 21.74, "elapsed_time": "9:13:36", "remaining_time": "1 day, 9:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3901, "total_steps": 17941, "loss": 1.824, "learning_rate": 9.006644185451416e-05, "epoch": 0.21743492558943203, "percentage": 21.74, "elapsed_time": "9:13:44", "remaining_time": "1 day, 9:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3902, "total_steps": 17941, "loss": 1.674, "learning_rate": 9.006111449029835e-05, "epoch": 0.21749066384259516, "percentage": 21.75, "elapsed_time": "9:13:53", "remaining_time": "1 day, 9:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3903, "total_steps": 17941, "loss": 1.5491, "learning_rate": 9.005578585557754e-05, "epoch": 0.21754640209575832, "percentage": 21.75, "elapsed_time": "9:14:01", "remaining_time": "1 day, 9:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3904, "total_steps": 17941, "loss": 1.7583, "learning_rate": 9.005045595052077e-05, "epoch": 0.21760214034892147, "percentage": 21.76, "elapsed_time": "9:14:10", "remaining_time": "1 day, 9:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3905, "total_steps": 17941, "loss": 1.6147, "learning_rate": 9.004512477529702e-05, "epoch": 0.2176578786020846, "percentage": 21.77, "elapsed_time": "9:14:18", "remaining_time": "1 day, 9:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3906, "total_steps": 17941, "loss": 1.7576, "learning_rate": 9.003979233007541e-05, "epoch": 0.21771361685524776, "percentage": 21.77, "elapsed_time": "9:14:27", "remaining_time": "1 day, 9:12:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3907, "total_steps": 17941, "loss": 1.7114, "learning_rate": 9.003445861502502e-05, "epoch": 0.2177693551084109, "percentage": 21.78, "elapsed_time": "9:14:36", "remaining_time": "1 day, 9:12:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3908, "total_steps": 17941, "loss": 1.904, "learning_rate": 9.002912363031504e-05, "epoch": 0.21782509336157405, "percentage": 21.78, "elapsed_time": "9:14:44", "remaining_time": "1 day, 9:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3909, "total_steps": 17941, "loss": 1.5851, "learning_rate": 9.002378737611463e-05, "epoch": 0.2178808316147372, "percentage": 21.79, "elapsed_time": "9:14:53", "remaining_time": "1 day, 9:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3910, "total_steps": 17941, "loss": 1.6766, "learning_rate": 9.001844985259303e-05, "epoch": 0.21793656986790033, "percentage": 21.79, "elapsed_time": "9:15:01", "remaining_time": "1 day, 9:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3911, "total_steps": 17941, "loss": 1.6309, "learning_rate": 9.001311105991954e-05, "epoch": 0.2179923081210635, "percentage": 21.8, "elapsed_time": "9:15:10", "remaining_time": "1 day, 9:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3912, "total_steps": 17941, "loss": 1.5347, "learning_rate": 9.000777099826345e-05, "epoch": 0.21804804637422665, "percentage": 21.8, "elapsed_time": "9:15:18", "remaining_time": "1 day, 9:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3913, "total_steps": 17941, "loss": 1.7077, "learning_rate": 9.000242966779412e-05, "epoch": 0.21810378462738977, "percentage": 21.81, "elapsed_time": "9:15:27", "remaining_time": "1 day, 9:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3914, "total_steps": 17941, "loss": 1.4288, "learning_rate": 8.999708706868097e-05, "epoch": 0.21815952288055293, "percentage": 21.82, "elapsed_time": "9:15:35", "remaining_time": "1 day, 9:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3915, "total_steps": 17941, "loss": 1.6114, "learning_rate": 8.999174320109343e-05, "epoch": 0.21821526113371606, "percentage": 21.82, "elapsed_time": "9:15:44", "remaining_time": "1 day, 9:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3916, "total_steps": 17941, "loss": 1.6002, "learning_rate": 8.998639806520092e-05, "epoch": 0.21827099938687922, "percentage": 21.83, "elapsed_time": "9:15:52", "remaining_time": "1 day, 9:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3917, "total_steps": 17941, "loss": 1.7308, "learning_rate": 8.998105166117304e-05, "epoch": 0.21832673764004237, "percentage": 21.83, "elapsed_time": "9:16:00", "remaining_time": "1 day, 9:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3918, "total_steps": 17941, "loss": 1.7732, "learning_rate": 8.99757039891793e-05, "epoch": 0.2183824758932055, "percentage": 21.84, "elapsed_time": "9:16:09", "remaining_time": "1 day, 9:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3919, "total_steps": 17941, "loss": 1.6927, "learning_rate": 8.997035504938928e-05, "epoch": 0.21843821414636866, "percentage": 21.84, "elapsed_time": "9:16:18", "remaining_time": "1 day, 9:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3920, "total_steps": 17941, "loss": 1.7503, "learning_rate": 8.996500484197266e-05, "epoch": 0.2184939523995318, "percentage": 21.85, "elapsed_time": "9:16:26", "remaining_time": "1 day, 9:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3921, "total_steps": 17941, "loss": 1.8189, "learning_rate": 8.995965336709908e-05, "epoch": 0.21854969065269494, "percentage": 21.85, "elapsed_time": "9:16:35", "remaining_time": "1 day, 9:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3922, "total_steps": 17941, "loss": 1.9138, "learning_rate": 8.99543006249383e-05, "epoch": 0.2186054289058581, "percentage": 21.86, "elapsed_time": "9:16:43", "remaining_time": "1 day, 9:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3923, "total_steps": 17941, "loss": 1.6947, "learning_rate": 8.994894661566004e-05, "epoch": 0.21866116715902123, "percentage": 21.87, "elapsed_time": "9:16:52", "remaining_time": "1 day, 9:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3924, "total_steps": 17941, "loss": 1.7947, "learning_rate": 8.994359133943411e-05, "epoch": 0.2187169054121844, "percentage": 21.87, "elapsed_time": "9:17:00", "remaining_time": "1 day, 9:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3925, "total_steps": 17941, "loss": 1.8557, "learning_rate": 8.993823479643036e-05, "epoch": 0.21877264366534752, "percentage": 21.88, "elapsed_time": "9:17:08", "remaining_time": "1 day, 9:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3926, "total_steps": 17941, "loss": 1.6033, "learning_rate": 8.993287698681867e-05, "epoch": 0.21882838191851067, "percentage": 21.88, "elapsed_time": "9:17:17", "remaining_time": "1 day, 9:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3927, "total_steps": 17941, "loss": 1.6927, "learning_rate": 8.992751791076893e-05, "epoch": 0.21888412017167383, "percentage": 21.89, "elapsed_time": "9:17:25", "remaining_time": "1 day, 9:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3928, "total_steps": 17941, "loss": 1.6108, "learning_rate": 8.992215756845111e-05, "epoch": 0.21893985842483696, "percentage": 21.89, "elapsed_time": "9:17:34", "remaining_time": "1 day, 9:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3929, "total_steps": 17941, "loss": 1.821, "learning_rate": 8.991679596003521e-05, "epoch": 0.21899559667800012, "percentage": 21.9, "elapsed_time": "9:17:42", "remaining_time": "1 day, 9:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3930, "total_steps": 17941, "loss": 1.6755, "learning_rate": 8.991143308569129e-05, "epoch": 0.21905133493116324, "percentage": 21.91, "elapsed_time": "9:17:51", "remaining_time": "1 day, 9:08:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3931, "total_steps": 17941, "loss": 1.7568, "learning_rate": 8.990606894558942e-05, "epoch": 0.2191070731843264, "percentage": 21.91, "elapsed_time": "9:17:59", "remaining_time": "1 day, 9:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3932, "total_steps": 17941, "loss": 1.5701, "learning_rate": 8.99007035398997e-05, "epoch": 0.21916281143748956, "percentage": 21.92, "elapsed_time": "9:18:07", "remaining_time": "1 day, 9:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3933, "total_steps": 17941, "loss": 1.7533, "learning_rate": 8.98953368687923e-05, "epoch": 0.2192185496906527, "percentage": 21.92, "elapsed_time": "9:18:16", "remaining_time": "1 day, 9:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3934, "total_steps": 17941, "loss": 1.6604, "learning_rate": 8.988996893243742e-05, "epoch": 0.21927428794381584, "percentage": 21.93, "elapsed_time": "9:18:25", "remaining_time": "1 day, 9:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3935, "total_steps": 17941, "loss": 1.9101, "learning_rate": 8.988459973100529e-05, "epoch": 0.219330026196979, "percentage": 21.93, "elapsed_time": "9:18:33", "remaining_time": "1 day, 9:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3936, "total_steps": 17941, "loss": 1.6784, "learning_rate": 8.987922926466621e-05, "epoch": 0.21938576445014213, "percentage": 21.94, "elapsed_time": "9:18:42", "remaining_time": "1 day, 9:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3937, "total_steps": 17941, "loss": 1.8496, "learning_rate": 8.98738575335905e-05, "epoch": 0.21944150270330529, "percentage": 21.94, "elapsed_time": "9:18:50", "remaining_time": "1 day, 9:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3938, "total_steps": 17941, "loss": 1.6477, "learning_rate": 8.986848453794849e-05, "epoch": 0.21949724095646841, "percentage": 21.95, "elapsed_time": "9:18:59", "remaining_time": "1 day, 9:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3939, "total_steps": 17941, "loss": 1.9312, "learning_rate": 8.986311027791061e-05, "epoch": 0.21955297920963157, "percentage": 21.96, "elapsed_time": "9:19:07", "remaining_time": "1 day, 9:07:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3940, "total_steps": 17941, "loss": 1.8278, "learning_rate": 8.985773475364729e-05, "epoch": 0.21960871746279473, "percentage": 21.96, "elapsed_time": "9:19:16", "remaining_time": "1 day, 9:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3941, "total_steps": 17941, "loss": 1.5689, "learning_rate": 8.9852357965329e-05, "epoch": 0.21966445571595786, "percentage": 21.97, "elapsed_time": "9:19:24", "remaining_time": "1 day, 9:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3942, "total_steps": 17941, "loss": 1.6719, "learning_rate": 8.984697991312629e-05, "epoch": 0.219720193969121, "percentage": 21.97, "elapsed_time": "9:19:33", "remaining_time": "1 day, 9:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3943, "total_steps": 17941, "loss": 1.4167, "learning_rate": 8.98416005972097e-05, "epoch": 0.21977593222228414, "percentage": 21.98, "elapsed_time": "9:19:41", "remaining_time": "1 day, 9:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3944, "total_steps": 17941, "loss": 1.5936, "learning_rate": 8.98362200177498e-05, "epoch": 0.2198316704754473, "percentage": 21.98, "elapsed_time": "9:19:50", "remaining_time": "1 day, 9:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3945, "total_steps": 17941, "loss": 1.7715, "learning_rate": 8.98308381749173e-05, "epoch": 0.21988740872861046, "percentage": 21.99, "elapsed_time": "9:19:58", "remaining_time": "1 day, 9:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3946, "total_steps": 17941, "loss": 1.5167, "learning_rate": 8.982545506888282e-05, "epoch": 0.21994314698177359, "percentage": 21.99, "elapsed_time": "9:20:07", "remaining_time": "1 day, 9:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3947, "total_steps": 17941, "loss": 1.6694, "learning_rate": 8.982007069981711e-05, "epoch": 0.21999888523493674, "percentage": 22.0, "elapsed_time": "9:20:15", "remaining_time": "1 day, 9:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3948, "total_steps": 17941, "loss": 1.7098, "learning_rate": 8.981468506789093e-05, "epoch": 0.22005462348809987, "percentage": 22.01, "elapsed_time": "9:20:23", "remaining_time": "1 day, 9:06:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3949, "total_steps": 17941, "loss": 1.8188, "learning_rate": 8.980929817327509e-05, "epoch": 0.22011036174126303, "percentage": 22.01, "elapsed_time": "9:20:32", "remaining_time": "1 day, 9:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3950, "total_steps": 17941, "loss": 1.6947, "learning_rate": 8.980391001614039e-05, "epoch": 0.22016609999442618, "percentage": 22.02, "elapsed_time": "9:20:40", "remaining_time": "1 day, 9:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3951, "total_steps": 17941, "loss": 1.8565, "learning_rate": 8.979852059665774e-05, "epoch": 0.2202218382475893, "percentage": 22.02, "elapsed_time": "9:20:49", "remaining_time": "1 day, 9:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3952, "total_steps": 17941, "loss": 1.6119, "learning_rate": 8.979312991499807e-05, "epoch": 0.22027757650075247, "percentage": 22.03, "elapsed_time": "9:20:58", "remaining_time": "1 day, 9:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3953, "total_steps": 17941, "loss": 1.5012, "learning_rate": 8.97877379713323e-05, "epoch": 0.2203333147539156, "percentage": 22.03, "elapsed_time": "9:21:06", "remaining_time": "1 day, 9:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3954, "total_steps": 17941, "loss": 1.7968, "learning_rate": 8.97823447658315e-05, "epoch": 0.22038905300707876, "percentage": 22.04, "elapsed_time": "9:21:15", "remaining_time": "1 day, 9:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3955, "total_steps": 17941, "loss": 1.6924, "learning_rate": 8.977695029866665e-05, "epoch": 0.2204447912602419, "percentage": 22.04, "elapsed_time": "9:21:23", "remaining_time": "1 day, 9:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3956, "total_steps": 17941, "loss": 1.6837, "learning_rate": 8.977155457000886e-05, "epoch": 0.22050052951340504, "percentage": 22.05, "elapsed_time": "9:21:31", "remaining_time": "1 day, 9:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3957, "total_steps": 17941, "loss": 1.5339, "learning_rate": 8.976615758002925e-05, "epoch": 0.2205562677665682, "percentage": 22.06, "elapsed_time": "9:21:40", "remaining_time": "1 day, 9:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3958, "total_steps": 17941, "loss": 1.406, "learning_rate": 8.976075932889896e-05, "epoch": 0.22061200601973135, "percentage": 22.06, "elapsed_time": "9:21:48", "remaining_time": "1 day, 9:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3959, "total_steps": 17941, "loss": 1.6203, "learning_rate": 8.97553598167892e-05, "epoch": 0.22066774427289448, "percentage": 22.07, "elapsed_time": "9:21:57", "remaining_time": "1 day, 9:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3960, "total_steps": 17941, "loss": 1.6984, "learning_rate": 8.974995904387123e-05, "epoch": 0.22072348252605764, "percentage": 22.07, "elapsed_time": "9:22:05", "remaining_time": "1 day, 9:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3961, "total_steps": 17941, "loss": 1.7722, "learning_rate": 8.97445570103163e-05, "epoch": 0.22077922077922077, "percentage": 22.08, "elapsed_time": "9:22:14", "remaining_time": "1 day, 9:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3962, "total_steps": 17941, "loss": 1.8308, "learning_rate": 8.973915371629577e-05, "epoch": 0.22083495903238393, "percentage": 22.08, "elapsed_time": "9:22:22", "remaining_time": "1 day, 9:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3963, "total_steps": 17941, "loss": 1.6487, "learning_rate": 8.973374916198096e-05, "epoch": 0.22089069728554708, "percentage": 22.09, "elapsed_time": "9:22:31", "remaining_time": "1 day, 9:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3964, "total_steps": 17941, "loss": 1.4931, "learning_rate": 8.972834334754331e-05, "epoch": 0.2209464355387102, "percentage": 22.09, "elapsed_time": "9:22:40", "remaining_time": "1 day, 9:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3965, "total_steps": 17941, "loss": 1.9263, "learning_rate": 8.972293627315424e-05, "epoch": 0.22100217379187337, "percentage": 22.1, "elapsed_time": "9:22:48", "remaining_time": "1 day, 9:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3966, "total_steps": 17941, "loss": 1.8374, "learning_rate": 8.971752793898522e-05, "epoch": 0.2210579120450365, "percentage": 22.11, "elapsed_time": "9:22:56", "remaining_time": "1 day, 9:03:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3967, "total_steps": 17941, "loss": 1.7221, "learning_rate": 8.971211834520779e-05, "epoch": 0.22111365029819965, "percentage": 22.11, "elapsed_time": "9:23:05", "remaining_time": "1 day, 9:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3968, "total_steps": 17941, "loss": 1.713, "learning_rate": 8.970670749199351e-05, "epoch": 0.2211693885513628, "percentage": 22.12, "elapsed_time": "9:23:13", "remaining_time": "1 day, 9:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3969, "total_steps": 17941, "loss": 1.6519, "learning_rate": 8.970129537951395e-05, "epoch": 0.22122512680452594, "percentage": 22.12, "elapsed_time": "9:23:22", "remaining_time": "1 day, 9:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3970, "total_steps": 17941, "loss": 1.5816, "learning_rate": 8.969588200794079e-05, "epoch": 0.2212808650576891, "percentage": 22.13, "elapsed_time": "9:23:30", "remaining_time": "1 day, 9:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3971, "total_steps": 17941, "loss": 1.8442, "learning_rate": 8.969046737744571e-05, "epoch": 0.22133660331085223, "percentage": 22.13, "elapsed_time": "9:23:39", "remaining_time": "1 day, 9:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3972, "total_steps": 17941, "loss": 1.5886, "learning_rate": 8.968505148820039e-05, "epoch": 0.22139234156401538, "percentage": 22.14, "elapsed_time": "9:23:47", "remaining_time": "1 day, 9:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3973, "total_steps": 17941, "loss": 1.8938, "learning_rate": 8.967963434037663e-05, "epoch": 0.22144807981717854, "percentage": 22.14, "elapsed_time": "9:23:56", "remaining_time": "1 day, 9:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3974, "total_steps": 17941, "loss": 1.7739, "learning_rate": 8.967421593414622e-05, "epoch": 0.22150381807034167, "percentage": 22.15, "elapsed_time": "9:24:04", "remaining_time": "1 day, 9:02:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3975, "total_steps": 17941, "loss": 1.5916, "learning_rate": 8.966879626968099e-05, "epoch": 0.22155955632350482, "percentage": 22.16, "elapsed_time": "9:24:13", "remaining_time": "1 day, 9:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3976, "total_steps": 17941, "loss": 1.6879, "learning_rate": 8.966337534715284e-05, "epoch": 0.22161529457666795, "percentage": 22.16, "elapsed_time": "9:24:22", "remaining_time": "1 day, 9:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3977, "total_steps": 17941, "loss": 1.5465, "learning_rate": 8.965795316673366e-05, "epoch": 0.2216710328298311, "percentage": 22.17, "elapsed_time": "9:24:31", "remaining_time": "1 day, 9:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3978, "total_steps": 17941, "loss": 1.8477, "learning_rate": 8.965252972859545e-05, "epoch": 0.22172677108299427, "percentage": 22.17, "elapsed_time": "9:24:39", "remaining_time": "1 day, 9:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3979, "total_steps": 17941, "loss": 1.7961, "learning_rate": 8.964710503291018e-05, "epoch": 0.2217825093361574, "percentage": 22.18, "elapsed_time": "9:24:48", "remaining_time": "1 day, 9:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3980, "total_steps": 17941, "loss": 1.7795, "learning_rate": 8.964167907984988e-05, "epoch": 0.22183824758932055, "percentage": 22.18, "elapsed_time": "9:24:56", "remaining_time": "1 day, 9:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3981, "total_steps": 17941, "loss": 1.7824, "learning_rate": 8.963625186958666e-05, "epoch": 0.2218939858424837, "percentage": 22.19, "elapsed_time": "9:25:05", "remaining_time": "1 day, 9:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3982, "total_steps": 17941, "loss": 1.7521, "learning_rate": 8.963082340229263e-05, "epoch": 0.22194972409564684, "percentage": 22.19, "elapsed_time": "9:25:13", "remaining_time": "1 day, 9:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3983, "total_steps": 17941, "loss": 1.5493, "learning_rate": 8.962539367813993e-05, "epoch": 0.22200546234881, "percentage": 22.2, "elapsed_time": "9:25:22", "remaining_time": "1 day, 9:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3984, "total_steps": 17941, "loss": 1.5015, "learning_rate": 8.961996269730078e-05, "epoch": 0.22206120060197312, "percentage": 22.21, "elapsed_time": "9:25:30", "remaining_time": "1 day, 9:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3985, "total_steps": 17941, "loss": 1.7563, "learning_rate": 8.961453045994742e-05, "epoch": 0.22211693885513628, "percentage": 22.21, "elapsed_time": "9:25:38", "remaining_time": "1 day, 9:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3986, "total_steps": 17941, "loss": 1.6671, "learning_rate": 8.960909696625213e-05, "epoch": 0.22217267710829944, "percentage": 22.22, "elapsed_time": "9:25:47", "remaining_time": "1 day, 9:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3987, "total_steps": 17941, "loss": 1.7181, "learning_rate": 8.960366221638721e-05, "epoch": 0.22222841536146257, "percentage": 22.22, "elapsed_time": "9:25:55", "remaining_time": "1 day, 9:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3988, "total_steps": 17941, "loss": 1.8017, "learning_rate": 8.959822621052502e-05, "epoch": 0.22228415361462572, "percentage": 22.23, "elapsed_time": "9:26:04", "remaining_time": "1 day, 9:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3989, "total_steps": 17941, "loss": 1.8768, "learning_rate": 8.959278894883797e-05, "epoch": 0.22233989186778885, "percentage": 22.23, "elapsed_time": "9:26:12", "remaining_time": "1 day, 9:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3990, "total_steps": 17941, "loss": 1.6246, "learning_rate": 8.958735043149852e-05, "epoch": 0.222395630120952, "percentage": 22.24, "elapsed_time": "9:26:21", "remaining_time": "1 day, 9:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3991, "total_steps": 17941, "loss": 1.8083, "learning_rate": 8.958191065867912e-05, "epoch": 0.22245136837411517, "percentage": 22.25, "elapsed_time": "9:26:29", "remaining_time": "1 day, 9:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3992, "total_steps": 17941, "loss": 1.9074, "learning_rate": 8.957646963055227e-05, "epoch": 0.2225071066272783, "percentage": 22.25, "elapsed_time": "9:26:38", "remaining_time": "1 day, 8:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3993, "total_steps": 17941, "loss": 1.6518, "learning_rate": 8.957102734729057e-05, "epoch": 0.22256284488044145, "percentage": 22.26, "elapsed_time": "9:26:46", "remaining_time": "1 day, 8:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3994, "total_steps": 17941, "loss": 2.3105, "learning_rate": 8.956558380906659e-05, "epoch": 0.22261858313360458, "percentage": 22.26, "elapsed_time": "9:26:55", "remaining_time": "1 day, 8:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3995, "total_steps": 17941, "loss": 1.7229, "learning_rate": 8.956013901605299e-05, "epoch": 0.22267432138676774, "percentage": 22.27, "elapsed_time": "9:27:03", "remaining_time": "1 day, 8:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3996, "total_steps": 17941, "loss": 1.641, "learning_rate": 8.955469296842241e-05, "epoch": 0.2227300596399309, "percentage": 22.27, "elapsed_time": "9:27:11", "remaining_time": "1 day, 8:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3997, "total_steps": 17941, "loss": 1.6717, "learning_rate": 8.95492456663476e-05, "epoch": 0.22278579789309402, "percentage": 22.28, "elapsed_time": "9:27:20", "remaining_time": "1 day, 8:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3998, "total_steps": 17941, "loss": 1.7382, "learning_rate": 8.954379711000129e-05, "epoch": 0.22284153614625718, "percentage": 22.28, "elapsed_time": "9:27:28", "remaining_time": "1 day, 8:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3999, "total_steps": 17941, "loss": 1.7489, "learning_rate": 8.95383472995563e-05, "epoch": 0.2228972743994203, "percentage": 22.29, "elapsed_time": "9:27:37", "remaining_time": "1 day, 8:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4000, "total_steps": 17941, "loss": 1.7241, "learning_rate": 8.953289623518545e-05, "epoch": 0.22295301265258347, "percentage": 22.3, "elapsed_time": "9:27:45", "remaining_time": "1 day, 8:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4001, "total_steps": 17941, "loss": 1.6683, "learning_rate": 8.952744391706165e-05, "epoch": 0.22300875090574662, "percentage": 22.3, "elapsed_time": "9:27:54", "remaining_time": "1 day, 8:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4002, "total_steps": 17941, "loss": 1.6086, "learning_rate": 8.952199034535778e-05, "epoch": 0.22306448915890975, "percentage": 22.31, "elapsed_time": "9:28:02", "remaining_time": "1 day, 8:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4003, "total_steps": 17941, "loss": 1.9497, "learning_rate": 8.95165355202468e-05, "epoch": 0.2231202274120729, "percentage": 22.31, "elapsed_time": "9:28:11", "remaining_time": "1 day, 8:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4004, "total_steps": 17941, "loss": 1.9735, "learning_rate": 8.951107944190171e-05, "epoch": 0.22317596566523606, "percentage": 22.32, "elapsed_time": "9:28:19", "remaining_time": "1 day, 8:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4005, "total_steps": 17941, "loss": 1.5424, "learning_rate": 8.950562211049556e-05, "epoch": 0.2232317039183992, "percentage": 22.32, "elapsed_time": "9:28:27", "remaining_time": "1 day, 8:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4006, "total_steps": 17941, "loss": 1.6966, "learning_rate": 8.950016352620139e-05, "epoch": 0.22328744217156235, "percentage": 22.33, "elapsed_time": "9:28:36", "remaining_time": "1 day, 8:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4007, "total_steps": 17941, "loss": 1.6651, "learning_rate": 8.949470368919235e-05, "epoch": 0.22334318042472548, "percentage": 22.33, "elapsed_time": "9:28:45", "remaining_time": "1 day, 8:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4008, "total_steps": 17941, "loss": 1.7668, "learning_rate": 8.948924259964157e-05, "epoch": 0.22339891867788864, "percentage": 22.34, "elapsed_time": "9:28:54", "remaining_time": "1 day, 8:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4009, "total_steps": 17941, "loss": 1.7271, "learning_rate": 8.948378025772227e-05, "epoch": 0.2234546569310518, "percentage": 22.35, "elapsed_time": "9:29:03", "remaining_time": "1 day, 8:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4010, "total_steps": 17941, "loss": 1.7851, "learning_rate": 8.947831666360765e-05, "epoch": 0.22351039518421492, "percentage": 22.35, "elapsed_time": "9:29:11", "remaining_time": "1 day, 8:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4011, "total_steps": 17941, "loss": 1.8569, "learning_rate": 8.947285181747098e-05, "epoch": 0.22356613343737808, "percentage": 22.36, "elapsed_time": "9:29:20", "remaining_time": "1 day, 8:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4012, "total_steps": 17941, "loss": 1.6114, "learning_rate": 8.946738571948562e-05, "epoch": 0.2236218716905412, "percentage": 22.36, "elapsed_time": "9:29:29", "remaining_time": "1 day, 8:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4013, "total_steps": 17941, "loss": 1.8552, "learning_rate": 8.946191836982489e-05, "epoch": 0.22367760994370436, "percentage": 22.37, "elapsed_time": "9:29:37", "remaining_time": "1 day, 8:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4014, "total_steps": 17941, "loss": 1.5846, "learning_rate": 8.945644976866219e-05, "epoch": 0.22373334819686752, "percentage": 22.37, "elapsed_time": "9:29:45", "remaining_time": "1 day, 8:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4015, "total_steps": 17941, "loss": 1.8305, "learning_rate": 8.945097991617096e-05, "epoch": 0.22378908645003065, "percentage": 22.38, "elapsed_time": "9:29:54", "remaining_time": "1 day, 8:56:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4016, "total_steps": 17941, "loss": 1.6642, "learning_rate": 8.944550881252465e-05, "epoch": 0.2238448247031938, "percentage": 22.38, "elapsed_time": "9:30:02", "remaining_time": "1 day, 8:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4017, "total_steps": 17941, "loss": 1.7286, "learning_rate": 8.944003645789678e-05, "epoch": 0.22390056295635694, "percentage": 22.39, "elapsed_time": "9:30:11", "remaining_time": "1 day, 8:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4018, "total_steps": 17941, "loss": 1.6254, "learning_rate": 8.943456285246091e-05, "epoch": 0.2239563012095201, "percentage": 22.4, "elapsed_time": "9:30:19", "remaining_time": "1 day, 8:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4019, "total_steps": 17941, "loss": 1.4306, "learning_rate": 8.942908799639062e-05, "epoch": 0.22401203946268325, "percentage": 22.4, "elapsed_time": "9:30:28", "remaining_time": "1 day, 8:56:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4020, "total_steps": 17941, "loss": 1.8686, "learning_rate": 8.942361188985957e-05, "epoch": 0.22406777771584638, "percentage": 22.41, "elapsed_time": "9:30:36", "remaining_time": "1 day, 8:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4021, "total_steps": 17941, "loss": 1.6244, "learning_rate": 8.941813453304138e-05, "epoch": 0.22412351596900953, "percentage": 22.41, "elapsed_time": "9:30:45", "remaining_time": "1 day, 8:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4022, "total_steps": 17941, "loss": 1.5336, "learning_rate": 8.941265592610979e-05, "epoch": 0.22417925422217266, "percentage": 22.42, "elapsed_time": "9:30:54", "remaining_time": "1 day, 8:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4023, "total_steps": 17941, "loss": 1.5896, "learning_rate": 8.940717606923857e-05, "epoch": 0.22423499247533582, "percentage": 22.42, "elapsed_time": "9:31:03", "remaining_time": "1 day, 8:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4024, "total_steps": 17941, "loss": 1.8004, "learning_rate": 8.940169496260144e-05, "epoch": 0.22429073072849898, "percentage": 22.43, "elapsed_time": "9:31:11", "remaining_time": "1 day, 8:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4025, "total_steps": 17941, "loss": 1.6034, "learning_rate": 8.939621260637231e-05, "epoch": 0.2243464689816621, "percentage": 22.43, "elapsed_time": "9:31:20", "remaining_time": "1 day, 8:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4026, "total_steps": 17941, "loss": 1.7099, "learning_rate": 8.9390729000725e-05, "epoch": 0.22440220723482526, "percentage": 22.44, "elapsed_time": "9:31:28", "remaining_time": "1 day, 8:55:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4027, "total_steps": 17941, "loss": 1.8367, "learning_rate": 8.938524414583343e-05, "epoch": 0.22445794548798842, "percentage": 22.45, "elapsed_time": "9:31:37", "remaining_time": "1 day, 8:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4028, "total_steps": 17941, "loss": 1.6737, "learning_rate": 8.937975804187156e-05, "epoch": 0.22451368374115155, "percentage": 22.45, "elapsed_time": "9:31:45", "remaining_time": "1 day, 8:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4029, "total_steps": 17941, "loss": 1.7541, "learning_rate": 8.937427068901335e-05, "epoch": 0.2245694219943147, "percentage": 22.46, "elapsed_time": "9:31:54", "remaining_time": "1 day, 8:54:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4030, "total_steps": 17941, "loss": 1.7383, "learning_rate": 8.936878208743285e-05, "epoch": 0.22462516024747783, "percentage": 22.46, "elapsed_time": "9:32:02", "remaining_time": "1 day, 8:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4031, "total_steps": 17941, "loss": 1.5392, "learning_rate": 8.93632922373041e-05, "epoch": 0.224680898500641, "percentage": 22.47, "elapsed_time": "9:32:11", "remaining_time": "1 day, 8:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4032, "total_steps": 17941, "loss": 1.9703, "learning_rate": 8.935780113880125e-05, "epoch": 0.22473663675380415, "percentage": 22.47, "elapsed_time": "9:32:19", "remaining_time": "1 day, 8:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4033, "total_steps": 17941, "loss": 1.7827, "learning_rate": 8.93523087920984e-05, "epoch": 0.22479237500696728, "percentage": 22.48, "elapsed_time": "9:32:28", "remaining_time": "1 day, 8:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4034, "total_steps": 17941, "loss": 1.8036, "learning_rate": 8.934681519736977e-05, "epoch": 0.22484811326013043, "percentage": 22.48, "elapsed_time": "9:32:37", "remaining_time": "1 day, 8:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4035, "total_steps": 17941, "loss": 1.9969, "learning_rate": 8.934132035478955e-05, "epoch": 0.22490385151329356, "percentage": 22.49, "elapsed_time": "9:32:46", "remaining_time": "1 day, 8:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4036, "total_steps": 17941, "loss": 1.7836, "learning_rate": 8.933582426453205e-05, "epoch": 0.22495958976645672, "percentage": 22.5, "elapsed_time": "9:32:54", "remaining_time": "1 day, 8:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4037, "total_steps": 17941, "loss": 1.8767, "learning_rate": 8.933032692677153e-05, "epoch": 0.22501532801961988, "percentage": 22.5, "elapsed_time": "9:33:03", "remaining_time": "1 day, 8:53:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4038, "total_steps": 17941, "loss": 1.6584, "learning_rate": 8.932482834168237e-05, "epoch": 0.225071066272783, "percentage": 22.51, "elapsed_time": "9:33:12", "remaining_time": "1 day, 8:53:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4039, "total_steps": 17941, "loss": 1.6707, "learning_rate": 8.931932850943892e-05, "epoch": 0.22512680452594616, "percentage": 22.51, "elapsed_time": "9:33:20", "remaining_time": "1 day, 8:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4040, "total_steps": 17941, "loss": 1.5798, "learning_rate": 8.931382743021562e-05, "epoch": 0.2251825427791093, "percentage": 22.52, "elapsed_time": "9:33:29", "remaining_time": "1 day, 8:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4041, "total_steps": 17941, "loss": 1.5718, "learning_rate": 8.930832510418692e-05, "epoch": 0.22523828103227245, "percentage": 22.52, "elapsed_time": "9:33:37", "remaining_time": "1 day, 8:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4042, "total_steps": 17941, "loss": 1.7996, "learning_rate": 8.930282153152734e-05, "epoch": 0.2252940192854356, "percentage": 22.53, "elapsed_time": "9:33:46", "remaining_time": "1 day, 8:52:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4043, "total_steps": 17941, "loss": 1.8783, "learning_rate": 8.92973167124114e-05, "epoch": 0.22534975753859873, "percentage": 22.53, "elapsed_time": "9:33:54", "remaining_time": "1 day, 8:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4044, "total_steps": 17941, "loss": 1.9278, "learning_rate": 8.92918106470137e-05, "epoch": 0.2254054957917619, "percentage": 22.54, "elapsed_time": "9:34:02", "remaining_time": "1 day, 8:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4045, "total_steps": 17941, "loss": 1.6555, "learning_rate": 8.928630333550886e-05, "epoch": 0.22546123404492502, "percentage": 22.55, "elapsed_time": "9:34:11", "remaining_time": "1 day, 8:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4046, "total_steps": 17941, "loss": 1.6326, "learning_rate": 8.928079477807155e-05, "epoch": 0.22551697229808818, "percentage": 22.55, "elapsed_time": "9:34:19", "remaining_time": "1 day, 8:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4047, "total_steps": 17941, "loss": 1.7983, "learning_rate": 8.927528497487642e-05, "epoch": 0.22557271055125133, "percentage": 22.56, "elapsed_time": "9:34:28", "remaining_time": "1 day, 8:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4048, "total_steps": 17941, "loss": 1.9013, "learning_rate": 8.926977392609826e-05, "epoch": 0.22562844880441446, "percentage": 22.56, "elapsed_time": "9:34:36", "remaining_time": "1 day, 8:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4049, "total_steps": 17941, "loss": 1.8038, "learning_rate": 8.926426163191182e-05, "epoch": 0.22568418705757762, "percentage": 22.57, "elapsed_time": "9:34:45", "remaining_time": "1 day, 8:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4050, "total_steps": 17941, "loss": 1.893, "learning_rate": 8.925874809249193e-05, "epoch": 0.22573992531074077, "percentage": 22.57, "elapsed_time": "9:34:54", "remaining_time": "1 day, 8:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4051, "total_steps": 17941, "loss": 1.6987, "learning_rate": 8.925323330801345e-05, "epoch": 0.2257956635639039, "percentage": 22.58, "elapsed_time": "9:35:03", "remaining_time": "1 day, 8:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4052, "total_steps": 17941, "loss": 1.4703, "learning_rate": 8.924771727865126e-05, "epoch": 0.22585140181706706, "percentage": 22.59, "elapsed_time": "9:35:11", "remaining_time": "1 day, 8:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4053, "total_steps": 17941, "loss": 1.1188, "learning_rate": 8.924220000458032e-05, "epoch": 0.2259071400702302, "percentage": 22.59, "elapsed_time": "9:35:20", "remaining_time": "1 day, 8:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4054, "total_steps": 17941, "loss": 1.8899, "learning_rate": 8.92366814859756e-05, "epoch": 0.22596287832339335, "percentage": 22.6, "elapsed_time": "9:35:28", "remaining_time": "1 day, 8:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4055, "total_steps": 17941, "loss": 1.7006, "learning_rate": 8.923116172301208e-05, "epoch": 0.2260186165765565, "percentage": 22.6, "elapsed_time": "9:35:36", "remaining_time": "1 day, 8:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4056, "total_steps": 17941, "loss": 1.7435, "learning_rate": 8.922564071586487e-05, "epoch": 0.22607435482971963, "percentage": 22.61, "elapsed_time": "9:35:45", "remaining_time": "1 day, 8:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4057, "total_steps": 17941, "loss": 1.7926, "learning_rate": 8.922011846470903e-05, "epoch": 0.2261300930828828, "percentage": 22.61, "elapsed_time": "9:35:53", "remaining_time": "1 day, 8:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4058, "total_steps": 17941, "loss": 1.8028, "learning_rate": 8.921459496971971e-05, "epoch": 0.22618583133604592, "percentage": 22.62, "elapsed_time": "9:36:02", "remaining_time": "1 day, 8:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4059, "total_steps": 17941, "loss": 1.7713, "learning_rate": 8.920907023107208e-05, "epoch": 0.22624156958920907, "percentage": 22.62, "elapsed_time": "9:36:10", "remaining_time": "1 day, 8:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4060, "total_steps": 17941, "loss": 1.8308, "learning_rate": 8.920354424894133e-05, "epoch": 0.22629730784237223, "percentage": 22.63, "elapsed_time": "9:36:19", "remaining_time": "1 day, 8:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4061, "total_steps": 17941, "loss": 1.7824, "learning_rate": 8.919801702350272e-05, "epoch": 0.22635304609553536, "percentage": 22.64, "elapsed_time": "9:36:27", "remaining_time": "1 day, 8:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4062, "total_steps": 17941, "loss": 1.6801, "learning_rate": 8.919248855493156e-05, "epoch": 0.22640878434869852, "percentage": 22.64, "elapsed_time": "9:36:36", "remaining_time": "1 day, 8:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4063, "total_steps": 17941, "loss": 1.7266, "learning_rate": 8.918695884340318e-05, "epoch": 0.22646452260186165, "percentage": 22.65, "elapsed_time": "9:36:44", "remaining_time": "1 day, 8:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4064, "total_steps": 17941, "loss": 1.9331, "learning_rate": 8.918142788909294e-05, "epoch": 0.2265202608550248, "percentage": 22.65, "elapsed_time": "9:36:53", "remaining_time": "1 day, 8:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4065, "total_steps": 17941, "loss": 1.8074, "learning_rate": 8.917589569217624e-05, "epoch": 0.22657599910818796, "percentage": 22.66, "elapsed_time": "9:37:01", "remaining_time": "1 day, 8:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4066, "total_steps": 17941, "loss": 1.8719, "learning_rate": 8.917036225282855e-05, "epoch": 0.2266317373613511, "percentage": 22.66, "elapsed_time": "9:37:10", "remaining_time": "1 day, 8:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4067, "total_steps": 17941, "loss": 1.7155, "learning_rate": 8.916482757122535e-05, "epoch": 0.22668747561451424, "percentage": 22.67, "elapsed_time": "9:37:19", "remaining_time": "1 day, 8:49:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4068, "total_steps": 17941, "loss": 1.8401, "learning_rate": 8.915929164754215e-05, "epoch": 0.22674321386767737, "percentage": 22.67, "elapsed_time": "9:37:28", "remaining_time": "1 day, 8:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4069, "total_steps": 17941, "loss": 1.6825, "learning_rate": 8.915375448195455e-05, "epoch": 0.22679895212084053, "percentage": 22.68, "elapsed_time": "9:37:36", "remaining_time": "1 day, 8:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4070, "total_steps": 17941, "loss": 1.6471, "learning_rate": 8.914821607463814e-05, "epoch": 0.2268546903740037, "percentage": 22.69, "elapsed_time": "9:37:44", "remaining_time": "1 day, 8:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4071, "total_steps": 17941, "loss": 2.0078, "learning_rate": 8.914267642576857e-05, "epoch": 0.22691042862716682, "percentage": 22.69, "elapsed_time": "9:37:53", "remaining_time": "1 day, 8:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4072, "total_steps": 17941, "loss": 1.8949, "learning_rate": 8.91371355355215e-05, "epoch": 0.22696616688032997, "percentage": 22.7, "elapsed_time": "9:38:01", "remaining_time": "1 day, 8:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4073, "total_steps": 17941, "loss": 1.787, "learning_rate": 8.913159340407269e-05, "epoch": 0.22702190513349313, "percentage": 22.7, "elapsed_time": "9:38:10", "remaining_time": "1 day, 8:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4074, "total_steps": 17941, "loss": 1.6022, "learning_rate": 8.912605003159788e-05, "epoch": 0.22707764338665626, "percentage": 22.71, "elapsed_time": "9:38:18", "remaining_time": "1 day, 8:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4075, "total_steps": 17941, "loss": 1.6286, "learning_rate": 8.912050541827291e-05, "epoch": 0.22713338163981941, "percentage": 22.71, "elapsed_time": "9:38:27", "remaining_time": "1 day, 8:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4076, "total_steps": 17941, "loss": 1.8091, "learning_rate": 8.911495956427357e-05, "epoch": 0.22718911989298254, "percentage": 22.72, "elapsed_time": "9:38:35", "remaining_time": "1 day, 8:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4077, "total_steps": 17941, "loss": 1.7518, "learning_rate": 8.910941246977577e-05, "epoch": 0.2272448581461457, "percentage": 22.72, "elapsed_time": "9:38:44", "remaining_time": "1 day, 8:48:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4078, "total_steps": 17941, "loss": 1.7051, "learning_rate": 8.910386413495544e-05, "epoch": 0.22730059639930886, "percentage": 22.73, "elapsed_time": "9:38:52", "remaining_time": "1 day, 8:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4079, "total_steps": 17941, "loss": 1.5667, "learning_rate": 8.909831455998854e-05, "epoch": 0.227356334652472, "percentage": 22.74, "elapsed_time": "9:39:01", "remaining_time": "1 day, 8:47:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4080, "total_steps": 17941, "loss": 1.6594, "learning_rate": 8.909276374505104e-05, "epoch": 0.22741207290563514, "percentage": 22.74, "elapsed_time": "9:39:09", "remaining_time": "1 day, 8:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4081, "total_steps": 17941, "loss": 1.7931, "learning_rate": 8.908721169031901e-05, "epoch": 0.22746781115879827, "percentage": 22.75, "elapsed_time": "9:39:18", "remaining_time": "1 day, 8:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4082, "total_steps": 17941, "loss": 2.0539, "learning_rate": 8.908165839596852e-05, "epoch": 0.22752354941196143, "percentage": 22.75, "elapsed_time": "9:39:26", "remaining_time": "1 day, 8:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4083, "total_steps": 17941, "loss": 2.1055, "learning_rate": 8.907610386217568e-05, "epoch": 0.22757928766512459, "percentage": 22.76, "elapsed_time": "9:39:34", "remaining_time": "1 day, 8:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4084, "total_steps": 17941, "loss": 1.8536, "learning_rate": 8.907054808911668e-05, "epoch": 0.22763502591828771, "percentage": 22.76, "elapsed_time": "9:39:43", "remaining_time": "1 day, 8:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4085, "total_steps": 17941, "loss": 1.5868, "learning_rate": 8.906499107696766e-05, "epoch": 0.22769076417145087, "percentage": 22.77, "elapsed_time": "9:39:51", "remaining_time": "1 day, 8:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4086, "total_steps": 17941, "loss": 1.611, "learning_rate": 8.90594328259049e-05, "epoch": 0.227746502424614, "percentage": 22.77, "elapsed_time": "9:40:00", "remaining_time": "1 day, 8:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4087, "total_steps": 17941, "loss": 1.3946, "learning_rate": 8.905387333610466e-05, "epoch": 0.22780224067777716, "percentage": 22.78, "elapsed_time": "9:40:09", "remaining_time": "1 day, 8:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4088, "total_steps": 17941, "loss": 1.9145, "learning_rate": 8.904831260774327e-05, "epoch": 0.2278579789309403, "percentage": 22.79, "elapsed_time": "9:40:17", "remaining_time": "1 day, 8:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4089, "total_steps": 17941, "loss": 1.8516, "learning_rate": 8.904275064099708e-05, "epoch": 0.22791371718410344, "percentage": 22.79, "elapsed_time": "9:40:26", "remaining_time": "1 day, 8:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4090, "total_steps": 17941, "loss": 1.7872, "learning_rate": 8.903718743604244e-05, "epoch": 0.2279694554372666, "percentage": 22.8, "elapsed_time": "9:40:35", "remaining_time": "1 day, 8:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4091, "total_steps": 17941, "loss": 1.5771, "learning_rate": 8.903162299305585e-05, "epoch": 0.22802519369042973, "percentage": 22.8, "elapsed_time": "9:40:43", "remaining_time": "1 day, 8:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4092, "total_steps": 17941, "loss": 1.7952, "learning_rate": 8.902605731221373e-05, "epoch": 0.22808093194359289, "percentage": 22.81, "elapsed_time": "9:40:51", "remaining_time": "1 day, 8:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4093, "total_steps": 17941, "loss": 1.7417, "learning_rate": 8.902049039369261e-05, "epoch": 0.22813667019675604, "percentage": 22.81, "elapsed_time": "9:41:00", "remaining_time": "1 day, 8:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4094, "total_steps": 17941, "loss": 1.6605, "learning_rate": 8.901492223766906e-05, "epoch": 0.22819240844991917, "percentage": 22.82, "elapsed_time": "9:41:09", "remaining_time": "1 day, 8:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4095, "total_steps": 17941, "loss": 1.8027, "learning_rate": 8.900935284431961e-05, "epoch": 0.22824814670308233, "percentage": 22.82, "elapsed_time": "9:41:17", "remaining_time": "1 day, 8:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4096, "total_steps": 17941, "loss": 1.6941, "learning_rate": 8.900378221382097e-05, "epoch": 0.22830388495624548, "percentage": 22.83, "elapsed_time": "9:41:26", "remaining_time": "1 day, 8:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4097, "total_steps": 17941, "loss": 1.9182, "learning_rate": 8.899821034634974e-05, "epoch": 0.2283596232094086, "percentage": 22.84, "elapsed_time": "9:41:34", "remaining_time": "1 day, 8:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4098, "total_steps": 17941, "loss": 1.7512, "learning_rate": 8.899263724208266e-05, "epoch": 0.22841536146257177, "percentage": 22.84, "elapsed_time": "9:41:43", "remaining_time": "1 day, 8:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4099, "total_steps": 17941, "loss": 1.8606, "learning_rate": 8.898706290119647e-05, "epoch": 0.2284710997157349, "percentage": 22.85, "elapsed_time": "9:41:51", "remaining_time": "1 day, 8:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4100, "total_steps": 17941, "loss": 1.7136, "learning_rate": 8.898148732386795e-05, "epoch": 0.22852683796889806, "percentage": 22.85, "elapsed_time": "9:42:00", "remaining_time": "1 day, 8:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4101, "total_steps": 17941, "loss": 1.8315, "learning_rate": 8.897591051027394e-05, "epoch": 0.2285825762220612, "percentage": 22.86, "elapsed_time": "9:42:09", "remaining_time": "1 day, 8:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4102, "total_steps": 17941, "loss": 1.4505, "learning_rate": 8.89703324605913e-05, "epoch": 0.22863831447522434, "percentage": 22.86, "elapsed_time": "9:42:17", "remaining_time": "1 day, 8:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4103, "total_steps": 17941, "loss": 1.662, "learning_rate": 8.896475317499691e-05, "epoch": 0.2286940527283875, "percentage": 22.87, "elapsed_time": "9:42:26", "remaining_time": "1 day, 8:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4104, "total_steps": 17941, "loss": 1.6713, "learning_rate": 8.895917265366773e-05, "epoch": 0.22874979098155063, "percentage": 22.87, "elapsed_time": "9:42:34", "remaining_time": "1 day, 8:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4105, "total_steps": 17941, "loss": 1.6645, "learning_rate": 8.895359089678075e-05, "epoch": 0.22880552923471378, "percentage": 22.88, "elapsed_time": "9:42:42", "remaining_time": "1 day, 8:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4106, "total_steps": 17941, "loss": 1.7344, "learning_rate": 8.894800790451298e-05, "epoch": 0.22886126748787694, "percentage": 22.89, "elapsed_time": "9:42:51", "remaining_time": "1 day, 8:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4107, "total_steps": 17941, "loss": 1.7137, "learning_rate": 8.894242367704149e-05, "epoch": 0.22891700574104007, "percentage": 22.89, "elapsed_time": "9:42:59", "remaining_time": "1 day, 8:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4108, "total_steps": 17941, "loss": 1.689, "learning_rate": 8.893683821454335e-05, "epoch": 0.22897274399420323, "percentage": 22.9, "elapsed_time": "9:43:08", "remaining_time": "1 day, 8:43:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4109, "total_steps": 17941, "loss": 1.7345, "learning_rate": 8.893125151719574e-05, "epoch": 0.22902848224736636, "percentage": 22.9, "elapsed_time": "9:43:16", "remaining_time": "1 day, 8:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4110, "total_steps": 17941, "loss": 1.6921, "learning_rate": 8.89256635851758e-05, "epoch": 0.2290842205005295, "percentage": 22.91, "elapsed_time": "9:43:25", "remaining_time": "1 day, 8:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4111, "total_steps": 17941, "loss": 1.7282, "learning_rate": 8.892007441866076e-05, "epoch": 0.22913995875369267, "percentage": 22.91, "elapsed_time": "9:43:33", "remaining_time": "1 day, 8:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4112, "total_steps": 17941, "loss": 1.6771, "learning_rate": 8.89144840178279e-05, "epoch": 0.2291956970068558, "percentage": 22.92, "elapsed_time": "9:43:42", "remaining_time": "1 day, 8:43:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4113, "total_steps": 17941, "loss": 1.9474, "learning_rate": 8.89088923828545e-05, "epoch": 0.22925143526001895, "percentage": 22.93, "elapsed_time": "9:43:51", "remaining_time": "1 day, 8:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4114, "total_steps": 17941, "loss": 1.7969, "learning_rate": 8.890329951391787e-05, "epoch": 0.22930717351318208, "percentage": 22.93, "elapsed_time": "9:43:59", "remaining_time": "1 day, 8:42:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4115, "total_steps": 17941, "loss": 1.6611, "learning_rate": 8.88977054111954e-05, "epoch": 0.22936291176634524, "percentage": 22.94, "elapsed_time": "9:44:08", "remaining_time": "1 day, 8:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4116, "total_steps": 17941, "loss": 1.6558, "learning_rate": 8.889211007486451e-05, "epoch": 0.2294186500195084, "percentage": 22.94, "elapsed_time": "9:44:16", "remaining_time": "1 day, 8:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4117, "total_steps": 17941, "loss": 1.712, "learning_rate": 8.888651350510265e-05, "epoch": 0.22947438827267153, "percentage": 22.95, "elapsed_time": "9:44:25", "remaining_time": "1 day, 8:42:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4118, "total_steps": 17941, "loss": 1.8012, "learning_rate": 8.888091570208729e-05, "epoch": 0.22953012652583468, "percentage": 22.95, "elapsed_time": "9:44:33", "remaining_time": "1 day, 8:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4119, "total_steps": 17941, "loss": 2.0303, "learning_rate": 8.887531666599598e-05, "epoch": 0.22958586477899784, "percentage": 22.96, "elapsed_time": "9:44:42", "remaining_time": "1 day, 8:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4120, "total_steps": 17941, "loss": 1.6133, "learning_rate": 8.88697163970063e-05, "epoch": 0.22964160303216097, "percentage": 22.96, "elapsed_time": "9:44:50", "remaining_time": "1 day, 8:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4121, "total_steps": 17941, "loss": 1.6117, "learning_rate": 8.886411489529583e-05, "epoch": 0.22969734128532412, "percentage": 22.97, "elapsed_time": "9:44:59", "remaining_time": "1 day, 8:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4122, "total_steps": 17941, "loss": 1.8159, "learning_rate": 8.885851216104222e-05, "epoch": 0.22975307953848725, "percentage": 22.98, "elapsed_time": "9:45:07", "remaining_time": "1 day, 8:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4123, "total_steps": 17941, "loss": 1.8198, "learning_rate": 8.885290819442319e-05, "epoch": 0.2298088177916504, "percentage": 22.98, "elapsed_time": "9:45:16", "remaining_time": "1 day, 8:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4124, "total_steps": 17941, "loss": 1.8839, "learning_rate": 8.884730299561642e-05, "epoch": 0.22986455604481357, "percentage": 22.99, "elapsed_time": "9:45:24", "remaining_time": "1 day, 8:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4125, "total_steps": 17941, "loss": 1.5981, "learning_rate": 8.88416965647997e-05, "epoch": 0.2299202942979767, "percentage": 22.99, "elapsed_time": "9:45:32", "remaining_time": "1 day, 8:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4126, "total_steps": 17941, "loss": 1.5802, "learning_rate": 8.883608890215083e-05, "epoch": 0.22997603255113985, "percentage": 23.0, "elapsed_time": "9:45:41", "remaining_time": "1 day, 8:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4127, "total_steps": 17941, "loss": 1.7884, "learning_rate": 8.883048000784764e-05, "epoch": 0.23003177080430298, "percentage": 23.0, "elapsed_time": "9:45:49", "remaining_time": "1 day, 8:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4128, "total_steps": 17941, "loss": 1.8968, "learning_rate": 8.882486988206803e-05, "epoch": 0.23008750905746614, "percentage": 23.01, "elapsed_time": "9:45:58", "remaining_time": "1 day, 8:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4129, "total_steps": 17941, "loss": 1.5026, "learning_rate": 8.881925852498991e-05, "epoch": 0.2301432473106293, "percentage": 23.01, "elapsed_time": "9:46:06", "remaining_time": "1 day, 8:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4130, "total_steps": 17941, "loss": 2.02, "learning_rate": 8.881364593679124e-05, "epoch": 0.23019898556379242, "percentage": 23.02, "elapsed_time": "9:46:15", "remaining_time": "1 day, 8:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4131, "total_steps": 17941, "loss": 1.8447, "learning_rate": 8.880803211765003e-05, "epoch": 0.23025472381695558, "percentage": 23.03, "elapsed_time": "9:46:24", "remaining_time": "1 day, 8:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4132, "total_steps": 17941, "loss": 1.8952, "learning_rate": 8.880241706774431e-05, "epoch": 0.2303104620701187, "percentage": 23.03, "elapsed_time": "9:46:32", "remaining_time": "1 day, 8:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4133, "total_steps": 17941, "loss": 1.79, "learning_rate": 8.879680078725214e-05, "epoch": 0.23036620032328187, "percentage": 23.04, "elapsed_time": "9:46:41", "remaining_time": "1 day, 8:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4134, "total_steps": 17941, "loss": 1.31, "learning_rate": 8.879118327635165e-05, "epoch": 0.23042193857644502, "percentage": 23.04, "elapsed_time": "9:46:49", "remaining_time": "1 day, 8:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4135, "total_steps": 17941, "loss": 1.388, "learning_rate": 8.8785564535221e-05, "epoch": 0.23047767682960815, "percentage": 23.05, "elapsed_time": "9:46:58", "remaining_time": "1 day, 8:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4136, "total_steps": 17941, "loss": 1.8455, "learning_rate": 8.877994456403838e-05, "epoch": 0.2305334150827713, "percentage": 23.05, "elapsed_time": "9:47:06", "remaining_time": "1 day, 8:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4137, "total_steps": 17941, "loss": 1.513, "learning_rate": 8.877432336298201e-05, "epoch": 0.23058915333593444, "percentage": 23.06, "elapsed_time": "9:47:15", "remaining_time": "1 day, 8:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4138, "total_steps": 17941, "loss": 1.6449, "learning_rate": 8.876870093223019e-05, "epoch": 0.2306448915890976, "percentage": 23.06, "elapsed_time": "9:47:23", "remaining_time": "1 day, 8:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4139, "total_steps": 17941, "loss": 2.0891, "learning_rate": 8.87630772719612e-05, "epoch": 0.23070062984226075, "percentage": 23.07, "elapsed_time": "9:47:32", "remaining_time": "1 day, 8:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4140, "total_steps": 17941, "loss": 1.6314, "learning_rate": 8.875745238235341e-05, "epoch": 0.23075636809542388, "percentage": 23.08, "elapsed_time": "9:47:40", "remaining_time": "1 day, 8:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4141, "total_steps": 17941, "loss": 1.5437, "learning_rate": 8.87518262635852e-05, "epoch": 0.23081210634858704, "percentage": 23.08, "elapsed_time": "9:47:49", "remaining_time": "1 day, 8:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4142, "total_steps": 17941, "loss": 1.8075, "learning_rate": 8.8746198915835e-05, "epoch": 0.2308678446017502, "percentage": 23.09, "elapsed_time": "9:47:57", "remaining_time": "1 day, 8:38:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4143, "total_steps": 17941, "loss": 1.7196, "learning_rate": 8.874057033928128e-05, "epoch": 0.23092358285491332, "percentage": 23.09, "elapsed_time": "9:48:06", "remaining_time": "1 day, 8:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4144, "total_steps": 17941, "loss": 1.7623, "learning_rate": 8.873494053410254e-05, "epoch": 0.23097932110807648, "percentage": 23.1, "elapsed_time": "9:48:14", "remaining_time": "1 day, 8:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4145, "total_steps": 17941, "loss": 1.6683, "learning_rate": 8.872930950047733e-05, "epoch": 0.2310350593612396, "percentage": 23.1, "elapsed_time": "9:48:23", "remaining_time": "1 day, 8:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4146, "total_steps": 17941, "loss": 1.8277, "learning_rate": 8.872367723858422e-05, "epoch": 0.23109079761440277, "percentage": 23.11, "elapsed_time": "9:48:32", "remaining_time": "1 day, 8:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4147, "total_steps": 17941, "loss": 1.9413, "learning_rate": 8.871804374860185e-05, "epoch": 0.23114653586756592, "percentage": 23.11, "elapsed_time": "9:48:40", "remaining_time": "1 day, 8:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4148, "total_steps": 17941, "loss": 1.7471, "learning_rate": 8.871240903070888e-05, "epoch": 0.23120227412072905, "percentage": 23.12, "elapsed_time": "9:48:49", "remaining_time": "1 day, 8:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4149, "total_steps": 17941, "loss": 2.0195, "learning_rate": 8.870677308508399e-05, "epoch": 0.2312580123738922, "percentage": 23.13, "elapsed_time": "9:48:57", "remaining_time": "1 day, 8:37:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4150, "total_steps": 17941, "loss": 1.5686, "learning_rate": 8.870113591190595e-05, "epoch": 0.23131375062705534, "percentage": 23.13, "elapsed_time": "9:49:06", "remaining_time": "1 day, 8:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4151, "total_steps": 17941, "loss": 1.7178, "learning_rate": 8.869549751135352e-05, "epoch": 0.2313694888802185, "percentage": 23.14, "elapsed_time": "9:49:14", "remaining_time": "1 day, 8:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4152, "total_steps": 17941, "loss": 1.6998, "learning_rate": 8.868985788360551e-05, "epoch": 0.23142522713338165, "percentage": 23.14, "elapsed_time": "9:49:23", "remaining_time": "1 day, 8:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4153, "total_steps": 17941, "loss": 1.5045, "learning_rate": 8.868421702884077e-05, "epoch": 0.23148096538654478, "percentage": 23.15, "elapsed_time": "9:49:31", "remaining_time": "1 day, 8:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4154, "total_steps": 17941, "loss": 1.6035, "learning_rate": 8.867857494723824e-05, "epoch": 0.23153670363970794, "percentage": 23.15, "elapsed_time": "9:49:40", "remaining_time": "1 day, 8:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4155, "total_steps": 17941, "loss": 1.8108, "learning_rate": 8.867293163897681e-05, "epoch": 0.23159244189287106, "percentage": 23.16, "elapsed_time": "9:49:48", "remaining_time": "1 day, 8:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4156, "total_steps": 17941, "loss": 1.5952, "learning_rate": 8.866728710423547e-05, "epoch": 0.23164818014603422, "percentage": 23.16, "elapsed_time": "9:49:57", "remaining_time": "1 day, 8:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4157, "total_steps": 17941, "loss": 1.8621, "learning_rate": 8.866164134319323e-05, "epoch": 0.23170391839919738, "percentage": 23.17, "elapsed_time": "9:50:05", "remaining_time": "1 day, 8:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4158, "total_steps": 17941, "loss": 1.5408, "learning_rate": 8.865599435602915e-05, "epoch": 0.2317596566523605, "percentage": 23.18, "elapsed_time": "9:50:14", "remaining_time": "1 day, 8:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4159, "total_steps": 17941, "loss": 2.2779, "learning_rate": 8.86503461429223e-05, "epoch": 0.23181539490552366, "percentage": 23.18, "elapsed_time": "9:50:23", "remaining_time": "1 day, 8:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4160, "total_steps": 17941, "loss": 1.6574, "learning_rate": 8.86446967040518e-05, "epoch": 0.2318711331586868, "percentage": 23.19, "elapsed_time": "9:50:31", "remaining_time": "1 day, 8:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4161, "total_steps": 17941, "loss": 1.6591, "learning_rate": 8.863904603959686e-05, "epoch": 0.23192687141184995, "percentage": 23.19, "elapsed_time": "9:50:40", "remaining_time": "1 day, 8:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4162, "total_steps": 17941, "loss": 1.7869, "learning_rate": 8.863339414973664e-05, "epoch": 0.2319826096650131, "percentage": 23.2, "elapsed_time": "9:50:49", "remaining_time": "1 day, 8:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4163, "total_steps": 17941, "loss": 1.8322, "learning_rate": 8.862774103465042e-05, "epoch": 0.23203834791817624, "percentage": 23.2, "elapsed_time": "9:50:57", "remaining_time": "1 day, 8:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4164, "total_steps": 17941, "loss": 1.5869, "learning_rate": 8.862208669451748e-05, "epoch": 0.2320940861713394, "percentage": 23.21, "elapsed_time": "9:51:05", "remaining_time": "1 day, 8:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4165, "total_steps": 17941, "loss": 1.9482, "learning_rate": 8.861643112951712e-05, "epoch": 0.23214982442450255, "percentage": 23.21, "elapsed_time": "9:51:14", "remaining_time": "1 day, 8:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4166, "total_steps": 17941, "loss": 1.9292, "learning_rate": 8.86107743398287e-05, "epoch": 0.23220556267766568, "percentage": 23.22, "elapsed_time": "9:51:23", "remaining_time": "1 day, 8:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4167, "total_steps": 17941, "loss": 1.5677, "learning_rate": 8.860511632563166e-05, "epoch": 0.23226130093082883, "percentage": 23.23, "elapsed_time": "9:51:31", "remaining_time": "1 day, 8:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4168, "total_steps": 17941, "loss": 1.8537, "learning_rate": 8.85994570871054e-05, "epoch": 0.23231703918399196, "percentage": 23.23, "elapsed_time": "9:51:39", "remaining_time": "1 day, 8:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4169, "total_steps": 17941, "loss": 1.7031, "learning_rate": 8.859379662442941e-05, "epoch": 0.23237277743715512, "percentage": 23.24, "elapsed_time": "9:51:48", "remaining_time": "1 day, 8:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4170, "total_steps": 17941, "loss": 1.9365, "learning_rate": 8.858813493778322e-05, "epoch": 0.23242851569031828, "percentage": 23.24, "elapsed_time": "9:51:56", "remaining_time": "1 day, 8:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4171, "total_steps": 17941, "loss": 1.7084, "learning_rate": 8.858247202734637e-05, "epoch": 0.2324842539434814, "percentage": 23.25, "elapsed_time": "9:52:05", "remaining_time": "1 day, 8:34:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4172, "total_steps": 17941, "loss": 1.6353, "learning_rate": 8.857680789329844e-05, "epoch": 0.23253999219664456, "percentage": 23.25, "elapsed_time": "9:52:13", "remaining_time": "1 day, 8:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4173, "total_steps": 17941, "loss": 1.523, "learning_rate": 8.85711425358191e-05, "epoch": 0.2325957304498077, "percentage": 23.26, "elapsed_time": "9:52:22", "remaining_time": "1 day, 8:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4174, "total_steps": 17941, "loss": 1.38, "learning_rate": 8.8565475955088e-05, "epoch": 0.23265146870297085, "percentage": 23.27, "elapsed_time": "9:52:30", "remaining_time": "1 day, 8:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4175, "total_steps": 17941, "loss": 1.5261, "learning_rate": 8.855980815128486e-05, "epoch": 0.232707206956134, "percentage": 23.27, "elapsed_time": "9:52:40", "remaining_time": "1 day, 8:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4176, "total_steps": 17941, "loss": 1.7725, "learning_rate": 8.85541391245894e-05, "epoch": 0.23276294520929713, "percentage": 23.28, "elapsed_time": "9:52:48", "remaining_time": "1 day, 8:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4177, "total_steps": 17941, "loss": 1.4857, "learning_rate": 8.854846887518147e-05, "epoch": 0.2328186834624603, "percentage": 23.28, "elapsed_time": "9:52:56", "remaining_time": "1 day, 8:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4178, "total_steps": 17941, "loss": 1.8393, "learning_rate": 8.854279740324086e-05, "epoch": 0.23287442171562342, "percentage": 23.29, "elapsed_time": "9:53:06", "remaining_time": "1 day, 8:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4179, "total_steps": 17941, "loss": 1.6455, "learning_rate": 8.85371247089474e-05, "epoch": 0.23293015996878658, "percentage": 23.29, "elapsed_time": "9:53:14", "remaining_time": "1 day, 8:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4180, "total_steps": 17941, "loss": 1.6739, "learning_rate": 8.853145079248106e-05, "epoch": 0.23298589822194973, "percentage": 23.3, "elapsed_time": "9:53:23", "remaining_time": "1 day, 8:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4181, "total_steps": 17941, "loss": 1.6312, "learning_rate": 8.852577565402175e-05, "epoch": 0.23304163647511286, "percentage": 23.3, "elapsed_time": "9:53:31", "remaining_time": "1 day, 8:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4182, "total_steps": 17941, "loss": 1.8519, "learning_rate": 8.852009929374945e-05, "epoch": 0.23309737472827602, "percentage": 23.31, "elapsed_time": "9:53:40", "remaining_time": "1 day, 8:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4183, "total_steps": 17941, "loss": 1.6562, "learning_rate": 8.851442171184418e-05, "epoch": 0.23315311298143915, "percentage": 23.32, "elapsed_time": "9:53:48", "remaining_time": "1 day, 8:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4184, "total_steps": 17941, "loss": 1.7597, "learning_rate": 8.850874290848603e-05, "epoch": 0.2332088512346023, "percentage": 23.32, "elapsed_time": "9:53:57", "remaining_time": "1 day, 8:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4185, "total_steps": 17941, "loss": 1.7217, "learning_rate": 8.850306288385505e-05, "epoch": 0.23326458948776546, "percentage": 23.33, "elapsed_time": "9:54:05", "remaining_time": "1 day, 8:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4186, "total_steps": 17941, "loss": 1.7315, "learning_rate": 8.849738163813143e-05, "epoch": 0.2333203277409286, "percentage": 23.33, "elapsed_time": "9:54:14", "remaining_time": "1 day, 8:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4187, "total_steps": 17941, "loss": 1.7419, "learning_rate": 8.849169917149531e-05, "epoch": 0.23337606599409175, "percentage": 23.34, "elapsed_time": "9:54:22", "remaining_time": "1 day, 8:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4188, "total_steps": 17941, "loss": 1.8088, "learning_rate": 8.848601548412691e-05, "epoch": 0.2334318042472549, "percentage": 23.34, "elapsed_time": "9:54:31", "remaining_time": "1 day, 8:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4189, "total_steps": 17941, "loss": 1.6436, "learning_rate": 8.848033057620651e-05, "epoch": 0.23348754250041803, "percentage": 23.35, "elapsed_time": "9:54:39", "remaining_time": "1 day, 8:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4190, "total_steps": 17941, "loss": 1.6382, "learning_rate": 8.847464444791435e-05, "epoch": 0.2335432807535812, "percentage": 23.35, "elapsed_time": "9:54:48", "remaining_time": "1 day, 8:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4191, "total_steps": 17941, "loss": 1.8993, "learning_rate": 8.846895709943082e-05, "epoch": 0.23359901900674432, "percentage": 23.36, "elapsed_time": "9:54:56", "remaining_time": "1 day, 8:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4192, "total_steps": 17941, "loss": 1.7459, "learning_rate": 8.846326853093623e-05, "epoch": 0.23365475725990748, "percentage": 23.37, "elapsed_time": "9:55:05", "remaining_time": "1 day, 8:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4193, "total_steps": 17941, "loss": 1.618, "learning_rate": 8.845757874261104e-05, "epoch": 0.23371049551307063, "percentage": 23.37, "elapsed_time": "9:55:13", "remaining_time": "1 day, 8:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4194, "total_steps": 17941, "loss": 1.6731, "learning_rate": 8.845188773463566e-05, "epoch": 0.23376623376623376, "percentage": 23.38, "elapsed_time": "9:55:22", "remaining_time": "1 day, 8:31:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4195, "total_steps": 17941, "loss": 1.8368, "learning_rate": 8.84461955071906e-05, "epoch": 0.23382197201939692, "percentage": 23.38, "elapsed_time": "9:55:30", "remaining_time": "1 day, 8:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4196, "total_steps": 17941, "loss": 1.805, "learning_rate": 8.844050206045637e-05, "epoch": 0.23387771027256005, "percentage": 23.39, "elapsed_time": "9:55:39", "remaining_time": "1 day, 8:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4197, "total_steps": 17941, "loss": 1.4806, "learning_rate": 8.843480739461356e-05, "epoch": 0.2339334485257232, "percentage": 23.39, "elapsed_time": "9:55:47", "remaining_time": "1 day, 8:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4198, "total_steps": 17941, "loss": 1.7506, "learning_rate": 8.842911150984272e-05, "epoch": 0.23398918677888636, "percentage": 23.4, "elapsed_time": "9:55:56", "remaining_time": "1 day, 8:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4199, "total_steps": 17941, "loss": 1.8434, "learning_rate": 8.842341440632454e-05, "epoch": 0.2340449250320495, "percentage": 23.4, "elapsed_time": "9:56:05", "remaining_time": "1 day, 8:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4200, "total_steps": 17941, "loss": 1.6289, "learning_rate": 8.841771608423967e-05, "epoch": 0.23410066328521265, "percentage": 23.41, "elapsed_time": "9:56:13", "remaining_time": "1 day, 8:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4201, "total_steps": 17941, "loss": 1.782, "learning_rate": 8.841201654376883e-05, "epoch": 0.23415640153837577, "percentage": 23.42, "elapsed_time": "9:56:21", "remaining_time": "1 day, 8:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4202, "total_steps": 17941, "loss": 1.7904, "learning_rate": 8.84063157850928e-05, "epoch": 0.23421213979153893, "percentage": 23.42, "elapsed_time": "9:56:30", "remaining_time": "1 day, 8:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4203, "total_steps": 17941, "loss": 1.5506, "learning_rate": 8.840061380839235e-05, "epoch": 0.2342678780447021, "percentage": 23.43, "elapsed_time": "9:56:38", "remaining_time": "1 day, 8:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4204, "total_steps": 17941, "loss": 1.7914, "learning_rate": 8.839491061384832e-05, "epoch": 0.23432361629786522, "percentage": 23.43, "elapsed_time": "9:56:47", "remaining_time": "1 day, 8:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4205, "total_steps": 17941, "loss": 1.5682, "learning_rate": 8.838920620164157e-05, "epoch": 0.23437935455102837, "percentage": 23.44, "elapsed_time": "9:56:55", "remaining_time": "1 day, 8:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4206, "total_steps": 17941, "loss": 1.6598, "learning_rate": 8.838350057195304e-05, "epoch": 0.23443509280419153, "percentage": 23.44, "elapsed_time": "9:57:03", "remaining_time": "1 day, 8:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4207, "total_steps": 17941, "loss": 1.6682, "learning_rate": 8.837779372496367e-05, "epoch": 0.23449083105735466, "percentage": 23.45, "elapsed_time": "9:57:13", "remaining_time": "1 day, 8:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4208, "total_steps": 17941, "loss": 1.8047, "learning_rate": 8.837208566085441e-05, "epoch": 0.23454656931051782, "percentage": 23.45, "elapsed_time": "9:57:21", "remaining_time": "1 day, 8:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4209, "total_steps": 17941, "loss": 1.6225, "learning_rate": 8.836637637980636e-05, "epoch": 0.23460230756368095, "percentage": 23.46, "elapsed_time": "9:57:30", "remaining_time": "1 day, 8:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4210, "total_steps": 17941, "loss": 1.7139, "learning_rate": 8.836066588200051e-05, "epoch": 0.2346580458168441, "percentage": 23.47, "elapsed_time": "9:57:38", "remaining_time": "1 day, 8:29:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4211, "total_steps": 17941, "loss": 1.7928, "learning_rate": 8.8354954167618e-05, "epoch": 0.23471378407000726, "percentage": 23.47, "elapsed_time": "9:57:47", "remaining_time": "1 day, 8:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4212, "total_steps": 17941, "loss": 1.7035, "learning_rate": 8.834924123683998e-05, "epoch": 0.2347695223231704, "percentage": 23.48, "elapsed_time": "9:57:55", "remaining_time": "1 day, 8:28:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4213, "total_steps": 17941, "loss": 1.6887, "learning_rate": 8.834352708984762e-05, "epoch": 0.23482526057633354, "percentage": 23.48, "elapsed_time": "9:58:04", "remaining_time": "1 day, 8:28:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4214, "total_steps": 17941, "loss": 1.7476, "learning_rate": 8.833781172682214e-05, "epoch": 0.23488099882949667, "percentage": 23.49, "elapsed_time": "9:58:12", "remaining_time": "1 day, 8:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4215, "total_steps": 17941, "loss": 1.569, "learning_rate": 8.833209514794479e-05, "epoch": 0.23493673708265983, "percentage": 23.49, "elapsed_time": "9:58:21", "remaining_time": "1 day, 8:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4216, "total_steps": 17941, "loss": 1.6762, "learning_rate": 8.832637735339688e-05, "epoch": 0.234992475335823, "percentage": 23.5, "elapsed_time": "9:58:30", "remaining_time": "1 day, 8:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4217, "total_steps": 17941, "loss": 1.6699, "learning_rate": 8.832065834335973e-05, "epoch": 0.23504821358898612, "percentage": 23.5, "elapsed_time": "9:58:38", "remaining_time": "1 day, 8:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4218, "total_steps": 17941, "loss": 1.8292, "learning_rate": 8.831493811801472e-05, "epoch": 0.23510395184214927, "percentage": 23.51, "elapsed_time": "9:58:46", "remaining_time": "1 day, 8:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4219, "total_steps": 17941, "loss": 1.6958, "learning_rate": 8.830921667754328e-05, "epoch": 0.2351596900953124, "percentage": 23.52, "elapsed_time": "9:58:55", "remaining_time": "1 day, 8:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4220, "total_steps": 17941, "loss": 1.7544, "learning_rate": 8.830349402212683e-05, "epoch": 0.23521542834847556, "percentage": 23.52, "elapsed_time": "9:59:03", "remaining_time": "1 day, 8:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4221, "total_steps": 17941, "loss": 1.676, "learning_rate": 8.82977701519469e-05, "epoch": 0.23527116660163871, "percentage": 23.53, "elapsed_time": "9:59:12", "remaining_time": "1 day, 8:27:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4222, "total_steps": 17941, "loss": 1.7395, "learning_rate": 8.829204506718496e-05, "epoch": 0.23532690485480184, "percentage": 23.53, "elapsed_time": "9:59:20", "remaining_time": "1 day, 8:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4223, "total_steps": 17941, "loss": 1.8418, "learning_rate": 8.828631876802263e-05, "epoch": 0.235382643107965, "percentage": 23.54, "elapsed_time": "9:59:29", "remaining_time": "1 day, 8:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4224, "total_steps": 17941, "loss": 1.5981, "learning_rate": 8.828059125464148e-05, "epoch": 0.23543838136112813, "percentage": 23.54, "elapsed_time": "9:59:37", "remaining_time": "1 day, 8:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4225, "total_steps": 17941, "loss": 1.9862, "learning_rate": 8.827486252722316e-05, "epoch": 0.2354941196142913, "percentage": 23.55, "elapsed_time": "9:59:46", "remaining_time": "1 day, 8:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4226, "total_steps": 17941, "loss": 1.9931, "learning_rate": 8.826913258594937e-05, "epoch": 0.23554985786745444, "percentage": 23.55, "elapsed_time": "9:59:54", "remaining_time": "1 day, 8:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4227, "total_steps": 17941, "loss": 1.8651, "learning_rate": 8.826340143100182e-05, "epoch": 0.23560559612061757, "percentage": 23.56, "elapsed_time": "10:00:03", "remaining_time": "1 day, 8:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4228, "total_steps": 17941, "loss": 1.6837, "learning_rate": 8.825766906256228e-05, "epoch": 0.23566133437378073, "percentage": 23.57, "elapsed_time": "10:00:11", "remaining_time": "1 day, 8:26:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4229, "total_steps": 17941, "loss": 1.4064, "learning_rate": 8.825193548081252e-05, "epoch": 0.23571707262694389, "percentage": 23.57, "elapsed_time": "10:00:20", "remaining_time": "1 day, 8:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4230, "total_steps": 17941, "loss": 1.7501, "learning_rate": 8.824620068593439e-05, "epoch": 0.23577281088010701, "percentage": 23.58, "elapsed_time": "10:00:28", "remaining_time": "1 day, 8:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4231, "total_steps": 17941, "loss": 1.7263, "learning_rate": 8.824046467810976e-05, "epoch": 0.23582854913327017, "percentage": 23.58, "elapsed_time": "10:00:37", "remaining_time": "1 day, 8:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4232, "total_steps": 17941, "loss": 1.7752, "learning_rate": 8.823472745752055e-05, "epoch": 0.2358842873864333, "percentage": 23.59, "elapsed_time": "10:00:45", "remaining_time": "1 day, 8:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4233, "total_steps": 17941, "loss": 1.7809, "learning_rate": 8.822898902434873e-05, "epoch": 0.23594002563959646, "percentage": 23.59, "elapsed_time": "10:00:53", "remaining_time": "1 day, 8:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4234, "total_steps": 17941, "loss": 1.5033, "learning_rate": 8.822324937877624e-05, "epoch": 0.2359957638927596, "percentage": 23.6, "elapsed_time": "10:01:02", "remaining_time": "1 day, 8:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4235, "total_steps": 17941, "loss": 1.735, "learning_rate": 8.821750852098515e-05, "epoch": 0.23605150214592274, "percentage": 23.61, "elapsed_time": "10:01:10", "remaining_time": "1 day, 8:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4236, "total_steps": 17941, "loss": 1.8211, "learning_rate": 8.821176645115752e-05, "epoch": 0.2361072403990859, "percentage": 23.61, "elapsed_time": "10:01:19", "remaining_time": "1 day, 8:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4237, "total_steps": 17941, "loss": 1.6501, "learning_rate": 8.820602316947544e-05, "epoch": 0.23616297865224903, "percentage": 23.62, "elapsed_time": "10:01:28", "remaining_time": "1 day, 8:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4238, "total_steps": 17941, "loss": 1.9297, "learning_rate": 8.820027867612107e-05, "epoch": 0.23621871690541218, "percentage": 23.62, "elapsed_time": "10:01:36", "remaining_time": "1 day, 8:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4239, "total_steps": 17941, "loss": 1.7881, "learning_rate": 8.819453297127657e-05, "epoch": 0.23627445515857534, "percentage": 23.63, "elapsed_time": "10:01:44", "remaining_time": "1 day, 8:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4240, "total_steps": 17941, "loss": 1.7629, "learning_rate": 8.818878605512418e-05, "epoch": 0.23633019341173847, "percentage": 23.63, "elapsed_time": "10:01:53", "remaining_time": "1 day, 8:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4241, "total_steps": 17941, "loss": 1.939, "learning_rate": 8.818303792784615e-05, "epoch": 0.23638593166490163, "percentage": 23.64, "elapsed_time": "10:02:01", "remaining_time": "1 day, 8:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4242, "total_steps": 17941, "loss": 1.7058, "learning_rate": 8.817728858962478e-05, "epoch": 0.23644166991806476, "percentage": 23.64, "elapsed_time": "10:02:10", "remaining_time": "1 day, 8:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4243, "total_steps": 17941, "loss": 1.6284, "learning_rate": 8.817153804064241e-05, "epoch": 0.2364974081712279, "percentage": 23.65, "elapsed_time": "10:02:19", "remaining_time": "1 day, 8:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4244, "total_steps": 17941, "loss": 1.7203, "learning_rate": 8.81657862810814e-05, "epoch": 0.23655314642439107, "percentage": 23.66, "elapsed_time": "10:02:27", "remaining_time": "1 day, 8:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4245, "total_steps": 17941, "loss": 2.0629, "learning_rate": 8.816003331112419e-05, "epoch": 0.2366088846775542, "percentage": 23.66, "elapsed_time": "10:02:36", "remaining_time": "1 day, 8:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4246, "total_steps": 17941, "loss": 1.7256, "learning_rate": 8.81542791309532e-05, "epoch": 0.23666462293071736, "percentage": 23.67, "elapsed_time": "10:02:45", "remaining_time": "1 day, 8:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4247, "total_steps": 17941, "loss": 1.6476, "learning_rate": 8.814852374075093e-05, "epoch": 0.23672036118388048, "percentage": 23.67, "elapsed_time": "10:02:54", "remaining_time": "1 day, 8:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4248, "total_steps": 17941, "loss": 1.57, "learning_rate": 8.81427671406999e-05, "epoch": 0.23677609943704364, "percentage": 23.68, "elapsed_time": "10:03:02", "remaining_time": "1 day, 8:23:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4249, "total_steps": 17941, "loss": 1.497, "learning_rate": 8.81370093309827e-05, "epoch": 0.2368318376902068, "percentage": 23.68, "elapsed_time": "10:03:11", "remaining_time": "1 day, 8:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4250, "total_steps": 17941, "loss": 1.9324, "learning_rate": 8.813125031178191e-05, "epoch": 0.23688757594336993, "percentage": 23.69, "elapsed_time": "10:03:19", "remaining_time": "1 day, 8:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4251, "total_steps": 17941, "loss": 1.7841, "learning_rate": 8.812549008328017e-05, "epoch": 0.23694331419653308, "percentage": 23.69, "elapsed_time": "10:03:28", "remaining_time": "1 day, 8:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4252, "total_steps": 17941, "loss": 1.6966, "learning_rate": 8.811972864566018e-05, "epoch": 0.23699905244969624, "percentage": 23.7, "elapsed_time": "10:03:36", "remaining_time": "1 day, 8:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4253, "total_steps": 17941, "loss": 1.6449, "learning_rate": 8.811396599910467e-05, "epoch": 0.23705479070285937, "percentage": 23.71, "elapsed_time": "10:03:45", "remaining_time": "1 day, 8:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4254, "total_steps": 17941, "loss": 1.8372, "learning_rate": 8.810820214379636e-05, "epoch": 0.23711052895602253, "percentage": 23.71, "elapsed_time": "10:03:53", "remaining_time": "1 day, 8:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4255, "total_steps": 17941, "loss": 1.9996, "learning_rate": 8.810243707991805e-05, "epoch": 0.23716626720918565, "percentage": 23.72, "elapsed_time": "10:04:02", "remaining_time": "1 day, 8:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4256, "total_steps": 17941, "loss": 1.7619, "learning_rate": 8.809667080765262e-05, "epoch": 0.2372220054623488, "percentage": 23.72, "elapsed_time": "10:04:10", "remaining_time": "1 day, 8:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4257, "total_steps": 17941, "loss": 1.8621, "learning_rate": 8.809090332718288e-05, "epoch": 0.23727774371551197, "percentage": 23.73, "elapsed_time": "10:04:18", "remaining_time": "1 day, 8:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4258, "total_steps": 17941, "loss": 1.6625, "learning_rate": 8.808513463869179e-05, "epoch": 0.2373334819686751, "percentage": 23.73, "elapsed_time": "10:04:27", "remaining_time": "1 day, 8:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4259, "total_steps": 17941, "loss": 1.5929, "learning_rate": 8.80793647423623e-05, "epoch": 0.23738922022183825, "percentage": 23.74, "elapsed_time": "10:04:35", "remaining_time": "1 day, 8:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4260, "total_steps": 17941, "loss": 1.7551, "learning_rate": 8.807359363837734e-05, "epoch": 0.23744495847500138, "percentage": 23.74, "elapsed_time": "10:04:44", "remaining_time": "1 day, 8:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4261, "total_steps": 17941, "loss": 1.9474, "learning_rate": 8.806782132691999e-05, "epoch": 0.23750069672816454, "percentage": 23.75, "elapsed_time": "10:04:52", "remaining_time": "1 day, 8:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4262, "total_steps": 17941, "loss": 1.6914, "learning_rate": 8.806204780817331e-05, "epoch": 0.2375564349813277, "percentage": 23.76, "elapsed_time": "10:05:01", "remaining_time": "1 day, 8:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4263, "total_steps": 17941, "loss": 1.4148, "learning_rate": 8.805627308232036e-05, "epoch": 0.23761217323449083, "percentage": 23.76, "elapsed_time": "10:05:09", "remaining_time": "1 day, 8:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4264, "total_steps": 17941, "loss": 1.8304, "learning_rate": 8.805049714954434e-05, "epoch": 0.23766791148765398, "percentage": 23.77, "elapsed_time": "10:05:18", "remaining_time": "1 day, 8:21:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4265, "total_steps": 17941, "loss": 1.4575, "learning_rate": 8.804472001002839e-05, "epoch": 0.2377236497408171, "percentage": 23.77, "elapsed_time": "10:05:26", "remaining_time": "1 day, 8:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4266, "total_steps": 17941, "loss": 1.515, "learning_rate": 8.803894166395574e-05, "epoch": 0.23777938799398027, "percentage": 23.78, "elapsed_time": "10:05:34", "remaining_time": "1 day, 8:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4267, "total_steps": 17941, "loss": 1.657, "learning_rate": 8.803316211150964e-05, "epoch": 0.23783512624714342, "percentage": 23.78, "elapsed_time": "10:05:44", "remaining_time": "1 day, 8:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4268, "total_steps": 17941, "loss": 1.5228, "learning_rate": 8.802738135287338e-05, "epoch": 0.23789086450030655, "percentage": 23.79, "elapsed_time": "10:05:52", "remaining_time": "1 day, 8:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4269, "total_steps": 17941, "loss": 1.5667, "learning_rate": 8.802159938823031e-05, "epoch": 0.2379466027534697, "percentage": 23.79, "elapsed_time": "10:06:00", "remaining_time": "1 day, 8:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4270, "total_steps": 17941, "loss": 1.9385, "learning_rate": 8.801581621776379e-05, "epoch": 0.23800234100663284, "percentage": 23.8, "elapsed_time": "10:06:09", "remaining_time": "1 day, 8:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4271, "total_steps": 17941, "loss": 1.9139, "learning_rate": 8.801003184165722e-05, "epoch": 0.238058079259796, "percentage": 23.81, "elapsed_time": "10:06:17", "remaining_time": "1 day, 8:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4272, "total_steps": 17941, "loss": 1.8107, "learning_rate": 8.800424626009407e-05, "epoch": 0.23811381751295915, "percentage": 23.81, "elapsed_time": "10:06:26", "remaining_time": "1 day, 8:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4273, "total_steps": 17941, "loss": 1.72, "learning_rate": 8.799845947325777e-05, "epoch": 0.23816955576612228, "percentage": 23.82, "elapsed_time": "10:06:34", "remaining_time": "1 day, 8:20:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4274, "total_steps": 17941, "loss": 1.6711, "learning_rate": 8.799267148133192e-05, "epoch": 0.23822529401928544, "percentage": 23.82, "elapsed_time": "10:06:43", "remaining_time": "1 day, 8:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4275, "total_steps": 17941, "loss": 1.5716, "learning_rate": 8.798688228450002e-05, "epoch": 0.2382810322724486, "percentage": 23.83, "elapsed_time": "10:06:52", "remaining_time": "1 day, 8:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4276, "total_steps": 17941, "loss": 1.6498, "learning_rate": 8.798109188294572e-05, "epoch": 0.23833677052561172, "percentage": 23.83, "elapsed_time": "10:07:01", "remaining_time": "1 day, 8:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4277, "total_steps": 17941, "loss": 1.8761, "learning_rate": 8.797530027685261e-05, "epoch": 0.23839250877877488, "percentage": 23.84, "elapsed_time": "10:07:10", "remaining_time": "1 day, 8:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4278, "total_steps": 17941, "loss": 1.6984, "learning_rate": 8.796950746640439e-05, "epoch": 0.238448247031938, "percentage": 23.84, "elapsed_time": "10:07:18", "remaining_time": "1 day, 8:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4279, "total_steps": 17941, "loss": 1.3414, "learning_rate": 8.796371345178476e-05, "epoch": 0.23850398528510117, "percentage": 23.85, "elapsed_time": "10:07:27", "remaining_time": "1 day, 8:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4280, "total_steps": 17941, "loss": 1.716, "learning_rate": 8.79579182331775e-05, "epoch": 0.23855972353826432, "percentage": 23.86, "elapsed_time": "10:07:36", "remaining_time": "1 day, 8:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4281, "total_steps": 17941, "loss": 1.6889, "learning_rate": 8.795212181076638e-05, "epoch": 0.23861546179142745, "percentage": 23.86, "elapsed_time": "10:07:44", "remaining_time": "1 day, 8:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4282, "total_steps": 17941, "loss": 1.6941, "learning_rate": 8.794632418473522e-05, "epoch": 0.2386712000445906, "percentage": 23.87, "elapsed_time": "10:07:53", "remaining_time": "1 day, 8:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4283, "total_steps": 17941, "loss": 1.756, "learning_rate": 8.794052535526792e-05, "epoch": 0.23872693829775374, "percentage": 23.87, "elapsed_time": "10:08:01", "remaining_time": "1 day, 8:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4284, "total_steps": 17941, "loss": 1.8349, "learning_rate": 8.793472532254836e-05, "epoch": 0.2387826765509169, "percentage": 23.88, "elapsed_time": "10:08:10", "remaining_time": "1 day, 8:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4285, "total_steps": 17941, "loss": 1.6617, "learning_rate": 8.792892408676048e-05, "epoch": 0.23883841480408005, "percentage": 23.88, "elapsed_time": "10:08:18", "remaining_time": "1 day, 8:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4286, "total_steps": 17941, "loss": 1.5132, "learning_rate": 8.792312164808827e-05, "epoch": 0.23889415305724318, "percentage": 23.89, "elapsed_time": "10:08:27", "remaining_time": "1 day, 8:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4287, "total_steps": 17941, "loss": 1.7937, "learning_rate": 8.791731800671575e-05, "epoch": 0.23894989131040634, "percentage": 23.89, "elapsed_time": "10:08:35", "remaining_time": "1 day, 8:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4288, "total_steps": 17941, "loss": 1.8488, "learning_rate": 8.791151316282698e-05, "epoch": 0.23900562956356947, "percentage": 23.9, "elapsed_time": "10:08:43", "remaining_time": "1 day, 8:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4289, "total_steps": 17941, "loss": 1.7211, "learning_rate": 8.790570711660604e-05, "epoch": 0.23906136781673262, "percentage": 23.91, "elapsed_time": "10:08:52", "remaining_time": "1 day, 8:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4290, "total_steps": 17941, "loss": 1.6015, "learning_rate": 8.789989986823707e-05, "epoch": 0.23911710606989578, "percentage": 23.91, "elapsed_time": "10:09:00", "remaining_time": "1 day, 8:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4291, "total_steps": 17941, "loss": 1.7375, "learning_rate": 8.789409141790426e-05, "epoch": 0.2391728443230589, "percentage": 23.92, "elapsed_time": "10:09:09", "remaining_time": "1 day, 8:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4292, "total_steps": 17941, "loss": 1.7231, "learning_rate": 8.788828176579182e-05, "epoch": 0.23922858257622207, "percentage": 23.92, "elapsed_time": "10:09:17", "remaining_time": "1 day, 8:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4293, "total_steps": 17941, "loss": 1.7355, "learning_rate": 8.788247091208397e-05, "epoch": 0.2392843208293852, "percentage": 23.93, "elapsed_time": "10:09:26", "remaining_time": "1 day, 8:17:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4294, "total_steps": 17941, "loss": 2.0786, "learning_rate": 8.787665885696502e-05, "epoch": 0.23934005908254835, "percentage": 23.93, "elapsed_time": "10:09:35", "remaining_time": "1 day, 8:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4295, "total_steps": 17941, "loss": 1.6045, "learning_rate": 8.78708456006193e-05, "epoch": 0.2393957973357115, "percentage": 23.94, "elapsed_time": "10:09:44", "remaining_time": "1 day, 8:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4296, "total_steps": 17941, "loss": 1.6679, "learning_rate": 8.786503114323113e-05, "epoch": 0.23945153558887464, "percentage": 23.95, "elapsed_time": "10:09:52", "remaining_time": "1 day, 8:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4297, "total_steps": 17941, "loss": 1.6646, "learning_rate": 8.785921548498494e-05, "epoch": 0.2395072738420378, "percentage": 23.95, "elapsed_time": "10:10:01", "remaining_time": "1 day, 8:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4298, "total_steps": 17941, "loss": 1.7888, "learning_rate": 8.785339862606521e-05, "epoch": 0.23956301209520095, "percentage": 23.96, "elapsed_time": "10:10:09", "remaining_time": "1 day, 8:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4299, "total_steps": 17941, "loss": 1.9363, "learning_rate": 8.784758056665634e-05, "epoch": 0.23961875034836408, "percentage": 23.96, "elapsed_time": "10:10:18", "remaining_time": "1 day, 8:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4300, "total_steps": 17941, "loss": 1.8477, "learning_rate": 8.784176130694289e-05, "epoch": 0.23967448860152724, "percentage": 23.97, "elapsed_time": "10:10:26", "remaining_time": "1 day, 8:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4301, "total_steps": 17941, "loss": 1.9106, "learning_rate": 8.783594084710941e-05, "epoch": 0.23973022685469036, "percentage": 23.97, "elapsed_time": "10:10:35", "remaining_time": "1 day, 8:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4302, "total_steps": 17941, "loss": 1.7685, "learning_rate": 8.783011918734048e-05, "epoch": 0.23978596510785352, "percentage": 23.98, "elapsed_time": "10:10:43", "remaining_time": "1 day, 8:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4303, "total_steps": 17941, "loss": 1.6641, "learning_rate": 8.782429632782073e-05, "epoch": 0.23984170336101668, "percentage": 23.98, "elapsed_time": "10:10:52", "remaining_time": "1 day, 8:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4304, "total_steps": 17941, "loss": 1.8908, "learning_rate": 8.781847226873484e-05, "epoch": 0.2398974416141798, "percentage": 23.99, "elapsed_time": "10:11:00", "remaining_time": "1 day, 8:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4305, "total_steps": 17941, "loss": 1.5571, "learning_rate": 8.78126470102675e-05, "epoch": 0.23995317986734296, "percentage": 24.0, "elapsed_time": "10:11:09", "remaining_time": "1 day, 8:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4306, "total_steps": 17941, "loss": 1.514, "learning_rate": 8.780682055260348e-05, "epoch": 0.2400089181205061, "percentage": 24.0, "elapsed_time": "10:11:17", "remaining_time": "1 day, 8:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4307, "total_steps": 17941, "loss": 1.581, "learning_rate": 8.780099289592751e-05, "epoch": 0.24006465637366925, "percentage": 24.01, "elapsed_time": "10:11:26", "remaining_time": "1 day, 8:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4308, "total_steps": 17941, "loss": 1.7344, "learning_rate": 8.779516404042446e-05, "epoch": 0.2401203946268324, "percentage": 24.01, "elapsed_time": "10:11:35", "remaining_time": "1 day, 8:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4309, "total_steps": 17941, "loss": 1.7162, "learning_rate": 8.778933398627915e-05, "epoch": 0.24017613287999554, "percentage": 24.02, "elapsed_time": "10:11:44", "remaining_time": "1 day, 8:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4310, "total_steps": 17941, "loss": 1.7958, "learning_rate": 8.778350273367653e-05, "epoch": 0.2402318711331587, "percentage": 24.02, "elapsed_time": "10:11:52", "remaining_time": "1 day, 8:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4311, "total_steps": 17941, "loss": 1.4958, "learning_rate": 8.777767028280145e-05, "epoch": 0.24028760938632182, "percentage": 24.03, "elapsed_time": "10:12:01", "remaining_time": "1 day, 8:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4312, "total_steps": 17941, "loss": 1.6876, "learning_rate": 8.777183663383896e-05, "epoch": 0.24034334763948498, "percentage": 24.03, "elapsed_time": "10:12:09", "remaining_time": "1 day, 8:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4313, "total_steps": 17941, "loss": 1.7538, "learning_rate": 8.776600178697402e-05, "epoch": 0.24039908589264813, "percentage": 24.04, "elapsed_time": "10:12:18", "remaining_time": "1 day, 8:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4314, "total_steps": 17941, "loss": 1.7722, "learning_rate": 8.776016574239171e-05, "epoch": 0.24045482414581126, "percentage": 24.05, "elapsed_time": "10:12:26", "remaining_time": "1 day, 8:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4315, "total_steps": 17941, "loss": 1.8447, "learning_rate": 8.77543285002771e-05, "epoch": 0.24051056239897442, "percentage": 24.05, "elapsed_time": "10:12:35", "remaining_time": "1 day, 8:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4316, "total_steps": 17941, "loss": 2.111, "learning_rate": 8.774849006081529e-05, "epoch": 0.24056630065213755, "percentage": 24.06, "elapsed_time": "10:12:43", "remaining_time": "1 day, 8:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4317, "total_steps": 17941, "loss": 1.9022, "learning_rate": 8.774265042419148e-05, "epoch": 0.2406220389053007, "percentage": 24.06, "elapsed_time": "10:12:52", "remaining_time": "1 day, 8:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4318, "total_steps": 17941, "loss": 1.4723, "learning_rate": 8.773680959059086e-05, "epoch": 0.24067777715846386, "percentage": 24.07, "elapsed_time": "10:13:00", "remaining_time": "1 day, 8:14:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4319, "total_steps": 17941, "loss": 1.8138, "learning_rate": 8.773096756019866e-05, "epoch": 0.240733515411627, "percentage": 24.07, "elapsed_time": "10:13:09", "remaining_time": "1 day, 8:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4320, "total_steps": 17941, "loss": 1.5152, "learning_rate": 8.772512433320014e-05, "epoch": 0.24078925366479015, "percentage": 24.08, "elapsed_time": "10:13:17", "remaining_time": "1 day, 8:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4321, "total_steps": 17941, "loss": 1.7373, "learning_rate": 8.771927990978063e-05, "epoch": 0.2408449919179533, "percentage": 24.08, "elapsed_time": "10:13:26", "remaining_time": "1 day, 8:13:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4322, "total_steps": 17941, "loss": 1.3736, "learning_rate": 8.771343429012549e-05, "epoch": 0.24090073017111643, "percentage": 24.09, "elapsed_time": "10:13:34", "remaining_time": "1 day, 8:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4323, "total_steps": 17941, "loss": 1.7854, "learning_rate": 8.77075874744201e-05, "epoch": 0.2409564684242796, "percentage": 24.1, "elapsed_time": "10:13:43", "remaining_time": "1 day, 8:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4324, "total_steps": 17941, "loss": 1.9596, "learning_rate": 8.770173946284987e-05, "epoch": 0.24101220667744272, "percentage": 24.1, "elapsed_time": "10:13:51", "remaining_time": "1 day, 8:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4325, "total_steps": 17941, "loss": 1.6905, "learning_rate": 8.76958902556003e-05, "epoch": 0.24106794493060588, "percentage": 24.11, "elapsed_time": "10:14:00", "remaining_time": "1 day, 8:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4326, "total_steps": 17941, "loss": 1.8015, "learning_rate": 8.769003985285686e-05, "epoch": 0.24112368318376903, "percentage": 24.11, "elapsed_time": "10:14:09", "remaining_time": "1 day, 8:12:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4327, "total_steps": 17941, "loss": 1.7408, "learning_rate": 8.76841882548051e-05, "epoch": 0.24117942143693216, "percentage": 24.12, "elapsed_time": "10:14:17", "remaining_time": "1 day, 8:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4328, "total_steps": 17941, "loss": 1.6473, "learning_rate": 8.767833546163062e-05, "epoch": 0.24123515969009532, "percentage": 24.12, "elapsed_time": "10:14:26", "remaining_time": "1 day, 8:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4329, "total_steps": 17941, "loss": 1.724, "learning_rate": 8.767248147351902e-05, "epoch": 0.24129089794325845, "percentage": 24.13, "elapsed_time": "10:14:35", "remaining_time": "1 day, 8:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4330, "total_steps": 17941, "loss": 1.7469, "learning_rate": 8.766662629065594e-05, "epoch": 0.2413466361964216, "percentage": 24.13, "elapsed_time": "10:14:44", "remaining_time": "1 day, 8:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4331, "total_steps": 17941, "loss": 1.7262, "learning_rate": 8.76607699132271e-05, "epoch": 0.24140237444958476, "percentage": 24.14, "elapsed_time": "10:14:52", "remaining_time": "1 day, 8:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4332, "total_steps": 17941, "loss": 2.0055, "learning_rate": 8.76549123414182e-05, "epoch": 0.2414581127027479, "percentage": 24.15, "elapsed_time": "10:15:01", "remaining_time": "1 day, 8:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4333, "total_steps": 17941, "loss": 1.7602, "learning_rate": 8.764905357541505e-05, "epoch": 0.24151385095591105, "percentage": 24.15, "elapsed_time": "10:15:09", "remaining_time": "1 day, 8:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4334, "total_steps": 17941, "loss": 1.7666, "learning_rate": 8.76431936154034e-05, "epoch": 0.24156958920907418, "percentage": 24.16, "elapsed_time": "10:15:18", "remaining_time": "1 day, 8:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4335, "total_steps": 17941, "loss": 1.5892, "learning_rate": 8.763733246156913e-05, "epoch": 0.24162532746223733, "percentage": 24.16, "elapsed_time": "10:15:27", "remaining_time": "1 day, 8:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4336, "total_steps": 17941, "loss": 1.9398, "learning_rate": 8.763147011409811e-05, "epoch": 0.2416810657154005, "percentage": 24.17, "elapsed_time": "10:15:35", "remaining_time": "1 day, 8:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4337, "total_steps": 17941, "loss": 1.4019, "learning_rate": 8.762560657317629e-05, "epoch": 0.24173680396856362, "percentage": 24.17, "elapsed_time": "10:15:44", "remaining_time": "1 day, 8:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4338, "total_steps": 17941, "loss": 1.7063, "learning_rate": 8.761974183898957e-05, "epoch": 0.24179254222172678, "percentage": 24.18, "elapsed_time": "10:15:53", "remaining_time": "1 day, 8:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4339, "total_steps": 17941, "loss": 1.7957, "learning_rate": 8.7613875911724e-05, "epoch": 0.2418482804748899, "percentage": 24.18, "elapsed_time": "10:16:01", "remaining_time": "1 day, 8:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4340, "total_steps": 17941, "loss": 1.5686, "learning_rate": 8.760800879156558e-05, "epoch": 0.24190401872805306, "percentage": 24.19, "elapsed_time": "10:16:10", "remaining_time": "1 day, 8:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4341, "total_steps": 17941, "loss": 2.0046, "learning_rate": 8.760214047870039e-05, "epoch": 0.24195975698121622, "percentage": 24.2, "elapsed_time": "10:16:18", "remaining_time": "1 day, 8:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4342, "total_steps": 17941, "loss": 1.6902, "learning_rate": 8.759627097331455e-05, "epoch": 0.24201549523437935, "percentage": 24.2, "elapsed_time": "10:16:26", "remaining_time": "1 day, 8:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4343, "total_steps": 17941, "loss": 1.9046, "learning_rate": 8.759040027559418e-05, "epoch": 0.2420712334875425, "percentage": 24.21, "elapsed_time": "10:16:35", "remaining_time": "1 day, 8:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4344, "total_steps": 17941, "loss": 1.7593, "learning_rate": 8.758452838572551e-05, "epoch": 0.24212697174070566, "percentage": 24.21, "elapsed_time": "10:16:44", "remaining_time": "1 day, 8:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4345, "total_steps": 17941, "loss": 2.0021, "learning_rate": 8.75786553038947e-05, "epoch": 0.2421827099938688, "percentage": 24.22, "elapsed_time": "10:16:52", "remaining_time": "1 day, 8:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4346, "total_steps": 17941, "loss": 1.1718, "learning_rate": 8.757278103028806e-05, "epoch": 0.24223844824703195, "percentage": 24.22, "elapsed_time": "10:17:00", "remaining_time": "1 day, 8:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4347, "total_steps": 17941, "loss": 1.6083, "learning_rate": 8.756690556509186e-05, "epoch": 0.24229418650019507, "percentage": 24.23, "elapsed_time": "10:17:09", "remaining_time": "1 day, 8:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4348, "total_steps": 17941, "loss": 1.6982, "learning_rate": 8.756102890849246e-05, "epoch": 0.24234992475335823, "percentage": 24.23, "elapsed_time": "10:17:18", "remaining_time": "1 day, 8:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4349, "total_steps": 17941, "loss": 1.8505, "learning_rate": 8.75551510606762e-05, "epoch": 0.2424056630065214, "percentage": 24.24, "elapsed_time": "10:17:26", "remaining_time": "1 day, 8:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4350, "total_steps": 17941, "loss": 1.8455, "learning_rate": 8.754927202182953e-05, "epoch": 0.24246140125968452, "percentage": 24.25, "elapsed_time": "10:17:35", "remaining_time": "1 day, 8:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4351, "total_steps": 17941, "loss": 1.5964, "learning_rate": 8.754339179213886e-05, "epoch": 0.24251713951284767, "percentage": 24.25, "elapsed_time": "10:17:43", "remaining_time": "1 day, 8:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4352, "total_steps": 17941, "loss": 1.7428, "learning_rate": 8.753751037179073e-05, "epoch": 0.2425728777660108, "percentage": 24.26, "elapsed_time": "10:17:52", "remaining_time": "1 day, 8:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4353, "total_steps": 17941, "loss": 1.7279, "learning_rate": 8.75316277609716e-05, "epoch": 0.24262861601917396, "percentage": 24.26, "elapsed_time": "10:18:00", "remaining_time": "1 day, 8:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4354, "total_steps": 17941, "loss": 1.508, "learning_rate": 8.752574395986806e-05, "epoch": 0.24268435427233712, "percentage": 24.27, "elapsed_time": "10:18:09", "remaining_time": "1 day, 8:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4355, "total_steps": 17941, "loss": 1.8978, "learning_rate": 8.751985896866672e-05, "epoch": 0.24274009252550025, "percentage": 24.27, "elapsed_time": "10:18:17", "remaining_time": "1 day, 8:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4356, "total_steps": 17941, "loss": 1.94, "learning_rate": 8.75139727875542e-05, "epoch": 0.2427958307786634, "percentage": 24.28, "elapsed_time": "10:18:26", "remaining_time": "1 day, 8:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4357, "total_steps": 17941, "loss": 1.9239, "learning_rate": 8.75080854167172e-05, "epoch": 0.24285156903182653, "percentage": 24.29, "elapsed_time": "10:18:34", "remaining_time": "1 day, 8:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4358, "total_steps": 17941, "loss": 1.6965, "learning_rate": 8.75021968563424e-05, "epoch": 0.2429073072849897, "percentage": 24.29, "elapsed_time": "10:18:43", "remaining_time": "1 day, 8:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4359, "total_steps": 17941, "loss": 1.7979, "learning_rate": 8.749630710661658e-05, "epoch": 0.24296304553815284, "percentage": 24.3, "elapsed_time": "10:18:51", "remaining_time": "1 day, 8:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4360, "total_steps": 17941, "loss": 1.753, "learning_rate": 8.749041616772653e-05, "epoch": 0.24301878379131597, "percentage": 24.3, "elapsed_time": "10:19:00", "remaining_time": "1 day, 8:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4361, "total_steps": 17941, "loss": 1.518, "learning_rate": 8.748452403985905e-05, "epoch": 0.24307452204447913, "percentage": 24.31, "elapsed_time": "10:19:08", "remaining_time": "1 day, 8:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4362, "total_steps": 17941, "loss": 1.7267, "learning_rate": 8.747863072320102e-05, "epoch": 0.24313026029764226, "percentage": 24.31, "elapsed_time": "10:19:17", "remaining_time": "1 day, 8:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4363, "total_steps": 17941, "loss": 1.6697, "learning_rate": 8.747273621793932e-05, "epoch": 0.24318599855080542, "percentage": 24.32, "elapsed_time": "10:19:25", "remaining_time": "1 day, 8:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4364, "total_steps": 17941, "loss": 1.628, "learning_rate": 8.746684052426093e-05, "epoch": 0.24324173680396857, "percentage": 24.32, "elapsed_time": "10:19:34", "remaining_time": "1 day, 8:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4365, "total_steps": 17941, "loss": 1.8611, "learning_rate": 8.74609436423528e-05, "epoch": 0.2432974750571317, "percentage": 24.33, "elapsed_time": "10:19:43", "remaining_time": "1 day, 8:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4366, "total_steps": 17941, "loss": 1.8587, "learning_rate": 8.745504557240195e-05, "epoch": 0.24335321331029486, "percentage": 24.34, "elapsed_time": "10:19:51", "remaining_time": "1 day, 8:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4367, "total_steps": 17941, "loss": 1.82, "learning_rate": 8.744914631459544e-05, "epoch": 0.24340895156345801, "percentage": 24.34, "elapsed_time": "10:20:00", "remaining_time": "1 day, 8:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4368, "total_steps": 17941, "loss": 1.5662, "learning_rate": 8.744324586912033e-05, "epoch": 0.24346468981662114, "percentage": 24.35, "elapsed_time": "10:20:09", "remaining_time": "1 day, 8:07:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4369, "total_steps": 17941, "loss": 1.618, "learning_rate": 8.74373442361638e-05, "epoch": 0.2435204280697843, "percentage": 24.35, "elapsed_time": "10:20:18", "remaining_time": "1 day, 8:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4370, "total_steps": 17941, "loss": 1.6436, "learning_rate": 8.743144141591297e-05, "epoch": 0.24357616632294743, "percentage": 24.36, "elapsed_time": "10:20:26", "remaining_time": "1 day, 8:06:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4371, "total_steps": 17941, "loss": 1.9764, "learning_rate": 8.742553740855506e-05, "epoch": 0.2436319045761106, "percentage": 24.36, "elapsed_time": "10:20:35", "remaining_time": "1 day, 8:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4372, "total_steps": 17941, "loss": 1.4643, "learning_rate": 8.741963221427732e-05, "epoch": 0.24368764282927374, "percentage": 24.37, "elapsed_time": "10:20:43", "remaining_time": "1 day, 8:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4373, "total_steps": 17941, "loss": 1.7132, "learning_rate": 8.7413725833267e-05, "epoch": 0.24374338108243687, "percentage": 24.37, "elapsed_time": "10:20:52", "remaining_time": "1 day, 8:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4374, "total_steps": 17941, "loss": 1.613, "learning_rate": 8.740781826571144e-05, "epoch": 0.24379911933560003, "percentage": 24.38, "elapsed_time": "10:21:00", "remaining_time": "1 day, 8:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4375, "total_steps": 17941, "loss": 1.7225, "learning_rate": 8.740190951179799e-05, "epoch": 0.24385485758876316, "percentage": 24.39, "elapsed_time": "10:21:09", "remaining_time": "1 day, 8:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4376, "total_steps": 17941, "loss": 1.7796, "learning_rate": 8.739599957171404e-05, "epoch": 0.24391059584192631, "percentage": 24.39, "elapsed_time": "10:21:18", "remaining_time": "1 day, 8:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4377, "total_steps": 17941, "loss": 1.8918, "learning_rate": 8.7390088445647e-05, "epoch": 0.24396633409508947, "percentage": 24.4, "elapsed_time": "10:21:26", "remaining_time": "1 day, 8:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4378, "total_steps": 17941, "loss": 1.6408, "learning_rate": 8.738417613378439e-05, "epoch": 0.2440220723482526, "percentage": 24.4, "elapsed_time": "10:21:34", "remaining_time": "1 day, 8:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4379, "total_steps": 17941, "loss": 1.5007, "learning_rate": 8.737826263631363e-05, "epoch": 0.24407781060141576, "percentage": 24.41, "elapsed_time": "10:21:43", "remaining_time": "1 day, 8:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4380, "total_steps": 17941, "loss": 1.8818, "learning_rate": 8.737826263631363e-05, "epoch": 0.24413354885457889, "percentage": 24.41, "elapsed_time": "10:21:51", "remaining_time": "1 day, 8:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4381, "total_steps": 17941, "loss": 1.6008, "learning_rate": 8.737234795342234e-05, "epoch": 0.24418928710774204, "percentage": 24.42, "elapsed_time": "10:22:00", "remaining_time": "1 day, 8:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4382, "total_steps": 17941, "loss": 1.5589, "learning_rate": 8.736643208529807e-05, "epoch": 0.2442450253609052, "percentage": 24.42, "elapsed_time": "10:22:08", "remaining_time": "1 day, 8:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4383, "total_steps": 17941, "loss": 1.8349, "learning_rate": 8.736051503212843e-05, "epoch": 0.24430076361406833, "percentage": 24.43, "elapsed_time": "10:22:17", "remaining_time": "1 day, 8:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4384, "total_steps": 17941, "loss": 1.6444, "learning_rate": 8.735459679410108e-05, "epoch": 0.24435650186723148, "percentage": 24.44, "elapsed_time": "10:22:25", "remaining_time": "1 day, 8:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4385, "total_steps": 17941, "loss": 1.5685, "learning_rate": 8.734867737140371e-05, "epoch": 0.2444122401203946, "percentage": 24.44, "elapsed_time": "10:22:34", "remaining_time": "1 day, 8:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4386, "total_steps": 17941, "loss": 1.7138, "learning_rate": 8.734275676422406e-05, "epoch": 0.24446797837355777, "percentage": 24.45, "elapsed_time": "10:22:43", "remaining_time": "1 day, 8:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4387, "total_steps": 17941, "loss": 1.8035, "learning_rate": 8.73368349727499e-05, "epoch": 0.24452371662672093, "percentage": 24.45, "elapsed_time": "10:22:51", "remaining_time": "1 day, 8:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4388, "total_steps": 17941, "loss": 1.7692, "learning_rate": 8.733091199716899e-05, "epoch": 0.24457945487988406, "percentage": 24.46, "elapsed_time": "10:23:00", "remaining_time": "1 day, 8:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4389, "total_steps": 17941, "loss": 1.7145, "learning_rate": 8.732498783766923e-05, "epoch": 0.2446351931330472, "percentage": 24.46, "elapsed_time": "10:23:09", "remaining_time": "1 day, 8:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4390, "total_steps": 17941, "loss": 1.3759, "learning_rate": 8.731906249443847e-05, "epoch": 0.24469093138621037, "percentage": 24.47, "elapsed_time": "10:23:17", "remaining_time": "1 day, 8:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4391, "total_steps": 17941, "loss": 1.6403, "learning_rate": 8.731313596766461e-05, "epoch": 0.2447466696393735, "percentage": 24.47, "elapsed_time": "10:23:26", "remaining_time": "1 day, 8:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4392, "total_steps": 17941, "loss": 1.7304, "learning_rate": 8.730720825753567e-05, "epoch": 0.24480240789253666, "percentage": 24.48, "elapsed_time": "10:23:34", "remaining_time": "1 day, 8:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4393, "total_steps": 17941, "loss": 1.7039, "learning_rate": 8.730127936423957e-05, "epoch": 0.24485814614569978, "percentage": 24.49, "elapsed_time": "10:23:43", "remaining_time": "1 day, 8:03:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4394, "total_steps": 17941, "loss": 1.87, "learning_rate": 8.729534928796438e-05, "epoch": 0.24491388439886294, "percentage": 24.49, "elapsed_time": "10:23:52", "remaining_time": "1 day, 8:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4395, "total_steps": 17941, "loss": 1.6194, "learning_rate": 8.728941802889816e-05, "epoch": 0.2449696226520261, "percentage": 24.5, "elapsed_time": "10:24:00", "remaining_time": "1 day, 8:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4396, "total_steps": 17941, "loss": 1.6804, "learning_rate": 8.728348558722901e-05, "epoch": 0.24502536090518923, "percentage": 24.5, "elapsed_time": "10:24:09", "remaining_time": "1 day, 8:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4397, "total_steps": 17941, "loss": 1.5289, "learning_rate": 8.727755196314507e-05, "epoch": 0.24508109915835238, "percentage": 24.51, "elapsed_time": "10:24:17", "remaining_time": "1 day, 8:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4398, "total_steps": 17941, "loss": 1.7488, "learning_rate": 8.727161715683452e-05, "epoch": 0.2451368374115155, "percentage": 24.51, "elapsed_time": "10:24:26", "remaining_time": "1 day, 8:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4399, "total_steps": 17941, "loss": 1.4552, "learning_rate": 8.726568116848559e-05, "epoch": 0.24519257566467867, "percentage": 24.52, "elapsed_time": "10:24:34", "remaining_time": "1 day, 8:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4400, "total_steps": 17941, "loss": 1.8822, "learning_rate": 8.725974399828653e-05, "epoch": 0.24524831391784183, "percentage": 24.52, "elapsed_time": "10:24:43", "remaining_time": "1 day, 8:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4401, "total_steps": 17941, "loss": 1.7286, "learning_rate": 8.725380564642563e-05, "epoch": 0.24530405217100495, "percentage": 24.53, "elapsed_time": "10:24:52", "remaining_time": "1 day, 8:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4402, "total_steps": 17941, "loss": 1.5182, "learning_rate": 8.724786611309123e-05, "epoch": 0.2453597904241681, "percentage": 24.54, "elapsed_time": "10:25:00", "remaining_time": "1 day, 8:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4403, "total_steps": 17941, "loss": 1.7967, "learning_rate": 8.724192539847167e-05, "epoch": 0.24541552867733124, "percentage": 24.54, "elapsed_time": "10:25:09", "remaining_time": "1 day, 8:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4404, "total_steps": 17941, "loss": 1.8081, "learning_rate": 8.723598350275537e-05, "epoch": 0.2454712669304944, "percentage": 24.55, "elapsed_time": "10:25:18", "remaining_time": "1 day, 8:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4405, "total_steps": 17941, "loss": 1.8369, "learning_rate": 8.723004042613079e-05, "epoch": 0.24552700518365755, "percentage": 24.55, "elapsed_time": "10:25:26", "remaining_time": "1 day, 8:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4406, "total_steps": 17941, "loss": 1.6556, "learning_rate": 8.722409616878637e-05, "epoch": 0.24558274343682068, "percentage": 24.56, "elapsed_time": "10:25:35", "remaining_time": "1 day, 8:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4407, "total_steps": 17941, "loss": 1.5745, "learning_rate": 8.721815073091068e-05, "epoch": 0.24563848168998384, "percentage": 24.56, "elapsed_time": "10:25:44", "remaining_time": "1 day, 8:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4408, "total_steps": 17941, "loss": 1.8282, "learning_rate": 8.721220411269222e-05, "epoch": 0.24569421994314697, "percentage": 24.57, "elapsed_time": "10:25:52", "remaining_time": "1 day, 8:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4409, "total_steps": 17941, "loss": 1.6782, "learning_rate": 8.720625631431963e-05, "epoch": 0.24574995819631013, "percentage": 24.57, "elapsed_time": "10:26:01", "remaining_time": "1 day, 8:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4410, "total_steps": 17941, "loss": 1.7703, "learning_rate": 8.72003073359815e-05, "epoch": 0.24580569644947328, "percentage": 24.58, "elapsed_time": "10:26:09", "remaining_time": "1 day, 8:01:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4411, "total_steps": 17941, "loss": 1.4931, "learning_rate": 8.719435717786653e-05, "epoch": 0.2458614347026364, "percentage": 24.59, "elapsed_time": "10:26:18", "remaining_time": "1 day, 8:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4412, "total_steps": 17941, "loss": 1.8267, "learning_rate": 8.718840584016339e-05, "epoch": 0.24591717295579957, "percentage": 24.59, "elapsed_time": "10:26:26", "remaining_time": "1 day, 8:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4413, "total_steps": 17941, "loss": 1.7073, "learning_rate": 8.718245332306086e-05, "epoch": 0.24597291120896272, "percentage": 24.6, "elapsed_time": "10:26:35", "remaining_time": "1 day, 8:00:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4414, "total_steps": 17941, "loss": 1.7481, "learning_rate": 8.717649962674768e-05, "epoch": 0.24602864946212585, "percentage": 24.6, "elapsed_time": "10:26:43", "remaining_time": "1 day, 8:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4415, "total_steps": 17941, "loss": 1.4674, "learning_rate": 8.71705447514127e-05, "epoch": 0.246084387715289, "percentage": 24.61, "elapsed_time": "10:26:52", "remaining_time": "1 day, 8:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4416, "total_steps": 17941, "loss": 1.7044, "learning_rate": 8.716458869724475e-05, "epoch": 0.24614012596845214, "percentage": 24.61, "elapsed_time": "10:27:01", "remaining_time": "1 day, 8:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4417, "total_steps": 17941, "loss": 1.9216, "learning_rate": 8.715863146443273e-05, "epoch": 0.2461958642216153, "percentage": 24.62, "elapsed_time": "10:27:09", "remaining_time": "1 day, 8:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4418, "total_steps": 17941, "loss": 1.3814, "learning_rate": 8.715267305316558e-05, "epoch": 0.24625160247477845, "percentage": 24.63, "elapsed_time": "10:27:18", "remaining_time": "1 day, 8:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4419, "total_steps": 17941, "loss": 1.7245, "learning_rate": 8.714671346363226e-05, "epoch": 0.24630734072794158, "percentage": 24.63, "elapsed_time": "10:27:26", "remaining_time": "1 day, 7:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4420, "total_steps": 17941, "loss": 1.7225, "learning_rate": 8.714075269602176e-05, "epoch": 0.24636307898110474, "percentage": 24.64, "elapsed_time": "10:27:35", "remaining_time": "1 day, 7:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4421, "total_steps": 17941, "loss": 1.637, "learning_rate": 8.713479075052312e-05, "epoch": 0.24641881723426787, "percentage": 24.64, "elapsed_time": "10:27:43", "remaining_time": "1 day, 7:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4422, "total_steps": 17941, "loss": 2.0957, "learning_rate": 8.712882762732543e-05, "epoch": 0.24647455548743102, "percentage": 24.65, "elapsed_time": "10:27:52", "remaining_time": "1 day, 7:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4423, "total_steps": 17941, "loss": 1.8551, "learning_rate": 8.712286332661783e-05, "epoch": 0.24653029374059418, "percentage": 24.65, "elapsed_time": "10:28:00", "remaining_time": "1 day, 7:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4424, "total_steps": 17941, "loss": 2.0364, "learning_rate": 8.711689784858943e-05, "epoch": 0.2465860319937573, "percentage": 24.66, "elapsed_time": "10:28:09", "remaining_time": "1 day, 7:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4425, "total_steps": 17941, "loss": 1.9078, "learning_rate": 8.711093119342944e-05, "epoch": 0.24664177024692047, "percentage": 24.66, "elapsed_time": "10:28:17", "remaining_time": "1 day, 7:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4426, "total_steps": 17941, "loss": 1.7235, "learning_rate": 8.710496336132707e-05, "epoch": 0.2466975085000836, "percentage": 24.67, "elapsed_time": "10:28:26", "remaining_time": "1 day, 7:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4427, "total_steps": 17941, "loss": 1.5281, "learning_rate": 8.709899435247162e-05, "epoch": 0.24675324675324675, "percentage": 24.68, "elapsed_time": "10:28:34", "remaining_time": "1 day, 7:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4428, "total_steps": 17941, "loss": 1.6194, "learning_rate": 8.709302416705235e-05, "epoch": 0.2468089850064099, "percentage": 24.68, "elapsed_time": "10:28:43", "remaining_time": "1 day, 7:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4429, "total_steps": 17941, "loss": 1.8987, "learning_rate": 8.708705280525863e-05, "epoch": 0.24686472325957304, "percentage": 24.69, "elapsed_time": "10:28:51", "remaining_time": "1 day, 7:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4430, "total_steps": 17941, "loss": 1.8762, "learning_rate": 8.708108026727983e-05, "epoch": 0.2469204615127362, "percentage": 24.69, "elapsed_time": "10:29:00", "remaining_time": "1 day, 7:58:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4431, "total_steps": 17941, "loss": 1.7246, "learning_rate": 8.707510655330535e-05, "epoch": 0.24697619976589932, "percentage": 24.7, "elapsed_time": "10:29:08", "remaining_time": "1 day, 7:58:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4432, "total_steps": 17941, "loss": 1.7012, "learning_rate": 8.706913166352468e-05, "epoch": 0.24703193801906248, "percentage": 24.7, "elapsed_time": "10:29:17", "remaining_time": "1 day, 7:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4433, "total_steps": 17941, "loss": 1.6476, "learning_rate": 8.706315559812725e-05, "epoch": 0.24708767627222564, "percentage": 24.71, "elapsed_time": "10:29:25", "remaining_time": "1 day, 7:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4434, "total_steps": 17941, "loss": 1.7085, "learning_rate": 8.705717835730263e-05, "epoch": 0.24714341452538877, "percentage": 24.71, "elapsed_time": "10:29:34", "remaining_time": "1 day, 7:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4435, "total_steps": 17941, "loss": 1.6553, "learning_rate": 8.705119994124038e-05, "epoch": 0.24719915277855192, "percentage": 24.72, "elapsed_time": "10:29:42", "remaining_time": "1 day, 7:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4436, "total_steps": 17941, "loss": 1.9495, "learning_rate": 8.70452203501301e-05, "epoch": 0.24725489103171508, "percentage": 24.73, "elapsed_time": "10:29:51", "remaining_time": "1 day, 7:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4437, "total_steps": 17941, "loss": 1.6201, "learning_rate": 8.703923958416141e-05, "epoch": 0.2473106292848782, "percentage": 24.73, "elapsed_time": "10:29:59", "remaining_time": "1 day, 7:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4438, "total_steps": 17941, "loss": 1.6372, "learning_rate": 8.703325764352397e-05, "epoch": 0.24736636753804137, "percentage": 24.74, "elapsed_time": "10:30:08", "remaining_time": "1 day, 7:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4439, "total_steps": 17941, "loss": 1.7135, "learning_rate": 8.702727452840753e-05, "epoch": 0.2474221057912045, "percentage": 24.74, "elapsed_time": "10:30:16", "remaining_time": "1 day, 7:57:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4440, "total_steps": 17941, "loss": 1.7636, "learning_rate": 8.702129023900184e-05, "epoch": 0.24747784404436765, "percentage": 24.75, "elapsed_time": "10:30:25", "remaining_time": "1 day, 7:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4441, "total_steps": 17941, "loss": 1.7144, "learning_rate": 8.701530477549666e-05, "epoch": 0.2475335822975308, "percentage": 24.75, "elapsed_time": "10:30:33", "remaining_time": "1 day, 7:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4442, "total_steps": 17941, "loss": 1.7915, "learning_rate": 8.700931813808182e-05, "epoch": 0.24758932055069394, "percentage": 24.76, "elapsed_time": "10:30:42", "remaining_time": "1 day, 7:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4443, "total_steps": 17941, "loss": 1.8956, "learning_rate": 8.700333032694721e-05, "epoch": 0.2476450588038571, "percentage": 24.76, "elapsed_time": "10:30:50", "remaining_time": "1 day, 7:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4444, "total_steps": 17941, "loss": 2.0, "learning_rate": 8.69973413422827e-05, "epoch": 0.24770079705702022, "percentage": 24.77, "elapsed_time": "10:30:59", "remaining_time": "1 day, 7:56:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4445, "total_steps": 17941, "loss": 1.7215, "learning_rate": 8.699135118427821e-05, "epoch": 0.24775653531018338, "percentage": 24.78, "elapsed_time": "10:31:07", "remaining_time": "1 day, 7:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4446, "total_steps": 17941, "loss": 1.5958, "learning_rate": 8.698535985312376e-05, "epoch": 0.24781227356334654, "percentage": 24.78, "elapsed_time": "10:31:16", "remaining_time": "1 day, 7:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4447, "total_steps": 17941, "loss": 1.7741, "learning_rate": 8.697936734900932e-05, "epoch": 0.24786801181650966, "percentage": 24.79, "elapsed_time": "10:31:24", "remaining_time": "1 day, 7:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4448, "total_steps": 17941, "loss": 1.7966, "learning_rate": 8.697337367212496e-05, "epoch": 0.24792375006967282, "percentage": 24.79, "elapsed_time": "10:31:32", "remaining_time": "1 day, 7:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4449, "total_steps": 17941, "loss": 1.8026, "learning_rate": 8.696737882266076e-05, "epoch": 0.24797948832283595, "percentage": 24.8, "elapsed_time": "10:31:41", "remaining_time": "1 day, 7:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4450, "total_steps": 17941, "loss": 1.7823, "learning_rate": 8.696138280080684e-05, "epoch": 0.2480352265759991, "percentage": 24.8, "elapsed_time": "10:31:49", "remaining_time": "1 day, 7:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4451, "total_steps": 17941, "loss": 1.5817, "learning_rate": 8.695538560675334e-05, "epoch": 0.24809096482916226, "percentage": 24.81, "elapsed_time": "10:31:58", "remaining_time": "1 day, 7:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4452, "total_steps": 17941, "loss": 1.8425, "learning_rate": 8.694938724069048e-05, "epoch": 0.2481467030823254, "percentage": 24.81, "elapsed_time": "10:32:07", "remaining_time": "1 day, 7:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4453, "total_steps": 17941, "loss": 1.6939, "learning_rate": 8.69433877028085e-05, "epoch": 0.24820244133548855, "percentage": 24.82, "elapsed_time": "10:32:15", "remaining_time": "1 day, 7:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4454, "total_steps": 17941, "loss": 1.6874, "learning_rate": 8.693738699329765e-05, "epoch": 0.24825817958865168, "percentage": 24.83, "elapsed_time": "10:32:24", "remaining_time": "1 day, 7:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4455, "total_steps": 17941, "loss": 1.7339, "learning_rate": 8.693138511234825e-05, "epoch": 0.24831391784181484, "percentage": 24.83, "elapsed_time": "10:32:32", "remaining_time": "1 day, 7:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4456, "total_steps": 17941, "loss": 1.8301, "learning_rate": 8.692538206015062e-05, "epoch": 0.248369656094978, "percentage": 24.84, "elapsed_time": "10:32:41", "remaining_time": "1 day, 7:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4457, "total_steps": 17941, "loss": 1.7435, "learning_rate": 8.691937783689518e-05, "epoch": 0.24842539434814112, "percentage": 24.84, "elapsed_time": "10:32:49", "remaining_time": "1 day, 7:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4458, "total_steps": 17941, "loss": 1.6348, "learning_rate": 8.691337244277231e-05, "epoch": 0.24848113260130428, "percentage": 24.85, "elapsed_time": "10:32:58", "remaining_time": "1 day, 7:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4459, "total_steps": 17941, "loss": 1.6839, "learning_rate": 8.69073658779725e-05, "epoch": 0.24853687085446743, "percentage": 24.85, "elapsed_time": "10:33:06", "remaining_time": "1 day, 7:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4460, "total_steps": 17941, "loss": 1.7292, "learning_rate": 8.690135814268623e-05, "epoch": 0.24859260910763056, "percentage": 24.86, "elapsed_time": "10:33:15", "remaining_time": "1 day, 7:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4461, "total_steps": 17941, "loss": 1.8113, "learning_rate": 8.689534923710403e-05, "epoch": 0.24864834736079372, "percentage": 24.86, "elapsed_time": "10:33:23", "remaining_time": "1 day, 7:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4462, "total_steps": 17941, "loss": 1.9261, "learning_rate": 8.688933916141647e-05, "epoch": 0.24870408561395685, "percentage": 24.87, "elapsed_time": "10:33:31", "remaining_time": "1 day, 7:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4463, "total_steps": 17941, "loss": 1.8136, "learning_rate": 8.688332791581415e-05, "epoch": 0.24875982386712, "percentage": 24.88, "elapsed_time": "10:33:40", "remaining_time": "1 day, 7:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4464, "total_steps": 17941, "loss": 1.6383, "learning_rate": 8.68773155004877e-05, "epoch": 0.24881556212028316, "percentage": 24.88, "elapsed_time": "10:33:48", "remaining_time": "1 day, 7:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4465, "total_steps": 17941, "loss": 1.7313, "learning_rate": 8.687130191562782e-05, "epoch": 0.2488713003734463, "percentage": 24.89, "elapsed_time": "10:33:57", "remaining_time": "1 day, 7:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4466, "total_steps": 17941, "loss": 1.7355, "learning_rate": 8.686528716142523e-05, "epoch": 0.24892703862660945, "percentage": 24.89, "elapsed_time": "10:34:05", "remaining_time": "1 day, 7:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4467, "total_steps": 17941, "loss": 1.7786, "learning_rate": 8.685927123807065e-05, "epoch": 0.24898277687977258, "percentage": 24.9, "elapsed_time": "10:34:14", "remaining_time": "1 day, 7:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4468, "total_steps": 17941, "loss": 1.8995, "learning_rate": 8.68532541457549e-05, "epoch": 0.24903851513293573, "percentage": 24.9, "elapsed_time": "10:34:22", "remaining_time": "1 day, 7:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4469, "total_steps": 17941, "loss": 1.86, "learning_rate": 8.68472358846688e-05, "epoch": 0.2490942533860989, "percentage": 24.91, "elapsed_time": "10:34:31", "remaining_time": "1 day, 7:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4470, "total_steps": 17941, "loss": 1.803, "learning_rate": 8.684121645500322e-05, "epoch": 0.24914999163926202, "percentage": 24.91, "elapsed_time": "10:34:39", "remaining_time": "1 day, 7:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4471, "total_steps": 17941, "loss": 1.5786, "learning_rate": 8.683519585694903e-05, "epoch": 0.24920572989242518, "percentage": 24.92, "elapsed_time": "10:34:48", "remaining_time": "1 day, 7:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4472, "total_steps": 17941, "loss": 1.8524, "learning_rate": 8.682917409069721e-05, "epoch": 0.2492614681455883, "percentage": 24.93, "elapsed_time": "10:34:56", "remaining_time": "1 day, 7:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4473, "total_steps": 17941, "loss": 1.7891, "learning_rate": 8.682315115643872e-05, "epoch": 0.24931720639875146, "percentage": 24.93, "elapsed_time": "10:35:06", "remaining_time": "1 day, 7:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4474, "total_steps": 17941, "loss": 1.3104, "learning_rate": 8.681712705436455e-05, "epoch": 0.24937294465191462, "percentage": 24.94, "elapsed_time": "10:35:15", "remaining_time": "1 day, 7:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4475, "total_steps": 17941, "loss": 1.7571, "learning_rate": 8.68111017846658e-05, "epoch": 0.24942868290507775, "percentage": 24.94, "elapsed_time": "10:35:23", "remaining_time": "1 day, 7:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4476, "total_steps": 17941, "loss": 1.7915, "learning_rate": 8.68050753475335e-05, "epoch": 0.2494844211582409, "percentage": 24.95, "elapsed_time": "10:35:32", "remaining_time": "1 day, 7:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4477, "total_steps": 17941, "loss": 1.7928, "learning_rate": 8.67990477431588e-05, "epoch": 0.24954015941140403, "percentage": 24.95, "elapsed_time": "10:35:40", "remaining_time": "1 day, 7:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4478, "total_steps": 17941, "loss": 1.6592, "learning_rate": 8.679301897173287e-05, "epoch": 0.2495958976645672, "percentage": 24.96, "elapsed_time": "10:35:49", "remaining_time": "1 day, 7:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4479, "total_steps": 17941, "loss": 1.6482, "learning_rate": 8.678698903344689e-05, "epoch": 0.24965163591773035, "percentage": 24.97, "elapsed_time": "10:35:57", "remaining_time": "1 day, 7:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4480, "total_steps": 17941, "loss": 1.7838, "learning_rate": 8.67809579284921e-05, "epoch": 0.24970737417089348, "percentage": 24.97, "elapsed_time": "10:36:07", "remaining_time": "1 day, 7:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4481, "total_steps": 17941, "loss": 1.7705, "learning_rate": 8.677492565705976e-05, "epoch": 0.24976311242405663, "percentage": 24.98, "elapsed_time": "10:36:15", "remaining_time": "1 day, 7:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4482, "total_steps": 17941, "loss": 1.8349, "learning_rate": 8.676889221934121e-05, "epoch": 0.2498188506772198, "percentage": 24.98, "elapsed_time": "10:36:24", "remaining_time": "1 day, 7:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4483, "total_steps": 17941, "loss": 1.6761, "learning_rate": 8.676285761552775e-05, "epoch": 0.24987458893038292, "percentage": 24.99, "elapsed_time": "10:36:32", "remaining_time": "1 day, 7:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4484, "total_steps": 17941, "loss": 1.6409, "learning_rate": 8.675682184581081e-05, "epoch": 0.24993032718354607, "percentage": 24.99, "elapsed_time": "10:36:41", "remaining_time": "1 day, 7:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4485, "total_steps": 17941, "loss": 1.4604, "learning_rate": 8.67507849103818e-05, "epoch": 0.2499860654367092, "percentage": 25.0, "elapsed_time": "10:36:49", "remaining_time": "1 day, 7:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4486, "total_steps": 17941, "loss": 1.5605, "learning_rate": 8.674474680943215e-05, "epoch": 0.25004180368987233, "percentage": 25.0, "elapsed_time": "10:36:58", "remaining_time": "1 day, 7:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4487, "total_steps": 17941, "loss": 1.625, "learning_rate": 8.673870754315336e-05, "epoch": 0.2500975419430355, "percentage": 25.01, "elapsed_time": "10:37:06", "remaining_time": "1 day, 7:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4488, "total_steps": 17941, "loss": 1.7826, "learning_rate": 8.673266711173698e-05, "epoch": 0.25015328019619865, "percentage": 25.02, "elapsed_time": "10:37:15", "remaining_time": "1 day, 7:50:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4489, "total_steps": 17941, "loss": 1.595, "learning_rate": 8.672662551537457e-05, "epoch": 0.2502090184493618, "percentage": 25.02, "elapsed_time": "10:37:24", "remaining_time": "1 day, 7:50:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4490, "total_steps": 17941, "loss": 1.5468, "learning_rate": 8.672058275425772e-05, "epoch": 0.25026475670252496, "percentage": 25.03, "elapsed_time": "10:37:32", "remaining_time": "1 day, 7:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4491, "total_steps": 17941, "loss": 1.8862, "learning_rate": 8.671453882857808e-05, "epoch": 0.2503204949556881, "percentage": 25.03, "elapsed_time": "10:37:41", "remaining_time": "1 day, 7:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4492, "total_steps": 17941, "loss": 1.6133, "learning_rate": 8.670849373852734e-05, "epoch": 0.2503762332088512, "percentage": 25.04, "elapsed_time": "10:37:49", "remaining_time": "1 day, 7:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4493, "total_steps": 17941, "loss": 1.7045, "learning_rate": 8.670244748429719e-05, "epoch": 0.2504319714620144, "percentage": 25.04, "elapsed_time": "10:37:58", "remaining_time": "1 day, 7:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4494, "total_steps": 17941, "loss": 1.6462, "learning_rate": 8.66964000660794e-05, "epoch": 0.25048770971517753, "percentage": 25.05, "elapsed_time": "10:38:06", "remaining_time": "1 day, 7:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4495, "total_steps": 17941, "loss": 1.5736, "learning_rate": 8.669035148406577e-05, "epoch": 0.25054344796834066, "percentage": 25.05, "elapsed_time": "10:38:15", "remaining_time": "1 day, 7:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4496, "total_steps": 17941, "loss": 1.8931, "learning_rate": 8.668430173844808e-05, "epoch": 0.25059918622150384, "percentage": 25.06, "elapsed_time": "10:38:24", "remaining_time": "1 day, 7:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4497, "total_steps": 17941, "loss": 1.6553, "learning_rate": 8.667825082941826e-05, "epoch": 0.250654924474667, "percentage": 25.07, "elapsed_time": "10:38:33", "remaining_time": "1 day, 7:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4498, "total_steps": 17941, "loss": 1.7692, "learning_rate": 8.667219875716814e-05, "epoch": 0.2507106627278301, "percentage": 25.07, "elapsed_time": "10:38:41", "remaining_time": "1 day, 7:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4499, "total_steps": 17941, "loss": 1.8116, "learning_rate": 8.66661455218897e-05, "epoch": 0.25076640098099323, "percentage": 25.08, "elapsed_time": "10:38:50", "remaining_time": "1 day, 7:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4500, "total_steps": 17941, "loss": 1.938, "learning_rate": 8.666009112377491e-05, "epoch": 0.2508221392341564, "percentage": 25.08, "elapsed_time": "10:38:58", "remaining_time": "1 day, 7:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4501, "total_steps": 17941, "loss": 1.6026, "learning_rate": 8.665403556301576e-05, "epoch": 0.25087787748731954, "percentage": 25.09, "elapsed_time": "10:39:07", "remaining_time": "1 day, 7:48:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4502, "total_steps": 17941, "loss": 1.6589, "learning_rate": 8.664797883980434e-05, "epoch": 0.2509336157404827, "percentage": 25.09, "elapsed_time": "10:39:15", "remaining_time": "1 day, 7:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4503, "total_steps": 17941, "loss": 1.7016, "learning_rate": 8.664192095433266e-05, "epoch": 0.25098935399364586, "percentage": 25.1, "elapsed_time": "10:39:23", "remaining_time": "1 day, 7:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4504, "total_steps": 17941, "loss": 1.8425, "learning_rate": 8.663586190679291e-05, "epoch": 0.251045092246809, "percentage": 25.1, "elapsed_time": "10:39:32", "remaining_time": "1 day, 7:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4505, "total_steps": 17941, "loss": 1.6105, "learning_rate": 8.662980169737723e-05, "epoch": 0.2511008304999721, "percentage": 25.11, "elapsed_time": "10:39:40", "remaining_time": "1 day, 7:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4506, "total_steps": 17941, "loss": 1.9352, "learning_rate": 8.662374032627778e-05, "epoch": 0.2511565687531353, "percentage": 25.12, "elapsed_time": "10:39:49", "remaining_time": "1 day, 7:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4507, "total_steps": 17941, "loss": 1.7867, "learning_rate": 8.661767779368683e-05, "epoch": 0.25121230700629843, "percentage": 25.12, "elapsed_time": "10:39:58", "remaining_time": "1 day, 7:47:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4508, "total_steps": 17941, "loss": 1.6947, "learning_rate": 8.661161409979665e-05, "epoch": 0.25126804525946156, "percentage": 25.13, "elapsed_time": "10:40:06", "remaining_time": "1 day, 7:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4509, "total_steps": 17941, "loss": 1.796, "learning_rate": 8.66055492447995e-05, "epoch": 0.2513237835126247, "percentage": 25.13, "elapsed_time": "10:40:14", "remaining_time": "1 day, 7:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4510, "total_steps": 17941, "loss": 1.6343, "learning_rate": 8.659948322888777e-05, "epoch": 0.25137952176578787, "percentage": 25.14, "elapsed_time": "10:40:23", "remaining_time": "1 day, 7:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4511, "total_steps": 17941, "loss": 1.8057, "learning_rate": 8.659341605225384e-05, "epoch": 0.251435260018951, "percentage": 25.14, "elapsed_time": "10:40:32", "remaining_time": "1 day, 7:46:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4512, "total_steps": 17941, "loss": 1.8123, "learning_rate": 8.65873477150901e-05, "epoch": 0.25149099827211413, "percentage": 25.15, "elapsed_time": "10:40:40", "remaining_time": "1 day, 7:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4513, "total_steps": 17941, "loss": 1.7952, "learning_rate": 8.658127821758899e-05, "epoch": 0.2515467365252773, "percentage": 25.15, "elapsed_time": "10:40:48", "remaining_time": "1 day, 7:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4514, "total_steps": 17941, "loss": 1.8295, "learning_rate": 8.657520755994305e-05, "epoch": 0.25160247477844044, "percentage": 25.16, "elapsed_time": "10:40:57", "remaining_time": "1 day, 7:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4515, "total_steps": 17941, "loss": 1.6294, "learning_rate": 8.656913574234474e-05, "epoch": 0.2516582130316036, "percentage": 25.17, "elapsed_time": "10:41:06", "remaining_time": "1 day, 7:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4516, "total_steps": 17941, "loss": 1.8597, "learning_rate": 8.656306276498667e-05, "epoch": 0.25171395128476676, "percentage": 25.17, "elapsed_time": "10:41:14", "remaining_time": "1 day, 7:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4517, "total_steps": 17941, "loss": 1.7067, "learning_rate": 8.655698862806143e-05, "epoch": 0.2517696895379299, "percentage": 25.18, "elapsed_time": "10:41:23", "remaining_time": "1 day, 7:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4518, "total_steps": 17941, "loss": 1.7043, "learning_rate": 8.655091333176165e-05, "epoch": 0.251825427791093, "percentage": 25.18, "elapsed_time": "10:41:31", "remaining_time": "1 day, 7:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4519, "total_steps": 17941, "loss": 1.7418, "learning_rate": 8.654483687628002e-05, "epoch": 0.2518811660442562, "percentage": 25.19, "elapsed_time": "10:41:39", "remaining_time": "1 day, 7:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4520, "total_steps": 17941, "loss": 1.6442, "learning_rate": 8.65387592618092e-05, "epoch": 0.25193690429741933, "percentage": 25.19, "elapsed_time": "10:41:48", "remaining_time": "1 day, 7:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4521, "total_steps": 17941, "loss": 1.7816, "learning_rate": 8.653268048854201e-05, "epoch": 0.25199264255058246, "percentage": 25.2, "elapsed_time": "10:41:57", "remaining_time": "1 day, 7:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4522, "total_steps": 17941, "loss": 1.5046, "learning_rate": 8.652660055667117e-05, "epoch": 0.2520483808037456, "percentage": 25.2, "elapsed_time": "10:42:05", "remaining_time": "1 day, 7:45:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4523, "total_steps": 17941, "loss": 1.582, "learning_rate": 8.652051946638953e-05, "epoch": 0.25210411905690877, "percentage": 25.21, "elapsed_time": "10:42:13", "remaining_time": "1 day, 7:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4524, "total_steps": 17941, "loss": 1.6199, "learning_rate": 8.651443721788996e-05, "epoch": 0.2521598573100719, "percentage": 25.22, "elapsed_time": "10:42:22", "remaining_time": "1 day, 7:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4525, "total_steps": 17941, "loss": 1.5345, "learning_rate": 8.650835381136533e-05, "epoch": 0.25221559556323503, "percentage": 25.22, "elapsed_time": "10:42:31", "remaining_time": "1 day, 7:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4526, "total_steps": 17941, "loss": 1.6656, "learning_rate": 8.650226924700855e-05, "epoch": 0.2522713338163982, "percentage": 25.23, "elapsed_time": "10:42:39", "remaining_time": "1 day, 7:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4527, "total_steps": 17941, "loss": 1.598, "learning_rate": 8.649618352501264e-05, "epoch": 0.25232707206956134, "percentage": 25.23, "elapsed_time": "10:42:48", "remaining_time": "1 day, 7:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4528, "total_steps": 17941, "loss": 1.3941, "learning_rate": 8.649009664557057e-05, "epoch": 0.25238281032272447, "percentage": 25.24, "elapsed_time": "10:42:56", "remaining_time": "1 day, 7:44:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4529, "total_steps": 17941, "loss": 1.7144, "learning_rate": 8.648400860887538e-05, "epoch": 0.25243854857588766, "percentage": 25.24, "elapsed_time": "10:43:05", "remaining_time": "1 day, 7:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4530, "total_steps": 17941, "loss": 1.8223, "learning_rate": 8.647791941512016e-05, "epoch": 0.2524942868290508, "percentage": 25.25, "elapsed_time": "10:43:13", "remaining_time": "1 day, 7:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4531, "total_steps": 17941, "loss": 1.6577, "learning_rate": 8.6471829064498e-05, "epoch": 0.2525500250822139, "percentage": 25.26, "elapsed_time": "10:43:22", "remaining_time": "1 day, 7:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4532, "total_steps": 17941, "loss": 1.6222, "learning_rate": 8.646573755720209e-05, "epoch": 0.25260576333537704, "percentage": 25.26, "elapsed_time": "10:43:30", "remaining_time": "1 day, 7:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4533, "total_steps": 17941, "loss": 1.8348, "learning_rate": 8.645964489342557e-05, "epoch": 0.2526615015885402, "percentage": 25.27, "elapsed_time": "10:43:39", "remaining_time": "1 day, 7:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4534, "total_steps": 17941, "loss": 1.7095, "learning_rate": 8.645355107336171e-05, "epoch": 0.25271723984170336, "percentage": 25.27, "elapsed_time": "10:43:47", "remaining_time": "1 day, 7:43:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4535, "total_steps": 17941, "loss": 1.9243, "learning_rate": 8.644745609720375e-05, "epoch": 0.2527729780948665, "percentage": 25.28, "elapsed_time": "10:43:56", "remaining_time": "1 day, 7:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4536, "total_steps": 17941, "loss": 1.782, "learning_rate": 8.644135996514498e-05, "epoch": 0.25282871634802967, "percentage": 25.28, "elapsed_time": "10:44:04", "remaining_time": "1 day, 7:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4537, "total_steps": 17941, "loss": 1.6014, "learning_rate": 8.643526267737873e-05, "epoch": 0.2528844546011928, "percentage": 25.29, "elapsed_time": "10:44:13", "remaining_time": "1 day, 7:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4538, "total_steps": 17941, "loss": 1.6435, "learning_rate": 8.642916423409839e-05, "epoch": 0.2529401928543559, "percentage": 25.29, "elapsed_time": "10:44:21", "remaining_time": "1 day, 7:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4539, "total_steps": 17941, "loss": 1.7686, "learning_rate": 8.642306463549736e-05, "epoch": 0.2529959311075191, "percentage": 25.3, "elapsed_time": "10:44:30", "remaining_time": "1 day, 7:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4540, "total_steps": 17941, "loss": 1.8116, "learning_rate": 8.641696388176907e-05, "epoch": 0.25305166936068224, "percentage": 25.31, "elapsed_time": "10:44:39", "remaining_time": "1 day, 7:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4541, "total_steps": 17941, "loss": 1.4985, "learning_rate": 8.641086197310703e-05, "epoch": 0.25310740761384537, "percentage": 25.31, "elapsed_time": "10:44:47", "remaining_time": "1 day, 7:42:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4542, "total_steps": 17941, "loss": 1.7948, "learning_rate": 8.640475890970471e-05, "epoch": 0.25316314586700855, "percentage": 25.32, "elapsed_time": "10:44:56", "remaining_time": "1 day, 7:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4543, "total_steps": 17941, "loss": 1.5825, "learning_rate": 8.639865469175572e-05, "epoch": 0.2532188841201717, "percentage": 25.32, "elapsed_time": "10:45:04", "remaining_time": "1 day, 7:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4544, "total_steps": 17941, "loss": 1.4125, "learning_rate": 8.639254931945362e-05, "epoch": 0.2532746223733348, "percentage": 25.33, "elapsed_time": "10:45:13", "remaining_time": "1 day, 7:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4545, "total_steps": 17941, "loss": 1.6964, "learning_rate": 8.638644279299202e-05, "epoch": 0.25333036062649794, "percentage": 25.33, "elapsed_time": "10:45:21", "remaining_time": "1 day, 7:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4546, "total_steps": 17941, "loss": 1.6725, "learning_rate": 8.638033511256462e-05, "epoch": 0.2533860988796611, "percentage": 25.34, "elapsed_time": "10:45:30", "remaining_time": "1 day, 7:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4547, "total_steps": 17941, "loss": 2.0334, "learning_rate": 8.637422627836509e-05, "epoch": 0.25344183713282425, "percentage": 25.34, "elapsed_time": "10:45:39", "remaining_time": "1 day, 7:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4548, "total_steps": 17941, "loss": 1.6665, "learning_rate": 8.636811629058718e-05, "epoch": 0.2534975753859874, "percentage": 25.35, "elapsed_time": "10:45:47", "remaining_time": "1 day, 7:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4549, "total_steps": 17941, "loss": 1.5875, "learning_rate": 8.636200514942467e-05, "epoch": 0.25355331363915057, "percentage": 25.36, "elapsed_time": "10:45:56", "remaining_time": "1 day, 7:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4550, "total_steps": 17941, "loss": 1.838, "learning_rate": 8.635589285507135e-05, "epoch": 0.2536090518923137, "percentage": 25.36, "elapsed_time": "10:46:04", "remaining_time": "1 day, 7:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4551, "total_steps": 17941, "loss": 1.7802, "learning_rate": 8.634977940772108e-05, "epoch": 0.2536647901454768, "percentage": 25.37, "elapsed_time": "10:46:13", "remaining_time": "1 day, 7:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4552, "total_steps": 17941, "loss": 1.6153, "learning_rate": 8.634366480756774e-05, "epoch": 0.25372052839864, "percentage": 25.37, "elapsed_time": "10:46:21", "remaining_time": "1 day, 7:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4553, "total_steps": 17941, "loss": 1.8255, "learning_rate": 8.633754905480527e-05, "epoch": 0.25377626665180314, "percentage": 25.38, "elapsed_time": "10:46:30", "remaining_time": "1 day, 7:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4554, "total_steps": 17941, "loss": 1.6177, "learning_rate": 8.63314321496276e-05, "epoch": 0.25383200490496627, "percentage": 25.38, "elapsed_time": "10:46:38", "remaining_time": "1 day, 7:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4555, "total_steps": 17941, "loss": 1.8342, "learning_rate": 8.632531409222872e-05, "epoch": 0.2538877431581294, "percentage": 25.39, "elapsed_time": "10:46:47", "remaining_time": "1 day, 7:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4556, "total_steps": 17941, "loss": 1.6217, "learning_rate": 8.631919488280267e-05, "epoch": 0.2539434814112926, "percentage": 25.39, "elapsed_time": "10:46:56", "remaining_time": "1 day, 7:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4557, "total_steps": 17941, "loss": 1.5318, "learning_rate": 8.631307452154352e-05, "epoch": 0.2539992196644557, "percentage": 25.4, "elapsed_time": "10:47:04", "remaining_time": "1 day, 7:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4558, "total_steps": 17941, "loss": 1.7415, "learning_rate": 8.630695300864536e-05, "epoch": 0.25405495791761884, "percentage": 25.41, "elapsed_time": "10:47:14", "remaining_time": "1 day, 7:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4559, "total_steps": 17941, "loss": 1.9215, "learning_rate": 8.630083034430232e-05, "epoch": 0.254110696170782, "percentage": 25.41, "elapsed_time": "10:47:22", "remaining_time": "1 day, 7:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4560, "total_steps": 17941, "loss": 1.5432, "learning_rate": 8.629470652870861e-05, "epoch": 0.25416643442394515, "percentage": 25.42, "elapsed_time": "10:47:30", "remaining_time": "1 day, 7:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4561, "total_steps": 17941, "loss": 1.9161, "learning_rate": 8.628858156205842e-05, "epoch": 0.2542221726771083, "percentage": 25.42, "elapsed_time": "10:47:39", "remaining_time": "1 day, 7:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4562, "total_steps": 17941, "loss": 1.8547, "learning_rate": 8.6282455444546e-05, "epoch": 0.25427791093027147, "percentage": 25.43, "elapsed_time": "10:47:47", "remaining_time": "1 day, 7:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4563, "total_steps": 17941, "loss": 1.3558, "learning_rate": 8.627632817636563e-05, "epoch": 0.2543336491834346, "percentage": 25.43, "elapsed_time": "10:47:56", "remaining_time": "1 day, 7:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4564, "total_steps": 17941, "loss": 1.7991, "learning_rate": 8.627019975771165e-05, "epoch": 0.2543893874365977, "percentage": 25.44, "elapsed_time": "10:48:04", "remaining_time": "1 day, 7:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4565, "total_steps": 17941, "loss": 1.5515, "learning_rate": 8.626407018877837e-05, "epoch": 0.2544451256897609, "percentage": 25.44, "elapsed_time": "10:48:13", "remaining_time": "1 day, 7:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4566, "total_steps": 17941, "loss": 1.7666, "learning_rate": 8.625793946976026e-05, "epoch": 0.25450086394292404, "percentage": 25.45, "elapsed_time": "10:48:21", "remaining_time": "1 day, 7:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4567, "total_steps": 17941, "loss": 1.9701, "learning_rate": 8.625180760085167e-05, "epoch": 0.25455660219608717, "percentage": 25.46, "elapsed_time": "10:48:30", "remaining_time": "1 day, 7:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4568, "total_steps": 17941, "loss": 1.7123, "learning_rate": 8.624567458224713e-05, "epoch": 0.2546123404492503, "percentage": 25.46, "elapsed_time": "10:48:38", "remaining_time": "1 day, 7:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4569, "total_steps": 17941, "loss": 1.8511, "learning_rate": 8.62395404141411e-05, "epoch": 0.2546680787024135, "percentage": 25.47, "elapsed_time": "10:48:47", "remaining_time": "1 day, 7:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4570, "total_steps": 17941, "loss": 1.6913, "learning_rate": 8.623340509672817e-05, "epoch": 0.2547238169555766, "percentage": 25.47, "elapsed_time": "10:48:56", "remaining_time": "1 day, 7:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4571, "total_steps": 17941, "loss": 1.6337, "learning_rate": 8.622726863020285e-05, "epoch": 0.25477955520873974, "percentage": 25.48, "elapsed_time": "10:49:04", "remaining_time": "1 day, 7:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4572, "total_steps": 17941, "loss": 1.8858, "learning_rate": 8.622113101475982e-05, "epoch": 0.2548352934619029, "percentage": 25.48, "elapsed_time": "10:49:13", "remaining_time": "1 day, 7:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4573, "total_steps": 17941, "loss": 1.6353, "learning_rate": 8.621499225059369e-05, "epoch": 0.25489103171506605, "percentage": 25.49, "elapsed_time": "10:49:21", "remaining_time": "1 day, 7:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4574, "total_steps": 17941, "loss": 1.4418, "learning_rate": 8.620885233789914e-05, "epoch": 0.2549467699682292, "percentage": 25.49, "elapsed_time": "10:49:30", "remaining_time": "1 day, 7:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4575, "total_steps": 17941, "loss": 1.7161, "learning_rate": 8.620271127687092e-05, "epoch": 0.25500250822139237, "percentage": 25.5, "elapsed_time": "10:49:38", "remaining_time": "1 day, 7:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4576, "total_steps": 17941, "loss": 1.8467, "learning_rate": 8.619656906770377e-05, "epoch": 0.2550582464745555, "percentage": 25.51, "elapsed_time": "10:49:47", "remaining_time": "1 day, 7:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4577, "total_steps": 17941, "loss": 1.7528, "learning_rate": 8.619042571059248e-05, "epoch": 0.2551139847277186, "percentage": 25.51, "elapsed_time": "10:49:55", "remaining_time": "1 day, 7:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4578, "total_steps": 17941, "loss": 1.5648, "learning_rate": 8.61842812057319e-05, "epoch": 0.25516972298088175, "percentage": 25.52, "elapsed_time": "10:50:04", "remaining_time": "1 day, 7:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4579, "total_steps": 17941, "loss": 1.5093, "learning_rate": 8.617813555331689e-05, "epoch": 0.25522546123404494, "percentage": 25.52, "elapsed_time": "10:50:12", "remaining_time": "1 day, 7:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4580, "total_steps": 17941, "loss": 1.6445, "learning_rate": 8.617198875354235e-05, "epoch": 0.25528119948720807, "percentage": 25.53, "elapsed_time": "10:50:21", "remaining_time": "1 day, 7:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4581, "total_steps": 17941, "loss": 1.6225, "learning_rate": 8.616584080660323e-05, "epoch": 0.2553369377403712, "percentage": 25.53, "elapsed_time": "10:50:29", "remaining_time": "1 day, 7:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4582, "total_steps": 17941, "loss": 1.8017, "learning_rate": 8.615969171269449e-05, "epoch": 0.2553926759935344, "percentage": 25.54, "elapsed_time": "10:50:38", "remaining_time": "1 day, 7:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4583, "total_steps": 17941, "loss": 1.6034, "learning_rate": 8.615354147201116e-05, "epoch": 0.2554484142466975, "percentage": 25.54, "elapsed_time": "10:50:46", "remaining_time": "1 day, 7:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4584, "total_steps": 17941, "loss": 1.481, "learning_rate": 8.614739008474829e-05, "epoch": 0.25550415249986064, "percentage": 25.55, "elapsed_time": "10:50:55", "remaining_time": "1 day, 7:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4585, "total_steps": 17941, "loss": 1.6323, "learning_rate": 8.614123755110096e-05, "epoch": 0.2555598907530238, "percentage": 25.56, "elapsed_time": "10:51:03", "remaining_time": "1 day, 7:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4586, "total_steps": 17941, "loss": 1.4896, "learning_rate": 8.61350838712643e-05, "epoch": 0.25561562900618695, "percentage": 25.56, "elapsed_time": "10:51:12", "remaining_time": "1 day, 7:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4587, "total_steps": 17941, "loss": 1.6488, "learning_rate": 8.612892904543344e-05, "epoch": 0.2556713672593501, "percentage": 25.57, "elapsed_time": "10:51:20", "remaining_time": "1 day, 7:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4588, "total_steps": 17941, "loss": 1.7467, "learning_rate": 8.612277307380361e-05, "epoch": 0.25572710551251326, "percentage": 25.57, "elapsed_time": "10:51:29", "remaining_time": "1 day, 7:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4589, "total_steps": 17941, "loss": 1.4627, "learning_rate": 8.611661595657004e-05, "epoch": 0.2557828437656764, "percentage": 25.58, "elapsed_time": "10:51:39", "remaining_time": "1 day, 7:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4590, "total_steps": 17941, "loss": 1.654, "learning_rate": 8.611045769392796e-05, "epoch": 0.2558385820188395, "percentage": 25.58, "elapsed_time": "10:51:47", "remaining_time": "1 day, 7:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4591, "total_steps": 17941, "loss": 1.6177, "learning_rate": 8.610429828607271e-05, "epoch": 0.25589432027200265, "percentage": 25.59, "elapsed_time": "10:51:55", "remaining_time": "1 day, 7:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4592, "total_steps": 17941, "loss": 1.9184, "learning_rate": 8.609813773319963e-05, "epoch": 0.25595005852516584, "percentage": 25.6, "elapsed_time": "10:52:04", "remaining_time": "1 day, 7:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4593, "total_steps": 17941, "loss": 1.6321, "learning_rate": 8.609197603550409e-05, "epoch": 0.25600579677832896, "percentage": 25.6, "elapsed_time": "10:52:13", "remaining_time": "1 day, 7:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4594, "total_steps": 17941, "loss": 1.6094, "learning_rate": 8.608581319318148e-05, "epoch": 0.2560615350314921, "percentage": 25.61, "elapsed_time": "10:52:22", "remaining_time": "1 day, 7:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4595, "total_steps": 17941, "loss": 1.7111, "learning_rate": 8.607964920642728e-05, "epoch": 0.2561172732846553, "percentage": 25.61, "elapsed_time": "10:52:30", "remaining_time": "1 day, 7:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4596, "total_steps": 17941, "loss": 1.5206, "learning_rate": 8.607348407543699e-05, "epoch": 0.2561730115378184, "percentage": 25.62, "elapsed_time": "10:52:39", "remaining_time": "1 day, 7:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4597, "total_steps": 17941, "loss": 1.9129, "learning_rate": 8.606731780040608e-05, "epoch": 0.25622874979098154, "percentage": 25.62, "elapsed_time": "10:52:48", "remaining_time": "1 day, 7:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4598, "total_steps": 17941, "loss": 1.7739, "learning_rate": 8.606115038153015e-05, "epoch": 0.2562844880441447, "percentage": 25.63, "elapsed_time": "10:52:56", "remaining_time": "1 day, 7:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4599, "total_steps": 17941, "loss": 1.6853, "learning_rate": 8.605498181900477e-05, "epoch": 0.25634022629730785, "percentage": 25.63, "elapsed_time": "10:53:04", "remaining_time": "1 day, 7:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4600, "total_steps": 17941, "loss": 1.8345, "learning_rate": 8.604881211302559e-05, "epoch": 0.256395964550471, "percentage": 25.64, "elapsed_time": "10:53:13", "remaining_time": "1 day, 7:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4601, "total_steps": 17941, "loss": 1.9012, "learning_rate": 8.604264126378827e-05, "epoch": 0.2564517028036341, "percentage": 25.65, "elapsed_time": "10:53:21", "remaining_time": "1 day, 7:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4602, "total_steps": 17941, "loss": 1.5109, "learning_rate": 8.603646927148849e-05, "epoch": 0.2565074410567973, "percentage": 25.65, "elapsed_time": "10:53:30", "remaining_time": "1 day, 7:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4603, "total_steps": 17941, "loss": 1.758, "learning_rate": 8.603029613632205e-05, "epoch": 0.2565631793099604, "percentage": 25.66, "elapsed_time": "10:53:38", "remaining_time": "1 day, 7:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4604, "total_steps": 17941, "loss": 1.6211, "learning_rate": 8.602412185848466e-05, "epoch": 0.25661891756312355, "percentage": 25.66, "elapsed_time": "10:53:47", "remaining_time": "1 day, 7:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4605, "total_steps": 17941, "loss": 1.8896, "learning_rate": 8.601794643817216e-05, "epoch": 0.25667465581628673, "percentage": 25.67, "elapsed_time": "10:53:55", "remaining_time": "1 day, 7:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4606, "total_steps": 17941, "loss": 1.6733, "learning_rate": 8.601176987558041e-05, "epoch": 0.25673039406944986, "percentage": 25.67, "elapsed_time": "10:54:04", "remaining_time": "1 day, 7:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4607, "total_steps": 17941, "loss": 1.824, "learning_rate": 8.600559217090529e-05, "epoch": 0.256786132322613, "percentage": 25.68, "elapsed_time": "10:54:12", "remaining_time": "1 day, 7:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4608, "total_steps": 17941, "loss": 1.7229, "learning_rate": 8.599941332434269e-05, "epoch": 0.2568418705757762, "percentage": 25.68, "elapsed_time": "10:54:21", "remaining_time": "1 day, 7:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4609, "total_steps": 17941, "loss": 1.846, "learning_rate": 8.599323333608861e-05, "epoch": 0.2568976088289393, "percentage": 25.69, "elapsed_time": "10:54:29", "remaining_time": "1 day, 7:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4610, "total_steps": 17941, "loss": 1.7334, "learning_rate": 8.598705220633903e-05, "epoch": 0.25695334708210243, "percentage": 25.7, "elapsed_time": "10:54:38", "remaining_time": "1 day, 7:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4611, "total_steps": 17941, "loss": 1.9449, "learning_rate": 8.598086993528996e-05, "epoch": 0.2570090853352656, "percentage": 25.7, "elapsed_time": "10:54:46", "remaining_time": "1 day, 7:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4612, "total_steps": 17941, "loss": 1.8884, "learning_rate": 8.597468652313747e-05, "epoch": 0.25706482358842875, "percentage": 25.71, "elapsed_time": "10:54:55", "remaining_time": "1 day, 7:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4613, "total_steps": 17941, "loss": 1.6199, "learning_rate": 8.596850197007767e-05, "epoch": 0.2571205618415919, "percentage": 25.71, "elapsed_time": "10:55:03", "remaining_time": "1 day, 7:32:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4614, "total_steps": 17941, "loss": 1.5702, "learning_rate": 8.596231627630671e-05, "epoch": 0.257176300094755, "percentage": 25.72, "elapsed_time": "10:55:12", "remaining_time": "1 day, 7:32:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4615, "total_steps": 17941, "loss": 1.6538, "learning_rate": 8.595612944202076e-05, "epoch": 0.2572320383479182, "percentage": 25.72, "elapsed_time": "10:55:20", "remaining_time": "1 day, 7:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4616, "total_steps": 17941, "loss": 1.79, "learning_rate": 8.5949941467416e-05, "epoch": 0.2572877766010813, "percentage": 25.73, "elapsed_time": "10:55:29", "remaining_time": "1 day, 7:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4617, "total_steps": 17941, "loss": 2.0629, "learning_rate": 8.594375235268872e-05, "epoch": 0.25734351485424445, "percentage": 25.73, "elapsed_time": "10:55:37", "remaining_time": "1 day, 7:32:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4618, "total_steps": 17941, "loss": 1.7105, "learning_rate": 8.593756209803518e-05, "epoch": 0.25739925310740763, "percentage": 25.74, "elapsed_time": "10:55:46", "remaining_time": "1 day, 7:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4619, "total_steps": 17941, "loss": 1.7797, "learning_rate": 8.59313707036517e-05, "epoch": 0.25745499136057076, "percentage": 25.75, "elapsed_time": "10:55:54", "remaining_time": "1 day, 7:31:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4620, "total_steps": 17941, "loss": 1.6879, "learning_rate": 8.592517816973462e-05, "epoch": 0.2575107296137339, "percentage": 25.75, "elapsed_time": "10:56:03", "remaining_time": "1 day, 7:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4621, "total_steps": 17941, "loss": 1.6947, "learning_rate": 8.591898449648035e-05, "epoch": 0.2575664678668971, "percentage": 25.76, "elapsed_time": "10:56:11", "remaining_time": "1 day, 7:31:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4622, "total_steps": 17941, "loss": 1.8276, "learning_rate": 8.591278968408532e-05, "epoch": 0.2576222061200602, "percentage": 25.76, "elapsed_time": "10:56:20", "remaining_time": "1 day, 7:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4623, "total_steps": 17941, "loss": 1.6054, "learning_rate": 8.590659373274599e-05, "epoch": 0.25767794437322333, "percentage": 25.77, "elapsed_time": "10:56:28", "remaining_time": "1 day, 7:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4624, "total_steps": 17941, "loss": 1.612, "learning_rate": 8.590039664265885e-05, "epoch": 0.25773368262638646, "percentage": 25.77, "elapsed_time": "10:56:37", "remaining_time": "1 day, 7:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4625, "total_steps": 17941, "loss": 2.1569, "learning_rate": 8.589419841402047e-05, "epoch": 0.25778942087954965, "percentage": 25.78, "elapsed_time": "10:56:45", "remaining_time": "1 day, 7:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4626, "total_steps": 17941, "loss": 1.4849, "learning_rate": 8.588799904702736e-05, "epoch": 0.2578451591327128, "percentage": 25.78, "elapsed_time": "10:56:54", "remaining_time": "1 day, 7:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4627, "total_steps": 17941, "loss": 1.882, "learning_rate": 8.588179854187616e-05, "epoch": 0.2579008973858759, "percentage": 25.79, "elapsed_time": "10:57:02", "remaining_time": "1 day, 7:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4628, "total_steps": 17941, "loss": 1.7811, "learning_rate": 8.587559689876354e-05, "epoch": 0.2579566356390391, "percentage": 25.8, "elapsed_time": "10:57:11", "remaining_time": "1 day, 7:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4629, "total_steps": 17941, "loss": 1.8589, "learning_rate": 8.586939411788615e-05, "epoch": 0.2580123738922022, "percentage": 25.8, "elapsed_time": "10:57:19", "remaining_time": "1 day, 7:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4630, "total_steps": 17941, "loss": 1.5817, "learning_rate": 8.586319019944071e-05, "epoch": 0.25806811214536535, "percentage": 25.81, "elapsed_time": "10:57:28", "remaining_time": "1 day, 7:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4631, "total_steps": 17941, "loss": 1.4472, "learning_rate": 8.585698514362397e-05, "epoch": 0.25812385039852853, "percentage": 25.81, "elapsed_time": "10:57:36", "remaining_time": "1 day, 7:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4632, "total_steps": 17941, "loss": 1.9396, "learning_rate": 8.585077895063271e-05, "epoch": 0.25817958865169166, "percentage": 25.82, "elapsed_time": "10:57:45", "remaining_time": "1 day, 7:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4633, "total_steps": 17941, "loss": 1.6806, "learning_rate": 8.58445716206638e-05, "epoch": 0.2582353269048548, "percentage": 25.82, "elapsed_time": "10:57:55", "remaining_time": "1 day, 7:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4634, "total_steps": 17941, "loss": 1.5884, "learning_rate": 8.583836315391403e-05, "epoch": 0.258291065158018, "percentage": 25.83, "elapsed_time": "10:58:03", "remaining_time": "1 day, 7:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4635, "total_steps": 17941, "loss": 2.001, "learning_rate": 8.583215355058035e-05, "epoch": 0.2583468034111811, "percentage": 25.83, "elapsed_time": "10:58:11", "remaining_time": "1 day, 7:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4636, "total_steps": 17941, "loss": 1.6639, "learning_rate": 8.582594281085967e-05, "epoch": 0.25840254166434423, "percentage": 25.84, "elapsed_time": "10:58:20", "remaining_time": "1 day, 7:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4637, "total_steps": 17941, "loss": 1.841, "learning_rate": 8.581973093494897e-05, "epoch": 0.25845827991750736, "percentage": 25.85, "elapsed_time": "10:58:28", "remaining_time": "1 day, 7:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4638, "total_steps": 17941, "loss": 1.6623, "learning_rate": 8.581351792304524e-05, "epoch": 0.25851401817067055, "percentage": 25.85, "elapsed_time": "10:58:37", "remaining_time": "1 day, 7:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4639, "total_steps": 17941, "loss": 1.5144, "learning_rate": 8.580730377534554e-05, "epoch": 0.2585697564238337, "percentage": 25.86, "elapsed_time": "10:58:45", "remaining_time": "1 day, 7:28:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4640, "total_steps": 17941, "loss": 1.4875, "learning_rate": 8.580108849204693e-05, "epoch": 0.2586254946769968, "percentage": 25.86, "elapsed_time": "10:58:54", "remaining_time": "1 day, 7:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4641, "total_steps": 17941, "loss": 1.7197, "learning_rate": 8.579487207334653e-05, "epoch": 0.25868123293016, "percentage": 25.87, "elapsed_time": "10:59:02", "remaining_time": "1 day, 7:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4642, "total_steps": 17941, "loss": 1.4488, "learning_rate": 8.578865451944148e-05, "epoch": 0.2587369711833231, "percentage": 25.87, "elapsed_time": "10:59:11", "remaining_time": "1 day, 7:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4643, "total_steps": 17941, "loss": 1.7116, "learning_rate": 8.578243583052897e-05, "epoch": 0.25879270943648625, "percentage": 25.88, "elapsed_time": "10:59:19", "remaining_time": "1 day, 7:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4644, "total_steps": 17941, "loss": 1.5765, "learning_rate": 8.577621600680623e-05, "epoch": 0.25884844768964943, "percentage": 25.88, "elapsed_time": "10:59:28", "remaining_time": "1 day, 7:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4645, "total_steps": 17941, "loss": 1.7881, "learning_rate": 8.57699950484705e-05, "epoch": 0.25890418594281256, "percentage": 25.89, "elapsed_time": "10:59:37", "remaining_time": "1 day, 7:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4646, "total_steps": 17941, "loss": 1.8373, "learning_rate": 8.57637729557191e-05, "epoch": 0.2589599241959757, "percentage": 25.9, "elapsed_time": "10:59:45", "remaining_time": "1 day, 7:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4647, "total_steps": 17941, "loss": 1.6772, "learning_rate": 8.575754972874931e-05, "epoch": 0.2590156624491388, "percentage": 25.9, "elapsed_time": "10:59:54", "remaining_time": "1 day, 7:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4648, "total_steps": 17941, "loss": 1.8558, "learning_rate": 8.575132536775853e-05, "epoch": 0.259071400702302, "percentage": 25.91, "elapsed_time": "11:00:03", "remaining_time": "1 day, 7:27:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4649, "total_steps": 17941, "loss": 1.9364, "learning_rate": 8.574509987294417e-05, "epoch": 0.25912713895546513, "percentage": 25.91, "elapsed_time": "11:00:11", "remaining_time": "1 day, 7:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4650, "total_steps": 17941, "loss": 1.8956, "learning_rate": 8.573887324450364e-05, "epoch": 0.25918287720862826, "percentage": 25.92, "elapsed_time": "11:00:20", "remaining_time": "1 day, 7:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4651, "total_steps": 17941, "loss": 1.7338, "learning_rate": 8.573264548263442e-05, "epoch": 0.25923861546179144, "percentage": 25.92, "elapsed_time": "11:00:28", "remaining_time": "1 day, 7:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4652, "total_steps": 17941, "loss": 1.5941, "learning_rate": 8.572641658753404e-05, "epoch": 0.2592943537149546, "percentage": 25.93, "elapsed_time": "11:00:37", "remaining_time": "1 day, 7:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4653, "total_steps": 17941, "loss": 1.7035, "learning_rate": 8.572018655940001e-05, "epoch": 0.2593500919681177, "percentage": 25.94, "elapsed_time": "11:00:45", "remaining_time": "1 day, 7:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4654, "total_steps": 17941, "loss": 1.7387, "learning_rate": 8.571395539842992e-05, "epoch": 0.2594058302212809, "percentage": 25.94, "elapsed_time": "11:00:54", "remaining_time": "1 day, 7:26:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4655, "total_steps": 17941, "loss": 1.7089, "learning_rate": 8.570772310482141e-05, "epoch": 0.259461568474444, "percentage": 25.95, "elapsed_time": "11:01:03", "remaining_time": "1 day, 7:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4656, "total_steps": 17941, "loss": 1.5298, "learning_rate": 8.57014896787721e-05, "epoch": 0.25951730672760714, "percentage": 25.95, "elapsed_time": "11:01:11", "remaining_time": "1 day, 7:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4657, "total_steps": 17941, "loss": 1.7676, "learning_rate": 8.569525512047969e-05, "epoch": 0.25957304498077033, "percentage": 25.96, "elapsed_time": "11:01:19", "remaining_time": "1 day, 7:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4658, "total_steps": 17941, "loss": 1.636, "learning_rate": 8.56890194301419e-05, "epoch": 0.25962878323393346, "percentage": 25.96, "elapsed_time": "11:01:28", "remaining_time": "1 day, 7:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4659, "total_steps": 17941, "loss": 1.8281, "learning_rate": 8.56827826079565e-05, "epoch": 0.2596845214870966, "percentage": 25.97, "elapsed_time": "11:01:36", "remaining_time": "1 day, 7:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4660, "total_steps": 17941, "loss": 1.7335, "learning_rate": 8.56765446541213e-05, "epoch": 0.2597402597402597, "percentage": 25.97, "elapsed_time": "11:01:45", "remaining_time": "1 day, 7:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4661, "total_steps": 17941, "loss": 1.8524, "learning_rate": 8.567030556883408e-05, "epoch": 0.2597959979934229, "percentage": 25.98, "elapsed_time": "11:01:53", "remaining_time": "1 day, 7:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4662, "total_steps": 17941, "loss": 1.7883, "learning_rate": 8.566406535229276e-05, "epoch": 0.25985173624658603, "percentage": 25.99, "elapsed_time": "11:02:02", "remaining_time": "1 day, 7:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4663, "total_steps": 17941, "loss": 1.7011, "learning_rate": 8.565782400469522e-05, "epoch": 0.25990747449974916, "percentage": 25.99, "elapsed_time": "11:02:11", "remaining_time": "1 day, 7:25:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4664, "total_steps": 17941, "loss": 1.4828, "learning_rate": 8.56515815262394e-05, "epoch": 0.25996321275291234, "percentage": 26.0, "elapsed_time": "11:02:19", "remaining_time": "1 day, 7:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4665, "total_steps": 17941, "loss": 1.7885, "learning_rate": 8.564533791712328e-05, "epoch": 0.26001895100607547, "percentage": 26.0, "elapsed_time": "11:02:28", "remaining_time": "1 day, 7:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4666, "total_steps": 17941, "loss": 1.9297, "learning_rate": 8.563909317754487e-05, "epoch": 0.2600746892592386, "percentage": 26.01, "elapsed_time": "11:02:36", "remaining_time": "1 day, 7:25:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4667, "total_steps": 17941, "loss": 1.9536, "learning_rate": 8.563284730770221e-05, "epoch": 0.2601304275124018, "percentage": 26.01, "elapsed_time": "11:02:45", "remaining_time": "1 day, 7:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4668, "total_steps": 17941, "loss": 2.003, "learning_rate": 8.56266003077934e-05, "epoch": 0.2601861657655649, "percentage": 26.02, "elapsed_time": "11:02:53", "remaining_time": "1 day, 7:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4669, "total_steps": 17941, "loss": 2.0024, "learning_rate": 8.562035217801652e-05, "epoch": 0.26024190401872804, "percentage": 26.02, "elapsed_time": "11:03:02", "remaining_time": "1 day, 7:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4670, "total_steps": 17941, "loss": 1.5865, "learning_rate": 8.561410291856977e-05, "epoch": 0.26029764227189117, "percentage": 26.03, "elapsed_time": "11:03:10", "remaining_time": "1 day, 7:24:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4671, "total_steps": 17941, "loss": 1.7586, "learning_rate": 8.560785252965131e-05, "epoch": 0.26035338052505436, "percentage": 26.04, "elapsed_time": "11:03:19", "remaining_time": "1 day, 7:24:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4672, "total_steps": 17941, "loss": 1.9274, "learning_rate": 8.560160101145937e-05, "epoch": 0.2604091187782175, "percentage": 26.04, "elapsed_time": "11:03:27", "remaining_time": "1 day, 7:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4673, "total_steps": 17941, "loss": 1.7652, "learning_rate": 8.559534836419224e-05, "epoch": 0.2604648570313806, "percentage": 26.05, "elapsed_time": "11:03:36", "remaining_time": "1 day, 7:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4674, "total_steps": 17941, "loss": 1.9096, "learning_rate": 8.558909458804818e-05, "epoch": 0.2605205952845438, "percentage": 26.05, "elapsed_time": "11:03:44", "remaining_time": "1 day, 7:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4675, "total_steps": 17941, "loss": 1.6586, "learning_rate": 8.558283968322555e-05, "epoch": 0.26057633353770693, "percentage": 26.06, "elapsed_time": "11:03:52", "remaining_time": "1 day, 7:23:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4676, "total_steps": 17941, "loss": 1.606, "learning_rate": 8.55765836499227e-05, "epoch": 0.26063207179087006, "percentage": 26.06, "elapsed_time": "11:04:01", "remaining_time": "1 day, 7:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4677, "total_steps": 17941, "loss": 1.698, "learning_rate": 8.557032648833804e-05, "epoch": 0.26068781004403324, "percentage": 26.07, "elapsed_time": "11:04:09", "remaining_time": "1 day, 7:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4678, "total_steps": 17941, "loss": 1.9568, "learning_rate": 8.556406819867001e-05, "epoch": 0.26074354829719637, "percentage": 26.07, "elapsed_time": "11:04:18", "remaining_time": "1 day, 7:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4679, "total_steps": 17941, "loss": 1.6827, "learning_rate": 8.55578087811171e-05, "epoch": 0.2607992865503595, "percentage": 26.08, "elapsed_time": "11:04:26", "remaining_time": "1 day, 7:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4680, "total_steps": 17941, "loss": 1.631, "learning_rate": 8.55515482358778e-05, "epoch": 0.2608550248035227, "percentage": 26.09, "elapsed_time": "11:04:35", "remaining_time": "1 day, 7:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4681, "total_steps": 17941, "loss": 1.7978, "learning_rate": 8.554528656315069e-05, "epoch": 0.2609107630566858, "percentage": 26.09, "elapsed_time": "11:04:43", "remaining_time": "1 day, 7:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4682, "total_steps": 17941, "loss": 1.4935, "learning_rate": 8.55390237631343e-05, "epoch": 0.26096650130984894, "percentage": 26.1, "elapsed_time": "11:04:52", "remaining_time": "1 day, 7:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4683, "total_steps": 17941, "loss": 1.3459, "learning_rate": 8.553275983602732e-05, "epoch": 0.26102223956301207, "percentage": 26.1, "elapsed_time": "11:05:00", "remaining_time": "1 day, 7:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4684, "total_steps": 17941, "loss": 1.8008, "learning_rate": 8.552649478202834e-05, "epoch": 0.26107797781617526, "percentage": 26.11, "elapsed_time": "11:05:09", "remaining_time": "1 day, 7:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4685, "total_steps": 17941, "loss": 1.5853, "learning_rate": 8.55202286013361e-05, "epoch": 0.2611337160693384, "percentage": 26.11, "elapsed_time": "11:05:18", "remaining_time": "1 day, 7:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4686, "total_steps": 17941, "loss": 1.7352, "learning_rate": 8.551396129414928e-05, "epoch": 0.2611894543225015, "percentage": 26.12, "elapsed_time": "11:05:26", "remaining_time": "1 day, 7:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4687, "total_steps": 17941, "loss": 1.5833, "learning_rate": 8.550769286066669e-05, "epoch": 0.2612451925756647, "percentage": 26.12, "elapsed_time": "11:05:35", "remaining_time": "1 day, 7:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4688, "total_steps": 17941, "loss": 1.8692, "learning_rate": 8.55014233010871e-05, "epoch": 0.2613009308288278, "percentage": 26.13, "elapsed_time": "11:05:43", "remaining_time": "1 day, 7:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4689, "total_steps": 17941, "loss": 1.6987, "learning_rate": 8.549515261560937e-05, "epoch": 0.26135666908199096, "percentage": 26.14, "elapsed_time": "11:05:51", "remaining_time": "1 day, 7:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4690, "total_steps": 17941, "loss": 1.4492, "learning_rate": 8.548888080443231e-05, "epoch": 0.26141240733515414, "percentage": 26.14, "elapsed_time": "11:06:00", "remaining_time": "1 day, 7:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4691, "total_steps": 17941, "loss": 1.7292, "learning_rate": 8.54826078677549e-05, "epoch": 0.26146814558831727, "percentage": 26.15, "elapsed_time": "11:06:08", "remaining_time": "1 day, 7:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4692, "total_steps": 17941, "loss": 1.9054, "learning_rate": 8.547633380577604e-05, "epoch": 0.2615238838414804, "percentage": 26.15, "elapsed_time": "11:06:17", "remaining_time": "1 day, 7:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4693, "total_steps": 17941, "loss": 1.8537, "learning_rate": 8.54700586186947e-05, "epoch": 0.2615796220946435, "percentage": 26.16, "elapsed_time": "11:06:26", "remaining_time": "1 day, 7:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4694, "total_steps": 17941, "loss": 1.7507, "learning_rate": 8.546378230670992e-05, "epoch": 0.2616353603478067, "percentage": 26.16, "elapsed_time": "11:06:35", "remaining_time": "1 day, 7:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4695, "total_steps": 17941, "loss": 1.5895, "learning_rate": 8.545750487002073e-05, "epoch": 0.26169109860096984, "percentage": 26.17, "elapsed_time": "11:06:43", "remaining_time": "1 day, 7:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4696, "total_steps": 17941, "loss": 1.5736, "learning_rate": 8.54512263088262e-05, "epoch": 0.26174683685413297, "percentage": 26.17, "elapsed_time": "11:06:52", "remaining_time": "1 day, 7:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4697, "total_steps": 17941, "loss": 1.5192, "learning_rate": 8.544494662332548e-05, "epoch": 0.26180257510729615, "percentage": 26.18, "elapsed_time": "11:07:01", "remaining_time": "1 day, 7:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4698, "total_steps": 17941, "loss": 1.7796, "learning_rate": 8.543866581371771e-05, "epoch": 0.2618583133604593, "percentage": 26.19, "elapsed_time": "11:07:09", "remaining_time": "1 day, 7:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4699, "total_steps": 17941, "loss": 1.756, "learning_rate": 8.54323838802021e-05, "epoch": 0.2619140516136224, "percentage": 26.19, "elapsed_time": "11:07:18", "remaining_time": "1 day, 7:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4700, "total_steps": 17941, "loss": 1.7589, "learning_rate": 8.542610082297783e-05, "epoch": 0.2619697898667856, "percentage": 26.2, "elapsed_time": "11:07:26", "remaining_time": "1 day, 7:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4701, "total_steps": 17941, "loss": 1.5043, "learning_rate": 8.541981664224421e-05, "epoch": 0.2620255281199487, "percentage": 26.2, "elapsed_time": "11:07:35", "remaining_time": "1 day, 7:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4702, "total_steps": 17941, "loss": 1.731, "learning_rate": 8.54135313382005e-05, "epoch": 0.26208126637311185, "percentage": 26.21, "elapsed_time": "11:07:43", "remaining_time": "1 day, 7:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4703, "total_steps": 17941, "loss": 1.6976, "learning_rate": 8.540724491104606e-05, "epoch": 0.26213700462627504, "percentage": 26.21, "elapsed_time": "11:07:52", "remaining_time": "1 day, 7:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4704, "total_steps": 17941, "loss": 1.8049, "learning_rate": 8.540095736098026e-05, "epoch": 0.26219274287943817, "percentage": 26.22, "elapsed_time": "11:08:01", "remaining_time": "1 day, 7:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4705, "total_steps": 17941, "loss": 1.5834, "learning_rate": 8.539466868820247e-05, "epoch": 0.2622484811326013, "percentage": 26.22, "elapsed_time": "11:08:09", "remaining_time": "1 day, 7:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4706, "total_steps": 17941, "loss": 1.6546, "learning_rate": 8.538837889291218e-05, "epoch": 0.2623042193857644, "percentage": 26.23, "elapsed_time": "11:08:18", "remaining_time": "1 day, 7:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4707, "total_steps": 17941, "loss": 1.434, "learning_rate": 8.538208797530883e-05, "epoch": 0.2623599576389276, "percentage": 26.24, "elapsed_time": "11:08:26", "remaining_time": "1 day, 7:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4708, "total_steps": 17941, "loss": 1.6628, "learning_rate": 8.537579593559195e-05, "epoch": 0.26241569589209074, "percentage": 26.24, "elapsed_time": "11:08:35", "remaining_time": "1 day, 7:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4709, "total_steps": 17941, "loss": 1.5702, "learning_rate": 8.536950277396106e-05, "epoch": 0.26247143414525387, "percentage": 26.25, "elapsed_time": "11:08:43", "remaining_time": "1 day, 7:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4710, "total_steps": 17941, "loss": 1.7829, "learning_rate": 8.536320849061577e-05, "epoch": 0.26252717239841705, "percentage": 26.25, "elapsed_time": "11:08:52", "remaining_time": "1 day, 7:18:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4711, "total_steps": 17941, "loss": 1.8271, "learning_rate": 8.535691308575569e-05, "epoch": 0.2625829106515802, "percentage": 26.26, "elapsed_time": "11:09:00", "remaining_time": "1 day, 7:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4712, "total_steps": 17941, "loss": 1.888, "learning_rate": 8.535061655958048e-05, "epoch": 0.2626386489047433, "percentage": 26.26, "elapsed_time": "11:09:09", "remaining_time": "1 day, 7:18:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4713, "total_steps": 17941, "loss": 1.5633, "learning_rate": 8.534431891228981e-05, "epoch": 0.2626943871579065, "percentage": 26.27, "elapsed_time": "11:09:18", "remaining_time": "1 day, 7:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4714, "total_steps": 17941, "loss": 1.7778, "learning_rate": 8.533802014408341e-05, "epoch": 0.2627501254110696, "percentage": 26.28, "elapsed_time": "11:09:26", "remaining_time": "1 day, 7:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4715, "total_steps": 17941, "loss": 1.6732, "learning_rate": 8.533172025516106e-05, "epoch": 0.26280586366423275, "percentage": 26.28, "elapsed_time": "11:09:35", "remaining_time": "1 day, 7:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4716, "total_steps": 17941, "loss": 1.7714, "learning_rate": 8.532541924572254e-05, "epoch": 0.2628616019173959, "percentage": 26.29, "elapsed_time": "11:09:43", "remaining_time": "1 day, 7:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4717, "total_steps": 17941, "loss": 1.7311, "learning_rate": 8.531911711596767e-05, "epoch": 0.26291734017055907, "percentage": 26.29, "elapsed_time": "11:09:52", "remaining_time": "1 day, 7:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4718, "total_steps": 17941, "loss": 1.684, "learning_rate": 8.531281386609633e-05, "epoch": 0.2629730784237222, "percentage": 26.3, "elapsed_time": "11:10:01", "remaining_time": "1 day, 7:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4719, "total_steps": 17941, "loss": 1.7727, "learning_rate": 8.530650949630844e-05, "epoch": 0.2630288166768853, "percentage": 26.3, "elapsed_time": "11:10:09", "remaining_time": "1 day, 7:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4720, "total_steps": 17941, "loss": 1.6802, "learning_rate": 8.530020400680392e-05, "epoch": 0.2630845549300485, "percentage": 26.31, "elapsed_time": "11:10:17", "remaining_time": "1 day, 7:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4721, "total_steps": 17941, "loss": 1.6691, "learning_rate": 8.529389739778272e-05, "epoch": 0.26314029318321164, "percentage": 26.31, "elapsed_time": "11:10:26", "remaining_time": "1 day, 7:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4722, "total_steps": 17941, "loss": 1.6649, "learning_rate": 8.528758966944489e-05, "epoch": 0.26319603143637477, "percentage": 26.32, "elapsed_time": "11:10:34", "remaining_time": "1 day, 7:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4723, "total_steps": 17941, "loss": 1.8637, "learning_rate": 8.528128082199046e-05, "epoch": 0.26325176968953795, "percentage": 26.33, "elapsed_time": "11:10:43", "remaining_time": "1 day, 7:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4724, "total_steps": 17941, "loss": 1.6409, "learning_rate": 8.527497085561949e-05, "epoch": 0.2633075079427011, "percentage": 26.33, "elapsed_time": "11:10:51", "remaining_time": "1 day, 7:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4725, "total_steps": 17941, "loss": 1.8414, "learning_rate": 8.526865977053211e-05, "epoch": 0.2633632461958642, "percentage": 26.34, "elapsed_time": "11:11:00", "remaining_time": "1 day, 7:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4726, "total_steps": 17941, "loss": 1.725, "learning_rate": 8.52623475669285e-05, "epoch": 0.2634189844490274, "percentage": 26.34, "elapsed_time": "11:11:08", "remaining_time": "1 day, 7:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4727, "total_steps": 17941, "loss": 1.5888, "learning_rate": 8.52560342450088e-05, "epoch": 0.2634747227021905, "percentage": 26.35, "elapsed_time": "11:11:17", "remaining_time": "1 day, 7:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4728, "total_steps": 17941, "loss": 1.5588, "learning_rate": 8.524971980497325e-05, "epoch": 0.26353046095535365, "percentage": 26.35, "elapsed_time": "11:11:25", "remaining_time": "1 day, 7:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4729, "total_steps": 17941, "loss": 1.6186, "learning_rate": 8.524340424702211e-05, "epoch": 0.2635861992085168, "percentage": 26.36, "elapsed_time": "11:11:34", "remaining_time": "1 day, 7:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4730, "total_steps": 17941, "loss": 1.6917, "learning_rate": 8.523708757135567e-05, "epoch": 0.26364193746167996, "percentage": 26.36, "elapsed_time": "11:11:42", "remaining_time": "1 day, 7:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4731, "total_steps": 17941, "loss": 1.8079, "learning_rate": 8.523076977817426e-05, "epoch": 0.2636976757148431, "percentage": 26.37, "elapsed_time": "11:11:51", "remaining_time": "1 day, 7:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4732, "total_steps": 17941, "loss": 1.6814, "learning_rate": 8.522445086767826e-05, "epoch": 0.2637534139680062, "percentage": 26.38, "elapsed_time": "11:11:59", "remaining_time": "1 day, 7:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4733, "total_steps": 17941, "loss": 1.7971, "learning_rate": 8.521813084006802e-05, "epoch": 0.2638091522211694, "percentage": 26.38, "elapsed_time": "11:12:07", "remaining_time": "1 day, 7:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4734, "total_steps": 17941, "loss": 1.6389, "learning_rate": 8.5211809695544e-05, "epoch": 0.26386489047433254, "percentage": 26.39, "elapsed_time": "11:12:16", "remaining_time": "1 day, 7:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4735, "total_steps": 17941, "loss": 1.8107, "learning_rate": 8.520548743430673e-05, "epoch": 0.26392062872749567, "percentage": 26.39, "elapsed_time": "11:12:24", "remaining_time": "1 day, 7:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4736, "total_steps": 17941, "loss": 1.7698, "learning_rate": 8.51991640565566e-05, "epoch": 0.26397636698065885, "percentage": 26.4, "elapsed_time": "11:12:33", "remaining_time": "1 day, 7:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4737, "total_steps": 17941, "loss": 1.9701, "learning_rate": 8.519283956249424e-05, "epoch": 0.264032105233822, "percentage": 26.4, "elapsed_time": "11:12:41", "remaining_time": "1 day, 7:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4738, "total_steps": 17941, "loss": 1.7033, "learning_rate": 8.51865139523202e-05, "epoch": 0.2640878434869851, "percentage": 26.41, "elapsed_time": "11:12:50", "remaining_time": "1 day, 7:14:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4739, "total_steps": 17941, "loss": 1.6353, "learning_rate": 8.518018722623509e-05, "epoch": 0.26414358174014824, "percentage": 26.41, "elapsed_time": "11:12:58", "remaining_time": "1 day, 7:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4740, "total_steps": 17941, "loss": 1.8496, "learning_rate": 8.517385938443955e-05, "epoch": 0.2641993199933114, "percentage": 26.42, "elapsed_time": "11:13:07", "remaining_time": "1 day, 7:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4741, "total_steps": 17941, "loss": 1.612, "learning_rate": 8.516753042713426e-05, "epoch": 0.26425505824647455, "percentage": 26.43, "elapsed_time": "11:13:15", "remaining_time": "1 day, 7:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4742, "total_steps": 17941, "loss": 1.5978, "learning_rate": 8.516120035451996e-05, "epoch": 0.2643107964996377, "percentage": 26.43, "elapsed_time": "11:13:24", "remaining_time": "1 day, 7:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4743, "total_steps": 17941, "loss": 1.9667, "learning_rate": 8.515486916679738e-05, "epoch": 0.26436653475280086, "percentage": 26.44, "elapsed_time": "11:13:32", "remaining_time": "1 day, 7:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4744, "total_steps": 17941, "loss": 1.639, "learning_rate": 8.514853686416732e-05, "epoch": 0.264422273005964, "percentage": 26.44, "elapsed_time": "11:13:41", "remaining_time": "1 day, 7:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4745, "total_steps": 17941, "loss": 1.6839, "learning_rate": 8.51422034468306e-05, "epoch": 0.2644780112591271, "percentage": 26.45, "elapsed_time": "11:13:49", "remaining_time": "1 day, 7:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4746, "total_steps": 17941, "loss": 1.6927, "learning_rate": 8.513586891498809e-05, "epoch": 0.2645337495122903, "percentage": 26.45, "elapsed_time": "11:13:57", "remaining_time": "1 day, 7:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4747, "total_steps": 17941, "loss": 1.5131, "learning_rate": 8.512953326884066e-05, "epoch": 0.26458948776545343, "percentage": 26.46, "elapsed_time": "11:14:06", "remaining_time": "1 day, 7:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4748, "total_steps": 17941, "loss": 1.8373, "learning_rate": 8.512319650858926e-05, "epoch": 0.26464522601861656, "percentage": 26.46, "elapsed_time": "11:14:14", "remaining_time": "1 day, 7:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4749, "total_steps": 17941, "loss": 1.723, "learning_rate": 8.511685863443484e-05, "epoch": 0.26470096427177975, "percentage": 26.47, "elapsed_time": "11:14:23", "remaining_time": "1 day, 7:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4750, "total_steps": 17941, "loss": 1.6108, "learning_rate": 8.511051964657842e-05, "epoch": 0.2647567025249429, "percentage": 26.48, "elapsed_time": "11:14:32", "remaining_time": "1 day, 7:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4751, "total_steps": 17941, "loss": 1.6268, "learning_rate": 8.510417954522102e-05, "epoch": 0.264812440778106, "percentage": 26.48, "elapsed_time": "11:14:40", "remaining_time": "1 day, 7:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4752, "total_steps": 17941, "loss": 1.828, "learning_rate": 8.509783833056373e-05, "epoch": 0.26486817903126914, "percentage": 26.49, "elapsed_time": "11:14:49", "remaining_time": "1 day, 7:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4753, "total_steps": 17941, "loss": 1.6537, "learning_rate": 8.509149600280762e-05, "epoch": 0.2649239172844323, "percentage": 26.49, "elapsed_time": "11:14:57", "remaining_time": "1 day, 7:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4754, "total_steps": 17941, "loss": 1.6702, "learning_rate": 8.508515256215389e-05, "epoch": 0.26497965553759545, "percentage": 26.5, "elapsed_time": "11:15:05", "remaining_time": "1 day, 7:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4755, "total_steps": 17941, "loss": 1.7545, "learning_rate": 8.507880800880364e-05, "epoch": 0.2650353937907586, "percentage": 26.5, "elapsed_time": "11:15:14", "remaining_time": "1 day, 7:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4756, "total_steps": 17941, "loss": 1.9199, "learning_rate": 8.507246234295814e-05, "epoch": 0.26509113204392176, "percentage": 26.51, "elapsed_time": "11:15:22", "remaining_time": "1 day, 7:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4757, "total_steps": 17941, "loss": 1.645, "learning_rate": 8.506611556481862e-05, "epoch": 0.2651468702970849, "percentage": 26.51, "elapsed_time": "11:15:31", "remaining_time": "1 day, 7:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4758, "total_steps": 17941, "loss": 1.8503, "learning_rate": 8.505976767458636e-05, "epoch": 0.265202608550248, "percentage": 26.52, "elapsed_time": "11:15:39", "remaining_time": "1 day, 7:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4759, "total_steps": 17941, "loss": 1.6562, "learning_rate": 8.50534186724627e-05, "epoch": 0.2652583468034112, "percentage": 26.53, "elapsed_time": "11:15:48", "remaining_time": "1 day, 7:11:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4760, "total_steps": 17941, "loss": 1.7167, "learning_rate": 8.504706855864897e-05, "epoch": 0.26531408505657433, "percentage": 26.53, "elapsed_time": "11:15:56", "remaining_time": "1 day, 7:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4761, "total_steps": 17941, "loss": 1.955, "learning_rate": 8.504071733334656e-05, "epoch": 0.26536982330973746, "percentage": 26.54, "elapsed_time": "11:16:05", "remaining_time": "1 day, 7:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4762, "total_steps": 17941, "loss": 1.7336, "learning_rate": 8.503436499675687e-05, "epoch": 0.2654255615629006, "percentage": 26.54, "elapsed_time": "11:16:14", "remaining_time": "1 day, 7:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4763, "total_steps": 17941, "loss": 1.7619, "learning_rate": 8.502801154908142e-05, "epoch": 0.2654812998160638, "percentage": 26.55, "elapsed_time": "11:16:22", "remaining_time": "1 day, 7:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4764, "total_steps": 17941, "loss": 1.6425, "learning_rate": 8.502165699052168e-05, "epoch": 0.2655370380692269, "percentage": 26.55, "elapsed_time": "11:16:31", "remaining_time": "1 day, 7:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4765, "total_steps": 17941, "loss": 1.5942, "learning_rate": 8.501530132127915e-05, "epoch": 0.26559277632239003, "percentage": 26.56, "elapsed_time": "11:16:39", "remaining_time": "1 day, 7:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4766, "total_steps": 17941, "loss": 1.4847, "learning_rate": 8.500894454155541e-05, "epoch": 0.2656485145755532, "percentage": 26.56, "elapsed_time": "11:16:48", "remaining_time": "1 day, 7:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4767, "total_steps": 17941, "loss": 1.8069, "learning_rate": 8.500258665155207e-05, "epoch": 0.26570425282871635, "percentage": 26.57, "elapsed_time": "11:16:56", "remaining_time": "1 day, 7:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4768, "total_steps": 17941, "loss": 1.9243, "learning_rate": 8.499622765147078e-05, "epoch": 0.2657599910818795, "percentage": 26.58, "elapsed_time": "11:17:04", "remaining_time": "1 day, 7:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4769, "total_steps": 17941, "loss": 1.5832, "learning_rate": 8.498986754151316e-05, "epoch": 0.26581572933504266, "percentage": 26.58, "elapsed_time": "11:17:13", "remaining_time": "1 day, 7:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4770, "total_steps": 17941, "loss": 1.7387, "learning_rate": 8.498350632188097e-05, "epoch": 0.2658714675882058, "percentage": 26.59, "elapsed_time": "11:17:21", "remaining_time": "1 day, 7:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4771, "total_steps": 17941, "loss": 1.7853, "learning_rate": 8.497714399277592e-05, "epoch": 0.2659272058413689, "percentage": 26.59, "elapsed_time": "11:17:30", "remaining_time": "1 day, 7:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4772, "total_steps": 17941, "loss": 1.4848, "learning_rate": 8.49707805543998e-05, "epoch": 0.2659829440945321, "percentage": 26.6, "elapsed_time": "11:17:38", "remaining_time": "1 day, 7:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4773, "total_steps": 17941, "loss": 1.615, "learning_rate": 8.496441600695441e-05, "epoch": 0.26603868234769523, "percentage": 26.6, "elapsed_time": "11:17:47", "remaining_time": "1 day, 7:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4774, "total_steps": 17941, "loss": 1.8508, "learning_rate": 8.495805035064159e-05, "epoch": 0.26609442060085836, "percentage": 26.61, "elapsed_time": "11:17:56", "remaining_time": "1 day, 7:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4775, "total_steps": 17941, "loss": 1.6307, "learning_rate": 8.495168358566325e-05, "epoch": 0.2661501588540215, "percentage": 26.62, "elapsed_time": "11:18:04", "remaining_time": "1 day, 7:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4776, "total_steps": 17941, "loss": 1.7516, "learning_rate": 8.494531571222128e-05, "epoch": 0.2662058971071847, "percentage": 26.62, "elapsed_time": "11:18:12", "remaining_time": "1 day, 7:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4777, "total_steps": 17941, "loss": 1.9439, "learning_rate": 8.493894673051765e-05, "epoch": 0.2662616353603478, "percentage": 26.63, "elapsed_time": "11:18:21", "remaining_time": "1 day, 7:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4778, "total_steps": 17941, "loss": 1.7159, "learning_rate": 8.493257664075433e-05, "epoch": 0.26631737361351093, "percentage": 26.63, "elapsed_time": "11:18:29", "remaining_time": "1 day, 7:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4779, "total_steps": 17941, "loss": 1.6972, "learning_rate": 8.492620544313335e-05, "epoch": 0.2663731118666741, "percentage": 26.64, "elapsed_time": "11:18:38", "remaining_time": "1 day, 7:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4780, "total_steps": 17941, "loss": 1.6285, "learning_rate": 8.491983313785676e-05, "epoch": 0.26642885011983725, "percentage": 26.64, "elapsed_time": "11:18:47", "remaining_time": "1 day, 7:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4781, "total_steps": 17941, "loss": 1.7433, "learning_rate": 8.491345972512668e-05, "epoch": 0.2664845883730004, "percentage": 26.65, "elapsed_time": "11:18:55", "remaining_time": "1 day, 7:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4782, "total_steps": 17941, "loss": 1.8665, "learning_rate": 8.490708520514519e-05, "epoch": 0.26654032662616356, "percentage": 26.65, "elapsed_time": "11:19:04", "remaining_time": "1 day, 7:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4783, "total_steps": 17941, "loss": 1.7147, "learning_rate": 8.490070957811449e-05, "epoch": 0.2665960648793267, "percentage": 26.66, "elapsed_time": "11:19:12", "remaining_time": "1 day, 7:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4784, "total_steps": 17941, "loss": 1.5935, "learning_rate": 8.489433284423678e-05, "epoch": 0.2666518031324898, "percentage": 26.67, "elapsed_time": "11:19:21", "remaining_time": "1 day, 7:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4785, "total_steps": 17941, "loss": 1.8616, "learning_rate": 8.488795500371427e-05, "epoch": 0.26670754138565295, "percentage": 26.67, "elapsed_time": "11:19:29", "remaining_time": "1 day, 7:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4786, "total_steps": 17941, "loss": 1.5693, "learning_rate": 8.488157605674925e-05, "epoch": 0.26676327963881613, "percentage": 26.68, "elapsed_time": "11:19:37", "remaining_time": "1 day, 7:08:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4787, "total_steps": 17941, "loss": 1.797, "learning_rate": 8.487519600354399e-05, "epoch": 0.26681901789197926, "percentage": 26.68, "elapsed_time": "11:19:46", "remaining_time": "1 day, 7:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4788, "total_steps": 17941, "loss": 1.7024, "learning_rate": 8.486881484430085e-05, "epoch": 0.2668747561451424, "percentage": 26.69, "elapsed_time": "11:19:55", "remaining_time": "1 day, 7:07:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4789, "total_steps": 17941, "loss": 1.6602, "learning_rate": 8.486243257922221e-05, "epoch": 0.2669304943983056, "percentage": 26.69, "elapsed_time": "11:20:03", "remaining_time": "1 day, 7:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4790, "total_steps": 17941, "loss": 1.7195, "learning_rate": 8.485604920851049e-05, "epoch": 0.2669862326514687, "percentage": 26.7, "elapsed_time": "11:20:11", "remaining_time": "1 day, 7:07:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4791, "total_steps": 17941, "loss": 1.6503, "learning_rate": 8.48496647323681e-05, "epoch": 0.26704197090463183, "percentage": 26.7, "elapsed_time": "11:20:20", "remaining_time": "1 day, 7:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4792, "total_steps": 17941, "loss": 1.7975, "learning_rate": 8.484327915099752e-05, "epoch": 0.267097709157795, "percentage": 26.71, "elapsed_time": "11:20:28", "remaining_time": "1 day, 7:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4793, "total_steps": 17941, "loss": 1.8362, "learning_rate": 8.48368924646013e-05, "epoch": 0.26715344741095814, "percentage": 26.72, "elapsed_time": "11:20:37", "remaining_time": "1 day, 7:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4794, "total_steps": 17941, "loss": 1.7033, "learning_rate": 8.483050467338194e-05, "epoch": 0.2672091856641213, "percentage": 26.72, "elapsed_time": "11:20:45", "remaining_time": "1 day, 7:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4795, "total_steps": 17941, "loss": 1.828, "learning_rate": 8.482411577754205e-05, "epoch": 0.26726492391728446, "percentage": 26.73, "elapsed_time": "11:20:54", "remaining_time": "1 day, 7:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4796, "total_steps": 17941, "loss": 1.6922, "learning_rate": 8.481772577728426e-05, "epoch": 0.2673206621704476, "percentage": 26.73, "elapsed_time": "11:21:03", "remaining_time": "1 day, 7:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4797, "total_steps": 17941, "loss": 1.7228, "learning_rate": 8.48113346728112e-05, "epoch": 0.2673764004236107, "percentage": 26.74, "elapsed_time": "11:21:11", "remaining_time": "1 day, 7:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4798, "total_steps": 17941, "loss": 1.7192, "learning_rate": 8.480494246432557e-05, "epoch": 0.26743213867677385, "percentage": 26.74, "elapsed_time": "11:21:20", "remaining_time": "1 day, 7:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4799, "total_steps": 17941, "loss": 1.5593, "learning_rate": 8.47985491520301e-05, "epoch": 0.26748787692993703, "percentage": 26.75, "elapsed_time": "11:21:28", "remaining_time": "1 day, 7:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4800, "total_steps": 17941, "loss": 1.7545, "learning_rate": 8.479215473612754e-05, "epoch": 0.26754361518310016, "percentage": 26.75, "elapsed_time": "11:21:37", "remaining_time": "1 day, 7:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4801, "total_steps": 17941, "loss": 1.9369, "learning_rate": 8.478575921682066e-05, "epoch": 0.2675993534362633, "percentage": 26.76, "elapsed_time": "11:21:45", "remaining_time": "1 day, 7:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4802, "total_steps": 17941, "loss": 1.6485, "learning_rate": 8.477936259431235e-05, "epoch": 0.26765509168942647, "percentage": 26.77, "elapsed_time": "11:21:53", "remaining_time": "1 day, 7:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4803, "total_steps": 17941, "loss": 1.6459, "learning_rate": 8.477296486880541e-05, "epoch": 0.2677108299425896, "percentage": 26.77, "elapsed_time": "11:22:02", "remaining_time": "1 day, 7:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4804, "total_steps": 17941, "loss": 1.8825, "learning_rate": 8.476656604050277e-05, "epoch": 0.26776656819575273, "percentage": 26.78, "elapsed_time": "11:22:11", "remaining_time": "1 day, 7:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4805, "total_steps": 17941, "loss": 1.8011, "learning_rate": 8.476016610960736e-05, "epoch": 0.2678223064489159, "percentage": 26.78, "elapsed_time": "11:22:19", "remaining_time": "1 day, 7:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4806, "total_steps": 17941, "loss": 1.726, "learning_rate": 8.475376507632215e-05, "epoch": 0.26787804470207904, "percentage": 26.79, "elapsed_time": "11:22:28", "remaining_time": "1 day, 7:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4807, "total_steps": 17941, "loss": 1.6394, "learning_rate": 8.474736294085014e-05, "epoch": 0.2679337829552422, "percentage": 26.79, "elapsed_time": "11:22:37", "remaining_time": "1 day, 7:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4808, "total_steps": 17941, "loss": 1.7973, "learning_rate": 8.474095970339436e-05, "epoch": 0.2679895212084053, "percentage": 26.8, "elapsed_time": "11:22:45", "remaining_time": "1 day, 7:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4809, "total_steps": 17941, "loss": 1.6653, "learning_rate": 8.473455536415789e-05, "epoch": 0.2680452594615685, "percentage": 26.8, "elapsed_time": "11:22:54", "remaining_time": "1 day, 7:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4810, "total_steps": 17941, "loss": 1.7463, "learning_rate": 8.472814992334386e-05, "epoch": 0.2681009977147316, "percentage": 26.81, "elapsed_time": "11:23:02", "remaining_time": "1 day, 7:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4811, "total_steps": 17941, "loss": 1.9016, "learning_rate": 8.472174338115537e-05, "epoch": 0.26815673596789474, "percentage": 26.82, "elapsed_time": "11:23:10", "remaining_time": "1 day, 7:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4812, "total_steps": 17941, "loss": 1.6117, "learning_rate": 8.471533573779564e-05, "epoch": 0.26821247422105793, "percentage": 26.82, "elapsed_time": "11:23:19", "remaining_time": "1 day, 7:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4813, "total_steps": 17941, "loss": 1.6871, "learning_rate": 8.470892699346786e-05, "epoch": 0.26826821247422106, "percentage": 26.83, "elapsed_time": "11:23:27", "remaining_time": "1 day, 7:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4814, "total_steps": 17941, "loss": 1.7255, "learning_rate": 8.470251714837529e-05, "epoch": 0.2683239507273842, "percentage": 26.83, "elapsed_time": "11:23:36", "remaining_time": "1 day, 7:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4815, "total_steps": 17941, "loss": 1.414, "learning_rate": 8.46961062027212e-05, "epoch": 0.26837968898054737, "percentage": 26.84, "elapsed_time": "11:23:44", "remaining_time": "1 day, 7:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4816, "total_steps": 17941, "loss": 1.835, "learning_rate": 8.46896941567089e-05, "epoch": 0.2684354272337105, "percentage": 26.84, "elapsed_time": "11:23:53", "remaining_time": "1 day, 7:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4817, "total_steps": 17941, "loss": 1.5269, "learning_rate": 8.468328101054177e-05, "epoch": 0.26849116548687363, "percentage": 26.85, "elapsed_time": "11:24:01", "remaining_time": "1 day, 7:03:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4818, "total_steps": 17941, "loss": 1.7195, "learning_rate": 8.467686676442318e-05, "epoch": 0.2685469037400368, "percentage": 26.85, "elapsed_time": "11:24:10", "remaining_time": "1 day, 7:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4819, "total_steps": 17941, "loss": 1.6714, "learning_rate": 8.467045141855656e-05, "epoch": 0.26860264199319994, "percentage": 26.86, "elapsed_time": "11:24:19", "remaining_time": "1 day, 7:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4820, "total_steps": 17941, "loss": 1.6444, "learning_rate": 8.466403497314537e-05, "epoch": 0.26865838024636307, "percentage": 26.87, "elapsed_time": "11:24:27", "remaining_time": "1 day, 7:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4821, "total_steps": 17941, "loss": 1.9121, "learning_rate": 8.465761742839307e-05, "epoch": 0.2687141184995262, "percentage": 26.87, "elapsed_time": "11:24:36", "remaining_time": "1 day, 7:03:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4822, "total_steps": 17941, "loss": 1.8351, "learning_rate": 8.465119878450324e-05, "epoch": 0.2687698567526894, "percentage": 26.88, "elapsed_time": "11:24:44", "remaining_time": "1 day, 7:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4823, "total_steps": 17941, "loss": 1.8308, "learning_rate": 8.46447790416794e-05, "epoch": 0.2688255950058525, "percentage": 26.88, "elapsed_time": "11:24:53", "remaining_time": "1 day, 7:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4824, "total_steps": 17941, "loss": 1.6928, "learning_rate": 8.463835820012517e-05, "epoch": 0.26888133325901564, "percentage": 26.89, "elapsed_time": "11:25:01", "remaining_time": "1 day, 7:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4825, "total_steps": 17941, "loss": 1.8407, "learning_rate": 8.463193626004418e-05, "epoch": 0.2689370715121788, "percentage": 26.89, "elapsed_time": "11:25:10", "remaining_time": "1 day, 7:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4826, "total_steps": 17941, "loss": 1.7246, "learning_rate": 8.462551322164007e-05, "epoch": 0.26899280976534196, "percentage": 26.9, "elapsed_time": "11:25:18", "remaining_time": "1 day, 7:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4827, "total_steps": 17941, "loss": 1.7408, "learning_rate": 8.461908908511657e-05, "epoch": 0.2690485480185051, "percentage": 26.9, "elapsed_time": "11:25:27", "remaining_time": "1 day, 7:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4828, "total_steps": 17941, "loss": 1.6012, "learning_rate": 8.461266385067741e-05, "epoch": 0.26910428627166827, "percentage": 26.91, "elapsed_time": "11:25:35", "remaining_time": "1 day, 7:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4829, "total_steps": 17941, "loss": 1.6175, "learning_rate": 8.460623751852637e-05, "epoch": 0.2691600245248314, "percentage": 26.92, "elapsed_time": "11:25:43", "remaining_time": "1 day, 7:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4830, "total_steps": 17941, "loss": 1.7742, "learning_rate": 8.459981008886721e-05, "epoch": 0.2692157627779945, "percentage": 26.92, "elapsed_time": "11:25:52", "remaining_time": "1 day, 7:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4831, "total_steps": 17941, "loss": 1.6737, "learning_rate": 8.459338156190384e-05, "epoch": 0.26927150103115766, "percentage": 26.93, "elapsed_time": "11:26:00", "remaining_time": "1 day, 7:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4832, "total_steps": 17941, "loss": 1.6606, "learning_rate": 8.45869519378401e-05, "epoch": 0.26932723928432084, "percentage": 26.93, "elapsed_time": "11:26:09", "remaining_time": "1 day, 7:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4833, "total_steps": 17941, "loss": 1.9741, "learning_rate": 8.458052121687987e-05, "epoch": 0.26938297753748397, "percentage": 26.94, "elapsed_time": "11:26:18", "remaining_time": "1 day, 7:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4834, "total_steps": 17941, "loss": 1.7103, "learning_rate": 8.457408939922715e-05, "epoch": 0.2694387157906471, "percentage": 26.94, "elapsed_time": "11:26:26", "remaining_time": "1 day, 7:01:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4835, "total_steps": 17941, "loss": 1.7605, "learning_rate": 8.456765648508589e-05, "epoch": 0.2694944540438103, "percentage": 26.95, "elapsed_time": "11:26:35", "remaining_time": "1 day, 7:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4836, "total_steps": 17941, "loss": 1.6074, "learning_rate": 8.456122247466009e-05, "epoch": 0.2695501922969734, "percentage": 26.96, "elapsed_time": "11:26:43", "remaining_time": "1 day, 7:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4837, "total_steps": 17941, "loss": 1.6341, "learning_rate": 8.455478736815385e-05, "epoch": 0.26960593055013654, "percentage": 26.96, "elapsed_time": "11:26:52", "remaining_time": "1 day, 7:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4838, "total_steps": 17941, "loss": 1.792, "learning_rate": 8.454835116577122e-05, "epoch": 0.2696616688032997, "percentage": 26.97, "elapsed_time": "11:27:00", "remaining_time": "1 day, 7:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4839, "total_steps": 17941, "loss": 1.5826, "learning_rate": 8.45419138677163e-05, "epoch": 0.26971740705646285, "percentage": 26.97, "elapsed_time": "11:27:09", "remaining_time": "1 day, 7:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4840, "total_steps": 17941, "loss": 1.7387, "learning_rate": 8.453547547419329e-05, "epoch": 0.269773145309626, "percentage": 26.98, "elapsed_time": "11:27:17", "remaining_time": "1 day, 7:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4841, "total_steps": 17941, "loss": 1.532, "learning_rate": 8.452903598540634e-05, "epoch": 0.26982888356278917, "percentage": 26.98, "elapsed_time": "11:27:26", "remaining_time": "1 day, 7:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4842, "total_steps": 17941, "loss": 1.7955, "learning_rate": 8.452259540155968e-05, "epoch": 0.2698846218159523, "percentage": 26.99, "elapsed_time": "11:27:34", "remaining_time": "1 day, 7:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4843, "total_steps": 17941, "loss": 1.7329, "learning_rate": 8.451615372285758e-05, "epoch": 0.2699403600691154, "percentage": 26.99, "elapsed_time": "11:27:43", "remaining_time": "1 day, 6:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4844, "total_steps": 17941, "loss": 1.7294, "learning_rate": 8.450971094950433e-05, "epoch": 0.26999609832227855, "percentage": 27.0, "elapsed_time": "11:27:51", "remaining_time": "1 day, 6:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4845, "total_steps": 17941, "loss": 2.0301, "learning_rate": 8.450326708170426e-05, "epoch": 0.27005183657544174, "percentage": 27.01, "elapsed_time": "11:28:00", "remaining_time": "1 day, 6:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4846, "total_steps": 17941, "loss": 1.5171, "learning_rate": 8.449682211966172e-05, "epoch": 0.27010757482860487, "percentage": 27.01, "elapsed_time": "11:28:09", "remaining_time": "1 day, 6:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4847, "total_steps": 17941, "loss": 1.776, "learning_rate": 8.449037606358111e-05, "epoch": 0.270163313081768, "percentage": 27.02, "elapsed_time": "11:28:17", "remaining_time": "1 day, 6:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4848, "total_steps": 17941, "loss": 1.8956, "learning_rate": 8.448392891366688e-05, "epoch": 0.2702190513349312, "percentage": 27.02, "elapsed_time": "11:28:26", "remaining_time": "1 day, 6:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4849, "total_steps": 17941, "loss": 1.7156, "learning_rate": 8.447748067012345e-05, "epoch": 0.2702747895880943, "percentage": 27.03, "elapsed_time": "11:28:34", "remaining_time": "1 day, 6:59:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4850, "total_steps": 17941, "loss": 1.6983, "learning_rate": 8.447103133315537e-05, "epoch": 0.27033052784125744, "percentage": 27.03, "elapsed_time": "11:28:43", "remaining_time": "1 day, 6:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4851, "total_steps": 17941, "loss": 1.6147, "learning_rate": 8.446458090296716e-05, "epoch": 0.2703862660944206, "percentage": 27.04, "elapsed_time": "11:28:51", "remaining_time": "1 day, 6:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4852, "total_steps": 17941, "loss": 1.677, "learning_rate": 8.445812937976338e-05, "epoch": 0.27044200434758375, "percentage": 27.04, "elapsed_time": "11:29:00", "remaining_time": "1 day, 6:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4853, "total_steps": 17941, "loss": 1.4833, "learning_rate": 8.445167676374865e-05, "epoch": 0.2704977426007469, "percentage": 27.05, "elapsed_time": "11:29:08", "remaining_time": "1 day, 6:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4854, "total_steps": 17941, "loss": 1.5832, "learning_rate": 8.444522305512757e-05, "epoch": 0.27055348085391, "percentage": 27.06, "elapsed_time": "11:29:16", "remaining_time": "1 day, 6:58:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4855, "total_steps": 17941, "loss": 1.4971, "learning_rate": 8.443876825410488e-05, "epoch": 0.2706092191070732, "percentage": 27.06, "elapsed_time": "11:29:25", "remaining_time": "1 day, 6:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4856, "total_steps": 17941, "loss": 1.7624, "learning_rate": 8.443231236088524e-05, "epoch": 0.2706649573602363, "percentage": 27.07, "elapsed_time": "11:29:33", "remaining_time": "1 day, 6:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4857, "total_steps": 17941, "loss": 1.5509, "learning_rate": 8.44258553756734e-05, "epoch": 0.27072069561339945, "percentage": 27.07, "elapsed_time": "11:29:42", "remaining_time": "1 day, 6:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4858, "total_steps": 17941, "loss": 1.8286, "learning_rate": 8.441939729867415e-05, "epoch": 0.27077643386656264, "percentage": 27.08, "elapsed_time": "11:29:50", "remaining_time": "1 day, 6:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4859, "total_steps": 17941, "loss": 1.7291, "learning_rate": 8.44129381300923e-05, "epoch": 0.27083217211972577, "percentage": 27.08, "elapsed_time": "11:29:59", "remaining_time": "1 day, 6:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4860, "total_steps": 17941, "loss": 1.6051, "learning_rate": 8.440647787013268e-05, "epoch": 0.2708879103728889, "percentage": 27.09, "elapsed_time": "11:30:07", "remaining_time": "1 day, 6:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4861, "total_steps": 17941, "loss": 1.5241, "learning_rate": 8.44000165190002e-05, "epoch": 0.2709436486260521, "percentage": 27.09, "elapsed_time": "11:30:15", "remaining_time": "1 day, 6:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4862, "total_steps": 17941, "loss": 1.8138, "learning_rate": 8.439355407689975e-05, "epoch": 0.2709993868792152, "percentage": 27.1, "elapsed_time": "11:30:24", "remaining_time": "1 day, 6:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4863, "total_steps": 17941, "loss": 1.5114, "learning_rate": 8.43870905440363e-05, "epoch": 0.27105512513237834, "percentage": 27.11, "elapsed_time": "11:30:33", "remaining_time": "1 day, 6:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4864, "total_steps": 17941, "loss": 1.5331, "learning_rate": 8.438062592061485e-05, "epoch": 0.2711108633855415, "percentage": 27.11, "elapsed_time": "11:30:41", "remaining_time": "1 day, 6:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4865, "total_steps": 17941, "loss": 1.5122, "learning_rate": 8.437416020684036e-05, "epoch": 0.27116660163870465, "percentage": 27.12, "elapsed_time": "11:30:50", "remaining_time": "1 day, 6:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4866, "total_steps": 17941, "loss": 1.8776, "learning_rate": 8.436769340291794e-05, "epoch": 0.2712223398918678, "percentage": 27.12, "elapsed_time": "11:30:58", "remaining_time": "1 day, 6:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4867, "total_steps": 17941, "loss": 1.6388, "learning_rate": 8.436122550905266e-05, "epoch": 0.2712780781450309, "percentage": 27.13, "elapsed_time": "11:31:06", "remaining_time": "1 day, 6:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4868, "total_steps": 17941, "loss": 1.5203, "learning_rate": 8.435475652544967e-05, "epoch": 0.2713338163981941, "percentage": 27.13, "elapsed_time": "11:31:15", "remaining_time": "1 day, 6:56:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4869, "total_steps": 17941, "loss": 1.8796, "learning_rate": 8.434828645231407e-05, "epoch": 0.2713895546513572, "percentage": 27.14, "elapsed_time": "11:31:23", "remaining_time": "1 day, 6:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4870, "total_steps": 17941, "loss": 1.711, "learning_rate": 8.434181528985112e-05, "epoch": 0.27144529290452035, "percentage": 27.14, "elapsed_time": "11:31:32", "remaining_time": "1 day, 6:56:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4871, "total_steps": 17941, "loss": 1.5739, "learning_rate": 8.4335343038266e-05, "epoch": 0.27150103115768354, "percentage": 27.15, "elapsed_time": "11:31:40", "remaining_time": "1 day, 6:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4872, "total_steps": 17941, "loss": 1.7037, "learning_rate": 8.432886969776398e-05, "epoch": 0.27155676941084667, "percentage": 27.16, "elapsed_time": "11:31:49", "remaining_time": "1 day, 6:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4873, "total_steps": 17941, "loss": 1.566, "learning_rate": 8.432239526855036e-05, "epoch": 0.2716125076640098, "percentage": 27.16, "elapsed_time": "11:31:58", "remaining_time": "1 day, 6:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4874, "total_steps": 17941, "loss": 1.7742, "learning_rate": 8.431591975083049e-05, "epoch": 0.271668245917173, "percentage": 27.17, "elapsed_time": "11:32:06", "remaining_time": "1 day, 6:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4875, "total_steps": 17941, "loss": 1.7467, "learning_rate": 8.430944314480973e-05, "epoch": 0.2717239841703361, "percentage": 27.17, "elapsed_time": "11:32:15", "remaining_time": "1 day, 6:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4876, "total_steps": 17941, "loss": 1.5414, "learning_rate": 8.430296545069345e-05, "epoch": 0.27177972242349924, "percentage": 27.18, "elapsed_time": "11:32:23", "remaining_time": "1 day, 6:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4877, "total_steps": 17941, "loss": 1.7401, "learning_rate": 8.429648666868713e-05, "epoch": 0.27183546067666237, "percentage": 27.18, "elapsed_time": "11:32:32", "remaining_time": "1 day, 6:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4878, "total_steps": 17941, "loss": 1.6739, "learning_rate": 8.429000679899619e-05, "epoch": 0.27189119892982555, "percentage": 27.19, "elapsed_time": "11:32:40", "remaining_time": "1 day, 6:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4879, "total_steps": 17941, "loss": 1.6982, "learning_rate": 8.428352584182617e-05, "epoch": 0.2719469371829887, "percentage": 27.19, "elapsed_time": "11:32:49", "remaining_time": "1 day, 6:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4880, "total_steps": 17941, "loss": 1.6927, "learning_rate": 8.42770437973826e-05, "epoch": 0.2720026754361518, "percentage": 27.2, "elapsed_time": "11:32:57", "remaining_time": "1 day, 6:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4881, "total_steps": 17941, "loss": 1.6674, "learning_rate": 8.427056066587105e-05, "epoch": 0.272058413689315, "percentage": 27.21, "elapsed_time": "11:33:05", "remaining_time": "1 day, 6:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4882, "total_steps": 17941, "loss": 1.8356, "learning_rate": 8.426407644749711e-05, "epoch": 0.2721141519424781, "percentage": 27.21, "elapsed_time": "11:33:14", "remaining_time": "1 day, 6:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4883, "total_steps": 17941, "loss": 1.749, "learning_rate": 8.425759114246647e-05, "epoch": 0.27216989019564125, "percentage": 27.22, "elapsed_time": "11:33:22", "remaining_time": "1 day, 6:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4884, "total_steps": 17941, "loss": 1.4771, "learning_rate": 8.425110475098476e-05, "epoch": 0.27222562844880444, "percentage": 27.22, "elapsed_time": "11:33:31", "remaining_time": "1 day, 6:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4885, "total_steps": 17941, "loss": 1.6603, "learning_rate": 8.42446172732577e-05, "epoch": 0.27228136670196756, "percentage": 27.23, "elapsed_time": "11:33:39", "remaining_time": "1 day, 6:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4886, "total_steps": 17941, "loss": 1.8797, "learning_rate": 8.423812870949104e-05, "epoch": 0.2723371049551307, "percentage": 27.23, "elapsed_time": "11:33:48", "remaining_time": "1 day, 6:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4887, "total_steps": 17941, "loss": 1.649, "learning_rate": 8.423163905989055e-05, "epoch": 0.2723928432082939, "percentage": 27.24, "elapsed_time": "11:33:56", "remaining_time": "1 day, 6:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4888, "total_steps": 17941, "loss": 1.7182, "learning_rate": 8.422514832466206e-05, "epoch": 0.272448581461457, "percentage": 27.24, "elapsed_time": "11:34:05", "remaining_time": "1 day, 6:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4889, "total_steps": 17941, "loss": 1.6317, "learning_rate": 8.421865650401143e-05, "epoch": 0.27250431971462014, "percentage": 27.25, "elapsed_time": "11:34:13", "remaining_time": "1 day, 6:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4890, "total_steps": 17941, "loss": 1.7071, "learning_rate": 8.421216359814451e-05, "epoch": 0.27256005796778326, "percentage": 27.26, "elapsed_time": "11:34:22", "remaining_time": "1 day, 6:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4891, "total_steps": 17941, "loss": 1.6561, "learning_rate": 8.420566960726723e-05, "epoch": 0.27261579622094645, "percentage": 27.26, "elapsed_time": "11:34:30", "remaining_time": "1 day, 6:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4892, "total_steps": 17941, "loss": 1.5538, "learning_rate": 8.419917453158554e-05, "epoch": 0.2726715344741096, "percentage": 27.27, "elapsed_time": "11:34:39", "remaining_time": "1 day, 6:52:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4893, "total_steps": 17941, "loss": 1.5957, "learning_rate": 8.419267837130544e-05, "epoch": 0.2727272727272727, "percentage": 27.27, "elapsed_time": "11:34:47", "remaining_time": "1 day, 6:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4894, "total_steps": 17941, "loss": 1.6552, "learning_rate": 8.418618112663292e-05, "epoch": 0.2727830109804359, "percentage": 27.28, "elapsed_time": "11:34:56", "remaining_time": "1 day, 6:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4895, "total_steps": 17941, "loss": 1.8649, "learning_rate": 8.417968279777409e-05, "epoch": 0.272838749233599, "percentage": 27.28, "elapsed_time": "11:35:04", "remaining_time": "1 day, 6:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4896, "total_steps": 17941, "loss": 1.8317, "learning_rate": 8.417318338493497e-05, "epoch": 0.27289448748676215, "percentage": 27.29, "elapsed_time": "11:35:13", "remaining_time": "1 day, 6:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4897, "total_steps": 17941, "loss": 1.775, "learning_rate": 8.416668288832173e-05, "epoch": 0.27295022573992533, "percentage": 27.3, "elapsed_time": "11:35:21", "remaining_time": "1 day, 6:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4898, "total_steps": 17941, "loss": 1.9256, "learning_rate": 8.41601813081405e-05, "epoch": 0.27300596399308846, "percentage": 27.3, "elapsed_time": "11:35:29", "remaining_time": "1 day, 6:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4899, "total_steps": 17941, "loss": 1.6553, "learning_rate": 8.415367864459751e-05, "epoch": 0.2730617022462516, "percentage": 27.31, "elapsed_time": "11:35:39", "remaining_time": "1 day, 6:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4900, "total_steps": 17941, "loss": 1.8121, "learning_rate": 8.414717489789894e-05, "epoch": 0.2731174404994147, "percentage": 27.31, "elapsed_time": "11:35:47", "remaining_time": "1 day, 6:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4901, "total_steps": 17941, "loss": 1.657, "learning_rate": 8.414067006825108e-05, "epoch": 0.2731731787525779, "percentage": 27.32, "elapsed_time": "11:35:56", "remaining_time": "1 day, 6:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4902, "total_steps": 17941, "loss": 2.2447, "learning_rate": 8.413416415586024e-05, "epoch": 0.27322891700574103, "percentage": 27.32, "elapsed_time": "11:36:04", "remaining_time": "1 day, 6:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4903, "total_steps": 17941, "loss": 1.5666, "learning_rate": 8.412765716093272e-05, "epoch": 0.27328465525890416, "percentage": 27.33, "elapsed_time": "11:36:13", "remaining_time": "1 day, 6:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4904, "total_steps": 17941, "loss": 1.5972, "learning_rate": 8.412114908367488e-05, "epoch": 0.27334039351206735, "percentage": 27.33, "elapsed_time": "11:36:21", "remaining_time": "1 day, 6:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4905, "total_steps": 17941, "loss": 1.8609, "learning_rate": 8.411463992429314e-05, "epoch": 0.2733961317652305, "percentage": 27.34, "elapsed_time": "11:36:30", "remaining_time": "1 day, 6:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4906, "total_steps": 17941, "loss": 1.8211, "learning_rate": 8.41081296829939e-05, "epoch": 0.2734518700183936, "percentage": 27.35, "elapsed_time": "11:36:38", "remaining_time": "1 day, 6:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4907, "total_steps": 17941, "loss": 1.7879, "learning_rate": 8.410161835998369e-05, "epoch": 0.2735076082715568, "percentage": 27.35, "elapsed_time": "11:36:47", "remaining_time": "1 day, 6:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4908, "total_steps": 17941, "loss": 1.9543, "learning_rate": 8.409510595546894e-05, "epoch": 0.2735633465247199, "percentage": 27.36, "elapsed_time": "11:36:55", "remaining_time": "1 day, 6:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4909, "total_steps": 17941, "loss": 1.8165, "learning_rate": 8.408859246965623e-05, "epoch": 0.27361908477788305, "percentage": 27.36, "elapsed_time": "11:37:03", "remaining_time": "1 day, 6:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4910, "total_steps": 17941, "loss": 1.8084, "learning_rate": 8.408207790275213e-05, "epoch": 0.27367482303104623, "percentage": 27.37, "elapsed_time": "11:37:12", "remaining_time": "1 day, 6:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4911, "total_steps": 17941, "loss": 1.782, "learning_rate": 8.407556225496322e-05, "epoch": 0.27373056128420936, "percentage": 27.37, "elapsed_time": "11:37:20", "remaining_time": "1 day, 6:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4912, "total_steps": 17941, "loss": 1.7673, "learning_rate": 8.406904552649614e-05, "epoch": 0.2737862995373725, "percentage": 27.38, "elapsed_time": "11:37:29", "remaining_time": "1 day, 6:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4913, "total_steps": 17941, "loss": 1.9742, "learning_rate": 8.406252771755758e-05, "epoch": 0.2738420377905356, "percentage": 27.38, "elapsed_time": "11:37:37", "remaining_time": "1 day, 6:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4914, "total_steps": 17941, "loss": 1.6226, "learning_rate": 8.405600882835425e-05, "epoch": 0.2738977760436988, "percentage": 27.39, "elapsed_time": "11:37:46", "remaining_time": "1 day, 6:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4915, "total_steps": 17941, "loss": 1.7948, "learning_rate": 8.404948885909288e-05, "epoch": 0.27395351429686193, "percentage": 27.4, "elapsed_time": "11:37:54", "remaining_time": "1 day, 6:49:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4916, "total_steps": 17941, "loss": 1.5653, "learning_rate": 8.404296780998022e-05, "epoch": 0.27400925255002506, "percentage": 27.4, "elapsed_time": "11:38:02", "remaining_time": "1 day, 6:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4917, "total_steps": 17941, "loss": 1.6596, "learning_rate": 8.403644568122313e-05, "epoch": 0.27406499080318825, "percentage": 27.41, "elapsed_time": "11:38:11", "remaining_time": "1 day, 6:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4918, "total_steps": 17941, "loss": 1.7119, "learning_rate": 8.402992247302842e-05, "epoch": 0.2741207290563514, "percentage": 27.41, "elapsed_time": "11:38:19", "remaining_time": "1 day, 6:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4919, "total_steps": 17941, "loss": 1.7161, "learning_rate": 8.402339818560296e-05, "epoch": 0.2741764673095145, "percentage": 27.42, "elapsed_time": "11:38:28", "remaining_time": "1 day, 6:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4920, "total_steps": 17941, "loss": 1.7174, "learning_rate": 8.401687281915371e-05, "epoch": 0.2742322055626777, "percentage": 27.42, "elapsed_time": "11:38:36", "remaining_time": "1 day, 6:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4921, "total_steps": 17941, "loss": 1.5517, "learning_rate": 8.401034637388758e-05, "epoch": 0.2742879438158408, "percentage": 27.43, "elapsed_time": "11:38:45", "remaining_time": "1 day, 6:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4922, "total_steps": 17941, "loss": 1.7067, "learning_rate": 8.400381885001155e-05, "epoch": 0.27434368206900395, "percentage": 27.43, "elapsed_time": "11:38:53", "remaining_time": "1 day, 6:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4923, "total_steps": 17941, "loss": 1.7333, "learning_rate": 8.399729024773264e-05, "epoch": 0.2743994203221671, "percentage": 27.44, "elapsed_time": "11:39:02", "remaining_time": "1 day, 6:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4924, "total_steps": 17941, "loss": 1.7721, "learning_rate": 8.39907605672579e-05, "epoch": 0.27445515857533026, "percentage": 27.45, "elapsed_time": "11:39:10", "remaining_time": "1 day, 6:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4925, "total_steps": 17941, "loss": 1.5788, "learning_rate": 8.398422980879442e-05, "epoch": 0.2745108968284934, "percentage": 27.45, "elapsed_time": "11:39:19", "remaining_time": "1 day, 6:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4926, "total_steps": 17941, "loss": 1.7782, "learning_rate": 8.39776979725493e-05, "epoch": 0.2745666350816565, "percentage": 27.46, "elapsed_time": "11:39:27", "remaining_time": "1 day, 6:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4927, "total_steps": 17941, "loss": 1.6911, "learning_rate": 8.397116505872973e-05, "epoch": 0.2746223733348197, "percentage": 27.46, "elapsed_time": "11:39:36", "remaining_time": "1 day, 6:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4928, "total_steps": 17941, "loss": 1.7944, "learning_rate": 8.396463106754285e-05, "epoch": 0.27467811158798283, "percentage": 27.47, "elapsed_time": "11:39:44", "remaining_time": "1 day, 6:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4929, "total_steps": 17941, "loss": 1.8542, "learning_rate": 8.395809599919591e-05, "epoch": 0.27473384984114596, "percentage": 27.47, "elapsed_time": "11:39:53", "remaining_time": "1 day, 6:47:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4930, "total_steps": 17941, "loss": 1.582, "learning_rate": 8.395155985389615e-05, "epoch": 0.27478958809430915, "percentage": 27.48, "elapsed_time": "11:40:02", "remaining_time": "1 day, 6:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4931, "total_steps": 17941, "loss": 1.8807, "learning_rate": 8.394502263185087e-05, "epoch": 0.2748453263474723, "percentage": 27.48, "elapsed_time": "11:40:10", "remaining_time": "1 day, 6:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4932, "total_steps": 17941, "loss": 1.8139, "learning_rate": 8.393848433326736e-05, "epoch": 0.2749010646006354, "percentage": 27.49, "elapsed_time": "11:40:19", "remaining_time": "1 day, 6:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4933, "total_steps": 17941, "loss": 1.9141, "learning_rate": 8.393194495835304e-05, "epoch": 0.2749568028537986, "percentage": 27.5, "elapsed_time": "11:40:27", "remaining_time": "1 day, 6:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4934, "total_steps": 17941, "loss": 1.7951, "learning_rate": 8.392540450731522e-05, "epoch": 0.2750125411069617, "percentage": 27.5, "elapsed_time": "11:40:36", "remaining_time": "1 day, 6:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4935, "total_steps": 17941, "loss": 1.7804, "learning_rate": 8.39188629803614e-05, "epoch": 0.27506827936012485, "percentage": 27.51, "elapsed_time": "11:40:44", "remaining_time": "1 day, 6:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4936, "total_steps": 17941, "loss": 1.82, "learning_rate": 8.3912320377699e-05, "epoch": 0.275124017613288, "percentage": 27.51, "elapsed_time": "11:40:53", "remaining_time": "1 day, 6:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4937, "total_steps": 17941, "loss": 1.7678, "learning_rate": 8.390577669953552e-05, "epoch": 0.27517975586645116, "percentage": 27.52, "elapsed_time": "11:41:01", "remaining_time": "1 day, 6:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4938, "total_steps": 17941, "loss": 1.5144, "learning_rate": 8.389923194607849e-05, "epoch": 0.2752354941196143, "percentage": 27.52, "elapsed_time": "11:41:09", "remaining_time": "1 day, 6:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4939, "total_steps": 17941, "loss": 1.6204, "learning_rate": 8.389268611753546e-05, "epoch": 0.2752912323727774, "percentage": 27.53, "elapsed_time": "11:41:18", "remaining_time": "1 day, 6:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4940, "total_steps": 17941, "loss": 1.6948, "learning_rate": 8.388613921411404e-05, "epoch": 0.2753469706259406, "percentage": 27.53, "elapsed_time": "11:41:26", "remaining_time": "1 day, 6:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4941, "total_steps": 17941, "loss": 1.5522, "learning_rate": 8.387959123602185e-05, "epoch": 0.27540270887910373, "percentage": 27.54, "elapsed_time": "11:41:35", "remaining_time": "1 day, 6:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4942, "total_steps": 17941, "loss": 1.6392, "learning_rate": 8.387304218346656e-05, "epoch": 0.27545844713226686, "percentage": 27.55, "elapsed_time": "11:41:43", "remaining_time": "1 day, 6:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4943, "total_steps": 17941, "loss": 1.674, "learning_rate": 8.386649205665586e-05, "epoch": 0.27551418538543004, "percentage": 27.55, "elapsed_time": "11:41:52", "remaining_time": "1 day, 6:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4944, "total_steps": 17941, "loss": 2.0767, "learning_rate": 8.385994085579751e-05, "epoch": 0.2755699236385932, "percentage": 27.56, "elapsed_time": "11:42:00", "remaining_time": "1 day, 6:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4945, "total_steps": 17941, "loss": 1.8275, "learning_rate": 8.385338858109922e-05, "epoch": 0.2756256618917563, "percentage": 27.56, "elapsed_time": "11:42:10", "remaining_time": "1 day, 6:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4946, "total_steps": 17941, "loss": 1.5918, "learning_rate": 8.384683523276885e-05, "epoch": 0.27568140014491943, "percentage": 27.57, "elapsed_time": "11:42:18", "remaining_time": "1 day, 6:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4947, "total_steps": 17941, "loss": 1.6857, "learning_rate": 8.38402808110142e-05, "epoch": 0.2757371383980826, "percentage": 27.57, "elapsed_time": "11:42:27", "remaining_time": "1 day, 6:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4948, "total_steps": 17941, "loss": 1.6894, "learning_rate": 8.383372531604314e-05, "epoch": 0.27579287665124574, "percentage": 27.58, "elapsed_time": "11:42:35", "remaining_time": "1 day, 6:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4949, "total_steps": 17941, "loss": 1.7214, "learning_rate": 8.382716874806357e-05, "epoch": 0.2758486149044089, "percentage": 27.58, "elapsed_time": "11:42:44", "remaining_time": "1 day, 6:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4950, "total_steps": 17941, "loss": 1.4341, "learning_rate": 8.382061110728345e-05, "epoch": 0.27590435315757206, "percentage": 27.59, "elapsed_time": "11:42:52", "remaining_time": "1 day, 6:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4951, "total_steps": 17941, "loss": 1.7528, "learning_rate": 8.381405239391074e-05, "epoch": 0.2759600914107352, "percentage": 27.6, "elapsed_time": "11:43:00", "remaining_time": "1 day, 6:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4952, "total_steps": 17941, "loss": 1.8709, "learning_rate": 8.38074926081534e-05, "epoch": 0.2760158296638983, "percentage": 27.6, "elapsed_time": "11:43:09", "remaining_time": "1 day, 6:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4953, "total_steps": 17941, "loss": 1.8472, "learning_rate": 8.380093175021953e-05, "epoch": 0.2760715679170615, "percentage": 27.61, "elapsed_time": "11:43:17", "remaining_time": "1 day, 6:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4954, "total_steps": 17941, "loss": 1.5508, "learning_rate": 8.379436982031718e-05, "epoch": 0.27612730617022463, "percentage": 27.61, "elapsed_time": "11:43:27", "remaining_time": "1 day, 6:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4955, "total_steps": 17941, "loss": 1.7762, "learning_rate": 8.378780681865445e-05, "epoch": 0.27618304442338776, "percentage": 27.62, "elapsed_time": "11:43:35", "remaining_time": "1 day, 6:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4956, "total_steps": 17941, "loss": 1.8666, "learning_rate": 8.37812427454395e-05, "epoch": 0.27623878267655094, "percentage": 27.62, "elapsed_time": "11:43:44", "remaining_time": "1 day, 6:43:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4957, "total_steps": 17941, "loss": 1.6681, "learning_rate": 8.377467760088046e-05, "epoch": 0.27629452092971407, "percentage": 27.63, "elapsed_time": "11:43:52", "remaining_time": "1 day, 6:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4958, "total_steps": 17941, "loss": 1.8999, "learning_rate": 8.376811138518558e-05, "epoch": 0.2763502591828772, "percentage": 27.64, "elapsed_time": "11:44:00", "remaining_time": "1 day, 6:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4959, "total_steps": 17941, "loss": 2.1091, "learning_rate": 8.376154409856309e-05, "epoch": 0.27640599743604033, "percentage": 27.64, "elapsed_time": "11:44:09", "remaining_time": "1 day, 6:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4960, "total_steps": 17941, "loss": 1.837, "learning_rate": 8.375497574122127e-05, "epoch": 0.2764617356892035, "percentage": 27.65, "elapsed_time": "11:44:17", "remaining_time": "1 day, 6:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4961, "total_steps": 17941, "loss": 1.643, "learning_rate": 8.374840631336842e-05, "epoch": 0.27651747394236664, "percentage": 27.65, "elapsed_time": "11:44:26", "remaining_time": "1 day, 6:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4962, "total_steps": 17941, "loss": 1.6044, "learning_rate": 8.374183581521288e-05, "epoch": 0.27657321219552977, "percentage": 27.66, "elapsed_time": "11:44:34", "remaining_time": "1 day, 6:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4963, "total_steps": 17941, "loss": 1.7088, "learning_rate": 8.373526424696305e-05, "epoch": 0.27662895044869296, "percentage": 27.66, "elapsed_time": "11:44:43", "remaining_time": "1 day, 6:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4964, "total_steps": 17941, "loss": 1.5888, "learning_rate": 8.372869160882733e-05, "epoch": 0.2766846887018561, "percentage": 27.67, "elapsed_time": "11:44:51", "remaining_time": "1 day, 6:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4965, "total_steps": 17941, "loss": 1.6905, "learning_rate": 8.372211790101414e-05, "epoch": 0.2767404269550192, "percentage": 27.67, "elapsed_time": "11:45:00", "remaining_time": "1 day, 6:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4966, "total_steps": 17941, "loss": 1.7584, "learning_rate": 8.3715543123732e-05, "epoch": 0.2767961652081824, "percentage": 27.68, "elapsed_time": "11:45:08", "remaining_time": "1 day, 6:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4967, "total_steps": 17941, "loss": 1.7863, "learning_rate": 8.370896727718942e-05, "epoch": 0.2768519034613455, "percentage": 27.69, "elapsed_time": "11:45:18", "remaining_time": "1 day, 6:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4968, "total_steps": 17941, "loss": 1.8825, "learning_rate": 8.370239036159493e-05, "epoch": 0.27690764171450866, "percentage": 27.69, "elapsed_time": "11:45:26", "remaining_time": "1 day, 6:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4969, "total_steps": 17941, "loss": 1.9587, "learning_rate": 8.36958123771571e-05, "epoch": 0.2769633799676718, "percentage": 27.7, "elapsed_time": "11:45:35", "remaining_time": "1 day, 6:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4970, "total_steps": 17941, "loss": 1.8635, "learning_rate": 8.368923332408459e-05, "epoch": 0.27701911822083497, "percentage": 27.7, "elapsed_time": "11:45:43", "remaining_time": "1 day, 6:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4971, "total_steps": 17941, "loss": 1.7843, "learning_rate": 8.368265320258598e-05, "epoch": 0.2770748564739981, "percentage": 27.71, "elapsed_time": "11:45:52", "remaining_time": "1 day, 6:41:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4972, "total_steps": 17941, "loss": 1.6231, "learning_rate": 8.367607201287002e-05, "epoch": 0.27713059472716123, "percentage": 27.71, "elapsed_time": "11:46:00", "remaining_time": "1 day, 6:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4973, "total_steps": 17941, "loss": 1.5014, "learning_rate": 8.366948975514539e-05, "epoch": 0.2771863329803244, "percentage": 27.72, "elapsed_time": "11:46:09", "remaining_time": "1 day, 6:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4974, "total_steps": 17941, "loss": 1.522, "learning_rate": 8.366290642962087e-05, "epoch": 0.27724207123348754, "percentage": 27.72, "elapsed_time": "11:46:17", "remaining_time": "1 day, 6:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4975, "total_steps": 17941, "loss": 1.5344, "learning_rate": 8.36563220365052e-05, "epoch": 0.27729780948665067, "percentage": 27.73, "elapsed_time": "11:46:26", "remaining_time": "1 day, 6:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4976, "total_steps": 17941, "loss": 1.4201, "learning_rate": 8.364973657600724e-05, "epoch": 0.27735354773981385, "percentage": 27.74, "elapsed_time": "11:46:34", "remaining_time": "1 day, 6:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4977, "total_steps": 17941, "loss": 1.7664, "learning_rate": 8.364315004833583e-05, "epoch": 0.277409285992977, "percentage": 27.74, "elapsed_time": "11:46:42", "remaining_time": "1 day, 6:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4978, "total_steps": 17941, "loss": 1.75, "learning_rate": 8.363656245369984e-05, "epoch": 0.2774650242461401, "percentage": 27.75, "elapsed_time": "11:46:51", "remaining_time": "1 day, 6:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4979, "total_steps": 17941, "loss": 1.6432, "learning_rate": 8.362997379230822e-05, "epoch": 0.2775207624993033, "percentage": 27.75, "elapsed_time": "11:46:59", "remaining_time": "1 day, 6:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4980, "total_steps": 17941, "loss": 1.948, "learning_rate": 8.36233840643699e-05, "epoch": 0.2775765007524664, "percentage": 27.76, "elapsed_time": "11:47:08", "remaining_time": "1 day, 6:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4981, "total_steps": 17941, "loss": 1.8148, "learning_rate": 8.361679327009388e-05, "epoch": 0.27763223900562956, "percentage": 27.76, "elapsed_time": "11:47:16", "remaining_time": "1 day, 6:40:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4982, "total_steps": 17941, "loss": 1.9087, "learning_rate": 8.361020140968919e-05, "epoch": 0.2776879772587927, "percentage": 27.77, "elapsed_time": "11:47:25", "remaining_time": "1 day, 6:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4983, "total_steps": 17941, "loss": 1.7628, "learning_rate": 8.360360848336484e-05, "epoch": 0.27774371551195587, "percentage": 27.77, "elapsed_time": "11:47:33", "remaining_time": "1 day, 6:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4984, "total_steps": 17941, "loss": 1.8127, "learning_rate": 8.359701449132998e-05, "epoch": 0.277799453765119, "percentage": 27.78, "elapsed_time": "11:47:42", "remaining_time": "1 day, 6:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4985, "total_steps": 17941, "loss": 1.5508, "learning_rate": 8.359041943379369e-05, "epoch": 0.2778551920182821, "percentage": 27.79, "elapsed_time": "11:47:50", "remaining_time": "1 day, 6:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4986, "total_steps": 17941, "loss": 1.6666, "learning_rate": 8.358382331096514e-05, "epoch": 0.2779109302714453, "percentage": 27.79, "elapsed_time": "11:47:59", "remaining_time": "1 day, 6:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4987, "total_steps": 17941, "loss": 1.8808, "learning_rate": 8.357722612305353e-05, "epoch": 0.27796666852460844, "percentage": 27.8, "elapsed_time": "11:48:07", "remaining_time": "1 day, 6:39:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4988, "total_steps": 17941, "loss": 1.7122, "learning_rate": 8.357062787026805e-05, "epoch": 0.27802240677777157, "percentage": 27.8, "elapsed_time": "11:48:15", "remaining_time": "1 day, 6:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4989, "total_steps": 17941, "loss": 1.6552, "learning_rate": 8.356402855281802e-05, "epoch": 0.27807814503093475, "percentage": 27.81, "elapsed_time": "11:48:24", "remaining_time": "1 day, 6:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4990, "total_steps": 17941, "loss": 1.4913, "learning_rate": 8.355742817091268e-05, "epoch": 0.2781338832840979, "percentage": 27.81, "elapsed_time": "11:48:32", "remaining_time": "1 day, 6:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4991, "total_steps": 17941, "loss": 1.7334, "learning_rate": 8.355082672476136e-05, "epoch": 0.278189621537261, "percentage": 27.82, "elapsed_time": "11:48:41", "remaining_time": "1 day, 6:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4992, "total_steps": 17941, "loss": 2.005, "learning_rate": 8.354422421457346e-05, "epoch": 0.27824535979042414, "percentage": 27.82, "elapsed_time": "11:48:49", "remaining_time": "1 day, 6:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4993, "total_steps": 17941, "loss": 1.6484, "learning_rate": 8.353762064055833e-05, "epoch": 0.2783010980435873, "percentage": 27.83, "elapsed_time": "11:48:58", "remaining_time": "1 day, 6:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4994, "total_steps": 17941, "loss": 1.7403, "learning_rate": 8.353101600292541e-05, "epoch": 0.27835683629675045, "percentage": 27.84, "elapsed_time": "11:49:06", "remaining_time": "1 day, 6:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4995, "total_steps": 17941, "loss": 1.6779, "learning_rate": 8.352441030188417e-05, "epoch": 0.2784125745499136, "percentage": 27.84, "elapsed_time": "11:49:15", "remaining_time": "1 day, 6:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4996, "total_steps": 17941, "loss": 1.7298, "learning_rate": 8.351780353764408e-05, "epoch": 0.27846831280307677, "percentage": 27.85, "elapsed_time": "11:49:23", "remaining_time": "1 day, 6:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4997, "total_steps": 17941, "loss": 1.594, "learning_rate": 8.351119571041468e-05, "epoch": 0.2785240510562399, "percentage": 27.85, "elapsed_time": "11:49:31", "remaining_time": "1 day, 6:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4998, "total_steps": 17941, "loss": 1.7623, "learning_rate": 8.350458682040556e-05, "epoch": 0.278579789309403, "percentage": 27.86, "elapsed_time": "11:49:40", "remaining_time": "1 day, 6:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4999, "total_steps": 17941, "loss": 1.6779, "learning_rate": 8.349797686782627e-05, "epoch": 0.2786355275625662, "percentage": 27.86, "elapsed_time": "11:49:48", "remaining_time": "1 day, 6:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5000, "total_steps": 17941, "loss": 1.8159, "learning_rate": 8.349136585288648e-05, "epoch": 0.27869126581572934, "percentage": 27.87, "elapsed_time": "11:49:57", "remaining_time": "1 day, 6:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5001, "total_steps": 17941, "loss": 1.6049, "learning_rate": 8.348475377579583e-05, "epoch": 0.27874700406889247, "percentage": 27.87, "elapsed_time": "11:50:05", "remaining_time": "1 day, 6:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5002, "total_steps": 17941, "loss": 1.661, "learning_rate": 8.3478140636764e-05, "epoch": 0.27880274232205565, "percentage": 27.88, "elapsed_time": "11:50:14", "remaining_time": "1 day, 6:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5003, "total_steps": 17941, "loss": 1.6633, "learning_rate": 8.347152643600076e-05, "epoch": 0.2788584805752188, "percentage": 27.89, "elapsed_time": "11:50:22", "remaining_time": "1 day, 6:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5004, "total_steps": 17941, "loss": 1.7599, "learning_rate": 8.346491117371584e-05, "epoch": 0.2789142188283819, "percentage": 27.89, "elapsed_time": "11:50:32", "remaining_time": "1 day, 6:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5005, "total_steps": 17941, "loss": 1.6645, "learning_rate": 8.345829485011906e-05, "epoch": 0.27896995708154504, "percentage": 27.9, "elapsed_time": "11:50:40", "remaining_time": "1 day, 6:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5006, "total_steps": 17941, "loss": 1.7965, "learning_rate": 8.345167746542024e-05, "epoch": 0.2790256953347082, "percentage": 27.9, "elapsed_time": "11:50:48", "remaining_time": "1 day, 6:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5007, "total_steps": 17941, "loss": 1.8171, "learning_rate": 8.344505901982926e-05, "epoch": 0.27908143358787135, "percentage": 27.91, "elapsed_time": "11:50:57", "remaining_time": "1 day, 6:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5008, "total_steps": 17941, "loss": 1.5853, "learning_rate": 8.343843951355599e-05, "epoch": 0.2791371718410345, "percentage": 27.91, "elapsed_time": "11:51:05", "remaining_time": "1 day, 6:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5009, "total_steps": 17941, "loss": 1.8362, "learning_rate": 8.34318189468104e-05, "epoch": 0.27919291009419767, "percentage": 27.92, "elapsed_time": "11:51:14", "remaining_time": "1 day, 6:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5010, "total_steps": 17941, "loss": 1.7712, "learning_rate": 8.34251973198024e-05, "epoch": 0.2792486483473608, "percentage": 27.92, "elapsed_time": "11:51:22", "remaining_time": "1 day, 6:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5011, "total_steps": 17941, "loss": 1.729, "learning_rate": 8.341857463274204e-05, "epoch": 0.2793043866005239, "percentage": 27.93, "elapsed_time": "11:51:31", "remaining_time": "1 day, 6:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5012, "total_steps": 17941, "loss": 1.9075, "learning_rate": 8.341195088583934e-05, "epoch": 0.2793601248536871, "percentage": 27.94, "elapsed_time": "11:51:39", "remaining_time": "1 day, 6:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5013, "total_steps": 17941, "loss": 1.6845, "learning_rate": 8.340532607930435e-05, "epoch": 0.27941586310685024, "percentage": 27.94, "elapsed_time": "11:51:48", "remaining_time": "1 day, 6:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5014, "total_steps": 17941, "loss": 1.677, "learning_rate": 8.339870021334721e-05, "epoch": 0.27947160136001337, "percentage": 27.95, "elapsed_time": "11:51:56", "remaining_time": "1 day, 6:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5015, "total_steps": 17941, "loss": 1.7604, "learning_rate": 8.339207328817801e-05, "epoch": 0.2795273396131765, "percentage": 27.95, "elapsed_time": "11:52:04", "remaining_time": "1 day, 6:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5016, "total_steps": 17941, "loss": 1.8327, "learning_rate": 8.338544530400694e-05, "epoch": 0.2795830778663397, "percentage": 27.96, "elapsed_time": "11:52:13", "remaining_time": "1 day, 6:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5017, "total_steps": 17941, "loss": 1.8363, "learning_rate": 8.337881626104418e-05, "epoch": 0.2796388161195028, "percentage": 27.96, "elapsed_time": "11:52:21", "remaining_time": "1 day, 6:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5018, "total_steps": 17941, "loss": 1.5949, "learning_rate": 8.337218615949999e-05, "epoch": 0.27969455437266594, "percentage": 27.97, "elapsed_time": "11:52:30", "remaining_time": "1 day, 6:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5019, "total_steps": 17941, "loss": 1.7101, "learning_rate": 8.336555499958463e-05, "epoch": 0.2797502926258291, "percentage": 27.98, "elapsed_time": "11:52:39", "remaining_time": "1 day, 6:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5020, "total_steps": 17941, "loss": 1.6419, "learning_rate": 8.33589227815084e-05, "epoch": 0.27980603087899225, "percentage": 27.98, "elapsed_time": "11:52:47", "remaining_time": "1 day, 6:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5021, "total_steps": 17941, "loss": 1.5752, "learning_rate": 8.335228950548164e-05, "epoch": 0.2798617691321554, "percentage": 27.99, "elapsed_time": "11:52:56", "remaining_time": "1 day, 6:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5022, "total_steps": 17941, "loss": 1.608, "learning_rate": 8.334565517171471e-05, "epoch": 0.27991750738531856, "percentage": 27.99, "elapsed_time": "11:53:04", "remaining_time": "1 day, 6:34:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5023, "total_steps": 17941, "loss": 1.8295, "learning_rate": 8.333901978041801e-05, "epoch": 0.2799732456384817, "percentage": 28.0, "elapsed_time": "11:53:13", "remaining_time": "1 day, 6:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5024, "total_steps": 17941, "loss": 2.1082, "learning_rate": 8.3332383331802e-05, "epoch": 0.2800289838916448, "percentage": 28.0, "elapsed_time": "11:53:22", "remaining_time": "1 day, 6:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5025, "total_steps": 17941, "loss": 1.5637, "learning_rate": 8.332574582607712e-05, "epoch": 0.280084722144808, "percentage": 28.01, "elapsed_time": "11:53:30", "remaining_time": "1 day, 6:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5026, "total_steps": 17941, "loss": 1.565, "learning_rate": 8.331910726345389e-05, "epoch": 0.28014046039797114, "percentage": 28.01, "elapsed_time": "11:53:39", "remaining_time": "1 day, 6:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5027, "total_steps": 17941, "loss": 1.6853, "learning_rate": 8.331246764414282e-05, "epoch": 0.28019619865113427, "percentage": 28.02, "elapsed_time": "11:53:47", "remaining_time": "1 day, 6:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5028, "total_steps": 17941, "loss": 1.8281, "learning_rate": 8.330582696835453e-05, "epoch": 0.2802519369042974, "percentage": 28.03, "elapsed_time": "11:53:56", "remaining_time": "1 day, 6:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5029, "total_steps": 17941, "loss": 1.5658, "learning_rate": 8.329918523629958e-05, "epoch": 0.2803076751574606, "percentage": 28.03, "elapsed_time": "11:54:04", "remaining_time": "1 day, 6:33:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5030, "total_steps": 17941, "loss": 1.5369, "learning_rate": 8.329254244818862e-05, "epoch": 0.2803634134106237, "percentage": 28.04, "elapsed_time": "11:54:13", "remaining_time": "1 day, 6:33:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5031, "total_steps": 17941, "loss": 1.718, "learning_rate": 8.328589860423234e-05, "epoch": 0.28041915166378684, "percentage": 28.04, "elapsed_time": "11:54:21", "remaining_time": "1 day, 6:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5032, "total_steps": 17941, "loss": 1.5096, "learning_rate": 8.327925370464142e-05, "epoch": 0.28047488991695, "percentage": 28.05, "elapsed_time": "11:54:29", "remaining_time": "1 day, 6:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5033, "total_steps": 17941, "loss": 1.8082, "learning_rate": 8.32726077496266e-05, "epoch": 0.28053062817011315, "percentage": 28.05, "elapsed_time": "11:54:38", "remaining_time": "1 day, 6:32:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5034, "total_steps": 17941, "loss": 1.885, "learning_rate": 8.326596073939865e-05, "epoch": 0.2805863664232763, "percentage": 28.06, "elapsed_time": "11:54:46", "remaining_time": "1 day, 6:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5035, "total_steps": 17941, "loss": 1.6933, "learning_rate": 8.325931267416837e-05, "epoch": 0.28064210467643946, "percentage": 28.06, "elapsed_time": "11:54:55", "remaining_time": "1 day, 6:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5036, "total_steps": 17941, "loss": 1.7869, "learning_rate": 8.325266355414663e-05, "epoch": 0.2806978429296026, "percentage": 28.07, "elapsed_time": "11:55:03", "remaining_time": "1 day, 6:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5037, "total_steps": 17941, "loss": 1.8213, "learning_rate": 8.324601337954427e-05, "epoch": 0.2807535811827657, "percentage": 28.08, "elapsed_time": "11:55:12", "remaining_time": "1 day, 6:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5038, "total_steps": 17941, "loss": 1.5685, "learning_rate": 8.323936215057219e-05, "epoch": 0.28080931943592885, "percentage": 28.08, "elapsed_time": "11:55:20", "remaining_time": "1 day, 6:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5039, "total_steps": 17941, "loss": 1.6801, "learning_rate": 8.323270986744136e-05, "epoch": 0.28086505768909203, "percentage": 28.09, "elapsed_time": "11:55:29", "remaining_time": "1 day, 6:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5040, "total_steps": 17941, "loss": 1.7527, "learning_rate": 8.322605653036273e-05, "epoch": 0.28092079594225516, "percentage": 28.09, "elapsed_time": "11:55:38", "remaining_time": "1 day, 6:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5041, "total_steps": 17941, "loss": 1.7583, "learning_rate": 8.32194021395473e-05, "epoch": 0.2809765341954183, "percentage": 28.1, "elapsed_time": "11:55:46", "remaining_time": "1 day, 6:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5042, "total_steps": 17941, "loss": 1.6603, "learning_rate": 8.321274669520613e-05, "epoch": 0.2810322724485815, "percentage": 28.1, "elapsed_time": "11:55:55", "remaining_time": "1 day, 6:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5043, "total_steps": 17941, "loss": 1.8041, "learning_rate": 8.320609019755025e-05, "epoch": 0.2810880107017446, "percentage": 28.11, "elapsed_time": "11:56:03", "remaining_time": "1 day, 6:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5044, "total_steps": 17941, "loss": 1.8187, "learning_rate": 8.319943264679082e-05, "epoch": 0.28114374895490774, "percentage": 28.11, "elapsed_time": "11:56:11", "remaining_time": "1 day, 6:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5045, "total_steps": 17941, "loss": 1.627, "learning_rate": 8.319277404313895e-05, "epoch": 0.2811994872080709, "percentage": 28.12, "elapsed_time": "11:56:20", "remaining_time": "1 day, 6:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5046, "total_steps": 17941, "loss": 1.7922, "learning_rate": 8.318611438680581e-05, "epoch": 0.28125522546123405, "percentage": 28.13, "elapsed_time": "11:56:28", "remaining_time": "1 day, 6:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5047, "total_steps": 17941, "loss": 1.9276, "learning_rate": 8.317945367800262e-05, "epoch": 0.2813109637143972, "percentage": 28.13, "elapsed_time": "11:56:37", "remaining_time": "1 day, 6:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5048, "total_steps": 17941, "loss": 1.6415, "learning_rate": 8.31727919169406e-05, "epoch": 0.28136670196756036, "percentage": 28.14, "elapsed_time": "11:56:45", "remaining_time": "1 day, 6:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5049, "total_steps": 17941, "loss": 1.7371, "learning_rate": 8.316612910383104e-05, "epoch": 0.2814224402207235, "percentage": 28.14, "elapsed_time": "11:56:54", "remaining_time": "1 day, 6:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5050, "total_steps": 17941, "loss": 1.5045, "learning_rate": 8.315946523888523e-05, "epoch": 0.2814781784738866, "percentage": 28.15, "elapsed_time": "11:57:03", "remaining_time": "1 day, 6:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5051, "total_steps": 17941, "loss": 1.7094, "learning_rate": 8.31528003223145e-05, "epoch": 0.28153391672704975, "percentage": 28.15, "elapsed_time": "11:57:12", "remaining_time": "1 day, 6:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5052, "total_steps": 17941, "loss": 1.7824, "learning_rate": 8.314613435433025e-05, "epoch": 0.28158965498021293, "percentage": 28.16, "elapsed_time": "11:57:20", "remaining_time": "1 day, 6:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5053, "total_steps": 17941, "loss": 1.6823, "learning_rate": 8.313946733514388e-05, "epoch": 0.28164539323337606, "percentage": 28.16, "elapsed_time": "11:57:29", "remaining_time": "1 day, 6:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5054, "total_steps": 17941, "loss": 1.6891, "learning_rate": 8.313279926496682e-05, "epoch": 0.2817011314865392, "percentage": 28.17, "elapsed_time": "11:57:37", "remaining_time": "1 day, 6:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5055, "total_steps": 17941, "loss": 1.6879, "learning_rate": 8.312613014401053e-05, "epoch": 0.2817568697397024, "percentage": 28.18, "elapsed_time": "11:57:46", "remaining_time": "1 day, 6:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5056, "total_steps": 17941, "loss": 1.7741, "learning_rate": 8.311945997248656e-05, "epoch": 0.2818126079928655, "percentage": 28.18, "elapsed_time": "11:57:54", "remaining_time": "1 day, 6:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5057, "total_steps": 17941, "loss": 1.5888, "learning_rate": 8.31127887506064e-05, "epoch": 0.28186834624602863, "percentage": 28.19, "elapsed_time": "11:58:03", "remaining_time": "1 day, 6:29:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5058, "total_steps": 17941, "loss": 1.8173, "learning_rate": 8.310611647858164e-05, "epoch": 0.2819240844991918, "percentage": 28.19, "elapsed_time": "11:58:12", "remaining_time": "1 day, 6:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5059, "total_steps": 17941, "loss": 1.6492, "learning_rate": 8.30994431566239e-05, "epoch": 0.28197982275235495, "percentage": 28.2, "elapsed_time": "11:58:20", "remaining_time": "1 day, 6:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5060, "total_steps": 17941, "loss": 1.9265, "learning_rate": 8.309276878494481e-05, "epoch": 0.2820355610055181, "percentage": 28.2, "elapsed_time": "11:58:28", "remaining_time": "1 day, 6:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5061, "total_steps": 17941, "loss": 1.5966, "learning_rate": 8.308609336375601e-05, "epoch": 0.28209129925868126, "percentage": 28.21, "elapsed_time": "11:58:37", "remaining_time": "1 day, 6:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5062, "total_steps": 17941, "loss": 1.6598, "learning_rate": 8.307941689326926e-05, "epoch": 0.2821470375118444, "percentage": 28.21, "elapsed_time": "11:58:45", "remaining_time": "1 day, 6:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5063, "total_steps": 17941, "loss": 1.3741, "learning_rate": 8.307273937369627e-05, "epoch": 0.2822027757650075, "percentage": 28.22, "elapsed_time": "11:58:54", "remaining_time": "1 day, 6:28:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5064, "total_steps": 17941, "loss": 1.7855, "learning_rate": 8.30660608052488e-05, "epoch": 0.28225851401817065, "percentage": 28.23, "elapsed_time": "11:59:02", "remaining_time": "1 day, 6:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5065, "total_steps": 17941, "loss": 1.6285, "learning_rate": 8.305938118813868e-05, "epoch": 0.28231425227133383, "percentage": 28.23, "elapsed_time": "11:59:11", "remaining_time": "1 day, 6:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5066, "total_steps": 17941, "loss": 1.8315, "learning_rate": 8.305270052257773e-05, "epoch": 0.28236999052449696, "percentage": 28.24, "elapsed_time": "11:59:19", "remaining_time": "1 day, 6:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5067, "total_steps": 17941, "loss": 1.8598, "learning_rate": 8.304601880877784e-05, "epoch": 0.2824257287776601, "percentage": 28.24, "elapsed_time": "11:59:28", "remaining_time": "1 day, 6:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5068, "total_steps": 17941, "loss": 1.5472, "learning_rate": 8.30393360469509e-05, "epoch": 0.2824814670308233, "percentage": 28.25, "elapsed_time": "11:59:36", "remaining_time": "1 day, 6:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5069, "total_steps": 17941, "loss": 1.8186, "learning_rate": 8.303265223730885e-05, "epoch": 0.2825372052839864, "percentage": 28.25, "elapsed_time": "11:59:45", "remaining_time": "1 day, 6:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5070, "total_steps": 17941, "loss": 1.7101, "learning_rate": 8.302596738006367e-05, "epoch": 0.28259294353714953, "percentage": 28.26, "elapsed_time": "11:59:53", "remaining_time": "1 day, 6:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5071, "total_steps": 17941, "loss": 1.6207, "learning_rate": 8.301928147542736e-05, "epoch": 0.2826486817903127, "percentage": 28.26, "elapsed_time": "12:00:02", "remaining_time": "1 day, 6:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5072, "total_steps": 17941, "loss": 1.7829, "learning_rate": 8.301259452361197e-05, "epoch": 0.28270442004347585, "percentage": 28.27, "elapsed_time": "12:00:10", "remaining_time": "1 day, 6:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5073, "total_steps": 17941, "loss": 1.844, "learning_rate": 8.300590652482954e-05, "epoch": 0.282760158296639, "percentage": 28.28, "elapsed_time": "12:00:18", "remaining_time": "1 day, 6:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5074, "total_steps": 17941, "loss": 1.9242, "learning_rate": 8.29992174792922e-05, "epoch": 0.2828158965498021, "percentage": 28.28, "elapsed_time": "12:00:27", "remaining_time": "1 day, 6:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5075, "total_steps": 17941, "loss": 1.7337, "learning_rate": 8.299252738721206e-05, "epoch": 0.2828716348029653, "percentage": 28.29, "elapsed_time": "12:00:35", "remaining_time": "1 day, 6:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5076, "total_steps": 17941, "loss": 1.6531, "learning_rate": 8.298583624880135e-05, "epoch": 0.2829273730561284, "percentage": 28.29, "elapsed_time": "12:00:44", "remaining_time": "1 day, 6:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5077, "total_steps": 17941, "loss": 1.6198, "learning_rate": 8.29791440642722e-05, "epoch": 0.28298311130929155, "percentage": 28.3, "elapsed_time": "12:00:52", "remaining_time": "1 day, 6:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5078, "total_steps": 17941, "loss": 1.7574, "learning_rate": 8.297245083383689e-05, "epoch": 0.28303884956245473, "percentage": 28.3, "elapsed_time": "12:01:01", "remaining_time": "1 day, 6:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5079, "total_steps": 17941, "loss": 1.7325, "learning_rate": 8.296575655770768e-05, "epoch": 0.28309458781561786, "percentage": 28.31, "elapsed_time": "12:01:09", "remaining_time": "1 day, 6:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5080, "total_steps": 17941, "loss": 1.6964, "learning_rate": 8.295906123609688e-05, "epoch": 0.283150326068781, "percentage": 28.32, "elapsed_time": "12:01:18", "remaining_time": "1 day, 6:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5081, "total_steps": 17941, "loss": 1.6128, "learning_rate": 8.295236486921685e-05, "epoch": 0.2832060643219442, "percentage": 28.32, "elapsed_time": "12:01:26", "remaining_time": "1 day, 6:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5082, "total_steps": 17941, "loss": 1.8898, "learning_rate": 8.29456674572799e-05, "epoch": 0.2832618025751073, "percentage": 28.33, "elapsed_time": "12:01:35", "remaining_time": "1 day, 6:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5083, "total_steps": 17941, "loss": 1.513, "learning_rate": 8.293896900049846e-05, "epoch": 0.28331754082827043, "percentage": 28.33, "elapsed_time": "12:01:43", "remaining_time": "1 day, 6:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5084, "total_steps": 17941, "loss": 1.658, "learning_rate": 8.293226949908499e-05, "epoch": 0.2833732790814336, "percentage": 28.34, "elapsed_time": "12:01:52", "remaining_time": "1 day, 6:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5085, "total_steps": 17941, "loss": 1.6148, "learning_rate": 8.292556895325194e-05, "epoch": 0.28342901733459674, "percentage": 28.34, "elapsed_time": "12:02:00", "remaining_time": "1 day, 6:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5086, "total_steps": 17941, "loss": 1.7469, "learning_rate": 8.29188673632118e-05, "epoch": 0.2834847555877599, "percentage": 28.35, "elapsed_time": "12:02:09", "remaining_time": "1 day, 6:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5087, "total_steps": 17941, "loss": 1.6819, "learning_rate": 8.291216472917714e-05, "epoch": 0.283540493840923, "percentage": 28.35, "elapsed_time": "12:02:17", "remaining_time": "1 day, 6:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5088, "total_steps": 17941, "loss": 1.3384, "learning_rate": 8.290546105136048e-05, "epoch": 0.2835962320940862, "percentage": 28.36, "elapsed_time": "12:02:25", "remaining_time": "1 day, 6:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5089, "total_steps": 17941, "loss": 1.6534, "learning_rate": 8.289875632997446e-05, "epoch": 0.2836519703472493, "percentage": 28.37, "elapsed_time": "12:02:34", "remaining_time": "1 day, 6:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5090, "total_steps": 17941, "loss": 1.6963, "learning_rate": 8.289205056523168e-05, "epoch": 0.28370770860041244, "percentage": 28.37, "elapsed_time": "12:02:42", "remaining_time": "1 day, 6:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5091, "total_steps": 17941, "loss": 1.6027, "learning_rate": 8.288534375734486e-05, "epoch": 0.28376344685357563, "percentage": 28.38, "elapsed_time": "12:02:51", "remaining_time": "1 day, 6:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5092, "total_steps": 17941, "loss": 1.6362, "learning_rate": 8.287863590652666e-05, "epoch": 0.28381918510673876, "percentage": 28.38, "elapsed_time": "12:02:59", "remaining_time": "1 day, 6:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5093, "total_steps": 17941, "loss": 1.5781, "learning_rate": 8.287192701298982e-05, "epoch": 0.2838749233599019, "percentage": 28.39, "elapsed_time": "12:03:08", "remaining_time": "1 day, 6:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5094, "total_steps": 17941, "loss": 1.8077, "learning_rate": 8.286521707694712e-05, "epoch": 0.28393066161306507, "percentage": 28.39, "elapsed_time": "12:03:16", "remaining_time": "1 day, 6:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5095, "total_steps": 17941, "loss": 1.8407, "learning_rate": 8.285850609861134e-05, "epoch": 0.2839863998662282, "percentage": 28.4, "elapsed_time": "12:03:25", "remaining_time": "1 day, 6:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5096, "total_steps": 17941, "loss": 1.579, "learning_rate": 8.285179407819534e-05, "epoch": 0.28404213811939133, "percentage": 28.4, "elapsed_time": "12:03:33", "remaining_time": "1 day, 6:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5097, "total_steps": 17941, "loss": 1.3955, "learning_rate": 8.284508101591198e-05, "epoch": 0.28409787637255446, "percentage": 28.41, "elapsed_time": "12:03:42", "remaining_time": "1 day, 6:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5098, "total_steps": 17941, "loss": 1.8429, "learning_rate": 8.283836691197413e-05, "epoch": 0.28415361462571764, "percentage": 28.42, "elapsed_time": "12:03:50", "remaining_time": "1 day, 6:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5099, "total_steps": 17941, "loss": 1.8281, "learning_rate": 8.283165176659474e-05, "epoch": 0.28420935287888077, "percentage": 28.42, "elapsed_time": "12:03:59", "remaining_time": "1 day, 6:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5100, "total_steps": 17941, "loss": 1.764, "learning_rate": 8.282493557998678e-05, "epoch": 0.2842650911320439, "percentage": 28.43, "elapsed_time": "12:04:07", "remaining_time": "1 day, 6:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5101, "total_steps": 17941, "loss": 1.8694, "learning_rate": 8.281821835236325e-05, "epoch": 0.2843208293852071, "percentage": 28.43, "elapsed_time": "12:04:16", "remaining_time": "1 day, 6:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5102, "total_steps": 17941, "loss": 1.8829, "learning_rate": 8.281150008393718e-05, "epoch": 0.2843765676383702, "percentage": 28.44, "elapsed_time": "12:04:24", "remaining_time": "1 day, 6:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5103, "total_steps": 17941, "loss": 1.8996, "learning_rate": 8.280478077492163e-05, "epoch": 0.28443230589153334, "percentage": 28.44, "elapsed_time": "12:04:33", "remaining_time": "1 day, 6:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5104, "total_steps": 17941, "loss": 1.7342, "learning_rate": 8.27980604255297e-05, "epoch": 0.28448804414469653, "percentage": 28.45, "elapsed_time": "12:04:41", "remaining_time": "1 day, 6:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5105, "total_steps": 17941, "loss": 1.7496, "learning_rate": 8.279133903597451e-05, "epoch": 0.28454378239785966, "percentage": 28.45, "elapsed_time": "12:04:49", "remaining_time": "1 day, 6:22:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5106, "total_steps": 17941, "loss": 1.63, "learning_rate": 8.278461660646925e-05, "epoch": 0.2845995206510228, "percentage": 28.46, "elapsed_time": "12:04:58", "remaining_time": "1 day, 6:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5107, "total_steps": 17941, "loss": 1.6639, "learning_rate": 8.27778931372271e-05, "epoch": 0.28465525890418597, "percentage": 28.47, "elapsed_time": "12:05:06", "remaining_time": "1 day, 6:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5108, "total_steps": 17941, "loss": 1.9303, "learning_rate": 8.277116862846126e-05, "epoch": 0.2847109971573491, "percentage": 28.47, "elapsed_time": "12:05:15", "remaining_time": "1 day, 6:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5109, "total_steps": 17941, "loss": 1.7833, "learning_rate": 8.276444308038504e-05, "epoch": 0.28476673541051223, "percentage": 28.48, "elapsed_time": "12:05:23", "remaining_time": "1 day, 6:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5110, "total_steps": 17941, "loss": 1.9167, "learning_rate": 8.27577164932117e-05, "epoch": 0.28482247366367536, "percentage": 28.48, "elapsed_time": "12:05:32", "remaining_time": "1 day, 6:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5111, "total_steps": 17941, "loss": 1.7716, "learning_rate": 8.275098886715462e-05, "epoch": 0.28487821191683854, "percentage": 28.49, "elapsed_time": "12:05:41", "remaining_time": "1 day, 6:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5112, "total_steps": 17941, "loss": 1.9078, "learning_rate": 8.274426020242709e-05, "epoch": 0.28493395017000167, "percentage": 28.49, "elapsed_time": "12:05:49", "remaining_time": "1 day, 6:21:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5113, "total_steps": 17941, "loss": 1.7014, "learning_rate": 8.273753049924256e-05, "epoch": 0.2849896884231648, "percentage": 28.5, "elapsed_time": "12:05:58", "remaining_time": "1 day, 6:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5114, "total_steps": 17941, "loss": 1.6482, "learning_rate": 8.273079975781442e-05, "epoch": 0.285045426676328, "percentage": 28.5, "elapsed_time": "12:06:06", "remaining_time": "1 day, 6:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5115, "total_steps": 17941, "loss": 1.7304, "learning_rate": 8.272406797835614e-05, "epoch": 0.2851011649294911, "percentage": 28.51, "elapsed_time": "12:06:15", "remaining_time": "1 day, 6:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5116, "total_steps": 17941, "loss": 1.6698, "learning_rate": 8.271733516108125e-05, "epoch": 0.28515690318265424, "percentage": 28.52, "elapsed_time": "12:06:24", "remaining_time": "1 day, 6:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5117, "total_steps": 17941, "loss": 2.0553, "learning_rate": 8.27106013062032e-05, "epoch": 0.2852126414358174, "percentage": 28.52, "elapsed_time": "12:06:32", "remaining_time": "1 day, 6:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5118, "total_steps": 17941, "loss": 1.5031, "learning_rate": 8.270386641393564e-05, "epoch": 0.28526837968898056, "percentage": 28.53, "elapsed_time": "12:06:41", "remaining_time": "1 day, 6:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5119, "total_steps": 17941, "loss": 1.9087, "learning_rate": 8.269713048449208e-05, "epoch": 0.2853241179421437, "percentage": 28.53, "elapsed_time": "12:06:49", "remaining_time": "1 day, 6:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5120, "total_steps": 17941, "loss": 1.8125, "learning_rate": 8.26903935180862e-05, "epoch": 0.2853798561953068, "percentage": 28.54, "elapsed_time": "12:06:58", "remaining_time": "1 day, 6:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5121, "total_steps": 17941, "loss": 1.6459, "learning_rate": 8.268365551493161e-05, "epoch": 0.28543559444847, "percentage": 28.54, "elapsed_time": "12:07:06", "remaining_time": "1 day, 6:20:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5122, "total_steps": 17941, "loss": 1.6801, "learning_rate": 8.267691647524206e-05, "epoch": 0.2854913327016331, "percentage": 28.55, "elapsed_time": "12:07:14", "remaining_time": "1 day, 6:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5123, "total_steps": 17941, "loss": 1.4172, "learning_rate": 8.26701763992312e-05, "epoch": 0.28554707095479626, "percentage": 28.55, "elapsed_time": "12:07:23", "remaining_time": "1 day, 6:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5124, "total_steps": 17941, "loss": 1.6956, "learning_rate": 8.266343528711285e-05, "epoch": 0.28560280920795944, "percentage": 28.56, "elapsed_time": "12:07:31", "remaining_time": "1 day, 6:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5125, "total_steps": 17941, "loss": 1.5235, "learning_rate": 8.265669313910077e-05, "epoch": 0.28565854746112257, "percentage": 28.57, "elapsed_time": "12:07:40", "remaining_time": "1 day, 6:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5126, "total_steps": 17941, "loss": 1.9089, "learning_rate": 8.264994995540878e-05, "epoch": 0.2857142857142857, "percentage": 28.57, "elapsed_time": "12:07:48", "remaining_time": "1 day, 6:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5127, "total_steps": 17941, "loss": 1.6013, "learning_rate": 8.264320573625075e-05, "epoch": 0.2857700239674489, "percentage": 28.58, "elapsed_time": "12:07:57", "remaining_time": "1 day, 6:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5128, "total_steps": 17941, "loss": 1.6596, "learning_rate": 8.263646048184055e-05, "epoch": 0.285825762220612, "percentage": 28.58, "elapsed_time": "12:08:06", "remaining_time": "1 day, 6:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5129, "total_steps": 17941, "loss": 1.7786, "learning_rate": 8.26297141923921e-05, "epoch": 0.28588150047377514, "percentage": 28.59, "elapsed_time": "12:08:15", "remaining_time": "1 day, 6:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5130, "total_steps": 17941, "loss": 1.6151, "learning_rate": 8.262296686811936e-05, "epoch": 0.2859372387269383, "percentage": 28.59, "elapsed_time": "12:08:23", "remaining_time": "1 day, 6:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5131, "total_steps": 17941, "loss": 1.587, "learning_rate": 8.261621850923634e-05, "epoch": 0.28599297698010145, "percentage": 28.6, "elapsed_time": "12:08:32", "remaining_time": "1 day, 6:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5132, "total_steps": 17941, "loss": 1.6915, "learning_rate": 8.260946911595701e-05, "epoch": 0.2860487152332646, "percentage": 28.6, "elapsed_time": "12:08:40", "remaining_time": "1 day, 6:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5133, "total_steps": 17941, "loss": 1.9188, "learning_rate": 8.260271868849547e-05, "epoch": 0.2861044534864277, "percentage": 28.61, "elapsed_time": "12:08:49", "remaining_time": "1 day, 6:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5134, "total_steps": 17941, "loss": 1.7657, "learning_rate": 8.259596722706575e-05, "epoch": 0.2861601917395909, "percentage": 28.62, "elapsed_time": "12:08:57", "remaining_time": "1 day, 6:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5135, "total_steps": 17941, "loss": 1.3247, "learning_rate": 8.258921473188202e-05, "epoch": 0.286215929992754, "percentage": 28.62, "elapsed_time": "12:09:06", "remaining_time": "1 day, 6:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5136, "total_steps": 17941, "loss": 1.6025, "learning_rate": 8.25824612031584e-05, "epoch": 0.28627166824591715, "percentage": 28.63, "elapsed_time": "12:09:14", "remaining_time": "1 day, 6:18:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5137, "total_steps": 17941, "loss": 1.7264, "learning_rate": 8.257570664110907e-05, "epoch": 0.28632740649908034, "percentage": 28.63, "elapsed_time": "12:09:23", "remaining_time": "1 day, 6:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5138, "total_steps": 17941, "loss": 1.802, "learning_rate": 8.256895104594828e-05, "epoch": 0.28638314475224347, "percentage": 28.64, "elapsed_time": "12:09:32", "remaining_time": "1 day, 6:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5139, "total_steps": 17941, "loss": 1.9493, "learning_rate": 8.256219441789022e-05, "epoch": 0.2864388830054066, "percentage": 28.64, "elapsed_time": "12:09:40", "remaining_time": "1 day, 6:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5140, "total_steps": 17941, "loss": 1.5655, "learning_rate": 8.255543675714923e-05, "epoch": 0.2864946212585698, "percentage": 28.65, "elapsed_time": "12:09:48", "remaining_time": "1 day, 6:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5141, "total_steps": 17941, "loss": 1.5492, "learning_rate": 8.254867806393957e-05, "epoch": 0.2865503595117329, "percentage": 28.66, "elapsed_time": "12:09:57", "remaining_time": "1 day, 6:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5142, "total_steps": 17941, "loss": 1.7343, "learning_rate": 8.254191833847564e-05, "epoch": 0.28660609776489604, "percentage": 28.66, "elapsed_time": "12:10:06", "remaining_time": "1 day, 6:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5143, "total_steps": 17941, "loss": 1.6551, "learning_rate": 8.253515758097179e-05, "epoch": 0.28666183601805917, "percentage": 28.67, "elapsed_time": "12:10:15", "remaining_time": "1 day, 6:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5144, "total_steps": 17941, "loss": 1.8227, "learning_rate": 8.252839579164243e-05, "epoch": 0.28671757427122235, "percentage": 28.67, "elapsed_time": "12:10:23", "remaining_time": "1 day, 6:17:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5145, "total_steps": 17941, "loss": 1.9731, "learning_rate": 8.252163297070201e-05, "epoch": 0.2867733125243855, "percentage": 28.68, "elapsed_time": "12:10:31", "remaining_time": "1 day, 6:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5146, "total_steps": 17941, "loss": 1.5992, "learning_rate": 8.251486911836501e-05, "epoch": 0.2868290507775486, "percentage": 28.68, "elapsed_time": "12:10:40", "remaining_time": "1 day, 6:16:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5147, "total_steps": 17941, "loss": 1.5641, "learning_rate": 8.250810423484592e-05, "epoch": 0.2868847890307118, "percentage": 28.69, "elapsed_time": "12:10:48", "remaining_time": "1 day, 6:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5148, "total_steps": 17941, "loss": 1.759, "learning_rate": 8.25013383203593e-05, "epoch": 0.2869405272838749, "percentage": 28.69, "elapsed_time": "12:10:57", "remaining_time": "1 day, 6:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5149, "total_steps": 17941, "loss": 1.7229, "learning_rate": 8.249457137511976e-05, "epoch": 0.28699626553703805, "percentage": 28.7, "elapsed_time": "12:11:05", "remaining_time": "1 day, 6:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5150, "total_steps": 17941, "loss": 1.6758, "learning_rate": 8.248780339934183e-05, "epoch": 0.28705200379020124, "percentage": 28.71, "elapsed_time": "12:11:14", "remaining_time": "1 day, 6:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5151, "total_steps": 17941, "loss": 1.7173, "learning_rate": 8.248103439324022e-05, "epoch": 0.28710774204336437, "percentage": 28.71, "elapsed_time": "12:11:22", "remaining_time": "1 day, 6:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5152, "total_steps": 17941, "loss": 1.8327, "learning_rate": 8.247426435702956e-05, "epoch": 0.2871634802965275, "percentage": 28.72, "elapsed_time": "12:11:31", "remaining_time": "1 day, 6:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5153, "total_steps": 17941, "loss": 1.6373, "learning_rate": 8.246749329092458e-05, "epoch": 0.2872192185496907, "percentage": 28.72, "elapsed_time": "12:11:39", "remaining_time": "1 day, 6:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5154, "total_steps": 17941, "loss": 2.0384, "learning_rate": 8.246072119514e-05, "epoch": 0.2872749568028538, "percentage": 28.73, "elapsed_time": "12:11:47", "remaining_time": "1 day, 6:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5155, "total_steps": 17941, "loss": 1.9093, "learning_rate": 8.245394806989062e-05, "epoch": 0.28733069505601694, "percentage": 28.73, "elapsed_time": "12:11:56", "remaining_time": "1 day, 6:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5156, "total_steps": 17941, "loss": 1.6794, "learning_rate": 8.244717391539124e-05, "epoch": 0.28738643330918007, "percentage": 28.74, "elapsed_time": "12:12:04", "remaining_time": "1 day, 6:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5157, "total_steps": 17941, "loss": 1.6624, "learning_rate": 8.244039873185664e-05, "epoch": 0.28744217156234325, "percentage": 28.74, "elapsed_time": "12:12:13", "remaining_time": "1 day, 6:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5158, "total_steps": 17941, "loss": 1.7119, "learning_rate": 8.243362251950177e-05, "epoch": 0.2874979098155064, "percentage": 28.75, "elapsed_time": "12:12:21", "remaining_time": "1 day, 6:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5159, "total_steps": 17941, "loss": 1.7379, "learning_rate": 8.242684527854148e-05, "epoch": 0.2875536480686695, "percentage": 28.76, "elapsed_time": "12:12:30", "remaining_time": "1 day, 6:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5160, "total_steps": 17941, "loss": 1.648, "learning_rate": 8.242006700919072e-05, "epoch": 0.2876093863218327, "percentage": 28.76, "elapsed_time": "12:12:38", "remaining_time": "1 day, 6:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5161, "total_steps": 17941, "loss": 1.8969, "learning_rate": 8.241328771166446e-05, "epoch": 0.2876651245749958, "percentage": 28.77, "elapsed_time": "12:12:47", "remaining_time": "1 day, 6:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5162, "total_steps": 17941, "loss": 1.7941, "learning_rate": 8.24065073861777e-05, "epoch": 0.28772086282815895, "percentage": 28.77, "elapsed_time": "12:12:55", "remaining_time": "1 day, 6:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5163, "total_steps": 17941, "loss": 1.7996, "learning_rate": 8.239972603294546e-05, "epoch": 0.28777660108132214, "percentage": 28.78, "elapsed_time": "12:13:04", "remaining_time": "1 day, 6:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5164, "total_steps": 17941, "loss": 1.486, "learning_rate": 8.239294365218282e-05, "epoch": 0.28783233933448527, "percentage": 28.78, "elapsed_time": "12:13:12", "remaining_time": "1 day, 6:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5165, "total_steps": 17941, "loss": 1.8011, "learning_rate": 8.238616024410486e-05, "epoch": 0.2878880775876484, "percentage": 28.79, "elapsed_time": "12:13:20", "remaining_time": "1 day, 6:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5166, "total_steps": 17941, "loss": 1.7308, "learning_rate": 8.237937580892674e-05, "epoch": 0.2879438158408115, "percentage": 28.79, "elapsed_time": "12:13:29", "remaining_time": "1 day, 6:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5167, "total_steps": 17941, "loss": 1.7732, "learning_rate": 8.237259034686359e-05, "epoch": 0.2879995540939747, "percentage": 28.8, "elapsed_time": "12:13:38", "remaining_time": "1 day, 6:13:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5168, "total_steps": 17941, "loss": 1.6932, "learning_rate": 8.236580385813062e-05, "epoch": 0.28805529234713784, "percentage": 28.81, "elapsed_time": "12:13:46", "remaining_time": "1 day, 6:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5169, "total_steps": 17941, "loss": 1.8033, "learning_rate": 8.235901634294306e-05, "epoch": 0.28811103060030097, "percentage": 28.81, "elapsed_time": "12:13:54", "remaining_time": "1 day, 6:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5170, "total_steps": 17941, "loss": 1.5637, "learning_rate": 8.235222780151616e-05, "epoch": 0.28816676885346415, "percentage": 28.82, "elapsed_time": "12:14:03", "remaining_time": "1 day, 6:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5171, "total_steps": 17941, "loss": 1.5763, "learning_rate": 8.234543823406525e-05, "epoch": 0.2882225071066273, "percentage": 28.82, "elapsed_time": "12:14:11", "remaining_time": "1 day, 6:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5172, "total_steps": 17941, "loss": 1.7251, "learning_rate": 8.23386476408056e-05, "epoch": 0.2882782453597904, "percentage": 28.83, "elapsed_time": "12:14:20", "remaining_time": "1 day, 6:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5173, "total_steps": 17941, "loss": 1.7168, "learning_rate": 8.233185602195259e-05, "epoch": 0.2883339836129536, "percentage": 28.83, "elapsed_time": "12:14:28", "remaining_time": "1 day, 6:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5174, "total_steps": 17941, "loss": 1.7282, "learning_rate": 8.232506337772163e-05, "epoch": 0.2883897218661167, "percentage": 28.84, "elapsed_time": "12:14:37", "remaining_time": "1 day, 6:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5175, "total_steps": 17941, "loss": 2.0267, "learning_rate": 8.231826970832812e-05, "epoch": 0.28844546011927985, "percentage": 28.84, "elapsed_time": "12:14:45", "remaining_time": "1 day, 6:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5176, "total_steps": 17941, "loss": 1.4387, "learning_rate": 8.231147501398753e-05, "epoch": 0.28850119837244304, "percentage": 28.85, "elapsed_time": "12:14:54", "remaining_time": "1 day, 6:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5177, "total_steps": 17941, "loss": 1.7042, "learning_rate": 8.230467929491534e-05, "epoch": 0.28855693662560616, "percentage": 28.86, "elapsed_time": "12:15:02", "remaining_time": "1 day, 6:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5178, "total_steps": 17941, "loss": 1.6752, "learning_rate": 8.229788255132706e-05, "epoch": 0.2886126748787693, "percentage": 28.86, "elapsed_time": "12:15:11", "remaining_time": "1 day, 6:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5179, "total_steps": 17941, "loss": 1.5905, "learning_rate": 8.229108478343827e-05, "epoch": 0.2886684131319324, "percentage": 28.87, "elapsed_time": "12:15:19", "remaining_time": "1 day, 6:11:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5180, "total_steps": 17941, "loss": 1.6857, "learning_rate": 8.228428599146453e-05, "epoch": 0.2887241513850956, "percentage": 28.87, "elapsed_time": "12:15:27", "remaining_time": "1 day, 6:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5181, "total_steps": 17941, "loss": 1.6489, "learning_rate": 8.227748617562147e-05, "epoch": 0.28877988963825874, "percentage": 28.88, "elapsed_time": "12:15:36", "remaining_time": "1 day, 6:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5182, "total_steps": 17941, "loss": 1.8709, "learning_rate": 8.227068533612475e-05, "epoch": 0.28883562789142186, "percentage": 28.88, "elapsed_time": "12:15:44", "remaining_time": "1 day, 6:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5183, "total_steps": 17941, "loss": 1.7088, "learning_rate": 8.226388347319004e-05, "epoch": 0.28889136614458505, "percentage": 28.89, "elapsed_time": "12:15:53", "remaining_time": "1 day, 6:11:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5184, "total_steps": 17941, "loss": 1.59, "learning_rate": 8.225708058703305e-05, "epoch": 0.2889471043977482, "percentage": 28.89, "elapsed_time": "12:16:01", "remaining_time": "1 day, 6:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5185, "total_steps": 17941, "loss": 1.4301, "learning_rate": 8.225027667786955e-05, "epoch": 0.2890028426509113, "percentage": 28.9, "elapsed_time": "12:16:10", "remaining_time": "1 day, 6:11:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5186, "total_steps": 17941, "loss": 1.533, "learning_rate": 8.224347174591529e-05, "epoch": 0.2890585809040745, "percentage": 28.91, "elapsed_time": "12:16:18", "remaining_time": "1 day, 6:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5187, "total_steps": 17941, "loss": 1.7171, "learning_rate": 8.22366657913861e-05, "epoch": 0.2891143191572376, "percentage": 28.91, "elapsed_time": "12:16:27", "remaining_time": "1 day, 6:10:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5188, "total_steps": 17941, "loss": 1.7751, "learning_rate": 8.222985881449783e-05, "epoch": 0.28917005741040075, "percentage": 28.92, "elapsed_time": "12:16:35", "remaining_time": "1 day, 6:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5189, "total_steps": 17941, "loss": 1.6905, "learning_rate": 8.222305081546635e-05, "epoch": 0.2892257956635639, "percentage": 28.92, "elapsed_time": "12:16:44", "remaining_time": "1 day, 6:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5190, "total_steps": 17941, "loss": 1.6461, "learning_rate": 8.221624179450757e-05, "epoch": 0.28928153391672706, "percentage": 28.93, "elapsed_time": "12:16:52", "remaining_time": "1 day, 6:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5191, "total_steps": 17941, "loss": 2.0131, "learning_rate": 8.220943175183743e-05, "epoch": 0.2893372721698902, "percentage": 28.93, "elapsed_time": "12:17:01", "remaining_time": "1 day, 6:10:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5192, "total_steps": 17941, "loss": 1.977, "learning_rate": 8.220262068767191e-05, "epoch": 0.2893930104230533, "percentage": 28.94, "elapsed_time": "12:17:09", "remaining_time": "1 day, 6:10:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5193, "total_steps": 17941, "loss": 1.6866, "learning_rate": 8.219580860222701e-05, "epoch": 0.2894487486762165, "percentage": 28.94, "elapsed_time": "12:17:18", "remaining_time": "1 day, 6:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5194, "total_steps": 17941, "loss": 1.6639, "learning_rate": 8.218899549571878e-05, "epoch": 0.28950448692937963, "percentage": 28.95, "elapsed_time": "12:17:26", "remaining_time": "1 day, 6:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5195, "total_steps": 17941, "loss": 1.435, "learning_rate": 8.218218136836331e-05, "epoch": 0.28956022518254276, "percentage": 28.96, "elapsed_time": "12:17:34", "remaining_time": "1 day, 6:09:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5196, "total_steps": 17941, "loss": 1.6317, "learning_rate": 8.217536622037667e-05, "epoch": 0.28961596343570595, "percentage": 28.96, "elapsed_time": "12:17:43", "remaining_time": "1 day, 6:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5197, "total_steps": 17941, "loss": 1.7473, "learning_rate": 8.2168550051975e-05, "epoch": 0.2896717016888691, "percentage": 28.97, "elapsed_time": "12:17:51", "remaining_time": "1 day, 6:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5198, "total_steps": 17941, "loss": 1.8094, "learning_rate": 8.216173286337448e-05, "epoch": 0.2897274399420322, "percentage": 28.97, "elapsed_time": "12:18:00", "remaining_time": "1 day, 6:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5199, "total_steps": 17941, "loss": 1.5757, "learning_rate": 8.215491465479133e-05, "epoch": 0.2897831781951954, "percentage": 28.98, "elapsed_time": "12:18:08", "remaining_time": "1 day, 6:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5200, "total_steps": 17941, "loss": 1.9404, "learning_rate": 8.214809542644173e-05, "epoch": 0.2898389164483585, "percentage": 28.98, "elapsed_time": "12:18:17", "remaining_time": "1 day, 6:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5201, "total_steps": 17941, "loss": 1.8751, "learning_rate": 8.214127517854199e-05, "epoch": 0.28989465470152165, "percentage": 28.99, "elapsed_time": "12:18:26", "remaining_time": "1 day, 6:08:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5202, "total_steps": 17941, "loss": 1.8278, "learning_rate": 8.213445391130841e-05, "epoch": 0.2899503929546848, "percentage": 29.0, "elapsed_time": "12:18:34", "remaining_time": "1 day, 6:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5203, "total_steps": 17941, "loss": 1.683, "learning_rate": 8.212763162495729e-05, "epoch": 0.29000613120784796, "percentage": 29.0, "elapsed_time": "12:18:43", "remaining_time": "1 day, 6:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5204, "total_steps": 17941, "loss": 1.6758, "learning_rate": 8.212080831970503e-05, "epoch": 0.2900618694610111, "percentage": 29.01, "elapsed_time": "12:18:52", "remaining_time": "1 day, 6:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5205, "total_steps": 17941, "loss": 1.7229, "learning_rate": 8.2113983995768e-05, "epoch": 0.2901176077141742, "percentage": 29.01, "elapsed_time": "12:19:01", "remaining_time": "1 day, 6:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5206, "total_steps": 17941, "loss": 1.8076, "learning_rate": 8.210715865336263e-05, "epoch": 0.2901733459673374, "percentage": 29.02, "elapsed_time": "12:19:09", "remaining_time": "1 day, 6:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5207, "total_steps": 17941, "loss": 1.672, "learning_rate": 8.21003322927054e-05, "epoch": 0.29022908422050053, "percentage": 29.02, "elapsed_time": "12:19:18", "remaining_time": "1 day, 6:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5208, "total_steps": 17941, "loss": 1.6009, "learning_rate": 8.209350491401277e-05, "epoch": 0.29028482247366366, "percentage": 29.03, "elapsed_time": "12:19:26", "remaining_time": "1 day, 6:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5209, "total_steps": 17941, "loss": 1.8675, "learning_rate": 8.20866765175013e-05, "epoch": 0.29034056072682685, "percentage": 29.03, "elapsed_time": "12:19:34", "remaining_time": "1 day, 6:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5210, "total_steps": 17941, "loss": 1.7122, "learning_rate": 8.207984710338752e-05, "epoch": 0.29039629897999, "percentage": 29.04, "elapsed_time": "12:19:43", "remaining_time": "1 day, 6:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5211, "total_steps": 17941, "loss": 1.5629, "learning_rate": 8.207301667188803e-05, "epoch": 0.2904520372331531, "percentage": 29.05, "elapsed_time": "12:19:51", "remaining_time": "1 day, 6:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5212, "total_steps": 17941, "loss": 1.6373, "learning_rate": 8.206618522321945e-05, "epoch": 0.29050777548631623, "percentage": 29.05, "elapsed_time": "12:20:00", "remaining_time": "1 day, 6:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5213, "total_steps": 17941, "loss": 1.7587, "learning_rate": 8.205935275759842e-05, "epoch": 0.2905635137394794, "percentage": 29.06, "elapsed_time": "12:20:08", "remaining_time": "1 day, 6:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5214, "total_steps": 17941, "loss": 1.6596, "learning_rate": 8.205251927524164e-05, "epoch": 0.29061925199264255, "percentage": 29.06, "elapsed_time": "12:20:17", "remaining_time": "1 day, 6:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5215, "total_steps": 17941, "loss": 1.7195, "learning_rate": 8.204568477636585e-05, "epoch": 0.2906749902458057, "percentage": 29.07, "elapsed_time": "12:20:26", "remaining_time": "1 day, 6:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5216, "total_steps": 17941, "loss": 1.6929, "learning_rate": 8.203884926118777e-05, "epoch": 0.29073072849896886, "percentage": 29.07, "elapsed_time": "12:20:34", "remaining_time": "1 day, 6:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5217, "total_steps": 17941, "loss": 1.4884, "learning_rate": 8.203201272992419e-05, "epoch": 0.290786466752132, "percentage": 29.08, "elapsed_time": "12:20:43", "remaining_time": "1 day, 6:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5218, "total_steps": 17941, "loss": 1.6383, "learning_rate": 8.202517518279193e-05, "epoch": 0.2908422050052951, "percentage": 29.08, "elapsed_time": "12:20:51", "remaining_time": "1 day, 6:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5219, "total_steps": 17941, "loss": 1.3916, "learning_rate": 8.201833662000781e-05, "epoch": 0.2908979432584583, "percentage": 29.09, "elapsed_time": "12:21:00", "remaining_time": "1 day, 6:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5220, "total_steps": 17941, "loss": 1.8316, "learning_rate": 8.201149704178875e-05, "epoch": 0.29095368151162143, "percentage": 29.1, "elapsed_time": "12:21:08", "remaining_time": "1 day, 6:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5221, "total_steps": 17941, "loss": 1.479, "learning_rate": 8.200465644835165e-05, "epoch": 0.29100941976478456, "percentage": 29.1, "elapsed_time": "12:21:17", "remaining_time": "1 day, 6:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5222, "total_steps": 17941, "loss": 1.8735, "learning_rate": 8.199781483991345e-05, "epoch": 0.29106515801794774, "percentage": 29.11, "elapsed_time": "12:21:25", "remaining_time": "1 day, 6:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5223, "total_steps": 17941, "loss": 1.8911, "learning_rate": 8.19909722166911e-05, "epoch": 0.2911208962711109, "percentage": 29.11, "elapsed_time": "12:21:34", "remaining_time": "1 day, 6:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5224, "total_steps": 17941, "loss": 1.5865, "learning_rate": 8.198412857890166e-05, "epoch": 0.291176634524274, "percentage": 29.12, "elapsed_time": "12:21:42", "remaining_time": "1 day, 6:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5225, "total_steps": 17941, "loss": 1.518, "learning_rate": 8.197728392676211e-05, "epoch": 0.29123237277743713, "percentage": 29.12, "elapsed_time": "12:21:51", "remaining_time": "1 day, 6:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5226, "total_steps": 17941, "loss": 1.4729, "learning_rate": 8.197043826048957e-05, "epoch": 0.2912881110306003, "percentage": 29.13, "elapsed_time": "12:21:59", "remaining_time": "1 day, 6:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5227, "total_steps": 17941, "loss": 1.7724, "learning_rate": 8.196359158030113e-05, "epoch": 0.29134384928376345, "percentage": 29.13, "elapsed_time": "12:22:08", "remaining_time": "1 day, 6:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5228, "total_steps": 17941, "loss": 1.7379, "learning_rate": 8.195674388641393e-05, "epoch": 0.2913995875369266, "percentage": 29.14, "elapsed_time": "12:22:16", "remaining_time": "1 day, 6:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5229, "total_steps": 17941, "loss": 1.694, "learning_rate": 8.194989517904513e-05, "epoch": 0.29145532579008976, "percentage": 29.15, "elapsed_time": "12:22:25", "remaining_time": "1 day, 6:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5230, "total_steps": 17941, "loss": 1.7607, "learning_rate": 8.194304545841193e-05, "epoch": 0.2915110640432529, "percentage": 29.15, "elapsed_time": "12:22:33", "remaining_time": "1 day, 6:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5231, "total_steps": 17941, "loss": 1.7321, "learning_rate": 8.19361947247316e-05, "epoch": 0.291566802296416, "percentage": 29.16, "elapsed_time": "12:22:42", "remaining_time": "1 day, 6:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5232, "total_steps": 17941, "loss": 1.7183, "learning_rate": 8.192934297822133e-05, "epoch": 0.2916225405495792, "percentage": 29.16, "elapsed_time": "12:22:50", "remaining_time": "1 day, 6:04:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5233, "total_steps": 17941, "loss": 1.9229, "learning_rate": 8.192249021909847e-05, "epoch": 0.29167827880274233, "percentage": 29.17, "elapsed_time": "12:22:59", "remaining_time": "1 day, 6:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5234, "total_steps": 17941, "loss": 1.8151, "learning_rate": 8.191563644758037e-05, "epoch": 0.29173401705590546, "percentage": 29.17, "elapsed_time": "12:23:07", "remaining_time": "1 day, 6:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5235, "total_steps": 17941, "loss": 1.6619, "learning_rate": 8.190878166388435e-05, "epoch": 0.2917897553090686, "percentage": 29.18, "elapsed_time": "12:23:16", "remaining_time": "1 day, 6:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5236, "total_steps": 17941, "loss": 1.8347, "learning_rate": 8.19019258682278e-05, "epoch": 0.2918454935622318, "percentage": 29.18, "elapsed_time": "12:23:25", "remaining_time": "1 day, 6:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5237, "total_steps": 17941, "loss": 1.7583, "learning_rate": 8.189506906082818e-05, "epoch": 0.2919012318153949, "percentage": 29.19, "elapsed_time": "12:23:33", "remaining_time": "1 day, 6:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5238, "total_steps": 17941, "loss": 1.4644, "learning_rate": 8.188821124190293e-05, "epoch": 0.29195697006855803, "percentage": 29.2, "elapsed_time": "12:23:42", "remaining_time": "1 day, 6:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5239, "total_steps": 17941, "loss": 1.6562, "learning_rate": 8.188135241166953e-05, "epoch": 0.2920127083217212, "percentage": 29.2, "elapsed_time": "12:23:50", "remaining_time": "1 day, 6:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5240, "total_steps": 17941, "loss": 1.6493, "learning_rate": 8.187449257034552e-05, "epoch": 0.29206844657488434, "percentage": 29.21, "elapsed_time": "12:23:59", "remaining_time": "1 day, 6:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5241, "total_steps": 17941, "loss": 1.5672, "learning_rate": 8.186763171814845e-05, "epoch": 0.2921241848280475, "percentage": 29.21, "elapsed_time": "12:24:07", "remaining_time": "1 day, 6:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5242, "total_steps": 17941, "loss": 1.6091, "learning_rate": 8.186076985529589e-05, "epoch": 0.29217992308121066, "percentage": 29.22, "elapsed_time": "12:24:16", "remaining_time": "1 day, 6:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5243, "total_steps": 17941, "loss": 1.8457, "learning_rate": 8.18539069820055e-05, "epoch": 0.2922356613343738, "percentage": 29.22, "elapsed_time": "12:24:24", "remaining_time": "1 day, 6:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5244, "total_steps": 17941, "loss": 1.5562, "learning_rate": 8.184704309849487e-05, "epoch": 0.2922913995875369, "percentage": 29.23, "elapsed_time": "12:24:33", "remaining_time": "1 day, 6:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5245, "total_steps": 17941, "loss": 1.8421, "learning_rate": 8.184017820498173e-05, "epoch": 0.2923471378407001, "percentage": 29.23, "elapsed_time": "12:24:41", "remaining_time": "1 day, 6:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5246, "total_steps": 17941, "loss": 1.7761, "learning_rate": 8.183331230168377e-05, "epoch": 0.29240287609386323, "percentage": 29.24, "elapsed_time": "12:24:50", "remaining_time": "1 day, 6:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5247, "total_steps": 17941, "loss": 1.6677, "learning_rate": 8.182644538881873e-05, "epoch": 0.29245861434702636, "percentage": 29.25, "elapsed_time": "12:24:58", "remaining_time": "1 day, 6:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5248, "total_steps": 17941, "loss": 2.0468, "learning_rate": 8.181957746660445e-05, "epoch": 0.2925143526001895, "percentage": 29.25, "elapsed_time": "12:25:07", "remaining_time": "1 day, 6:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5249, "total_steps": 17941, "loss": 1.5903, "learning_rate": 8.181270853525866e-05, "epoch": 0.29257009085335267, "percentage": 29.26, "elapsed_time": "12:25:15", "remaining_time": "1 day, 6:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5250, "total_steps": 17941, "loss": 1.6818, "learning_rate": 8.180583859499923e-05, "epoch": 0.2926258291065158, "percentage": 29.26, "elapsed_time": "12:25:23", "remaining_time": "1 day, 6:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5251, "total_steps": 17941, "loss": 1.7915, "learning_rate": 8.179896764604407e-05, "epoch": 0.29268156735967893, "percentage": 29.27, "elapsed_time": "12:25:32", "remaining_time": "1 day, 6:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5252, "total_steps": 17941, "loss": 1.4523, "learning_rate": 8.179209568861104e-05, "epoch": 0.2927373056128421, "percentage": 29.27, "elapsed_time": "12:25:40", "remaining_time": "1 day, 6:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5253, "total_steps": 17941, "loss": 1.5611, "learning_rate": 8.178522272291809e-05, "epoch": 0.29279304386600524, "percentage": 29.28, "elapsed_time": "12:25:49", "remaining_time": "1 day, 6:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5254, "total_steps": 17941, "loss": 1.7228, "learning_rate": 8.17783487491832e-05, "epoch": 0.29284878211916837, "percentage": 29.28, "elapsed_time": "12:25:57", "remaining_time": "1 day, 6:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5255, "total_steps": 17941, "loss": 1.8324, "learning_rate": 8.177147376762437e-05, "epoch": 0.29290452037233156, "percentage": 29.29, "elapsed_time": "12:26:06", "remaining_time": "1 day, 6:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5256, "total_steps": 17941, "loss": 1.6782, "learning_rate": 8.176459777845964e-05, "epoch": 0.2929602586254947, "percentage": 29.3, "elapsed_time": "12:26:14", "remaining_time": "1 day, 6:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5257, "total_steps": 17941, "loss": 1.4567, "learning_rate": 8.175772078190707e-05, "epoch": 0.2930159968786578, "percentage": 29.3, "elapsed_time": "12:26:23", "remaining_time": "1 day, 6:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5258, "total_steps": 17941, "loss": 1.6129, "learning_rate": 8.175084277818472e-05, "epoch": 0.29307173513182094, "percentage": 29.31, "elapsed_time": "12:26:31", "remaining_time": "1 day, 6:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5259, "total_steps": 17941, "loss": 1.5253, "learning_rate": 8.174396376751079e-05, "epoch": 0.2931274733849841, "percentage": 29.31, "elapsed_time": "12:26:39", "remaining_time": "1 day, 6:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5260, "total_steps": 17941, "loss": 1.574, "learning_rate": 8.173708375010342e-05, "epoch": 0.29318321163814726, "percentage": 29.32, "elapsed_time": "12:26:48", "remaining_time": "1 day, 6:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5261, "total_steps": 17941, "loss": 1.8022, "learning_rate": 8.173020272618078e-05, "epoch": 0.2932389498913104, "percentage": 29.32, "elapsed_time": "12:26:57", "remaining_time": "1 day, 6:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5262, "total_steps": 17941, "loss": 1.952, "learning_rate": 8.172332069596111e-05, "epoch": 0.29329468814447357, "percentage": 29.33, "elapsed_time": "12:27:05", "remaining_time": "1 day, 6:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5263, "total_steps": 17941, "loss": 1.6838, "learning_rate": 8.171643765966266e-05, "epoch": 0.2933504263976367, "percentage": 29.34, "elapsed_time": "12:27:14", "remaining_time": "1 day, 6:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5264, "total_steps": 17941, "loss": 1.8205, "learning_rate": 8.170955361750373e-05, "epoch": 0.29340616465079983, "percentage": 29.34, "elapsed_time": "12:27:23", "remaining_time": "1 day, 5:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5265, "total_steps": 17941, "loss": 1.6995, "learning_rate": 8.170266856970264e-05, "epoch": 0.293461902903963, "percentage": 29.35, "elapsed_time": "12:27:32", "remaining_time": "1 day, 5:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5266, "total_steps": 17941, "loss": 1.8193, "learning_rate": 8.169578251647775e-05, "epoch": 0.29351764115712614, "percentage": 29.35, "elapsed_time": "12:27:40", "remaining_time": "1 day, 5:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5267, "total_steps": 17941, "loss": 1.6137, "learning_rate": 8.168889545804743e-05, "epoch": 0.29357337941028927, "percentage": 29.36, "elapsed_time": "12:27:49", "remaining_time": "1 day, 5:59:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5268, "total_steps": 17941, "loss": 1.3883, "learning_rate": 8.16820073946301e-05, "epoch": 0.29362911766345245, "percentage": 29.36, "elapsed_time": "12:27:58", "remaining_time": "1 day, 5:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5269, "total_steps": 17941, "loss": 1.7465, "learning_rate": 8.167511832644423e-05, "epoch": 0.2936848559166156, "percentage": 29.37, "elapsed_time": "12:28:06", "remaining_time": "1 day, 5:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5270, "total_steps": 17941, "loss": 1.8121, "learning_rate": 8.166822825370828e-05, "epoch": 0.2937405941697787, "percentage": 29.37, "elapsed_time": "12:28:15", "remaining_time": "1 day, 5:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5271, "total_steps": 17941, "loss": 1.8007, "learning_rate": 8.166133717664075e-05, "epoch": 0.29379633242294184, "percentage": 29.38, "elapsed_time": "12:28:23", "remaining_time": "1 day, 5:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5272, "total_steps": 17941, "loss": 1.7627, "learning_rate": 8.165444509546023e-05, "epoch": 0.293852070676105, "percentage": 29.39, "elapsed_time": "12:28:32", "remaining_time": "1 day, 5:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5273, "total_steps": 17941, "loss": 1.8668, "learning_rate": 8.164755201038525e-05, "epoch": 0.29390780892926816, "percentage": 29.39, "elapsed_time": "12:28:40", "remaining_time": "1 day, 5:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5274, "total_steps": 17941, "loss": 1.6992, "learning_rate": 8.164065792163445e-05, "epoch": 0.2939635471824313, "percentage": 29.4, "elapsed_time": "12:28:49", "remaining_time": "1 day, 5:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5275, "total_steps": 17941, "loss": 1.6882, "learning_rate": 8.163376282942645e-05, "epoch": 0.29401928543559447, "percentage": 29.4, "elapsed_time": "12:28:57", "remaining_time": "1 day, 5:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5276, "total_steps": 17941, "loss": 1.6314, "learning_rate": 8.162686673397995e-05, "epoch": 0.2940750236887576, "percentage": 29.41, "elapsed_time": "12:29:06", "remaining_time": "1 day, 5:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5277, "total_steps": 17941, "loss": 1.8543, "learning_rate": 8.161996963551361e-05, "epoch": 0.2941307619419207, "percentage": 29.41, "elapsed_time": "12:29:15", "remaining_time": "1 day, 5:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5278, "total_steps": 17941, "loss": 1.407, "learning_rate": 8.16130715342462e-05, "epoch": 0.2941865001950839, "percentage": 29.42, "elapsed_time": "12:29:23", "remaining_time": "1 day, 5:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5279, "total_steps": 17941, "loss": 1.6469, "learning_rate": 8.160617243039648e-05, "epoch": 0.29424223844824704, "percentage": 29.42, "elapsed_time": "12:29:32", "remaining_time": "1 day, 5:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5280, "total_steps": 17941, "loss": 1.762, "learning_rate": 8.159927232418325e-05, "epoch": 0.29429797670141017, "percentage": 29.43, "elapsed_time": "12:29:40", "remaining_time": "1 day, 5:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5281, "total_steps": 17941, "loss": 1.725, "learning_rate": 8.159237121582532e-05, "epoch": 0.2943537149545733, "percentage": 29.44, "elapsed_time": "12:29:49", "remaining_time": "1 day, 5:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5282, "total_steps": 17941, "loss": 1.59, "learning_rate": 8.158546910554159e-05, "epoch": 0.2944094532077365, "percentage": 29.44, "elapsed_time": "12:29:57", "remaining_time": "1 day, 5:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5283, "total_steps": 17941, "loss": 1.8722, "learning_rate": 8.157856599355093e-05, "epoch": 0.2944651914608996, "percentage": 29.45, "elapsed_time": "12:30:06", "remaining_time": "1 day, 5:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5284, "total_steps": 17941, "loss": 1.6608, "learning_rate": 8.157166188007228e-05, "epoch": 0.29452092971406274, "percentage": 29.45, "elapsed_time": "12:30:14", "remaining_time": "1 day, 5:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5285, "total_steps": 17941, "loss": 1.6745, "learning_rate": 8.156475676532458e-05, "epoch": 0.2945766679672259, "percentage": 29.46, "elapsed_time": "12:30:23", "remaining_time": "1 day, 5:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5286, "total_steps": 17941, "loss": 1.9036, "learning_rate": 8.155785064952683e-05, "epoch": 0.29463240622038905, "percentage": 29.46, "elapsed_time": "12:30:31", "remaining_time": "1 day, 5:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5287, "total_steps": 17941, "loss": 1.6749, "learning_rate": 8.155094353289807e-05, "epoch": 0.2946881444735522, "percentage": 29.47, "elapsed_time": "12:30:40", "remaining_time": "1 day, 5:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5288, "total_steps": 17941, "loss": 1.5855, "learning_rate": 8.154403541565732e-05, "epoch": 0.29474388272671537, "percentage": 29.47, "elapsed_time": "12:30:48", "remaining_time": "1 day, 5:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5289, "total_steps": 17941, "loss": 1.6667, "learning_rate": 8.153712629802369e-05, "epoch": 0.2947996209798785, "percentage": 29.48, "elapsed_time": "12:30:57", "remaining_time": "1 day, 5:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5290, "total_steps": 17941, "loss": 1.709, "learning_rate": 8.153021618021628e-05, "epoch": 0.2948553592330416, "percentage": 29.49, "elapsed_time": "12:31:05", "remaining_time": "1 day, 5:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5291, "total_steps": 17941, "loss": 1.4982, "learning_rate": 8.152330506245425e-05, "epoch": 0.2949110974862048, "percentage": 29.49, "elapsed_time": "12:31:14", "remaining_time": "1 day, 5:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5292, "total_steps": 17941, "loss": 1.6915, "learning_rate": 8.151639294495678e-05, "epoch": 0.29496683573936794, "percentage": 29.5, "elapsed_time": "12:31:22", "remaining_time": "1 day, 5:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5293, "total_steps": 17941, "loss": 1.4827, "learning_rate": 8.150947982794307e-05, "epoch": 0.29502257399253107, "percentage": 29.5, "elapsed_time": "12:31:30", "remaining_time": "1 day, 5:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5294, "total_steps": 17941, "loss": 1.805, "learning_rate": 8.150256571163238e-05, "epoch": 0.2950783122456942, "percentage": 29.51, "elapsed_time": "12:31:39", "remaining_time": "1 day, 5:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5295, "total_steps": 17941, "loss": 1.7433, "learning_rate": 8.149565059624398e-05, "epoch": 0.2951340504988574, "percentage": 29.51, "elapsed_time": "12:31:47", "remaining_time": "1 day, 5:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5296, "total_steps": 17941, "loss": 1.7681, "learning_rate": 8.148873448199717e-05, "epoch": 0.2951897887520205, "percentage": 29.52, "elapsed_time": "12:31:56", "remaining_time": "1 day, 5:55:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5297, "total_steps": 17941, "loss": 1.582, "learning_rate": 8.148181736911129e-05, "epoch": 0.29524552700518364, "percentage": 29.52, "elapsed_time": "12:32:04", "remaining_time": "1 day, 5:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5298, "total_steps": 17941, "loss": 1.8182, "learning_rate": 8.147489925780572e-05, "epoch": 0.2953012652583468, "percentage": 29.53, "elapsed_time": "12:32:13", "remaining_time": "1 day, 5:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5299, "total_steps": 17941, "loss": 1.4823, "learning_rate": 8.146798014829986e-05, "epoch": 0.29535700351150995, "percentage": 29.54, "elapsed_time": "12:32:21", "remaining_time": "1 day, 5:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5300, "total_steps": 17941, "loss": 1.6328, "learning_rate": 8.146106004081315e-05, "epoch": 0.2954127417646731, "percentage": 29.54, "elapsed_time": "12:32:30", "remaining_time": "1 day, 5:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5301, "total_steps": 17941, "loss": 1.5871, "learning_rate": 8.145413893556503e-05, "epoch": 0.29546848001783627, "percentage": 29.55, "elapsed_time": "12:32:38", "remaining_time": "1 day, 5:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5302, "total_steps": 17941, "loss": 1.6328, "learning_rate": 8.144721683277504e-05, "epoch": 0.2955242182709994, "percentage": 29.55, "elapsed_time": "12:32:46", "remaining_time": "1 day, 5:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5303, "total_steps": 17941, "loss": 1.6885, "learning_rate": 8.144029373266264e-05, "epoch": 0.2955799565241625, "percentage": 29.56, "elapsed_time": "12:32:55", "remaining_time": "1 day, 5:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5304, "total_steps": 17941, "loss": 1.8579, "learning_rate": 8.143336963544746e-05, "epoch": 0.29563569477732565, "percentage": 29.56, "elapsed_time": "12:33:04", "remaining_time": "1 day, 5:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5305, "total_steps": 17941, "loss": 1.8771, "learning_rate": 8.142644454134905e-05, "epoch": 0.29569143303048884, "percentage": 29.57, "elapsed_time": "12:33:12", "remaining_time": "1 day, 5:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5306, "total_steps": 17941, "loss": 1.6766, "learning_rate": 8.141951845058707e-05, "epoch": 0.29574717128365197, "percentage": 29.57, "elapsed_time": "12:33:20", "remaining_time": "1 day, 5:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5307, "total_steps": 17941, "loss": 1.7359, "learning_rate": 8.141259136338113e-05, "epoch": 0.2958029095368151, "percentage": 29.58, "elapsed_time": "12:33:29", "remaining_time": "1 day, 5:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5308, "total_steps": 17941, "loss": 1.9672, "learning_rate": 8.140566327995094e-05, "epoch": 0.2958586477899783, "percentage": 29.59, "elapsed_time": "12:33:37", "remaining_time": "1 day, 5:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5309, "total_steps": 17941, "loss": 1.5947, "learning_rate": 8.139873420051623e-05, "epoch": 0.2959143860431414, "percentage": 29.59, "elapsed_time": "12:33:46", "remaining_time": "1 day, 5:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5310, "total_steps": 17941, "loss": 1.7245, "learning_rate": 8.139180412529674e-05, "epoch": 0.29597012429630454, "percentage": 29.6, "elapsed_time": "12:33:55", "remaining_time": "1 day, 5:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5311, "total_steps": 17941, "loss": 1.7156, "learning_rate": 8.138487305451224e-05, "epoch": 0.2960258625494677, "percentage": 29.6, "elapsed_time": "12:34:03", "remaining_time": "1 day, 5:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5312, "total_steps": 17941, "loss": 1.78, "learning_rate": 8.137794098838257e-05, "epoch": 0.29608160080263085, "percentage": 29.61, "elapsed_time": "12:34:12", "remaining_time": "1 day, 5:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5313, "total_steps": 17941, "loss": 1.9258, "learning_rate": 8.137100792712755e-05, "epoch": 0.296137339055794, "percentage": 29.61, "elapsed_time": "12:34:20", "remaining_time": "1 day, 5:52:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5314, "total_steps": 17941, "loss": 1.7132, "learning_rate": 8.136407387096704e-05, "epoch": 0.29619307730895716, "percentage": 29.62, "elapsed_time": "12:34:28", "remaining_time": "1 day, 5:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5315, "total_steps": 17941, "loss": 1.8024, "learning_rate": 8.135713882012102e-05, "epoch": 0.2962488155621203, "percentage": 29.62, "elapsed_time": "12:34:37", "remaining_time": "1 day, 5:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5316, "total_steps": 17941, "loss": 1.7025, "learning_rate": 8.135020277480934e-05, "epoch": 0.2963045538152834, "percentage": 29.63, "elapsed_time": "12:34:45", "remaining_time": "1 day, 5:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5317, "total_steps": 17941, "loss": 1.7402, "learning_rate": 8.134326573525202e-05, "epoch": 0.29636029206844655, "percentage": 29.64, "elapsed_time": "12:34:54", "remaining_time": "1 day, 5:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5318, "total_steps": 17941, "loss": 1.585, "learning_rate": 8.133632770166907e-05, "epoch": 0.29641603032160974, "percentage": 29.64, "elapsed_time": "12:35:02", "remaining_time": "1 day, 5:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5319, "total_steps": 17941, "loss": 1.7313, "learning_rate": 8.13293886742805e-05, "epoch": 0.29647176857477286, "percentage": 29.65, "elapsed_time": "12:35:11", "remaining_time": "1 day, 5:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5320, "total_steps": 17941, "loss": 1.7854, "learning_rate": 8.132244865330638e-05, "epoch": 0.296527506827936, "percentage": 29.65, "elapsed_time": "12:35:19", "remaining_time": "1 day, 5:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5321, "total_steps": 17941, "loss": 1.6821, "learning_rate": 8.131550763896682e-05, "epoch": 0.2965832450810992, "percentage": 29.66, "elapsed_time": "12:35:27", "remaining_time": "1 day, 5:51:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5322, "total_steps": 17941, "loss": 1.6151, "learning_rate": 8.130856563148193e-05, "epoch": 0.2966389833342623, "percentage": 29.66, "elapsed_time": "12:35:36", "remaining_time": "1 day, 5:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5323, "total_steps": 17941, "loss": 1.7497, "learning_rate": 8.130162263107189e-05, "epoch": 0.29669472158742544, "percentage": 29.67, "elapsed_time": "12:35:44", "remaining_time": "1 day, 5:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5324, "total_steps": 17941, "loss": 1.7157, "learning_rate": 8.129467863795688e-05, "epoch": 0.2967504598405886, "percentage": 29.68, "elapsed_time": "12:35:53", "remaining_time": "1 day, 5:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5325, "total_steps": 17941, "loss": 1.6488, "learning_rate": 8.128773365235711e-05, "epoch": 0.29680619809375175, "percentage": 29.68, "elapsed_time": "12:36:01", "remaining_time": "1 day, 5:51:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5326, "total_steps": 17941, "loss": 1.6868, "learning_rate": 8.128078767449287e-05, "epoch": 0.2968619363469149, "percentage": 29.69, "elapsed_time": "12:36:10", "remaining_time": "1 day, 5:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5327, "total_steps": 17941, "loss": 1.9352, "learning_rate": 8.127384070458442e-05, "epoch": 0.296917674600078, "percentage": 29.69, "elapsed_time": "12:36:18", "remaining_time": "1 day, 5:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5328, "total_steps": 17941, "loss": 1.9085, "learning_rate": 8.126689274285207e-05, "epoch": 0.2969734128532412, "percentage": 29.7, "elapsed_time": "12:36:27", "remaining_time": "1 day, 5:50:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5329, "total_steps": 17941, "loss": 1.715, "learning_rate": 8.125994378951619e-05, "epoch": 0.2970291511064043, "percentage": 29.7, "elapsed_time": "12:36:35", "remaining_time": "1 day, 5:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5330, "total_steps": 17941, "loss": 1.7472, "learning_rate": 8.125299384479714e-05, "epoch": 0.29708488935956745, "percentage": 29.71, "elapsed_time": "12:36:43", "remaining_time": "1 day, 5:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5331, "total_steps": 17941, "loss": 1.8646, "learning_rate": 8.124604290891535e-05, "epoch": 0.29714062761273063, "percentage": 29.71, "elapsed_time": "12:36:52", "remaining_time": "1 day, 5:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5332, "total_steps": 17941, "loss": 1.6506, "learning_rate": 8.123909098209126e-05, "epoch": 0.29719636586589376, "percentage": 29.72, "elapsed_time": "12:37:00", "remaining_time": "1 day, 5:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5333, "total_steps": 17941, "loss": 1.805, "learning_rate": 8.123213806454535e-05, "epoch": 0.2972521041190569, "percentage": 29.73, "elapsed_time": "12:37:09", "remaining_time": "1 day, 5:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5334, "total_steps": 17941, "loss": 1.6501, "learning_rate": 8.122518415649808e-05, "epoch": 0.2973078423722201, "percentage": 29.73, "elapsed_time": "12:37:17", "remaining_time": "1 day, 5:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5335, "total_steps": 17941, "loss": 1.7944, "learning_rate": 8.121822925817006e-05, "epoch": 0.2973635806253832, "percentage": 29.74, "elapsed_time": "12:37:26", "remaining_time": "1 day, 5:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5336, "total_steps": 17941, "loss": 1.5578, "learning_rate": 8.121127336978183e-05, "epoch": 0.29741931887854633, "percentage": 29.74, "elapsed_time": "12:37:34", "remaining_time": "1 day, 5:49:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5337, "total_steps": 17941, "loss": 1.7118, "learning_rate": 8.120431649155396e-05, "epoch": 0.2974750571317095, "percentage": 29.75, "elapsed_time": "12:37:43", "remaining_time": "1 day, 5:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5338, "total_steps": 17941, "loss": 1.7363, "learning_rate": 8.11973586237071e-05, "epoch": 0.29753079538487265, "percentage": 29.75, "elapsed_time": "12:37:51", "remaining_time": "1 day, 5:49:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5339, "total_steps": 17941, "loss": 1.74, "learning_rate": 8.119039976646192e-05, "epoch": 0.2975865336380358, "percentage": 29.76, "elapsed_time": "12:38:00", "remaining_time": "1 day, 5:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5340, "total_steps": 17941, "loss": 1.5712, "learning_rate": 8.118343992003913e-05, "epoch": 0.2976422718911989, "percentage": 29.76, "elapsed_time": "12:38:08", "remaining_time": "1 day, 5:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5341, "total_steps": 17941, "loss": 1.5346, "learning_rate": 8.117647908465942e-05, "epoch": 0.2976980101443621, "percentage": 29.77, "elapsed_time": "12:38:17", "remaining_time": "1 day, 5:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5342, "total_steps": 17941, "loss": 2.0871, "learning_rate": 8.116951726054358e-05, "epoch": 0.2977537483975252, "percentage": 29.78, "elapsed_time": "12:38:26", "remaining_time": "1 day, 5:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5343, "total_steps": 17941, "loss": 1.5362, "learning_rate": 8.116255444791237e-05, "epoch": 0.29780948665068835, "percentage": 29.78, "elapsed_time": "12:38:34", "remaining_time": "1 day, 5:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5344, "total_steps": 17941, "loss": 1.5788, "learning_rate": 8.115559064698662e-05, "epoch": 0.29786522490385153, "percentage": 29.79, "elapsed_time": "12:38:43", "remaining_time": "1 day, 5:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5345, "total_steps": 17941, "loss": 1.7055, "learning_rate": 8.11486258579872e-05, "epoch": 0.29792096315701466, "percentage": 29.79, "elapsed_time": "12:38:51", "remaining_time": "1 day, 5:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5346, "total_steps": 17941, "loss": 1.8135, "learning_rate": 8.114166008113498e-05, "epoch": 0.2979767014101778, "percentage": 29.8, "elapsed_time": "12:39:00", "remaining_time": "1 day, 5:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5347, "total_steps": 17941, "loss": 1.655, "learning_rate": 8.113469331665085e-05, "epoch": 0.298032439663341, "percentage": 29.8, "elapsed_time": "12:39:08", "remaining_time": "1 day, 5:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5348, "total_steps": 17941, "loss": 2.0929, "learning_rate": 8.112772556475579e-05, "epoch": 0.2980881779165041, "percentage": 29.81, "elapsed_time": "12:39:17", "remaining_time": "1 day, 5:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5349, "total_steps": 17941, "loss": 1.6594, "learning_rate": 8.112075682567075e-05, "epoch": 0.29814391616966723, "percentage": 29.81, "elapsed_time": "12:39:25", "remaining_time": "1 day, 5:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5350, "total_steps": 17941, "loss": 1.7254, "learning_rate": 8.111378709961676e-05, "epoch": 0.29819965442283036, "percentage": 29.82, "elapsed_time": "12:39:34", "remaining_time": "1 day, 5:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5351, "total_steps": 17941, "loss": 1.7559, "learning_rate": 8.110681638681485e-05, "epoch": 0.29825539267599355, "percentage": 29.83, "elapsed_time": "12:39:42", "remaining_time": "1 day, 5:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5352, "total_steps": 17941, "loss": 1.6271, "learning_rate": 8.109984468748608e-05, "epoch": 0.2983111309291567, "percentage": 29.83, "elapsed_time": "12:39:51", "remaining_time": "1 day, 5:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5353, "total_steps": 17941, "loss": 1.6231, "learning_rate": 8.109287200185157e-05, "epoch": 0.2983668691823198, "percentage": 29.84, "elapsed_time": "12:40:00", "remaining_time": "1 day, 5:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5354, "total_steps": 17941, "loss": 1.5838, "learning_rate": 8.108589833013245e-05, "epoch": 0.298422607435483, "percentage": 29.84, "elapsed_time": "12:40:08", "remaining_time": "1 day, 5:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5355, "total_steps": 17941, "loss": 1.5132, "learning_rate": 8.107892367254986e-05, "epoch": 0.2984783456886461, "percentage": 29.85, "elapsed_time": "12:40:17", "remaining_time": "1 day, 5:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5356, "total_steps": 17941, "loss": 1.811, "learning_rate": 8.107194802932503e-05, "epoch": 0.29853408394180925, "percentage": 29.85, "elapsed_time": "12:40:25", "remaining_time": "1 day, 5:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5357, "total_steps": 17941, "loss": 1.8477, "learning_rate": 8.106497140067916e-05, "epoch": 0.29858982219497243, "percentage": 29.86, "elapsed_time": "12:40:34", "remaining_time": "1 day, 5:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5358, "total_steps": 17941, "loss": 1.5521, "learning_rate": 8.105799378683353e-05, "epoch": 0.29864556044813556, "percentage": 29.86, "elapsed_time": "12:40:42", "remaining_time": "1 day, 5:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5359, "total_steps": 17941, "loss": 1.6123, "learning_rate": 8.10510151880094e-05, "epoch": 0.2987012987012987, "percentage": 29.87, "elapsed_time": "12:40:51", "remaining_time": "1 day, 5:46:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5360, "total_steps": 17941, "loss": 1.6369, "learning_rate": 8.104403560442813e-05, "epoch": 0.2987570369544619, "percentage": 29.88, "elapsed_time": "12:40:59", "remaining_time": "1 day, 5:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5361, "total_steps": 17941, "loss": 1.762, "learning_rate": 8.103705503631104e-05, "epoch": 0.298812775207625, "percentage": 29.88, "elapsed_time": "12:41:08", "remaining_time": "1 day, 5:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5362, "total_steps": 17941, "loss": 1.9896, "learning_rate": 8.103007348387952e-05, "epoch": 0.29886851346078813, "percentage": 29.89, "elapsed_time": "12:41:16", "remaining_time": "1 day, 5:45:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5363, "total_steps": 17941, "loss": 1.7463, "learning_rate": 8.102309094735498e-05, "epoch": 0.29892425171395126, "percentage": 29.89, "elapsed_time": "12:41:25", "remaining_time": "1 day, 5:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5364, "total_steps": 17941, "loss": 1.4381, "learning_rate": 8.101610742695889e-05, "epoch": 0.29897998996711445, "percentage": 29.9, "elapsed_time": "12:41:33", "remaining_time": "1 day, 5:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5365, "total_steps": 17941, "loss": 1.8118, "learning_rate": 8.100912292291269e-05, "epoch": 0.2990357282202776, "percentage": 29.9, "elapsed_time": "12:41:41", "remaining_time": "1 day, 5:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5366, "total_steps": 17941, "loss": 1.7309, "learning_rate": 8.100213743543793e-05, "epoch": 0.2990914664734407, "percentage": 29.91, "elapsed_time": "12:41:50", "remaining_time": "1 day, 5:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5367, "total_steps": 17941, "loss": 1.7422, "learning_rate": 8.099515096475611e-05, "epoch": 0.2991472047266039, "percentage": 29.91, "elapsed_time": "12:41:58", "remaining_time": "1 day, 5:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5368, "total_steps": 17941, "loss": 1.5088, "learning_rate": 8.098816351108881e-05, "epoch": 0.299202942979767, "percentage": 29.92, "elapsed_time": "12:42:07", "remaining_time": "1 day, 5:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5369, "total_steps": 17941, "loss": 1.4643, "learning_rate": 8.098117507465765e-05, "epoch": 0.29925868123293015, "percentage": 29.93, "elapsed_time": "12:42:15", "remaining_time": "1 day, 5:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5370, "total_steps": 17941, "loss": 1.3811, "learning_rate": 8.097418565568424e-05, "epoch": 0.29931441948609333, "percentage": 29.93, "elapsed_time": "12:42:24", "remaining_time": "1 day, 5:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5371, "total_steps": 17941, "loss": 1.5929, "learning_rate": 8.096719525439026e-05, "epoch": 0.29937015773925646, "percentage": 29.94, "elapsed_time": "12:42:32", "remaining_time": "1 day, 5:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5372, "total_steps": 17941, "loss": 1.5428, "learning_rate": 8.096020387099739e-05, "epoch": 0.2994258959924196, "percentage": 29.94, "elapsed_time": "12:42:41", "remaining_time": "1 day, 5:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5373, "total_steps": 17941, "loss": 1.5148, "learning_rate": 8.095321150572738e-05, "epoch": 0.2994816342455827, "percentage": 29.95, "elapsed_time": "12:42:49", "remaining_time": "1 day, 5:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5374, "total_steps": 17941, "loss": 1.898, "learning_rate": 8.094621815880197e-05, "epoch": 0.2995373724987459, "percentage": 29.95, "elapsed_time": "12:42:57", "remaining_time": "1 day, 5:44:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5375, "total_steps": 17941, "loss": 1.4073, "learning_rate": 8.093922383044293e-05, "epoch": 0.29959311075190903, "percentage": 29.96, "elapsed_time": "12:43:06", "remaining_time": "1 day, 5:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5376, "total_steps": 17941, "loss": 1.7551, "learning_rate": 8.09322285208721e-05, "epoch": 0.29964884900507216, "percentage": 29.96, "elapsed_time": "12:43:14", "remaining_time": "1 day, 5:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5377, "total_steps": 17941, "loss": 1.8272, "learning_rate": 8.092523223031134e-05, "epoch": 0.29970458725823534, "percentage": 29.97, "elapsed_time": "12:43:23", "remaining_time": "1 day, 5:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5378, "total_steps": 17941, "loss": 1.6346, "learning_rate": 8.091823495898251e-05, "epoch": 0.2997603255113985, "percentage": 29.98, "elapsed_time": "12:43:31", "remaining_time": "1 day, 5:43:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5379, "total_steps": 17941, "loss": 1.7025, "learning_rate": 8.091123670710754e-05, "epoch": 0.2998160637645616, "percentage": 29.98, "elapsed_time": "12:43:41", "remaining_time": "1 day, 5:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5380, "total_steps": 17941, "loss": 1.6895, "learning_rate": 8.090423747490836e-05, "epoch": 0.2998718020177248, "percentage": 29.99, "elapsed_time": "12:43:49", "remaining_time": "1 day, 5:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5381, "total_steps": 17941, "loss": 1.8338, "learning_rate": 8.089723726260696e-05, "epoch": 0.2999275402708879, "percentage": 29.99, "elapsed_time": "12:43:58", "remaining_time": "1 day, 5:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5382, "total_steps": 17941, "loss": 1.65, "learning_rate": 8.089023607042534e-05, "epoch": 0.29998327852405104, "percentage": 30.0, "elapsed_time": "12:44:07", "remaining_time": "1 day, 5:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5383, "total_steps": 17941, "loss": 1.433, "learning_rate": 8.088323389858552e-05, "epoch": 0.30003901677721423, "percentage": 30.0, "elapsed_time": "12:44:15", "remaining_time": "1 day, 5:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5384, "total_steps": 17941, "loss": 1.3703, "learning_rate": 8.08762307473096e-05, "epoch": 0.30009475503037736, "percentage": 30.01, "elapsed_time": "12:44:24", "remaining_time": "1 day, 5:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5385, "total_steps": 17941, "loss": 2.1215, "learning_rate": 8.086922661681966e-05, "epoch": 0.3001504932835405, "percentage": 30.02, "elapsed_time": "12:44:33", "remaining_time": "1 day, 5:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5386, "total_steps": 17941, "loss": 1.5703, "learning_rate": 8.086222150733782e-05, "epoch": 0.3002062315367036, "percentage": 30.02, "elapsed_time": "12:44:41", "remaining_time": "1 day, 5:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5387, "total_steps": 17941, "loss": 1.5785, "learning_rate": 8.085521541908627e-05, "epoch": 0.3002619697898668, "percentage": 30.03, "elapsed_time": "12:44:50", "remaining_time": "1 day, 5:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5388, "total_steps": 17941, "loss": 1.799, "learning_rate": 8.084820835228717e-05, "epoch": 0.30031770804302993, "percentage": 30.03, "elapsed_time": "12:44:58", "remaining_time": "1 day, 5:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5389, "total_steps": 17941, "loss": 1.6782, "learning_rate": 8.084120030716275e-05, "epoch": 0.30037344629619306, "percentage": 30.04, "elapsed_time": "12:45:06", "remaining_time": "1 day, 5:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5390, "total_steps": 17941, "loss": 1.6544, "learning_rate": 8.083419128393528e-05, "epoch": 0.30042918454935624, "percentage": 30.04, "elapsed_time": "12:45:15", "remaining_time": "1 day, 5:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5391, "total_steps": 17941, "loss": 1.7962, "learning_rate": 8.082718128282705e-05, "epoch": 0.30048492280251937, "percentage": 30.05, "elapsed_time": "12:45:23", "remaining_time": "1 day, 5:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5392, "total_steps": 17941, "loss": 1.7551, "learning_rate": 8.082017030406037e-05, "epoch": 0.3005406610556825, "percentage": 30.05, "elapsed_time": "12:45:33", "remaining_time": "1 day, 5:41:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5393, "total_steps": 17941, "loss": 1.8789, "learning_rate": 8.081315834785756e-05, "epoch": 0.3005963993088457, "percentage": 30.06, "elapsed_time": "12:45:41", "remaining_time": "1 day, 5:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5394, "total_steps": 17941, "loss": 1.7545, "learning_rate": 8.080614541444103e-05, "epoch": 0.3006521375620088, "percentage": 30.07, "elapsed_time": "12:45:50", "remaining_time": "1 day, 5:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5395, "total_steps": 17941, "loss": 1.6059, "learning_rate": 8.079913150403318e-05, "epoch": 0.30070787581517194, "percentage": 30.07, "elapsed_time": "12:45:58", "remaining_time": "1 day, 5:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5396, "total_steps": 17941, "loss": 2.0125, "learning_rate": 8.079211661685644e-05, "epoch": 0.3007636140683351, "percentage": 30.08, "elapsed_time": "12:46:07", "remaining_time": "1 day, 5:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5397, "total_steps": 17941, "loss": 1.8713, "learning_rate": 8.07851007531333e-05, "epoch": 0.30081935232149826, "percentage": 30.08, "elapsed_time": "12:46:15", "remaining_time": "1 day, 5:40:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5398, "total_steps": 17941, "loss": 1.6547, "learning_rate": 8.077808391308626e-05, "epoch": 0.3008750905746614, "percentage": 30.09, "elapsed_time": "12:46:24", "remaining_time": "1 day, 5:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5399, "total_steps": 17941, "loss": 1.5186, "learning_rate": 8.077106609693784e-05, "epoch": 0.3009308288278245, "percentage": 30.09, "elapsed_time": "12:46:32", "remaining_time": "1 day, 5:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5400, "total_steps": 17941, "loss": 1.8402, "learning_rate": 8.076404730491061e-05, "epoch": 0.3009865670809877, "percentage": 30.1, "elapsed_time": "12:46:41", "remaining_time": "1 day, 5:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5401, "total_steps": 17941, "loss": 1.656, "learning_rate": 8.075702753722718e-05, "epoch": 0.30104230533415083, "percentage": 30.1, "elapsed_time": "12:46:49", "remaining_time": "1 day, 5:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5402, "total_steps": 17941, "loss": 1.6743, "learning_rate": 8.075000679411014e-05, "epoch": 0.30109804358731396, "percentage": 30.11, "elapsed_time": "12:46:58", "remaining_time": "1 day, 5:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5403, "total_steps": 17941, "loss": 1.7567, "learning_rate": 8.074298507578218e-05, "epoch": 0.30115378184047714, "percentage": 30.12, "elapsed_time": "12:47:06", "remaining_time": "1 day, 5:40:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5404, "total_steps": 17941, "loss": 1.5783, "learning_rate": 8.073596238246599e-05, "epoch": 0.30120952009364027, "percentage": 30.12, "elapsed_time": "12:47:15", "remaining_time": "1 day, 5:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5405, "total_steps": 17941, "loss": 1.7135, "learning_rate": 8.072893871438428e-05, "epoch": 0.3012652583468034, "percentage": 30.13, "elapsed_time": "12:47:23", "remaining_time": "1 day, 5:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5406, "total_steps": 17941, "loss": 1.8845, "learning_rate": 8.072191407175976e-05, "epoch": 0.3013209965999666, "percentage": 30.13, "elapsed_time": "12:47:32", "remaining_time": "1 day, 5:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5407, "total_steps": 17941, "loss": 1.6139, "learning_rate": 8.071488845481528e-05, "epoch": 0.3013767348531297, "percentage": 30.14, "elapsed_time": "12:47:40", "remaining_time": "1 day, 5:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5408, "total_steps": 17941, "loss": 1.4973, "learning_rate": 8.07078618637736e-05, "epoch": 0.30143247310629284, "percentage": 30.14, "elapsed_time": "12:47:49", "remaining_time": "1 day, 5:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5409, "total_steps": 17941, "loss": 1.7224, "learning_rate": 8.070083429885758e-05, "epoch": 0.30148821135945597, "percentage": 30.15, "elapsed_time": "12:47:57", "remaining_time": "1 day, 5:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5410, "total_steps": 17941, "loss": 1.508, "learning_rate": 8.069380576029011e-05, "epoch": 0.30154394961261916, "percentage": 30.15, "elapsed_time": "12:48:06", "remaining_time": "1 day, 5:39:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5411, "total_steps": 17941, "loss": 2.0365, "learning_rate": 8.068677624829406e-05, "epoch": 0.3015996878657823, "percentage": 30.16, "elapsed_time": "12:48:14", "remaining_time": "1 day, 5:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5412, "total_steps": 17941, "loss": 1.8489, "learning_rate": 8.067974576309241e-05, "epoch": 0.3016554261189454, "percentage": 30.17, "elapsed_time": "12:48:22", "remaining_time": "1 day, 5:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5413, "total_steps": 17941, "loss": 1.7361, "learning_rate": 8.067271430490809e-05, "epoch": 0.3017111643721086, "percentage": 30.17, "elapsed_time": "12:48:31", "remaining_time": "1 day, 5:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5414, "total_steps": 17941, "loss": 1.5648, "learning_rate": 8.066568187396409e-05, "epoch": 0.3017669026252717, "percentage": 30.18, "elapsed_time": "12:48:40", "remaining_time": "1 day, 5:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5415, "total_steps": 17941, "loss": 1.7308, "learning_rate": 8.065864847048346e-05, "epoch": 0.30182264087843486, "percentage": 30.18, "elapsed_time": "12:48:48", "remaining_time": "1 day, 5:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5416, "total_steps": 17941, "loss": 1.9456, "learning_rate": 8.065161409468925e-05, "epoch": 0.30187837913159804, "percentage": 30.19, "elapsed_time": "12:48:57", "remaining_time": "1 day, 5:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5417, "total_steps": 17941, "loss": 1.8213, "learning_rate": 8.064457874680457e-05, "epoch": 0.30193411738476117, "percentage": 30.19, "elapsed_time": "12:49:05", "remaining_time": "1 day, 5:38:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5418, "total_steps": 17941, "loss": 1.8837, "learning_rate": 8.06375424270525e-05, "epoch": 0.3019898556379243, "percentage": 30.2, "elapsed_time": "12:49:14", "remaining_time": "1 day, 5:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5419, "total_steps": 17941, "loss": 1.9783, "learning_rate": 8.063050513565624e-05, "epoch": 0.3020455938910874, "percentage": 30.2, "elapsed_time": "12:49:22", "remaining_time": "1 day, 5:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5420, "total_steps": 17941, "loss": 1.8092, "learning_rate": 8.062346687283892e-05, "epoch": 0.3021013321442506, "percentage": 30.21, "elapsed_time": "12:49:31", "remaining_time": "1 day, 5:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5421, "total_steps": 17941, "loss": 1.6994, "learning_rate": 8.06164276388238e-05, "epoch": 0.30215707039741374, "percentage": 30.22, "elapsed_time": "12:49:39", "remaining_time": "1 day, 5:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5422, "total_steps": 17941, "loss": 1.5504, "learning_rate": 8.060938743383408e-05, "epoch": 0.30221280865057687, "percentage": 30.22, "elapsed_time": "12:49:47", "remaining_time": "1 day, 5:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5423, "total_steps": 17941, "loss": 1.8898, "learning_rate": 8.060234625809306e-05, "epoch": 0.30226854690374005, "percentage": 30.23, "elapsed_time": "12:49:56", "remaining_time": "1 day, 5:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5424, "total_steps": 17941, "loss": 1.7518, "learning_rate": 8.059530411182406e-05, "epoch": 0.3023242851569032, "percentage": 30.23, "elapsed_time": "12:50:04", "remaining_time": "1 day, 5:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5425, "total_steps": 17941, "loss": 1.92, "learning_rate": 8.058826099525039e-05, "epoch": 0.3023800234100663, "percentage": 30.24, "elapsed_time": "12:50:13", "remaining_time": "1 day, 5:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5426, "total_steps": 17941, "loss": 1.7421, "learning_rate": 8.058121690859541e-05, "epoch": 0.3024357616632295, "percentage": 30.24, "elapsed_time": "12:50:21", "remaining_time": "1 day, 5:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5427, "total_steps": 17941, "loss": 1.7487, "learning_rate": 8.057417185208254e-05, "epoch": 0.3024914999163926, "percentage": 30.25, "elapsed_time": "12:50:30", "remaining_time": "1 day, 5:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5428, "total_steps": 17941, "loss": 1.7268, "learning_rate": 8.056712582593519e-05, "epoch": 0.30254723816955575, "percentage": 30.25, "elapsed_time": "12:50:38", "remaining_time": "1 day, 5:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5429, "total_steps": 17941, "loss": 1.8249, "learning_rate": 8.056007883037682e-05, "epoch": 0.30260297642271894, "percentage": 30.26, "elapsed_time": "12:50:47", "remaining_time": "1 day, 5:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5430, "total_steps": 17941, "loss": 1.8337, "learning_rate": 8.055303086563095e-05, "epoch": 0.30265871467588207, "percentage": 30.27, "elapsed_time": "12:50:55", "remaining_time": "1 day, 5:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5431, "total_steps": 17941, "loss": 2.0531, "learning_rate": 8.054598193192106e-05, "epoch": 0.3027144529290452, "percentage": 30.27, "elapsed_time": "12:51:04", "remaining_time": "1 day, 5:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5432, "total_steps": 17941, "loss": 1.6712, "learning_rate": 8.053893202947074e-05, "epoch": 0.3027701911822083, "percentage": 30.28, "elapsed_time": "12:51:12", "remaining_time": "1 day, 5:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5433, "total_steps": 17941, "loss": 1.5738, "learning_rate": 8.053188115850354e-05, "epoch": 0.3028259294353715, "percentage": 30.28, "elapsed_time": "12:51:21", "remaining_time": "1 day, 5:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5434, "total_steps": 17941, "loss": 1.8257, "learning_rate": 8.052482931924308e-05, "epoch": 0.30288166768853464, "percentage": 30.29, "elapsed_time": "12:51:29", "remaining_time": "1 day, 5:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5435, "total_steps": 17941, "loss": 1.7261, "learning_rate": 8.051777651191299e-05, "epoch": 0.30293740594169777, "percentage": 30.29, "elapsed_time": "12:51:37", "remaining_time": "1 day, 5:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5436, "total_steps": 17941, "loss": 1.7634, "learning_rate": 8.051072273673698e-05, "epoch": 0.30299314419486095, "percentage": 30.3, "elapsed_time": "12:51:46", "remaining_time": "1 day, 5:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5437, "total_steps": 17941, "loss": 1.5592, "learning_rate": 8.050366799393874e-05, "epoch": 0.3030488824480241, "percentage": 30.3, "elapsed_time": "12:51:54", "remaining_time": "1 day, 5:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5438, "total_steps": 17941, "loss": 1.7104, "learning_rate": 8.049661228374199e-05, "epoch": 0.3031046207011872, "percentage": 30.31, "elapsed_time": "12:52:04", "remaining_time": "1 day, 5:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5439, "total_steps": 17941, "loss": 1.7344, "learning_rate": 8.04895556063705e-05, "epoch": 0.3031603589543504, "percentage": 30.32, "elapsed_time": "12:52:12", "remaining_time": "1 day, 5:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5440, "total_steps": 17941, "loss": 1.6345, "learning_rate": 8.048249796204808e-05, "epoch": 0.3032160972075135, "percentage": 30.32, "elapsed_time": "12:52:21", "remaining_time": "1 day, 5:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5441, "total_steps": 17941, "loss": 1.542, "learning_rate": 8.047543935099855e-05, "epoch": 0.30327183546067665, "percentage": 30.33, "elapsed_time": "12:52:29", "remaining_time": "1 day, 5:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5442, "total_steps": 17941, "loss": 1.8106, "learning_rate": 8.046837977344577e-05, "epoch": 0.3033275737138398, "percentage": 30.33, "elapsed_time": "12:52:37", "remaining_time": "1 day, 5:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5443, "total_steps": 17941, "loss": 1.8995, "learning_rate": 8.046131922961362e-05, "epoch": 0.30338331196700297, "percentage": 30.34, "elapsed_time": "12:52:46", "remaining_time": "1 day, 5:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5444, "total_steps": 17941, "loss": 1.471, "learning_rate": 8.045425771972603e-05, "epoch": 0.3034390502201661, "percentage": 30.34, "elapsed_time": "12:52:54", "remaining_time": "1 day, 5:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5445, "total_steps": 17941, "loss": 1.6613, "learning_rate": 8.044719524400694e-05, "epoch": 0.3034947884733292, "percentage": 30.35, "elapsed_time": "12:53:04", "remaining_time": "1 day, 5:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5446, "total_steps": 17941, "loss": 1.7442, "learning_rate": 8.044013180268034e-05, "epoch": 0.3035505267264924, "percentage": 30.36, "elapsed_time": "12:53:12", "remaining_time": "1 day, 5:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5447, "total_steps": 17941, "loss": 1.7848, "learning_rate": 8.043306739597024e-05, "epoch": 0.30360626497965554, "percentage": 30.36, "elapsed_time": "12:53:21", "remaining_time": "1 day, 5:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5448, "total_steps": 17941, "loss": 1.5744, "learning_rate": 8.042600202410066e-05, "epoch": 0.30366200323281867, "percentage": 30.37, "elapsed_time": "12:53:29", "remaining_time": "1 day, 5:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5449, "total_steps": 17941, "loss": 1.6689, "learning_rate": 8.041893568729573e-05, "epoch": 0.30371774148598185, "percentage": 30.37, "elapsed_time": "12:53:37", "remaining_time": "1 day, 5:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5450, "total_steps": 17941, "loss": 1.6285, "learning_rate": 8.041186838577949e-05, "epoch": 0.303773479739145, "percentage": 30.38, "elapsed_time": "12:53:46", "remaining_time": "1 day, 5:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5451, "total_steps": 17941, "loss": 1.5176, "learning_rate": 8.04048001197761e-05, "epoch": 0.3038292179923081, "percentage": 30.38, "elapsed_time": "12:53:54", "remaining_time": "1 day, 5:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5452, "total_steps": 17941, "loss": 1.6778, "learning_rate": 8.039773088950973e-05, "epoch": 0.3038849562454713, "percentage": 30.39, "elapsed_time": "12:54:03", "remaining_time": "1 day, 5:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5453, "total_steps": 17941, "loss": 1.9253, "learning_rate": 8.039066069520455e-05, "epoch": 0.3039406944986344, "percentage": 30.39, "elapsed_time": "12:54:11", "remaining_time": "1 day, 5:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5454, "total_steps": 17941, "loss": 1.8921, "learning_rate": 8.038358953708482e-05, "epoch": 0.30399643275179755, "percentage": 30.4, "elapsed_time": "12:54:20", "remaining_time": "1 day, 5:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5455, "total_steps": 17941, "loss": 1.6157, "learning_rate": 8.037651741537478e-05, "epoch": 0.3040521710049607, "percentage": 30.41, "elapsed_time": "12:54:29", "remaining_time": "1 day, 5:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5456, "total_steps": 17941, "loss": 1.6204, "learning_rate": 8.03694443302987e-05, "epoch": 0.30410790925812387, "percentage": 30.41, "elapsed_time": "12:54:37", "remaining_time": "1 day, 5:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5457, "total_steps": 17941, "loss": 1.6984, "learning_rate": 8.036237028208092e-05, "epoch": 0.304163647511287, "percentage": 30.42, "elapsed_time": "12:54:46", "remaining_time": "1 day, 5:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5458, "total_steps": 17941, "loss": 1.5733, "learning_rate": 8.035529527094578e-05, "epoch": 0.3042193857644501, "percentage": 30.42, "elapsed_time": "12:54:54", "remaining_time": "1 day, 5:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5459, "total_steps": 17941, "loss": 1.6158, "learning_rate": 8.034821929711767e-05, "epoch": 0.3042751240176133, "percentage": 30.43, "elapsed_time": "12:55:03", "remaining_time": "1 day, 5:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5460, "total_steps": 17941, "loss": 1.8269, "learning_rate": 8.034114236082098e-05, "epoch": 0.30433086227077644, "percentage": 30.43, "elapsed_time": "12:55:11", "remaining_time": "1 day, 5:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5461, "total_steps": 17941, "loss": 1.8742, "learning_rate": 8.033406446228014e-05, "epoch": 0.30438660052393957, "percentage": 30.44, "elapsed_time": "12:55:19", "remaining_time": "1 day, 5:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5462, "total_steps": 17941, "loss": 1.9496, "learning_rate": 8.032698560171964e-05, "epoch": 0.30444233877710275, "percentage": 30.44, "elapsed_time": "12:55:28", "remaining_time": "1 day, 5:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5463, "total_steps": 17941, "loss": 1.5899, "learning_rate": 8.031990577936398e-05, "epoch": 0.3044980770302659, "percentage": 30.45, "elapsed_time": "12:55:36", "remaining_time": "1 day, 5:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5464, "total_steps": 17941, "loss": 1.6575, "learning_rate": 8.031282499543769e-05, "epoch": 0.304553815283429, "percentage": 30.46, "elapsed_time": "12:55:45", "remaining_time": "1 day, 5:31:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5465, "total_steps": 17941, "loss": 1.5878, "learning_rate": 8.030574325016532e-05, "epoch": 0.30460955353659214, "percentage": 30.46, "elapsed_time": "12:55:53", "remaining_time": "1 day, 5:31:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5466, "total_steps": 17941, "loss": 1.5681, "learning_rate": 8.029866054377148e-05, "epoch": 0.3046652917897553, "percentage": 30.47, "elapsed_time": "12:56:02", "remaining_time": "1 day, 5:31:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5467, "total_steps": 17941, "loss": 1.6819, "learning_rate": 8.029157687648077e-05, "epoch": 0.30472103004291845, "percentage": 30.47, "elapsed_time": "12:56:10", "remaining_time": "1 day, 5:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5468, "total_steps": 17941, "loss": 1.8688, "learning_rate": 8.028449224851785e-05, "epoch": 0.3047767682960816, "percentage": 30.48, "elapsed_time": "12:56:18", "remaining_time": "1 day, 5:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5469, "total_steps": 17941, "loss": 1.7629, "learning_rate": 8.027740666010741e-05, "epoch": 0.30483250654924476, "percentage": 30.48, "elapsed_time": "12:56:27", "remaining_time": "1 day, 5:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5470, "total_steps": 17941, "loss": 1.594, "learning_rate": 8.027032011147417e-05, "epoch": 0.3048882448024079, "percentage": 30.49, "elapsed_time": "12:56:35", "remaining_time": "1 day, 5:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5471, "total_steps": 17941, "loss": 1.6677, "learning_rate": 8.026323260284286e-05, "epoch": 0.304943983055571, "percentage": 30.49, "elapsed_time": "12:56:44", "remaining_time": "1 day, 5:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5472, "total_steps": 17941, "loss": 1.5382, "learning_rate": 8.025614413443824e-05, "epoch": 0.3049997213087342, "percentage": 30.5, "elapsed_time": "12:56:52", "remaining_time": "1 day, 5:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5473, "total_steps": 17941, "loss": 1.59, "learning_rate": 8.024905470648516e-05, "epoch": 0.30505545956189734, "percentage": 30.51, "elapsed_time": "12:57:01", "remaining_time": "1 day, 5:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5474, "total_steps": 17941, "loss": 1.6797, "learning_rate": 8.024196431920841e-05, "epoch": 0.30511119781506046, "percentage": 30.51, "elapsed_time": "12:57:09", "remaining_time": "1 day, 5:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5475, "total_steps": 17941, "loss": 1.7703, "learning_rate": 8.023487297283289e-05, "epoch": 0.30516693606822365, "percentage": 30.52, "elapsed_time": "12:57:18", "remaining_time": "1 day, 5:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5476, "total_steps": 17941, "loss": 1.5239, "learning_rate": 8.022778066758348e-05, "epoch": 0.3052226743213868, "percentage": 30.52, "elapsed_time": "12:57:26", "remaining_time": "1 day, 5:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5477, "total_steps": 17941, "loss": 1.8356, "learning_rate": 8.02206874036851e-05, "epoch": 0.3052784125745499, "percentage": 30.53, "elapsed_time": "12:57:35", "remaining_time": "1 day, 5:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5478, "total_steps": 17941, "loss": 1.8527, "learning_rate": 8.021359318136273e-05, "epoch": 0.30533415082771304, "percentage": 30.53, "elapsed_time": "12:57:43", "remaining_time": "1 day, 5:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5479, "total_steps": 17941, "loss": 1.7682, "learning_rate": 8.020649800084133e-05, "epoch": 0.3053898890808762, "percentage": 30.54, "elapsed_time": "12:57:52", "remaining_time": "1 day, 5:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5480, "total_steps": 17941, "loss": 1.7112, "learning_rate": 8.019940186234591e-05, "epoch": 0.30544562733403935, "percentage": 30.54, "elapsed_time": "12:58:00", "remaining_time": "1 day, 5:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5481, "total_steps": 17941, "loss": 1.7824, "learning_rate": 8.019230476610155e-05, "epoch": 0.3055013655872025, "percentage": 30.55, "elapsed_time": "12:58:09", "remaining_time": "1 day, 5:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5482, "total_steps": 17941, "loss": 1.8217, "learning_rate": 8.018520671233333e-05, "epoch": 0.30555710384036566, "percentage": 30.56, "elapsed_time": "12:58:17", "remaining_time": "1 day, 5:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5483, "total_steps": 17941, "loss": 1.572, "learning_rate": 8.017810770126633e-05, "epoch": 0.3056128420935288, "percentage": 30.56, "elapsed_time": "12:58:26", "remaining_time": "1 day, 5:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5484, "total_steps": 17941, "loss": 1.8889, "learning_rate": 8.017100773312572e-05, "epoch": 0.3056685803466919, "percentage": 30.57, "elapsed_time": "12:58:34", "remaining_time": "1 day, 5:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5485, "total_steps": 17941, "loss": 1.8318, "learning_rate": 8.016390680813664e-05, "epoch": 0.3057243185998551, "percentage": 30.57, "elapsed_time": "12:58:43", "remaining_time": "1 day, 5:28:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5486, "total_steps": 17941, "loss": 1.4898, "learning_rate": 8.015680492652432e-05, "epoch": 0.30578005685301823, "percentage": 30.58, "elapsed_time": "12:58:51", "remaining_time": "1 day, 5:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5487, "total_steps": 17941, "loss": 1.622, "learning_rate": 8.014970208851395e-05, "epoch": 0.30583579510618136, "percentage": 30.58, "elapsed_time": "12:58:59", "remaining_time": "1 day, 5:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5488, "total_steps": 17941, "loss": 1.5932, "learning_rate": 8.014259829433082e-05, "epoch": 0.3058915333593445, "percentage": 30.59, "elapsed_time": "12:59:08", "remaining_time": "1 day, 5:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5489, "total_steps": 17941, "loss": 1.7663, "learning_rate": 8.013549354420022e-05, "epoch": 0.3059472716125077, "percentage": 30.59, "elapsed_time": "12:59:16", "remaining_time": "1 day, 5:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5490, "total_steps": 17941, "loss": 1.7812, "learning_rate": 8.012838783834749e-05, "epoch": 0.3060030098656708, "percentage": 30.6, "elapsed_time": "12:59:25", "remaining_time": "1 day, 5:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5491, "total_steps": 17941, "loss": 1.8031, "learning_rate": 8.012128117699793e-05, "epoch": 0.30605874811883393, "percentage": 30.61, "elapsed_time": "12:59:33", "remaining_time": "1 day, 5:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5492, "total_steps": 17941, "loss": 1.7483, "learning_rate": 8.011417356037697e-05, "epoch": 0.3061144863719971, "percentage": 30.61, "elapsed_time": "12:59:42", "remaining_time": "1 day, 5:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5493, "total_steps": 17941, "loss": 1.6449, "learning_rate": 8.010706498870997e-05, "epoch": 0.30617022462516025, "percentage": 30.62, "elapsed_time": "12:59:50", "remaining_time": "1 day, 5:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5494, "total_steps": 17941, "loss": 1.5837, "learning_rate": 8.009995546222242e-05, "epoch": 0.3062259628783234, "percentage": 30.62, "elapsed_time": "13:00:00", "remaining_time": "1 day, 5:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5495, "total_steps": 17941, "loss": 1.7239, "learning_rate": 8.009284498113979e-05, "epoch": 0.30628170113148656, "percentage": 30.63, "elapsed_time": "13:00:08", "remaining_time": "1 day, 5:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5496, "total_steps": 17941, "loss": 1.6928, "learning_rate": 8.008573354568756e-05, "epoch": 0.3063374393846497, "percentage": 30.63, "elapsed_time": "13:00:17", "remaining_time": "1 day, 5:26:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5497, "total_steps": 17941, "loss": 1.7299, "learning_rate": 8.007862115609129e-05, "epoch": 0.3063931776378128, "percentage": 30.64, "elapsed_time": "13:00:25", "remaining_time": "1 day, 5:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5498, "total_steps": 17941, "loss": 1.6299, "learning_rate": 8.007150781257651e-05, "epoch": 0.306448915890976, "percentage": 30.64, "elapsed_time": "13:00:33", "remaining_time": "1 day, 5:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5499, "total_steps": 17941, "loss": 1.6814, "learning_rate": 8.006439351536883e-05, "epoch": 0.30650465414413913, "percentage": 30.65, "elapsed_time": "13:00:42", "remaining_time": "1 day, 5:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5500, "total_steps": 17941, "loss": 1.7617, "learning_rate": 8.005727826469389e-05, "epoch": 0.30656039239730226, "percentage": 30.66, "elapsed_time": "13:00:50", "remaining_time": "1 day, 5:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5501, "total_steps": 17941, "loss": 1.913, "learning_rate": 8.005016206077731e-05, "epoch": 0.3066161306504654, "percentage": 30.66, "elapsed_time": "13:00:59", "remaining_time": "1 day, 5:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5502, "total_steps": 17941, "loss": 1.6782, "learning_rate": 8.004304490384482e-05, "epoch": 0.3066718689036286, "percentage": 30.67, "elapsed_time": "13:01:07", "remaining_time": "1 day, 5:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5503, "total_steps": 17941, "loss": 1.4965, "learning_rate": 8.003592679412208e-05, "epoch": 0.3067276071567917, "percentage": 30.67, "elapsed_time": "13:01:16", "remaining_time": "1 day, 5:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5504, "total_steps": 17941, "loss": 1.4724, "learning_rate": 8.00288077318349e-05, "epoch": 0.30678334540995483, "percentage": 30.68, "elapsed_time": "13:01:25", "remaining_time": "1 day, 5:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5505, "total_steps": 17941, "loss": 1.6722, "learning_rate": 8.0021687717209e-05, "epoch": 0.306839083663118, "percentage": 30.68, "elapsed_time": "13:01:33", "remaining_time": "1 day, 5:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5506, "total_steps": 17941, "loss": 1.8088, "learning_rate": 8.001456675047019e-05, "epoch": 0.30689482191628115, "percentage": 30.69, "elapsed_time": "13:01:41", "remaining_time": "1 day, 5:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5507, "total_steps": 17941, "loss": 1.5916, "learning_rate": 8.000744483184433e-05, "epoch": 0.3069505601694443, "percentage": 30.7, "elapsed_time": "13:01:50", "remaining_time": "1 day, 5:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5508, "total_steps": 17941, "loss": 1.8253, "learning_rate": 8.000032196155726e-05, "epoch": 0.30700629842260746, "percentage": 30.7, "elapsed_time": "13:01:58", "remaining_time": "1 day, 5:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5509, "total_steps": 17941, "loss": 1.7183, "learning_rate": 7.999319813983492e-05, "epoch": 0.3070620366757706, "percentage": 30.71, "elapsed_time": "13:02:07", "remaining_time": "1 day, 5:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5510, "total_steps": 17941, "loss": 1.8415, "learning_rate": 7.99860733669032e-05, "epoch": 0.3071177749289337, "percentage": 30.71, "elapsed_time": "13:02:15", "remaining_time": "1 day, 5:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5511, "total_steps": 17941, "loss": 1.8575, "learning_rate": 7.997894764298806e-05, "epoch": 0.30717351318209685, "percentage": 30.72, "elapsed_time": "13:02:24", "remaining_time": "1 day, 5:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5512, "total_steps": 17941, "loss": 1.6398, "learning_rate": 7.997182096831548e-05, "epoch": 0.30722925143526003, "percentage": 30.72, "elapsed_time": "13:02:32", "remaining_time": "1 day, 5:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5513, "total_steps": 17941, "loss": 2.0446, "learning_rate": 7.99646933431115e-05, "epoch": 0.30728498968842316, "percentage": 30.73, "elapsed_time": "13:02:41", "remaining_time": "1 day, 5:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5514, "total_steps": 17941, "loss": 1.7335, "learning_rate": 7.995756476760214e-05, "epoch": 0.3073407279415863, "percentage": 30.73, "elapsed_time": "13:02:49", "remaining_time": "1 day, 5:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5515, "total_steps": 17941, "loss": 1.6374, "learning_rate": 7.995043524201351e-05, "epoch": 0.3073964661947495, "percentage": 30.74, "elapsed_time": "13:02:58", "remaining_time": "1 day, 5:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5516, "total_steps": 17941, "loss": 1.8542, "learning_rate": 7.994330476657168e-05, "epoch": 0.3074522044479126, "percentage": 30.75, "elapsed_time": "13:03:08", "remaining_time": "1 day, 5:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5517, "total_steps": 17941, "loss": 1.74, "learning_rate": 7.993617334150282e-05, "epoch": 0.30750794270107573, "percentage": 30.75, "elapsed_time": "13:03:16", "remaining_time": "1 day, 5:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5518, "total_steps": 17941, "loss": 1.6844, "learning_rate": 7.992904096703307e-05, "epoch": 0.3075636809542389, "percentage": 30.76, "elapsed_time": "13:03:24", "remaining_time": "1 day, 5:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5519, "total_steps": 17941, "loss": 1.7397, "learning_rate": 7.992190764338864e-05, "epoch": 0.30761941920740205, "percentage": 30.76, "elapsed_time": "13:03:33", "remaining_time": "1 day, 5:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5520, "total_steps": 17941, "loss": 1.7361, "learning_rate": 7.991477337079576e-05, "epoch": 0.3076751574605652, "percentage": 30.77, "elapsed_time": "13:03:41", "remaining_time": "1 day, 5:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5521, "total_steps": 17941, "loss": 1.8819, "learning_rate": 7.990763814948068e-05, "epoch": 0.30773089571372836, "percentage": 30.77, "elapsed_time": "13:03:50", "remaining_time": "1 day, 5:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5522, "total_steps": 17941, "loss": 1.5405, "learning_rate": 7.99005019796697e-05, "epoch": 0.3077866339668915, "percentage": 30.78, "elapsed_time": "13:03:58", "remaining_time": "1 day, 5:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5523, "total_steps": 17941, "loss": 1.6712, "learning_rate": 7.989336486158912e-05, "epoch": 0.3078423722200546, "percentage": 30.78, "elapsed_time": "13:04:07", "remaining_time": "1 day, 5:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5524, "total_steps": 17941, "loss": 2.0319, "learning_rate": 7.988622679546529e-05, "epoch": 0.30789811047321775, "percentage": 30.79, "elapsed_time": "13:04:15", "remaining_time": "1 day, 5:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5525, "total_steps": 17941, "loss": 1.5891, "learning_rate": 7.987908778152462e-05, "epoch": 0.30795384872638093, "percentage": 30.8, "elapsed_time": "13:04:24", "remaining_time": "1 day, 5:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5526, "total_steps": 17941, "loss": 1.865, "learning_rate": 7.987194781999345e-05, "epoch": 0.30800958697954406, "percentage": 30.8, "elapsed_time": "13:04:32", "remaining_time": "1 day, 5:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5527, "total_steps": 17941, "loss": 1.5777, "learning_rate": 7.98648069110983e-05, "epoch": 0.3080653252327072, "percentage": 30.81, "elapsed_time": "13:04:41", "remaining_time": "1 day, 5:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5528, "total_steps": 17941, "loss": 1.8957, "learning_rate": 7.985766505506559e-05, "epoch": 0.3081210634858704, "percentage": 30.81, "elapsed_time": "13:04:49", "remaining_time": "1 day, 5:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5529, "total_steps": 17941, "loss": 1.7575, "learning_rate": 7.985052225212181e-05, "epoch": 0.3081768017390335, "percentage": 30.82, "elapsed_time": "13:04:58", "remaining_time": "1 day, 5:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5530, "total_steps": 17941, "loss": 1.7377, "learning_rate": 7.984337850249352e-05, "epoch": 0.30823253999219663, "percentage": 30.82, "elapsed_time": "13:05:06", "remaining_time": "1 day, 5:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5531, "total_steps": 17941, "loss": 1.7941, "learning_rate": 7.983623380640729e-05, "epoch": 0.3082882782453598, "percentage": 30.83, "elapsed_time": "13:05:14", "remaining_time": "1 day, 5:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5532, "total_steps": 17941, "loss": 1.8425, "learning_rate": 7.982908816408963e-05, "epoch": 0.30834401649852294, "percentage": 30.83, "elapsed_time": "13:05:23", "remaining_time": "1 day, 5:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5533, "total_steps": 17941, "loss": 1.6765, "learning_rate": 7.982194157576723e-05, "epoch": 0.3083997547516861, "percentage": 30.84, "elapsed_time": "13:05:31", "remaining_time": "1 day, 5:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5534, "total_steps": 17941, "loss": 1.8554, "learning_rate": 7.981479404166672e-05, "epoch": 0.3084554930048492, "percentage": 30.85, "elapsed_time": "13:05:40", "remaining_time": "1 day, 5:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5535, "total_steps": 17941, "loss": 1.6513, "learning_rate": 7.980764556201478e-05, "epoch": 0.3085112312580124, "percentage": 30.85, "elapsed_time": "13:05:49", "remaining_time": "1 day, 5:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5536, "total_steps": 17941, "loss": 1.7565, "learning_rate": 7.980049613703811e-05, "epoch": 0.3085669695111755, "percentage": 30.86, "elapsed_time": "13:05:57", "remaining_time": "1 day, 5:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5537, "total_steps": 17941, "loss": 1.6711, "learning_rate": 7.979334576696344e-05, "epoch": 0.30862270776433864, "percentage": 30.86, "elapsed_time": "13:06:05", "remaining_time": "1 day, 5:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5538, "total_steps": 17941, "loss": 1.8865, "learning_rate": 7.978619445201756e-05, "epoch": 0.30867844601750183, "percentage": 30.87, "elapsed_time": "13:06:14", "remaining_time": "1 day, 5:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5539, "total_steps": 17941, "loss": 1.9338, "learning_rate": 7.977904219242724e-05, "epoch": 0.30873418427066496, "percentage": 30.87, "elapsed_time": "13:06:22", "remaining_time": "1 day, 5:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5540, "total_steps": 17941, "loss": 1.778, "learning_rate": 7.977188898841936e-05, "epoch": 0.3087899225238281, "percentage": 30.88, "elapsed_time": "13:06:31", "remaining_time": "1 day, 5:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5541, "total_steps": 17941, "loss": 1.6528, "learning_rate": 7.976473484022071e-05, "epoch": 0.30884566077699127, "percentage": 30.88, "elapsed_time": "13:06:39", "remaining_time": "1 day, 5:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5542, "total_steps": 17941, "loss": 1.6939, "learning_rate": 7.975757974805824e-05, "epoch": 0.3089013990301544, "percentage": 30.89, "elapsed_time": "13:06:48", "remaining_time": "1 day, 5:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5543, "total_steps": 17941, "loss": 1.5085, "learning_rate": 7.975042371215881e-05, "epoch": 0.30895713728331753, "percentage": 30.9, "elapsed_time": "13:06:56", "remaining_time": "1 day, 5:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5544, "total_steps": 17941, "loss": 1.7745, "learning_rate": 7.974326673274943e-05, "epoch": 0.3090128755364807, "percentage": 30.9, "elapsed_time": "13:07:05", "remaining_time": "1 day, 5:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5545, "total_steps": 17941, "loss": 1.6344, "learning_rate": 7.973610881005702e-05, "epoch": 0.30906861378964384, "percentage": 30.91, "elapsed_time": "13:07:13", "remaining_time": "1 day, 5:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5546, "total_steps": 17941, "loss": 1.8173, "learning_rate": 7.972894994430862e-05, "epoch": 0.30912435204280697, "percentage": 30.91, "elapsed_time": "13:07:21", "remaining_time": "1 day, 5:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5547, "total_steps": 17941, "loss": 1.6173, "learning_rate": 7.972179013573125e-05, "epoch": 0.3091800902959701, "percentage": 30.92, "elapsed_time": "13:07:30", "remaining_time": "1 day, 5:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5548, "total_steps": 17941, "loss": 1.5781, "learning_rate": 7.971462938455199e-05, "epoch": 0.3092358285491333, "percentage": 30.92, "elapsed_time": "13:07:38", "remaining_time": "1 day, 5:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5549, "total_steps": 17941, "loss": 1.5528, "learning_rate": 7.970746769099795e-05, "epoch": 0.3092915668022964, "percentage": 30.93, "elapsed_time": "13:07:47", "remaining_time": "1 day, 5:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5550, "total_steps": 17941, "loss": 1.9145, "learning_rate": 7.970030505529624e-05, "epoch": 0.30934730505545954, "percentage": 30.93, "elapsed_time": "13:07:56", "remaining_time": "1 day, 5:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5551, "total_steps": 17941, "loss": 1.7875, "learning_rate": 7.969314147767399e-05, "epoch": 0.3094030433086227, "percentage": 30.94, "elapsed_time": "13:08:04", "remaining_time": "1 day, 5:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5552, "total_steps": 17941, "loss": 1.5879, "learning_rate": 7.968597695835844e-05, "epoch": 0.30945878156178586, "percentage": 30.95, "elapsed_time": "13:08:13", "remaining_time": "1 day, 5:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5553, "total_steps": 17941, "loss": 1.6178, "learning_rate": 7.967881149757678e-05, "epoch": 0.309514519814949, "percentage": 30.95, "elapsed_time": "13:08:21", "remaining_time": "1 day, 5:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5554, "total_steps": 17941, "loss": 1.7701, "learning_rate": 7.967164509555624e-05, "epoch": 0.30957025806811217, "percentage": 30.96, "elapsed_time": "13:08:30", "remaining_time": "1 day, 5:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5555, "total_steps": 17941, "loss": 1.5632, "learning_rate": 7.966447775252415e-05, "epoch": 0.3096259963212753, "percentage": 30.96, "elapsed_time": "13:08:38", "remaining_time": "1 day, 5:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5556, "total_steps": 17941, "loss": 1.7161, "learning_rate": 7.965730946870775e-05, "epoch": 0.3096817345744384, "percentage": 30.97, "elapsed_time": "13:08:47", "remaining_time": "1 day, 5:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5557, "total_steps": 17941, "loss": 1.7959, "learning_rate": 7.965014024433443e-05, "epoch": 0.30973747282760156, "percentage": 30.97, "elapsed_time": "13:08:55", "remaining_time": "1 day, 5:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5558, "total_steps": 17941, "loss": 1.8631, "learning_rate": 7.964297007963151e-05, "epoch": 0.30979321108076474, "percentage": 30.98, "elapsed_time": "13:09:04", "remaining_time": "1 day, 5:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5559, "total_steps": 17941, "loss": 1.7503, "learning_rate": 7.963579897482642e-05, "epoch": 0.30984894933392787, "percentage": 30.98, "elapsed_time": "13:09:12", "remaining_time": "1 day, 5:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5560, "total_steps": 17941, "loss": 1.6935, "learning_rate": 7.96286269301466e-05, "epoch": 0.309904687587091, "percentage": 30.99, "elapsed_time": "13:09:20", "remaining_time": "1 day, 5:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5561, "total_steps": 17941, "loss": 1.7342, "learning_rate": 7.962145394581944e-05, "epoch": 0.3099604258402542, "percentage": 31.0, "elapsed_time": "13:09:29", "remaining_time": "1 day, 5:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5562, "total_steps": 17941, "loss": 1.6875, "learning_rate": 7.961428002207249e-05, "epoch": 0.3100161640934173, "percentage": 31.0, "elapsed_time": "13:09:37", "remaining_time": "1 day, 5:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5563, "total_steps": 17941, "loss": 1.6991, "learning_rate": 7.960710515913323e-05, "epoch": 0.31007190234658044, "percentage": 31.01, "elapsed_time": "13:09:46", "remaining_time": "1 day, 5:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5564, "total_steps": 17941, "loss": 1.8622, "learning_rate": 7.959992935722924e-05, "epoch": 0.3101276405997436, "percentage": 31.01, "elapsed_time": "13:09:54", "remaining_time": "1 day, 5:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5565, "total_steps": 17941, "loss": 1.8244, "learning_rate": 7.959275261658804e-05, "epoch": 0.31018337885290675, "percentage": 31.02, "elapsed_time": "13:10:03", "remaining_time": "1 day, 5:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5566, "total_steps": 17941, "loss": 1.796, "learning_rate": 7.958557493743728e-05, "epoch": 0.3102391171060699, "percentage": 31.02, "elapsed_time": "13:10:11", "remaining_time": "1 day, 5:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5567, "total_steps": 17941, "loss": 2.2928, "learning_rate": 7.957839632000457e-05, "epoch": 0.31029485535923307, "percentage": 31.03, "elapsed_time": "13:10:20", "remaining_time": "1 day, 5:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5568, "total_steps": 17941, "loss": 1.5466, "learning_rate": 7.957121676451759e-05, "epoch": 0.3103505936123962, "percentage": 31.04, "elapsed_time": "13:10:28", "remaining_time": "1 day, 5:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5569, "total_steps": 17941, "loss": 1.7847, "learning_rate": 7.956403627120403e-05, "epoch": 0.3104063318655593, "percentage": 31.04, "elapsed_time": "13:10:37", "remaining_time": "1 day, 5:16:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5570, "total_steps": 17941, "loss": 1.752, "learning_rate": 7.95568548402916e-05, "epoch": 0.31046207011872246, "percentage": 31.05, "elapsed_time": "13:10:45", "remaining_time": "1 day, 5:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5571, "total_steps": 17941, "loss": 1.7436, "learning_rate": 7.954967247200806e-05, "epoch": 0.31051780837188564, "percentage": 31.05, "elapsed_time": "13:10:54", "remaining_time": "1 day, 5:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5572, "total_steps": 17941, "loss": 1.3893, "learning_rate": 7.95424891665812e-05, "epoch": 0.31057354662504877, "percentage": 31.06, "elapsed_time": "13:11:02", "remaining_time": "1 day, 5:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5573, "total_steps": 17941, "loss": 1.5228, "learning_rate": 7.953530492423884e-05, "epoch": 0.3106292848782119, "percentage": 31.06, "elapsed_time": "13:11:11", "remaining_time": "1 day, 5:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5574, "total_steps": 17941, "loss": 1.7454, "learning_rate": 7.95281197452088e-05, "epoch": 0.3106850231313751, "percentage": 31.07, "elapsed_time": "13:11:19", "remaining_time": "1 day, 5:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5575, "total_steps": 17941, "loss": 1.6264, "learning_rate": 7.952093362971897e-05, "epoch": 0.3107407613845382, "percentage": 31.07, "elapsed_time": "13:11:27", "remaining_time": "1 day, 5:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5576, "total_steps": 17941, "loss": 1.4175, "learning_rate": 7.951374657799724e-05, "epoch": 0.31079649963770134, "percentage": 31.08, "elapsed_time": "13:11:36", "remaining_time": "1 day, 5:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5577, "total_steps": 17941, "loss": 1.6686, "learning_rate": 7.950655859027154e-05, "epoch": 0.3108522378908645, "percentage": 31.09, "elapsed_time": "13:11:44", "remaining_time": "1 day, 5:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5578, "total_steps": 17941, "loss": 1.7351, "learning_rate": 7.949936966676984e-05, "epoch": 0.31090797614402765, "percentage": 31.09, "elapsed_time": "13:11:53", "remaining_time": "1 day, 5:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5579, "total_steps": 17941, "loss": 1.9914, "learning_rate": 7.949217980772012e-05, "epoch": 0.3109637143971908, "percentage": 31.1, "elapsed_time": "13:12:01", "remaining_time": "1 day, 5:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5580, "total_steps": 17941, "loss": 1.9362, "learning_rate": 7.948498901335042e-05, "epoch": 0.3110194526503539, "percentage": 31.1, "elapsed_time": "13:12:10", "remaining_time": "1 day, 5:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5581, "total_steps": 17941, "loss": 1.6922, "learning_rate": 7.947779728388878e-05, "epoch": 0.3110751909035171, "percentage": 31.11, "elapsed_time": "13:12:18", "remaining_time": "1 day, 5:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5582, "total_steps": 17941, "loss": 2.146, "learning_rate": 7.947060461956329e-05, "epoch": 0.3111309291566802, "percentage": 31.11, "elapsed_time": "13:12:27", "remaining_time": "1 day, 5:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5583, "total_steps": 17941, "loss": 1.7858, "learning_rate": 7.946341102060202e-05, "epoch": 0.31118666740984335, "percentage": 31.12, "elapsed_time": "13:12:35", "remaining_time": "1 day, 5:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5584, "total_steps": 17941, "loss": 1.6921, "learning_rate": 7.945621648723313e-05, "epoch": 0.31124240566300654, "percentage": 31.12, "elapsed_time": "13:12:43", "remaining_time": "1 day, 5:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5585, "total_steps": 17941, "loss": 1.7601, "learning_rate": 7.944902101968482e-05, "epoch": 0.31129814391616967, "percentage": 31.13, "elapsed_time": "13:12:52", "remaining_time": "1 day, 5:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5586, "total_steps": 17941, "loss": 1.6861, "learning_rate": 7.944182461818525e-05, "epoch": 0.3113538821693328, "percentage": 31.14, "elapsed_time": "13:13:01", "remaining_time": "1 day, 5:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5587, "total_steps": 17941, "loss": 1.4954, "learning_rate": 7.943462728296266e-05, "epoch": 0.311409620422496, "percentage": 31.14, "elapsed_time": "13:13:09", "remaining_time": "1 day, 5:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5588, "total_steps": 17941, "loss": 1.7086, "learning_rate": 7.942742901424531e-05, "epoch": 0.3114653586756591, "percentage": 31.15, "elapsed_time": "13:13:17", "remaining_time": "1 day, 5:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5589, "total_steps": 17941, "loss": 1.7788, "learning_rate": 7.942022981226149e-05, "epoch": 0.31152109692882224, "percentage": 31.15, "elapsed_time": "13:13:26", "remaining_time": "1 day, 5:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5590, "total_steps": 17941, "loss": 1.3316, "learning_rate": 7.941302967723951e-05, "epoch": 0.3115768351819854, "percentage": 31.16, "elapsed_time": "13:13:34", "remaining_time": "1 day, 5:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5591, "total_steps": 17941, "loss": 1.6683, "learning_rate": 7.940582860940771e-05, "epoch": 0.31163257343514855, "percentage": 31.16, "elapsed_time": "13:13:43", "remaining_time": "1 day, 5:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5592, "total_steps": 17941, "loss": 1.7344, "learning_rate": 7.939862660899448e-05, "epoch": 0.3116883116883117, "percentage": 31.17, "elapsed_time": "13:13:52", "remaining_time": "1 day, 5:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5593, "total_steps": 17941, "loss": 1.5524, "learning_rate": 7.939142367622823e-05, "epoch": 0.3117440499414748, "percentage": 31.17, "elapsed_time": "13:14:00", "remaining_time": "1 day, 5:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5594, "total_steps": 17941, "loss": 1.7415, "learning_rate": 7.938421981133738e-05, "epoch": 0.311799788194638, "percentage": 31.18, "elapsed_time": "13:14:08", "remaining_time": "1 day, 5:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5595, "total_steps": 17941, "loss": 1.5333, "learning_rate": 7.937701501455039e-05, "epoch": 0.3118555264478011, "percentage": 31.19, "elapsed_time": "13:14:17", "remaining_time": "1 day, 5:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5596, "total_steps": 17941, "loss": 1.8723, "learning_rate": 7.936980928609577e-05, "epoch": 0.31191126470096425, "percentage": 31.19, "elapsed_time": "13:14:26", "remaining_time": "1 day, 5:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5597, "total_steps": 17941, "loss": 1.8915, "learning_rate": 7.936260262620205e-05, "epoch": 0.31196700295412744, "percentage": 31.2, "elapsed_time": "13:14:34", "remaining_time": "1 day, 5:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5598, "total_steps": 17941, "loss": 1.8353, "learning_rate": 7.935539503509775e-05, "epoch": 0.31202274120729057, "percentage": 31.2, "elapsed_time": "13:14:43", "remaining_time": "1 day, 5:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5599, "total_steps": 17941, "loss": 1.832, "learning_rate": 7.934818651301148e-05, "epoch": 0.3120784794604537, "percentage": 31.21, "elapsed_time": "13:14:51", "remaining_time": "1 day, 5:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5600, "total_steps": 17941, "loss": 1.7301, "learning_rate": 7.934097706017185e-05, "epoch": 0.3121342177136169, "percentage": 31.21, "elapsed_time": "13:14:59", "remaining_time": "1 day, 5:11:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5601, "total_steps": 17941, "loss": 1.7095, "learning_rate": 7.93337666768075e-05, "epoch": 0.31218995596678, "percentage": 31.22, "elapsed_time": "13:15:08", "remaining_time": "1 day, 5:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5602, "total_steps": 17941, "loss": 1.6071, "learning_rate": 7.932655536314708e-05, "epoch": 0.31224569421994314, "percentage": 31.22, "elapsed_time": "13:15:16", "remaining_time": "1 day, 5:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5603, "total_steps": 17941, "loss": 1.5759, "learning_rate": 7.931934311941933e-05, "epoch": 0.31230143247310627, "percentage": 31.23, "elapsed_time": "13:15:25", "remaining_time": "1 day, 5:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5604, "total_steps": 17941, "loss": 1.5492, "learning_rate": 7.931212994585294e-05, "epoch": 0.31235717072626945, "percentage": 31.24, "elapsed_time": "13:15:33", "remaining_time": "1 day, 5:11:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5605, "total_steps": 17941, "loss": 1.7768, "learning_rate": 7.93049158426767e-05, "epoch": 0.3124129089794326, "percentage": 31.24, "elapsed_time": "13:15:42", "remaining_time": "1 day, 5:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5606, "total_steps": 17941, "loss": 1.6003, "learning_rate": 7.92977008101194e-05, "epoch": 0.3124686472325957, "percentage": 31.25, "elapsed_time": "13:15:50", "remaining_time": "1 day, 5:11:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5607, "total_steps": 17941, "loss": 1.7666, "learning_rate": 7.929048484840984e-05, "epoch": 0.3125243854857589, "percentage": 31.25, "elapsed_time": "13:15:59", "remaining_time": "1 day, 5:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5608, "total_steps": 17941, "loss": 1.7861, "learning_rate": 7.928326795777688e-05, "epoch": 0.312580123738922, "percentage": 31.26, "elapsed_time": "13:16:07", "remaining_time": "1 day, 5:10:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5609, "total_steps": 17941, "loss": 1.614, "learning_rate": 7.927605013844939e-05, "epoch": 0.31263586199208515, "percentage": 31.26, "elapsed_time": "13:16:15", "remaining_time": "1 day, 5:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5610, "total_steps": 17941, "loss": 1.7949, "learning_rate": 7.926883139065627e-05, "epoch": 0.31269160024524834, "percentage": 31.27, "elapsed_time": "13:16:24", "remaining_time": "1 day, 5:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5611, "total_steps": 17941, "loss": 1.8147, "learning_rate": 7.926161171462648e-05, "epoch": 0.31274733849841146, "percentage": 31.27, "elapsed_time": "13:16:32", "remaining_time": "1 day, 5:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5612, "total_steps": 17941, "loss": 1.7117, "learning_rate": 7.925439111058897e-05, "epoch": 0.3128030767515746, "percentage": 31.28, "elapsed_time": "13:16:41", "remaining_time": "1 day, 5:10:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5613, "total_steps": 17941, "loss": 1.6873, "learning_rate": 7.924716957877275e-05, "epoch": 0.3128588150047378, "percentage": 31.29, "elapsed_time": "13:16:49", "remaining_time": "1 day, 5:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5614, "total_steps": 17941, "loss": 2.136, "learning_rate": 7.92399471194068e-05, "epoch": 0.3129145532579009, "percentage": 31.29, "elapsed_time": "13:16:58", "remaining_time": "1 day, 5:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5615, "total_steps": 17941, "loss": 1.7105, "learning_rate": 7.923272373272024e-05, "epoch": 0.31297029151106404, "percentage": 31.3, "elapsed_time": "13:17:06", "remaining_time": "1 day, 5:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5616, "total_steps": 17941, "loss": 1.7117, "learning_rate": 7.922549941894212e-05, "epoch": 0.31302602976422716, "percentage": 31.3, "elapsed_time": "13:17:15", "remaining_time": "1 day, 5:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5617, "total_steps": 17941, "loss": 1.7621, "learning_rate": 7.921827417830155e-05, "epoch": 0.31308176801739035, "percentage": 31.31, "elapsed_time": "13:17:24", "remaining_time": "1 day, 5:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5618, "total_steps": 17941, "loss": 1.7155, "learning_rate": 7.921104801102766e-05, "epoch": 0.3131375062705535, "percentage": 31.31, "elapsed_time": "13:17:32", "remaining_time": "1 day, 5:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5619, "total_steps": 17941, "loss": 1.5615, "learning_rate": 7.920382091734966e-05, "epoch": 0.3131932445237166, "percentage": 31.32, "elapsed_time": "13:17:41", "remaining_time": "1 day, 5:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5620, "total_steps": 17941, "loss": 1.6964, "learning_rate": 7.919659289749673e-05, "epoch": 0.3132489827768798, "percentage": 31.32, "elapsed_time": "13:17:49", "remaining_time": "1 day, 5:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5621, "total_steps": 17941, "loss": 1.6701, "learning_rate": 7.918936395169809e-05, "epoch": 0.3133047210300429, "percentage": 31.33, "elapsed_time": "13:17:58", "remaining_time": "1 day, 5:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5622, "total_steps": 17941, "loss": 1.8372, "learning_rate": 7.918213408018302e-05, "epoch": 0.31336045928320605, "percentage": 31.34, "elapsed_time": "13:18:06", "remaining_time": "1 day, 5:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5623, "total_steps": 17941, "loss": 1.6181, "learning_rate": 7.91749032831808e-05, "epoch": 0.31341619753636923, "percentage": 31.34, "elapsed_time": "13:18:15", "remaining_time": "1 day, 5:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5624, "total_steps": 17941, "loss": 1.8816, "learning_rate": 7.916767156092073e-05, "epoch": 0.31347193578953236, "percentage": 31.35, "elapsed_time": "13:18:23", "remaining_time": "1 day, 5:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5625, "total_steps": 17941, "loss": 1.331, "learning_rate": 7.916043891363221e-05, "epoch": 0.3135276740426955, "percentage": 31.35, "elapsed_time": "13:18:32", "remaining_time": "1 day, 5:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5626, "total_steps": 17941, "loss": 1.7526, "learning_rate": 7.915320534154457e-05, "epoch": 0.3135834122958586, "percentage": 31.36, "elapsed_time": "13:18:40", "remaining_time": "1 day, 5:08:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5627, "total_steps": 17941, "loss": 1.7204, "learning_rate": 7.914597084488723e-05, "epoch": 0.3136391505490218, "percentage": 31.36, "elapsed_time": "13:18:49", "remaining_time": "1 day, 5:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5628, "total_steps": 17941, "loss": 1.8833, "learning_rate": 7.913873542388963e-05, "epoch": 0.31369488880218493, "percentage": 31.37, "elapsed_time": "13:18:58", "remaining_time": "1 day, 5:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5629, "total_steps": 17941, "loss": 1.9049, "learning_rate": 7.913149907878123e-05, "epoch": 0.31375062705534806, "percentage": 31.38, "elapsed_time": "13:19:06", "remaining_time": "1 day, 5:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5630, "total_steps": 17941, "loss": 2.005, "learning_rate": 7.912426180979152e-05, "epoch": 0.31380636530851125, "percentage": 31.38, "elapsed_time": "13:19:15", "remaining_time": "1 day, 5:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5631, "total_steps": 17941, "loss": 1.7476, "learning_rate": 7.911702361715006e-05, "epoch": 0.3138621035616744, "percentage": 31.39, "elapsed_time": "13:19:23", "remaining_time": "1 day, 5:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5632, "total_steps": 17941, "loss": 1.69, "learning_rate": 7.910978450108634e-05, "epoch": 0.3139178418148375, "percentage": 31.39, "elapsed_time": "13:19:32", "remaining_time": "1 day, 5:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5633, "total_steps": 17941, "loss": 1.7354, "learning_rate": 7.910254446183e-05, "epoch": 0.3139735800680007, "percentage": 31.4, "elapsed_time": "13:19:40", "remaining_time": "1 day, 5:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5634, "total_steps": 17941, "loss": 1.803, "learning_rate": 7.909530349961062e-05, "epoch": 0.3140293183211638, "percentage": 31.4, "elapsed_time": "13:19:49", "remaining_time": "1 day, 5:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5635, "total_steps": 17941, "loss": 1.8425, "learning_rate": 7.908806161465785e-05, "epoch": 0.31408505657432695, "percentage": 31.41, "elapsed_time": "13:19:57", "remaining_time": "1 day, 5:06:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5636, "total_steps": 17941, "loss": 1.7041, "learning_rate": 7.908081880720137e-05, "epoch": 0.31414079482749013, "percentage": 31.41, "elapsed_time": "13:20:06", "remaining_time": "1 day, 5:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5637, "total_steps": 17941, "loss": 1.5982, "learning_rate": 7.907357507747087e-05, "epoch": 0.31419653308065326, "percentage": 31.42, "elapsed_time": "13:20:14", "remaining_time": "1 day, 5:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5638, "total_steps": 17941, "loss": 1.6506, "learning_rate": 7.906633042569607e-05, "epoch": 0.3142522713338164, "percentage": 31.43, "elapsed_time": "13:20:23", "remaining_time": "1 day, 5:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5639, "total_steps": 17941, "loss": 1.675, "learning_rate": 7.905908485210674e-05, "epoch": 0.3143080095869795, "percentage": 31.43, "elapsed_time": "13:20:31", "remaining_time": "1 day, 5:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5640, "total_steps": 17941, "loss": 1.6702, "learning_rate": 7.905183835693266e-05, "epoch": 0.3143637478401427, "percentage": 31.44, "elapsed_time": "13:20:40", "remaining_time": "1 day, 5:06:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5641, "total_steps": 17941, "loss": 1.8156, "learning_rate": 7.904459094040366e-05, "epoch": 0.31441948609330583, "percentage": 31.44, "elapsed_time": "13:20:48", "remaining_time": "1 day, 5:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5642, "total_steps": 17941, "loss": 1.8198, "learning_rate": 7.903734260274958e-05, "epoch": 0.31447522434646896, "percentage": 31.45, "elapsed_time": "13:20:57", "remaining_time": "1 day, 5:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5643, "total_steps": 17941, "loss": 1.6291, "learning_rate": 7.903009334420027e-05, "epoch": 0.31453096259963215, "percentage": 31.45, "elapsed_time": "13:21:05", "remaining_time": "1 day, 5:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5644, "total_steps": 17941, "loss": 1.6026, "learning_rate": 7.902284316498567e-05, "epoch": 0.3145867008527953, "percentage": 31.46, "elapsed_time": "13:21:13", "remaining_time": "1 day, 5:05:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5645, "total_steps": 17941, "loss": 1.9096, "learning_rate": 7.901559206533571e-05, "epoch": 0.3146424391059584, "percentage": 31.46, "elapsed_time": "13:21:22", "remaining_time": "1 day, 5:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5646, "total_steps": 17941, "loss": 1.9637, "learning_rate": 7.900834004548034e-05, "epoch": 0.3146981773591216, "percentage": 31.47, "elapsed_time": "13:21:31", "remaining_time": "1 day, 5:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5647, "total_steps": 17941, "loss": 1.8217, "learning_rate": 7.900108710564954e-05, "epoch": 0.3147539156122847, "percentage": 31.48, "elapsed_time": "13:21:39", "remaining_time": "1 day, 5:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5648, "total_steps": 17941, "loss": 1.7018, "learning_rate": 7.899383324607336e-05, "epoch": 0.31480965386544785, "percentage": 31.48, "elapsed_time": "13:21:48", "remaining_time": "1 day, 5:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5649, "total_steps": 17941, "loss": 1.823, "learning_rate": 7.898657846698183e-05, "epoch": 0.314865392118611, "percentage": 31.49, "elapsed_time": "13:21:56", "remaining_time": "1 day, 5:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5650, "total_steps": 17941, "loss": 1.8531, "learning_rate": 7.897932276860502e-05, "epoch": 0.31492113037177416, "percentage": 31.49, "elapsed_time": "13:22:05", "remaining_time": "1 day, 5:04:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5651, "total_steps": 17941, "loss": 1.8, "learning_rate": 7.897206615117307e-05, "epoch": 0.3149768686249373, "percentage": 31.5, "elapsed_time": "13:22:13", "remaining_time": "1 day, 5:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5652, "total_steps": 17941, "loss": 1.8554, "learning_rate": 7.89648086149161e-05, "epoch": 0.3150326068781004, "percentage": 31.5, "elapsed_time": "13:22:22", "remaining_time": "1 day, 5:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5653, "total_steps": 17941, "loss": 1.9814, "learning_rate": 7.895755016006427e-05, "epoch": 0.3150883451312636, "percentage": 31.51, "elapsed_time": "13:22:31", "remaining_time": "1 day, 5:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5654, "total_steps": 17941, "loss": 1.6895, "learning_rate": 7.895029078684779e-05, "epoch": 0.31514408338442673, "percentage": 31.51, "elapsed_time": "13:22:39", "remaining_time": "1 day, 5:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5655, "total_steps": 17941, "loss": 1.4731, "learning_rate": 7.894303049549687e-05, "epoch": 0.31519982163758986, "percentage": 31.52, "elapsed_time": "13:22:48", "remaining_time": "1 day, 5:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5656, "total_steps": 17941, "loss": 1.819, "learning_rate": 7.893576928624178e-05, "epoch": 0.31525555989075305, "percentage": 31.53, "elapsed_time": "13:22:56", "remaining_time": "1 day, 5:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5657, "total_steps": 17941, "loss": 1.6023, "learning_rate": 7.89285071593128e-05, "epoch": 0.3153112981439162, "percentage": 31.53, "elapsed_time": "13:23:05", "remaining_time": "1 day, 5:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5658, "total_steps": 17941, "loss": 1.5903, "learning_rate": 7.892124411494022e-05, "epoch": 0.3153670363970793, "percentage": 31.54, "elapsed_time": "13:23:13", "remaining_time": "1 day, 5:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5659, "total_steps": 17941, "loss": 1.646, "learning_rate": 7.891398015335442e-05, "epoch": 0.3154227746502425, "percentage": 31.54, "elapsed_time": "13:23:22", "remaining_time": "1 day, 5:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5660, "total_steps": 17941, "loss": 1.3751, "learning_rate": 7.890671527478574e-05, "epoch": 0.3154785129034056, "percentage": 31.55, "elapsed_time": "13:23:30", "remaining_time": "1 day, 5:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5661, "total_steps": 17941, "loss": 1.6491, "learning_rate": 7.88994494794646e-05, "epoch": 0.31553425115656875, "percentage": 31.55, "elapsed_time": "13:23:39", "remaining_time": "1 day, 5:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5662, "total_steps": 17941, "loss": 1.5753, "learning_rate": 7.88921827676214e-05, "epoch": 0.3155899894097319, "percentage": 31.56, "elapsed_time": "13:23:47", "remaining_time": "1 day, 5:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5663, "total_steps": 17941, "loss": 1.8023, "learning_rate": 7.888491513948661e-05, "epoch": 0.31564572766289506, "percentage": 31.56, "elapsed_time": "13:23:56", "remaining_time": "1 day, 5:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5664, "total_steps": 17941, "loss": 1.6754, "learning_rate": 7.887764659529073e-05, "epoch": 0.3157014659160582, "percentage": 31.57, "elapsed_time": "13:24:04", "remaining_time": "1 day, 5:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5665, "total_steps": 17941, "loss": 1.6262, "learning_rate": 7.887037713526428e-05, "epoch": 0.3157572041692213, "percentage": 31.58, "elapsed_time": "13:24:12", "remaining_time": "1 day, 5:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5666, "total_steps": 17941, "loss": 1.5649, "learning_rate": 7.88631067596378e-05, "epoch": 0.3158129424223845, "percentage": 31.58, "elapsed_time": "13:24:21", "remaining_time": "1 day, 5:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5667, "total_steps": 17941, "loss": 1.4968, "learning_rate": 7.885583546864184e-05, "epoch": 0.31586868067554763, "percentage": 31.59, "elapsed_time": "13:24:29", "remaining_time": "1 day, 5:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5668, "total_steps": 17941, "loss": 1.5559, "learning_rate": 7.884856326250703e-05, "epoch": 0.31592441892871076, "percentage": 31.59, "elapsed_time": "13:24:38", "remaining_time": "1 day, 5:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5669, "total_steps": 17941, "loss": 1.8384, "learning_rate": 7.884129014146397e-05, "epoch": 0.31598015718187394, "percentage": 31.6, "elapsed_time": "13:24:46", "remaining_time": "1 day, 5:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5670, "total_steps": 17941, "loss": 1.9506, "learning_rate": 7.883401610574336e-05, "epoch": 0.3160358954350371, "percentage": 31.6, "elapsed_time": "13:24:55", "remaining_time": "1 day, 5:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5671, "total_steps": 17941, "loss": 1.6864, "learning_rate": 7.882674115557587e-05, "epoch": 0.3160916336882002, "percentage": 31.61, "elapsed_time": "13:25:03", "remaining_time": "1 day, 5:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5672, "total_steps": 17941, "loss": 1.9635, "learning_rate": 7.881946529119223e-05, "epoch": 0.31614737194136333, "percentage": 31.61, "elapsed_time": "13:25:12", "remaining_time": "1 day, 5:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5673, "total_steps": 17941, "loss": 1.5806, "learning_rate": 7.881218851282317e-05, "epoch": 0.3162031101945265, "percentage": 31.62, "elapsed_time": "13:25:20", "remaining_time": "1 day, 5:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5674, "total_steps": 17941, "loss": 1.7419, "learning_rate": 7.880491082069949e-05, "epoch": 0.31625884844768964, "percentage": 31.63, "elapsed_time": "13:25:29", "remaining_time": "1 day, 5:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5675, "total_steps": 17941, "loss": 1.7392, "learning_rate": 7.879763221505197e-05, "epoch": 0.3163145867008528, "percentage": 31.63, "elapsed_time": "13:25:37", "remaining_time": "1 day, 5:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5676, "total_steps": 17941, "loss": 1.6862, "learning_rate": 7.879035269611146e-05, "epoch": 0.31637032495401596, "percentage": 31.64, "elapsed_time": "13:25:45", "remaining_time": "1 day, 5:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5677, "total_steps": 17941, "loss": 1.8253, "learning_rate": 7.878307226410882e-05, "epoch": 0.3164260632071791, "percentage": 31.64, "elapsed_time": "13:25:54", "remaining_time": "1 day, 5:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5678, "total_steps": 17941, "loss": 1.7754, "learning_rate": 7.877579091927496e-05, "epoch": 0.3164818014603422, "percentage": 31.65, "elapsed_time": "13:26:02", "remaining_time": "1 day, 5:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5679, "total_steps": 17941, "loss": 1.7315, "learning_rate": 7.876850866184077e-05, "epoch": 0.3165375397135054, "percentage": 31.65, "elapsed_time": "13:26:11", "remaining_time": "1 day, 5:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5680, "total_steps": 17941, "loss": 1.5367, "learning_rate": 7.876122549203723e-05, "epoch": 0.31659327796666853, "percentage": 31.66, "elapsed_time": "13:26:19", "remaining_time": "1 day, 5:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5681, "total_steps": 17941, "loss": 1.7551, "learning_rate": 7.87539414100953e-05, "epoch": 0.31664901621983166, "percentage": 31.66, "elapsed_time": "13:26:29", "remaining_time": "1 day, 5:00:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5682, "total_steps": 17941, "loss": 1.7739, "learning_rate": 7.874665641624599e-05, "epoch": 0.31670475447299484, "percentage": 31.67, "elapsed_time": "13:26:37", "remaining_time": "1 day, 5:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5683, "total_steps": 17941, "loss": 1.747, "learning_rate": 7.873937051072035e-05, "epoch": 0.31676049272615797, "percentage": 31.68, "elapsed_time": "13:26:45", "remaining_time": "1 day, 5:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5684, "total_steps": 17941, "loss": 1.8224, "learning_rate": 7.873208369374943e-05, "epoch": 0.3168162309793211, "percentage": 31.68, "elapsed_time": "13:26:54", "remaining_time": "1 day, 5:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5685, "total_steps": 17941, "loss": 1.6589, "learning_rate": 7.872479596556435e-05, "epoch": 0.31687196923248423, "percentage": 31.69, "elapsed_time": "13:27:02", "remaining_time": "1 day, 4:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5686, "total_steps": 17941, "loss": 1.6122, "learning_rate": 7.871750732639621e-05, "epoch": 0.3169277074856474, "percentage": 31.69, "elapsed_time": "13:27:11", "remaining_time": "1 day, 4:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5687, "total_steps": 17941, "loss": 1.766, "learning_rate": 7.871021777647618e-05, "epoch": 0.31698344573881054, "percentage": 31.7, "elapsed_time": "13:27:19", "remaining_time": "1 day, 4:59:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5688, "total_steps": 17941, "loss": 1.765, "learning_rate": 7.870292731603544e-05, "epoch": 0.31703918399197367, "percentage": 31.7, "elapsed_time": "13:27:28", "remaining_time": "1 day, 4:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5689, "total_steps": 17941, "loss": 1.6374, "learning_rate": 7.869563594530517e-05, "epoch": 0.31709492224513686, "percentage": 31.71, "elapsed_time": "13:27:36", "remaining_time": "1 day, 4:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5690, "total_steps": 17941, "loss": 1.8048, "learning_rate": 7.868834366451665e-05, "epoch": 0.3171506604983, "percentage": 31.72, "elapsed_time": "13:27:45", "remaining_time": "1 day, 4:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5691, "total_steps": 17941, "loss": 2.1298, "learning_rate": 7.868105047390113e-05, "epoch": 0.3172063987514631, "percentage": 31.72, "elapsed_time": "13:27:53", "remaining_time": "1 day, 4:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5692, "total_steps": 17941, "loss": 1.6, "learning_rate": 7.867375637368993e-05, "epoch": 0.3172621370046263, "percentage": 31.73, "elapsed_time": "13:28:01", "remaining_time": "1 day, 4:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5693, "total_steps": 17941, "loss": 1.7876, "learning_rate": 7.866646136411433e-05, "epoch": 0.31731787525778943, "percentage": 31.73, "elapsed_time": "13:28:10", "remaining_time": "1 day, 4:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5694, "total_steps": 17941, "loss": 1.7237, "learning_rate": 7.865916544540573e-05, "epoch": 0.31737361351095256, "percentage": 31.74, "elapsed_time": "13:28:18", "remaining_time": "1 day, 4:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5695, "total_steps": 17941, "loss": 1.5221, "learning_rate": 7.865186861779548e-05, "epoch": 0.3174293517641157, "percentage": 31.74, "elapsed_time": "13:28:27", "remaining_time": "1 day, 4:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5696, "total_steps": 17941, "loss": 1.7575, "learning_rate": 7.864457088151502e-05, "epoch": 0.31748509001727887, "percentage": 31.75, "elapsed_time": "13:28:35", "remaining_time": "1 day, 4:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5697, "total_steps": 17941, "loss": 1.789, "learning_rate": 7.863727223679578e-05, "epoch": 0.317540828270442, "percentage": 31.75, "elapsed_time": "13:28:44", "remaining_time": "1 day, 4:58:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5698, "total_steps": 17941, "loss": 1.802, "learning_rate": 7.862997268386924e-05, "epoch": 0.31759656652360513, "percentage": 31.76, "elapsed_time": "13:28:52", "remaining_time": "1 day, 4:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5699, "total_steps": 17941, "loss": 2.0765, "learning_rate": 7.862267222296687e-05, "epoch": 0.3176523047767683, "percentage": 31.77, "elapsed_time": "13:29:01", "remaining_time": "1 day, 4:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5700, "total_steps": 17941, "loss": 1.5644, "learning_rate": 7.861537085432025e-05, "epoch": 0.31770804302993144, "percentage": 31.77, "elapsed_time": "13:29:09", "remaining_time": "1 day, 4:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5701, "total_steps": 17941, "loss": 1.7291, "learning_rate": 7.860806857816088e-05, "epoch": 0.31776378128309457, "percentage": 31.78, "elapsed_time": "13:29:18", "remaining_time": "1 day, 4:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5702, "total_steps": 17941, "loss": 1.9244, "learning_rate": 7.860076539472037e-05, "epoch": 0.31781951953625776, "percentage": 31.78, "elapsed_time": "13:29:26", "remaining_time": "1 day, 4:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5703, "total_steps": 17941, "loss": 1.7579, "learning_rate": 7.859346130423035e-05, "epoch": 0.3178752577894209, "percentage": 31.79, "elapsed_time": "13:29:34", "remaining_time": "1 day, 4:57:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5704, "total_steps": 17941, "loss": 1.5755, "learning_rate": 7.858615630692244e-05, "epoch": 0.317930996042584, "percentage": 31.79, "elapsed_time": "13:29:43", "remaining_time": "1 day, 4:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5705, "total_steps": 17941, "loss": 1.6979, "learning_rate": 7.857885040302833e-05, "epoch": 0.3179867342957472, "percentage": 31.8, "elapsed_time": "13:29:51", "remaining_time": "1 day, 4:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5706, "total_steps": 17941, "loss": 1.6744, "learning_rate": 7.857154359277972e-05, "epoch": 0.3180424725489103, "percentage": 31.8, "elapsed_time": "13:30:00", "remaining_time": "1 day, 4:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5707, "total_steps": 17941, "loss": 1.8986, "learning_rate": 7.85642358764083e-05, "epoch": 0.31809821080207346, "percentage": 31.81, "elapsed_time": "13:30:08", "remaining_time": "1 day, 4:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5708, "total_steps": 17941, "loss": 1.5641, "learning_rate": 7.855692725414587e-05, "epoch": 0.3181539490552366, "percentage": 31.82, "elapsed_time": "13:30:17", "remaining_time": "1 day, 4:56:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5709, "total_steps": 17941, "loss": 1.6743, "learning_rate": 7.854961772622423e-05, "epoch": 0.31820968730839977, "percentage": 31.82, "elapsed_time": "13:30:25", "remaining_time": "1 day, 4:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5710, "total_steps": 17941, "loss": 1.5466, "learning_rate": 7.854230729287515e-05, "epoch": 0.3182654255615629, "percentage": 31.83, "elapsed_time": "13:30:34", "remaining_time": "1 day, 4:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5711, "total_steps": 17941, "loss": 1.7647, "learning_rate": 7.853499595433049e-05, "epoch": 0.318321163814726, "percentage": 31.83, "elapsed_time": "13:30:42", "remaining_time": "1 day, 4:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5712, "total_steps": 17941, "loss": 1.6237, "learning_rate": 7.852768371082215e-05, "epoch": 0.3183769020678892, "percentage": 31.84, "elapsed_time": "13:30:51", "remaining_time": "1 day, 4:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5713, "total_steps": 17941, "loss": 1.9955, "learning_rate": 7.852037056258199e-05, "epoch": 0.31843264032105234, "percentage": 31.84, "elapsed_time": "13:31:00", "remaining_time": "1 day, 4:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5714, "total_steps": 17941, "loss": 1.5985, "learning_rate": 7.851305650984197e-05, "epoch": 0.31848837857421547, "percentage": 31.85, "elapsed_time": "13:31:09", "remaining_time": "1 day, 4:55:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5715, "total_steps": 17941, "loss": 1.6371, "learning_rate": 7.850574155283404e-05, "epoch": 0.31854411682737865, "percentage": 31.85, "elapsed_time": "13:31:17", "remaining_time": "1 day, 4:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5716, "total_steps": 17941, "loss": 2.0647, "learning_rate": 7.849842569179017e-05, "epoch": 0.3185998550805418, "percentage": 31.86, "elapsed_time": "13:31:25", "remaining_time": "1 day, 4:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5717, "total_steps": 17941, "loss": 1.8005, "learning_rate": 7.849110892694242e-05, "epoch": 0.3186555933337049, "percentage": 31.87, "elapsed_time": "13:31:34", "remaining_time": "1 day, 4:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5718, "total_steps": 17941, "loss": 1.9861, "learning_rate": 7.848379125852282e-05, "epoch": 0.31871133158686804, "percentage": 31.87, "elapsed_time": "13:31:42", "remaining_time": "1 day, 4:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5719, "total_steps": 17941, "loss": 1.6806, "learning_rate": 7.847647268676341e-05, "epoch": 0.3187670698400312, "percentage": 31.88, "elapsed_time": "13:31:51", "remaining_time": "1 day, 4:55:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5720, "total_steps": 17941, "loss": 1.7323, "learning_rate": 7.846915321189632e-05, "epoch": 0.31882280809319435, "percentage": 31.88, "elapsed_time": "13:32:00", "remaining_time": "1 day, 4:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5721, "total_steps": 17941, "loss": 1.7307, "learning_rate": 7.846183283415367e-05, "epoch": 0.3188785463463575, "percentage": 31.89, "elapsed_time": "13:32:09", "remaining_time": "1 day, 4:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5722, "total_steps": 17941, "loss": 1.679, "learning_rate": 7.845451155376764e-05, "epoch": 0.31893428459952067, "percentage": 31.89, "elapsed_time": "13:32:17", "remaining_time": "1 day, 4:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5723, "total_steps": 17941, "loss": 1.6991, "learning_rate": 7.844718937097039e-05, "epoch": 0.3189900228526838, "percentage": 31.9, "elapsed_time": "13:32:26", "remaining_time": "1 day, 4:54:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5724, "total_steps": 17941, "loss": 1.4701, "learning_rate": 7.843986628599416e-05, "epoch": 0.3190457611058469, "percentage": 31.9, "elapsed_time": "13:32:34", "remaining_time": "1 day, 4:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5725, "total_steps": 17941, "loss": 1.7293, "learning_rate": 7.843254229907119e-05, "epoch": 0.3191014993590101, "percentage": 31.91, "elapsed_time": "13:32:42", "remaining_time": "1 day, 4:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5726, "total_steps": 17941, "loss": 1.6067, "learning_rate": 7.842521741043375e-05, "epoch": 0.31915723761217324, "percentage": 31.92, "elapsed_time": "13:32:51", "remaining_time": "1 day, 4:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5727, "total_steps": 17941, "loss": 1.8573, "learning_rate": 7.841789162031415e-05, "epoch": 0.31921297586533637, "percentage": 31.92, "elapsed_time": "13:32:59", "remaining_time": "1 day, 4:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5728, "total_steps": 17941, "loss": 1.7482, "learning_rate": 7.84105649289447e-05, "epoch": 0.31926871411849955, "percentage": 31.93, "elapsed_time": "13:33:08", "remaining_time": "1 day, 4:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5729, "total_steps": 17941, "loss": 1.8564, "learning_rate": 7.840323733655778e-05, "epoch": 0.3193244523716627, "percentage": 31.93, "elapsed_time": "13:33:16", "remaining_time": "1 day, 4:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5730, "total_steps": 17941, "loss": 1.4677, "learning_rate": 7.839590884338579e-05, "epoch": 0.3193801906248258, "percentage": 31.94, "elapsed_time": "13:33:25", "remaining_time": "1 day, 4:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5731, "total_steps": 17941, "loss": 1.7656, "learning_rate": 7.838857944966113e-05, "epoch": 0.31943592887798894, "percentage": 31.94, "elapsed_time": "13:33:33", "remaining_time": "1 day, 4:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5732, "total_steps": 17941, "loss": 1.525, "learning_rate": 7.838124915561623e-05, "epoch": 0.3194916671311521, "percentage": 31.95, "elapsed_time": "13:33:41", "remaining_time": "1 day, 4:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5733, "total_steps": 17941, "loss": 1.9737, "learning_rate": 7.837391796148359e-05, "epoch": 0.31954740538431525, "percentage": 31.95, "elapsed_time": "13:33:50", "remaining_time": "1 day, 4:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5734, "total_steps": 17941, "loss": 1.6783, "learning_rate": 7.83665858674957e-05, "epoch": 0.3196031436374784, "percentage": 31.96, "elapsed_time": "13:33:58", "remaining_time": "1 day, 4:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5735, "total_steps": 17941, "loss": 1.5786, "learning_rate": 7.835925287388511e-05, "epoch": 0.31965888189064157, "percentage": 31.97, "elapsed_time": "13:34:07", "remaining_time": "1 day, 4:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5736, "total_steps": 17941, "loss": 1.7969, "learning_rate": 7.835191898088435e-05, "epoch": 0.3197146201438047, "percentage": 31.97, "elapsed_time": "13:34:15", "remaining_time": "1 day, 4:52:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5737, "total_steps": 17941, "loss": 1.619, "learning_rate": 7.8344584188726e-05, "epoch": 0.3197703583969678, "percentage": 31.98, "elapsed_time": "13:34:24", "remaining_time": "1 day, 4:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5738, "total_steps": 17941, "loss": 1.6193, "learning_rate": 7.833724849764273e-05, "epoch": 0.319826096650131, "percentage": 31.98, "elapsed_time": "13:34:32", "remaining_time": "1 day, 4:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5739, "total_steps": 17941, "loss": 1.7853, "learning_rate": 7.832991190786716e-05, "epoch": 0.31988183490329414, "percentage": 31.99, "elapsed_time": "13:34:41", "remaining_time": "1 day, 4:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5740, "total_steps": 17941, "loss": 1.8835, "learning_rate": 7.832257441963195e-05, "epoch": 0.31993757315645727, "percentage": 31.99, "elapsed_time": "13:34:50", "remaining_time": "1 day, 4:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5741, "total_steps": 17941, "loss": 2.1082, "learning_rate": 7.83152360331698e-05, "epoch": 0.3199933114096204, "percentage": 32.0, "elapsed_time": "13:34:58", "remaining_time": "1 day, 4:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5742, "total_steps": 17941, "loss": 1.7184, "learning_rate": 7.830789674871346e-05, "epoch": 0.3200490496627836, "percentage": 32.0, "elapsed_time": "13:35:07", "remaining_time": "1 day, 4:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5743, "total_steps": 17941, "loss": 1.5133, "learning_rate": 7.830055656649568e-05, "epoch": 0.3201047879159467, "percentage": 32.01, "elapsed_time": "13:35:15", "remaining_time": "1 day, 4:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5744, "total_steps": 17941, "loss": 1.6203, "learning_rate": 7.829321548674926e-05, "epoch": 0.32016052616910984, "percentage": 32.02, "elapsed_time": "13:35:24", "remaining_time": "1 day, 4:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5745, "total_steps": 17941, "loss": 1.8658, "learning_rate": 7.8285873509707e-05, "epoch": 0.320216264422273, "percentage": 32.02, "elapsed_time": "13:35:32", "remaining_time": "1 day, 4:51:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5746, "total_steps": 17941, "loss": 1.509, "learning_rate": 7.827853063560175e-05, "epoch": 0.32027200267543615, "percentage": 32.03, "elapsed_time": "13:35:41", "remaining_time": "1 day, 4:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5747, "total_steps": 17941, "loss": 1.8333, "learning_rate": 7.82711868646664e-05, "epoch": 0.3203277409285993, "percentage": 32.03, "elapsed_time": "13:35:49", "remaining_time": "1 day, 4:51:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5748, "total_steps": 17941, "loss": 1.6984, "learning_rate": 7.82638421971338e-05, "epoch": 0.32038347918176246, "percentage": 32.04, "elapsed_time": "13:35:58", "remaining_time": "1 day, 4:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5749, "total_steps": 17941, "loss": 1.6667, "learning_rate": 7.825649663323693e-05, "epoch": 0.3204392174349256, "percentage": 32.04, "elapsed_time": "13:36:06", "remaining_time": "1 day, 4:50:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5750, "total_steps": 17941, "loss": 1.7763, "learning_rate": 7.824915017320874e-05, "epoch": 0.3204949556880887, "percentage": 32.05, "elapsed_time": "13:36:15", "remaining_time": "1 day, 4:50:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5751, "total_steps": 17941, "loss": 1.5632, "learning_rate": 7.824180281728222e-05, "epoch": 0.3205506939412519, "percentage": 32.06, "elapsed_time": "13:36:23", "remaining_time": "1 day, 4:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5752, "total_steps": 17941, "loss": 1.8129, "learning_rate": 7.823445456569036e-05, "epoch": 0.32060643219441504, "percentage": 32.06, "elapsed_time": "13:36:31", "remaining_time": "1 day, 4:50:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5753, "total_steps": 17941, "loss": 1.8126, "learning_rate": 7.822710541866622e-05, "epoch": 0.32066217044757817, "percentage": 32.07, "elapsed_time": "13:36:40", "remaining_time": "1 day, 4:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5754, "total_steps": 17941, "loss": 1.7802, "learning_rate": 7.821975537644286e-05, "epoch": 0.3207179087007413, "percentage": 32.07, "elapsed_time": "13:36:48", "remaining_time": "1 day, 4:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5755, "total_steps": 17941, "loss": 1.9406, "learning_rate": 7.821240443925341e-05, "epoch": 0.3207736469539045, "percentage": 32.08, "elapsed_time": "13:36:57", "remaining_time": "1 day, 4:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5756, "total_steps": 17941, "loss": 1.4748, "learning_rate": 7.820505260733098e-05, "epoch": 0.3208293852070676, "percentage": 32.08, "elapsed_time": "13:37:06", "remaining_time": "1 day, 4:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5757, "total_steps": 17941, "loss": 1.716, "learning_rate": 7.819769988090873e-05, "epoch": 0.32088512346023074, "percentage": 32.09, "elapsed_time": "13:37:14", "remaining_time": "1 day, 4:49:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5758, "total_steps": 17941, "loss": 1.8005, "learning_rate": 7.819034626021983e-05, "epoch": 0.3209408617133939, "percentage": 32.09, "elapsed_time": "13:37:23", "remaining_time": "1 day, 4:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5759, "total_steps": 17941, "loss": 1.675, "learning_rate": 7.818299174549752e-05, "epoch": 0.32099659996655705, "percentage": 32.1, "elapsed_time": "13:37:31", "remaining_time": "1 day, 4:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5760, "total_steps": 17941, "loss": 1.9635, "learning_rate": 7.817563633697503e-05, "epoch": 0.3210523382197202, "percentage": 32.11, "elapsed_time": "13:37:40", "remaining_time": "1 day, 4:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5761, "total_steps": 17941, "loss": 1.7265, "learning_rate": 7.816828003488563e-05, "epoch": 0.32110807647288336, "percentage": 32.11, "elapsed_time": "13:37:49", "remaining_time": "1 day, 4:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5762, "total_steps": 17941, "loss": 1.6653, "learning_rate": 7.816092283946261e-05, "epoch": 0.3211638147260465, "percentage": 32.12, "elapsed_time": "13:37:58", "remaining_time": "1 day, 4:48:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5763, "total_steps": 17941, "loss": 1.6578, "learning_rate": 7.815356475093931e-05, "epoch": 0.3212195529792096, "percentage": 32.12, "elapsed_time": "13:38:06", "remaining_time": "1 day, 4:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5764, "total_steps": 17941, "loss": 1.787, "learning_rate": 7.81462057695491e-05, "epoch": 0.32127529123237275, "percentage": 32.13, "elapsed_time": "13:38:14", "remaining_time": "1 day, 4:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5765, "total_steps": 17941, "loss": 1.5927, "learning_rate": 7.813884589552534e-05, "epoch": 0.32133102948553594, "percentage": 32.13, "elapsed_time": "13:38:23", "remaining_time": "1 day, 4:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5766, "total_steps": 17941, "loss": 1.7973, "learning_rate": 7.813148512910144e-05, "epoch": 0.32138676773869906, "percentage": 32.14, "elapsed_time": "13:38:31", "remaining_time": "1 day, 4:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5767, "total_steps": 17941, "loss": 1.7949, "learning_rate": 7.812412347051083e-05, "epoch": 0.3214425059918622, "percentage": 32.14, "elapsed_time": "13:38:40", "remaining_time": "1 day, 4:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5768, "total_steps": 17941, "loss": 1.7011, "learning_rate": 7.811676091998704e-05, "epoch": 0.3214982442450254, "percentage": 32.15, "elapsed_time": "13:38:48", "remaining_time": "1 day, 4:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5769, "total_steps": 17941, "loss": 1.7513, "learning_rate": 7.81093974777635e-05, "epoch": 0.3215539824981885, "percentage": 32.16, "elapsed_time": "13:38:57", "remaining_time": "1 day, 4:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5770, "total_steps": 17941, "loss": 1.9528, "learning_rate": 7.810203314407377e-05, "epoch": 0.32160972075135164, "percentage": 32.16, "elapsed_time": "13:39:05", "remaining_time": "1 day, 4:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5771, "total_steps": 17941, "loss": 1.6544, "learning_rate": 7.80946679191514e-05, "epoch": 0.3216654590045148, "percentage": 32.17, "elapsed_time": "13:39:14", "remaining_time": "1 day, 4:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5772, "total_steps": 17941, "loss": 1.6561, "learning_rate": 7.808730180322996e-05, "epoch": 0.32172119725767795, "percentage": 32.17, "elapsed_time": "13:39:22", "remaining_time": "1 day, 4:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5773, "total_steps": 17941, "loss": 1.6776, "learning_rate": 7.807993479654307e-05, "epoch": 0.3217769355108411, "percentage": 32.18, "elapsed_time": "13:39:30", "remaining_time": "1 day, 4:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5774, "total_steps": 17941, "loss": 1.6976, "learning_rate": 7.807256689932435e-05, "epoch": 0.32183267376400426, "percentage": 32.18, "elapsed_time": "13:39:39", "remaining_time": "1 day, 4:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5775, "total_steps": 17941, "loss": 1.4983, "learning_rate": 7.806519811180751e-05, "epoch": 0.3218884120171674, "percentage": 32.19, "elapsed_time": "13:39:47", "remaining_time": "1 day, 4:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5776, "total_steps": 17941, "loss": 1.7632, "learning_rate": 7.805782843422618e-05, "epoch": 0.3219441502703305, "percentage": 32.19, "elapsed_time": "13:39:56", "remaining_time": "1 day, 4:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5777, "total_steps": 17941, "loss": 1.6873, "learning_rate": 7.805045786681415e-05, "epoch": 0.32199988852349365, "percentage": 32.2, "elapsed_time": "13:40:04", "remaining_time": "1 day, 4:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5778, "total_steps": 17941, "loss": 1.6692, "learning_rate": 7.804308640980513e-05, "epoch": 0.32205562677665683, "percentage": 32.21, "elapsed_time": "13:40:13", "remaining_time": "1 day, 4:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5779, "total_steps": 17941, "loss": 1.631, "learning_rate": 7.803571406343293e-05, "epoch": 0.32211136502981996, "percentage": 32.21, "elapsed_time": "13:40:21", "remaining_time": "1 day, 4:46:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5780, "total_steps": 17941, "loss": 1.4774, "learning_rate": 7.802834082793131e-05, "epoch": 0.3221671032829831, "percentage": 32.22, "elapsed_time": "13:40:30", "remaining_time": "1 day, 4:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5781, "total_steps": 17941, "loss": 1.9247, "learning_rate": 7.802096670353416e-05, "epoch": 0.3222228415361463, "percentage": 32.22, "elapsed_time": "13:40:39", "remaining_time": "1 day, 4:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5782, "total_steps": 17941, "loss": 1.9075, "learning_rate": 7.80135916904753e-05, "epoch": 0.3222785797893094, "percentage": 32.23, "elapsed_time": "13:40:48", "remaining_time": "1 day, 4:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5783, "total_steps": 17941, "loss": 1.6338, "learning_rate": 7.800621578898867e-05, "epoch": 0.32233431804247253, "percentage": 32.23, "elapsed_time": "13:40:56", "remaining_time": "1 day, 4:45:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5784, "total_steps": 17941, "loss": 1.6214, "learning_rate": 7.799883899930815e-05, "epoch": 0.3223900562956357, "percentage": 32.24, "elapsed_time": "13:41:05", "remaining_time": "1 day, 4:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5785, "total_steps": 17941, "loss": 1.7258, "learning_rate": 7.79914613216677e-05, "epoch": 0.32244579454879885, "percentage": 32.24, "elapsed_time": "13:41:13", "remaining_time": "1 day, 4:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5786, "total_steps": 17941, "loss": 1.6471, "learning_rate": 7.798408275630129e-05, "epoch": 0.322501532801962, "percentage": 32.25, "elapsed_time": "13:41:22", "remaining_time": "1 day, 4:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5787, "total_steps": 17941, "loss": 1.7154, "learning_rate": 7.797670330344294e-05, "epoch": 0.3225572710551251, "percentage": 32.26, "elapsed_time": "13:41:30", "remaining_time": "1 day, 4:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5788, "total_steps": 17941, "loss": 1.7534, "learning_rate": 7.796932296332667e-05, "epoch": 0.3226130093082883, "percentage": 32.26, "elapsed_time": "13:41:38", "remaining_time": "1 day, 4:45:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5789, "total_steps": 17941, "loss": 1.5581, "learning_rate": 7.796194173618654e-05, "epoch": 0.3226687475614514, "percentage": 32.27, "elapsed_time": "13:41:47", "remaining_time": "1 day, 4:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5790, "total_steps": 17941, "loss": 1.7255, "learning_rate": 7.795455962225669e-05, "epoch": 0.32272448581461455, "percentage": 32.27, "elapsed_time": "13:41:55", "remaining_time": "1 day, 4:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5791, "total_steps": 17941, "loss": 1.6029, "learning_rate": 7.794717662177115e-05, "epoch": 0.32278022406777773, "percentage": 32.28, "elapsed_time": "13:42:04", "remaining_time": "1 day, 4:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5792, "total_steps": 17941, "loss": 1.6035, "learning_rate": 7.793979273496414e-05, "epoch": 0.32283596232094086, "percentage": 32.28, "elapsed_time": "13:42:12", "remaining_time": "1 day, 4:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5793, "total_steps": 17941, "loss": 1.8577, "learning_rate": 7.793240796206979e-05, "epoch": 0.322891700574104, "percentage": 32.29, "elapsed_time": "13:42:21", "remaining_time": "1 day, 4:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5794, "total_steps": 17941, "loss": 1.4227, "learning_rate": 7.79250223033223e-05, "epoch": 0.3229474388272672, "percentage": 32.29, "elapsed_time": "13:42:29", "remaining_time": "1 day, 4:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5795, "total_steps": 17941, "loss": 1.5865, "learning_rate": 7.791763575895594e-05, "epoch": 0.3230031770804303, "percentage": 32.3, "elapsed_time": "13:42:38", "remaining_time": "1 day, 4:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5796, "total_steps": 17941, "loss": 1.8056, "learning_rate": 7.791024832920496e-05, "epoch": 0.32305891533359343, "percentage": 32.31, "elapsed_time": "13:42:46", "remaining_time": "1 day, 4:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5797, "total_steps": 17941, "loss": 1.8124, "learning_rate": 7.79028600143036e-05, "epoch": 0.3231146535867566, "percentage": 32.31, "elapsed_time": "13:42:55", "remaining_time": "1 day, 4:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5798, "total_steps": 17941, "loss": 1.614, "learning_rate": 7.789547081448622e-05, "epoch": 0.32317039183991975, "percentage": 32.32, "elapsed_time": "13:43:03", "remaining_time": "1 day, 4:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5799, "total_steps": 17941, "loss": 1.784, "learning_rate": 7.788808072998715e-05, "epoch": 0.3232261300930829, "percentage": 32.32, "elapsed_time": "13:43:11", "remaining_time": "1 day, 4:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5800, "total_steps": 17941, "loss": 1.462, "learning_rate": 7.788068976104074e-05, "epoch": 0.323281868346246, "percentage": 32.33, "elapsed_time": "13:43:20", "remaining_time": "1 day, 4:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5801, "total_steps": 17941, "loss": 1.5523, "learning_rate": 7.787329790788142e-05, "epoch": 0.3233376065994092, "percentage": 32.33, "elapsed_time": "13:43:28", "remaining_time": "1 day, 4:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5802, "total_steps": 17941, "loss": 1.6292, "learning_rate": 7.78659051707436e-05, "epoch": 0.3233933448525723, "percentage": 32.34, "elapsed_time": "13:43:37", "remaining_time": "1 day, 4:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5803, "total_steps": 17941, "loss": 1.4811, "learning_rate": 7.785851154986174e-05, "epoch": 0.32344908310573545, "percentage": 32.34, "elapsed_time": "13:43:45", "remaining_time": "1 day, 4:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5804, "total_steps": 17941, "loss": 1.8426, "learning_rate": 7.785111704547032e-05, "epoch": 0.32350482135889863, "percentage": 32.35, "elapsed_time": "13:43:54", "remaining_time": "1 day, 4:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5805, "total_steps": 17941, "loss": 1.4918, "learning_rate": 7.784372165780386e-05, "epoch": 0.32356055961206176, "percentage": 32.36, "elapsed_time": "13:44:03", "remaining_time": "1 day, 4:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5806, "total_steps": 17941, "loss": 1.6687, "learning_rate": 7.783632538709688e-05, "epoch": 0.3236162978652249, "percentage": 32.36, "elapsed_time": "13:44:11", "remaining_time": "1 day, 4:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5807, "total_steps": 17941, "loss": 1.7208, "learning_rate": 7.782892823358394e-05, "epoch": 0.3236720361183881, "percentage": 32.37, "elapsed_time": "13:44:19", "remaining_time": "1 day, 4:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5808, "total_steps": 17941, "loss": 1.9566, "learning_rate": 7.782153019749967e-05, "epoch": 0.3237277743715512, "percentage": 32.37, "elapsed_time": "13:44:28", "remaining_time": "1 day, 4:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5809, "total_steps": 17941, "loss": 1.7169, "learning_rate": 7.781413127907868e-05, "epoch": 0.32378351262471433, "percentage": 32.38, "elapsed_time": "13:44:36", "remaining_time": "1 day, 4:42:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5810, "total_steps": 17941, "loss": 1.7084, "learning_rate": 7.780673147855559e-05, "epoch": 0.32383925087787746, "percentage": 32.38, "elapsed_time": "13:44:45", "remaining_time": "1 day, 4:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5811, "total_steps": 17941, "loss": 1.6815, "learning_rate": 7.779933079616512e-05, "epoch": 0.32389498913104064, "percentage": 32.39, "elapsed_time": "13:44:54", "remaining_time": "1 day, 4:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5812, "total_steps": 17941, "loss": 1.6899, "learning_rate": 7.779192923214196e-05, "epoch": 0.3239507273842038, "percentage": 32.4, "elapsed_time": "13:45:02", "remaining_time": "1 day, 4:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5813, "total_steps": 17941, "loss": 2.0061, "learning_rate": 7.778452678672084e-05, "epoch": 0.3240064656373669, "percentage": 32.4, "elapsed_time": "13:45:11", "remaining_time": "1 day, 4:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5814, "total_steps": 17941, "loss": 1.6939, "learning_rate": 7.777712346013651e-05, "epoch": 0.3240622038905301, "percentage": 32.41, "elapsed_time": "13:45:19", "remaining_time": "1 day, 4:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5815, "total_steps": 17941, "loss": 1.4296, "learning_rate": 7.776971925262379e-05, "epoch": 0.3241179421436932, "percentage": 32.41, "elapsed_time": "13:45:28", "remaining_time": "1 day, 4:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5816, "total_steps": 17941, "loss": 1.8693, "learning_rate": 7.776231416441748e-05, "epoch": 0.32417368039685635, "percentage": 32.42, "elapsed_time": "13:45:36", "remaining_time": "1 day, 4:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5817, "total_steps": 17941, "loss": 1.5215, "learning_rate": 7.775490819575242e-05, "epoch": 0.32422941865001953, "percentage": 32.42, "elapsed_time": "13:45:44", "remaining_time": "1 day, 4:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5818, "total_steps": 17941, "loss": 1.6002, "learning_rate": 7.774750134686352e-05, "epoch": 0.32428515690318266, "percentage": 32.43, "elapsed_time": "13:45:53", "remaining_time": "1 day, 4:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5819, "total_steps": 17941, "loss": 1.42, "learning_rate": 7.774009361798565e-05, "epoch": 0.3243408951563458, "percentage": 32.43, "elapsed_time": "13:46:01", "remaining_time": "1 day, 4:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5820, "total_steps": 17941, "loss": 1.6076, "learning_rate": 7.773268500935372e-05, "epoch": 0.32439663340950897, "percentage": 32.44, "elapsed_time": "13:46:10", "remaining_time": "1 day, 4:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5821, "total_steps": 17941, "loss": 1.6444, "learning_rate": 7.772527552120273e-05, "epoch": 0.3244523716626721, "percentage": 32.45, "elapsed_time": "13:46:18", "remaining_time": "1 day, 4:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5822, "total_steps": 17941, "loss": 1.3809, "learning_rate": 7.771786515376765e-05, "epoch": 0.32450810991583523, "percentage": 32.45, "elapsed_time": "13:46:27", "remaining_time": "1 day, 4:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5823, "total_steps": 17941, "loss": 1.8976, "learning_rate": 7.77104539072835e-05, "epoch": 0.32456384816899836, "percentage": 32.46, "elapsed_time": "13:46:35", "remaining_time": "1 day, 4:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5824, "total_steps": 17941, "loss": 1.7352, "learning_rate": 7.770304178198531e-05, "epoch": 0.32461958642216154, "percentage": 32.46, "elapsed_time": "13:46:44", "remaining_time": "1 day, 4:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5825, "total_steps": 17941, "loss": 1.5827, "learning_rate": 7.769562877810816e-05, "epoch": 0.3246753246753247, "percentage": 32.47, "elapsed_time": "13:46:52", "remaining_time": "1 day, 4:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5826, "total_steps": 17941, "loss": 1.44, "learning_rate": 7.768821489588713e-05, "epoch": 0.3247310629284878, "percentage": 32.47, "elapsed_time": "13:47:01", "remaining_time": "1 day, 4:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5827, "total_steps": 17941, "loss": 1.6719, "learning_rate": 7.768080013555737e-05, "epoch": 0.324786801181651, "percentage": 32.48, "elapsed_time": "13:47:09", "remaining_time": "1 day, 4:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5828, "total_steps": 17941, "loss": 1.355, "learning_rate": 7.767338449735401e-05, "epoch": 0.3248425394348141, "percentage": 32.48, "elapsed_time": "13:47:18", "remaining_time": "1 day, 4:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5829, "total_steps": 17941, "loss": 1.6764, "learning_rate": 7.766596798151224e-05, "epoch": 0.32489827768797724, "percentage": 32.49, "elapsed_time": "13:47:26", "remaining_time": "1 day, 4:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5830, "total_steps": 17941, "loss": 1.8243, "learning_rate": 7.765855058826727e-05, "epoch": 0.32495401594114043, "percentage": 32.5, "elapsed_time": "13:47:35", "remaining_time": "1 day, 4:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5831, "total_steps": 17941, "loss": 1.7313, "learning_rate": 7.765113231785435e-05, "epoch": 0.32500975419430356, "percentage": 32.5, "elapsed_time": "13:47:43", "remaining_time": "1 day, 4:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5832, "total_steps": 17941, "loss": 1.7546, "learning_rate": 7.764371317050873e-05, "epoch": 0.3250654924474667, "percentage": 32.51, "elapsed_time": "13:47:51", "remaining_time": "1 day, 4:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5833, "total_steps": 17941, "loss": 1.7879, "learning_rate": 7.763629314646568e-05, "epoch": 0.3251212307006298, "percentage": 32.51, "elapsed_time": "13:48:00", "remaining_time": "1 day, 4:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5834, "total_steps": 17941, "loss": 1.8066, "learning_rate": 7.762887224596055e-05, "epoch": 0.325176968953793, "percentage": 32.52, "elapsed_time": "13:48:08", "remaining_time": "1 day, 4:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5835, "total_steps": 17941, "loss": 1.6913, "learning_rate": 7.76214504692287e-05, "epoch": 0.32523270720695613, "percentage": 32.52, "elapsed_time": "13:48:17", "remaining_time": "1 day, 4:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5836, "total_steps": 17941, "loss": 1.7581, "learning_rate": 7.761402781650547e-05, "epoch": 0.32528844546011926, "percentage": 32.53, "elapsed_time": "13:48:25", "remaining_time": "1 day, 4:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5837, "total_steps": 17941, "loss": 1.5955, "learning_rate": 7.760660428802628e-05, "epoch": 0.32534418371328244, "percentage": 32.53, "elapsed_time": "13:48:34", "remaining_time": "1 day, 4:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5838, "total_steps": 17941, "loss": 1.6833, "learning_rate": 7.759917988402657e-05, "epoch": 0.32539992196644557, "percentage": 32.54, "elapsed_time": "13:48:42", "remaining_time": "1 day, 4:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5839, "total_steps": 17941, "loss": 1.8303, "learning_rate": 7.759175460474177e-05, "epoch": 0.3254556602196087, "percentage": 32.55, "elapsed_time": "13:48:51", "remaining_time": "1 day, 4:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5840, "total_steps": 17941, "loss": 1.7216, "learning_rate": 7.758432845040737e-05, "epoch": 0.3255113984727719, "percentage": 32.55, "elapsed_time": "13:48:59", "remaining_time": "1 day, 4:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5841, "total_steps": 17941, "loss": 1.6099, "learning_rate": 7.757690142125893e-05, "epoch": 0.325567136725935, "percentage": 32.56, "elapsed_time": "13:49:08", "remaining_time": "1 day, 4:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5842, "total_steps": 17941, "loss": 1.5388, "learning_rate": 7.756947351753196e-05, "epoch": 0.32562287497909814, "percentage": 32.56, "elapsed_time": "13:49:16", "remaining_time": "1 day, 4:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5843, "total_steps": 17941, "loss": 1.6813, "learning_rate": 7.756204473946203e-05, "epoch": 0.3256786132322613, "percentage": 32.57, "elapsed_time": "13:49:25", "remaining_time": "1 day, 4:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5844, "total_steps": 17941, "loss": 1.5549, "learning_rate": 7.755461508728472e-05, "epoch": 0.32573435148542446, "percentage": 32.57, "elapsed_time": "13:49:34", "remaining_time": "1 day, 4:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5845, "total_steps": 17941, "loss": 1.5658, "learning_rate": 7.75471845612357e-05, "epoch": 0.3257900897385876, "percentage": 32.58, "elapsed_time": "13:49:42", "remaining_time": "1 day, 4:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5846, "total_steps": 17941, "loss": 1.8505, "learning_rate": 7.753975316155057e-05, "epoch": 0.3258458279917507, "percentage": 32.58, "elapsed_time": "13:49:51", "remaining_time": "1 day, 4:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5847, "total_steps": 17941, "loss": 1.953, "learning_rate": 7.753232088846505e-05, "epoch": 0.3259015662449139, "percentage": 32.59, "elapsed_time": "13:49:59", "remaining_time": "1 day, 4:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5848, "total_steps": 17941, "loss": 1.9068, "learning_rate": 7.752488774221485e-05, "epoch": 0.325957304498077, "percentage": 32.6, "elapsed_time": "13:50:08", "remaining_time": "1 day, 4:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5849, "total_steps": 17941, "loss": 1.6766, "learning_rate": 7.751745372303567e-05, "epoch": 0.32601304275124016, "percentage": 32.6, "elapsed_time": "13:50:16", "remaining_time": "1 day, 4:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5850, "total_steps": 17941, "loss": 1.874, "learning_rate": 7.751001883116331e-05, "epoch": 0.32606878100440334, "percentage": 32.61, "elapsed_time": "13:50:25", "remaining_time": "1 day, 4:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5851, "total_steps": 17941, "loss": 1.7491, "learning_rate": 7.750258306683353e-05, "epoch": 0.32612451925756647, "percentage": 32.61, "elapsed_time": "13:50:33", "remaining_time": "1 day, 4:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5852, "total_steps": 17941, "loss": 1.3701, "learning_rate": 7.749514643028218e-05, "epoch": 0.3261802575107296, "percentage": 32.62, "elapsed_time": "13:50:42", "remaining_time": "1 day, 4:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5853, "total_steps": 17941, "loss": 1.4772, "learning_rate": 7.748770892174509e-05, "epoch": 0.3262359957638928, "percentage": 32.62, "elapsed_time": "13:50:50", "remaining_time": "1 day, 4:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5854, "total_steps": 17941, "loss": 1.7885, "learning_rate": 7.748027054145814e-05, "epoch": 0.3262917340170559, "percentage": 32.63, "elapsed_time": "13:50:59", "remaining_time": "1 day, 4:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5855, "total_steps": 17941, "loss": 1.8875, "learning_rate": 7.747283128965723e-05, "epoch": 0.32634747227021904, "percentage": 32.63, "elapsed_time": "13:51:07", "remaining_time": "1 day, 4:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5856, "total_steps": 17941, "loss": 2.0948, "learning_rate": 7.74653911665783e-05, "epoch": 0.32640321052338217, "percentage": 32.64, "elapsed_time": "13:51:16", "remaining_time": "1 day, 4:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5857, "total_steps": 17941, "loss": 1.572, "learning_rate": 7.745795017245729e-05, "epoch": 0.32645894877654535, "percentage": 32.65, "elapsed_time": "13:51:25", "remaining_time": "1 day, 4:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5858, "total_steps": 17941, "loss": 1.7464, "learning_rate": 7.745050830753018e-05, "epoch": 0.3265146870297085, "percentage": 32.65, "elapsed_time": "13:51:33", "remaining_time": "1 day, 4:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5859, "total_steps": 17941, "loss": 1.9168, "learning_rate": 7.744306557203299e-05, "epoch": 0.3265704252828716, "percentage": 32.66, "elapsed_time": "13:51:41", "remaining_time": "1 day, 4:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5860, "total_steps": 17941, "loss": 1.6884, "learning_rate": 7.743562196620177e-05, "epoch": 0.3266261635360348, "percentage": 32.66, "elapsed_time": "13:51:50", "remaining_time": "1 day, 4:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5861, "total_steps": 17941, "loss": 1.815, "learning_rate": 7.74281774902726e-05, "epoch": 0.3266819017891979, "percentage": 32.67, "elapsed_time": "13:51:58", "remaining_time": "1 day, 4:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5862, "total_steps": 17941, "loss": 1.832, "learning_rate": 7.742073214448153e-05, "epoch": 0.32673764004236105, "percentage": 32.67, "elapsed_time": "13:52:07", "remaining_time": "1 day, 4:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5863, "total_steps": 17941, "loss": 1.7179, "learning_rate": 7.741328592906474e-05, "epoch": 0.32679337829552424, "percentage": 32.68, "elapsed_time": "13:52:15", "remaining_time": "1 day, 4:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5864, "total_steps": 17941, "loss": 1.8319, "learning_rate": 7.740583884425833e-05, "epoch": 0.32684911654868737, "percentage": 32.68, "elapsed_time": "13:52:24", "remaining_time": "1 day, 4:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5865, "total_steps": 17941, "loss": 1.6868, "learning_rate": 7.73983908902985e-05, "epoch": 0.3269048548018505, "percentage": 32.69, "elapsed_time": "13:52:32", "remaining_time": "1 day, 4:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5866, "total_steps": 17941, "loss": 1.6426, "learning_rate": 7.739094206742146e-05, "epoch": 0.3269605930550137, "percentage": 32.7, "elapsed_time": "13:52:41", "remaining_time": "1 day, 4:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5867, "total_steps": 17941, "loss": 1.6661, "learning_rate": 7.738349237586343e-05, "epoch": 0.3270163313081768, "percentage": 32.7, "elapsed_time": "13:52:49", "remaining_time": "1 day, 4:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5868, "total_steps": 17941, "loss": 1.7263, "learning_rate": 7.737604181586068e-05, "epoch": 0.32707206956133994, "percentage": 32.71, "elapsed_time": "13:52:57", "remaining_time": "1 day, 4:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5869, "total_steps": 17941, "loss": 1.7197, "learning_rate": 7.736859038764952e-05, "epoch": 0.32712780781450307, "percentage": 32.71, "elapsed_time": "13:53:06", "remaining_time": "1 day, 4:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5870, "total_steps": 17941, "loss": 1.7229, "learning_rate": 7.73611380914662e-05, "epoch": 0.32718354606766625, "percentage": 32.72, "elapsed_time": "13:53:14", "remaining_time": "1 day, 4:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5871, "total_steps": 17941, "loss": 1.5273, "learning_rate": 7.735368492754715e-05, "epoch": 0.3272392843208294, "percentage": 32.72, "elapsed_time": "13:53:23", "remaining_time": "1 day, 4:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5872, "total_steps": 17941, "loss": 1.7926, "learning_rate": 7.734623089612867e-05, "epoch": 0.3272950225739925, "percentage": 32.73, "elapsed_time": "13:53:31", "remaining_time": "1 day, 4:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5873, "total_steps": 17941, "loss": 1.492, "learning_rate": 7.73387759974472e-05, "epoch": 0.3273507608271557, "percentage": 32.74, "elapsed_time": "13:53:40", "remaining_time": "1 day, 4:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5874, "total_steps": 17941, "loss": 1.6155, "learning_rate": 7.733132023173915e-05, "epoch": 0.3274064990803188, "percentage": 32.74, "elapsed_time": "13:53:48", "remaining_time": "1 day, 4:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5875, "total_steps": 17941, "loss": 1.7757, "learning_rate": 7.732386359924097e-05, "epoch": 0.32746223733348195, "percentage": 32.75, "elapsed_time": "13:53:57", "remaining_time": "1 day, 4:32:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5876, "total_steps": 17941, "loss": 1.6669, "learning_rate": 7.731640610018914e-05, "epoch": 0.32751797558664514, "percentage": 32.75, "elapsed_time": "13:54:05", "remaining_time": "1 day, 4:32:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5877, "total_steps": 17941, "loss": 1.944, "learning_rate": 7.730894773482019e-05, "epoch": 0.32757371383980827, "percentage": 32.76, "elapsed_time": "13:54:13", "remaining_time": "1 day, 4:32:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5878, "total_steps": 17941, "loss": 1.7491, "learning_rate": 7.730148850337062e-05, "epoch": 0.3276294520929714, "percentage": 32.76, "elapsed_time": "13:54:22", "remaining_time": "1 day, 4:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5879, "total_steps": 17941, "loss": 1.7473, "learning_rate": 7.729402840607702e-05, "epoch": 0.3276851903461345, "percentage": 32.77, "elapsed_time": "13:54:30", "remaining_time": "1 day, 4:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5880, "total_steps": 17941, "loss": 1.7703, "learning_rate": 7.728656744317598e-05, "epoch": 0.3277409285992977, "percentage": 32.77, "elapsed_time": "13:54:39", "remaining_time": "1 day, 4:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5881, "total_steps": 17941, "loss": 1.6632, "learning_rate": 7.727910561490411e-05, "epoch": 0.32779666685246084, "percentage": 32.78, "elapsed_time": "13:54:47", "remaining_time": "1 day, 4:31:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5882, "total_steps": 17941, "loss": 1.7289, "learning_rate": 7.727164292149806e-05, "epoch": 0.32785240510562397, "percentage": 32.79, "elapsed_time": "13:54:56", "remaining_time": "1 day, 4:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5883, "total_steps": 17941, "loss": 1.9396, "learning_rate": 7.72641793631945e-05, "epoch": 0.32790814335878715, "percentage": 32.79, "elapsed_time": "13:55:04", "remaining_time": "1 day, 4:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5884, "total_steps": 17941, "loss": 1.6176, "learning_rate": 7.725671494023014e-05, "epoch": 0.3279638816119503, "percentage": 32.8, "elapsed_time": "13:55:13", "remaining_time": "1 day, 4:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5885, "total_steps": 17941, "loss": 1.7997, "learning_rate": 7.724924965284169e-05, "epoch": 0.3280196198651134, "percentage": 32.8, "elapsed_time": "13:55:21", "remaining_time": "1 day, 4:31:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5886, "total_steps": 17941, "loss": 1.762, "learning_rate": 7.72417835012659e-05, "epoch": 0.3280753581182766, "percentage": 32.81, "elapsed_time": "13:55:30", "remaining_time": "1 day, 4:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5887, "total_steps": 17941, "loss": 1.29, "learning_rate": 7.72343164857396e-05, "epoch": 0.3281310963714397, "percentage": 32.81, "elapsed_time": "13:55:38", "remaining_time": "1 day, 4:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5888, "total_steps": 17941, "loss": 1.8285, "learning_rate": 7.722684860649953e-05, "epoch": 0.32818683462460285, "percentage": 32.82, "elapsed_time": "13:55:47", "remaining_time": "1 day, 4:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5889, "total_steps": 17941, "loss": 1.6134, "learning_rate": 7.721937986378261e-05, "epoch": 0.32824257287776604, "percentage": 32.82, "elapsed_time": "13:55:55", "remaining_time": "1 day, 4:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5890, "total_steps": 17941, "loss": 1.5536, "learning_rate": 7.721191025782563e-05, "epoch": 0.32829831113092917, "percentage": 32.83, "elapsed_time": "13:56:03", "remaining_time": "1 day, 4:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5891, "total_steps": 17941, "loss": 1.6102, "learning_rate": 7.720443978886551e-05, "epoch": 0.3283540493840923, "percentage": 32.84, "elapsed_time": "13:56:12", "remaining_time": "1 day, 4:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5892, "total_steps": 17941, "loss": 1.7258, "learning_rate": 7.71969684571392e-05, "epoch": 0.3284097876372554, "percentage": 32.84, "elapsed_time": "13:56:20", "remaining_time": "1 day, 4:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5893, "total_steps": 17941, "loss": 1.7538, "learning_rate": 7.718949626288359e-05, "epoch": 0.3284655258904186, "percentage": 32.85, "elapsed_time": "13:56:29", "remaining_time": "1 day, 4:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5894, "total_steps": 17941, "loss": 1.5929, "learning_rate": 7.718202320633572e-05, "epoch": 0.32852126414358174, "percentage": 32.85, "elapsed_time": "13:56:37", "remaining_time": "1 day, 4:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5895, "total_steps": 17941, "loss": 1.5781, "learning_rate": 7.717454928773253e-05, "epoch": 0.32857700239674487, "percentage": 32.86, "elapsed_time": "13:56:45", "remaining_time": "1 day, 4:29:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5896, "total_steps": 17941, "loss": 1.97, "learning_rate": 7.716707450731109e-05, "epoch": 0.32863274064990805, "percentage": 32.86, "elapsed_time": "13:56:54", "remaining_time": "1 day, 4:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5897, "total_steps": 17941, "loss": 1.6759, "learning_rate": 7.715959886530843e-05, "epoch": 0.3286884789030712, "percentage": 32.87, "elapsed_time": "13:57:02", "remaining_time": "1 day, 4:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5898, "total_steps": 17941, "loss": 1.6515, "learning_rate": 7.715212236196164e-05, "epoch": 0.3287442171562343, "percentage": 32.87, "elapsed_time": "13:57:11", "remaining_time": "1 day, 4:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5899, "total_steps": 17941, "loss": 1.7267, "learning_rate": 7.714464499750784e-05, "epoch": 0.3287999554093975, "percentage": 32.88, "elapsed_time": "13:57:19", "remaining_time": "1 day, 4:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5900, "total_steps": 17941, "loss": 1.6431, "learning_rate": 7.713716677218416e-05, "epoch": 0.3288556936625606, "percentage": 32.89, "elapsed_time": "13:57:28", "remaining_time": "1 day, 4:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5901, "total_steps": 17941, "loss": 1.5909, "learning_rate": 7.712968768622779e-05, "epoch": 0.32891143191572375, "percentage": 32.89, "elapsed_time": "13:57:36", "remaining_time": "1 day, 4:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5902, "total_steps": 17941, "loss": 1.6273, "learning_rate": 7.712220773987589e-05, "epoch": 0.3289671701688869, "percentage": 32.9, "elapsed_time": "13:57:45", "remaining_time": "1 day, 4:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5903, "total_steps": 17941, "loss": 1.8497, "learning_rate": 7.71147269333657e-05, "epoch": 0.32902290842205006, "percentage": 32.9, "elapsed_time": "13:57:53", "remaining_time": "1 day, 4:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5904, "total_steps": 17941, "loss": 1.6606, "learning_rate": 7.710724526693445e-05, "epoch": 0.3290786466752132, "percentage": 32.91, "elapsed_time": "13:58:02", "remaining_time": "1 day, 4:28:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5905, "total_steps": 17941, "loss": 1.8094, "learning_rate": 7.709976274081944e-05, "epoch": 0.3291343849283763, "percentage": 32.91, "elapsed_time": "13:58:10", "remaining_time": "1 day, 4:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5906, "total_steps": 17941, "loss": 1.7477, "learning_rate": 7.709227935525796e-05, "epoch": 0.3291901231815395, "percentage": 32.92, "elapsed_time": "13:58:18", "remaining_time": "1 day, 4:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5907, "total_steps": 17941, "loss": 1.4591, "learning_rate": 7.708479511048732e-05, "epoch": 0.32924586143470264, "percentage": 32.92, "elapsed_time": "13:58:27", "remaining_time": "1 day, 4:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5908, "total_steps": 17941, "loss": 1.6762, "learning_rate": 7.707731000674492e-05, "epoch": 0.32930159968786576, "percentage": 32.93, "elapsed_time": "13:58:35", "remaining_time": "1 day, 4:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5909, "total_steps": 17941, "loss": 1.529, "learning_rate": 7.70698240442681e-05, "epoch": 0.32935733794102895, "percentage": 32.94, "elapsed_time": "13:58:44", "remaining_time": "1 day, 4:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5910, "total_steps": 17941, "loss": 1.6953, "learning_rate": 7.70623372232943e-05, "epoch": 0.3294130761941921, "percentage": 32.94, "elapsed_time": "13:58:52", "remaining_time": "1 day, 4:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5911, "total_steps": 17941, "loss": 1.6728, "learning_rate": 7.705484954406092e-05, "epoch": 0.3294688144473552, "percentage": 32.95, "elapsed_time": "13:59:01", "remaining_time": "1 day, 4:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5912, "total_steps": 17941, "loss": 1.6731, "learning_rate": 7.704736100680547e-05, "epoch": 0.3295245527005184, "percentage": 32.95, "elapsed_time": "13:59:09", "remaining_time": "1 day, 4:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5913, "total_steps": 17941, "loss": 1.9063, "learning_rate": 7.703987161176545e-05, "epoch": 0.3295802909536815, "percentage": 32.96, "elapsed_time": "13:59:17", "remaining_time": "1 day, 4:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5914, "total_steps": 17941, "loss": 1.6984, "learning_rate": 7.703238135917832e-05, "epoch": 0.32963602920684465, "percentage": 32.96, "elapsed_time": "13:59:26", "remaining_time": "1 day, 4:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5915, "total_steps": 17941, "loss": 1.7057, "learning_rate": 7.702489024928168e-05, "epoch": 0.3296917674600078, "percentage": 32.97, "elapsed_time": "13:59:34", "remaining_time": "1 day, 4:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5916, "total_steps": 17941, "loss": 1.8851, "learning_rate": 7.701739828231309e-05, "epoch": 0.32974750571317096, "percentage": 32.97, "elapsed_time": "13:59:43", "remaining_time": "1 day, 4:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5917, "total_steps": 17941, "loss": 1.6514, "learning_rate": 7.700990545851014e-05, "epoch": 0.3298032439663341, "percentage": 32.98, "elapsed_time": "13:59:51", "remaining_time": "1 day, 4:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5918, "total_steps": 17941, "loss": 1.7474, "learning_rate": 7.700241177811048e-05, "epoch": 0.3298589822194972, "percentage": 32.99, "elapsed_time": "14:00:00", "remaining_time": "1 day, 4:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5919, "total_steps": 17941, "loss": 1.65, "learning_rate": 7.699491724135175e-05, "epoch": 0.3299147204726604, "percentage": 32.99, "elapsed_time": "14:00:09", "remaining_time": "1 day, 4:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5920, "total_steps": 17941, "loss": 1.7039, "learning_rate": 7.698742184847163e-05, "epoch": 0.32997045872582353, "percentage": 33.0, "elapsed_time": "14:00:17", "remaining_time": "1 day, 4:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5921, "total_steps": 17941, "loss": 1.7428, "learning_rate": 7.697992559970784e-05, "epoch": 0.33002619697898666, "percentage": 33.0, "elapsed_time": "14:00:26", "remaining_time": "1 day, 4:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5922, "total_steps": 17941, "loss": 1.7935, "learning_rate": 7.697242849529812e-05, "epoch": 0.33008193523214985, "percentage": 33.01, "elapsed_time": "14:00:34", "remaining_time": "1 day, 4:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5923, "total_steps": 17941, "loss": 1.7302, "learning_rate": 7.69649305354802e-05, "epoch": 0.330137673485313, "percentage": 33.01, "elapsed_time": "14:00:43", "remaining_time": "1 day, 4:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5924, "total_steps": 17941, "loss": 1.6529, "learning_rate": 7.695743172049192e-05, "epoch": 0.3301934117384761, "percentage": 33.02, "elapsed_time": "14:00:52", "remaining_time": "1 day, 4:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5925, "total_steps": 17941, "loss": 1.696, "learning_rate": 7.694993205057108e-05, "epoch": 0.33024914999163923, "percentage": 33.02, "elapsed_time": "14:01:00", "remaining_time": "1 day, 4:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5926, "total_steps": 17941, "loss": 1.6173, "learning_rate": 7.694243152595552e-05, "epoch": 0.3303048882448024, "percentage": 33.03, "elapsed_time": "14:01:09", "remaining_time": "1 day, 4:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5927, "total_steps": 17941, "loss": 1.4818, "learning_rate": 7.693493014688313e-05, "epoch": 0.33036062649796555, "percentage": 33.04, "elapsed_time": "14:01:17", "remaining_time": "1 day, 4:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5928, "total_steps": 17941, "loss": 1.631, "learning_rate": 7.69274279135918e-05, "epoch": 0.3304163647511287, "percentage": 33.04, "elapsed_time": "14:01:26", "remaining_time": "1 day, 4:25:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5929, "total_steps": 17941, "loss": 1.8426, "learning_rate": 7.691992482631944e-05, "epoch": 0.33047210300429186, "percentage": 33.05, "elapsed_time": "14:01:35", "remaining_time": "1 day, 4:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5930, "total_steps": 17941, "loss": 1.8106, "learning_rate": 7.691242088530401e-05, "epoch": 0.330527841257455, "percentage": 33.05, "elapsed_time": "14:01:43", "remaining_time": "1 day, 4:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5931, "total_steps": 17941, "loss": 1.7523, "learning_rate": 7.690491609078351e-05, "epoch": 0.3305835795106181, "percentage": 33.06, "elapsed_time": "14:01:52", "remaining_time": "1 day, 4:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5932, "total_steps": 17941, "loss": 1.7299, "learning_rate": 7.689741044299595e-05, "epoch": 0.3306393177637813, "percentage": 33.06, "elapsed_time": "14:02:00", "remaining_time": "1 day, 4:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5933, "total_steps": 17941, "loss": 1.691, "learning_rate": 7.688990394217933e-05, "epoch": 0.33069505601694443, "percentage": 33.07, "elapsed_time": "14:02:09", "remaining_time": "1 day, 4:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5934, "total_steps": 17941, "loss": 1.45, "learning_rate": 7.688239658857174e-05, "epoch": 0.33075079427010756, "percentage": 33.08, "elapsed_time": "14:02:17", "remaining_time": "1 day, 4:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5935, "total_steps": 17941, "loss": 1.8009, "learning_rate": 7.687488838241128e-05, "epoch": 0.33080653252327075, "percentage": 33.08, "elapsed_time": "14:02:25", "remaining_time": "1 day, 4:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5936, "total_steps": 17941, "loss": 1.7873, "learning_rate": 7.686737932393605e-05, "epoch": 0.3308622707764339, "percentage": 33.09, "elapsed_time": "14:02:34", "remaining_time": "1 day, 4:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5937, "total_steps": 17941, "loss": 1.6196, "learning_rate": 7.685986941338419e-05, "epoch": 0.330918009029597, "percentage": 33.09, "elapsed_time": "14:02:42", "remaining_time": "1 day, 4:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5938, "total_steps": 17941, "loss": 1.7915, "learning_rate": 7.685235865099387e-05, "epoch": 0.33097374728276013, "percentage": 33.1, "elapsed_time": "14:02:51", "remaining_time": "1 day, 4:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5939, "total_steps": 17941, "loss": 1.6648, "learning_rate": 7.684484703700332e-05, "epoch": 0.3310294855359233, "percentage": 33.1, "elapsed_time": "14:03:00", "remaining_time": "1 day, 4:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5940, "total_steps": 17941, "loss": 2.0054, "learning_rate": 7.683733457165071e-05, "epoch": 0.33108522378908645, "percentage": 33.11, "elapsed_time": "14:03:08", "remaining_time": "1 day, 4:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5941, "total_steps": 17941, "loss": 1.7598, "learning_rate": 7.682982125517433e-05, "epoch": 0.3311409620422496, "percentage": 33.11, "elapsed_time": "14:03:17", "remaining_time": "1 day, 4:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5942, "total_steps": 17941, "loss": 1.4258, "learning_rate": 7.682230708781244e-05, "epoch": 0.33119670029541276, "percentage": 33.12, "elapsed_time": "14:03:25", "remaining_time": "1 day, 4:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5943, "total_steps": 17941, "loss": 1.766, "learning_rate": 7.681479206980338e-05, "epoch": 0.3312524385485759, "percentage": 33.13, "elapsed_time": "14:03:33", "remaining_time": "1 day, 4:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5944, "total_steps": 17941, "loss": 1.879, "learning_rate": 7.680727620138542e-05, "epoch": 0.331308176801739, "percentage": 33.13, "elapsed_time": "14:03:42", "remaining_time": "1 day, 4:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5945, "total_steps": 17941, "loss": 1.4933, "learning_rate": 7.679975948279699e-05, "epoch": 0.3313639150549022, "percentage": 33.14, "elapsed_time": "14:03:50", "remaining_time": "1 day, 4:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5946, "total_steps": 17941, "loss": 1.6821, "learning_rate": 7.679224191427642e-05, "epoch": 0.33141965330806533, "percentage": 33.14, "elapsed_time": "14:03:59", "remaining_time": "1 day, 4:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5947, "total_steps": 17941, "loss": 1.8599, "learning_rate": 7.678472349606215e-05, "epoch": 0.33147539156122846, "percentage": 33.15, "elapsed_time": "14:04:07", "remaining_time": "1 day, 4:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5948, "total_steps": 17941, "loss": 1.6659, "learning_rate": 7.677720422839263e-05, "epoch": 0.3315311298143916, "percentage": 33.15, "elapsed_time": "14:04:16", "remaining_time": "1 day, 4:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5949, "total_steps": 17941, "loss": 1.9657, "learning_rate": 7.676968411150629e-05, "epoch": 0.3315868680675548, "percentage": 33.16, "elapsed_time": "14:04:25", "remaining_time": "1 day, 4:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5950, "total_steps": 17941, "loss": 1.9396, "learning_rate": 7.676216314564166e-05, "epoch": 0.3316426063207179, "percentage": 33.16, "elapsed_time": "14:04:33", "remaining_time": "1 day, 4:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5951, "total_steps": 17941, "loss": 1.6447, "learning_rate": 7.675464133103726e-05, "epoch": 0.33169834457388103, "percentage": 33.17, "elapsed_time": "14:04:42", "remaining_time": "1 day, 4:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5952, "total_steps": 17941, "loss": 1.7975, "learning_rate": 7.674711866793163e-05, "epoch": 0.3317540828270442, "percentage": 33.18, "elapsed_time": "14:04:50", "remaining_time": "1 day, 4:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5953, "total_steps": 17941, "loss": 1.6343, "learning_rate": 7.673959515656333e-05, "epoch": 0.33180982108020735, "percentage": 33.18, "elapsed_time": "14:04:59", "remaining_time": "1 day, 4:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5954, "total_steps": 17941, "loss": 1.7215, "learning_rate": 7.673207079717098e-05, "epoch": 0.3318655593333705, "percentage": 33.19, "elapsed_time": "14:05:08", "remaining_time": "1 day, 4:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5955, "total_steps": 17941, "loss": 1.5058, "learning_rate": 7.672454558999318e-05, "epoch": 0.33192129758653366, "percentage": 33.19, "elapsed_time": "14:05:16", "remaining_time": "1 day, 4:21:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5956, "total_steps": 17941, "loss": 1.8826, "learning_rate": 7.671701953526863e-05, "epoch": 0.3319770358396968, "percentage": 33.2, "elapsed_time": "14:05:25", "remaining_time": "1 day, 4:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5957, "total_steps": 17941, "loss": 1.3823, "learning_rate": 7.670949263323599e-05, "epoch": 0.3320327740928599, "percentage": 33.2, "elapsed_time": "14:05:33", "remaining_time": "1 day, 4:21:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5958, "total_steps": 17941, "loss": 1.3208, "learning_rate": 7.670196488413397e-05, "epoch": 0.3320885123460231, "percentage": 33.21, "elapsed_time": "14:05:42", "remaining_time": "1 day, 4:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5959, "total_steps": 17941, "loss": 1.4293, "learning_rate": 7.66944362882013e-05, "epoch": 0.33214425059918623, "percentage": 33.21, "elapsed_time": "14:05:50", "remaining_time": "1 day, 4:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5960, "total_steps": 17941, "loss": 1.5585, "learning_rate": 7.668690684567676e-05, "epoch": 0.33219998885234936, "percentage": 33.22, "elapsed_time": "14:05:58", "remaining_time": "1 day, 4:20:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5961, "total_steps": 17941, "loss": 1.5834, "learning_rate": 7.667937655679913e-05, "epoch": 0.3322557271055125, "percentage": 33.23, "elapsed_time": "14:06:07", "remaining_time": "1 day, 4:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5962, "total_steps": 17941, "loss": 2.0935, "learning_rate": 7.667184542180723e-05, "epoch": 0.3323114653586757, "percentage": 33.23, "elapsed_time": "14:06:15", "remaining_time": "1 day, 4:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5963, "total_steps": 17941, "loss": 1.6838, "learning_rate": 7.666431344093988e-05, "epoch": 0.3323672036118388, "percentage": 33.24, "elapsed_time": "14:06:24", "remaining_time": "1 day, 4:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5964, "total_steps": 17941, "loss": 1.6688, "learning_rate": 7.665678061443599e-05, "epoch": 0.33242294186500193, "percentage": 33.24, "elapsed_time": "14:06:32", "remaining_time": "1 day, 4:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5965, "total_steps": 17941, "loss": 1.6131, "learning_rate": 7.664924694253443e-05, "epoch": 0.3324786801181651, "percentage": 33.25, "elapsed_time": "14:06:41", "remaining_time": "1 day, 4:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5966, "total_steps": 17941, "loss": 1.859, "learning_rate": 7.664171242547414e-05, "epoch": 0.33253441837132824, "percentage": 33.25, "elapsed_time": "14:06:50", "remaining_time": "1 day, 4:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5967, "total_steps": 17941, "loss": 1.6848, "learning_rate": 7.663417706349407e-05, "epoch": 0.3325901566244914, "percentage": 33.26, "elapsed_time": "14:06:58", "remaining_time": "1 day, 4:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5968, "total_steps": 17941, "loss": 1.7, "learning_rate": 7.662664085683317e-05, "epoch": 0.33264589487765456, "percentage": 33.26, "elapsed_time": "14:07:07", "remaining_time": "1 day, 4:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5969, "total_steps": 17941, "loss": 1.87, "learning_rate": 7.66191038057305e-05, "epoch": 0.3327016331308177, "percentage": 33.27, "elapsed_time": "14:07:15", "remaining_time": "1 day, 4:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5970, "total_steps": 17941, "loss": 1.6083, "learning_rate": 7.661156591042502e-05, "epoch": 0.3327573713839808, "percentage": 33.28, "elapsed_time": "14:07:24", "remaining_time": "1 day, 4:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5971, "total_steps": 17941, "loss": 1.6786, "learning_rate": 7.660402717115584e-05, "epoch": 0.33281310963714394, "percentage": 33.28, "elapsed_time": "14:07:32", "remaining_time": "1 day, 4:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5972, "total_steps": 17941, "loss": 1.595, "learning_rate": 7.659648758816205e-05, "epoch": 0.33286884789030713, "percentage": 33.29, "elapsed_time": "14:07:41", "remaining_time": "1 day, 4:18:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5973, "total_steps": 17941, "loss": 2.0188, "learning_rate": 7.658894716168271e-05, "epoch": 0.33292458614347026, "percentage": 33.29, "elapsed_time": "14:07:50", "remaining_time": "1 day, 4:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5974, "total_steps": 17941, "loss": 1.6095, "learning_rate": 7.658140589195701e-05, "epoch": 0.3329803243966334, "percentage": 33.3, "elapsed_time": "14:07:58", "remaining_time": "1 day, 4:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5975, "total_steps": 17941, "loss": 1.6199, "learning_rate": 7.657386377922409e-05, "epoch": 0.33303606264979657, "percentage": 33.3, "elapsed_time": "14:08:07", "remaining_time": "1 day, 4:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5976, "total_steps": 17941, "loss": 1.5635, "learning_rate": 7.656632082372315e-05, "epoch": 0.3330918009029597, "percentage": 33.31, "elapsed_time": "14:08:15", "remaining_time": "1 day, 4:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5977, "total_steps": 17941, "loss": 1.7578, "learning_rate": 7.65587770256934e-05, "epoch": 0.33314753915612283, "percentage": 33.31, "elapsed_time": "14:08:24", "remaining_time": "1 day, 4:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5978, "total_steps": 17941, "loss": 1.4157, "learning_rate": 7.655123238537409e-05, "epoch": 0.333203277409286, "percentage": 33.32, "elapsed_time": "14:08:33", "remaining_time": "1 day, 4:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5979, "total_steps": 17941, "loss": 1.8876, "learning_rate": 7.65436869030045e-05, "epoch": 0.33325901566244914, "percentage": 33.33, "elapsed_time": "14:08:41", "remaining_time": "1 day, 4:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5980, "total_steps": 17941, "loss": 1.7052, "learning_rate": 7.653614057882393e-05, "epoch": 0.33331475391561227, "percentage": 33.33, "elapsed_time": "14:08:50", "remaining_time": "1 day, 4:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5981, "total_steps": 17941, "loss": 1.7011, "learning_rate": 7.652859341307168e-05, "epoch": 0.33337049216877546, "percentage": 33.34, "elapsed_time": "14:08:58", "remaining_time": "1 day, 4:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5982, "total_steps": 17941, "loss": 1.7664, "learning_rate": 7.652104540598712e-05, "epoch": 0.3334262304219386, "percentage": 33.34, "elapsed_time": "14:09:07", "remaining_time": "1 day, 4:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5983, "total_steps": 17941, "loss": 1.5627, "learning_rate": 7.651349655780965e-05, "epoch": 0.3334819686751017, "percentage": 33.35, "elapsed_time": "14:09:16", "remaining_time": "1 day, 4:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5984, "total_steps": 17941, "loss": 1.8128, "learning_rate": 7.650594686877863e-05, "epoch": 0.33353770692826484, "percentage": 33.35, "elapsed_time": "14:09:24", "remaining_time": "1 day, 4:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5985, "total_steps": 17941, "loss": 1.6395, "learning_rate": 7.649839633913352e-05, "epoch": 0.333593445181428, "percentage": 33.36, "elapsed_time": "14:09:33", "remaining_time": "1 day, 4:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5986, "total_steps": 17941, "loss": 1.7467, "learning_rate": 7.649084496911378e-05, "epoch": 0.33364918343459116, "percentage": 33.36, "elapsed_time": "14:09:42", "remaining_time": "1 day, 4:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5987, "total_steps": 17941, "loss": 1.8314, "learning_rate": 7.648329275895889e-05, "epoch": 0.3337049216877543, "percentage": 33.37, "elapsed_time": "14:09:50", "remaining_time": "1 day, 4:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5988, "total_steps": 17941, "loss": 1.5876, "learning_rate": 7.647573970890837e-05, "epoch": 0.33376065994091747, "percentage": 33.38, "elapsed_time": "14:09:59", "remaining_time": "1 day, 4:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5989, "total_steps": 17941, "loss": 1.6042, "learning_rate": 7.646818581920173e-05, "epoch": 0.3338163981940806, "percentage": 33.38, "elapsed_time": "14:10:08", "remaining_time": "1 day, 4:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5990, "total_steps": 17941, "loss": 1.5054, "learning_rate": 7.646063109007858e-05, "epoch": 0.33387213644724373, "percentage": 33.39, "elapsed_time": "14:10:17", "remaining_time": "1 day, 4:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5991, "total_steps": 17941, "loss": 1.7355, "learning_rate": 7.645307552177847e-05, "epoch": 0.3339278747004069, "percentage": 33.39, "elapsed_time": "14:10:25", "remaining_time": "1 day, 4:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5992, "total_steps": 17941, "loss": 1.5428, "learning_rate": 7.644551911454103e-05, "epoch": 0.33398361295357004, "percentage": 33.4, "elapsed_time": "14:10:34", "remaining_time": "1 day, 4:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5993, "total_steps": 17941, "loss": 1.8064, "learning_rate": 7.643796186860595e-05, "epoch": 0.33403935120673317, "percentage": 33.4, "elapsed_time": "14:10:43", "remaining_time": "1 day, 4:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5994, "total_steps": 17941, "loss": 1.9495, "learning_rate": 7.643040378421282e-05, "epoch": 0.3340950894598963, "percentage": 33.41, "elapsed_time": "14:10:51", "remaining_time": "1 day, 4:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5995, "total_steps": 17941, "loss": 1.6926, "learning_rate": 7.64228448616014e-05, "epoch": 0.3341508277130595, "percentage": 33.42, "elapsed_time": "14:11:00", "remaining_time": "1 day, 4:15:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5996, "total_steps": 17941, "loss": 1.6566, "learning_rate": 7.64152851010114e-05, "epoch": 0.3342065659662226, "percentage": 33.42, "elapsed_time": "14:11:09", "remaining_time": "1 day, 4:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5997, "total_steps": 17941, "loss": 1.6196, "learning_rate": 7.640772450268255e-05, "epoch": 0.33426230421938574, "percentage": 33.43, "elapsed_time": "14:11:18", "remaining_time": "1 day, 4:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5998, "total_steps": 17941, "loss": 1.6845, "learning_rate": 7.640016306685467e-05, "epoch": 0.3343180424725489, "percentage": 33.43, "elapsed_time": "14:11:26", "remaining_time": "1 day, 4:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5999, "total_steps": 17941, "loss": 1.9948, "learning_rate": 7.639260079376753e-05, "epoch": 0.33437378072571206, "percentage": 33.44, "elapsed_time": "14:11:35", "remaining_time": "1 day, 4:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6000, "total_steps": 17941, "loss": 1.6778, "learning_rate": 7.638503768366098e-05, "epoch": 0.3344295189788752, "percentage": 33.44, "elapsed_time": "14:11:43", "remaining_time": "1 day, 4:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6001, "total_steps": 17941, "loss": 1.6279, "learning_rate": 7.637747373677486e-05, "epoch": 0.33448525723203837, "percentage": 33.45, "elapsed_time": "14:11:53", "remaining_time": "1 day, 4:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6002, "total_steps": 17941, "loss": 1.7001, "learning_rate": 7.636990895334907e-05, "epoch": 0.3345409954852015, "percentage": 33.45, "elapsed_time": "14:12:01", "remaining_time": "1 day, 4:14:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6003, "total_steps": 17941, "loss": 1.7576, "learning_rate": 7.63623433336235e-05, "epoch": 0.3345967337383646, "percentage": 33.46, "elapsed_time": "14:12:10", "remaining_time": "1 day, 4:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6004, "total_steps": 17941, "loss": 1.844, "learning_rate": 7.635477687783814e-05, "epoch": 0.3346524719915278, "percentage": 33.47, "elapsed_time": "14:12:18", "remaining_time": "1 day, 4:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6005, "total_steps": 17941, "loss": 1.6125, "learning_rate": 7.634720958623287e-05, "epoch": 0.33470821024469094, "percentage": 33.47, "elapsed_time": "14:12:27", "remaining_time": "1 day, 4:14:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6006, "total_steps": 17941, "loss": 1.7169, "learning_rate": 7.633964145904777e-05, "epoch": 0.33476394849785407, "percentage": 33.48, "elapsed_time": "14:12:35", "remaining_time": "1 day, 4:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6007, "total_steps": 17941, "loss": 1.6944, "learning_rate": 7.633207249652278e-05, "epoch": 0.3348196867510172, "percentage": 33.48, "elapsed_time": "14:12:44", "remaining_time": "1 day, 4:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6008, "total_steps": 17941, "loss": 1.4025, "learning_rate": 7.6324502698898e-05, "epoch": 0.3348754250041804, "percentage": 33.49, "elapsed_time": "14:12:53", "remaining_time": "1 day, 4:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6009, "total_steps": 17941, "loss": 1.7292, "learning_rate": 7.631693206641346e-05, "epoch": 0.3349311632573435, "percentage": 33.49, "elapsed_time": "14:13:01", "remaining_time": "1 day, 4:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6010, "total_steps": 17941, "loss": 1.5525, "learning_rate": 7.630936059930927e-05, "epoch": 0.33498690151050664, "percentage": 33.5, "elapsed_time": "14:13:09", "remaining_time": "1 day, 4:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6011, "total_steps": 17941, "loss": 1.7284, "learning_rate": 7.630178829782558e-05, "epoch": 0.3350426397636698, "percentage": 33.5, "elapsed_time": "14:13:18", "remaining_time": "1 day, 4:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6012, "total_steps": 17941, "loss": 1.6727, "learning_rate": 7.629421516220249e-05, "epoch": 0.33509837801683295, "percentage": 33.51, "elapsed_time": "14:13:26", "remaining_time": "1 day, 4:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6013, "total_steps": 17941, "loss": 1.7325, "learning_rate": 7.628664119268023e-05, "epoch": 0.3351541162699961, "percentage": 33.52, "elapsed_time": "14:13:35", "remaining_time": "1 day, 4:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6014, "total_steps": 17941, "loss": 1.5102, "learning_rate": 7.627906638949895e-05, "epoch": 0.33520985452315927, "percentage": 33.52, "elapsed_time": "14:13:43", "remaining_time": "1 day, 4:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6015, "total_steps": 17941, "loss": 1.5725, "learning_rate": 7.62714907528989e-05, "epoch": 0.3352655927763224, "percentage": 33.53, "elapsed_time": "14:13:52", "remaining_time": "1 day, 4:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6016, "total_steps": 17941, "loss": 1.8119, "learning_rate": 7.626391428312035e-05, "epoch": 0.3353213310294855, "percentage": 33.53, "elapsed_time": "14:14:00", "remaining_time": "1 day, 4:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6017, "total_steps": 17941, "loss": 1.4209, "learning_rate": 7.625633698040357e-05, "epoch": 0.33537706928264865, "percentage": 33.54, "elapsed_time": "14:14:09", "remaining_time": "1 day, 4:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6018, "total_steps": 17941, "loss": 1.8436, "learning_rate": 7.624875884498886e-05, "epoch": 0.33543280753581184, "percentage": 33.54, "elapsed_time": "14:14:17", "remaining_time": "1 day, 4:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6019, "total_steps": 17941, "loss": 1.836, "learning_rate": 7.624117987711656e-05, "epoch": 0.33548854578897497, "percentage": 33.55, "elapsed_time": "14:14:26", "remaining_time": "1 day, 4:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6020, "total_steps": 17941, "loss": 1.7539, "learning_rate": 7.623360007702702e-05, "epoch": 0.3355442840421381, "percentage": 33.55, "elapsed_time": "14:14:34", "remaining_time": "1 day, 4:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6021, "total_steps": 17941, "loss": 1.6686, "learning_rate": 7.622601944496064e-05, "epoch": 0.3356000222953013, "percentage": 33.56, "elapsed_time": "14:14:42", "remaining_time": "1 day, 4:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6022, "total_steps": 17941, "loss": 1.5361, "learning_rate": 7.621843798115785e-05, "epoch": 0.3356557605484644, "percentage": 33.57, "elapsed_time": "14:14:51", "remaining_time": "1 day, 4:11:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6023, "total_steps": 17941, "loss": 1.8225, "learning_rate": 7.621085568585905e-05, "epoch": 0.33571149880162754, "percentage": 33.57, "elapsed_time": "14:14:59", "remaining_time": "1 day, 4:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6024, "total_steps": 17941, "loss": 1.908, "learning_rate": 7.620327255930474e-05, "epoch": 0.3357672370547907, "percentage": 33.58, "elapsed_time": "14:15:08", "remaining_time": "1 day, 4:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6025, "total_steps": 17941, "loss": 1.6388, "learning_rate": 7.61956886017354e-05, "epoch": 0.33582297530795385, "percentage": 33.58, "elapsed_time": "14:15:16", "remaining_time": "1 day, 4:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6026, "total_steps": 17941, "loss": 1.8774, "learning_rate": 7.618810381339155e-05, "epoch": 0.335878713561117, "percentage": 33.59, "elapsed_time": "14:15:25", "remaining_time": "1 day, 4:11:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6027, "total_steps": 17941, "loss": 1.6372, "learning_rate": 7.618051819451373e-05, "epoch": 0.33593445181428017, "percentage": 33.59, "elapsed_time": "14:15:33", "remaining_time": "1 day, 4:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6028, "total_steps": 17941, "loss": 1.7415, "learning_rate": 7.617293174534253e-05, "epoch": 0.3359901900674433, "percentage": 33.6, "elapsed_time": "14:15:42", "remaining_time": "1 day, 4:11:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6029, "total_steps": 17941, "loss": 1.6005, "learning_rate": 7.616534446611851e-05, "epoch": 0.3360459283206064, "percentage": 33.6, "elapsed_time": "14:15:50", "remaining_time": "1 day, 4:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6030, "total_steps": 17941, "loss": 1.6998, "learning_rate": 7.615775635708234e-05, "epoch": 0.33610166657376955, "percentage": 33.61, "elapsed_time": "14:15:59", "remaining_time": "1 day, 4:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6031, "total_steps": 17941, "loss": 1.6948, "learning_rate": 7.615016741847463e-05, "epoch": 0.33615740482693274, "percentage": 33.62, "elapsed_time": "14:16:08", "remaining_time": "1 day, 4:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6032, "total_steps": 17941, "loss": 1.5575, "learning_rate": 7.614257765053609e-05, "epoch": 0.33621314308009587, "percentage": 33.62, "elapsed_time": "14:16:16", "remaining_time": "1 day, 4:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6033, "total_steps": 17941, "loss": 1.7633, "learning_rate": 7.61349870535074e-05, "epoch": 0.336268881333259, "percentage": 33.63, "elapsed_time": "14:16:25", "remaining_time": "1 day, 4:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6034, "total_steps": 17941, "loss": 1.8196, "learning_rate": 7.612739562762929e-05, "epoch": 0.3363246195864222, "percentage": 33.63, "elapsed_time": "14:16:33", "remaining_time": "1 day, 4:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6035, "total_steps": 17941, "loss": 1.7916, "learning_rate": 7.611980337314254e-05, "epoch": 0.3363803578395853, "percentage": 33.64, "elapsed_time": "14:16:42", "remaining_time": "1 day, 4:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6036, "total_steps": 17941, "loss": 1.6909, "learning_rate": 7.61122102902879e-05, "epoch": 0.33643609609274844, "percentage": 33.64, "elapsed_time": "14:16:50", "remaining_time": "1 day, 4:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6037, "total_steps": 17941, "loss": 1.7166, "learning_rate": 7.610461637930621e-05, "epoch": 0.3364918343459116, "percentage": 33.65, "elapsed_time": "14:16:59", "remaining_time": "1 day, 4:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6038, "total_steps": 17941, "loss": 1.6479, "learning_rate": 7.609702164043829e-05, "epoch": 0.33654757259907475, "percentage": 33.65, "elapsed_time": "14:17:07", "remaining_time": "1 day, 4:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6039, "total_steps": 17941, "loss": 1.7645, "learning_rate": 7.6089426073925e-05, "epoch": 0.3366033108522379, "percentage": 33.66, "elapsed_time": "14:17:16", "remaining_time": "1 day, 4:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6040, "total_steps": 17941, "loss": 1.7543, "learning_rate": 7.608182968000721e-05, "epoch": 0.336659049105401, "percentage": 33.67, "elapsed_time": "14:17:24", "remaining_time": "1 day, 4:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6041, "total_steps": 17941, "loss": 1.6023, "learning_rate": 7.607423245892586e-05, "epoch": 0.3367147873585642, "percentage": 33.67, "elapsed_time": "14:17:33", "remaining_time": "1 day, 4:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6042, "total_steps": 17941, "loss": 1.7298, "learning_rate": 7.606663441092188e-05, "epoch": 0.3367705256117273, "percentage": 33.68, "elapsed_time": "14:17:41", "remaining_time": "1 day, 4:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6043, "total_steps": 17941, "loss": 1.9093, "learning_rate": 7.605903553623625e-05, "epoch": 0.33682626386489045, "percentage": 33.68, "elapsed_time": "14:17:49", "remaining_time": "1 day, 4:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6044, "total_steps": 17941, "loss": 1.7111, "learning_rate": 7.605143583510991e-05, "epoch": 0.33688200211805364, "percentage": 33.69, "elapsed_time": "14:17:58", "remaining_time": "1 day, 4:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6045, "total_steps": 17941, "loss": 1.5154, "learning_rate": 7.604383530778396e-05, "epoch": 0.33693774037121677, "percentage": 33.69, "elapsed_time": "14:18:06", "remaining_time": "1 day, 4:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6046, "total_steps": 17941, "loss": 1.7287, "learning_rate": 7.603623395449937e-05, "epoch": 0.3369934786243799, "percentage": 33.7, "elapsed_time": "14:18:15", "remaining_time": "1 day, 4:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6047, "total_steps": 17941, "loss": 1.7299, "learning_rate": 7.602863177549724e-05, "epoch": 0.3370492168775431, "percentage": 33.7, "elapsed_time": "14:18:24", "remaining_time": "1 day, 4:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6048, "total_steps": 17941, "loss": 1.8304, "learning_rate": 7.602102877101869e-05, "epoch": 0.3371049551307062, "percentage": 33.71, "elapsed_time": "14:18:33", "remaining_time": "1 day, 4:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6049, "total_steps": 17941, "loss": 1.5754, "learning_rate": 7.60134249413048e-05, "epoch": 0.33716069338386934, "percentage": 33.72, "elapsed_time": "14:18:42", "remaining_time": "1 day, 4:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6050, "total_steps": 17941, "loss": 1.7943, "learning_rate": 7.600582028659675e-05, "epoch": 0.3372164316370325, "percentage": 33.72, "elapsed_time": "14:18:50", "remaining_time": "1 day, 4:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6051, "total_steps": 17941, "loss": 1.4528, "learning_rate": 7.59982148071357e-05, "epoch": 0.33727216989019565, "percentage": 33.73, "elapsed_time": "14:18:58", "remaining_time": "1 day, 4:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6052, "total_steps": 17941, "loss": 1.7503, "learning_rate": 7.599060850316287e-05, "epoch": 0.3373279081433588, "percentage": 33.73, "elapsed_time": "14:19:07", "remaining_time": "1 day, 4:07:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6053, "total_steps": 17941, "loss": 1.7732, "learning_rate": 7.598300137491946e-05, "epoch": 0.3373836463965219, "percentage": 33.74, "elapsed_time": "14:19:15", "remaining_time": "1 day, 4:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6054, "total_steps": 17941, "loss": 1.6534, "learning_rate": 7.597539342264675e-05, "epoch": 0.3374393846496851, "percentage": 33.74, "elapsed_time": "14:19:24", "remaining_time": "1 day, 4:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6055, "total_steps": 17941, "loss": 1.6286, "learning_rate": 7.596778464658599e-05, "epoch": 0.3374951229028482, "percentage": 33.75, "elapsed_time": "14:19:32", "remaining_time": "1 day, 4:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6056, "total_steps": 17941, "loss": 1.7787, "learning_rate": 7.596017504697851e-05, "epoch": 0.33755086115601135, "percentage": 33.76, "elapsed_time": "14:19:41", "remaining_time": "1 day, 4:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6057, "total_steps": 17941, "loss": 1.7862, "learning_rate": 7.595256462406564e-05, "epoch": 0.33760659940917453, "percentage": 33.76, "elapsed_time": "14:19:49", "remaining_time": "1 day, 4:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6058, "total_steps": 17941, "loss": 1.6926, "learning_rate": 7.594495337808873e-05, "epoch": 0.33766233766233766, "percentage": 33.77, "elapsed_time": "14:19:58", "remaining_time": "1 day, 4:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6059, "total_steps": 17941, "loss": 1.6135, "learning_rate": 7.593734130928918e-05, "epoch": 0.3377180759155008, "percentage": 33.77, "elapsed_time": "14:20:06", "remaining_time": "1 day, 4:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6060, "total_steps": 17941, "loss": 1.5746, "learning_rate": 7.592972841790837e-05, "epoch": 0.337773814168664, "percentage": 33.78, "elapsed_time": "14:20:14", "remaining_time": "1 day, 4:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6061, "total_steps": 17941, "loss": 1.6457, "learning_rate": 7.592211470418777e-05, "epoch": 0.3378295524218271, "percentage": 33.78, "elapsed_time": "14:20:23", "remaining_time": "1 day, 4:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6062, "total_steps": 17941, "loss": 1.7026, "learning_rate": 7.59145001683688e-05, "epoch": 0.33788529067499024, "percentage": 33.79, "elapsed_time": "14:20:31", "remaining_time": "1 day, 4:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6063, "total_steps": 17941, "loss": 1.8168, "learning_rate": 7.590688481069302e-05, "epoch": 0.33794102892815336, "percentage": 33.79, "elapsed_time": "14:20:40", "remaining_time": "1 day, 4:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6064, "total_steps": 17941, "loss": 1.607, "learning_rate": 7.589926863140187e-05, "epoch": 0.33799676718131655, "percentage": 33.8, "elapsed_time": "14:20:48", "remaining_time": "1 day, 4:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6065, "total_steps": 17941, "loss": 1.9372, "learning_rate": 7.589165163073695e-05, "epoch": 0.3380525054344797, "percentage": 33.81, "elapsed_time": "14:20:57", "remaining_time": "1 day, 4:05:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6066, "total_steps": 17941, "loss": 1.6545, "learning_rate": 7.588403380893979e-05, "epoch": 0.3381082436876428, "percentage": 33.81, "elapsed_time": "14:21:05", "remaining_time": "1 day, 4:05:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6067, "total_steps": 17941, "loss": 1.8205, "learning_rate": 7.587641516625197e-05, "epoch": 0.338163981940806, "percentage": 33.82, "elapsed_time": "14:21:14", "remaining_time": "1 day, 4:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6068, "total_steps": 17941, "loss": 1.8597, "learning_rate": 7.586879570291514e-05, "epoch": 0.3382197201939691, "percentage": 33.82, "elapsed_time": "14:21:23", "remaining_time": "1 day, 4:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6069, "total_steps": 17941, "loss": 1.5266, "learning_rate": 7.586117541917095e-05, "epoch": 0.33827545844713225, "percentage": 33.83, "elapsed_time": "14:21:32", "remaining_time": "1 day, 4:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6070, "total_steps": 17941, "loss": 1.721, "learning_rate": 7.585355431526104e-05, "epoch": 0.33833119670029543, "percentage": 33.83, "elapsed_time": "14:21:40", "remaining_time": "1 day, 4:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6071, "total_steps": 17941, "loss": 1.624, "learning_rate": 7.584593239142712e-05, "epoch": 0.33838693495345856, "percentage": 33.84, "elapsed_time": "14:21:49", "remaining_time": "1 day, 4:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6072, "total_steps": 17941, "loss": 1.8765, "learning_rate": 7.583830964791094e-05, "epoch": 0.3384426732066217, "percentage": 33.84, "elapsed_time": "14:21:57", "remaining_time": "1 day, 4:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6073, "total_steps": 17941, "loss": 1.6027, "learning_rate": 7.58306860849542e-05, "epoch": 0.3384984114597849, "percentage": 33.85, "elapsed_time": "14:22:06", "remaining_time": "1 day, 4:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6074, "total_steps": 17941, "loss": 1.8485, "learning_rate": 7.582306170279872e-05, "epoch": 0.338554149712948, "percentage": 33.86, "elapsed_time": "14:22:14", "remaining_time": "1 day, 4:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6075, "total_steps": 17941, "loss": 1.7822, "learning_rate": 7.581543650168628e-05, "epoch": 0.33860988796611113, "percentage": 33.86, "elapsed_time": "14:22:23", "remaining_time": "1 day, 4:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6076, "total_steps": 17941, "loss": 1.6443, "learning_rate": 7.580781048185871e-05, "epoch": 0.33866562621927426, "percentage": 33.87, "elapsed_time": "14:22:32", "remaining_time": "1 day, 4:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6077, "total_steps": 17941, "loss": 1.5943, "learning_rate": 7.580018364355785e-05, "epoch": 0.33872136447243745, "percentage": 33.87, "elapsed_time": "14:22:40", "remaining_time": "1 day, 4:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6078, "total_steps": 17941, "loss": 1.4501, "learning_rate": 7.579255598702562e-05, "epoch": 0.3387771027256006, "percentage": 33.88, "elapsed_time": "14:22:49", "remaining_time": "1 day, 4:04:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6079, "total_steps": 17941, "loss": 1.7001, "learning_rate": 7.578492751250386e-05, "epoch": 0.3388328409787637, "percentage": 33.88, "elapsed_time": "14:22:57", "remaining_time": "1 day, 4:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6080, "total_steps": 17941, "loss": 1.6652, "learning_rate": 7.577729822023455e-05, "epoch": 0.3388885792319269, "percentage": 33.89, "elapsed_time": "14:23:06", "remaining_time": "1 day, 4:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6081, "total_steps": 17941, "loss": 1.6988, "learning_rate": 7.576966811045963e-05, "epoch": 0.33894431748509, "percentage": 33.89, "elapsed_time": "14:23:14", "remaining_time": "1 day, 4:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6082, "total_steps": 17941, "loss": 1.9584, "learning_rate": 7.576203718342108e-05, "epoch": 0.33900005573825315, "percentage": 33.9, "elapsed_time": "14:23:23", "remaining_time": "1 day, 4:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6083, "total_steps": 17941, "loss": 2.0357, "learning_rate": 7.575440543936092e-05, "epoch": 0.33905579399141633, "percentage": 33.91, "elapsed_time": "14:23:31", "remaining_time": "1 day, 4:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6084, "total_steps": 17941, "loss": 1.6323, "learning_rate": 7.574677287852117e-05, "epoch": 0.33911153224457946, "percentage": 33.91, "elapsed_time": "14:23:40", "remaining_time": "1 day, 4:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6085, "total_steps": 17941, "loss": 1.538, "learning_rate": 7.573913950114391e-05, "epoch": 0.3391672704977426, "percentage": 33.92, "elapsed_time": "14:23:48", "remaining_time": "1 day, 4:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6086, "total_steps": 17941, "loss": 1.6013, "learning_rate": 7.573150530747122e-05, "epoch": 0.3392230087509057, "percentage": 33.92, "elapsed_time": "14:23:56", "remaining_time": "1 day, 4:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6087, "total_steps": 17941, "loss": 1.6444, "learning_rate": 7.572387029774519e-05, "epoch": 0.3392787470040689, "percentage": 33.93, "elapsed_time": "14:24:05", "remaining_time": "1 day, 4:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6088, "total_steps": 17941, "loss": 1.6733, "learning_rate": 7.571623447220797e-05, "epoch": 0.33933448525723203, "percentage": 33.93, "elapsed_time": "14:24:13", "remaining_time": "1 day, 4:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6089, "total_steps": 17941, "loss": 1.7219, "learning_rate": 7.570859783110176e-05, "epoch": 0.33939022351039516, "percentage": 33.94, "elapsed_time": "14:24:22", "remaining_time": "1 day, 4:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6090, "total_steps": 17941, "loss": 1.407, "learning_rate": 7.570096037466869e-05, "epoch": 0.33944596176355835, "percentage": 33.94, "elapsed_time": "14:24:30", "remaining_time": "1 day, 4:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6091, "total_steps": 17941, "loss": 1.4608, "learning_rate": 7.5693322103151e-05, "epoch": 0.3395017000167215, "percentage": 33.95, "elapsed_time": "14:24:39", "remaining_time": "1 day, 4:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6092, "total_steps": 17941, "loss": 1.6756, "learning_rate": 7.568568301679096e-05, "epoch": 0.3395574382698846, "percentage": 33.96, "elapsed_time": "14:24:47", "remaining_time": "1 day, 4:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6093, "total_steps": 17941, "loss": 1.7648, "learning_rate": 7.56780431158308e-05, "epoch": 0.3396131765230478, "percentage": 33.96, "elapsed_time": "14:24:56", "remaining_time": "1 day, 4:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6094, "total_steps": 17941, "loss": 1.6954, "learning_rate": 7.567040240051281e-05, "epoch": 0.3396689147762109, "percentage": 33.97, "elapsed_time": "14:25:04", "remaining_time": "1 day, 4:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6095, "total_steps": 17941, "loss": 1.8131, "learning_rate": 7.566276087107935e-05, "epoch": 0.33972465302937405, "percentage": 33.97, "elapsed_time": "14:25:12", "remaining_time": "1 day, 4:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6096, "total_steps": 17941, "loss": 1.6522, "learning_rate": 7.565511852777274e-05, "epoch": 0.33978039128253723, "percentage": 33.98, "elapsed_time": "14:25:21", "remaining_time": "1 day, 4:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6097, "total_steps": 17941, "loss": 1.6971, "learning_rate": 7.564747537083534e-05, "epoch": 0.33983612953570036, "percentage": 33.98, "elapsed_time": "14:25:29", "remaining_time": "1 day, 4:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6098, "total_steps": 17941, "loss": 1.6759, "learning_rate": 7.563983140050955e-05, "epoch": 0.3398918677888635, "percentage": 33.99, "elapsed_time": "14:25:39", "remaining_time": "1 day, 4:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6099, "total_steps": 17941, "loss": 1.7203, "learning_rate": 7.563218661703782e-05, "epoch": 0.3399476060420266, "percentage": 33.99, "elapsed_time": "14:25:48", "remaining_time": "1 day, 4:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6100, "total_steps": 17941, "loss": 1.9364, "learning_rate": 7.562454102066255e-05, "epoch": 0.3400033442951898, "percentage": 34.0, "elapsed_time": "14:25:56", "remaining_time": "1 day, 4:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6101, "total_steps": 17941, "loss": 1.6623, "learning_rate": 7.561689461162625e-05, "epoch": 0.34005908254835293, "percentage": 34.01, "elapsed_time": "14:26:05", "remaining_time": "1 day, 4:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6102, "total_steps": 17941, "loss": 1.567, "learning_rate": 7.56092473901714e-05, "epoch": 0.34011482080151606, "percentage": 34.01, "elapsed_time": "14:26:13", "remaining_time": "1 day, 4:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6103, "total_steps": 17941, "loss": 1.8714, "learning_rate": 7.560159935654056e-05, "epoch": 0.34017055905467924, "percentage": 34.02, "elapsed_time": "14:26:22", "remaining_time": "1 day, 4:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6104, "total_steps": 17941, "loss": 1.6713, "learning_rate": 7.559395051097624e-05, "epoch": 0.3402262973078424, "percentage": 34.02, "elapsed_time": "14:26:30", "remaining_time": "1 day, 4:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6105, "total_steps": 17941, "loss": 1.6552, "learning_rate": 7.558630085372105e-05, "epoch": 0.3402820355610055, "percentage": 34.03, "elapsed_time": "14:26:39", "remaining_time": "1 day, 4:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6106, "total_steps": 17941, "loss": 1.65, "learning_rate": 7.557865038501756e-05, "epoch": 0.3403377738141687, "percentage": 34.03, "elapsed_time": "14:26:47", "remaining_time": "1 day, 4:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6107, "total_steps": 17941, "loss": 1.8507, "learning_rate": 7.55709991051084e-05, "epoch": 0.3403935120673318, "percentage": 34.04, "elapsed_time": "14:26:56", "remaining_time": "1 day, 3:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6108, "total_steps": 17941, "loss": 2.0143, "learning_rate": 7.556334701423627e-05, "epoch": 0.34044925032049494, "percentage": 34.04, "elapsed_time": "14:27:04", "remaining_time": "1 day, 3:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6109, "total_steps": 17941, "loss": 1.9006, "learning_rate": 7.555569411264378e-05, "epoch": 0.3405049885736581, "percentage": 34.05, "elapsed_time": "14:27:12", "remaining_time": "1 day, 3:59:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6110, "total_steps": 17941, "loss": 1.4028, "learning_rate": 7.554804040057369e-05, "epoch": 0.34056072682682126, "percentage": 34.06, "elapsed_time": "14:27:21", "remaining_time": "1 day, 3:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6111, "total_steps": 17941, "loss": 1.6835, "learning_rate": 7.554038587826872e-05, "epoch": 0.3406164650799844, "percentage": 34.06, "elapsed_time": "14:27:29", "remaining_time": "1 day, 3:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6112, "total_steps": 17941, "loss": 1.5901, "learning_rate": 7.553273054597163e-05, "epoch": 0.3406722033331475, "percentage": 34.07, "elapsed_time": "14:27:38", "remaining_time": "1 day, 3:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6113, "total_steps": 17941, "loss": 1.8776, "learning_rate": 7.552507440392518e-05, "epoch": 0.3407279415863107, "percentage": 34.07, "elapsed_time": "14:27:46", "remaining_time": "1 day, 3:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6114, "total_steps": 17941, "loss": 1.4647, "learning_rate": 7.551741745237218e-05, "epoch": 0.34078367983947383, "percentage": 34.08, "elapsed_time": "14:27:55", "remaining_time": "1 day, 3:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6115, "total_steps": 17941, "loss": 1.8638, "learning_rate": 7.55097596915555e-05, "epoch": 0.34083941809263696, "percentage": 34.08, "elapsed_time": "14:28:03", "remaining_time": "1 day, 3:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6116, "total_steps": 17941, "loss": 1.7598, "learning_rate": 7.550210112171796e-05, "epoch": 0.34089515634580014, "percentage": 34.09, "elapsed_time": "14:28:12", "remaining_time": "1 day, 3:58:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6117, "total_steps": 17941, "loss": 1.8239, "learning_rate": 7.549444174310246e-05, "epoch": 0.34095089459896327, "percentage": 34.1, "elapsed_time": "14:28:20", "remaining_time": "1 day, 3:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6118, "total_steps": 17941, "loss": 1.7103, "learning_rate": 7.548678155595192e-05, "epoch": 0.3410066328521264, "percentage": 34.1, "elapsed_time": "14:28:29", "remaining_time": "1 day, 3:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6119, "total_steps": 17941, "loss": 1.8269, "learning_rate": 7.547912056050925e-05, "epoch": 0.3410623711052896, "percentage": 34.11, "elapsed_time": "14:28:37", "remaining_time": "1 day, 3:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6120, "total_steps": 17941, "loss": 1.7221, "learning_rate": 7.547145875701744e-05, "epoch": 0.3411181093584527, "percentage": 34.11, "elapsed_time": "14:28:46", "remaining_time": "1 day, 3:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6121, "total_steps": 17941, "loss": 1.6879, "learning_rate": 7.546379614571947e-05, "epoch": 0.34117384761161584, "percentage": 34.12, "elapsed_time": "14:28:54", "remaining_time": "1 day, 3:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6122, "total_steps": 17941, "loss": 1.9402, "learning_rate": 7.545613272685834e-05, "epoch": 0.341229585864779, "percentage": 34.12, "elapsed_time": "14:29:02", "remaining_time": "1 day, 3:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6123, "total_steps": 17941, "loss": 1.6331, "learning_rate": 7.544846850067711e-05, "epoch": 0.34128532411794216, "percentage": 34.13, "elapsed_time": "14:29:11", "remaining_time": "1 day, 3:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6124, "total_steps": 17941, "loss": 1.6547, "learning_rate": 7.544080346741884e-05, "epoch": 0.3413410623711053, "percentage": 34.13, "elapsed_time": "14:29:19", "remaining_time": "1 day, 3:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6125, "total_steps": 17941, "loss": 1.5988, "learning_rate": 7.54331376273266e-05, "epoch": 0.3413968006242684, "percentage": 34.14, "elapsed_time": "14:29:29", "remaining_time": "1 day, 3:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6126, "total_steps": 17941, "loss": 1.8314, "learning_rate": 7.542547098064351e-05, "epoch": 0.3414525388774316, "percentage": 34.15, "elapsed_time": "14:29:37", "remaining_time": "1 day, 3:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6127, "total_steps": 17941, "loss": 1.7797, "learning_rate": 7.541780352761275e-05, "epoch": 0.34150827713059473, "percentage": 34.15, "elapsed_time": "14:29:46", "remaining_time": "1 day, 3:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6128, "total_steps": 17941, "loss": 1.7118, "learning_rate": 7.541013526847745e-05, "epoch": 0.34156401538375786, "percentage": 34.16, "elapsed_time": "14:29:54", "remaining_time": "1 day, 3:56:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6129, "total_steps": 17941, "loss": 1.8582, "learning_rate": 7.540246620348079e-05, "epoch": 0.34161975363692104, "percentage": 34.16, "elapsed_time": "14:30:02", "remaining_time": "1 day, 3:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6130, "total_steps": 17941, "loss": 1.5773, "learning_rate": 7.539479633286604e-05, "epoch": 0.34167549189008417, "percentage": 34.17, "elapsed_time": "14:30:11", "remaining_time": "1 day, 3:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6131, "total_steps": 17941, "loss": 1.6079, "learning_rate": 7.538712565687637e-05, "epoch": 0.3417312301432473, "percentage": 34.17, "elapsed_time": "14:30:19", "remaining_time": "1 day, 3:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6132, "total_steps": 17941, "loss": 1.7772, "learning_rate": 7.537945417575513e-05, "epoch": 0.34178696839641043, "percentage": 34.18, "elapsed_time": "14:30:28", "remaining_time": "1 day, 3:56:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6133, "total_steps": 17941, "loss": 1.8646, "learning_rate": 7.537178188974556e-05, "epoch": 0.3418427066495736, "percentage": 34.18, "elapsed_time": "14:30:36", "remaining_time": "1 day, 3:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6134, "total_steps": 17941, "loss": 1.7059, "learning_rate": 7.5364108799091e-05, "epoch": 0.34189844490273674, "percentage": 34.19, "elapsed_time": "14:30:45", "remaining_time": "1 day, 3:56:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6135, "total_steps": 17941, "loss": 1.5904, "learning_rate": 7.535643490403478e-05, "epoch": 0.34195418315589987, "percentage": 34.2, "elapsed_time": "14:30:53", "remaining_time": "1 day, 3:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6136, "total_steps": 17941, "loss": 1.6569, "learning_rate": 7.534876020482032e-05, "epoch": 0.34200992140906306, "percentage": 34.2, "elapsed_time": "14:31:02", "remaining_time": "1 day, 3:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6137, "total_steps": 17941, "loss": 1.947, "learning_rate": 7.534108470169094e-05, "epoch": 0.3420656596622262, "percentage": 34.21, "elapsed_time": "14:31:11", "remaining_time": "1 day, 3:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6138, "total_steps": 17941, "loss": 1.6199, "learning_rate": 7.533340839489011e-05, "epoch": 0.3421213979153893, "percentage": 34.21, "elapsed_time": "14:31:19", "remaining_time": "1 day, 3:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6139, "total_steps": 17941, "loss": 1.901, "learning_rate": 7.532573128466129e-05, "epoch": 0.3421771361685525, "percentage": 34.22, "elapsed_time": "14:31:28", "remaining_time": "1 day, 3:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6140, "total_steps": 17941, "loss": 1.7284, "learning_rate": 7.53180533712479e-05, "epoch": 0.3422328744217156, "percentage": 34.22, "elapsed_time": "14:31:37", "remaining_time": "1 day, 3:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6141, "total_steps": 17941, "loss": 1.8184, "learning_rate": 7.53103746548935e-05, "epoch": 0.34228861267487876, "percentage": 34.23, "elapsed_time": "14:31:45", "remaining_time": "1 day, 3:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6142, "total_steps": 17941, "loss": 1.6444, "learning_rate": 7.530269513584158e-05, "epoch": 0.34234435092804194, "percentage": 34.23, "elapsed_time": "14:31:54", "remaining_time": "1 day, 3:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6143, "total_steps": 17941, "loss": 1.5748, "learning_rate": 7.52950148143357e-05, "epoch": 0.34240008918120507, "percentage": 34.24, "elapsed_time": "14:32:03", "remaining_time": "1 day, 3:54:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6144, "total_steps": 17941, "loss": 1.8188, "learning_rate": 7.528733369061942e-05, "epoch": 0.3424558274343682, "percentage": 34.25, "elapsed_time": "14:32:11", "remaining_time": "1 day, 3:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6145, "total_steps": 17941, "loss": 1.5839, "learning_rate": 7.527965176493636e-05, "epoch": 0.3425115656875313, "percentage": 34.25, "elapsed_time": "14:32:20", "remaining_time": "1 day, 3:54:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6146, "total_steps": 17941, "loss": 1.3862, "learning_rate": 7.527196903753011e-05, "epoch": 0.3425673039406945, "percentage": 34.26, "elapsed_time": "14:32:29", "remaining_time": "1 day, 3:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6147, "total_steps": 17941, "loss": 1.5308, "learning_rate": 7.526428550864437e-05, "epoch": 0.34262304219385764, "percentage": 34.26, "elapsed_time": "14:32:37", "remaining_time": "1 day, 3:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6148, "total_steps": 17941, "loss": 1.7377, "learning_rate": 7.525660117852279e-05, "epoch": 0.34267878044702077, "percentage": 34.27, "elapsed_time": "14:32:46", "remaining_time": "1 day, 3:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6149, "total_steps": 17941, "loss": 1.7305, "learning_rate": 7.524891604740908e-05, "epoch": 0.34273451870018395, "percentage": 34.27, "elapsed_time": "14:32:54", "remaining_time": "1 day, 3:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6150, "total_steps": 17941, "loss": 1.5379, "learning_rate": 7.524123011554697e-05, "epoch": 0.3427902569533471, "percentage": 34.28, "elapsed_time": "14:33:03", "remaining_time": "1 day, 3:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6151, "total_steps": 17941, "loss": 1.7069, "learning_rate": 7.52335433831802e-05, "epoch": 0.3428459952065102, "percentage": 34.28, "elapsed_time": "14:33:11", "remaining_time": "1 day, 3:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6152, "total_steps": 17941, "loss": 1.8944, "learning_rate": 7.522585585055255e-05, "epoch": 0.3429017334596734, "percentage": 34.29, "elapsed_time": "14:33:20", "remaining_time": "1 day, 3:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6153, "total_steps": 17941, "loss": 1.622, "learning_rate": 7.521816751790783e-05, "epoch": 0.3429574717128365, "percentage": 34.3, "elapsed_time": "14:33:28", "remaining_time": "1 day, 3:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6154, "total_steps": 17941, "loss": 1.8005, "learning_rate": 7.521047838548988e-05, "epoch": 0.34301320996599965, "percentage": 34.3, "elapsed_time": "14:33:37", "remaining_time": "1 day, 3:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6155, "total_steps": 17941, "loss": 1.4795, "learning_rate": 7.520278845354254e-05, "epoch": 0.3430689482191628, "percentage": 34.31, "elapsed_time": "14:33:45", "remaining_time": "1 day, 3:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6156, "total_steps": 17941, "loss": 1.5029, "learning_rate": 7.519509772230968e-05, "epoch": 0.34312468647232597, "percentage": 34.31, "elapsed_time": "14:33:54", "remaining_time": "1 day, 3:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6157, "total_steps": 17941, "loss": 1.7075, "learning_rate": 7.518740619203523e-05, "epoch": 0.3431804247254891, "percentage": 34.32, "elapsed_time": "14:34:02", "remaining_time": "1 day, 3:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6158, "total_steps": 17941, "loss": 1.9524, "learning_rate": 7.517971386296309e-05, "epoch": 0.3432361629786522, "percentage": 34.32, "elapsed_time": "14:34:10", "remaining_time": "1 day, 3:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6159, "total_steps": 17941, "loss": 1.533, "learning_rate": 7.517202073533727e-05, "epoch": 0.3432919012318154, "percentage": 34.33, "elapsed_time": "14:34:19", "remaining_time": "1 day, 3:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6160, "total_steps": 17941, "loss": 1.7298, "learning_rate": 7.516432680940168e-05, "epoch": 0.34334763948497854, "percentage": 34.33, "elapsed_time": "14:34:27", "remaining_time": "1 day, 3:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6161, "total_steps": 17941, "loss": 1.7295, "learning_rate": 7.515663208540037e-05, "epoch": 0.34340337773814167, "percentage": 34.34, "elapsed_time": "14:34:36", "remaining_time": "1 day, 3:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6162, "total_steps": 17941, "loss": 1.756, "learning_rate": 7.514893656357738e-05, "epoch": 0.34345911599130485, "percentage": 34.35, "elapsed_time": "14:34:45", "remaining_time": "1 day, 3:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6163, "total_steps": 17941, "loss": 1.7149, "learning_rate": 7.514124024417674e-05, "epoch": 0.343514854244468, "percentage": 34.35, "elapsed_time": "14:34:53", "remaining_time": "1 day, 3:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6164, "total_steps": 17941, "loss": 1.7262, "learning_rate": 7.513354312744256e-05, "epoch": 0.3435705924976311, "percentage": 34.36, "elapsed_time": "14:35:02", "remaining_time": "1 day, 3:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6165, "total_steps": 17941, "loss": 1.6434, "learning_rate": 7.512584521361891e-05, "epoch": 0.3436263307507943, "percentage": 34.36, "elapsed_time": "14:35:10", "remaining_time": "1 day, 3:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6166, "total_steps": 17941, "loss": 1.5353, "learning_rate": 7.511814650294994e-05, "epoch": 0.3436820690039574, "percentage": 34.37, "elapsed_time": "14:35:19", "remaining_time": "1 day, 3:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6167, "total_steps": 17941, "loss": 1.8312, "learning_rate": 7.511044699567981e-05, "epoch": 0.34373780725712055, "percentage": 34.37, "elapsed_time": "14:35:27", "remaining_time": "1 day, 3:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6168, "total_steps": 17941, "loss": 1.6326, "learning_rate": 7.510274669205273e-05, "epoch": 0.3437935455102837, "percentage": 34.38, "elapsed_time": "14:35:36", "remaining_time": "1 day, 3:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6169, "total_steps": 17941, "loss": 1.7319, "learning_rate": 7.509504559231287e-05, "epoch": 0.34384928376344687, "percentage": 34.38, "elapsed_time": "14:35:44", "remaining_time": "1 day, 3:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6170, "total_steps": 17941, "loss": 1.69, "learning_rate": 7.508734369670447e-05, "epoch": 0.34390502201661, "percentage": 34.39, "elapsed_time": "14:35:53", "remaining_time": "1 day, 3:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6171, "total_steps": 17941, "loss": 1.6961, "learning_rate": 7.507964100547181e-05, "epoch": 0.3439607602697731, "percentage": 34.4, "elapsed_time": "14:36:01", "remaining_time": "1 day, 3:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6172, "total_steps": 17941, "loss": 1.794, "learning_rate": 7.507193751885915e-05, "epoch": 0.3440164985229363, "percentage": 34.4, "elapsed_time": "14:36:10", "remaining_time": "1 day, 3:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6173, "total_steps": 17941, "loss": 1.637, "learning_rate": 7.506423323711083e-05, "epoch": 0.34407223677609944, "percentage": 34.41, "elapsed_time": "14:36:19", "remaining_time": "1 day, 3:50:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6174, "total_steps": 17941, "loss": 1.4696, "learning_rate": 7.505652816047115e-05, "epoch": 0.34412797502926257, "percentage": 34.41, "elapsed_time": "14:36:27", "remaining_time": "1 day, 3:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6175, "total_steps": 17941, "loss": 1.6329, "learning_rate": 7.504882228918449e-05, "epoch": 0.34418371328242575, "percentage": 34.42, "elapsed_time": "14:36:36", "remaining_time": "1 day, 3:50:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6176, "total_steps": 17941, "loss": 1.5929, "learning_rate": 7.504111562349524e-05, "epoch": 0.3442394515355889, "percentage": 34.42, "elapsed_time": "14:36:44", "remaining_time": "1 day, 3:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6177, "total_steps": 17941, "loss": 1.6935, "learning_rate": 7.503340816364779e-05, "epoch": 0.344295189788752, "percentage": 34.43, "elapsed_time": "14:36:54", "remaining_time": "1 day, 3:50:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6178, "total_steps": 17941, "loss": 1.5508, "learning_rate": 7.502569990988659e-05, "epoch": 0.3443509280419152, "percentage": 34.44, "elapsed_time": "14:37:02", "remaining_time": "1 day, 3:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6179, "total_steps": 17941, "loss": 1.3464, "learning_rate": 7.50179908624561e-05, "epoch": 0.3444066662950783, "percentage": 34.44, "elapsed_time": "14:37:11", "remaining_time": "1 day, 3:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6180, "total_steps": 17941, "loss": 1.6306, "learning_rate": 7.501028102160082e-05, "epoch": 0.34446240454824145, "percentage": 34.45, "elapsed_time": "14:37:19", "remaining_time": "1 day, 3:49:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6181, "total_steps": 17941, "loss": 1.9743, "learning_rate": 7.500257038756522e-05, "epoch": 0.3445181428014046, "percentage": 34.45, "elapsed_time": "14:37:27", "remaining_time": "1 day, 3:49:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6182, "total_steps": 17941, "loss": 1.7876, "learning_rate": 7.499485896059389e-05, "epoch": 0.34457388105456777, "percentage": 34.46, "elapsed_time": "14:37:36", "remaining_time": "1 day, 3:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6183, "total_steps": 17941, "loss": 1.599, "learning_rate": 7.498714674093134e-05, "epoch": 0.3446296193077309, "percentage": 34.46, "elapsed_time": "14:37:44", "remaining_time": "1 day, 3:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6184, "total_steps": 17941, "loss": 1.3671, "learning_rate": 7.497943372882219e-05, "epoch": 0.344685357560894, "percentage": 34.47, "elapsed_time": "14:37:53", "remaining_time": "1 day, 3:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6185, "total_steps": 17941, "loss": 1.8846, "learning_rate": 7.497171992451104e-05, "epoch": 0.3447410958140572, "percentage": 34.47, "elapsed_time": "14:38:01", "remaining_time": "1 day, 3:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6186, "total_steps": 17941, "loss": 1.8147, "learning_rate": 7.496400532824252e-05, "epoch": 0.34479683406722034, "percentage": 34.48, "elapsed_time": "14:38:10", "remaining_time": "1 day, 3:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6187, "total_steps": 17941, "loss": 1.8584, "learning_rate": 7.495628994026131e-05, "epoch": 0.34485257232038347, "percentage": 34.49, "elapsed_time": "14:38:18", "remaining_time": "1 day, 3:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6188, "total_steps": 17941, "loss": 1.6254, "learning_rate": 7.49485737608121e-05, "epoch": 0.34490831057354665, "percentage": 34.49, "elapsed_time": "14:38:27", "remaining_time": "1 day, 3:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6189, "total_steps": 17941, "loss": 1.5997, "learning_rate": 7.494085679013959e-05, "epoch": 0.3449640488267098, "percentage": 34.5, "elapsed_time": "14:38:35", "remaining_time": "1 day, 3:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6190, "total_steps": 17941, "loss": 1.7723, "learning_rate": 7.49331390284885e-05, "epoch": 0.3450197870798729, "percentage": 34.5, "elapsed_time": "14:38:43", "remaining_time": "1 day, 3:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6191, "total_steps": 17941, "loss": 1.7536, "learning_rate": 7.492542047610362e-05, "epoch": 0.34507552533303604, "percentage": 34.51, "elapsed_time": "14:38:52", "remaining_time": "1 day, 3:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6192, "total_steps": 17941, "loss": 1.5518, "learning_rate": 7.491770113322972e-05, "epoch": 0.3451312635861992, "percentage": 34.51, "elapsed_time": "14:39:00", "remaining_time": "1 day, 3:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6193, "total_steps": 17941, "loss": 1.8805, "learning_rate": 7.490998100011164e-05, "epoch": 0.34518700183936235, "percentage": 34.52, "elapsed_time": "14:39:09", "remaining_time": "1 day, 3:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6194, "total_steps": 17941, "loss": 1.7369, "learning_rate": 7.490226007699418e-05, "epoch": 0.3452427400925255, "percentage": 34.52, "elapsed_time": "14:39:17", "remaining_time": "1 day, 3:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6195, "total_steps": 17941, "loss": 1.7199, "learning_rate": 7.489453836412224e-05, "epoch": 0.34529847834568866, "percentage": 34.53, "elapsed_time": "14:39:26", "remaining_time": "1 day, 3:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6196, "total_steps": 17941, "loss": 1.8962, "learning_rate": 7.488681586174066e-05, "epoch": 0.3453542165988518, "percentage": 34.54, "elapsed_time": "14:39:34", "remaining_time": "1 day, 3:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6197, "total_steps": 17941, "loss": 1.6779, "learning_rate": 7.48790925700944e-05, "epoch": 0.3454099548520149, "percentage": 34.54, "elapsed_time": "14:39:43", "remaining_time": "1 day, 3:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6198, "total_steps": 17941, "loss": 1.837, "learning_rate": 7.487136848942838e-05, "epoch": 0.3454656931051781, "percentage": 34.55, "elapsed_time": "14:39:51", "remaining_time": "1 day, 3:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6199, "total_steps": 17941, "loss": 1.5438, "learning_rate": 7.486364361998754e-05, "epoch": 0.34552143135834124, "percentage": 34.55, "elapsed_time": "14:39:59", "remaining_time": "1 day, 3:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6200, "total_steps": 17941, "loss": 1.8893, "learning_rate": 7.485591796201692e-05, "epoch": 0.34557716961150436, "percentage": 34.56, "elapsed_time": "14:40:08", "remaining_time": "1 day, 3:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6201, "total_steps": 17941, "loss": 1.7063, "learning_rate": 7.484819151576147e-05, "epoch": 0.34563290786466755, "percentage": 34.56, "elapsed_time": "14:40:16", "remaining_time": "1 day, 3:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6202, "total_steps": 17941, "loss": 1.6052, "learning_rate": 7.48404642814663e-05, "epoch": 0.3456886461178307, "percentage": 34.57, "elapsed_time": "14:40:25", "remaining_time": "1 day, 3:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6203, "total_steps": 17941, "loss": 1.5859, "learning_rate": 7.48327362593764e-05, "epoch": 0.3457443843709938, "percentage": 34.57, "elapsed_time": "14:40:33", "remaining_time": "1 day, 3:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6204, "total_steps": 17941, "loss": 1.9669, "learning_rate": 7.48250074497369e-05, "epoch": 0.34580012262415694, "percentage": 34.58, "elapsed_time": "14:40:43", "remaining_time": "1 day, 3:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6205, "total_steps": 17941, "loss": 1.6103, "learning_rate": 7.48172778527929e-05, "epoch": 0.3458558608773201, "percentage": 34.59, "elapsed_time": "14:40:51", "remaining_time": "1 day, 3:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6206, "total_steps": 17941, "loss": 1.4648, "learning_rate": 7.480954746878955e-05, "epoch": 0.34591159913048325, "percentage": 34.59, "elapsed_time": "14:41:00", "remaining_time": "1 day, 3:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6207, "total_steps": 17941, "loss": 1.7882, "learning_rate": 7.480181629797201e-05, "epoch": 0.3459673373836464, "percentage": 34.6, "elapsed_time": "14:41:08", "remaining_time": "1 day, 3:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6208, "total_steps": 17941, "loss": 1.757, "learning_rate": 7.479408434058545e-05, "epoch": 0.34602307563680956, "percentage": 34.6, "elapsed_time": "14:41:16", "remaining_time": "1 day, 3:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6209, "total_steps": 17941, "loss": 1.6573, "learning_rate": 7.47863515968751e-05, "epoch": 0.3460788138899727, "percentage": 34.61, "elapsed_time": "14:41:25", "remaining_time": "1 day, 3:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6210, "total_steps": 17941, "loss": 1.8348, "learning_rate": 7.477861806708618e-05, "epoch": 0.3461345521431358, "percentage": 34.61, "elapsed_time": "14:41:33", "remaining_time": "1 day, 3:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6211, "total_steps": 17941, "loss": 2.1581, "learning_rate": 7.477088375146397e-05, "epoch": 0.346190290396299, "percentage": 34.62, "elapsed_time": "14:41:42", "remaining_time": "1 day, 3:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6212, "total_steps": 17941, "loss": 1.7823, "learning_rate": 7.476314865025376e-05, "epoch": 0.34624602864946213, "percentage": 34.62, "elapsed_time": "14:41:51", "remaining_time": "1 day, 3:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6213, "total_steps": 17941, "loss": 1.5717, "learning_rate": 7.475541276370083e-05, "epoch": 0.34630176690262526, "percentage": 34.63, "elapsed_time": "14:41:59", "remaining_time": "1 day, 3:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6214, "total_steps": 17941, "loss": 1.8471, "learning_rate": 7.474767609205057e-05, "epoch": 0.3463575051557884, "percentage": 34.64, "elapsed_time": "14:42:08", "remaining_time": "1 day, 3:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6215, "total_steps": 17941, "loss": 1.5991, "learning_rate": 7.473993863554832e-05, "epoch": 0.3464132434089516, "percentage": 34.64, "elapsed_time": "14:42:16", "remaining_time": "1 day, 3:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6216, "total_steps": 17941, "loss": 1.8795, "learning_rate": 7.473220039443942e-05, "epoch": 0.3464689816621147, "percentage": 34.65, "elapsed_time": "14:42:25", "remaining_time": "1 day, 3:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6217, "total_steps": 17941, "loss": 1.5189, "learning_rate": 7.472446136896935e-05, "epoch": 0.34652471991527783, "percentage": 34.65, "elapsed_time": "14:42:33", "remaining_time": "1 day, 3:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6218, "total_steps": 17941, "loss": 1.5113, "learning_rate": 7.471672155938351e-05, "epoch": 0.346580458168441, "percentage": 34.66, "elapsed_time": "14:42:42", "remaining_time": "1 day, 3:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6219, "total_steps": 17941, "loss": 1.62, "learning_rate": 7.470898096592738e-05, "epoch": 0.34663619642160415, "percentage": 34.66, "elapsed_time": "14:42:50", "remaining_time": "1 day, 3:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6220, "total_steps": 17941, "loss": 1.7652, "learning_rate": 7.470123958884643e-05, "epoch": 0.3466919346747673, "percentage": 34.67, "elapsed_time": "14:42:59", "remaining_time": "1 day, 3:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6221, "total_steps": 17941, "loss": 1.816, "learning_rate": 7.469349742838619e-05, "epoch": 0.34674767292793046, "percentage": 34.67, "elapsed_time": "14:43:07", "remaining_time": "1 day, 3:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6222, "total_steps": 17941, "loss": 1.4521, "learning_rate": 7.468575448479217e-05, "epoch": 0.3468034111810936, "percentage": 34.68, "elapsed_time": "14:43:16", "remaining_time": "1 day, 3:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6223, "total_steps": 17941, "loss": 1.6393, "learning_rate": 7.467801075830995e-05, "epoch": 0.3468591494342567, "percentage": 34.69, "elapsed_time": "14:43:24", "remaining_time": "1 day, 3:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6224, "total_steps": 17941, "loss": 1.8486, "learning_rate": 7.467026624918511e-05, "epoch": 0.3469148876874199, "percentage": 34.69, "elapsed_time": "14:43:33", "remaining_time": "1 day, 3:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6225, "total_steps": 17941, "loss": 1.9639, "learning_rate": 7.466252095766326e-05, "epoch": 0.34697062594058303, "percentage": 34.7, "elapsed_time": "14:43:41", "remaining_time": "1 day, 3:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6226, "total_steps": 17941, "loss": 1.7672, "learning_rate": 7.465477488399004e-05, "epoch": 0.34702636419374616, "percentage": 34.7, "elapsed_time": "14:43:49", "remaining_time": "1 day, 3:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6227, "total_steps": 17941, "loss": 1.8587, "learning_rate": 7.464702802841111e-05, "epoch": 0.3470821024469093, "percentage": 34.71, "elapsed_time": "14:43:58", "remaining_time": "1 day, 3:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6228, "total_steps": 17941, "loss": 1.6798, "learning_rate": 7.463928039117216e-05, "epoch": 0.3471378407000725, "percentage": 34.71, "elapsed_time": "14:44:06", "remaining_time": "1 day, 3:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6229, "total_steps": 17941, "loss": 1.6258, "learning_rate": 7.463153197251889e-05, "epoch": 0.3471935789532356, "percentage": 34.72, "elapsed_time": "14:44:15", "remaining_time": "1 day, 3:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6230, "total_steps": 17941, "loss": 1.6253, "learning_rate": 7.462378277269704e-05, "epoch": 0.34724931720639873, "percentage": 34.72, "elapsed_time": "14:44:23", "remaining_time": "1 day, 3:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6231, "total_steps": 17941, "loss": 1.7417, "learning_rate": 7.461603279195235e-05, "epoch": 0.3473050554595619, "percentage": 34.73, "elapsed_time": "14:44:32", "remaining_time": "1 day, 3:42:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6232, "total_steps": 17941, "loss": 1.8448, "learning_rate": 7.460828203053063e-05, "epoch": 0.34736079371272505, "percentage": 34.74, "elapsed_time": "14:44:40", "remaining_time": "1 day, 3:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6233, "total_steps": 17941, "loss": 1.783, "learning_rate": 7.460053048867768e-05, "epoch": 0.3474165319658882, "percentage": 34.74, "elapsed_time": "14:44:49", "remaining_time": "1 day, 3:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6234, "total_steps": 17941, "loss": 1.8757, "learning_rate": 7.459277816663934e-05, "epoch": 0.34747227021905136, "percentage": 34.75, "elapsed_time": "14:44:57", "remaining_time": "1 day, 3:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6235, "total_steps": 17941, "loss": 1.622, "learning_rate": 7.458502506466147e-05, "epoch": 0.3475280084722145, "percentage": 34.75, "elapsed_time": "14:45:06", "remaining_time": "1 day, 3:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6236, "total_steps": 17941, "loss": 1.4801, "learning_rate": 7.457727118298991e-05, "epoch": 0.3475837467253776, "percentage": 34.76, "elapsed_time": "14:45:15", "remaining_time": "1 day, 3:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6237, "total_steps": 17941, "loss": 1.6797, "learning_rate": 7.456951652187063e-05, "epoch": 0.34763948497854075, "percentage": 34.76, "elapsed_time": "14:45:23", "remaining_time": "1 day, 3:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6238, "total_steps": 17941, "loss": 2.0804, "learning_rate": 7.456176108154956e-05, "epoch": 0.34769522323170393, "percentage": 34.77, "elapsed_time": "14:45:32", "remaining_time": "1 day, 3:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6239, "total_steps": 17941, "loss": 1.881, "learning_rate": 7.45540048622726e-05, "epoch": 0.34775096148486706, "percentage": 34.78, "elapsed_time": "14:45:40", "remaining_time": "1 day, 3:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6240, "total_steps": 17941, "loss": 1.7058, "learning_rate": 7.454624786428576e-05, "epoch": 0.3478066997380302, "percentage": 34.78, "elapsed_time": "14:45:49", "remaining_time": "1 day, 3:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6241, "total_steps": 17941, "loss": 1.7262, "learning_rate": 7.453849008783507e-05, "epoch": 0.3478624379911934, "percentage": 34.79, "elapsed_time": "14:45:57", "remaining_time": "1 day, 3:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6242, "total_steps": 17941, "loss": 1.7584, "learning_rate": 7.453073153316654e-05, "epoch": 0.3479181762443565, "percentage": 34.79, "elapsed_time": "14:46:06", "remaining_time": "1 day, 3:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6243, "total_steps": 17941, "loss": 1.7057, "learning_rate": 7.452297220052624e-05, "epoch": 0.34797391449751963, "percentage": 34.8, "elapsed_time": "14:46:14", "remaining_time": "1 day, 3:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6244, "total_steps": 17941, "loss": 1.8928, "learning_rate": 7.451521209016021e-05, "epoch": 0.3480296527506828, "percentage": 34.8, "elapsed_time": "14:46:23", "remaining_time": "1 day, 3:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6245, "total_steps": 17941, "loss": 1.9479, "learning_rate": 7.450745120231462e-05, "epoch": 0.34808539100384595, "percentage": 34.81, "elapsed_time": "14:46:31", "remaining_time": "1 day, 3:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6246, "total_steps": 17941, "loss": 1.678, "learning_rate": 7.449968953723554e-05, "epoch": 0.3481411292570091, "percentage": 34.81, "elapsed_time": "14:46:39", "remaining_time": "1 day, 3:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6247, "total_steps": 17941, "loss": 1.7936, "learning_rate": 7.449192709516916e-05, "epoch": 0.34819686751017226, "percentage": 34.82, "elapsed_time": "14:46:48", "remaining_time": "1 day, 3:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6248, "total_steps": 17941, "loss": 1.8022, "learning_rate": 7.448416387636166e-05, "epoch": 0.3482526057633354, "percentage": 34.83, "elapsed_time": "14:46:56", "remaining_time": "1 day, 3:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6249, "total_steps": 17941, "loss": 1.6318, "learning_rate": 7.447639988105922e-05, "epoch": 0.3483083440164985, "percentage": 34.83, "elapsed_time": "14:47:05", "remaining_time": "1 day, 3:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6250, "total_steps": 17941, "loss": 2.0857, "learning_rate": 7.44686351095081e-05, "epoch": 0.34836408226966165, "percentage": 34.84, "elapsed_time": "14:47:13", "remaining_time": "1 day, 3:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6251, "total_steps": 17941, "loss": 1.6236, "learning_rate": 7.446086956195452e-05, "epoch": 0.34841982052282483, "percentage": 34.84, "elapsed_time": "14:47:22", "remaining_time": "1 day, 3:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6252, "total_steps": 17941, "loss": 1.895, "learning_rate": 7.445310323864478e-05, "epoch": 0.34847555877598796, "percentage": 34.85, "elapsed_time": "14:47:30", "remaining_time": "1 day, 3:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6253, "total_steps": 17941, "loss": 1.6158, "learning_rate": 7.444533613982519e-05, "epoch": 0.3485312970291511, "percentage": 34.85, "elapsed_time": "14:47:39", "remaining_time": "1 day, 3:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6254, "total_steps": 17941, "loss": 1.7887, "learning_rate": 7.443756826574204e-05, "epoch": 0.3485870352823143, "percentage": 34.86, "elapsed_time": "14:47:47", "remaining_time": "1 day, 3:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6255, "total_steps": 17941, "loss": 1.7628, "learning_rate": 7.442979961664171e-05, "epoch": 0.3486427735354774, "percentage": 34.86, "elapsed_time": "14:47:56", "remaining_time": "1 day, 3:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6256, "total_steps": 17941, "loss": 1.6563, "learning_rate": 7.442203019277059e-05, "epoch": 0.34869851178864053, "percentage": 34.87, "elapsed_time": "14:48:04", "remaining_time": "1 day, 3:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6257, "total_steps": 17941, "loss": 1.7944, "learning_rate": 7.441425999437505e-05, "epoch": 0.3487542500418037, "percentage": 34.88, "elapsed_time": "14:48:13", "remaining_time": "1 day, 3:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6258, "total_steps": 17941, "loss": 1.6007, "learning_rate": 7.440648902170153e-05, "epoch": 0.34880998829496684, "percentage": 34.88, "elapsed_time": "14:48:21", "remaining_time": "1 day, 3:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6259, "total_steps": 17941, "loss": 1.6401, "learning_rate": 7.439871727499648e-05, "epoch": 0.34886572654813, "percentage": 34.89, "elapsed_time": "14:48:30", "remaining_time": "1 day, 3:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6260, "total_steps": 17941, "loss": 1.6605, "learning_rate": 7.439094475450638e-05, "epoch": 0.3489214648012931, "percentage": 34.89, "elapsed_time": "14:48:38", "remaining_time": "1 day, 3:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6261, "total_steps": 17941, "loss": 1.7541, "learning_rate": 7.43831714604777e-05, "epoch": 0.3489772030544563, "percentage": 34.9, "elapsed_time": "14:48:47", "remaining_time": "1 day, 3:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6262, "total_steps": 17941, "loss": 1.5488, "learning_rate": 7.4375397393157e-05, "epoch": 0.3490329413076194, "percentage": 34.9, "elapsed_time": "14:48:55", "remaining_time": "1 day, 3:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6263, "total_steps": 17941, "loss": 1.7463, "learning_rate": 7.43676225527908e-05, "epoch": 0.34908867956078254, "percentage": 34.91, "elapsed_time": "14:49:04", "remaining_time": "1 day, 3:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6264, "total_steps": 17941, "loss": 2.106, "learning_rate": 7.43598469396257e-05, "epoch": 0.34914441781394573, "percentage": 34.91, "elapsed_time": "14:49:12", "remaining_time": "1 day, 3:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6265, "total_steps": 17941, "loss": 1.8146, "learning_rate": 7.435207055390828e-05, "epoch": 0.34920015606710886, "percentage": 34.92, "elapsed_time": "14:49:20", "remaining_time": "1 day, 3:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6266, "total_steps": 17941, "loss": 1.8598, "learning_rate": 7.434429339588516e-05, "epoch": 0.349255894320272, "percentage": 34.93, "elapsed_time": "14:49:29", "remaining_time": "1 day, 3:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6267, "total_steps": 17941, "loss": 1.7508, "learning_rate": 7.4336515465803e-05, "epoch": 0.34931163257343517, "percentage": 34.93, "elapsed_time": "14:49:37", "remaining_time": "1 day, 3:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6268, "total_steps": 17941, "loss": 1.7749, "learning_rate": 7.432873676390845e-05, "epoch": 0.3493673708265983, "percentage": 34.94, "elapsed_time": "14:49:46", "remaining_time": "1 day, 3:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6269, "total_steps": 17941, "loss": 1.6954, "learning_rate": 7.432095729044823e-05, "epoch": 0.34942310907976143, "percentage": 34.94, "elapsed_time": "14:49:54", "remaining_time": "1 day, 3:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6270, "total_steps": 17941, "loss": 1.5363, "learning_rate": 7.431317704566902e-05, "epoch": 0.3494788473329246, "percentage": 34.95, "elapsed_time": "14:50:03", "remaining_time": "1 day, 3:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6271, "total_steps": 17941, "loss": 1.7007, "learning_rate": 7.430539602981761e-05, "epoch": 0.34953458558608774, "percentage": 34.95, "elapsed_time": "14:50:11", "remaining_time": "1 day, 3:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6272, "total_steps": 17941, "loss": 1.9324, "learning_rate": 7.429761424314075e-05, "epoch": 0.34959032383925087, "percentage": 34.96, "elapsed_time": "14:50:20", "remaining_time": "1 day, 3:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6273, "total_steps": 17941, "loss": 1.6236, "learning_rate": 7.428983168588522e-05, "epoch": 0.349646062092414, "percentage": 34.96, "elapsed_time": "14:50:28", "remaining_time": "1 day, 3:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6274, "total_steps": 17941, "loss": 1.8567, "learning_rate": 7.428204835829787e-05, "epoch": 0.3497018003455772, "percentage": 34.97, "elapsed_time": "14:50:37", "remaining_time": "1 day, 3:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6275, "total_steps": 17941, "loss": 1.7612, "learning_rate": 7.42742642606255e-05, "epoch": 0.3497575385987403, "percentage": 34.98, "elapsed_time": "14:50:45", "remaining_time": "1 day, 3:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6276, "total_steps": 17941, "loss": 1.8783, "learning_rate": 7.426647939311499e-05, "epoch": 0.34981327685190344, "percentage": 34.98, "elapsed_time": "14:50:54", "remaining_time": "1 day, 3:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6277, "total_steps": 17941, "loss": 1.533, "learning_rate": 7.425869375601324e-05, "epoch": 0.3498690151050666, "percentage": 34.99, "elapsed_time": "14:51:02", "remaining_time": "1 day, 3:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6278, "total_steps": 17941, "loss": 1.7922, "learning_rate": 7.425090734956717e-05, "epoch": 0.34992475335822976, "percentage": 34.99, "elapsed_time": "14:51:11", "remaining_time": "1 day, 3:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6279, "total_steps": 17941, "loss": 1.5523, "learning_rate": 7.424312017402371e-05, "epoch": 0.3499804916113929, "percentage": 35.0, "elapsed_time": "14:51:19", "remaining_time": "1 day, 3:35:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6280, "total_steps": 17941, "loss": 1.7528, "learning_rate": 7.423533222962984e-05, "epoch": 0.35003622986455607, "percentage": 35.0, "elapsed_time": "14:51:28", "remaining_time": "1 day, 3:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6281, "total_steps": 17941, "loss": 1.6118, "learning_rate": 7.422754351663252e-05, "epoch": 0.3500919681177192, "percentage": 35.01, "elapsed_time": "14:51:37", "remaining_time": "1 day, 3:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6282, "total_steps": 17941, "loss": 1.7999, "learning_rate": 7.421975403527877e-05, "epoch": 0.35014770637088233, "percentage": 35.01, "elapsed_time": "14:51:45", "remaining_time": "1 day, 3:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6283, "total_steps": 17941, "loss": 1.8317, "learning_rate": 7.421196378581563e-05, "epoch": 0.35020344462404546, "percentage": 35.02, "elapsed_time": "14:51:54", "remaining_time": "1 day, 3:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6284, "total_steps": 17941, "loss": 1.6949, "learning_rate": 7.420417276849018e-05, "epoch": 0.35025918287720864, "percentage": 35.03, "elapsed_time": "14:52:02", "remaining_time": "1 day, 3:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6285, "total_steps": 17941, "loss": 1.666, "learning_rate": 7.419638098354948e-05, "epoch": 0.35031492113037177, "percentage": 35.03, "elapsed_time": "14:52:11", "remaining_time": "1 day, 3:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6286, "total_steps": 17941, "loss": 1.7663, "learning_rate": 7.418858843124065e-05, "epoch": 0.3503706593835349, "percentage": 35.04, "elapsed_time": "14:52:19", "remaining_time": "1 day, 3:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6287, "total_steps": 17941, "loss": 1.6048, "learning_rate": 7.418079511181084e-05, "epoch": 0.3504263976366981, "percentage": 35.04, "elapsed_time": "14:52:27", "remaining_time": "1 day, 3:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6288, "total_steps": 17941, "loss": 1.7153, "learning_rate": 7.417300102550718e-05, "epoch": 0.3504821358898612, "percentage": 35.05, "elapsed_time": "14:52:36", "remaining_time": "1 day, 3:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6289, "total_steps": 17941, "loss": 2.0466, "learning_rate": 7.416520617257686e-05, "epoch": 0.35053787414302434, "percentage": 35.05, "elapsed_time": "14:52:45", "remaining_time": "1 day, 3:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6290, "total_steps": 17941, "loss": 1.7793, "learning_rate": 7.41574105532671e-05, "epoch": 0.3505936123961875, "percentage": 35.06, "elapsed_time": "14:52:53", "remaining_time": "1 day, 3:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6291, "total_steps": 17941, "loss": 1.6958, "learning_rate": 7.414961416782512e-05, "epoch": 0.35064935064935066, "percentage": 35.06, "elapsed_time": "14:53:02", "remaining_time": "1 day, 3:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6292, "total_steps": 17941, "loss": 1.7336, "learning_rate": 7.414181701649818e-05, "epoch": 0.3507050889025138, "percentage": 35.07, "elapsed_time": "14:53:10", "remaining_time": "1 day, 3:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6293, "total_steps": 17941, "loss": 1.5585, "learning_rate": 7.413401909953356e-05, "epoch": 0.35076082715567697, "percentage": 35.08, "elapsed_time": "14:53:19", "remaining_time": "1 day, 3:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6294, "total_steps": 17941, "loss": 1.5692, "learning_rate": 7.412622041717858e-05, "epoch": 0.3508165654088401, "percentage": 35.08, "elapsed_time": "14:53:27", "remaining_time": "1 day, 3:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6295, "total_steps": 17941, "loss": 1.6424, "learning_rate": 7.411842096968055e-05, "epoch": 0.3508723036620032, "percentage": 35.09, "elapsed_time": "14:53:36", "remaining_time": "1 day, 3:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6296, "total_steps": 17941, "loss": 1.7084, "learning_rate": 7.411062075728681e-05, "epoch": 0.35092804191516636, "percentage": 35.09, "elapsed_time": "14:53:44", "remaining_time": "1 day, 3:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6297, "total_steps": 17941, "loss": 1.6269, "learning_rate": 7.410281978024478e-05, "epoch": 0.35098378016832954, "percentage": 35.1, "elapsed_time": "14:53:53", "remaining_time": "1 day, 3:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6298, "total_steps": 17941, "loss": 1.6821, "learning_rate": 7.409501803880182e-05, "epoch": 0.35103951842149267, "percentage": 35.1, "elapsed_time": "14:54:02", "remaining_time": "1 day, 3:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6299, "total_steps": 17941, "loss": 1.8958, "learning_rate": 7.408721553320536e-05, "epoch": 0.3510952566746558, "percentage": 35.11, "elapsed_time": "14:54:10", "remaining_time": "1 day, 3:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6300, "total_steps": 17941, "loss": 1.6456, "learning_rate": 7.407941226370289e-05, "epoch": 0.351150994927819, "percentage": 35.12, "elapsed_time": "14:54:19", "remaining_time": "1 day, 3:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6301, "total_steps": 17941, "loss": 1.7168, "learning_rate": 7.407160823054182e-05, "epoch": 0.3512067331809821, "percentage": 35.12, "elapsed_time": "14:54:27", "remaining_time": "1 day, 3:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6302, "total_steps": 17941, "loss": 2.0034, "learning_rate": 7.406380343396973e-05, "epoch": 0.35126247143414524, "percentage": 35.13, "elapsed_time": "14:54:36", "remaining_time": "1 day, 3:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6303, "total_steps": 17941, "loss": 1.5787, "learning_rate": 7.405599787423406e-05, "epoch": 0.3513182096873084, "percentage": 35.13, "elapsed_time": "14:54:45", "remaining_time": "1 day, 3:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6304, "total_steps": 17941, "loss": 1.8993, "learning_rate": 7.40481915515824e-05, "epoch": 0.35137394794047155, "percentage": 35.14, "elapsed_time": "14:54:53", "remaining_time": "1 day, 3:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6305, "total_steps": 17941, "loss": 1.9086, "learning_rate": 7.404038446626231e-05, "epoch": 0.3514296861936347, "percentage": 35.14, "elapsed_time": "14:55:02", "remaining_time": "1 day, 3:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6306, "total_steps": 17941, "loss": 1.74, "learning_rate": 7.403257661852142e-05, "epoch": 0.3514854244467978, "percentage": 35.15, "elapsed_time": "14:55:10", "remaining_time": "1 day, 3:31:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6307, "total_steps": 17941, "loss": 1.7519, "learning_rate": 7.40247680086073e-05, "epoch": 0.351541162699961, "percentage": 35.15, "elapsed_time": "14:55:19", "remaining_time": "1 day, 3:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6308, "total_steps": 17941, "loss": 1.8393, "learning_rate": 7.401695863676761e-05, "epoch": 0.3515969009531241, "percentage": 35.16, "elapsed_time": "14:55:27", "remaining_time": "1 day, 3:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6309, "total_steps": 17941, "loss": 1.7958, "learning_rate": 7.400914850325001e-05, "epoch": 0.35165263920628725, "percentage": 35.17, "elapsed_time": "14:55:35", "remaining_time": "1 day, 3:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6310, "total_steps": 17941, "loss": 1.7113, "learning_rate": 7.400133760830221e-05, "epoch": 0.35170837745945044, "percentage": 35.17, "elapsed_time": "14:55:44", "remaining_time": "1 day, 3:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6311, "total_steps": 17941, "loss": 1.6819, "learning_rate": 7.399352595217193e-05, "epoch": 0.35176411571261357, "percentage": 35.18, "elapsed_time": "14:55:52", "remaining_time": "1 day, 3:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6312, "total_steps": 17941, "loss": 1.5692, "learning_rate": 7.39857135351069e-05, "epoch": 0.3518198539657767, "percentage": 35.18, "elapsed_time": "14:56:01", "remaining_time": "1 day, 3:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6313, "total_steps": 17941, "loss": 1.813, "learning_rate": 7.397790035735487e-05, "epoch": 0.3518755922189399, "percentage": 35.19, "elapsed_time": "14:56:09", "remaining_time": "1 day, 3:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6314, "total_steps": 17941, "loss": 1.6653, "learning_rate": 7.397008641916364e-05, "epoch": 0.351931330472103, "percentage": 35.19, "elapsed_time": "14:56:18", "remaining_time": "1 day, 3:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6315, "total_steps": 17941, "loss": 1.7948, "learning_rate": 7.396227172078103e-05, "epoch": 0.35198706872526614, "percentage": 35.2, "elapsed_time": "14:56:27", "remaining_time": "1 day, 3:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6316, "total_steps": 17941, "loss": 1.6823, "learning_rate": 7.395445626245486e-05, "epoch": 0.3520428069784293, "percentage": 35.2, "elapsed_time": "14:56:35", "remaining_time": "1 day, 3:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6317, "total_steps": 17941, "loss": 1.4832, "learning_rate": 7.394664004443302e-05, "epoch": 0.35209854523159245, "percentage": 35.21, "elapsed_time": "14:56:44", "remaining_time": "1 day, 3:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6318, "total_steps": 17941, "loss": 1.5743, "learning_rate": 7.393882306696338e-05, "epoch": 0.3521542834847556, "percentage": 35.22, "elapsed_time": "14:56:53", "remaining_time": "1 day, 3:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6319, "total_steps": 17941, "loss": 1.7726, "learning_rate": 7.393100533029383e-05, "epoch": 0.3522100217379187, "percentage": 35.22, "elapsed_time": "14:57:01", "remaining_time": "1 day, 3:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6320, "total_steps": 17941, "loss": 1.5639, "learning_rate": 7.392318683467232e-05, "epoch": 0.3522657599910819, "percentage": 35.23, "elapsed_time": "14:57:10", "remaining_time": "1 day, 3:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6321, "total_steps": 17941, "loss": 1.9563, "learning_rate": 7.391536758034682e-05, "epoch": 0.352321498244245, "percentage": 35.23, "elapsed_time": "14:57:19", "remaining_time": "1 day, 3:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6322, "total_steps": 17941, "loss": 1.6392, "learning_rate": 7.390754756756526e-05, "epoch": 0.35237723649740815, "percentage": 35.24, "elapsed_time": "14:57:27", "remaining_time": "1 day, 3:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6323, "total_steps": 17941, "loss": 1.6262, "learning_rate": 7.389972679657571e-05, "epoch": 0.35243297475057134, "percentage": 35.24, "elapsed_time": "14:57:36", "remaining_time": "1 day, 3:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6324, "total_steps": 17941, "loss": 1.7317, "learning_rate": 7.389190526762618e-05, "epoch": 0.35248871300373447, "percentage": 35.25, "elapsed_time": "14:57:44", "remaining_time": "1 day, 3:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6325, "total_steps": 17941, "loss": 1.7069, "learning_rate": 7.38840829809647e-05, "epoch": 0.3525444512568976, "percentage": 35.25, "elapsed_time": "14:57:53", "remaining_time": "1 day, 3:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6326, "total_steps": 17941, "loss": 1.6009, "learning_rate": 7.387625993683937e-05, "epoch": 0.3526001895100608, "percentage": 35.26, "elapsed_time": "14:58:01", "remaining_time": "1 day, 3:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6327, "total_steps": 17941, "loss": 1.7174, "learning_rate": 7.386843613549827e-05, "epoch": 0.3526559277632239, "percentage": 35.27, "elapsed_time": "14:58:09", "remaining_time": "1 day, 3:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6328, "total_steps": 17941, "loss": 1.5927, "learning_rate": 7.386061157718955e-05, "epoch": 0.35271166601638704, "percentage": 35.27, "elapsed_time": "14:58:18", "remaining_time": "1 day, 3:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6329, "total_steps": 17941, "loss": 1.7494, "learning_rate": 7.385278626216133e-05, "epoch": 0.35276740426955017, "percentage": 35.28, "elapsed_time": "14:58:26", "remaining_time": "1 day, 3:28:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6330, "total_steps": 17941, "loss": 1.8777, "learning_rate": 7.384496019066182e-05, "epoch": 0.35282314252271335, "percentage": 35.28, "elapsed_time": "14:58:35", "remaining_time": "1 day, 3:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6331, "total_steps": 17941, "loss": 1.7538, "learning_rate": 7.383713336293919e-05, "epoch": 0.3528788807758765, "percentage": 35.29, "elapsed_time": "14:58:43", "remaining_time": "1 day, 3:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6332, "total_steps": 17941, "loss": 1.6307, "learning_rate": 7.382930577924168e-05, "epoch": 0.3529346190290396, "percentage": 35.29, "elapsed_time": "14:58:52", "remaining_time": "1 day, 3:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6333, "total_steps": 17941, "loss": 1.6945, "learning_rate": 7.382147743981751e-05, "epoch": 0.3529903572822028, "percentage": 35.3, "elapsed_time": "14:59:00", "remaining_time": "1 day, 3:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6334, "total_steps": 17941, "loss": 1.7531, "learning_rate": 7.381364834491499e-05, "epoch": 0.3530460955353659, "percentage": 35.3, "elapsed_time": "14:59:09", "remaining_time": "1 day, 3:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6335, "total_steps": 17941, "loss": 1.8593, "learning_rate": 7.380581849478236e-05, "epoch": 0.35310183378852905, "percentage": 35.31, "elapsed_time": "14:59:17", "remaining_time": "1 day, 3:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6336, "total_steps": 17941, "loss": 1.7638, "learning_rate": 7.379798788966798e-05, "epoch": 0.35315757204169224, "percentage": 35.32, "elapsed_time": "14:59:26", "remaining_time": "1 day, 3:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6337, "total_steps": 17941, "loss": 1.7042, "learning_rate": 7.379015652982016e-05, "epoch": 0.35321331029485536, "percentage": 35.32, "elapsed_time": "14:59:34", "remaining_time": "1 day, 3:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6338, "total_steps": 17941, "loss": 1.607, "learning_rate": 7.378232441548729e-05, "epoch": 0.3532690485480185, "percentage": 35.33, "elapsed_time": "14:59:43", "remaining_time": "1 day, 3:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6339, "total_steps": 17941, "loss": 1.7222, "learning_rate": 7.377449154691775e-05, "epoch": 0.3533247868011817, "percentage": 35.33, "elapsed_time": "14:59:51", "remaining_time": "1 day, 3:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6340, "total_steps": 17941, "loss": 1.6946, "learning_rate": 7.376665792435996e-05, "epoch": 0.3533805250543448, "percentage": 35.34, "elapsed_time": "15:00:00", "remaining_time": "1 day, 3:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6341, "total_steps": 17941, "loss": 1.6551, "learning_rate": 7.375882354806235e-05, "epoch": 0.35343626330750794, "percentage": 35.34, "elapsed_time": "15:00:08", "remaining_time": "1 day, 3:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6342, "total_steps": 17941, "loss": 1.7594, "learning_rate": 7.375098841827337e-05, "epoch": 0.35349200156067107, "percentage": 35.35, "elapsed_time": "15:00:17", "remaining_time": "1 day, 3:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6343, "total_steps": 17941, "loss": 1.6205, "learning_rate": 7.374315253524152e-05, "epoch": 0.35354773981383425, "percentage": 35.35, "elapsed_time": "15:00:25", "remaining_time": "1 day, 3:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6344, "total_steps": 17941, "loss": 1.5776, "learning_rate": 7.373531589921531e-05, "epoch": 0.3536034780669974, "percentage": 35.36, "elapsed_time": "15:00:34", "remaining_time": "1 day, 3:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6345, "total_steps": 17941, "loss": 1.5603, "learning_rate": 7.372747851044326e-05, "epoch": 0.3536592163201605, "percentage": 35.37, "elapsed_time": "15:00:43", "remaining_time": "1 day, 3:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6346, "total_steps": 17941, "loss": 1.7814, "learning_rate": 7.371964036917394e-05, "epoch": 0.3537149545733237, "percentage": 35.37, "elapsed_time": "15:00:51", "remaining_time": "1 day, 3:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6347, "total_steps": 17941, "loss": 1.5941, "learning_rate": 7.371180147565592e-05, "epoch": 0.3537706928264868, "percentage": 35.38, "elapsed_time": "15:00:59", "remaining_time": "1 day, 3:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6348, "total_steps": 17941, "loss": 1.2328, "learning_rate": 7.370396183013779e-05, "epoch": 0.35382643107964995, "percentage": 35.38, "elapsed_time": "15:01:08", "remaining_time": "1 day, 3:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6349, "total_steps": 17941, "loss": 1.7327, "learning_rate": 7.369612143286822e-05, "epoch": 0.35388216933281313, "percentage": 35.39, "elapsed_time": "15:01:16", "remaining_time": "1 day, 3:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6350, "total_steps": 17941, "loss": 1.8406, "learning_rate": 7.368828028409581e-05, "epoch": 0.35393790758597626, "percentage": 35.39, "elapsed_time": "15:01:25", "remaining_time": "1 day, 3:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6351, "total_steps": 17941, "loss": 1.7841, "learning_rate": 7.368043838406927e-05, "epoch": 0.3539936458391394, "percentage": 35.4, "elapsed_time": "15:01:33", "remaining_time": "1 day, 3:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6352, "total_steps": 17941, "loss": 1.787, "learning_rate": 7.36725957330373e-05, "epoch": 0.3540493840923025, "percentage": 35.4, "elapsed_time": "15:01:42", "remaining_time": "1 day, 3:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6353, "total_steps": 17941, "loss": 1.7946, "learning_rate": 7.366475233124861e-05, "epoch": 0.3541051223454657, "percentage": 35.41, "elapsed_time": "15:01:50", "remaining_time": "1 day, 3:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6354, "total_steps": 17941, "loss": 1.6904, "learning_rate": 7.365690817895195e-05, "epoch": 0.35416086059862883, "percentage": 35.42, "elapsed_time": "15:01:59", "remaining_time": "1 day, 3:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6355, "total_steps": 17941, "loss": 1.7634, "learning_rate": 7.364906327639608e-05, "epoch": 0.35421659885179196, "percentage": 35.42, "elapsed_time": "15:02:07", "remaining_time": "1 day, 3:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6356, "total_steps": 17941, "loss": 1.7406, "learning_rate": 7.364121762382983e-05, "epoch": 0.35427233710495515, "percentage": 35.43, "elapsed_time": "15:02:16", "remaining_time": "1 day, 3:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6357, "total_steps": 17941, "loss": 1.5078, "learning_rate": 7.363337122150197e-05, "epoch": 0.3543280753581183, "percentage": 35.43, "elapsed_time": "15:02:24", "remaining_time": "1 day, 3:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6358, "total_steps": 17941, "loss": 1.767, "learning_rate": 7.36255240696614e-05, "epoch": 0.3543838136112814, "percentage": 35.44, "elapsed_time": "15:02:32", "remaining_time": "1 day, 3:24:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6359, "total_steps": 17941, "loss": 1.6409, "learning_rate": 7.361767616855692e-05, "epoch": 0.3544395518644446, "percentage": 35.44, "elapsed_time": "15:02:41", "remaining_time": "1 day, 3:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6360, "total_steps": 17941, "loss": 1.6319, "learning_rate": 7.360982751843747e-05, "epoch": 0.3544952901176077, "percentage": 35.45, "elapsed_time": "15:02:49", "remaining_time": "1 day, 3:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6361, "total_steps": 17941, "loss": 1.511, "learning_rate": 7.360197811955194e-05, "epoch": 0.35455102837077085, "percentage": 35.46, "elapsed_time": "15:02:58", "remaining_time": "1 day, 3:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6362, "total_steps": 17941, "loss": 1.7604, "learning_rate": 7.359412797214929e-05, "epoch": 0.35460676662393403, "percentage": 35.46, "elapsed_time": "15:03:06", "remaining_time": "1 day, 3:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6363, "total_steps": 17941, "loss": 1.5816, "learning_rate": 7.358627707647844e-05, "epoch": 0.35466250487709716, "percentage": 35.47, "elapsed_time": "15:03:15", "remaining_time": "1 day, 3:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6364, "total_steps": 17941, "loss": 1.2601, "learning_rate": 7.357842543278841e-05, "epoch": 0.3547182431302603, "percentage": 35.47, "elapsed_time": "15:03:23", "remaining_time": "1 day, 3:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6365, "total_steps": 17941, "loss": 1.8474, "learning_rate": 7.357057304132819e-05, "epoch": 0.3547739813834234, "percentage": 35.48, "elapsed_time": "15:03:31", "remaining_time": "1 day, 3:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6366, "total_steps": 17941, "loss": 1.7508, "learning_rate": 7.356271990234683e-05, "epoch": 0.3548297196365866, "percentage": 35.48, "elapsed_time": "15:03:40", "remaining_time": "1 day, 3:23:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6367, "total_steps": 17941, "loss": 1.5589, "learning_rate": 7.355486601609339e-05, "epoch": 0.35488545788974973, "percentage": 35.49, "elapsed_time": "15:03:48", "remaining_time": "1 day, 3:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6368, "total_steps": 17941, "loss": 1.7982, "learning_rate": 7.354701138281688e-05, "epoch": 0.35494119614291286, "percentage": 35.49, "elapsed_time": "15:03:57", "remaining_time": "1 day, 3:22:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6369, "total_steps": 17941, "loss": 1.7944, "learning_rate": 7.35391560027665e-05, "epoch": 0.35499693439607605, "percentage": 35.5, "elapsed_time": "15:04:05", "remaining_time": "1 day, 3:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6370, "total_steps": 17941, "loss": 1.8376, "learning_rate": 7.353129987619133e-05, "epoch": 0.3550526726492392, "percentage": 35.51, "elapsed_time": "15:04:14", "remaining_time": "1 day, 3:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6371, "total_steps": 17941, "loss": 1.575, "learning_rate": 7.352344300334053e-05, "epoch": 0.3551084109024023, "percentage": 35.51, "elapsed_time": "15:04:22", "remaining_time": "1 day, 3:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6372, "total_steps": 17941, "loss": 1.3716, "learning_rate": 7.351558538446326e-05, "epoch": 0.3551641491555655, "percentage": 35.52, "elapsed_time": "15:04:31", "remaining_time": "1 day, 3:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6373, "total_steps": 17941, "loss": 1.9018, "learning_rate": 7.350772701980872e-05, "epoch": 0.3552198874087286, "percentage": 35.52, "elapsed_time": "15:04:39", "remaining_time": "1 day, 3:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6374, "total_steps": 17941, "loss": 1.6401, "learning_rate": 7.349986790962613e-05, "epoch": 0.35527562566189175, "percentage": 35.53, "elapsed_time": "15:04:48", "remaining_time": "1 day, 3:21:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6375, "total_steps": 17941, "loss": 1.5694, "learning_rate": 7.349200805416478e-05, "epoch": 0.3553313639150549, "percentage": 35.53, "elapsed_time": "15:04:56", "remaining_time": "1 day, 3:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6376, "total_steps": 17941, "loss": 1.6291, "learning_rate": 7.348414745367387e-05, "epoch": 0.35538710216821806, "percentage": 35.54, "elapsed_time": "15:05:05", "remaining_time": "1 day, 3:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6377, "total_steps": 17941, "loss": 1.6777, "learning_rate": 7.347628610840274e-05, "epoch": 0.3554428404213812, "percentage": 35.54, "elapsed_time": "15:05:13", "remaining_time": "1 day, 3:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6378, "total_steps": 17941, "loss": 1.922, "learning_rate": 7.346842401860069e-05, "epoch": 0.3554985786745443, "percentage": 35.55, "elapsed_time": "15:05:22", "remaining_time": "1 day, 3:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6379, "total_steps": 17941, "loss": 1.7305, "learning_rate": 7.346056118451705e-05, "epoch": 0.3555543169277075, "percentage": 35.56, "elapsed_time": "15:05:30", "remaining_time": "1 day, 3:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6380, "total_steps": 17941, "loss": 1.7387, "learning_rate": 7.345269760640121e-05, "epoch": 0.35561005518087063, "percentage": 35.56, "elapsed_time": "15:05:38", "remaining_time": "1 day, 3:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6381, "total_steps": 17941, "loss": 1.6662, "learning_rate": 7.344483328450253e-05, "epoch": 0.35566579343403376, "percentage": 35.57, "elapsed_time": "15:05:47", "remaining_time": "1 day, 3:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6382, "total_steps": 17941, "loss": 1.8065, "learning_rate": 7.343696821907042e-05, "epoch": 0.35572153168719695, "percentage": 35.57, "elapsed_time": "15:05:56", "remaining_time": "1 day, 3:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6383, "total_steps": 17941, "loss": 1.7933, "learning_rate": 7.342910241035434e-05, "epoch": 0.3557772699403601, "percentage": 35.58, "elapsed_time": "15:06:05", "remaining_time": "1 day, 3:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6384, "total_steps": 17941, "loss": 1.6203, "learning_rate": 7.342123585860374e-05, "epoch": 0.3558330081935232, "percentage": 35.58, "elapsed_time": "15:06:13", "remaining_time": "1 day, 3:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6385, "total_steps": 17941, "loss": 1.6706, "learning_rate": 7.341336856406808e-05, "epoch": 0.3558887464466864, "percentage": 35.59, "elapsed_time": "15:06:22", "remaining_time": "1 day, 3:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6386, "total_steps": 17941, "loss": 1.8427, "learning_rate": 7.340550052699689e-05, "epoch": 0.3559444846998495, "percentage": 35.59, "elapsed_time": "15:06:30", "remaining_time": "1 day, 3:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6387, "total_steps": 17941, "loss": 1.7332, "learning_rate": 7.339763174763968e-05, "epoch": 0.35600022295301265, "percentage": 35.6, "elapsed_time": "15:06:39", "remaining_time": "1 day, 3:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6388, "total_steps": 17941, "loss": 1.5966, "learning_rate": 7.3389762226246e-05, "epoch": 0.3560559612061758, "percentage": 35.61, "elapsed_time": "15:06:47", "remaining_time": "1 day, 3:19:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6389, "total_steps": 17941, "loss": 1.8137, "learning_rate": 7.338189196306544e-05, "epoch": 0.35611169945933896, "percentage": 35.61, "elapsed_time": "15:06:56", "remaining_time": "1 day, 3:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6390, "total_steps": 17941, "loss": 1.6799, "learning_rate": 7.33740209583476e-05, "epoch": 0.3561674377125021, "percentage": 35.62, "elapsed_time": "15:07:04", "remaining_time": "1 day, 3:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6391, "total_steps": 17941, "loss": 1.6959, "learning_rate": 7.33661492123421e-05, "epoch": 0.3562231759656652, "percentage": 35.62, "elapsed_time": "15:07:12", "remaining_time": "1 day, 3:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6392, "total_steps": 17941, "loss": 1.7565, "learning_rate": 7.335827672529856e-05, "epoch": 0.3562789142188284, "percentage": 35.63, "elapsed_time": "15:07:21", "remaining_time": "1 day, 3:19:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6393, "total_steps": 17941, "loss": 1.7526, "learning_rate": 7.335040349746669e-05, "epoch": 0.35633465247199153, "percentage": 35.63, "elapsed_time": "15:07:30", "remaining_time": "1 day, 3:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6394, "total_steps": 17941, "loss": 1.64, "learning_rate": 7.334252952909615e-05, "epoch": 0.35639039072515466, "percentage": 35.64, "elapsed_time": "15:07:39", "remaining_time": "1 day, 3:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6395, "total_steps": 17941, "loss": 1.7358, "learning_rate": 7.333465482043667e-05, "epoch": 0.35644612897831784, "percentage": 35.64, "elapsed_time": "15:07:47", "remaining_time": "1 day, 3:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6396, "total_steps": 17941, "loss": 1.854, "learning_rate": 7.3326779371738e-05, "epoch": 0.356501867231481, "percentage": 35.65, "elapsed_time": "15:07:56", "remaining_time": "1 day, 3:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6397, "total_steps": 17941, "loss": 1.6502, "learning_rate": 7.33189031832499e-05, "epoch": 0.3565576054846441, "percentage": 35.66, "elapsed_time": "15:08:04", "remaining_time": "1 day, 3:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6398, "total_steps": 17941, "loss": 1.6757, "learning_rate": 7.331102625522212e-05, "epoch": 0.35661334373780723, "percentage": 35.66, "elapsed_time": "15:08:13", "remaining_time": "1 day, 3:18:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6399, "total_steps": 17941, "loss": 1.5362, "learning_rate": 7.330314858790453e-05, "epoch": 0.3566690819909704, "percentage": 35.67, "elapsed_time": "15:08:21", "remaining_time": "1 day, 3:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6400, "total_steps": 17941, "loss": 1.7302, "learning_rate": 7.32952701815469e-05, "epoch": 0.35672482024413354, "percentage": 35.67, "elapsed_time": "15:08:29", "remaining_time": "1 day, 3:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6401, "total_steps": 17941, "loss": 1.7755, "learning_rate": 7.328739103639916e-05, "epoch": 0.3567805584972967, "percentage": 35.68, "elapsed_time": "15:08:38", "remaining_time": "1 day, 3:18:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6402, "total_steps": 17941, "loss": 1.5803, "learning_rate": 7.327951115271113e-05, "epoch": 0.35683629675045986, "percentage": 35.68, "elapsed_time": "15:08:46", "remaining_time": "1 day, 3:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6403, "total_steps": 17941, "loss": 1.5991, "learning_rate": 7.327163053073273e-05, "epoch": 0.356892035003623, "percentage": 35.69, "elapsed_time": "15:08:55", "remaining_time": "1 day, 3:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6404, "total_steps": 17941, "loss": 1.6789, "learning_rate": 7.32637491707139e-05, "epoch": 0.3569477732567861, "percentage": 35.69, "elapsed_time": "15:09:03", "remaining_time": "1 day, 3:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6405, "total_steps": 17941, "loss": 1.8266, "learning_rate": 7.32558670729046e-05, "epoch": 0.3570035115099493, "percentage": 35.7, "elapsed_time": "15:09:12", "remaining_time": "1 day, 3:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6406, "total_steps": 17941, "loss": 1.6093, "learning_rate": 7.324798423755476e-05, "epoch": 0.35705924976311243, "percentage": 35.71, "elapsed_time": "15:09:20", "remaining_time": "1 day, 3:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6407, "total_steps": 17941, "loss": 1.6672, "learning_rate": 7.324010066491442e-05, "epoch": 0.35711498801627556, "percentage": 35.71, "elapsed_time": "15:09:29", "remaining_time": "1 day, 3:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6408, "total_steps": 17941, "loss": 1.7776, "learning_rate": 7.323221635523358e-05, "epoch": 0.35717072626943874, "percentage": 35.72, "elapsed_time": "15:09:37", "remaining_time": "1 day, 3:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6409, "total_steps": 17941, "loss": 1.9326, "learning_rate": 7.32243313087623e-05, "epoch": 0.35722646452260187, "percentage": 35.72, "elapsed_time": "15:09:46", "remaining_time": "1 day, 3:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6410, "total_steps": 17941, "loss": 1.8942, "learning_rate": 7.321644552575062e-05, "epoch": 0.357282202775765, "percentage": 35.73, "elapsed_time": "15:09:54", "remaining_time": "1 day, 3:16:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6411, "total_steps": 17941, "loss": 1.6339, "learning_rate": 7.320855900644867e-05, "epoch": 0.35733794102892813, "percentage": 35.73, "elapsed_time": "15:10:02", "remaining_time": "1 day, 3:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6412, "total_steps": 17941, "loss": 1.681, "learning_rate": 7.320067175110653e-05, "epoch": 0.3573936792820913, "percentage": 35.74, "elapsed_time": "15:10:11", "remaining_time": "1 day, 3:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6413, "total_steps": 17941, "loss": 1.847, "learning_rate": 7.319278375997436e-05, "epoch": 0.35744941753525444, "percentage": 35.74, "elapsed_time": "15:10:19", "remaining_time": "1 day, 3:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6414, "total_steps": 17941, "loss": 1.7616, "learning_rate": 7.31848950333023e-05, "epoch": 0.3575051557884176, "percentage": 35.75, "elapsed_time": "15:10:28", "remaining_time": "1 day, 3:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6415, "total_steps": 17941, "loss": 1.7561, "learning_rate": 7.317700557134056e-05, "epoch": 0.35756089404158076, "percentage": 35.76, "elapsed_time": "15:10:36", "remaining_time": "1 day, 3:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6416, "total_steps": 17941, "loss": 1.6086, "learning_rate": 7.316911537433933e-05, "epoch": 0.3576166322947439, "percentage": 35.76, "elapsed_time": "15:10:45", "remaining_time": "1 day, 3:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6417, "total_steps": 17941, "loss": 1.7853, "learning_rate": 7.316122444254884e-05, "epoch": 0.357672370547907, "percentage": 35.77, "elapsed_time": "15:10:53", "remaining_time": "1 day, 3:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6418, "total_steps": 17941, "loss": 1.5816, "learning_rate": 7.315333277621935e-05, "epoch": 0.3577281088010702, "percentage": 35.77, "elapsed_time": "15:11:02", "remaining_time": "1 day, 3:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6419, "total_steps": 17941, "loss": 1.5703, "learning_rate": 7.314544037560114e-05, "epoch": 0.35778384705423333, "percentage": 35.78, "elapsed_time": "15:11:10", "remaining_time": "1 day, 3:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6420, "total_steps": 17941, "loss": 1.6222, "learning_rate": 7.313754724094451e-05, "epoch": 0.35783958530739646, "percentage": 35.78, "elapsed_time": "15:11:18", "remaining_time": "1 day, 3:15:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6421, "total_steps": 17941, "loss": 1.7888, "learning_rate": 7.312965337249979e-05, "epoch": 0.3578953235605596, "percentage": 35.79, "elapsed_time": "15:11:27", "remaining_time": "1 day, 3:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6422, "total_steps": 17941, "loss": 1.7508, "learning_rate": 7.312175877051732e-05, "epoch": 0.35795106181372277, "percentage": 35.8, "elapsed_time": "15:11:35", "remaining_time": "1 day, 3:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6423, "total_steps": 17941, "loss": 1.8401, "learning_rate": 7.311386343524747e-05, "epoch": 0.3580068000668859, "percentage": 35.8, "elapsed_time": "15:11:44", "remaining_time": "1 day, 3:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6424, "total_steps": 17941, "loss": 1.5428, "learning_rate": 7.310596736694062e-05, "epoch": 0.35806253832004903, "percentage": 35.81, "elapsed_time": "15:11:52", "remaining_time": "1 day, 3:14:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6425, "total_steps": 17941, "loss": 1.464, "learning_rate": 7.309807056584722e-05, "epoch": 0.3581182765732122, "percentage": 35.81, "elapsed_time": "15:12:01", "remaining_time": "1 day, 3:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6426, "total_steps": 17941, "loss": 1.7063, "learning_rate": 7.309017303221768e-05, "epoch": 0.35817401482637534, "percentage": 35.82, "elapsed_time": "15:12:09", "remaining_time": "1 day, 3:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6427, "total_steps": 17941, "loss": 1.6636, "learning_rate": 7.308227476630249e-05, "epoch": 0.35822975307953847, "percentage": 35.82, "elapsed_time": "15:12:18", "remaining_time": "1 day, 3:14:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6428, "total_steps": 17941, "loss": 1.5777, "learning_rate": 7.30743757683521e-05, "epoch": 0.35828549133270166, "percentage": 35.83, "elapsed_time": "15:12:26", "remaining_time": "1 day, 3:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6429, "total_steps": 17941, "loss": 1.5602, "learning_rate": 7.306647603861706e-05, "epoch": 0.3583412295858648, "percentage": 35.83, "elapsed_time": "15:12:34", "remaining_time": "1 day, 3:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6430, "total_steps": 17941, "loss": 1.659, "learning_rate": 7.305857557734789e-05, "epoch": 0.3583969678390279, "percentage": 35.84, "elapsed_time": "15:12:43", "remaining_time": "1 day, 3:13:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6431, "total_steps": 17941, "loss": 1.9413, "learning_rate": 7.305067438479513e-05, "epoch": 0.3584527060921911, "percentage": 35.85, "elapsed_time": "15:12:51", "remaining_time": "1 day, 3:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6432, "total_steps": 17941, "loss": 1.7138, "learning_rate": 7.30427724612094e-05, "epoch": 0.3585084443453542, "percentage": 35.85, "elapsed_time": "15:13:00", "remaining_time": "1 day, 3:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6433, "total_steps": 17941, "loss": 1.7588, "learning_rate": 7.303486980684125e-05, "epoch": 0.35856418259851736, "percentage": 35.86, "elapsed_time": "15:13:09", "remaining_time": "1 day, 3:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6434, "total_steps": 17941, "loss": 1.8426, "learning_rate": 7.302696642194134e-05, "epoch": 0.3586199208516805, "percentage": 35.86, "elapsed_time": "15:13:18", "remaining_time": "1 day, 3:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6435, "total_steps": 17941, "loss": 1.5852, "learning_rate": 7.30190623067603e-05, "epoch": 0.35867565910484367, "percentage": 35.87, "elapsed_time": "15:13:26", "remaining_time": "1 day, 3:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6436, "total_steps": 17941, "loss": 1.5495, "learning_rate": 7.301115746154884e-05, "epoch": 0.3587313973580068, "percentage": 35.87, "elapsed_time": "15:13:35", "remaining_time": "1 day, 3:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6437, "total_steps": 17941, "loss": 1.8611, "learning_rate": 7.300325188655761e-05, "epoch": 0.3587871356111699, "percentage": 35.88, "elapsed_time": "15:13:43", "remaining_time": "1 day, 3:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6438, "total_steps": 17941, "loss": 1.6437, "learning_rate": 7.299534558203735e-05, "epoch": 0.3588428738643331, "percentage": 35.88, "elapsed_time": "15:13:51", "remaining_time": "1 day, 3:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6439, "total_steps": 17941, "loss": 1.8723, "learning_rate": 7.298743854823882e-05, "epoch": 0.35889861211749624, "percentage": 35.89, "elapsed_time": "15:14:00", "remaining_time": "1 day, 3:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6440, "total_steps": 17941, "loss": 1.518, "learning_rate": 7.297953078541274e-05, "epoch": 0.35895435037065937, "percentage": 35.9, "elapsed_time": "15:14:08", "remaining_time": "1 day, 3:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6441, "total_steps": 17941, "loss": 1.8528, "learning_rate": 7.297162229380994e-05, "epoch": 0.35901008862382255, "percentage": 35.9, "elapsed_time": "15:14:17", "remaining_time": "1 day, 3:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6442, "total_steps": 17941, "loss": 1.6619, "learning_rate": 7.29637130736812e-05, "epoch": 0.3590658268769857, "percentage": 35.91, "elapsed_time": "15:14:25", "remaining_time": "1 day, 3:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6443, "total_steps": 17941, "loss": 1.8209, "learning_rate": 7.295580312527739e-05, "epoch": 0.3591215651301488, "percentage": 35.91, "elapsed_time": "15:14:34", "remaining_time": "1 day, 3:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6444, "total_steps": 17941, "loss": 1.6109, "learning_rate": 7.294789244884932e-05, "epoch": 0.35917730338331194, "percentage": 35.92, "elapsed_time": "15:14:43", "remaining_time": "1 day, 3:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6445, "total_steps": 17941, "loss": 1.7449, "learning_rate": 7.293998104464792e-05, "epoch": 0.3592330416364751, "percentage": 35.92, "elapsed_time": "15:14:52", "remaining_time": "1 day, 3:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6446, "total_steps": 17941, "loss": 1.7952, "learning_rate": 7.293206891292405e-05, "epoch": 0.35928877988963825, "percentage": 35.93, "elapsed_time": "15:15:00", "remaining_time": "1 day, 3:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6447, "total_steps": 17941, "loss": 1.8784, "learning_rate": 7.292415605392867e-05, "epoch": 0.3593445181428014, "percentage": 35.93, "elapsed_time": "15:15:08", "remaining_time": "1 day, 3:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6448, "total_steps": 17941, "loss": 1.8764, "learning_rate": 7.291624246791272e-05, "epoch": 0.35940025639596457, "percentage": 35.94, "elapsed_time": "15:15:17", "remaining_time": "1 day, 3:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6449, "total_steps": 17941, "loss": 1.7389, "learning_rate": 7.290832815512716e-05, "epoch": 0.3594559946491277, "percentage": 35.95, "elapsed_time": "15:15:25", "remaining_time": "1 day, 3:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6450, "total_steps": 17941, "loss": 1.591, "learning_rate": 7.290041311582301e-05, "epoch": 0.3595117329022908, "percentage": 35.95, "elapsed_time": "15:15:34", "remaining_time": "1 day, 3:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6451, "total_steps": 17941, "loss": 1.765, "learning_rate": 7.289249735025127e-05, "epoch": 0.359567471155454, "percentage": 35.96, "elapsed_time": "15:15:42", "remaining_time": "1 day, 3:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6452, "total_steps": 17941, "loss": 1.6685, "learning_rate": 7.288458085866298e-05, "epoch": 0.35962320940861714, "percentage": 35.96, "elapsed_time": "15:15:51", "remaining_time": "1 day, 3:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6453, "total_steps": 17941, "loss": 1.6956, "learning_rate": 7.287666364130921e-05, "epoch": 0.35967894766178027, "percentage": 35.97, "elapsed_time": "15:16:00", "remaining_time": "1 day, 3:10:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6454, "total_steps": 17941, "loss": 1.7829, "learning_rate": 7.286874569844106e-05, "epoch": 0.35973468591494345, "percentage": 35.97, "elapsed_time": "15:16:09", "remaining_time": "1 day, 3:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6455, "total_steps": 17941, "loss": 1.8747, "learning_rate": 7.286082703030961e-05, "epoch": 0.3597904241681066, "percentage": 35.98, "elapsed_time": "15:16:18", "remaining_time": "1 day, 3:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6456, "total_steps": 17941, "loss": 1.5944, "learning_rate": 7.285290763716604e-05, "epoch": 0.3598461624212697, "percentage": 35.98, "elapsed_time": "15:16:26", "remaining_time": "1 day, 3:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6457, "total_steps": 17941, "loss": 1.6307, "learning_rate": 7.284498751926147e-05, "epoch": 0.35990190067443284, "percentage": 35.99, "elapsed_time": "15:16:35", "remaining_time": "1 day, 3:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6458, "total_steps": 17941, "loss": 1.6096, "learning_rate": 7.283706667684709e-05, "epoch": 0.359957638927596, "percentage": 36.0, "elapsed_time": "15:16:43", "remaining_time": "1 day, 3:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6459, "total_steps": 17941, "loss": 1.6963, "learning_rate": 7.28291451101741e-05, "epoch": 0.36001337718075915, "percentage": 36.0, "elapsed_time": "15:16:52", "remaining_time": "1 day, 3:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6460, "total_steps": 17941, "loss": 1.7304, "learning_rate": 7.282122281949374e-05, "epoch": 0.3600691154339223, "percentage": 36.01, "elapsed_time": "15:17:00", "remaining_time": "1 day, 3:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6461, "total_steps": 17941, "loss": 1.8304, "learning_rate": 7.281329980505724e-05, "epoch": 0.36012485368708547, "percentage": 36.01, "elapsed_time": "15:17:08", "remaining_time": "1 day, 3:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6462, "total_steps": 17941, "loss": 1.509, "learning_rate": 7.280537606711589e-05, "epoch": 0.3601805919402486, "percentage": 36.02, "elapsed_time": "15:17:17", "remaining_time": "1 day, 3:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6463, "total_steps": 17941, "loss": 1.765, "learning_rate": 7.279745160592097e-05, "epoch": 0.3602363301934117, "percentage": 36.02, "elapsed_time": "15:17:25", "remaining_time": "1 day, 3:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6464, "total_steps": 17941, "loss": 1.6604, "learning_rate": 7.278952642172381e-05, "epoch": 0.3602920684465749, "percentage": 36.03, "elapsed_time": "15:17:34", "remaining_time": "1 day, 3:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6465, "total_steps": 17941, "loss": 1.6273, "learning_rate": 7.278160051477574e-05, "epoch": 0.36034780669973804, "percentage": 36.03, "elapsed_time": "15:17:43", "remaining_time": "1 day, 3:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6466, "total_steps": 17941, "loss": 1.7693, "learning_rate": 7.277367388532812e-05, "epoch": 0.36040354495290117, "percentage": 36.04, "elapsed_time": "15:17:51", "remaining_time": "1 day, 3:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6467, "total_steps": 17941, "loss": 1.6402, "learning_rate": 7.276574653363236e-05, "epoch": 0.3604592832060643, "percentage": 36.05, "elapsed_time": "15:18:00", "remaining_time": "1 day, 3:08:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6468, "total_steps": 17941, "loss": 1.9642, "learning_rate": 7.275781845993983e-05, "epoch": 0.3605150214592275, "percentage": 36.05, "elapsed_time": "15:18:09", "remaining_time": "1 day, 3:08:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6469, "total_steps": 17941, "loss": 1.8417, "learning_rate": 7.274988966450201e-05, "epoch": 0.3605707597123906, "percentage": 36.06, "elapsed_time": "15:18:17", "remaining_time": "1 day, 3:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6470, "total_steps": 17941, "loss": 1.6307, "learning_rate": 7.274196014757032e-05, "epoch": 0.36062649796555374, "percentage": 36.06, "elapsed_time": "15:18:26", "remaining_time": "1 day, 3:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6471, "total_steps": 17941, "loss": 1.7725, "learning_rate": 7.273402990939626e-05, "epoch": 0.3606822362187169, "percentage": 36.07, "elapsed_time": "15:18:34", "remaining_time": "1 day, 3:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6472, "total_steps": 17941, "loss": 1.831, "learning_rate": 7.272609895023129e-05, "epoch": 0.36073797447188005, "percentage": 36.07, "elapsed_time": "15:18:42", "remaining_time": "1 day, 3:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6473, "total_steps": 17941, "loss": 1.4942, "learning_rate": 7.2718167270327e-05, "epoch": 0.3607937127250432, "percentage": 36.08, "elapsed_time": "15:18:51", "remaining_time": "1 day, 3:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6474, "total_steps": 17941, "loss": 1.722, "learning_rate": 7.271023486993488e-05, "epoch": 0.36084945097820637, "percentage": 36.08, "elapsed_time": "15:19:00", "remaining_time": "1 day, 3:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6475, "total_steps": 17941, "loss": 1.5921, "learning_rate": 7.270230174930653e-05, "epoch": 0.3609051892313695, "percentage": 36.09, "elapsed_time": "15:19:08", "remaining_time": "1 day, 3:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6476, "total_steps": 17941, "loss": 1.7303, "learning_rate": 7.269436790869352e-05, "epoch": 0.3609609274845326, "percentage": 36.1, "elapsed_time": "15:19:16", "remaining_time": "1 day, 3:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6477, "total_steps": 17941, "loss": 1.4386, "learning_rate": 7.268643334834748e-05, "epoch": 0.3610166657376958, "percentage": 36.1, "elapsed_time": "15:19:25", "remaining_time": "1 day, 3:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6478, "total_steps": 17941, "loss": 1.7803, "learning_rate": 7.267849806852005e-05, "epoch": 0.36107240399085894, "percentage": 36.11, "elapsed_time": "15:19:33", "remaining_time": "1 day, 3:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6479, "total_steps": 17941, "loss": 1.6513, "learning_rate": 7.267056206946289e-05, "epoch": 0.36112814224402207, "percentage": 36.11, "elapsed_time": "15:19:42", "remaining_time": "1 day, 3:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6480, "total_steps": 17941, "loss": 1.718, "learning_rate": 7.266262535142767e-05, "epoch": 0.3611838804971852, "percentage": 36.12, "elapsed_time": "15:19:50", "remaining_time": "1 day, 3:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6481, "total_steps": 17941, "loss": 1.8295, "learning_rate": 7.26546879146661e-05, "epoch": 0.3612396187503484, "percentage": 36.12, "elapsed_time": "15:19:59", "remaining_time": "1 day, 3:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6482, "total_steps": 17941, "loss": 1.8042, "learning_rate": 7.264674975942994e-05, "epoch": 0.3612953570035115, "percentage": 36.13, "elapsed_time": "15:20:07", "remaining_time": "1 day, 3:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6483, "total_steps": 17941, "loss": 1.6976, "learning_rate": 7.26388108859709e-05, "epoch": 0.36135109525667464, "percentage": 36.14, "elapsed_time": "15:20:16", "remaining_time": "1 day, 3:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6484, "total_steps": 17941, "loss": 1.5425, "learning_rate": 7.263087129454078e-05, "epoch": 0.3614068335098378, "percentage": 36.14, "elapsed_time": "15:20:24", "remaining_time": "1 day, 3:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6485, "total_steps": 17941, "loss": 1.7552, "learning_rate": 7.262293098539134e-05, "epoch": 0.36146257176300095, "percentage": 36.15, "elapsed_time": "15:20:33", "remaining_time": "1 day, 3:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6486, "total_steps": 17941, "loss": 1.5728, "learning_rate": 7.261498995877447e-05, "epoch": 0.3615183100161641, "percentage": 36.15, "elapsed_time": "15:20:41", "remaining_time": "1 day, 3:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6487, "total_steps": 17941, "loss": 1.7926, "learning_rate": 7.260704821494196e-05, "epoch": 0.36157404826932726, "percentage": 36.16, "elapsed_time": "15:20:49", "remaining_time": "1 day, 3:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6488, "total_steps": 17941, "loss": 1.46, "learning_rate": 7.259910575414569e-05, "epoch": 0.3616297865224904, "percentage": 36.16, "elapsed_time": "15:20:58", "remaining_time": "1 day, 3:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6489, "total_steps": 17941, "loss": 1.4995, "learning_rate": 7.259116257663753e-05, "epoch": 0.3616855247756535, "percentage": 36.17, "elapsed_time": "15:21:07", "remaining_time": "1 day, 3:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6490, "total_steps": 17941, "loss": 1.6736, "learning_rate": 7.258321868266943e-05, "epoch": 0.36174126302881665, "percentage": 36.17, "elapsed_time": "15:21:15", "remaining_time": "1 day, 3:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6491, "total_steps": 17941, "loss": 1.6224, "learning_rate": 7.25752740724933e-05, "epoch": 0.36179700128197984, "percentage": 36.18, "elapsed_time": "15:21:24", "remaining_time": "1 day, 3:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6492, "total_steps": 17941, "loss": 1.7814, "learning_rate": 7.256732874636109e-05, "epoch": 0.36185273953514296, "percentage": 36.19, "elapsed_time": "15:21:32", "remaining_time": "1 day, 3:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6493, "total_steps": 17941, "loss": 1.7024, "learning_rate": 7.255938270452479e-05, "epoch": 0.3619084777883061, "percentage": 36.19, "elapsed_time": "15:21:41", "remaining_time": "1 day, 3:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6494, "total_steps": 17941, "loss": 1.5576, "learning_rate": 7.25514359472364e-05, "epoch": 0.3619642160414693, "percentage": 36.2, "elapsed_time": "15:21:49", "remaining_time": "1 day, 3:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6495, "total_steps": 17941, "loss": 1.8389, "learning_rate": 7.254348847474797e-05, "epoch": 0.3620199542946324, "percentage": 36.2, "elapsed_time": "15:21:57", "remaining_time": "1 day, 3:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6496, "total_steps": 17941, "loss": 1.7194, "learning_rate": 7.253554028731148e-05, "epoch": 0.36207569254779554, "percentage": 36.21, "elapsed_time": "15:22:07", "remaining_time": "1 day, 3:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6497, "total_steps": 17941, "loss": 1.3394, "learning_rate": 7.252759138517909e-05, "epoch": 0.3621314308009587, "percentage": 36.21, "elapsed_time": "15:22:16", "remaining_time": "1 day, 3:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6498, "total_steps": 17941, "loss": 1.6234, "learning_rate": 7.251964176860281e-05, "epoch": 0.36218716905412185, "percentage": 36.22, "elapsed_time": "15:22:24", "remaining_time": "1 day, 3:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6499, "total_steps": 17941, "loss": 1.8937, "learning_rate": 7.25116914378348e-05, "epoch": 0.362242907307285, "percentage": 36.22, "elapsed_time": "15:22:33", "remaining_time": "1 day, 3:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6500, "total_steps": 17941, "loss": 1.5599, "learning_rate": 7.25037403931272e-05, "epoch": 0.36229864556044816, "percentage": 36.23, "elapsed_time": "15:22:41", "remaining_time": "1 day, 3:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6501, "total_steps": 17941, "loss": 1.8547, "learning_rate": 7.249578863473216e-05, "epoch": 0.3623543838136113, "percentage": 36.24, "elapsed_time": "15:22:50", "remaining_time": "1 day, 3:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6502, "total_steps": 17941, "loss": 1.4538, "learning_rate": 7.248783616290186e-05, "epoch": 0.3624101220667744, "percentage": 36.24, "elapsed_time": "15:22:59", "remaining_time": "1 day, 3:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6503, "total_steps": 17941, "loss": 1.8237, "learning_rate": 7.24798829778885e-05, "epoch": 0.36246586031993755, "percentage": 36.25, "elapsed_time": "15:23:08", "remaining_time": "1 day, 3:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6504, "total_steps": 17941, "loss": 1.5705, "learning_rate": 7.247192907994433e-05, "epoch": 0.36252159857310073, "percentage": 36.25, "elapsed_time": "15:23:16", "remaining_time": "1 day, 3:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6505, "total_steps": 17941, "loss": 1.6597, "learning_rate": 7.246397446932159e-05, "epoch": 0.36257733682626386, "percentage": 36.26, "elapsed_time": "15:23:26", "remaining_time": "1 day, 3:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6506, "total_steps": 17941, "loss": 1.9137, "learning_rate": 7.245601914627255e-05, "epoch": 0.362633075079427, "percentage": 36.26, "elapsed_time": "15:23:34", "remaining_time": "1 day, 3:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6507, "total_steps": 17941, "loss": 1.5883, "learning_rate": 7.244806311104952e-05, "epoch": 0.3626888133325902, "percentage": 36.27, "elapsed_time": "15:23:43", "remaining_time": "1 day, 3:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6508, "total_steps": 17941, "loss": 1.9112, "learning_rate": 7.24401063639048e-05, "epoch": 0.3627445515857533, "percentage": 36.27, "elapsed_time": "15:23:51", "remaining_time": "1 day, 3:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6509, "total_steps": 17941, "loss": 1.6557, "learning_rate": 7.243214890509073e-05, "epoch": 0.36280028983891643, "percentage": 36.28, "elapsed_time": "15:23:59", "remaining_time": "1 day, 3:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6510, "total_steps": 17941, "loss": 1.4815, "learning_rate": 7.24241907348597e-05, "epoch": 0.3628560280920796, "percentage": 36.29, "elapsed_time": "15:24:08", "remaining_time": "1 day, 3:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6511, "total_steps": 17941, "loss": 1.6867, "learning_rate": 7.241623185346409e-05, "epoch": 0.36291176634524275, "percentage": 36.29, "elapsed_time": "15:24:16", "remaining_time": "1 day, 3:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6512, "total_steps": 17941, "loss": 1.5461, "learning_rate": 7.240827226115629e-05, "epoch": 0.3629675045984059, "percentage": 36.3, "elapsed_time": "15:24:25", "remaining_time": "1 day, 3:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6513, "total_steps": 17941, "loss": 1.7713, "learning_rate": 7.240031195818874e-05, "epoch": 0.363023242851569, "percentage": 36.3, "elapsed_time": "15:24:34", "remaining_time": "1 day, 3:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6514, "total_steps": 17941, "loss": 1.3757, "learning_rate": 7.239235094481391e-05, "epoch": 0.3630789811047322, "percentage": 36.31, "elapsed_time": "15:24:42", "remaining_time": "1 day, 3:02:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6515, "total_steps": 17941, "loss": 1.9571, "learning_rate": 7.238438922128425e-05, "epoch": 0.3631347193578953, "percentage": 36.31, "elapsed_time": "15:24:51", "remaining_time": "1 day, 3:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6516, "total_steps": 17941, "loss": 1.9311, "learning_rate": 7.237642678785228e-05, "epoch": 0.36319045761105845, "percentage": 36.32, "elapsed_time": "15:24:59", "remaining_time": "1 day, 3:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6517, "total_steps": 17941, "loss": 1.6393, "learning_rate": 7.236846364477052e-05, "epoch": 0.36324619586422163, "percentage": 36.32, "elapsed_time": "15:25:08", "remaining_time": "1 day, 3:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6518, "total_steps": 17941, "loss": 1.5183, "learning_rate": 7.23604997922915e-05, "epoch": 0.36330193411738476, "percentage": 36.33, "elapsed_time": "15:25:16", "remaining_time": "1 day, 3:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6519, "total_steps": 17941, "loss": 1.8529, "learning_rate": 7.235253523066781e-05, "epoch": 0.3633576723705479, "percentage": 36.34, "elapsed_time": "15:25:25", "remaining_time": "1 day, 3:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6520, "total_steps": 17941, "loss": 1.6463, "learning_rate": 7.234456996015202e-05, "epoch": 0.3634134106237111, "percentage": 36.34, "elapsed_time": "15:25:33", "remaining_time": "1 day, 3:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6521, "total_steps": 17941, "loss": 1.4439, "learning_rate": 7.233660398099675e-05, "epoch": 0.3634691488768742, "percentage": 36.35, "elapsed_time": "15:25:42", "remaining_time": "1 day, 3:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6522, "total_steps": 17941, "loss": 1.5871, "learning_rate": 7.232863729345464e-05, "epoch": 0.36352488713003733, "percentage": 36.35, "elapsed_time": "15:25:50", "remaining_time": "1 day, 3:01:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6523, "total_steps": 17941, "loss": 1.978, "learning_rate": 7.232066989777833e-05, "epoch": 0.3635806253832005, "percentage": 36.36, "elapsed_time": "15:26:00", "remaining_time": "1 day, 3:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6524, "total_steps": 17941, "loss": 1.5579, "learning_rate": 7.231270179422051e-05, "epoch": 0.36363636363636365, "percentage": 36.36, "elapsed_time": "15:26:08", "remaining_time": "1 day, 3:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6525, "total_steps": 17941, "loss": 1.6899, "learning_rate": 7.230473298303388e-05, "epoch": 0.3636921018895268, "percentage": 36.37, "elapsed_time": "15:26:17", "remaining_time": "1 day, 3:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6526, "total_steps": 17941, "loss": 2.1324, "learning_rate": 7.229676346447117e-05, "epoch": 0.3637478401426899, "percentage": 36.37, "elapsed_time": "15:26:26", "remaining_time": "1 day, 3:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6527, "total_steps": 17941, "loss": 1.453, "learning_rate": 7.228879323878512e-05, "epoch": 0.3638035783958531, "percentage": 36.38, "elapsed_time": "15:26:34", "remaining_time": "1 day, 3:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6528, "total_steps": 17941, "loss": 1.8623, "learning_rate": 7.22808223062285e-05, "epoch": 0.3638593166490162, "percentage": 36.39, "elapsed_time": "15:26:43", "remaining_time": "1 day, 3:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6529, "total_steps": 17941, "loss": 1.41, "learning_rate": 7.227285066705412e-05, "epoch": 0.36391505490217935, "percentage": 36.39, "elapsed_time": "15:26:51", "remaining_time": "1 day, 3:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6530, "total_steps": 17941, "loss": 1.6551, "learning_rate": 7.226487832151476e-05, "epoch": 0.36397079315534253, "percentage": 36.4, "elapsed_time": "15:27:00", "remaining_time": "1 day, 2:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6531, "total_steps": 17941, "loss": 1.7853, "learning_rate": 7.225690526986326e-05, "epoch": 0.36402653140850566, "percentage": 36.4, "elapsed_time": "15:27:08", "remaining_time": "1 day, 2:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6532, "total_steps": 17941, "loss": 1.5544, "learning_rate": 7.224893151235251e-05, "epoch": 0.3640822696616688, "percentage": 36.41, "elapsed_time": "15:27:17", "remaining_time": "1 day, 2:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6533, "total_steps": 17941, "loss": 1.9824, "learning_rate": 7.224095704923537e-05, "epoch": 0.364138007914832, "percentage": 36.41, "elapsed_time": "15:27:25", "remaining_time": "1 day, 2:59:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6534, "total_steps": 17941, "loss": 1.5978, "learning_rate": 7.223298188076475e-05, "epoch": 0.3641937461679951, "percentage": 36.42, "elapsed_time": "15:27:34", "remaining_time": "1 day, 2:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6535, "total_steps": 17941, "loss": 1.5945, "learning_rate": 7.222500600719356e-05, "epoch": 0.36424948442115823, "percentage": 36.42, "elapsed_time": "15:27:42", "remaining_time": "1 day, 2:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6536, "total_steps": 17941, "loss": 1.717, "learning_rate": 7.221702942877477e-05, "epoch": 0.36430522267432136, "percentage": 36.43, "elapsed_time": "15:27:50", "remaining_time": "1 day, 2:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6537, "total_steps": 17941, "loss": 1.6535, "learning_rate": 7.220905214576134e-05, "epoch": 0.36436096092748455, "percentage": 36.44, "elapsed_time": "15:27:59", "remaining_time": "1 day, 2:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6538, "total_steps": 17941, "loss": 1.5444, "learning_rate": 7.220107415840626e-05, "epoch": 0.3644166991806477, "percentage": 36.44, "elapsed_time": "15:28:08", "remaining_time": "1 day, 2:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6539, "total_steps": 17941, "loss": 1.3543, "learning_rate": 7.219309546696255e-05, "epoch": 0.3644724374338108, "percentage": 36.45, "elapsed_time": "15:28:16", "remaining_time": "1 day, 2:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6540, "total_steps": 17941, "loss": 1.7422, "learning_rate": 7.218511607168326e-05, "epoch": 0.364528175686974, "percentage": 36.45, "elapsed_time": "15:28:25", "remaining_time": "1 day, 2:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6541, "total_steps": 17941, "loss": 1.9125, "learning_rate": 7.21771359728214e-05, "epoch": 0.3645839139401371, "percentage": 36.46, "elapsed_time": "15:28:33", "remaining_time": "1 day, 2:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6542, "total_steps": 17941, "loss": 1.8743, "learning_rate": 7.216915517063012e-05, "epoch": 0.36463965219330025, "percentage": 36.46, "elapsed_time": "15:28:42", "remaining_time": "1 day, 2:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6543, "total_steps": 17941, "loss": 1.476, "learning_rate": 7.216117366536249e-05, "epoch": 0.36469539044646343, "percentage": 36.47, "elapsed_time": "15:28:50", "remaining_time": "1 day, 2:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6544, "total_steps": 17941, "loss": 1.7591, "learning_rate": 7.215319145727161e-05, "epoch": 0.36475112869962656, "percentage": 36.48, "elapsed_time": "15:28:59", "remaining_time": "1 day, 2:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6545, "total_steps": 17941, "loss": 1.9996, "learning_rate": 7.214520854661071e-05, "epoch": 0.3648068669527897, "percentage": 36.48, "elapsed_time": "15:29:07", "remaining_time": "1 day, 2:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6546, "total_steps": 17941, "loss": 1.6909, "learning_rate": 7.213722493363288e-05, "epoch": 0.3648626052059529, "percentage": 36.49, "elapsed_time": "15:29:16", "remaining_time": "1 day, 2:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6547, "total_steps": 17941, "loss": 1.6429, "learning_rate": 7.212924061859135e-05, "epoch": 0.364918343459116, "percentage": 36.49, "elapsed_time": "15:29:25", "remaining_time": "1 day, 2:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6548, "total_steps": 17941, "loss": 1.9055, "learning_rate": 7.212125560173933e-05, "epoch": 0.36497408171227913, "percentage": 36.5, "elapsed_time": "15:29:33", "remaining_time": "1 day, 2:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6549, "total_steps": 17941, "loss": 1.7073, "learning_rate": 7.211326988333006e-05, "epoch": 0.36502981996544226, "percentage": 36.5, "elapsed_time": "15:29:42", "remaining_time": "1 day, 2:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6550, "total_steps": 17941, "loss": 1.6739, "learning_rate": 7.210528346361678e-05, "epoch": 0.36508555821860544, "percentage": 36.51, "elapsed_time": "15:29:50", "remaining_time": "1 day, 2:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6551, "total_steps": 17941, "loss": 1.7179, "learning_rate": 7.209729634285282e-05, "epoch": 0.3651412964717686, "percentage": 36.51, "elapsed_time": "15:29:59", "remaining_time": "1 day, 2:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6552, "total_steps": 17941, "loss": 1.7484, "learning_rate": 7.208930852129143e-05, "epoch": 0.3651970347249317, "percentage": 36.52, "elapsed_time": "15:30:07", "remaining_time": "1 day, 2:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6553, "total_steps": 17941, "loss": 1.6169, "learning_rate": 7.208131999918599e-05, "epoch": 0.3652527729780949, "percentage": 36.53, "elapsed_time": "15:30:16", "remaining_time": "1 day, 2:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6554, "total_steps": 17941, "loss": 1.4029, "learning_rate": 7.20733307767898e-05, "epoch": 0.365308511231258, "percentage": 36.53, "elapsed_time": "15:30:24", "remaining_time": "1 day, 2:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6555, "total_steps": 17941, "loss": 1.6399, "learning_rate": 7.206534085435625e-05, "epoch": 0.36536424948442114, "percentage": 36.54, "elapsed_time": "15:30:32", "remaining_time": "1 day, 2:56:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6556, "total_steps": 17941, "loss": 1.7943, "learning_rate": 7.205735023213877e-05, "epoch": 0.36541998773758433, "percentage": 36.54, "elapsed_time": "15:30:41", "remaining_time": "1 day, 2:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6557, "total_steps": 17941, "loss": 1.7919, "learning_rate": 7.204935891039071e-05, "epoch": 0.36547572599074746, "percentage": 36.55, "elapsed_time": "15:30:49", "remaining_time": "1 day, 2:56:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6558, "total_steps": 17941, "loss": 1.8125, "learning_rate": 7.204136688936556e-05, "epoch": 0.3655314642439106, "percentage": 36.55, "elapsed_time": "15:30:58", "remaining_time": "1 day, 2:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6559, "total_steps": 17941, "loss": 1.6377, "learning_rate": 7.203337416931675e-05, "epoch": 0.3655872024970737, "percentage": 36.56, "elapsed_time": "15:31:06", "remaining_time": "1 day, 2:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6560, "total_steps": 17941, "loss": 1.6929, "learning_rate": 7.202538075049781e-05, "epoch": 0.3656429407502369, "percentage": 36.56, "elapsed_time": "15:31:15", "remaining_time": "1 day, 2:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6561, "total_steps": 17941, "loss": 1.7849, "learning_rate": 7.201738663316217e-05, "epoch": 0.36569867900340003, "percentage": 36.57, "elapsed_time": "15:31:23", "remaining_time": "1 day, 2:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6562, "total_steps": 17941, "loss": 1.3314, "learning_rate": 7.200939181756341e-05, "epoch": 0.36575441725656316, "percentage": 36.58, "elapsed_time": "15:31:31", "remaining_time": "1 day, 2:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6563, "total_steps": 17941, "loss": 1.8517, "learning_rate": 7.200139630395507e-05, "epoch": 0.36581015550972634, "percentage": 36.58, "elapsed_time": "15:31:40", "remaining_time": "1 day, 2:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6564, "total_steps": 17941, "loss": 1.58, "learning_rate": 7.199340009259072e-05, "epoch": 0.36586589376288947, "percentage": 36.59, "elapsed_time": "15:31:48", "remaining_time": "1 day, 2:55:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6565, "total_steps": 17941, "loss": 1.9478, "learning_rate": 7.198540318372394e-05, "epoch": 0.3659216320160526, "percentage": 36.59, "elapsed_time": "15:31:57", "remaining_time": "1 day, 2:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6566, "total_steps": 17941, "loss": 1.6334, "learning_rate": 7.197740557760834e-05, "epoch": 0.3659773702692158, "percentage": 36.6, "elapsed_time": "15:32:05", "remaining_time": "1 day, 2:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6567, "total_steps": 17941, "loss": 1.4779, "learning_rate": 7.196940727449759e-05, "epoch": 0.3660331085223789, "percentage": 36.6, "elapsed_time": "15:32:14", "remaining_time": "1 day, 2:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6568, "total_steps": 17941, "loss": 1.5101, "learning_rate": 7.196140827464533e-05, "epoch": 0.36608884677554204, "percentage": 36.61, "elapsed_time": "15:32:22", "remaining_time": "1 day, 2:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6569, "total_steps": 17941, "loss": 1.7219, "learning_rate": 7.195340857830524e-05, "epoch": 0.3661445850287052, "percentage": 36.61, "elapsed_time": "15:32:31", "remaining_time": "1 day, 2:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6570, "total_steps": 17941, "loss": 1.6491, "learning_rate": 7.194540818573103e-05, "epoch": 0.36620032328186836, "percentage": 36.62, "elapsed_time": "15:32:40", "remaining_time": "1 day, 2:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6571, "total_steps": 17941, "loss": 1.7846, "learning_rate": 7.193740709717643e-05, "epoch": 0.3662560615350315, "percentage": 36.63, "elapsed_time": "15:32:48", "remaining_time": "1 day, 2:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6572, "total_steps": 17941, "loss": 1.5521, "learning_rate": 7.192940531289517e-05, "epoch": 0.3663117997881946, "percentage": 36.63, "elapsed_time": "15:32:56", "remaining_time": "1 day, 2:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6573, "total_steps": 17941, "loss": 1.7968, "learning_rate": 7.192140283314104e-05, "epoch": 0.3663675380413578, "percentage": 36.64, "elapsed_time": "15:33:05", "remaining_time": "1 day, 2:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6574, "total_steps": 17941, "loss": 1.6086, "learning_rate": 7.191339965816781e-05, "epoch": 0.3664232762945209, "percentage": 36.64, "elapsed_time": "15:33:13", "remaining_time": "1 day, 2:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6575, "total_steps": 17941, "loss": 1.8264, "learning_rate": 7.190539578822932e-05, "epoch": 0.36647901454768406, "percentage": 36.65, "elapsed_time": "15:33:22", "remaining_time": "1 day, 2:53:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6576, "total_steps": 17941, "loss": 1.8426, "learning_rate": 7.189739122357939e-05, "epoch": 0.36653475280084724, "percentage": 36.65, "elapsed_time": "15:33:30", "remaining_time": "1 day, 2:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6577, "total_steps": 17941, "loss": 1.7968, "learning_rate": 7.188938596447188e-05, "epoch": 0.36659049105401037, "percentage": 36.66, "elapsed_time": "15:33:39", "remaining_time": "1 day, 2:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6578, "total_steps": 17941, "loss": 1.6745, "learning_rate": 7.188138001116065e-05, "epoch": 0.3666462293071735, "percentage": 36.66, "elapsed_time": "15:33:47", "remaining_time": "1 day, 2:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6579, "total_steps": 17941, "loss": 2.0264, "learning_rate": 7.187337336389966e-05, "epoch": 0.3667019675603367, "percentage": 36.67, "elapsed_time": "15:33:56", "remaining_time": "1 day, 2:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6580, "total_steps": 17941, "loss": 1.5105, "learning_rate": 7.186536602294278e-05, "epoch": 0.3667577058134998, "percentage": 36.68, "elapsed_time": "15:34:04", "remaining_time": "1 day, 2:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6581, "total_steps": 17941, "loss": 1.6055, "learning_rate": 7.185735798854396e-05, "epoch": 0.36681344406666294, "percentage": 36.68, "elapsed_time": "15:34:12", "remaining_time": "1 day, 2:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6582, "total_steps": 17941, "loss": 1.7493, "learning_rate": 7.184934926095721e-05, "epoch": 0.36686918231982607, "percentage": 36.69, "elapsed_time": "15:34:21", "remaining_time": "1 day, 2:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6583, "total_steps": 17941, "loss": 1.6443, "learning_rate": 7.184133984043646e-05, "epoch": 0.36692492057298925, "percentage": 36.69, "elapsed_time": "15:34:29", "remaining_time": "1 day, 2:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6584, "total_steps": 17941, "loss": 1.816, "learning_rate": 7.183332972723578e-05, "epoch": 0.3669806588261524, "percentage": 36.7, "elapsed_time": "15:34:38", "remaining_time": "1 day, 2:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6585, "total_steps": 17941, "loss": 1.6545, "learning_rate": 7.182531892160917e-05, "epoch": 0.3670363970793155, "percentage": 36.7, "elapsed_time": "15:34:46", "remaining_time": "1 day, 2:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6586, "total_steps": 17941, "loss": 1.634, "learning_rate": 7.18173074238107e-05, "epoch": 0.3670921353324787, "percentage": 36.71, "elapsed_time": "15:34:55", "remaining_time": "1 day, 2:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6587, "total_steps": 17941, "loss": 1.7378, "learning_rate": 7.180929523409443e-05, "epoch": 0.3671478735856418, "percentage": 36.71, "elapsed_time": "15:35:04", "remaining_time": "1 day, 2:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6588, "total_steps": 17941, "loss": 1.5528, "learning_rate": 7.180128235271449e-05, "epoch": 0.36720361183880496, "percentage": 36.72, "elapsed_time": "15:35:12", "remaining_time": "1 day, 2:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6589, "total_steps": 17941, "loss": 1.7482, "learning_rate": 7.179326877992497e-05, "epoch": 0.36725935009196814, "percentage": 36.73, "elapsed_time": "15:35:21", "remaining_time": "1 day, 2:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6590, "total_steps": 17941, "loss": 1.4865, "learning_rate": 7.178525451598003e-05, "epoch": 0.36731508834513127, "percentage": 36.73, "elapsed_time": "15:35:29", "remaining_time": "1 day, 2:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6591, "total_steps": 17941, "loss": 1.9031, "learning_rate": 7.177723956113383e-05, "epoch": 0.3673708265982944, "percentage": 36.74, "elapsed_time": "15:35:38", "remaining_time": "1 day, 2:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6592, "total_steps": 17941, "loss": 1.6702, "learning_rate": 7.176922391564056e-05, "epoch": 0.3674265648514576, "percentage": 36.74, "elapsed_time": "15:35:46", "remaining_time": "1 day, 2:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6593, "total_steps": 17941, "loss": 1.6571, "learning_rate": 7.176120757975444e-05, "epoch": 0.3674823031046207, "percentage": 36.75, "elapsed_time": "15:35:55", "remaining_time": "1 day, 2:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6594, "total_steps": 17941, "loss": 1.7841, "learning_rate": 7.175319055372969e-05, "epoch": 0.36753804135778384, "percentage": 36.75, "elapsed_time": "15:36:03", "remaining_time": "1 day, 2:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6595, "total_steps": 17941, "loss": 1.6785, "learning_rate": 7.174517283782058e-05, "epoch": 0.36759377961094697, "percentage": 36.76, "elapsed_time": "15:36:11", "remaining_time": "1 day, 2:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6596, "total_steps": 17941, "loss": 1.6604, "learning_rate": 7.173715443228133e-05, "epoch": 0.36764951786411015, "percentage": 36.76, "elapsed_time": "15:36:20", "remaining_time": "1 day, 2:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6597, "total_steps": 17941, "loss": 1.7003, "learning_rate": 7.172913533736632e-05, "epoch": 0.3677052561172733, "percentage": 36.77, "elapsed_time": "15:36:28", "remaining_time": "1 day, 2:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6598, "total_steps": 17941, "loss": 1.9955, "learning_rate": 7.17211155533298e-05, "epoch": 0.3677609943704364, "percentage": 36.78, "elapsed_time": "15:36:37", "remaining_time": "1 day, 2:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6599, "total_steps": 17941, "loss": 1.5601, "learning_rate": 7.171309508042615e-05, "epoch": 0.3678167326235996, "percentage": 36.78, "elapsed_time": "15:36:45", "remaining_time": "1 day, 2:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6600, "total_steps": 17941, "loss": 2.1675, "learning_rate": 7.170507391890972e-05, "epoch": 0.3678724708767627, "percentage": 36.79, "elapsed_time": "15:36:54", "remaining_time": "1 day, 2:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6601, "total_steps": 17941, "loss": 1.6509, "learning_rate": 7.16970520690349e-05, "epoch": 0.36792820912992585, "percentage": 36.79, "elapsed_time": "15:37:02", "remaining_time": "1 day, 2:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6602, "total_steps": 17941, "loss": 1.7301, "learning_rate": 7.168902953105608e-05, "epoch": 0.36798394738308904, "percentage": 36.8, "elapsed_time": "15:37:11", "remaining_time": "1 day, 2:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6603, "total_steps": 17941, "loss": 1.4945, "learning_rate": 7.16810063052277e-05, "epoch": 0.36803968563625217, "percentage": 36.8, "elapsed_time": "15:37:19", "remaining_time": "1 day, 2:49:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6604, "total_steps": 17941, "loss": 1.8281, "learning_rate": 7.16729823918042e-05, "epoch": 0.3680954238894153, "percentage": 36.81, "elapsed_time": "15:37:28", "remaining_time": "1 day, 2:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6605, "total_steps": 17941, "loss": 1.6996, "learning_rate": 7.166495779104007e-05, "epoch": 0.3681511621425784, "percentage": 36.82, "elapsed_time": "15:37:36", "remaining_time": "1 day, 2:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6606, "total_steps": 17941, "loss": 1.9787, "learning_rate": 7.16569325031898e-05, "epoch": 0.3682069003957416, "percentage": 36.82, "elapsed_time": "15:37:45", "remaining_time": "1 day, 2:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6607, "total_steps": 17941, "loss": 1.7931, "learning_rate": 7.164890652850789e-05, "epoch": 0.36826263864890474, "percentage": 36.83, "elapsed_time": "15:37:53", "remaining_time": "1 day, 2:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6608, "total_steps": 17941, "loss": 1.664, "learning_rate": 7.16408798672489e-05, "epoch": 0.36831837690206787, "percentage": 36.83, "elapsed_time": "15:38:02", "remaining_time": "1 day, 2:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6609, "total_steps": 17941, "loss": 1.6754, "learning_rate": 7.163285251966736e-05, "epoch": 0.36837411515523105, "percentage": 36.84, "elapsed_time": "15:38:10", "remaining_time": "1 day, 2:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6610, "total_steps": 17941, "loss": 1.5501, "learning_rate": 7.162482448601789e-05, "epoch": 0.3684298534083942, "percentage": 36.84, "elapsed_time": "15:38:19", "remaining_time": "1 day, 2:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6611, "total_steps": 17941, "loss": 1.6168, "learning_rate": 7.161679576655503e-05, "epoch": 0.3684855916615573, "percentage": 36.85, "elapsed_time": "15:38:27", "remaining_time": "1 day, 2:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6612, "total_steps": 17941, "loss": 1.8576, "learning_rate": 7.160876636153349e-05, "epoch": 0.3685413299147205, "percentage": 36.85, "elapsed_time": "15:38:35", "remaining_time": "1 day, 2:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6613, "total_steps": 17941, "loss": 1.5803, "learning_rate": 7.160073627120784e-05, "epoch": 0.3685970681678836, "percentage": 36.86, "elapsed_time": "15:38:44", "remaining_time": "1 day, 2:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6614, "total_steps": 17941, "loss": 1.2999, "learning_rate": 7.159270549583278e-05, "epoch": 0.36865280642104675, "percentage": 36.87, "elapsed_time": "15:38:52", "remaining_time": "1 day, 2:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6615, "total_steps": 17941, "loss": 1.559, "learning_rate": 7.158467403566299e-05, "epoch": 0.36870854467420994, "percentage": 36.87, "elapsed_time": "15:39:01", "remaining_time": "1 day, 2:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6616, "total_steps": 17941, "loss": 1.2871, "learning_rate": 7.15766418909532e-05, "epoch": 0.36876428292737307, "percentage": 36.88, "elapsed_time": "15:39:09", "remaining_time": "1 day, 2:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6617, "total_steps": 17941, "loss": 1.717, "learning_rate": 7.156860906195811e-05, "epoch": 0.3688200211805362, "percentage": 36.88, "elapsed_time": "15:39:18", "remaining_time": "1 day, 2:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6618, "total_steps": 17941, "loss": 1.8828, "learning_rate": 7.156057554893251e-05, "epoch": 0.3688757594336993, "percentage": 36.89, "elapsed_time": "15:39:26", "remaining_time": "1 day, 2:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6619, "total_steps": 17941, "loss": 1.6727, "learning_rate": 7.155254135213117e-05, "epoch": 0.3689314976868625, "percentage": 36.89, "elapsed_time": "15:39:35", "remaining_time": "1 day, 2:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6620, "total_steps": 17941, "loss": 1.7273, "learning_rate": 7.154450647180886e-05, "epoch": 0.36898723594002564, "percentage": 36.9, "elapsed_time": "15:39:43", "remaining_time": "1 day, 2:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6621, "total_steps": 17941, "loss": 1.5732, "learning_rate": 7.153647090822043e-05, "epoch": 0.36904297419318877, "percentage": 36.9, "elapsed_time": "15:39:52", "remaining_time": "1 day, 2:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6622, "total_steps": 17941, "loss": 1.5612, "learning_rate": 7.152843466162069e-05, "epoch": 0.36909871244635195, "percentage": 36.91, "elapsed_time": "15:40:01", "remaining_time": "1 day, 2:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6623, "total_steps": 17941, "loss": 1.6601, "learning_rate": 7.152039773226456e-05, "epoch": 0.3691544506995151, "percentage": 36.92, "elapsed_time": "15:40:09", "remaining_time": "1 day, 2:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6624, "total_steps": 17941, "loss": 1.6467, "learning_rate": 7.151236012040685e-05, "epoch": 0.3692101889526782, "percentage": 36.92, "elapsed_time": "15:40:18", "remaining_time": "1 day, 2:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6625, "total_steps": 17941, "loss": 1.6429, "learning_rate": 7.150432182630252e-05, "epoch": 0.3692659272058414, "percentage": 36.93, "elapsed_time": "15:40:26", "remaining_time": "1 day, 2:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6626, "total_steps": 17941, "loss": 1.7369, "learning_rate": 7.149628285020648e-05, "epoch": 0.3693216654590045, "percentage": 36.93, "elapsed_time": "15:40:34", "remaining_time": "1 day, 2:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6627, "total_steps": 17941, "loss": 1.7329, "learning_rate": 7.148824319237367e-05, "epoch": 0.36937740371216765, "percentage": 36.94, "elapsed_time": "15:40:43", "remaining_time": "1 day, 2:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6628, "total_steps": 17941, "loss": 1.5495, "learning_rate": 7.148020285305907e-05, "epoch": 0.3694331419653308, "percentage": 36.94, "elapsed_time": "15:40:51", "remaining_time": "1 day, 2:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6629, "total_steps": 17941, "loss": 1.7592, "learning_rate": 7.147216183251768e-05, "epoch": 0.36948888021849396, "percentage": 36.95, "elapsed_time": "15:41:00", "remaining_time": "1 day, 2:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6630, "total_steps": 17941, "loss": 1.5094, "learning_rate": 7.146412013100451e-05, "epoch": 0.3695446184716571, "percentage": 36.95, "elapsed_time": "15:41:08", "remaining_time": "1 day, 2:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6631, "total_steps": 17941, "loss": 1.9804, "learning_rate": 7.14560777487746e-05, "epoch": 0.3696003567248202, "percentage": 36.96, "elapsed_time": "15:41:17", "remaining_time": "1 day, 2:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6632, "total_steps": 17941, "loss": 1.4165, "learning_rate": 7.144803468608298e-05, "epoch": 0.3696560949779834, "percentage": 36.97, "elapsed_time": "15:41:25", "remaining_time": "1 day, 2:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6633, "total_steps": 17941, "loss": 1.6362, "learning_rate": 7.143999094318477e-05, "epoch": 0.36971183323114654, "percentage": 36.97, "elapsed_time": "15:41:34", "remaining_time": "1 day, 2:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6634, "total_steps": 17941, "loss": 1.8459, "learning_rate": 7.143194652033505e-05, "epoch": 0.36976757148430967, "percentage": 36.98, "elapsed_time": "15:41:42", "remaining_time": "1 day, 2:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6635, "total_steps": 17941, "loss": 1.655, "learning_rate": 7.142390141778895e-05, "epoch": 0.36982330973747285, "percentage": 36.98, "elapsed_time": "15:41:50", "remaining_time": "1 day, 2:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6636, "total_steps": 17941, "loss": 1.8284, "learning_rate": 7.141585563580158e-05, "epoch": 0.369879047990636, "percentage": 36.99, "elapsed_time": "15:41:59", "remaining_time": "1 day, 2:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6637, "total_steps": 17941, "loss": 1.6024, "learning_rate": 7.140780917462814e-05, "epoch": 0.3699347862437991, "percentage": 36.99, "elapsed_time": "15:42:07", "remaining_time": "1 day, 2:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6638, "total_steps": 17941, "loss": 1.6143, "learning_rate": 7.139976203452383e-05, "epoch": 0.3699905244969623, "percentage": 37.0, "elapsed_time": "15:42:16", "remaining_time": "1 day, 2:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6639, "total_steps": 17941, "loss": 1.7714, "learning_rate": 7.139171421574383e-05, "epoch": 0.3700462627501254, "percentage": 37.0, "elapsed_time": "15:42:25", "remaining_time": "1 day, 2:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6640, "total_steps": 17941, "loss": 1.5943, "learning_rate": 7.138366571854338e-05, "epoch": 0.37010200100328855, "percentage": 37.01, "elapsed_time": "15:42:33", "remaining_time": "1 day, 2:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6641, "total_steps": 17941, "loss": 1.7892, "learning_rate": 7.137561654317772e-05, "epoch": 0.3701577392564517, "percentage": 37.02, "elapsed_time": "15:42:41", "remaining_time": "1 day, 2:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6642, "total_steps": 17941, "loss": 1.7051, "learning_rate": 7.136756668990213e-05, "epoch": 0.37021347750961486, "percentage": 37.02, "elapsed_time": "15:42:50", "remaining_time": "1 day, 2:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6643, "total_steps": 17941, "loss": 1.6284, "learning_rate": 7.13595161589719e-05, "epoch": 0.370269215762778, "percentage": 37.03, "elapsed_time": "15:42:59", "remaining_time": "1 day, 2:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6644, "total_steps": 17941, "loss": 1.5837, "learning_rate": 7.135146495064236e-05, "epoch": 0.3703249540159411, "percentage": 37.03, "elapsed_time": "15:43:07", "remaining_time": "1 day, 2:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6645, "total_steps": 17941, "loss": 1.891, "learning_rate": 7.134341306516885e-05, "epoch": 0.3703806922691043, "percentage": 37.04, "elapsed_time": "15:43:15", "remaining_time": "1 day, 2:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6646, "total_steps": 17941, "loss": 1.676, "learning_rate": 7.13353605028067e-05, "epoch": 0.37043643052226743, "percentage": 37.04, "elapsed_time": "15:43:24", "remaining_time": "1 day, 2:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6647, "total_steps": 17941, "loss": 1.8638, "learning_rate": 7.132730726381134e-05, "epoch": 0.37049216877543056, "percentage": 37.05, "elapsed_time": "15:43:32", "remaining_time": "1 day, 2:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6648, "total_steps": 17941, "loss": 2.0887, "learning_rate": 7.13192533484381e-05, "epoch": 0.37054790702859375, "percentage": 37.05, "elapsed_time": "15:43:41", "remaining_time": "1 day, 2:43:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6649, "total_steps": 17941, "loss": 1.5408, "learning_rate": 7.131119875694246e-05, "epoch": 0.3706036452817569, "percentage": 37.06, "elapsed_time": "15:43:49", "remaining_time": "1 day, 2:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6650, "total_steps": 17941, "loss": 1.4246, "learning_rate": 7.130314348957986e-05, "epoch": 0.37065938353492, "percentage": 37.07, "elapsed_time": "15:43:58", "remaining_time": "1 day, 2:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6651, "total_steps": 17941, "loss": 1.4972, "learning_rate": 7.129508754660575e-05, "epoch": 0.37071512178808314, "percentage": 37.07, "elapsed_time": "15:44:06", "remaining_time": "1 day, 2:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6652, "total_steps": 17941, "loss": 1.9089, "learning_rate": 7.128703092827562e-05, "epoch": 0.3707708600412463, "percentage": 37.08, "elapsed_time": "15:44:15", "remaining_time": "1 day, 2:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6653, "total_steps": 17941, "loss": 1.9196, "learning_rate": 7.127897363484497e-05, "epoch": 0.37082659829440945, "percentage": 37.08, "elapsed_time": "15:44:23", "remaining_time": "1 day, 2:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6654, "total_steps": 17941, "loss": 1.7842, "learning_rate": 7.127091566656936e-05, "epoch": 0.3708823365475726, "percentage": 37.09, "elapsed_time": "15:44:32", "remaining_time": "1 day, 2:42:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6655, "total_steps": 17941, "loss": 1.6261, "learning_rate": 7.12628570237043e-05, "epoch": 0.37093807480073576, "percentage": 37.09, "elapsed_time": "15:44:40", "remaining_time": "1 day, 2:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6656, "total_steps": 17941, "loss": 1.6085, "learning_rate": 7.125479770650539e-05, "epoch": 0.3709938130538989, "percentage": 37.1, "elapsed_time": "15:44:49", "remaining_time": "1 day, 2:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6657, "total_steps": 17941, "loss": 1.905, "learning_rate": 7.124673771522824e-05, "epoch": 0.371049551307062, "percentage": 37.1, "elapsed_time": "15:44:57", "remaining_time": "1 day, 2:41:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6658, "total_steps": 17941, "loss": 1.5081, "learning_rate": 7.123867705012843e-05, "epoch": 0.3711052895602252, "percentage": 37.11, "elapsed_time": "15:45:06", "remaining_time": "1 day, 2:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6659, "total_steps": 17941, "loss": 1.6793, "learning_rate": 7.123061571146161e-05, "epoch": 0.37116102781338833, "percentage": 37.12, "elapsed_time": "15:45:14", "remaining_time": "1 day, 2:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6660, "total_steps": 17941, "loss": 1.6402, "learning_rate": 7.122255369948346e-05, "epoch": 0.37121676606655146, "percentage": 37.12, "elapsed_time": "15:45:22", "remaining_time": "1 day, 2:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6661, "total_steps": 17941, "loss": 1.6232, "learning_rate": 7.121449101444964e-05, "epoch": 0.37127250431971465, "percentage": 37.13, "elapsed_time": "15:45:31", "remaining_time": "1 day, 2:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6662, "total_steps": 17941, "loss": 1.7163, "learning_rate": 7.120642765661584e-05, "epoch": 0.3713282425728778, "percentage": 37.13, "elapsed_time": "15:45:40", "remaining_time": "1 day, 2:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6663, "total_steps": 17941, "loss": 1.9706, "learning_rate": 7.119836362623781e-05, "epoch": 0.3713839808260409, "percentage": 37.14, "elapsed_time": "15:45:48", "remaining_time": "1 day, 2:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6664, "total_steps": 17941, "loss": 1.9116, "learning_rate": 7.119029892357128e-05, "epoch": 0.37143971907920403, "percentage": 37.14, "elapsed_time": "15:45:57", "remaining_time": "1 day, 2:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6665, "total_steps": 17941, "loss": 1.5862, "learning_rate": 7.118223354887201e-05, "epoch": 0.3714954573323672, "percentage": 37.15, "elapsed_time": "15:46:05", "remaining_time": "1 day, 2:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6666, "total_steps": 17941, "loss": 1.5945, "learning_rate": 7.11741675023958e-05, "epoch": 0.37155119558553035, "percentage": 37.16, "elapsed_time": "15:46:14", "remaining_time": "1 day, 2:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6667, "total_steps": 17941, "loss": 1.5802, "learning_rate": 7.116610078439845e-05, "epoch": 0.3716069338386935, "percentage": 37.16, "elapsed_time": "15:46:22", "remaining_time": "1 day, 2:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6668, "total_steps": 17941, "loss": 2.005, "learning_rate": 7.115803339513578e-05, "epoch": 0.37166267209185666, "percentage": 37.17, "elapsed_time": "15:46:31", "remaining_time": "1 day, 2:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6669, "total_steps": 17941, "loss": 1.5013, "learning_rate": 7.114996533486366e-05, "epoch": 0.3717184103450198, "percentage": 37.17, "elapsed_time": "15:46:39", "remaining_time": "1 day, 2:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6670, "total_steps": 17941, "loss": 2.0418, "learning_rate": 7.114189660383794e-05, "epoch": 0.3717741485981829, "percentage": 37.18, "elapsed_time": "15:46:49", "remaining_time": "1 day, 2:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6671, "total_steps": 17941, "loss": 1.7955, "learning_rate": 7.113382720231454e-05, "epoch": 0.3718298868513461, "percentage": 37.18, "elapsed_time": "15:46:57", "remaining_time": "1 day, 2:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6672, "total_steps": 17941, "loss": 1.4315, "learning_rate": 7.112575713054936e-05, "epoch": 0.37188562510450923, "percentage": 37.19, "elapsed_time": "15:47:06", "remaining_time": "1 day, 2:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6673, "total_steps": 17941, "loss": 1.566, "learning_rate": 7.111768638879833e-05, "epoch": 0.37194136335767236, "percentage": 37.19, "elapsed_time": "15:47:14", "remaining_time": "1 day, 2:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6674, "total_steps": 17941, "loss": 1.8572, "learning_rate": 7.110961497731742e-05, "epoch": 0.3719971016108355, "percentage": 37.2, "elapsed_time": "15:47:23", "remaining_time": "1 day, 2:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6675, "total_steps": 17941, "loss": 2.0372, "learning_rate": 7.110154289636259e-05, "epoch": 0.3720528398639987, "percentage": 37.21, "elapsed_time": "15:47:31", "remaining_time": "1 day, 2:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6676, "total_steps": 17941, "loss": 1.6665, "learning_rate": 7.109347014618985e-05, "epoch": 0.3721085781171618, "percentage": 37.21, "elapsed_time": "15:47:40", "remaining_time": "1 day, 2:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6677, "total_steps": 17941, "loss": 1.747, "learning_rate": 7.108539672705523e-05, "epoch": 0.37216431637032493, "percentage": 37.22, "elapsed_time": "15:47:48", "remaining_time": "1 day, 2:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6678, "total_steps": 17941, "loss": 1.4182, "learning_rate": 7.107732263921475e-05, "epoch": 0.3722200546234881, "percentage": 37.22, "elapsed_time": "15:47:57", "remaining_time": "1 day, 2:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6679, "total_steps": 17941, "loss": 1.6223, "learning_rate": 7.106924788292448e-05, "epoch": 0.37227579287665125, "percentage": 37.23, "elapsed_time": "15:48:05", "remaining_time": "1 day, 2:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6680, "total_steps": 17941, "loss": 1.5979, "learning_rate": 7.106117245844054e-05, "epoch": 0.3723315311298144, "percentage": 37.23, "elapsed_time": "15:48:15", "remaining_time": "1 day, 2:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6681, "total_steps": 17941, "loss": 1.9983, "learning_rate": 7.105309636601898e-05, "epoch": 0.37238726938297756, "percentage": 37.24, "elapsed_time": "15:48:23", "remaining_time": "1 day, 2:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6682, "total_steps": 17941, "loss": 1.5488, "learning_rate": 7.104501960591595e-05, "epoch": 0.3724430076361407, "percentage": 37.24, "elapsed_time": "15:48:31", "remaining_time": "1 day, 2:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6683, "total_steps": 17941, "loss": 1.6376, "learning_rate": 7.103694217838761e-05, "epoch": 0.3724987458893038, "percentage": 37.25, "elapsed_time": "15:48:40", "remaining_time": "1 day, 2:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6684, "total_steps": 17941, "loss": 1.4654, "learning_rate": 7.102886408369012e-05, "epoch": 0.372554484142467, "percentage": 37.26, "elapsed_time": "15:48:48", "remaining_time": "1 day, 2:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6685, "total_steps": 17941, "loss": 1.7554, "learning_rate": 7.102078532207966e-05, "epoch": 0.37261022239563013, "percentage": 37.26, "elapsed_time": "15:48:57", "remaining_time": "1 day, 2:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6686, "total_steps": 17941, "loss": 1.8247, "learning_rate": 7.101270589381245e-05, "epoch": 0.37266596064879326, "percentage": 37.27, "elapsed_time": "15:49:06", "remaining_time": "1 day, 2:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6687, "total_steps": 17941, "loss": 1.7902, "learning_rate": 7.100462579914474e-05, "epoch": 0.3727216989019564, "percentage": 37.27, "elapsed_time": "15:49:14", "remaining_time": "1 day, 2:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6688, "total_steps": 17941, "loss": 1.7138, "learning_rate": 7.099654503833273e-05, "epoch": 0.3727774371551196, "percentage": 37.28, "elapsed_time": "15:49:23", "remaining_time": "1 day, 2:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6689, "total_steps": 17941, "loss": 1.6607, "learning_rate": 7.098846361163273e-05, "epoch": 0.3728331754082827, "percentage": 37.28, "elapsed_time": "15:49:31", "remaining_time": "1 day, 2:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6690, "total_steps": 17941, "loss": 1.8834, "learning_rate": 7.098038151930107e-05, "epoch": 0.37288891366144583, "percentage": 37.29, "elapsed_time": "15:49:40", "remaining_time": "1 day, 2:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6691, "total_steps": 17941, "loss": 1.67, "learning_rate": 7.097229876159401e-05, "epoch": 0.372944651914609, "percentage": 37.29, "elapsed_time": "15:49:49", "remaining_time": "1 day, 2:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6692, "total_steps": 17941, "loss": 1.6881, "learning_rate": 7.096421533876792e-05, "epoch": 0.37300039016777214, "percentage": 37.3, "elapsed_time": "15:49:57", "remaining_time": "1 day, 2:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6693, "total_steps": 17941, "loss": 1.6077, "learning_rate": 7.095613125107915e-05, "epoch": 0.3730561284209353, "percentage": 37.31, "elapsed_time": "15:50:06", "remaining_time": "1 day, 2:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6694, "total_steps": 17941, "loss": 1.6124, "learning_rate": 7.094804649878407e-05, "epoch": 0.37311186667409846, "percentage": 37.31, "elapsed_time": "15:50:15", "remaining_time": "1 day, 2:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6695, "total_steps": 17941, "loss": 1.735, "learning_rate": 7.093996108213909e-05, "epoch": 0.3731676049272616, "percentage": 37.32, "elapsed_time": "15:50:23", "remaining_time": "1 day, 2:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6696, "total_steps": 17941, "loss": 1.9465, "learning_rate": 7.093187500140064e-05, "epoch": 0.3732233431804247, "percentage": 37.32, "elapsed_time": "15:50:31", "remaining_time": "1 day, 2:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6697, "total_steps": 17941, "loss": 1.6817, "learning_rate": 7.092378825682517e-05, "epoch": 0.37327908143358784, "percentage": 37.33, "elapsed_time": "15:50:40", "remaining_time": "1 day, 2:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6698, "total_steps": 17941, "loss": 1.7072, "learning_rate": 7.091570084866909e-05, "epoch": 0.37333481968675103, "percentage": 37.33, "elapsed_time": "15:50:48", "remaining_time": "1 day, 2:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6699, "total_steps": 17941, "loss": 1.7315, "learning_rate": 7.090761277718897e-05, "epoch": 0.37339055793991416, "percentage": 37.34, "elapsed_time": "15:50:57", "remaining_time": "1 day, 2:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6700, "total_steps": 17941, "loss": 1.5599, "learning_rate": 7.089952404264126e-05, "epoch": 0.3734462961930773, "percentage": 37.34, "elapsed_time": "15:51:05", "remaining_time": "1 day, 2:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6701, "total_steps": 17941, "loss": 1.6328, "learning_rate": 7.089143464528249e-05, "epoch": 0.37350203444624047, "percentage": 37.35, "elapsed_time": "15:51:14", "remaining_time": "1 day, 2:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6702, "total_steps": 17941, "loss": 1.8025, "learning_rate": 7.088334458536921e-05, "epoch": 0.3735577726994036, "percentage": 37.36, "elapsed_time": "15:51:22", "remaining_time": "1 day, 2:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6703, "total_steps": 17941, "loss": 1.6715, "learning_rate": 7.087525386315802e-05, "epoch": 0.37361351095256673, "percentage": 37.36, "elapsed_time": "15:51:31", "remaining_time": "1 day, 2:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6704, "total_steps": 17941, "loss": 1.7321, "learning_rate": 7.086716247890548e-05, "epoch": 0.3736692492057299, "percentage": 37.37, "elapsed_time": "15:51:39", "remaining_time": "1 day, 2:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6705, "total_steps": 17941, "loss": 1.5648, "learning_rate": 7.08590704328682e-05, "epoch": 0.37372498745889304, "percentage": 37.37, "elapsed_time": "15:51:48", "remaining_time": "1 day, 2:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6706, "total_steps": 17941, "loss": 1.9348, "learning_rate": 7.085097772530283e-05, "epoch": 0.37378072571205617, "percentage": 37.38, "elapsed_time": "15:51:56", "remaining_time": "1 day, 2:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6707, "total_steps": 17941, "loss": 1.5634, "learning_rate": 7.084288435646603e-05, "epoch": 0.37383646396521936, "percentage": 37.38, "elapsed_time": "15:52:05", "remaining_time": "1 day, 2:34:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6708, "total_steps": 17941, "loss": 1.6525, "learning_rate": 7.083479032661445e-05, "epoch": 0.3738922022183825, "percentage": 37.39, "elapsed_time": "15:52:13", "remaining_time": "1 day, 2:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6709, "total_steps": 17941, "loss": 1.885, "learning_rate": 7.082669563600478e-05, "epoch": 0.3739479404715456, "percentage": 37.39, "elapsed_time": "15:52:22", "remaining_time": "1 day, 2:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6710, "total_steps": 17941, "loss": 1.8645, "learning_rate": 7.081860028489377e-05, "epoch": 0.37400367872470874, "percentage": 37.4, "elapsed_time": "15:52:30", "remaining_time": "1 day, 2:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6711, "total_steps": 17941, "loss": 1.8752, "learning_rate": 7.081050427353814e-05, "epoch": 0.37405941697787193, "percentage": 37.41, "elapsed_time": "15:52:39", "remaining_time": "1 day, 2:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6712, "total_steps": 17941, "loss": 1.5953, "learning_rate": 7.080240760219465e-05, "epoch": 0.37411515523103506, "percentage": 37.41, "elapsed_time": "15:52:47", "remaining_time": "1 day, 2:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6713, "total_steps": 17941, "loss": 1.4812, "learning_rate": 7.079431027112006e-05, "epoch": 0.3741708934841982, "percentage": 37.42, "elapsed_time": "15:52:56", "remaining_time": "1 day, 2:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6714, "total_steps": 17941, "loss": 1.8588, "learning_rate": 7.078621228057121e-05, "epoch": 0.37422663173736137, "percentage": 37.42, "elapsed_time": "15:53:04", "remaining_time": "1 day, 2:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6715, "total_steps": 17941, "loss": 1.745, "learning_rate": 7.077811363080489e-05, "epoch": 0.3742823699905245, "percentage": 37.43, "elapsed_time": "15:53:13", "remaining_time": "1 day, 2:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6716, "total_steps": 17941, "loss": 1.511, "learning_rate": 7.077001432207795e-05, "epoch": 0.37433810824368763, "percentage": 37.43, "elapsed_time": "15:53:21", "remaining_time": "1 day, 2:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6717, "total_steps": 17941, "loss": 1.6644, "learning_rate": 7.076191435464725e-05, "epoch": 0.3743938464968508, "percentage": 37.44, "elapsed_time": "15:53:30", "remaining_time": "1 day, 2:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6718, "total_steps": 17941, "loss": 1.73, "learning_rate": 7.075381372876967e-05, "epoch": 0.37444958475001394, "percentage": 37.44, "elapsed_time": "15:53:38", "remaining_time": "1 day, 2:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6719, "total_steps": 17941, "loss": 1.6284, "learning_rate": 7.074571244470214e-05, "epoch": 0.37450532300317707, "percentage": 37.45, "elapsed_time": "15:53:47", "remaining_time": "1 day, 2:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6720, "total_steps": 17941, "loss": 1.84, "learning_rate": 7.073761050270156e-05, "epoch": 0.3745610612563402, "percentage": 37.46, "elapsed_time": "15:53:55", "remaining_time": "1 day, 2:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6721, "total_steps": 17941, "loss": 1.4598, "learning_rate": 7.072950790302487e-05, "epoch": 0.3746167995095034, "percentage": 37.46, "elapsed_time": "15:54:04", "remaining_time": "1 day, 2:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6722, "total_steps": 17941, "loss": 1.5442, "learning_rate": 7.072140464592907e-05, "epoch": 0.3746725377626665, "percentage": 37.47, "elapsed_time": "15:54:12", "remaining_time": "1 day, 2:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6723, "total_steps": 17941, "loss": 1.6898, "learning_rate": 7.071330073167112e-05, "epoch": 0.37472827601582964, "percentage": 37.47, "elapsed_time": "15:54:21", "remaining_time": "1 day, 2:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6724, "total_steps": 17941, "loss": 1.731, "learning_rate": 7.070519616050804e-05, "epoch": 0.3747840142689928, "percentage": 37.48, "elapsed_time": "15:54:30", "remaining_time": "1 day, 2:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6725, "total_steps": 17941, "loss": 1.796, "learning_rate": 7.069709093269687e-05, "epoch": 0.37483975252215596, "percentage": 37.48, "elapsed_time": "15:54:38", "remaining_time": "1 day, 2:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6726, "total_steps": 17941, "loss": 1.656, "learning_rate": 7.068898504849462e-05, "epoch": 0.3748954907753191, "percentage": 37.49, "elapsed_time": "15:54:47", "remaining_time": "1 day, 2:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6727, "total_steps": 17941, "loss": 1.6656, "learning_rate": 7.06808785081584e-05, "epoch": 0.37495122902848227, "percentage": 37.5, "elapsed_time": "15:54:55", "remaining_time": "1 day, 2:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6728, "total_steps": 17941, "loss": 1.7658, "learning_rate": 7.067277131194529e-05, "epoch": 0.3750069672816454, "percentage": 37.5, "elapsed_time": "15:55:04", "remaining_time": "1 day, 2:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6729, "total_steps": 17941, "loss": 1.6342, "learning_rate": 7.066466346011242e-05, "epoch": 0.3750627055348085, "percentage": 37.51, "elapsed_time": "15:55:12", "remaining_time": "1 day, 2:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6730, "total_steps": 17941, "loss": 1.7829, "learning_rate": 7.06565549529169e-05, "epoch": 0.3751184437879717, "percentage": 37.51, "elapsed_time": "15:55:21", "remaining_time": "1 day, 2:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6731, "total_steps": 17941, "loss": 1.8819, "learning_rate": 7.064844579061588e-05, "epoch": 0.37517418204113484, "percentage": 37.52, "elapsed_time": "15:55:29", "remaining_time": "1 day, 2:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6732, "total_steps": 17941, "loss": 1.6654, "learning_rate": 7.064033597346658e-05, "epoch": 0.37522992029429797, "percentage": 37.52, "elapsed_time": "15:55:38", "remaining_time": "1 day, 2:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6733, "total_steps": 17941, "loss": 1.6577, "learning_rate": 7.063222550172612e-05, "epoch": 0.3752856585474611, "percentage": 37.53, "elapsed_time": "15:55:47", "remaining_time": "1 day, 2:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6734, "total_steps": 17941, "loss": 1.7532, "learning_rate": 7.062411437565179e-05, "epoch": 0.3753413968006243, "percentage": 37.53, "elapsed_time": "15:55:55", "remaining_time": "1 day, 2:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6735, "total_steps": 17941, "loss": 1.7744, "learning_rate": 7.06160025955008e-05, "epoch": 0.3753971350537874, "percentage": 37.54, "elapsed_time": "15:56:04", "remaining_time": "1 day, 2:30:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6736, "total_steps": 17941, "loss": 1.9847, "learning_rate": 7.06078901615304e-05, "epoch": 0.37545287330695054, "percentage": 37.55, "elapsed_time": "15:56:12", "remaining_time": "1 day, 2:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6737, "total_steps": 17941, "loss": 1.4559, "learning_rate": 7.059977707399787e-05, "epoch": 0.3755086115601137, "percentage": 37.55, "elapsed_time": "15:56:21", "remaining_time": "1 day, 2:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6738, "total_steps": 17941, "loss": 1.6796, "learning_rate": 7.059166333316054e-05, "epoch": 0.37556434981327685, "percentage": 37.56, "elapsed_time": "15:56:29", "remaining_time": "1 day, 2:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6739, "total_steps": 17941, "loss": 1.5015, "learning_rate": 7.058354893927568e-05, "epoch": 0.37562008806644, "percentage": 37.56, "elapsed_time": "15:56:38", "remaining_time": "1 day, 2:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6740, "total_steps": 17941, "loss": 1.8178, "learning_rate": 7.057543389260068e-05, "epoch": 0.37567582631960317, "percentage": 37.57, "elapsed_time": "15:56:47", "remaining_time": "1 day, 2:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6741, "total_steps": 17941, "loss": 1.7513, "learning_rate": 7.056731819339286e-05, "epoch": 0.3757315645727663, "percentage": 37.57, "elapsed_time": "15:56:55", "remaining_time": "1 day, 2:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6742, "total_steps": 17941, "loss": 1.6351, "learning_rate": 7.055920184190964e-05, "epoch": 0.3757873028259294, "percentage": 37.58, "elapsed_time": "15:57:04", "remaining_time": "1 day, 2:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6743, "total_steps": 17941, "loss": 1.6854, "learning_rate": 7.055108483840839e-05, "epoch": 0.37584304107909255, "percentage": 37.58, "elapsed_time": "15:57:12", "remaining_time": "1 day, 2:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6744, "total_steps": 17941, "loss": 1.7937, "learning_rate": 7.054296718314656e-05, "epoch": 0.37589877933225574, "percentage": 37.59, "elapsed_time": "15:57:20", "remaining_time": "1 day, 2:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6745, "total_steps": 17941, "loss": 1.6708, "learning_rate": 7.053484887638158e-05, "epoch": 0.37595451758541887, "percentage": 37.6, "elapsed_time": "15:57:29", "remaining_time": "1 day, 2:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6746, "total_steps": 17941, "loss": 1.6565, "learning_rate": 7.052672991837093e-05, "epoch": 0.376010255838582, "percentage": 37.6, "elapsed_time": "15:57:37", "remaining_time": "1 day, 2:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6747, "total_steps": 17941, "loss": 1.5376, "learning_rate": 7.051861030937207e-05, "epoch": 0.3760659940917452, "percentage": 37.61, "elapsed_time": "15:57:46", "remaining_time": "1 day, 2:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6748, "total_steps": 17941, "loss": 1.7518, "learning_rate": 7.051049004964254e-05, "epoch": 0.3761217323449083, "percentage": 37.61, "elapsed_time": "15:57:54", "remaining_time": "1 day, 2:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6749, "total_steps": 17941, "loss": 1.5384, "learning_rate": 7.050236913943984e-05, "epoch": 0.37617747059807144, "percentage": 37.62, "elapsed_time": "15:58:03", "remaining_time": "1 day, 2:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6750, "total_steps": 17941, "loss": 1.6072, "learning_rate": 7.049424757902153e-05, "epoch": 0.3762332088512346, "percentage": 37.62, "elapsed_time": "15:58:11", "remaining_time": "1 day, 2:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6751, "total_steps": 17941, "loss": 1.8342, "learning_rate": 7.048612536864517e-05, "epoch": 0.37628894710439775, "percentage": 37.63, "elapsed_time": "15:58:20", "remaining_time": "1 day, 2:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6752, "total_steps": 17941, "loss": 1.6988, "learning_rate": 7.047800250856837e-05, "epoch": 0.3763446853575609, "percentage": 37.63, "elapsed_time": "15:58:29", "remaining_time": "1 day, 2:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6753, "total_steps": 17941, "loss": 1.4647, "learning_rate": 7.046987899904871e-05, "epoch": 0.37640042361072407, "percentage": 37.64, "elapsed_time": "15:58:38", "remaining_time": "1 day, 2:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6754, "total_steps": 17941, "loss": 1.5224, "learning_rate": 7.046175484034384e-05, "epoch": 0.3764561618638872, "percentage": 37.65, "elapsed_time": "15:58:46", "remaining_time": "1 day, 2:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6755, "total_steps": 17941, "loss": 1.664, "learning_rate": 7.045363003271141e-05, "epoch": 0.3765119001170503, "percentage": 37.65, "elapsed_time": "15:58:55", "remaining_time": "1 day, 2:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6756, "total_steps": 17941, "loss": 1.6422, "learning_rate": 7.044550457640909e-05, "epoch": 0.37656763837021345, "percentage": 37.66, "elapsed_time": "15:59:03", "remaining_time": "1 day, 2:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6757, "total_steps": 17941, "loss": 2.0161, "learning_rate": 7.043737847169455e-05, "epoch": 0.37662337662337664, "percentage": 37.66, "elapsed_time": "15:59:12", "remaining_time": "1 day, 2:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6758, "total_steps": 17941, "loss": 1.6388, "learning_rate": 7.042925171882557e-05, "epoch": 0.37667911487653977, "percentage": 37.67, "elapsed_time": "15:59:20", "remaining_time": "1 day, 2:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6759, "total_steps": 17941, "loss": 1.546, "learning_rate": 7.042112431805979e-05, "epoch": 0.3767348531297029, "percentage": 37.67, "elapsed_time": "15:59:29", "remaining_time": "1 day, 2:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6760, "total_steps": 17941, "loss": 1.6727, "learning_rate": 7.041299626965503e-05, "epoch": 0.3767905913828661, "percentage": 37.68, "elapsed_time": "15:59:38", "remaining_time": "1 day, 2:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6761, "total_steps": 17941, "loss": 1.7527, "learning_rate": 7.040486757386904e-05, "epoch": 0.3768463296360292, "percentage": 37.68, "elapsed_time": "15:59:47", "remaining_time": "1 day, 2:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6762, "total_steps": 17941, "loss": 1.9415, "learning_rate": 7.039673823095963e-05, "epoch": 0.37690206788919234, "percentage": 37.69, "elapsed_time": "15:59:55", "remaining_time": "1 day, 2:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6763, "total_steps": 17941, "loss": 1.6316, "learning_rate": 7.03886082411846e-05, "epoch": 0.3769578061423555, "percentage": 37.7, "elapsed_time": "16:00:04", "remaining_time": "1 day, 2:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6764, "total_steps": 17941, "loss": 1.6363, "learning_rate": 7.038047760480179e-05, "epoch": 0.37701354439551865, "percentage": 37.7, "elapsed_time": "16:00:12", "remaining_time": "1 day, 2:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6765, "total_steps": 17941, "loss": 1.7243, "learning_rate": 7.037234632206905e-05, "epoch": 0.3770692826486818, "percentage": 37.71, "elapsed_time": "16:00:21", "remaining_time": "1 day, 2:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6766, "total_steps": 17941, "loss": 1.6807, "learning_rate": 7.036421439324427e-05, "epoch": 0.3771250209018449, "percentage": 37.71, "elapsed_time": "16:00:29", "remaining_time": "1 day, 2:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6767, "total_steps": 17941, "loss": 1.6641, "learning_rate": 7.035608181858533e-05, "epoch": 0.3771807591550081, "percentage": 37.72, "elapsed_time": "16:00:38", "remaining_time": "1 day, 2:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6768, "total_steps": 17941, "loss": 1.8226, "learning_rate": 7.034794859835016e-05, "epoch": 0.3772364974081712, "percentage": 37.72, "elapsed_time": "16:00:46", "remaining_time": "1 day, 2:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6769, "total_steps": 17941, "loss": 1.6291, "learning_rate": 7.033981473279672e-05, "epoch": 0.37729223566133435, "percentage": 37.73, "elapsed_time": "16:00:56", "remaining_time": "1 day, 2:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6770, "total_steps": 17941, "loss": 1.5797, "learning_rate": 7.033168022218292e-05, "epoch": 0.37734797391449754, "percentage": 37.73, "elapsed_time": "16:01:04", "remaining_time": "1 day, 2:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6771, "total_steps": 17941, "loss": 1.7165, "learning_rate": 7.032354506676678e-05, "epoch": 0.37740371216766067, "percentage": 37.74, "elapsed_time": "16:01:13", "remaining_time": "1 day, 2:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6772, "total_steps": 17941, "loss": 1.9454, "learning_rate": 7.031540926680627e-05, "epoch": 0.3774594504208238, "percentage": 37.75, "elapsed_time": "16:01:21", "remaining_time": "1 day, 2:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6773, "total_steps": 17941, "loss": 1.9527, "learning_rate": 7.030727282255944e-05, "epoch": 0.377515188673987, "percentage": 37.75, "elapsed_time": "16:01:30", "remaining_time": "1 day, 2:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6774, "total_steps": 17941, "loss": 1.4055, "learning_rate": 7.02991357342843e-05, "epoch": 0.3775709269271501, "percentage": 37.76, "elapsed_time": "16:01:38", "remaining_time": "1 day, 2:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6775, "total_steps": 17941, "loss": 1.5683, "learning_rate": 7.029099800223895e-05, "epoch": 0.37762666518031324, "percentage": 37.76, "elapsed_time": "16:01:47", "remaining_time": "1 day, 2:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6776, "total_steps": 17941, "loss": 1.6576, "learning_rate": 7.028285962668144e-05, "epoch": 0.3776824034334764, "percentage": 37.77, "elapsed_time": "16:01:56", "remaining_time": "1 day, 2:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6777, "total_steps": 17941, "loss": 1.6046, "learning_rate": 7.027472060786988e-05, "epoch": 0.37773814168663955, "percentage": 37.77, "elapsed_time": "16:02:04", "remaining_time": "1 day, 2:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6778, "total_steps": 17941, "loss": 1.8251, "learning_rate": 7.026658094606238e-05, "epoch": 0.3777938799398027, "percentage": 37.78, "elapsed_time": "16:02:13", "remaining_time": "1 day, 2:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6779, "total_steps": 17941, "loss": 1.9974, "learning_rate": 7.02584406415171e-05, "epoch": 0.3778496181929658, "percentage": 37.78, "elapsed_time": "16:02:22", "remaining_time": "1 day, 2:24:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6780, "total_steps": 17941, "loss": 1.5211, "learning_rate": 7.02502996944922e-05, "epoch": 0.377905356446129, "percentage": 37.79, "elapsed_time": "16:02:30", "remaining_time": "1 day, 2:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6781, "total_steps": 17941, "loss": 1.7317, "learning_rate": 7.024215810524586e-05, "epoch": 0.3779610946992921, "percentage": 37.8, "elapsed_time": "16:02:39", "remaining_time": "1 day, 2:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6782, "total_steps": 17941, "loss": 1.6749, "learning_rate": 7.023401587403629e-05, "epoch": 0.37801683295245525, "percentage": 37.8, "elapsed_time": "16:02:47", "remaining_time": "1 day, 2:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6783, "total_steps": 17941, "loss": 1.7105, "learning_rate": 7.022587300112171e-05, "epoch": 0.37807257120561844, "percentage": 37.81, "elapsed_time": "16:02:56", "remaining_time": "1 day, 2:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6784, "total_steps": 17941, "loss": 1.8057, "learning_rate": 7.021772948676037e-05, "epoch": 0.37812830945878156, "percentage": 37.81, "elapsed_time": "16:03:04", "remaining_time": "1 day, 2:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6785, "total_steps": 17941, "loss": 1.6275, "learning_rate": 7.020958533121051e-05, "epoch": 0.3781840477119447, "percentage": 37.82, "elapsed_time": "16:03:13", "remaining_time": "1 day, 2:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6786, "total_steps": 17941, "loss": 1.786, "learning_rate": 7.020144053473044e-05, "epoch": 0.3782397859651079, "percentage": 37.82, "elapsed_time": "16:03:21", "remaining_time": "1 day, 2:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6787, "total_steps": 17941, "loss": 1.6452, "learning_rate": 7.019329509757845e-05, "epoch": 0.378295524218271, "percentage": 37.83, "elapsed_time": "16:03:30", "remaining_time": "1 day, 2:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6788, "total_steps": 17941, "loss": 1.5128, "learning_rate": 7.01851490200129e-05, "epoch": 0.37835126247143414, "percentage": 37.84, "elapsed_time": "16:03:39", "remaining_time": "1 day, 2:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6789, "total_steps": 17941, "loss": 1.4683, "learning_rate": 7.017700230229208e-05, "epoch": 0.37840700072459726, "percentage": 37.84, "elapsed_time": "16:03:47", "remaining_time": "1 day, 2:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6790, "total_steps": 17941, "loss": 1.6131, "learning_rate": 7.01688549446744e-05, "epoch": 0.37846273897776045, "percentage": 37.85, "elapsed_time": "16:03:56", "remaining_time": "1 day, 2:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6791, "total_steps": 17941, "loss": 1.6499, "learning_rate": 7.016070694741824e-05, "epoch": 0.3785184772309236, "percentage": 37.85, "elapsed_time": "16:04:04", "remaining_time": "1 day, 2:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6792, "total_steps": 17941, "loss": 1.6677, "learning_rate": 7.015255831078201e-05, "epoch": 0.3785742154840867, "percentage": 37.86, "elapsed_time": "16:04:12", "remaining_time": "1 day, 2:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6793, "total_steps": 17941, "loss": 1.6498, "learning_rate": 7.01444090350241e-05, "epoch": 0.3786299537372499, "percentage": 37.86, "elapsed_time": "16:04:21", "remaining_time": "1 day, 2:22:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6794, "total_steps": 17941, "loss": 1.8393, "learning_rate": 7.0136259120403e-05, "epoch": 0.378685691990413, "percentage": 37.87, "elapsed_time": "16:04:29", "remaining_time": "1 day, 2:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6795, "total_steps": 17941, "loss": 1.5817, "learning_rate": 7.012810856717717e-05, "epoch": 0.37874143024357615, "percentage": 37.87, "elapsed_time": "16:04:38", "remaining_time": "1 day, 2:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6796, "total_steps": 17941, "loss": 1.736, "learning_rate": 7.011995737560507e-05, "epoch": 0.37879716849673933, "percentage": 37.88, "elapsed_time": "16:04:46", "remaining_time": "1 day, 2:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6797, "total_steps": 17941, "loss": 1.7195, "learning_rate": 7.011180554594525e-05, "epoch": 0.37885290674990246, "percentage": 37.89, "elapsed_time": "16:04:55", "remaining_time": "1 day, 2:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6798, "total_steps": 17941, "loss": 1.5784, "learning_rate": 7.010365307845621e-05, "epoch": 0.3789086450030656, "percentage": 37.89, "elapsed_time": "16:05:03", "remaining_time": "1 day, 2:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6799, "total_steps": 17941, "loss": 1.4703, "learning_rate": 7.00954999733965e-05, "epoch": 0.3789643832562288, "percentage": 37.9, "elapsed_time": "16:05:12", "remaining_time": "1 day, 2:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6800, "total_steps": 17941, "loss": 1.7026, "learning_rate": 7.008734623102471e-05, "epoch": 0.3790201215093919, "percentage": 37.9, "elapsed_time": "16:05:20", "remaining_time": "1 day, 2:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6801, "total_steps": 17941, "loss": 1.6358, "learning_rate": 7.007919185159942e-05, "epoch": 0.37907585976255503, "percentage": 37.91, "elapsed_time": "16:05:29", "remaining_time": "1 day, 2:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6802, "total_steps": 17941, "loss": 1.5224, "learning_rate": 7.007103683537922e-05, "epoch": 0.37913159801571816, "percentage": 37.91, "elapsed_time": "16:05:37", "remaining_time": "1 day, 2:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6803, "total_steps": 17941, "loss": 1.5611, "learning_rate": 7.006288118262277e-05, "epoch": 0.37918733626888135, "percentage": 37.92, "elapsed_time": "16:05:45", "remaining_time": "1 day, 2:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6804, "total_steps": 17941, "loss": 1.9112, "learning_rate": 7.005472489358868e-05, "epoch": 0.3792430745220445, "percentage": 37.92, "elapsed_time": "16:05:54", "remaining_time": "1 day, 2:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6805, "total_steps": 17941, "loss": 1.678, "learning_rate": 7.004656796853565e-05, "epoch": 0.3792988127752076, "percentage": 37.93, "elapsed_time": "16:06:03", "remaining_time": "1 day, 2:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6806, "total_steps": 17941, "loss": 1.6372, "learning_rate": 7.003841040772237e-05, "epoch": 0.3793545510283708, "percentage": 37.94, "elapsed_time": "16:06:12", "remaining_time": "1 day, 2:20:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6807, "total_steps": 17941, "loss": 1.7838, "learning_rate": 7.003025221140754e-05, "epoch": 0.3794102892815339, "percentage": 37.94, "elapsed_time": "16:06:20", "remaining_time": "1 day, 2:20:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6808, "total_steps": 17941, "loss": 1.8518, "learning_rate": 7.00220933798499e-05, "epoch": 0.37946602753469705, "percentage": 37.95, "elapsed_time": "16:06:29", "remaining_time": "1 day, 2:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6809, "total_steps": 17941, "loss": 1.4928, "learning_rate": 7.001393391330819e-05, "epoch": 0.37952176578786023, "percentage": 37.95, "elapsed_time": "16:06:38", "remaining_time": "1 day, 2:20:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6810, "total_steps": 17941, "loss": 1.5464, "learning_rate": 7.000577381204118e-05, "epoch": 0.37957750404102336, "percentage": 37.96, "elapsed_time": "16:06:47", "remaining_time": "1 day, 2:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6811, "total_steps": 17941, "loss": 1.4929, "learning_rate": 6.999761307630767e-05, "epoch": 0.3796332422941865, "percentage": 37.96, "elapsed_time": "16:06:55", "remaining_time": "1 day, 2:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6812, "total_steps": 17941, "loss": 1.8435, "learning_rate": 6.998945170636647e-05, "epoch": 0.3796889805473496, "percentage": 37.97, "elapsed_time": "16:07:04", "remaining_time": "1 day, 2:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6813, "total_steps": 17941, "loss": 1.5962, "learning_rate": 6.998128970247641e-05, "epoch": 0.3797447188005128, "percentage": 37.97, "elapsed_time": "16:07:12", "remaining_time": "1 day, 2:19:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6814, "total_steps": 17941, "loss": 1.4978, "learning_rate": 6.997312706489634e-05, "epoch": 0.37980045705367593, "percentage": 37.98, "elapsed_time": "16:07:20", "remaining_time": "1 day, 2:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6815, "total_steps": 17941, "loss": 1.7663, "learning_rate": 6.996496379388512e-05, "epoch": 0.37985619530683906, "percentage": 37.99, "elapsed_time": "16:07:29", "remaining_time": "1 day, 2:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6816, "total_steps": 17941, "loss": 1.9011, "learning_rate": 6.995679988970167e-05, "epoch": 0.37991193356000225, "percentage": 37.99, "elapsed_time": "16:07:37", "remaining_time": "1 day, 2:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6817, "total_steps": 17941, "loss": 1.5928, "learning_rate": 6.994863535260488e-05, "epoch": 0.3799676718131654, "percentage": 38.0, "elapsed_time": "16:07:46", "remaining_time": "1 day, 2:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6818, "total_steps": 17941, "loss": 1.6347, "learning_rate": 6.994047018285368e-05, "epoch": 0.3800234100663285, "percentage": 38.0, "elapsed_time": "16:07:54", "remaining_time": "1 day, 2:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6819, "total_steps": 17941, "loss": 1.4441, "learning_rate": 6.993230438070702e-05, "epoch": 0.3800791483194917, "percentage": 38.01, "elapsed_time": "16:08:03", "remaining_time": "1 day, 2:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6820, "total_steps": 17941, "loss": 1.6603, "learning_rate": 6.99241379464239e-05, "epoch": 0.3801348865726548, "percentage": 38.01, "elapsed_time": "16:08:11", "remaining_time": "1 day, 2:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6821, "total_steps": 17941, "loss": 1.5785, "learning_rate": 6.991597088026327e-05, "epoch": 0.38019062482581795, "percentage": 38.02, "elapsed_time": "16:08:20", "remaining_time": "1 day, 2:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6822, "total_steps": 17941, "loss": 1.7017, "learning_rate": 6.990780318248416e-05, "epoch": 0.38024636307898113, "percentage": 38.02, "elapsed_time": "16:08:28", "remaining_time": "1 day, 2:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6823, "total_steps": 17941, "loss": 1.7205, "learning_rate": 6.989963485334562e-05, "epoch": 0.38030210133214426, "percentage": 38.03, "elapsed_time": "16:08:36", "remaining_time": "1 day, 2:18:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6824, "total_steps": 17941, "loss": 1.8499, "learning_rate": 6.989146589310667e-05, "epoch": 0.3803578395853074, "percentage": 38.04, "elapsed_time": "16:08:45", "remaining_time": "1 day, 2:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6825, "total_steps": 17941, "loss": 1.7783, "learning_rate": 6.988329630202641e-05, "epoch": 0.3804135778384705, "percentage": 38.04, "elapsed_time": "16:08:53", "remaining_time": "1 day, 2:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6826, "total_steps": 17941, "loss": 1.6106, "learning_rate": 6.98751260803639e-05, "epoch": 0.3804693160916337, "percentage": 38.05, "elapsed_time": "16:09:02", "remaining_time": "1 day, 2:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6827, "total_steps": 17941, "loss": 1.652, "learning_rate": 6.98669552283783e-05, "epoch": 0.38052505434479683, "percentage": 38.05, "elapsed_time": "16:09:11", "remaining_time": "1 day, 2:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6828, "total_steps": 17941, "loss": 1.6075, "learning_rate": 6.98587837463287e-05, "epoch": 0.38058079259795996, "percentage": 38.06, "elapsed_time": "16:09:20", "remaining_time": "1 day, 2:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6829, "total_steps": 17941, "loss": 1.7205, "learning_rate": 6.985061163447426e-05, "epoch": 0.38063653085112314, "percentage": 38.06, "elapsed_time": "16:09:28", "remaining_time": "1 day, 2:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6830, "total_steps": 17941, "loss": 1.605, "learning_rate": 6.984243889307415e-05, "epoch": 0.3806922691042863, "percentage": 38.07, "elapsed_time": "16:09:37", "remaining_time": "1 day, 2:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6831, "total_steps": 17941, "loss": 1.6532, "learning_rate": 6.983426552238756e-05, "epoch": 0.3807480073574494, "percentage": 38.07, "elapsed_time": "16:09:45", "remaining_time": "1 day, 2:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6832, "total_steps": 17941, "loss": 1.856, "learning_rate": 6.982609152267374e-05, "epoch": 0.3808037456106126, "percentage": 38.08, "elapsed_time": "16:09:54", "remaining_time": "1 day, 2:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6833, "total_steps": 17941, "loss": 1.5632, "learning_rate": 6.981791689419186e-05, "epoch": 0.3808594838637757, "percentage": 38.09, "elapsed_time": "16:10:03", "remaining_time": "1 day, 2:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6834, "total_steps": 17941, "loss": 1.648, "learning_rate": 6.980974163720123e-05, "epoch": 0.38091522211693885, "percentage": 38.09, "elapsed_time": "16:10:11", "remaining_time": "1 day, 2:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6835, "total_steps": 17941, "loss": 1.7048, "learning_rate": 6.980156575196107e-05, "epoch": 0.380970960370102, "percentage": 38.1, "elapsed_time": "16:10:19", "remaining_time": "1 day, 2:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6836, "total_steps": 17941, "loss": 1.7984, "learning_rate": 6.979338923873073e-05, "epoch": 0.38102669862326516, "percentage": 38.1, "elapsed_time": "16:10:28", "remaining_time": "1 day, 2:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6837, "total_steps": 17941, "loss": 1.6214, "learning_rate": 6.978521209776945e-05, "epoch": 0.3810824368764283, "percentage": 38.11, "elapsed_time": "16:10:36", "remaining_time": "1 day, 2:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6838, "total_steps": 17941, "loss": 1.5048, "learning_rate": 6.977703432933661e-05, "epoch": 0.3811381751295914, "percentage": 38.11, "elapsed_time": "16:10:45", "remaining_time": "1 day, 2:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6839, "total_steps": 17941, "loss": 1.4111, "learning_rate": 6.976885593369155e-05, "epoch": 0.3811939133827546, "percentage": 38.12, "elapsed_time": "16:10:54", "remaining_time": "1 day, 2:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6840, "total_steps": 17941, "loss": 1.6715, "learning_rate": 6.976067691109365e-05, "epoch": 0.38124965163591773, "percentage": 38.12, "elapsed_time": "16:11:02", "remaining_time": "1 day, 2:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6841, "total_steps": 17941, "loss": 1.586, "learning_rate": 6.975249726180227e-05, "epoch": 0.38130538988908086, "percentage": 38.13, "elapsed_time": "16:11:11", "remaining_time": "1 day, 2:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6842, "total_steps": 17941, "loss": 1.8532, "learning_rate": 6.974431698607686e-05, "epoch": 0.38136112814224404, "percentage": 38.14, "elapsed_time": "16:11:19", "remaining_time": "1 day, 2:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6843, "total_steps": 17941, "loss": 1.8658, "learning_rate": 6.973613608417683e-05, "epoch": 0.3814168663954072, "percentage": 38.14, "elapsed_time": "16:11:28", "remaining_time": "1 day, 2:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6844, "total_steps": 17941, "loss": 1.5298, "learning_rate": 6.972795455636163e-05, "epoch": 0.3814726046485703, "percentage": 38.15, "elapsed_time": "16:11:36", "remaining_time": "1 day, 2:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6845, "total_steps": 17941, "loss": 1.7494, "learning_rate": 6.971977240289073e-05, "epoch": 0.3815283429017335, "percentage": 38.15, "elapsed_time": "16:11:45", "remaining_time": "1 day, 2:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6846, "total_steps": 17941, "loss": 1.9495, "learning_rate": 6.971158962402362e-05, "epoch": 0.3815840811548966, "percentage": 38.16, "elapsed_time": "16:11:54", "remaining_time": "1 day, 2:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6847, "total_steps": 17941, "loss": 1.6167, "learning_rate": 6.970340622001983e-05, "epoch": 0.38163981940805974, "percentage": 38.16, "elapsed_time": "16:12:02", "remaining_time": "1 day, 2:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6848, "total_steps": 17941, "loss": 1.7636, "learning_rate": 6.969522219113886e-05, "epoch": 0.3816955576612229, "percentage": 38.17, "elapsed_time": "16:12:11", "remaining_time": "1 day, 2:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6849, "total_steps": 17941, "loss": 1.779, "learning_rate": 6.968703753764027e-05, "epoch": 0.38175129591438606, "percentage": 38.18, "elapsed_time": "16:12:19", "remaining_time": "1 day, 2:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6850, "total_steps": 17941, "loss": 1.5693, "learning_rate": 6.967885225978365e-05, "epoch": 0.3818070341675492, "percentage": 38.18, "elapsed_time": "16:12:28", "remaining_time": "1 day, 2:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6851, "total_steps": 17941, "loss": 1.8075, "learning_rate": 6.967066635782855e-05, "epoch": 0.3818627724207123, "percentage": 38.19, "elapsed_time": "16:12:36", "remaining_time": "1 day, 2:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6852, "total_steps": 17941, "loss": 1.8192, "learning_rate": 6.966247983203462e-05, "epoch": 0.3819185106738755, "percentage": 38.19, "elapsed_time": "16:12:45", "remaining_time": "1 day, 2:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6853, "total_steps": 17941, "loss": 1.5787, "learning_rate": 6.965429268266147e-05, "epoch": 0.38197424892703863, "percentage": 38.2, "elapsed_time": "16:12:54", "remaining_time": "1 day, 2:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6854, "total_steps": 17941, "loss": 1.7935, "learning_rate": 6.964610490996874e-05, "epoch": 0.38202998718020176, "percentage": 38.2, "elapsed_time": "16:13:03", "remaining_time": "1 day, 2:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6855, "total_steps": 17941, "loss": 1.6204, "learning_rate": 6.963791651421612e-05, "epoch": 0.38208572543336494, "percentage": 38.21, "elapsed_time": "16:13:12", "remaining_time": "1 day, 2:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6856, "total_steps": 17941, "loss": 1.6198, "learning_rate": 6.962972749566326e-05, "epoch": 0.38214146368652807, "percentage": 38.21, "elapsed_time": "16:13:20", "remaining_time": "1 day, 2:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6857, "total_steps": 17941, "loss": 1.3949, "learning_rate": 6.962153785456991e-05, "epoch": 0.3821972019396912, "percentage": 38.22, "elapsed_time": "16:13:29", "remaining_time": "1 day, 2:13:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6858, "total_steps": 17941, "loss": 1.7137, "learning_rate": 6.961334759119577e-05, "epoch": 0.38225294019285433, "percentage": 38.23, "elapsed_time": "16:13:37", "remaining_time": "1 day, 2:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6859, "total_steps": 17941, "loss": 1.809, "learning_rate": 6.960515670580061e-05, "epoch": 0.3823086784460175, "percentage": 38.23, "elapsed_time": "16:13:46", "remaining_time": "1 day, 2:13:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6860, "total_steps": 17941, "loss": 1.8777, "learning_rate": 6.959696519864418e-05, "epoch": 0.38236441669918064, "percentage": 38.24, "elapsed_time": "16:13:54", "remaining_time": "1 day, 2:13:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6861, "total_steps": 17941, "loss": 1.7168, "learning_rate": 6.958877306998627e-05, "epoch": 0.38242015495234377, "percentage": 38.24, "elapsed_time": "16:14:02", "remaining_time": "1 day, 2:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6862, "total_steps": 17941, "loss": 1.7136, "learning_rate": 6.95805803200867e-05, "epoch": 0.38247589320550696, "percentage": 38.25, "elapsed_time": "16:14:11", "remaining_time": "1 day, 2:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6863, "total_steps": 17941, "loss": 1.7348, "learning_rate": 6.957238694920527e-05, "epoch": 0.3825316314586701, "percentage": 38.25, "elapsed_time": "16:14:19", "remaining_time": "1 day, 2:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6864, "total_steps": 17941, "loss": 1.8087, "learning_rate": 6.956419295760184e-05, "epoch": 0.3825873697118332, "percentage": 38.26, "elapsed_time": "16:14:28", "remaining_time": "1 day, 2:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6865, "total_steps": 17941, "loss": 1.226, "learning_rate": 6.95559983455363e-05, "epoch": 0.3826431079649964, "percentage": 38.26, "elapsed_time": "16:14:36", "remaining_time": "1 day, 2:12:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6866, "total_steps": 17941, "loss": 1.6166, "learning_rate": 6.954780311326849e-05, "epoch": 0.3826988462181595, "percentage": 38.27, "elapsed_time": "16:14:45", "remaining_time": "1 day, 2:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6867, "total_steps": 17941, "loss": 1.6143, "learning_rate": 6.953960726105835e-05, "epoch": 0.38275458447132266, "percentage": 38.28, "elapsed_time": "16:14:53", "remaining_time": "1 day, 2:12:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6868, "total_steps": 17941, "loss": 1.8417, "learning_rate": 6.953141078916578e-05, "epoch": 0.38281032272448584, "percentage": 38.28, "elapsed_time": "16:15:02", "remaining_time": "1 day, 2:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6869, "total_steps": 17941, "loss": 1.6908, "learning_rate": 6.952321369785075e-05, "epoch": 0.38286606097764897, "percentage": 38.29, "elapsed_time": "16:15:10", "remaining_time": "1 day, 2:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6870, "total_steps": 17941, "loss": 1.9328, "learning_rate": 6.951501598737318e-05, "epoch": 0.3829217992308121, "percentage": 38.29, "elapsed_time": "16:15:19", "remaining_time": "1 day, 2:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6871, "total_steps": 17941, "loss": 1.7226, "learning_rate": 6.95068176579931e-05, "epoch": 0.38297753748397523, "percentage": 38.3, "elapsed_time": "16:15:27", "remaining_time": "1 day, 2:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6872, "total_steps": 17941, "loss": 1.8162, "learning_rate": 6.94986187099705e-05, "epoch": 0.3830332757371384, "percentage": 38.3, "elapsed_time": "16:15:36", "remaining_time": "1 day, 2:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6873, "total_steps": 17941, "loss": 1.5981, "learning_rate": 6.949041914356541e-05, "epoch": 0.38308901399030154, "percentage": 38.31, "elapsed_time": "16:15:44", "remaining_time": "1 day, 2:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6874, "total_steps": 17941, "loss": 1.688, "learning_rate": 6.948221895903784e-05, "epoch": 0.38314475224346467, "percentage": 38.31, "elapsed_time": "16:15:53", "remaining_time": "1 day, 2:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6875, "total_steps": 17941, "loss": 1.6411, "learning_rate": 6.94740181566479e-05, "epoch": 0.38320049049662785, "percentage": 38.32, "elapsed_time": "16:16:01", "remaining_time": "1 day, 2:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6876, "total_steps": 17941, "loss": 1.3411, "learning_rate": 6.946581673665561e-05, "epoch": 0.383256228749791, "percentage": 38.33, "elapsed_time": "16:16:10", "remaining_time": "1 day, 2:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6877, "total_steps": 17941, "loss": 1.5896, "learning_rate": 6.945761469932114e-05, "epoch": 0.3833119670029541, "percentage": 38.33, "elapsed_time": "16:16:18", "remaining_time": "1 day, 2:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6878, "total_steps": 17941, "loss": 1.7555, "learning_rate": 6.944941204490456e-05, "epoch": 0.3833677052561173, "percentage": 38.34, "elapsed_time": "16:16:26", "remaining_time": "1 day, 2:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6879, "total_steps": 17941, "loss": 1.8117, "learning_rate": 6.944120877366604e-05, "epoch": 0.3834234435092804, "percentage": 38.34, "elapsed_time": "16:16:35", "remaining_time": "1 day, 2:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6880, "total_steps": 17941, "loss": 1.5363, "learning_rate": 6.943300488586572e-05, "epoch": 0.38347918176244356, "percentage": 38.35, "elapsed_time": "16:16:44", "remaining_time": "1 day, 2:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6881, "total_steps": 17941, "loss": 1.4549, "learning_rate": 6.942480038176379e-05, "epoch": 0.3835349200156067, "percentage": 38.35, "elapsed_time": "16:16:52", "remaining_time": "1 day, 2:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6882, "total_steps": 17941, "loss": 1.5041, "learning_rate": 6.941659526162045e-05, "epoch": 0.38359065826876987, "percentage": 38.36, "elapsed_time": "16:17:00", "remaining_time": "1 day, 2:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6883, "total_steps": 17941, "loss": 1.8509, "learning_rate": 6.940838952569589e-05, "epoch": 0.383646396521933, "percentage": 38.36, "elapsed_time": "16:17:09", "remaining_time": "1 day, 2:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6884, "total_steps": 17941, "loss": 1.6337, "learning_rate": 6.94001831742504e-05, "epoch": 0.3837021347750961, "percentage": 38.37, "elapsed_time": "16:17:17", "remaining_time": "1 day, 2:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6885, "total_steps": 17941, "loss": 1.6887, "learning_rate": 6.939197620754419e-05, "epoch": 0.3837578730282593, "percentage": 38.38, "elapsed_time": "16:17:26", "remaining_time": "1 day, 2:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6886, "total_steps": 17941, "loss": 1.6762, "learning_rate": 6.938376862583757e-05, "epoch": 0.38381361128142244, "percentage": 38.38, "elapsed_time": "16:17:34", "remaining_time": "1 day, 2:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6887, "total_steps": 17941, "loss": 1.5778, "learning_rate": 6.937556042939083e-05, "epoch": 0.38386934953458557, "percentage": 38.39, "elapsed_time": "16:17:43", "remaining_time": "1 day, 2:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6888, "total_steps": 17941, "loss": 1.6806, "learning_rate": 6.936735161846429e-05, "epoch": 0.38392508778774875, "percentage": 38.39, "elapsed_time": "16:17:51", "remaining_time": "1 day, 2:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6889, "total_steps": 17941, "loss": 1.5607, "learning_rate": 6.935914219331825e-05, "epoch": 0.3839808260409119, "percentage": 38.4, "elapsed_time": "16:18:00", "remaining_time": "1 day, 2:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6890, "total_steps": 17941, "loss": 1.6835, "learning_rate": 6.93509321542131e-05, "epoch": 0.384036564294075, "percentage": 38.4, "elapsed_time": "16:18:08", "remaining_time": "1 day, 2:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6891, "total_steps": 17941, "loss": 1.3228, "learning_rate": 6.934272150140921e-05, "epoch": 0.3840923025472382, "percentage": 38.41, "elapsed_time": "16:18:17", "remaining_time": "1 day, 2:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6892, "total_steps": 17941, "loss": 1.6331, "learning_rate": 6.933451023516697e-05, "epoch": 0.3841480408004013, "percentage": 38.41, "elapsed_time": "16:18:25", "remaining_time": "1 day, 2:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6893, "total_steps": 17941, "loss": 1.7666, "learning_rate": 6.932629835574679e-05, "epoch": 0.38420377905356445, "percentage": 38.42, "elapsed_time": "16:18:33", "remaining_time": "1 day, 2:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6894, "total_steps": 17941, "loss": 1.5809, "learning_rate": 6.93180858634091e-05, "epoch": 0.3842595173067276, "percentage": 38.43, "elapsed_time": "16:18:42", "remaining_time": "1 day, 2:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6895, "total_steps": 17941, "loss": 1.7695, "learning_rate": 6.930987275841439e-05, "epoch": 0.38431525555989077, "percentage": 38.43, "elapsed_time": "16:18:50", "remaining_time": "1 day, 2:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6896, "total_steps": 17941, "loss": 1.8917, "learning_rate": 6.930165904102305e-05, "epoch": 0.3843709938130539, "percentage": 38.44, "elapsed_time": "16:18:59", "remaining_time": "1 day, 2:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6897, "total_steps": 17941, "loss": 1.8922, "learning_rate": 6.929344471149566e-05, "epoch": 0.384426732066217, "percentage": 38.44, "elapsed_time": "16:19:07", "remaining_time": "1 day, 2:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6898, "total_steps": 17941, "loss": 1.6488, "learning_rate": 6.928522977009268e-05, "epoch": 0.3844824703193802, "percentage": 38.45, "elapsed_time": "16:19:16", "remaining_time": "1 day, 2:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6899, "total_steps": 17941, "loss": 1.6886, "learning_rate": 6.927701421707466e-05, "epoch": 0.38453820857254334, "percentage": 38.45, "elapsed_time": "16:19:24", "remaining_time": "1 day, 2:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6900, "total_steps": 17941, "loss": 1.6532, "learning_rate": 6.926879805270212e-05, "epoch": 0.38459394682570647, "percentage": 38.46, "elapsed_time": "16:19:33", "remaining_time": "1 day, 2:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6901, "total_steps": 17941, "loss": 1.6202, "learning_rate": 6.926058127723568e-05, "epoch": 0.38464968507886965, "percentage": 38.46, "elapsed_time": "16:19:41", "remaining_time": "1 day, 2:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6902, "total_steps": 17941, "loss": 1.1835, "learning_rate": 6.925236389093588e-05, "epoch": 0.3847054233320328, "percentage": 38.47, "elapsed_time": "16:19:50", "remaining_time": "1 day, 2:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6903, "total_steps": 17941, "loss": 1.9214, "learning_rate": 6.924414589406335e-05, "epoch": 0.3847611615851959, "percentage": 38.48, "elapsed_time": "16:19:58", "remaining_time": "1 day, 2:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6904, "total_steps": 17941, "loss": 1.8236, "learning_rate": 6.923592728687871e-05, "epoch": 0.38481689983835904, "percentage": 38.48, "elapsed_time": "16:20:07", "remaining_time": "1 day, 2:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6905, "total_steps": 17941, "loss": 1.5128, "learning_rate": 6.922770806964263e-05, "epoch": 0.3848726380915222, "percentage": 38.49, "elapsed_time": "16:20:15", "remaining_time": "1 day, 2:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6906, "total_steps": 17941, "loss": 1.5956, "learning_rate": 6.921948824261573e-05, "epoch": 0.38492837634468535, "percentage": 38.49, "elapsed_time": "16:20:24", "remaining_time": "1 day, 2:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6907, "total_steps": 17941, "loss": 1.5846, "learning_rate": 6.921126780605873e-05, "epoch": 0.3849841145978485, "percentage": 38.5, "elapsed_time": "16:20:32", "remaining_time": "1 day, 2:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6908, "total_steps": 17941, "loss": 1.6645, "learning_rate": 6.920304676023233e-05, "epoch": 0.38503985285101167, "percentage": 38.5, "elapsed_time": "16:20:41", "remaining_time": "1 day, 2:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6909, "total_steps": 17941, "loss": 1.6028, "learning_rate": 6.919482510539723e-05, "epoch": 0.3850955911041748, "percentage": 38.51, "elapsed_time": "16:20:49", "remaining_time": "1 day, 2:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6910, "total_steps": 17941, "loss": 1.7378, "learning_rate": 6.918660284181421e-05, "epoch": 0.3851513293573379, "percentage": 38.52, "elapsed_time": "16:20:58", "remaining_time": "1 day, 2:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6911, "total_steps": 17941, "loss": 1.8591, "learning_rate": 6.9178379969744e-05, "epoch": 0.3852070676105011, "percentage": 38.52, "elapsed_time": "16:21:07", "remaining_time": "1 day, 2:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6912, "total_steps": 17941, "loss": 1.527, "learning_rate": 6.917015648944741e-05, "epoch": 0.38526280586366424, "percentage": 38.53, "elapsed_time": "16:21:15", "remaining_time": "1 day, 2:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6913, "total_steps": 17941, "loss": 1.6982, "learning_rate": 6.916193240118522e-05, "epoch": 0.38531854411682737, "percentage": 38.53, "elapsed_time": "16:21:24", "remaining_time": "1 day, 2:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6914, "total_steps": 17941, "loss": 1.6709, "learning_rate": 6.915370770521825e-05, "epoch": 0.38537428236999055, "percentage": 38.54, "elapsed_time": "16:21:32", "remaining_time": "1 day, 2:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6915, "total_steps": 17941, "loss": 1.8178, "learning_rate": 6.914548240180736e-05, "epoch": 0.3854300206231537, "percentage": 38.54, "elapsed_time": "16:21:41", "remaining_time": "1 day, 2:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6916, "total_steps": 17941, "loss": 1.8038, "learning_rate": 6.913725649121337e-05, "epoch": 0.3854857588763168, "percentage": 38.55, "elapsed_time": "16:21:49", "remaining_time": "1 day, 2:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6917, "total_steps": 17941, "loss": 1.7155, "learning_rate": 6.91290299736972e-05, "epoch": 0.38554149712947994, "percentage": 38.55, "elapsed_time": "16:21:58", "remaining_time": "1 day, 2:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6918, "total_steps": 17941, "loss": 1.7316, "learning_rate": 6.912080284951972e-05, "epoch": 0.3855972353826431, "percentage": 38.56, "elapsed_time": "16:22:06", "remaining_time": "1 day, 2:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6919, "total_steps": 17941, "loss": 1.7607, "learning_rate": 6.911257511894188e-05, "epoch": 0.38565297363580625, "percentage": 38.57, "elapsed_time": "16:22:14", "remaining_time": "1 day, 2:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6920, "total_steps": 17941, "loss": 1.8731, "learning_rate": 6.910434678222457e-05, "epoch": 0.3857087118889694, "percentage": 38.57, "elapsed_time": "16:22:23", "remaining_time": "1 day, 2:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6921, "total_steps": 17941, "loss": 1.3704, "learning_rate": 6.909611783962877e-05, "epoch": 0.38576445014213256, "percentage": 38.58, "elapsed_time": "16:22:31", "remaining_time": "1 day, 2:04:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6922, "total_steps": 17941, "loss": 1.6253, "learning_rate": 6.908788829141544e-05, "epoch": 0.3858201883952957, "percentage": 38.58, "elapsed_time": "16:22:40", "remaining_time": "1 day, 2:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6923, "total_steps": 17941, "loss": 1.9226, "learning_rate": 6.907965813784558e-05, "epoch": 0.3858759266484588, "percentage": 38.59, "elapsed_time": "16:22:48", "remaining_time": "1 day, 2:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6924, "total_steps": 17941, "loss": 1.5934, "learning_rate": 6.907142737918023e-05, "epoch": 0.385931664901622, "percentage": 38.59, "elapsed_time": "16:22:57", "remaining_time": "1 day, 2:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6925, "total_steps": 17941, "loss": 1.8197, "learning_rate": 6.906319601568038e-05, "epoch": 0.38598740315478514, "percentage": 38.6, "elapsed_time": "16:23:05", "remaining_time": "1 day, 2:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6926, "total_steps": 17941, "loss": 1.9775, "learning_rate": 6.90549640476071e-05, "epoch": 0.38604314140794826, "percentage": 38.6, "elapsed_time": "16:23:14", "remaining_time": "1 day, 2:03:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6927, "total_steps": 17941, "loss": 1.9008, "learning_rate": 6.904673147522147e-05, "epoch": 0.3860988796611114, "percentage": 38.61, "elapsed_time": "16:23:22", "remaining_time": "1 day, 2:03:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6928, "total_steps": 17941, "loss": 1.9632, "learning_rate": 6.903849829878457e-05, "epoch": 0.3861546179142746, "percentage": 38.62, "elapsed_time": "16:23:31", "remaining_time": "1 day, 2:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6929, "total_steps": 17941, "loss": 1.7489, "learning_rate": 6.903026451855748e-05, "epoch": 0.3862103561674377, "percentage": 38.62, "elapsed_time": "16:23:39", "remaining_time": "1 day, 2:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6930, "total_steps": 17941, "loss": 1.7719, "learning_rate": 6.902203013480137e-05, "epoch": 0.38626609442060084, "percentage": 38.63, "elapsed_time": "16:23:48", "remaining_time": "1 day, 2:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6931, "total_steps": 17941, "loss": 1.5504, "learning_rate": 6.901379514777739e-05, "epoch": 0.386321832673764, "percentage": 38.63, "elapsed_time": "16:23:56", "remaining_time": "1 day, 2:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6932, "total_steps": 17941, "loss": 1.6045, "learning_rate": 6.900555955774666e-05, "epoch": 0.38637757092692715, "percentage": 38.64, "elapsed_time": "16:24:05", "remaining_time": "1 day, 2:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6933, "total_steps": 17941, "loss": 1.7366, "learning_rate": 6.899732336497038e-05, "epoch": 0.3864333091800903, "percentage": 38.64, "elapsed_time": "16:24:14", "remaining_time": "1 day, 2:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6934, "total_steps": 17941, "loss": 1.3954, "learning_rate": 6.898908656970979e-05, "epoch": 0.38648904743325346, "percentage": 38.65, "elapsed_time": "16:24:22", "remaining_time": "1 day, 2:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6935, "total_steps": 17941, "loss": 1.791, "learning_rate": 6.898084917222609e-05, "epoch": 0.3865447856864166, "percentage": 38.65, "elapsed_time": "16:24:31", "remaining_time": "1 day, 2:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6936, "total_steps": 17941, "loss": 1.7835, "learning_rate": 6.89726111727805e-05, "epoch": 0.3866005239395797, "percentage": 38.66, "elapsed_time": "16:24:39", "remaining_time": "1 day, 2:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6937, "total_steps": 17941, "loss": 1.651, "learning_rate": 6.896437257163432e-05, "epoch": 0.3866562621927429, "percentage": 38.67, "elapsed_time": "16:24:48", "remaining_time": "1 day, 2:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6938, "total_steps": 17941, "loss": 1.8836, "learning_rate": 6.89561333690488e-05, "epoch": 0.38671200044590603, "percentage": 38.67, "elapsed_time": "16:24:56", "remaining_time": "1 day, 2:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6939, "total_steps": 17941, "loss": 1.5643, "learning_rate": 6.894789356528526e-05, "epoch": 0.38676773869906916, "percentage": 38.68, "elapsed_time": "16:25:04", "remaining_time": "1 day, 2:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6940, "total_steps": 17941, "loss": 1.6483, "learning_rate": 6.893965316060501e-05, "epoch": 0.3868234769522323, "percentage": 38.68, "elapsed_time": "16:25:13", "remaining_time": "1 day, 2:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6941, "total_steps": 17941, "loss": 1.5949, "learning_rate": 6.893141215526938e-05, "epoch": 0.3868792152053955, "percentage": 38.69, "elapsed_time": "16:25:22", "remaining_time": "1 day, 2:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6942, "total_steps": 17941, "loss": 1.7971, "learning_rate": 6.892317054953975e-05, "epoch": 0.3869349534585586, "percentage": 38.69, "elapsed_time": "16:25:30", "remaining_time": "1 day, 2:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6943, "total_steps": 17941, "loss": 1.8339, "learning_rate": 6.891492834367746e-05, "epoch": 0.38699069171172173, "percentage": 38.7, "elapsed_time": "16:25:39", "remaining_time": "1 day, 2:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6944, "total_steps": 17941, "loss": 1.6175, "learning_rate": 6.890668553794392e-05, "epoch": 0.3870464299648849, "percentage": 38.7, "elapsed_time": "16:25:48", "remaining_time": "1 day, 2:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6945, "total_steps": 17941, "loss": 1.7679, "learning_rate": 6.889844213260057e-05, "epoch": 0.38710216821804805, "percentage": 38.71, "elapsed_time": "16:25:56", "remaining_time": "1 day, 2:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6946, "total_steps": 17941, "loss": 1.5769, "learning_rate": 6.88901981279088e-05, "epoch": 0.3871579064712112, "percentage": 38.72, "elapsed_time": "16:26:05", "remaining_time": "1 day, 2:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6947, "total_steps": 17941, "loss": 1.4678, "learning_rate": 6.88819535241301e-05, "epoch": 0.38721364472437436, "percentage": 38.72, "elapsed_time": "16:26:13", "remaining_time": "1 day, 2:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6948, "total_steps": 17941, "loss": 1.6784, "learning_rate": 6.887370832152592e-05, "epoch": 0.3872693829775375, "percentage": 38.73, "elapsed_time": "16:26:21", "remaining_time": "1 day, 2:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6949, "total_steps": 17941, "loss": 1.6139, "learning_rate": 6.886546252035775e-05, "epoch": 0.3873251212307006, "percentage": 38.73, "elapsed_time": "16:26:30", "remaining_time": "1 day, 2:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6950, "total_steps": 17941, "loss": 1.8137, "learning_rate": 6.88572161208871e-05, "epoch": 0.38738085948386375, "percentage": 38.74, "elapsed_time": "16:26:38", "remaining_time": "1 day, 2:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6951, "total_steps": 17941, "loss": 1.5237, "learning_rate": 6.88489691233755e-05, "epoch": 0.38743659773702693, "percentage": 38.74, "elapsed_time": "16:26:47", "remaining_time": "1 day, 2:00:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6952, "total_steps": 17941, "loss": 1.686, "learning_rate": 6.884072152808451e-05, "epoch": 0.38749233599019006, "percentage": 38.75, "elapsed_time": "16:26:55", "remaining_time": "1 day, 2:00:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6953, "total_steps": 17941, "loss": 1.9771, "learning_rate": 6.883247333527567e-05, "epoch": 0.3875480742433532, "percentage": 38.75, "elapsed_time": "16:27:04", "remaining_time": "1 day, 1:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6954, "total_steps": 17941, "loss": 1.7549, "learning_rate": 6.882422454521058e-05, "epoch": 0.3876038124965164, "percentage": 38.76, "elapsed_time": "16:27:12", "remaining_time": "1 day, 1:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6955, "total_steps": 17941, "loss": 1.7045, "learning_rate": 6.881597515815084e-05, "epoch": 0.3876595507496795, "percentage": 38.77, "elapsed_time": "16:27:20", "remaining_time": "1 day, 1:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6956, "total_steps": 17941, "loss": 1.5901, "learning_rate": 6.880772517435807e-05, "epoch": 0.38771528900284263, "percentage": 38.77, "elapsed_time": "16:27:29", "remaining_time": "1 day, 1:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6957, "total_steps": 17941, "loss": 1.5849, "learning_rate": 6.879947459409393e-05, "epoch": 0.3877710272560058, "percentage": 38.78, "elapsed_time": "16:27:37", "remaining_time": "1 day, 1:59:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6958, "total_steps": 17941, "loss": 1.8152, "learning_rate": 6.879122341762003e-05, "epoch": 0.38782676550916895, "percentage": 38.78, "elapsed_time": "16:27:46", "remaining_time": "1 day, 1:59:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6959, "total_steps": 17941, "loss": 1.7573, "learning_rate": 6.878297164519812e-05, "epoch": 0.3878825037623321, "percentage": 38.79, "elapsed_time": "16:27:54", "remaining_time": "1 day, 1:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6960, "total_steps": 17941, "loss": 1.7487, "learning_rate": 6.877471927708985e-05, "epoch": 0.38793824201549526, "percentage": 38.79, "elapsed_time": "16:28:03", "remaining_time": "1 day, 1:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6961, "total_steps": 17941, "loss": 1.8512, "learning_rate": 6.876646631355693e-05, "epoch": 0.3879939802686584, "percentage": 38.8, "elapsed_time": "16:28:11", "remaining_time": "1 day, 1:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6962, "total_steps": 17941, "loss": 2.1185, "learning_rate": 6.875821275486113e-05, "epoch": 0.3880497185218215, "percentage": 38.8, "elapsed_time": "16:28:20", "remaining_time": "1 day, 1:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6963, "total_steps": 17941, "loss": 1.6607, "learning_rate": 6.874995860126419e-05, "epoch": 0.38810545677498465, "percentage": 38.81, "elapsed_time": "16:28:28", "remaining_time": "1 day, 1:58:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6964, "total_steps": 17941, "loss": 1.4841, "learning_rate": 6.874170385302789e-05, "epoch": 0.38816119502814783, "percentage": 38.82, "elapsed_time": "16:28:37", "remaining_time": "1 day, 1:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6965, "total_steps": 17941, "loss": 1.7557, "learning_rate": 6.8733448510414e-05, "epoch": 0.38821693328131096, "percentage": 38.82, "elapsed_time": "16:28:45", "remaining_time": "1 day, 1:58:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6966, "total_steps": 17941, "loss": 1.7722, "learning_rate": 6.872519257368437e-05, "epoch": 0.3882726715344741, "percentage": 38.83, "elapsed_time": "16:28:54", "remaining_time": "1 day, 1:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6967, "total_steps": 17941, "loss": 1.8058, "learning_rate": 6.871693604310077e-05, "epoch": 0.3883284097876373, "percentage": 38.83, "elapsed_time": "16:29:02", "remaining_time": "1 day, 1:57:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6968, "total_steps": 17941, "loss": 1.8542, "learning_rate": 6.87086789189251e-05, "epoch": 0.3883841480408004, "percentage": 38.84, "elapsed_time": "16:29:10", "remaining_time": "1 day, 1:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6969, "total_steps": 17941, "loss": 1.7221, "learning_rate": 6.870042120141923e-05, "epoch": 0.38843988629396353, "percentage": 38.84, "elapsed_time": "16:29:19", "remaining_time": "1 day, 1:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6970, "total_steps": 17941, "loss": 1.5492, "learning_rate": 6.869216289084503e-05, "epoch": 0.3884956245471267, "percentage": 38.85, "elapsed_time": "16:29:27", "remaining_time": "1 day, 1:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6971, "total_steps": 17941, "loss": 1.4507, "learning_rate": 6.86839039874644e-05, "epoch": 0.38855136280028985, "percentage": 38.86, "elapsed_time": "16:29:36", "remaining_time": "1 day, 1:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6972, "total_steps": 17941, "loss": 1.7683, "learning_rate": 6.867564449153925e-05, "epoch": 0.388607101053453, "percentage": 38.86, "elapsed_time": "16:29:44", "remaining_time": "1 day, 1:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6973, "total_steps": 17941, "loss": 1.7076, "learning_rate": 6.866738440333157e-05, "epoch": 0.3886628393066161, "percentage": 38.87, "elapsed_time": "16:29:53", "remaining_time": "1 day, 1:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6974, "total_steps": 17941, "loss": 1.542, "learning_rate": 6.865912372310328e-05, "epoch": 0.3887185775597793, "percentage": 38.87, "elapsed_time": "16:30:02", "remaining_time": "1 day, 1:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6975, "total_steps": 17941, "loss": 1.6909, "learning_rate": 6.865086245111638e-05, "epoch": 0.3887743158129424, "percentage": 38.88, "elapsed_time": "16:30:10", "remaining_time": "1 day, 1:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6976, "total_steps": 17941, "loss": 1.8409, "learning_rate": 6.864260058763286e-05, "epoch": 0.38883005406610555, "percentage": 38.88, "elapsed_time": "16:30:19", "remaining_time": "1 day, 1:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6977, "total_steps": 17941, "loss": 1.5931, "learning_rate": 6.863433813291477e-05, "epoch": 0.38888579231926873, "percentage": 38.89, "elapsed_time": "16:30:28", "remaining_time": "1 day, 1:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6978, "total_steps": 17941, "loss": 1.7741, "learning_rate": 6.86260750872241e-05, "epoch": 0.38894153057243186, "percentage": 38.89, "elapsed_time": "16:30:36", "remaining_time": "1 day, 1:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6979, "total_steps": 17941, "loss": 1.6731, "learning_rate": 6.861781145082293e-05, "epoch": 0.388997268825595, "percentage": 38.9, "elapsed_time": "16:30:45", "remaining_time": "1 day, 1:56:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6980, "total_steps": 17941, "loss": 1.6809, "learning_rate": 6.860954722397332e-05, "epoch": 0.3890530070787582, "percentage": 38.91, "elapsed_time": "16:30:54", "remaining_time": "1 day, 1:56:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6981, "total_steps": 17941, "loss": 1.7078, "learning_rate": 6.860128240693737e-05, "epoch": 0.3891087453319213, "percentage": 38.91, "elapsed_time": "16:31:03", "remaining_time": "1 day, 1:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6982, "total_steps": 17941, "loss": 1.7694, "learning_rate": 6.85930169999772e-05, "epoch": 0.38916448358508443, "percentage": 38.92, "elapsed_time": "16:31:11", "remaining_time": "1 day, 1:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6983, "total_steps": 17941, "loss": 1.7516, "learning_rate": 6.858475100335496e-05, "epoch": 0.3892202218382476, "percentage": 38.92, "elapsed_time": "16:31:20", "remaining_time": "1 day, 1:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6984, "total_steps": 17941, "loss": 1.7409, "learning_rate": 6.857648441733275e-05, "epoch": 0.38927596009141074, "percentage": 38.93, "elapsed_time": "16:31:28", "remaining_time": "1 day, 1:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6985, "total_steps": 17941, "loss": 1.7237, "learning_rate": 6.856821724217276e-05, "epoch": 0.3893316983445739, "percentage": 38.93, "elapsed_time": "16:31:37", "remaining_time": "1 day, 1:55:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6986, "total_steps": 17941, "loss": 1.8842, "learning_rate": 6.855994947813719e-05, "epoch": 0.389387436597737, "percentage": 38.94, "elapsed_time": "16:31:45", "remaining_time": "1 day, 1:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6987, "total_steps": 17941, "loss": 1.8356, "learning_rate": 6.855168112548823e-05, "epoch": 0.3894431748509002, "percentage": 38.94, "elapsed_time": "16:31:53", "remaining_time": "1 day, 1:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6988, "total_steps": 17941, "loss": 2.1173, "learning_rate": 6.85434121844881e-05, "epoch": 0.3894989131040633, "percentage": 38.95, "elapsed_time": "16:32:02", "remaining_time": "1 day, 1:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6989, "total_steps": 17941, "loss": 1.6531, "learning_rate": 6.853514265539907e-05, "epoch": 0.38955465135722644, "percentage": 38.96, "elapsed_time": "16:32:10", "remaining_time": "1 day, 1:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6990, "total_steps": 17941, "loss": 1.7125, "learning_rate": 6.852687253848337e-05, "epoch": 0.38961038961038963, "percentage": 38.96, "elapsed_time": "16:32:19", "remaining_time": "1 day, 1:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6991, "total_steps": 17941, "loss": 1.8723, "learning_rate": 6.85186018340033e-05, "epoch": 0.38966612786355276, "percentage": 38.97, "elapsed_time": "16:32:27", "remaining_time": "1 day, 1:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6992, "total_steps": 17941, "loss": 1.9066, "learning_rate": 6.851033054222115e-05, "epoch": 0.3897218661167159, "percentage": 38.97, "elapsed_time": "16:32:36", "remaining_time": "1 day, 1:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6993, "total_steps": 17941, "loss": 1.6027, "learning_rate": 6.850205866339923e-05, "epoch": 0.38977760436987907, "percentage": 38.98, "elapsed_time": "16:32:45", "remaining_time": "1 day, 1:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6994, "total_steps": 17941, "loss": 1.7806, "learning_rate": 6.849378619779989e-05, "epoch": 0.3898333426230422, "percentage": 38.98, "elapsed_time": "16:32:53", "remaining_time": "1 day, 1:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6995, "total_steps": 17941, "loss": 1.8153, "learning_rate": 6.848551314568548e-05, "epoch": 0.38988908087620533, "percentage": 38.99, "elapsed_time": "16:33:01", "remaining_time": "1 day, 1:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6996, "total_steps": 17941, "loss": 1.7705, "learning_rate": 6.847723950731837e-05, "epoch": 0.38994481912936846, "percentage": 38.99, "elapsed_time": "16:33:10", "remaining_time": "1 day, 1:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6997, "total_steps": 17941, "loss": 1.6717, "learning_rate": 6.846896528296094e-05, "epoch": 0.39000055738253164, "percentage": 39.0, "elapsed_time": "16:33:18", "remaining_time": "1 day, 1:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6998, "total_steps": 17941, "loss": 1.6567, "learning_rate": 6.846069047287562e-05, "epoch": 0.39005629563569477, "percentage": 39.01, "elapsed_time": "16:33:27", "remaining_time": "1 day, 1:53:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6999, "total_steps": 17941, "loss": 1.3903, "learning_rate": 6.845241507732483e-05, "epoch": 0.3901120338888579, "percentage": 39.01, "elapsed_time": "16:33:35", "remaining_time": "1 day, 1:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7000, "total_steps": 17941, "loss": 1.8607, "learning_rate": 6.844413909657104e-05, "epoch": 0.3901677721420211, "percentage": 39.02, "elapsed_time": "16:33:44", "remaining_time": "1 day, 1:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7001, "total_steps": 17941, "loss": 1.6199, "learning_rate": 6.843586253087666e-05, "epoch": 0.3902235103951842, "percentage": 39.02, "elapsed_time": "16:33:52", "remaining_time": "1 day, 1:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7002, "total_steps": 17941, "loss": 1.5923, "learning_rate": 6.842758538050422e-05, "epoch": 0.39027924864834734, "percentage": 39.03, "elapsed_time": "16:34:00", "remaining_time": "1 day, 1:52:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7003, "total_steps": 17941, "loss": 1.6086, "learning_rate": 6.841930764571623e-05, "epoch": 0.39033498690151053, "percentage": 39.03, "elapsed_time": "16:34:09", "remaining_time": "1 day, 1:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7004, "total_steps": 17941, "loss": 1.8973, "learning_rate": 6.841102932677517e-05, "epoch": 0.39039072515467366, "percentage": 39.04, "elapsed_time": "16:34:17", "remaining_time": "1 day, 1:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7005, "total_steps": 17941, "loss": 1.4897, "learning_rate": 6.840275042394363e-05, "epoch": 0.3904464634078368, "percentage": 39.04, "elapsed_time": "16:34:26", "remaining_time": "1 day, 1:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7006, "total_steps": 17941, "loss": 1.7267, "learning_rate": 6.839447093748413e-05, "epoch": 0.39050220166099997, "percentage": 39.05, "elapsed_time": "16:34:34", "remaining_time": "1 day, 1:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7007, "total_steps": 17941, "loss": 1.9025, "learning_rate": 6.838619086765925e-05, "epoch": 0.3905579399141631, "percentage": 39.06, "elapsed_time": "16:34:43", "remaining_time": "1 day, 1:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7008, "total_steps": 17941, "loss": 1.6509, "learning_rate": 6.83779102147316e-05, "epoch": 0.39061367816732623, "percentage": 39.06, "elapsed_time": "16:34:52", "remaining_time": "1 day, 1:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7009, "total_steps": 17941, "loss": 1.6244, "learning_rate": 6.83696289789638e-05, "epoch": 0.39066941642048936, "percentage": 39.07, "elapsed_time": "16:35:00", "remaining_time": "1 day, 1:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7010, "total_steps": 17941, "loss": 1.7403, "learning_rate": 6.836134716061845e-05, "epoch": 0.39072515467365254, "percentage": 39.07, "elapsed_time": "16:35:09", "remaining_time": "1 day, 1:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7011, "total_steps": 17941, "loss": 1.6201, "learning_rate": 6.835306475995823e-05, "epoch": 0.39078089292681567, "percentage": 39.08, "elapsed_time": "16:35:17", "remaining_time": "1 day, 1:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7012, "total_steps": 17941, "loss": 1.5593, "learning_rate": 6.834478177724581e-05, "epoch": 0.3908366311799788, "percentage": 39.08, "elapsed_time": "16:35:26", "remaining_time": "1 day, 1:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7013, "total_steps": 17941, "loss": 1.6275, "learning_rate": 6.833649821274386e-05, "epoch": 0.390892369433142, "percentage": 39.09, "elapsed_time": "16:35:34", "remaining_time": "1 day, 1:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7014, "total_steps": 17941, "loss": 1.9288, "learning_rate": 6.83282140667151e-05, "epoch": 0.3909481076863051, "percentage": 39.09, "elapsed_time": "16:35:43", "remaining_time": "1 day, 1:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7015, "total_steps": 17941, "loss": 1.6756, "learning_rate": 6.831992933942225e-05, "epoch": 0.39100384593946824, "percentage": 39.1, "elapsed_time": "16:35:51", "remaining_time": "1 day, 1:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7016, "total_steps": 17941, "loss": 1.8422, "learning_rate": 6.831164403112806e-05, "epoch": 0.3910595841926314, "percentage": 39.11, "elapsed_time": "16:35:59", "remaining_time": "1 day, 1:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7017, "total_steps": 17941, "loss": 1.407, "learning_rate": 6.830335814209527e-05, "epoch": 0.39111532244579456, "percentage": 39.11, "elapsed_time": "16:36:08", "remaining_time": "1 day, 1:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7018, "total_steps": 17941, "loss": 1.7507, "learning_rate": 6.829507167258671e-05, "epoch": 0.3911710606989577, "percentage": 39.12, "elapsed_time": "16:36:16", "remaining_time": "1 day, 1:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7019, "total_steps": 17941, "loss": 1.9612, "learning_rate": 6.828678462286511e-05, "epoch": 0.3912267989521208, "percentage": 39.12, "elapsed_time": "16:36:25", "remaining_time": "1 day, 1:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7020, "total_steps": 17941, "loss": 1.8656, "learning_rate": 6.827849699319333e-05, "epoch": 0.391282537205284, "percentage": 39.13, "elapsed_time": "16:36:33", "remaining_time": "1 day, 1:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7021, "total_steps": 17941, "loss": 1.6849, "learning_rate": 6.827020878383418e-05, "epoch": 0.3913382754584471, "percentage": 39.13, "elapsed_time": "16:36:42", "remaining_time": "1 day, 1:50:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7022, "total_steps": 17941, "loss": 1.9619, "learning_rate": 6.826191999505056e-05, "epoch": 0.39139401371161026, "percentage": 39.14, "elapsed_time": "16:36:50", "remaining_time": "1 day, 1:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7023, "total_steps": 17941, "loss": 1.6066, "learning_rate": 6.82536306271053e-05, "epoch": 0.39144975196477344, "percentage": 39.14, "elapsed_time": "16:36:59", "remaining_time": "1 day, 1:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7024, "total_steps": 17941, "loss": 1.8761, "learning_rate": 6.82453406802613e-05, "epoch": 0.39150549021793657, "percentage": 39.15, "elapsed_time": "16:37:07", "remaining_time": "1 day, 1:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7025, "total_steps": 17941, "loss": 1.494, "learning_rate": 6.823705015478148e-05, "epoch": 0.3915612284710997, "percentage": 39.16, "elapsed_time": "16:37:16", "remaining_time": "1 day, 1:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7026, "total_steps": 17941, "loss": 1.4918, "learning_rate": 6.822875905092876e-05, "epoch": 0.3916169667242629, "percentage": 39.16, "elapsed_time": "16:37:24", "remaining_time": "1 day, 1:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7027, "total_steps": 17941, "loss": 1.7521, "learning_rate": 6.822046736896607e-05, "epoch": 0.391672704977426, "percentage": 39.17, "elapsed_time": "16:37:32", "remaining_time": "1 day, 1:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7028, "total_steps": 17941, "loss": 1.5782, "learning_rate": 6.821217510915639e-05, "epoch": 0.39172844323058914, "percentage": 39.17, "elapsed_time": "16:37:41", "remaining_time": "1 day, 1:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7029, "total_steps": 17941, "loss": 1.4754, "learning_rate": 6.820388227176271e-05, "epoch": 0.3917841814837523, "percentage": 39.18, "elapsed_time": "16:37:49", "remaining_time": "1 day, 1:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7030, "total_steps": 17941, "loss": 1.6245, "learning_rate": 6.819558885704801e-05, "epoch": 0.39183991973691545, "percentage": 39.18, "elapsed_time": "16:37:58", "remaining_time": "1 day, 1:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7031, "total_steps": 17941, "loss": 1.7134, "learning_rate": 6.818729486527533e-05, "epoch": 0.3918956579900786, "percentage": 39.19, "elapsed_time": "16:38:06", "remaining_time": "1 day, 1:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7032, "total_steps": 17941, "loss": 1.6473, "learning_rate": 6.817900029670769e-05, "epoch": 0.3919513962432417, "percentage": 39.2, "elapsed_time": "16:38:15", "remaining_time": "1 day, 1:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7033, "total_steps": 17941, "loss": 1.4961, "learning_rate": 6.817070515160815e-05, "epoch": 0.3920071344964049, "percentage": 39.2, "elapsed_time": "16:38:23", "remaining_time": "1 day, 1:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7034, "total_steps": 17941, "loss": 1.8336, "learning_rate": 6.816240943023977e-05, "epoch": 0.392062872749568, "percentage": 39.21, "elapsed_time": "16:38:32", "remaining_time": "1 day, 1:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7035, "total_steps": 17941, "loss": 1.8517, "learning_rate": 6.815411313286568e-05, "epoch": 0.39211861100273115, "percentage": 39.21, "elapsed_time": "16:38:40", "remaining_time": "1 day, 1:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7036, "total_steps": 17941, "loss": 1.8405, "learning_rate": 6.814581625974897e-05, "epoch": 0.39217434925589434, "percentage": 39.22, "elapsed_time": "16:38:49", "remaining_time": "1 day, 1:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7037, "total_steps": 17941, "loss": 1.7636, "learning_rate": 6.813751881115275e-05, "epoch": 0.39223008750905747, "percentage": 39.22, "elapsed_time": "16:38:57", "remaining_time": "1 day, 1:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7038, "total_steps": 17941, "loss": 1.8142, "learning_rate": 6.812922078734019e-05, "epoch": 0.3922858257622206, "percentage": 39.23, "elapsed_time": "16:39:06", "remaining_time": "1 day, 1:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7039, "total_steps": 17941, "loss": 1.7048, "learning_rate": 6.812092218857444e-05, "epoch": 0.3923415640153838, "percentage": 39.23, "elapsed_time": "16:39:14", "remaining_time": "1 day, 1:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7040, "total_steps": 17941, "loss": 1.652, "learning_rate": 6.811262301511869e-05, "epoch": 0.3923973022685469, "percentage": 39.24, "elapsed_time": "16:39:22", "remaining_time": "1 day, 1:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7041, "total_steps": 17941, "loss": 1.325, "learning_rate": 6.810432326723615e-05, "epoch": 0.39245304052171004, "percentage": 39.25, "elapsed_time": "16:39:31", "remaining_time": "1 day, 1:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7042, "total_steps": 17941, "loss": 1.7832, "learning_rate": 6.809602294519004e-05, "epoch": 0.39250877877487317, "percentage": 39.25, "elapsed_time": "16:39:39", "remaining_time": "1 day, 1:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7043, "total_steps": 17941, "loss": 1.6449, "learning_rate": 6.808772204924357e-05, "epoch": 0.39256451702803635, "percentage": 39.26, "elapsed_time": "16:39:48", "remaining_time": "1 day, 1:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7044, "total_steps": 17941, "loss": 1.6308, "learning_rate": 6.807942057966003e-05, "epoch": 0.3926202552811995, "percentage": 39.26, "elapsed_time": "16:39:56", "remaining_time": "1 day, 1:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7045, "total_steps": 17941, "loss": 1.6675, "learning_rate": 6.807111853670268e-05, "epoch": 0.3926759935343626, "percentage": 39.27, "elapsed_time": "16:40:05", "remaining_time": "1 day, 1:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7046, "total_steps": 17941, "loss": 1.8951, "learning_rate": 6.806281592063481e-05, "epoch": 0.3927317317875258, "percentage": 39.27, "elapsed_time": "16:40:13", "remaining_time": "1 day, 1:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7047, "total_steps": 17941, "loss": 1.686, "learning_rate": 6.805451273171972e-05, "epoch": 0.3927874700406889, "percentage": 39.28, "elapsed_time": "16:40:21", "remaining_time": "1 day, 1:46:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7048, "total_steps": 17941, "loss": 1.407, "learning_rate": 6.804620897022076e-05, "epoch": 0.39284320829385205, "percentage": 39.28, "elapsed_time": "16:40:30", "remaining_time": "1 day, 1:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7049, "total_steps": 17941, "loss": 1.8137, "learning_rate": 6.803790463640127e-05, "epoch": 0.39289894654701524, "percentage": 39.29, "elapsed_time": "16:40:38", "remaining_time": "1 day, 1:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7050, "total_steps": 17941, "loss": 1.7861, "learning_rate": 6.802959973052461e-05, "epoch": 0.39295468480017837, "percentage": 39.3, "elapsed_time": "16:40:47", "remaining_time": "1 day, 1:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7051, "total_steps": 17941, "loss": 1.6572, "learning_rate": 6.802129425285417e-05, "epoch": 0.3930104230533415, "percentage": 39.3, "elapsed_time": "16:40:56", "remaining_time": "1 day, 1:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7052, "total_steps": 17941, "loss": 1.7467, "learning_rate": 6.801298820365333e-05, "epoch": 0.3930661613065047, "percentage": 39.31, "elapsed_time": "16:41:04", "remaining_time": "1 day, 1:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7053, "total_steps": 17941, "loss": 1.7429, "learning_rate": 6.800468158318554e-05, "epoch": 0.3931218995596678, "percentage": 39.31, "elapsed_time": "16:41:13", "remaining_time": "1 day, 1:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7054, "total_steps": 17941, "loss": 1.764, "learning_rate": 6.799637439171424e-05, "epoch": 0.39317763781283094, "percentage": 39.32, "elapsed_time": "16:41:21", "remaining_time": "1 day, 1:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7055, "total_steps": 17941, "loss": 1.4691, "learning_rate": 6.798806662950286e-05, "epoch": 0.39323337606599407, "percentage": 39.32, "elapsed_time": "16:41:30", "remaining_time": "1 day, 1:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7056, "total_steps": 17941, "loss": 1.5577, "learning_rate": 6.797975829681487e-05, "epoch": 0.39328911431915725, "percentage": 39.33, "elapsed_time": "16:41:38", "remaining_time": "1 day, 1:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7057, "total_steps": 17941, "loss": 1.7471, "learning_rate": 6.79714493939138e-05, "epoch": 0.3933448525723204, "percentage": 39.33, "elapsed_time": "16:41:47", "remaining_time": "1 day, 1:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7058, "total_steps": 17941, "loss": 1.765, "learning_rate": 6.796313992106313e-05, "epoch": 0.3934005908254835, "percentage": 39.34, "elapsed_time": "16:41:56", "remaining_time": "1 day, 1:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7059, "total_steps": 17941, "loss": 1.9101, "learning_rate": 6.795482987852638e-05, "epoch": 0.3934563290786467, "percentage": 39.35, "elapsed_time": "16:42:04", "remaining_time": "1 day, 1:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7060, "total_steps": 17941, "loss": 1.8193, "learning_rate": 6.794651926656711e-05, "epoch": 0.3935120673318098, "percentage": 39.35, "elapsed_time": "16:42:13", "remaining_time": "1 day, 1:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7061, "total_steps": 17941, "loss": 1.3794, "learning_rate": 6.793820808544891e-05, "epoch": 0.39356780558497295, "percentage": 39.36, "elapsed_time": "16:42:21", "remaining_time": "1 day, 1:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7062, "total_steps": 17941, "loss": 1.5634, "learning_rate": 6.792989633543531e-05, "epoch": 0.39362354383813614, "percentage": 39.36, "elapsed_time": "16:42:30", "remaining_time": "1 day, 1:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7063, "total_steps": 17941, "loss": 1.6858, "learning_rate": 6.792158401678994e-05, "epoch": 0.39367928209129927, "percentage": 39.37, "elapsed_time": "16:42:38", "remaining_time": "1 day, 1:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7064, "total_steps": 17941, "loss": 1.8272, "learning_rate": 6.791327112977644e-05, "epoch": 0.3937350203444624, "percentage": 39.37, "elapsed_time": "16:42:46", "remaining_time": "1 day, 1:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7065, "total_steps": 17941, "loss": 1.7226, "learning_rate": 6.790495767465839e-05, "epoch": 0.3937907585976255, "percentage": 39.38, "elapsed_time": "16:42:55", "remaining_time": "1 day, 1:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7066, "total_steps": 17941, "loss": 1.5082, "learning_rate": 6.789664365169947e-05, "epoch": 0.3938464968507887, "percentage": 39.38, "elapsed_time": "16:43:03", "remaining_time": "1 day, 1:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7067, "total_steps": 17941, "loss": 1.4914, "learning_rate": 6.788832906116338e-05, "epoch": 0.39390223510395184, "percentage": 39.39, "elapsed_time": "16:43:12", "remaining_time": "1 day, 1:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7068, "total_steps": 17941, "loss": 1.5864, "learning_rate": 6.78800139033138e-05, "epoch": 0.39395797335711497, "percentage": 39.4, "elapsed_time": "16:43:20", "remaining_time": "1 day, 1:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7069, "total_steps": 17941, "loss": 1.9452, "learning_rate": 6.787169817841442e-05, "epoch": 0.39401371161027815, "percentage": 39.4, "elapsed_time": "16:43:29", "remaining_time": "1 day, 1:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7070, "total_steps": 17941, "loss": 1.7637, "learning_rate": 6.786338188672896e-05, "epoch": 0.3940694498634413, "percentage": 39.41, "elapsed_time": "16:43:37", "remaining_time": "1 day, 1:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7071, "total_steps": 17941, "loss": 1.6875, "learning_rate": 6.785506502852118e-05, "epoch": 0.3941251881166044, "percentage": 39.41, "elapsed_time": "16:43:46", "remaining_time": "1 day, 1:43:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7072, "total_steps": 17941, "loss": 1.6496, "learning_rate": 6.784674760405482e-05, "epoch": 0.3941809263697676, "percentage": 39.42, "elapsed_time": "16:43:54", "remaining_time": "1 day, 1:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7073, "total_steps": 17941, "loss": 1.7234, "learning_rate": 6.78384296135937e-05, "epoch": 0.3942366646229307, "percentage": 39.42, "elapsed_time": "16:44:03", "remaining_time": "1 day, 1:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7074, "total_steps": 17941, "loss": 1.9166, "learning_rate": 6.783011105740162e-05, "epoch": 0.39429240287609385, "percentage": 39.43, "elapsed_time": "16:44:11", "remaining_time": "1 day, 1:42:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7075, "total_steps": 17941, "loss": 1.6746, "learning_rate": 6.782179193574234e-05, "epoch": 0.39434814112925703, "percentage": 39.43, "elapsed_time": "16:44:20", "remaining_time": "1 day, 1:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7076, "total_steps": 17941, "loss": 1.6615, "learning_rate": 6.781347224887974e-05, "epoch": 0.39440387938242016, "percentage": 39.44, "elapsed_time": "16:44:28", "remaining_time": "1 day, 1:42:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7077, "total_steps": 17941, "loss": 1.7271, "learning_rate": 6.780515199707766e-05, "epoch": 0.3944596176355833, "percentage": 39.45, "elapsed_time": "16:44:37", "remaining_time": "1 day, 1:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7078, "total_steps": 17941, "loss": 1.5172, "learning_rate": 6.779683118059997e-05, "epoch": 0.3945153558887464, "percentage": 39.45, "elapsed_time": "16:44:45", "remaining_time": "1 day, 1:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7079, "total_steps": 17941, "loss": 1.5777, "learning_rate": 6.778850979971057e-05, "epoch": 0.3945710941419096, "percentage": 39.46, "elapsed_time": "16:44:54", "remaining_time": "1 day, 1:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7080, "total_steps": 17941, "loss": 1.5685, "learning_rate": 6.778018785467332e-05, "epoch": 0.39462683239507274, "percentage": 39.46, "elapsed_time": "16:45:02", "remaining_time": "1 day, 1:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7081, "total_steps": 17941, "loss": 1.6626, "learning_rate": 6.777186534575222e-05, "epoch": 0.39468257064823586, "percentage": 39.47, "elapsed_time": "16:45:10", "remaining_time": "1 day, 1:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7082, "total_steps": 17941, "loss": 1.5554, "learning_rate": 6.776354227321114e-05, "epoch": 0.39473830890139905, "percentage": 39.47, "elapsed_time": "16:45:19", "remaining_time": "1 day, 1:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7083, "total_steps": 17941, "loss": 1.613, "learning_rate": 6.775521863731408e-05, "epoch": 0.3947940471545622, "percentage": 39.48, "elapsed_time": "16:45:27", "remaining_time": "1 day, 1:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7084, "total_steps": 17941, "loss": 1.6554, "learning_rate": 6.7746894438325e-05, "epoch": 0.3948497854077253, "percentage": 39.48, "elapsed_time": "16:45:36", "remaining_time": "1 day, 1:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7085, "total_steps": 17941, "loss": 1.7542, "learning_rate": 6.773856967650789e-05, "epoch": 0.3949055236608885, "percentage": 39.49, "elapsed_time": "16:45:45", "remaining_time": "1 day, 1:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7086, "total_steps": 17941, "loss": 1.8008, "learning_rate": 6.773024435212678e-05, "epoch": 0.3949612619140516, "percentage": 39.5, "elapsed_time": "16:45:54", "remaining_time": "1 day, 1:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7087, "total_steps": 17941, "loss": 1.6853, "learning_rate": 6.77219184654457e-05, "epoch": 0.39501700016721475, "percentage": 39.5, "elapsed_time": "16:46:03", "remaining_time": "1 day, 1:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7088, "total_steps": 17941, "loss": 1.877, "learning_rate": 6.771359201672868e-05, "epoch": 0.3950727384203779, "percentage": 39.51, "elapsed_time": "16:46:11", "remaining_time": "1 day, 1:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7089, "total_steps": 17941, "loss": 1.5347, "learning_rate": 6.770526500623982e-05, "epoch": 0.39512847667354106, "percentage": 39.51, "elapsed_time": "16:46:19", "remaining_time": "1 day, 1:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7090, "total_steps": 17941, "loss": 1.6611, "learning_rate": 6.769693743424317e-05, "epoch": 0.3951842149267042, "percentage": 39.52, "elapsed_time": "16:46:28", "remaining_time": "1 day, 1:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7091, "total_steps": 17941, "loss": 1.991, "learning_rate": 6.768860930100285e-05, "epoch": 0.3952399531798673, "percentage": 39.52, "elapsed_time": "16:46:36", "remaining_time": "1 day, 1:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7092, "total_steps": 17941, "loss": 1.8402, "learning_rate": 6.768028060678296e-05, "epoch": 0.3952956914330305, "percentage": 39.53, "elapsed_time": "16:46:45", "remaining_time": "1 day, 1:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7093, "total_steps": 17941, "loss": 1.6969, "learning_rate": 6.767195135184765e-05, "epoch": 0.39535142968619363, "percentage": 39.54, "elapsed_time": "16:46:53", "remaining_time": "1 day, 1:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7094, "total_steps": 17941, "loss": 1.6525, "learning_rate": 6.766362153646111e-05, "epoch": 0.39540716793935676, "percentage": 39.54, "elapsed_time": "16:47:02", "remaining_time": "1 day, 1:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7095, "total_steps": 17941, "loss": 1.7744, "learning_rate": 6.765529116088745e-05, "epoch": 0.39546290619251995, "percentage": 39.55, "elapsed_time": "16:47:10", "remaining_time": "1 day, 1:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7096, "total_steps": 17941, "loss": 1.6068, "learning_rate": 6.764696022539091e-05, "epoch": 0.3955186444456831, "percentage": 39.55, "elapsed_time": "16:47:19", "remaining_time": "1 day, 1:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7097, "total_steps": 17941, "loss": 1.6501, "learning_rate": 6.763862873023567e-05, "epoch": 0.3955743826988462, "percentage": 39.56, "elapsed_time": "16:47:27", "remaining_time": "1 day, 1:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7098, "total_steps": 17941, "loss": 1.5805, "learning_rate": 6.763029667568597e-05, "epoch": 0.3956301209520094, "percentage": 39.56, "elapsed_time": "16:47:36", "remaining_time": "1 day, 1:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7099, "total_steps": 17941, "loss": 1.7185, "learning_rate": 6.762196406200604e-05, "epoch": 0.3956858592051725, "percentage": 39.57, "elapsed_time": "16:47:44", "remaining_time": "1 day, 1:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7100, "total_steps": 17941, "loss": 1.7264, "learning_rate": 6.761363088946017e-05, "epoch": 0.39574159745833565, "percentage": 39.57, "elapsed_time": "16:47:53", "remaining_time": "1 day, 1:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7101, "total_steps": 17941, "loss": 1.6626, "learning_rate": 6.760529715831262e-05, "epoch": 0.3957973357114988, "percentage": 39.58, "elapsed_time": "16:48:02", "remaining_time": "1 day, 1:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7102, "total_steps": 17941, "loss": 1.827, "learning_rate": 6.759696286882769e-05, "epoch": 0.39585307396466196, "percentage": 39.59, "elapsed_time": "16:48:10", "remaining_time": "1 day, 1:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7103, "total_steps": 17941, "loss": 1.8003, "learning_rate": 6.758862802126969e-05, "epoch": 0.3959088122178251, "percentage": 39.59, "elapsed_time": "16:48:18", "remaining_time": "1 day, 1:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7104, "total_steps": 17941, "loss": 1.7641, "learning_rate": 6.758029261590296e-05, "epoch": 0.3959645504709882, "percentage": 39.6, "elapsed_time": "16:48:27", "remaining_time": "1 day, 1:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7105, "total_steps": 17941, "loss": 1.6907, "learning_rate": 6.757195665299186e-05, "epoch": 0.3960202887241514, "percentage": 39.6, "elapsed_time": "16:48:36", "remaining_time": "1 day, 1:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7106, "total_steps": 17941, "loss": 1.5457, "learning_rate": 6.756362013280072e-05, "epoch": 0.39607602697731453, "percentage": 39.61, "elapsed_time": "16:48:44", "remaining_time": "1 day, 1:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7107, "total_steps": 17941, "loss": 1.6021, "learning_rate": 6.755528305559398e-05, "epoch": 0.39613176523047766, "percentage": 39.61, "elapsed_time": "16:48:53", "remaining_time": "1 day, 1:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7108, "total_steps": 17941, "loss": 1.5837, "learning_rate": 6.7546945421636e-05, "epoch": 0.39618750348364085, "percentage": 39.62, "elapsed_time": "16:49:02", "remaining_time": "1 day, 1:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7109, "total_steps": 17941, "loss": 2.096, "learning_rate": 6.753860723119122e-05, "epoch": 0.396243241736804, "percentage": 39.62, "elapsed_time": "16:49:10", "remaining_time": "1 day, 1:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7110, "total_steps": 17941, "loss": 1.9298, "learning_rate": 6.753026848452407e-05, "epoch": 0.3962989799899671, "percentage": 39.63, "elapsed_time": "16:49:19", "remaining_time": "1 day, 1:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7111, "total_steps": 17941, "loss": 1.702, "learning_rate": 6.752192918189902e-05, "epoch": 0.39635471824313023, "percentage": 39.64, "elapsed_time": "16:49:27", "remaining_time": "1 day, 1:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7112, "total_steps": 17941, "loss": 1.6217, "learning_rate": 6.751358932358052e-05, "epoch": 0.3964104564962934, "percentage": 39.64, "elapsed_time": "16:49:36", "remaining_time": "1 day, 1:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7113, "total_steps": 17941, "loss": 1.9734, "learning_rate": 6.750524890983309e-05, "epoch": 0.39646619474945655, "percentage": 39.65, "elapsed_time": "16:49:44", "remaining_time": "1 day, 1:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7114, "total_steps": 17941, "loss": 1.9415, "learning_rate": 6.749690794092125e-05, "epoch": 0.3965219330026197, "percentage": 39.65, "elapsed_time": "16:49:53", "remaining_time": "1 day, 1:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7115, "total_steps": 17941, "loss": 2.0009, "learning_rate": 6.748856641710948e-05, "epoch": 0.39657767125578286, "percentage": 39.66, "elapsed_time": "16:50:01", "remaining_time": "1 day, 1:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7116, "total_steps": 17941, "loss": 1.7601, "learning_rate": 6.748022433866236e-05, "epoch": 0.396633409508946, "percentage": 39.66, "elapsed_time": "16:50:10", "remaining_time": "1 day, 1:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7117, "total_steps": 17941, "loss": 1.7173, "learning_rate": 6.747188170584444e-05, "epoch": 0.3966891477621091, "percentage": 39.67, "elapsed_time": "16:50:18", "remaining_time": "1 day, 1:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7118, "total_steps": 17941, "loss": 1.7054, "learning_rate": 6.746353851892028e-05, "epoch": 0.3967448860152723, "percentage": 39.67, "elapsed_time": "16:50:26", "remaining_time": "1 day, 1:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7119, "total_steps": 17941, "loss": 1.6456, "learning_rate": 6.745519477815451e-05, "epoch": 0.39680062426843543, "percentage": 39.68, "elapsed_time": "16:50:35", "remaining_time": "1 day, 1:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7120, "total_steps": 17941, "loss": 1.7264, "learning_rate": 6.744685048381174e-05, "epoch": 0.39685636252159856, "percentage": 39.69, "elapsed_time": "16:50:43", "remaining_time": "1 day, 1:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7121, "total_steps": 17941, "loss": 1.7025, "learning_rate": 6.743850563615659e-05, "epoch": 0.39691210077476174, "percentage": 39.69, "elapsed_time": "16:50:52", "remaining_time": "1 day, 1:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7122, "total_steps": 17941, "loss": 1.5742, "learning_rate": 6.743016023545373e-05, "epoch": 0.3969678390279249, "percentage": 39.7, "elapsed_time": "16:51:00", "remaining_time": "1 day, 1:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7123, "total_steps": 17941, "loss": 1.8845, "learning_rate": 6.742181428196777e-05, "epoch": 0.397023577281088, "percentage": 39.7, "elapsed_time": "16:51:09", "remaining_time": "1 day, 1:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7124, "total_steps": 17941, "loss": 1.6998, "learning_rate": 6.741346777596347e-05, "epoch": 0.39707931553425113, "percentage": 39.71, "elapsed_time": "16:51:17", "remaining_time": "1 day, 1:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7125, "total_steps": 17941, "loss": 1.4712, "learning_rate": 6.74051207177055e-05, "epoch": 0.3971350537874143, "percentage": 39.71, "elapsed_time": "16:51:26", "remaining_time": "1 day, 1:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7126, "total_steps": 17941, "loss": 1.4259, "learning_rate": 6.739677310745856e-05, "epoch": 0.39719079204057745, "percentage": 39.72, "elapsed_time": "16:51:34", "remaining_time": "1 day, 1:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7127, "total_steps": 17941, "loss": 1.6437, "learning_rate": 6.738842494548742e-05, "epoch": 0.3972465302937406, "percentage": 39.72, "elapsed_time": "16:51:43", "remaining_time": "1 day, 1:35:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7128, "total_steps": 17941, "loss": 1.537, "learning_rate": 6.738007623205682e-05, "epoch": 0.39730226854690376, "percentage": 39.73, "elapsed_time": "16:51:52", "remaining_time": "1 day, 1:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7129, "total_steps": 17941, "loss": 1.7359, "learning_rate": 6.737172696743155e-05, "epoch": 0.3973580068000669, "percentage": 39.74, "elapsed_time": "16:52:01", "remaining_time": "1 day, 1:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7130, "total_steps": 17941, "loss": 1.632, "learning_rate": 6.736337715187638e-05, "epoch": 0.39741374505323, "percentage": 39.74, "elapsed_time": "16:52:09", "remaining_time": "1 day, 1:34:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7131, "total_steps": 17941, "loss": 1.6633, "learning_rate": 6.735502678565611e-05, "epoch": 0.3974694833063932, "percentage": 39.75, "elapsed_time": "16:52:18", "remaining_time": "1 day, 1:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7132, "total_steps": 17941, "loss": 1.6349, "learning_rate": 6.734667586903557e-05, "epoch": 0.39752522155955633, "percentage": 39.75, "elapsed_time": "16:52:27", "remaining_time": "1 day, 1:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7133, "total_steps": 17941, "loss": 1.8522, "learning_rate": 6.733832440227963e-05, "epoch": 0.39758095981271946, "percentage": 39.76, "elapsed_time": "16:52:35", "remaining_time": "1 day, 1:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7134, "total_steps": 17941, "loss": 1.8608, "learning_rate": 6.732997238565311e-05, "epoch": 0.3976366980658826, "percentage": 39.76, "elapsed_time": "16:52:44", "remaining_time": "1 day, 1:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7135, "total_steps": 17941, "loss": 1.7628, "learning_rate": 6.732161981942093e-05, "epoch": 0.3976924363190458, "percentage": 39.77, "elapsed_time": "16:52:52", "remaining_time": "1 day, 1:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7136, "total_steps": 17941, "loss": 1.7216, "learning_rate": 6.731326670384794e-05, "epoch": 0.3977481745722089, "percentage": 39.77, "elapsed_time": "16:53:01", "remaining_time": "1 day, 1:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7137, "total_steps": 17941, "loss": 1.6816, "learning_rate": 6.730491303919907e-05, "epoch": 0.39780391282537203, "percentage": 39.78, "elapsed_time": "16:53:09", "remaining_time": "1 day, 1:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7138, "total_steps": 17941, "loss": 1.9808, "learning_rate": 6.729655882573928e-05, "epoch": 0.3978596510785352, "percentage": 39.79, "elapsed_time": "16:53:18", "remaining_time": "1 day, 1:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7139, "total_steps": 17941, "loss": 1.8237, "learning_rate": 6.728820406373346e-05, "epoch": 0.39791538933169834, "percentage": 39.79, "elapsed_time": "16:53:26", "remaining_time": "1 day, 1:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7140, "total_steps": 17941, "loss": 1.61, "learning_rate": 6.727984875344663e-05, "epoch": 0.3979711275848615, "percentage": 39.8, "elapsed_time": "16:53:35", "remaining_time": "1 day, 1:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7141, "total_steps": 17941, "loss": 2.1011, "learning_rate": 6.727149289514373e-05, "epoch": 0.39802686583802466, "percentage": 39.8, "elapsed_time": "16:53:43", "remaining_time": "1 day, 1:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7142, "total_steps": 17941, "loss": 1.6724, "learning_rate": 6.72631364890898e-05, "epoch": 0.3980826040911878, "percentage": 39.81, "elapsed_time": "16:53:52", "remaining_time": "1 day, 1:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7143, "total_steps": 17941, "loss": 1.5425, "learning_rate": 6.725477953554979e-05, "epoch": 0.3981383423443509, "percentage": 39.81, "elapsed_time": "16:54:00", "remaining_time": "1 day, 1:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7144, "total_steps": 17941, "loss": 1.6308, "learning_rate": 6.72464220347888e-05, "epoch": 0.3981940805975141, "percentage": 39.82, "elapsed_time": "16:54:09", "remaining_time": "1 day, 1:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7145, "total_steps": 17941, "loss": 1.8022, "learning_rate": 6.723806398707185e-05, "epoch": 0.39824981885067723, "percentage": 39.82, "elapsed_time": "16:54:17", "remaining_time": "1 day, 1:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7146, "total_steps": 17941, "loss": 1.4448, "learning_rate": 6.722970539266403e-05, "epoch": 0.39830555710384036, "percentage": 39.83, "elapsed_time": "16:54:27", "remaining_time": "1 day, 1:32:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7147, "total_steps": 17941, "loss": 1.7358, "learning_rate": 6.72213462518304e-05, "epoch": 0.3983612953570035, "percentage": 39.84, "elapsed_time": "16:54:35", "remaining_time": "1 day, 1:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7148, "total_steps": 17941, "loss": 1.4709, "learning_rate": 6.721298656483608e-05, "epoch": 0.39841703361016667, "percentage": 39.84, "elapsed_time": "16:54:44", "remaining_time": "1 day, 1:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7149, "total_steps": 17941, "loss": 1.6085, "learning_rate": 6.720462633194618e-05, "epoch": 0.3984727718633298, "percentage": 39.85, "elapsed_time": "16:54:52", "remaining_time": "1 day, 1:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7150, "total_steps": 17941, "loss": 1.8059, "learning_rate": 6.719626555342585e-05, "epoch": 0.39852851011649293, "percentage": 39.85, "elapsed_time": "16:55:01", "remaining_time": "1 day, 1:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7151, "total_steps": 17941, "loss": 1.7492, "learning_rate": 6.718790422954021e-05, "epoch": 0.3985842483696561, "percentage": 39.86, "elapsed_time": "16:55:09", "remaining_time": "1 day, 1:31:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7152, "total_steps": 17941, "loss": 1.6074, "learning_rate": 6.717954236055449e-05, "epoch": 0.39863998662281924, "percentage": 39.86, "elapsed_time": "16:55:18", "remaining_time": "1 day, 1:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7153, "total_steps": 17941, "loss": 1.3657, "learning_rate": 6.717117994673384e-05, "epoch": 0.39869572487598237, "percentage": 39.87, "elapsed_time": "16:55:27", "remaining_time": "1 day, 1:31:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7154, "total_steps": 17941, "loss": 1.6112, "learning_rate": 6.716281698834346e-05, "epoch": 0.39875146312914556, "percentage": 39.88, "elapsed_time": "16:55:35", "remaining_time": "1 day, 1:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7155, "total_steps": 17941, "loss": 1.9087, "learning_rate": 6.715445348564862e-05, "epoch": 0.3988072013823087, "percentage": 39.88, "elapsed_time": "16:55:44", "remaining_time": "1 day, 1:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7156, "total_steps": 17941, "loss": 2.0278, "learning_rate": 6.714608943891452e-05, "epoch": 0.3988629396354718, "percentage": 39.89, "elapsed_time": "16:55:53", "remaining_time": "1 day, 1:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7157, "total_steps": 17941, "loss": 1.63, "learning_rate": 6.713772484840645e-05, "epoch": 0.39891867788863494, "percentage": 39.89, "elapsed_time": "16:56:01", "remaining_time": "1 day, 1:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7158, "total_steps": 17941, "loss": 1.6313, "learning_rate": 6.712935971438962e-05, "epoch": 0.3989744161417981, "percentage": 39.9, "elapsed_time": "16:56:10", "remaining_time": "1 day, 1:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7159, "total_steps": 17941, "loss": 1.7367, "learning_rate": 6.712099403712942e-05, "epoch": 0.39903015439496126, "percentage": 39.9, "elapsed_time": "16:56:18", "remaining_time": "1 day, 1:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7160, "total_steps": 17941, "loss": 1.8337, "learning_rate": 6.711262781689109e-05, "epoch": 0.3990858926481244, "percentage": 39.91, "elapsed_time": "16:56:27", "remaining_time": "1 day, 1:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7161, "total_steps": 17941, "loss": 1.8474, "learning_rate": 6.710426105394e-05, "epoch": 0.39914163090128757, "percentage": 39.91, "elapsed_time": "16:56:35", "remaining_time": "1 day, 1:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7162, "total_steps": 17941, "loss": 1.4712, "learning_rate": 6.709589374854144e-05, "epoch": 0.3991973691544507, "percentage": 39.92, "elapsed_time": "16:56:44", "remaining_time": "1 day, 1:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7163, "total_steps": 17941, "loss": 1.6399, "learning_rate": 6.708752590096082e-05, "epoch": 0.3992531074076138, "percentage": 39.93, "elapsed_time": "16:56:53", "remaining_time": "1 day, 1:30:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7164, "total_steps": 17941, "loss": 1.6822, "learning_rate": 6.707915751146351e-05, "epoch": 0.399308845660777, "percentage": 39.93, "elapsed_time": "16:57:01", "remaining_time": "1 day, 1:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7165, "total_steps": 17941, "loss": 1.4796, "learning_rate": 6.70707885803149e-05, "epoch": 0.39936458391394014, "percentage": 39.94, "elapsed_time": "16:57:10", "remaining_time": "1 day, 1:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7166, "total_steps": 17941, "loss": 1.844, "learning_rate": 6.706241910778041e-05, "epoch": 0.39942032216710327, "percentage": 39.94, "elapsed_time": "16:57:18", "remaining_time": "1 day, 1:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7167, "total_steps": 17941, "loss": 1.787, "learning_rate": 6.705404909412547e-05, "epoch": 0.39947606042026645, "percentage": 39.95, "elapsed_time": "16:57:27", "remaining_time": "1 day, 1:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7168, "total_steps": 17941, "loss": 1.7695, "learning_rate": 6.704567853961552e-05, "epoch": 0.3995317986734296, "percentage": 39.95, "elapsed_time": "16:57:35", "remaining_time": "1 day, 1:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7169, "total_steps": 17941, "loss": 1.5939, "learning_rate": 6.703730744451601e-05, "epoch": 0.3995875369265927, "percentage": 39.96, "elapsed_time": "16:57:44", "remaining_time": "1 day, 1:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7170, "total_steps": 17941, "loss": 1.7385, "learning_rate": 6.702893580909247e-05, "epoch": 0.39964327517975584, "percentage": 39.96, "elapsed_time": "16:57:52", "remaining_time": "1 day, 1:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7171, "total_steps": 17941, "loss": 1.6495, "learning_rate": 6.702056363361036e-05, "epoch": 0.399699013432919, "percentage": 39.97, "elapsed_time": "16:58:01", "remaining_time": "1 day, 1:28:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7172, "total_steps": 17941, "loss": 1.8867, "learning_rate": 6.701219091833522e-05, "epoch": 0.39975475168608215, "percentage": 39.98, "elapsed_time": "16:58:09", "remaining_time": "1 day, 1:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7173, "total_steps": 17941, "loss": 1.7746, "learning_rate": 6.700381766353255e-05, "epoch": 0.3998104899392453, "percentage": 39.98, "elapsed_time": "16:58:18", "remaining_time": "1 day, 1:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7174, "total_steps": 17941, "loss": 1.8656, "learning_rate": 6.699544386946795e-05, "epoch": 0.39986622819240847, "percentage": 39.99, "elapsed_time": "16:58:27", "remaining_time": "1 day, 1:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7175, "total_steps": 17941, "loss": 1.6071, "learning_rate": 6.698706953640693e-05, "epoch": 0.3999219664455716, "percentage": 39.99, "elapsed_time": "16:58:36", "remaining_time": "1 day, 1:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7176, "total_steps": 17941, "loss": 1.8849, "learning_rate": 6.697869466461513e-05, "epoch": 0.3999777046987347, "percentage": 40.0, "elapsed_time": "16:58:44", "remaining_time": "1 day, 1:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7177, "total_steps": 17941, "loss": 1.7764, "learning_rate": 6.69703192543581e-05, "epoch": 0.4000334429518979, "percentage": 40.0, "elapsed_time": "16:58:53", "remaining_time": "1 day, 1:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7178, "total_steps": 17941, "loss": 1.6598, "learning_rate": 6.696194330590151e-05, "epoch": 0.40008918120506104, "percentage": 40.01, "elapsed_time": "16:59:01", "remaining_time": "1 day, 1:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7179, "total_steps": 17941, "loss": 1.6139, "learning_rate": 6.695356681951099e-05, "epoch": 0.40014491945822417, "percentage": 40.01, "elapsed_time": "16:59:10", "remaining_time": "1 day, 1:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7180, "total_steps": 17941, "loss": 1.6783, "learning_rate": 6.694518979545214e-05, "epoch": 0.4002006577113873, "percentage": 40.02, "elapsed_time": "16:59:18", "remaining_time": "1 day, 1:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7181, "total_steps": 17941, "loss": 1.6699, "learning_rate": 6.69368122339907e-05, "epoch": 0.4002563959645505, "percentage": 40.03, "elapsed_time": "16:59:27", "remaining_time": "1 day, 1:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7182, "total_steps": 17941, "loss": 1.532, "learning_rate": 6.692843413539229e-05, "epoch": 0.4003121342177136, "percentage": 40.03, "elapsed_time": "16:59:35", "remaining_time": "1 day, 1:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7183, "total_steps": 17941, "loss": 1.9554, "learning_rate": 6.692005549992268e-05, "epoch": 0.40036787247087674, "percentage": 40.04, "elapsed_time": "16:59:44", "remaining_time": "1 day, 1:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7184, "total_steps": 17941, "loss": 1.4465, "learning_rate": 6.691167632784754e-05, "epoch": 0.4004236107240399, "percentage": 40.04, "elapsed_time": "16:59:52", "remaining_time": "1 day, 1:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7185, "total_steps": 17941, "loss": 1.6263, "learning_rate": 6.690329661943265e-05, "epoch": 0.40047934897720305, "percentage": 40.05, "elapsed_time": "17:00:01", "remaining_time": "1 day, 1:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7186, "total_steps": 17941, "loss": 1.8053, "learning_rate": 6.689491637494371e-05, "epoch": 0.4005350872303662, "percentage": 40.05, "elapsed_time": "17:00:09", "remaining_time": "1 day, 1:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7187, "total_steps": 17941, "loss": 1.6647, "learning_rate": 6.688653559464655e-05, "epoch": 0.40059082548352937, "percentage": 40.06, "elapsed_time": "17:00:18", "remaining_time": "1 day, 1:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7188, "total_steps": 17941, "loss": 1.7904, "learning_rate": 6.687815427880694e-05, "epoch": 0.4006465637366925, "percentage": 40.06, "elapsed_time": "17:00:26", "remaining_time": "1 day, 1:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7189, "total_steps": 17941, "loss": 1.8628, "learning_rate": 6.686977242769067e-05, "epoch": 0.4007023019898556, "percentage": 40.07, "elapsed_time": "17:00:35", "remaining_time": "1 day, 1:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7190, "total_steps": 17941, "loss": 1.6146, "learning_rate": 6.686139004156358e-05, "epoch": 0.4007580402430188, "percentage": 40.08, "elapsed_time": "17:00:43", "remaining_time": "1 day, 1:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7191, "total_steps": 17941, "loss": 1.683, "learning_rate": 6.68530071206915e-05, "epoch": 0.40081377849618194, "percentage": 40.08, "elapsed_time": "17:00:52", "remaining_time": "1 day, 1:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7192, "total_steps": 17941, "loss": 1.6757, "learning_rate": 6.684462366534032e-05, "epoch": 0.40086951674934507, "percentage": 40.09, "elapsed_time": "17:01:00", "remaining_time": "1 day, 1:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7193, "total_steps": 17941, "loss": 1.7725, "learning_rate": 6.683623967577586e-05, "epoch": 0.4009252550025082, "percentage": 40.09, "elapsed_time": "17:01:09", "remaining_time": "1 day, 1:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7194, "total_steps": 17941, "loss": 1.4681, "learning_rate": 6.682785515226407e-05, "epoch": 0.4009809932556714, "percentage": 40.1, "elapsed_time": "17:01:18", "remaining_time": "1 day, 1:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7195, "total_steps": 17941, "loss": 1.4126, "learning_rate": 6.681947009507079e-05, "epoch": 0.4010367315088345, "percentage": 40.1, "elapsed_time": "17:01:27", "remaining_time": "1 day, 1:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7196, "total_steps": 17941, "loss": 1.6593, "learning_rate": 6.681108450446202e-05, "epoch": 0.40109246976199764, "percentage": 40.11, "elapsed_time": "17:01:35", "remaining_time": "1 day, 1:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7197, "total_steps": 17941, "loss": 1.9668, "learning_rate": 6.680269838070364e-05, "epoch": 0.4011482080151608, "percentage": 40.11, "elapsed_time": "17:01:44", "remaining_time": "1 day, 1:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7198, "total_steps": 17941, "loss": 1.4285, "learning_rate": 6.679431172406163e-05, "epoch": 0.40120394626832395, "percentage": 40.12, "elapsed_time": "17:01:52", "remaining_time": "1 day, 1:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7199, "total_steps": 17941, "loss": 1.8469, "learning_rate": 6.678592453480198e-05, "epoch": 0.4012596845214871, "percentage": 40.13, "elapsed_time": "17:02:01", "remaining_time": "1 day, 1:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7200, "total_steps": 17941, "loss": 2.1511, "learning_rate": 6.677753681319066e-05, "epoch": 0.40131542277465027, "percentage": 40.13, "elapsed_time": "17:02:09", "remaining_time": "1 day, 1:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7201, "total_steps": 17941, "loss": 1.8045, "learning_rate": 6.676914855949372e-05, "epoch": 0.4013711610278134, "percentage": 40.14, "elapsed_time": "17:02:18", "remaining_time": "1 day, 1:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7202, "total_steps": 17941, "loss": 1.7844, "learning_rate": 6.676075977397715e-05, "epoch": 0.4014268992809765, "percentage": 40.14, "elapsed_time": "17:02:26", "remaining_time": "1 day, 1:24:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7203, "total_steps": 17941, "loss": 1.7289, "learning_rate": 6.675237045690699e-05, "epoch": 0.40148263753413965, "percentage": 40.15, "elapsed_time": "17:02:35", "remaining_time": "1 day, 1:24:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7204, "total_steps": 17941, "loss": 1.4584, "learning_rate": 6.674398060854931e-05, "epoch": 0.40153837578730284, "percentage": 40.15, "elapsed_time": "17:02:44", "remaining_time": "1 day, 1:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7205, "total_steps": 17941, "loss": 1.8035, "learning_rate": 6.67355902291702e-05, "epoch": 0.40159411404046597, "percentage": 40.16, "elapsed_time": "17:02:52", "remaining_time": "1 day, 1:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7206, "total_steps": 17941, "loss": 1.781, "learning_rate": 6.672719931903574e-05, "epoch": 0.4016498522936291, "percentage": 40.16, "elapsed_time": "17:03:00", "remaining_time": "1 day, 1:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7207, "total_steps": 17941, "loss": 1.7033, "learning_rate": 6.671880787841204e-05, "epoch": 0.4017055905467923, "percentage": 40.17, "elapsed_time": "17:03:09", "remaining_time": "1 day, 1:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7208, "total_steps": 17941, "loss": 1.7048, "learning_rate": 6.671041590756524e-05, "epoch": 0.4017613287999554, "percentage": 40.18, "elapsed_time": "17:03:17", "remaining_time": "1 day, 1:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7209, "total_steps": 17941, "loss": 1.6601, "learning_rate": 6.670202340676149e-05, "epoch": 0.40181706705311854, "percentage": 40.18, "elapsed_time": "17:03:26", "remaining_time": "1 day, 1:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7210, "total_steps": 17941, "loss": 1.619, "learning_rate": 6.669363037626689e-05, "epoch": 0.4018728053062817, "percentage": 40.19, "elapsed_time": "17:03:35", "remaining_time": "1 day, 1:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7211, "total_steps": 17941, "loss": 1.6898, "learning_rate": 6.66852368163477e-05, "epoch": 0.40192854355944485, "percentage": 40.19, "elapsed_time": "17:03:43", "remaining_time": "1 day, 1:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7212, "total_steps": 17941, "loss": 1.4842, "learning_rate": 6.667684272727007e-05, "epoch": 0.401984281812608, "percentage": 40.2, "elapsed_time": "17:03:51", "remaining_time": "1 day, 1:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7213, "total_steps": 17941, "loss": 1.5747, "learning_rate": 6.666844810930021e-05, "epoch": 0.40204002006577116, "percentage": 40.2, "elapsed_time": "17:04:00", "remaining_time": "1 day, 1:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7214, "total_steps": 17941, "loss": 1.9183, "learning_rate": 6.666005296270439e-05, "epoch": 0.4020957583189343, "percentage": 40.21, "elapsed_time": "17:04:08", "remaining_time": "1 day, 1:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7215, "total_steps": 17941, "loss": 1.708, "learning_rate": 6.66516572877488e-05, "epoch": 0.4021514965720974, "percentage": 40.22, "elapsed_time": "17:04:17", "remaining_time": "1 day, 1:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7216, "total_steps": 17941, "loss": 1.5666, "learning_rate": 6.664326108469974e-05, "epoch": 0.40220723482526055, "percentage": 40.22, "elapsed_time": "17:04:25", "remaining_time": "1 day, 1:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7217, "total_steps": 17941, "loss": 1.8389, "learning_rate": 6.663486435382347e-05, "epoch": 0.40226297307842374, "percentage": 40.23, "elapsed_time": "17:04:34", "remaining_time": "1 day, 1:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7218, "total_steps": 17941, "loss": 1.91, "learning_rate": 6.66264670953863e-05, "epoch": 0.40231871133158686, "percentage": 40.23, "elapsed_time": "17:04:42", "remaining_time": "1 day, 1:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7219, "total_steps": 17941, "loss": 1.6892, "learning_rate": 6.661806930965452e-05, "epoch": 0.40237444958475, "percentage": 40.24, "elapsed_time": "17:04:51", "remaining_time": "1 day, 1:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7220, "total_steps": 17941, "loss": 1.6718, "learning_rate": 6.660967099689448e-05, "epoch": 0.4024301878379132, "percentage": 40.24, "elapsed_time": "17:04:59", "remaining_time": "1 day, 1:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7221, "total_steps": 17941, "loss": 1.7055, "learning_rate": 6.66012721573725e-05, "epoch": 0.4024859260910763, "percentage": 40.25, "elapsed_time": "17:05:08", "remaining_time": "1 day, 1:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7222, "total_steps": 17941, "loss": 1.6732, "learning_rate": 6.659287279135499e-05, "epoch": 0.40254166434423944, "percentage": 40.25, "elapsed_time": "17:05:16", "remaining_time": "1 day, 1:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7223, "total_steps": 17941, "loss": 1.4223, "learning_rate": 6.658447289910827e-05, "epoch": 0.4025974025974026, "percentage": 40.26, "elapsed_time": "17:05:25", "remaining_time": "1 day, 1:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7224, "total_steps": 17941, "loss": 1.8696, "learning_rate": 6.657607248089879e-05, "epoch": 0.40265314085056575, "percentage": 40.27, "elapsed_time": "17:05:33", "remaining_time": "1 day, 1:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7225, "total_steps": 17941, "loss": 1.5046, "learning_rate": 6.65676715369929e-05, "epoch": 0.4027088791037289, "percentage": 40.27, "elapsed_time": "17:05:42", "remaining_time": "1 day, 1:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7226, "total_steps": 17941, "loss": 1.6517, "learning_rate": 6.655927006765709e-05, "epoch": 0.402764617356892, "percentage": 40.28, "elapsed_time": "17:05:50", "remaining_time": "1 day, 1:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7227, "total_steps": 17941, "loss": 1.8544, "learning_rate": 6.655086807315778e-05, "epoch": 0.4028203556100552, "percentage": 40.28, "elapsed_time": "17:05:59", "remaining_time": "1 day, 1:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7228, "total_steps": 17941, "loss": 1.7556, "learning_rate": 6.654246555376144e-05, "epoch": 0.4028760938632183, "percentage": 40.29, "elapsed_time": "17:06:07", "remaining_time": "1 day, 1:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7229, "total_steps": 17941, "loss": 1.7469, "learning_rate": 6.653406250973451e-05, "epoch": 0.40293183211638145, "percentage": 40.29, "elapsed_time": "17:06:15", "remaining_time": "1 day, 1:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7230, "total_steps": 17941, "loss": 1.6428, "learning_rate": 6.652565894134355e-05, "epoch": 0.40298757036954463, "percentage": 40.3, "elapsed_time": "17:06:24", "remaining_time": "1 day, 1:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7231, "total_steps": 17941, "loss": 1.4699, "learning_rate": 6.651725484885503e-05, "epoch": 0.40304330862270776, "percentage": 40.3, "elapsed_time": "17:06:32", "remaining_time": "1 day, 1:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7232, "total_steps": 17941, "loss": 1.8881, "learning_rate": 6.650885023253548e-05, "epoch": 0.4030990468758709, "percentage": 40.31, "elapsed_time": "17:06:42", "remaining_time": "1 day, 1:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7233, "total_steps": 17941, "loss": 1.8263, "learning_rate": 6.650044509265147e-05, "epoch": 0.4031547851290341, "percentage": 40.32, "elapsed_time": "17:06:51", "remaining_time": "1 day, 1:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7234, "total_steps": 17941, "loss": 1.5232, "learning_rate": 6.649203942946954e-05, "epoch": 0.4032105233821972, "percentage": 40.32, "elapsed_time": "17:06:59", "remaining_time": "1 day, 1:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7235, "total_steps": 17941, "loss": 1.5617, "learning_rate": 6.648363324325627e-05, "epoch": 0.40326626163536033, "percentage": 40.33, "elapsed_time": "17:07:08", "remaining_time": "1 day, 1:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7236, "total_steps": 17941, "loss": 1.7428, "learning_rate": 6.647522653427825e-05, "epoch": 0.4033219998885235, "percentage": 40.33, "elapsed_time": "17:07:16", "remaining_time": "1 day, 1:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7237, "total_steps": 17941, "loss": 1.5538, "learning_rate": 6.646681930280211e-05, "epoch": 0.40337773814168665, "percentage": 40.34, "elapsed_time": "17:07:24", "remaining_time": "1 day, 1:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7238, "total_steps": 17941, "loss": 1.5501, "learning_rate": 6.645841154909448e-05, "epoch": 0.4034334763948498, "percentage": 40.34, "elapsed_time": "17:07:33", "remaining_time": "1 day, 1:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7239, "total_steps": 17941, "loss": 1.7322, "learning_rate": 6.6450003273422e-05, "epoch": 0.4034892146480129, "percentage": 40.35, "elapsed_time": "17:07:42", "remaining_time": "1 day, 1:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7240, "total_steps": 17941, "loss": 1.6913, "learning_rate": 6.644159447605131e-05, "epoch": 0.4035449529011761, "percentage": 40.35, "elapsed_time": "17:07:51", "remaining_time": "1 day, 1:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7241, "total_steps": 17941, "loss": 1.6574, "learning_rate": 6.64331851572491e-05, "epoch": 0.4036006911543392, "percentage": 40.36, "elapsed_time": "17:07:59", "remaining_time": "1 day, 1:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7242, "total_steps": 17941, "loss": 1.5934, "learning_rate": 6.642477531728207e-05, "epoch": 0.40365642940750235, "percentage": 40.37, "elapsed_time": "17:08:08", "remaining_time": "1 day, 1:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7243, "total_steps": 17941, "loss": 1.8274, "learning_rate": 6.641636495641694e-05, "epoch": 0.40371216766066553, "percentage": 40.37, "elapsed_time": "17:08:16", "remaining_time": "1 day, 1:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7244, "total_steps": 17941, "loss": 1.4047, "learning_rate": 6.640795407492043e-05, "epoch": 0.40376790591382866, "percentage": 40.38, "elapsed_time": "17:08:25", "remaining_time": "1 day, 1:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7245, "total_steps": 17941, "loss": 1.8228, "learning_rate": 6.639954267305928e-05, "epoch": 0.4038236441669918, "percentage": 40.38, "elapsed_time": "17:08:33", "remaining_time": "1 day, 1:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7246, "total_steps": 17941, "loss": 1.8899, "learning_rate": 6.639113075110025e-05, "epoch": 0.403879382420155, "percentage": 40.39, "elapsed_time": "17:08:42", "remaining_time": "1 day, 1:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7247, "total_steps": 17941, "loss": 1.6491, "learning_rate": 6.63827183093101e-05, "epoch": 0.4039351206733181, "percentage": 40.39, "elapsed_time": "17:08:50", "remaining_time": "1 day, 1:18:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7248, "total_steps": 17941, "loss": 1.7502, "learning_rate": 6.637430534795567e-05, "epoch": 0.40399085892648123, "percentage": 40.4, "elapsed_time": "17:08:59", "remaining_time": "1 day, 1:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7249, "total_steps": 17941, "loss": 1.6643, "learning_rate": 6.636589186730373e-05, "epoch": 0.40404659717964436, "percentage": 40.4, "elapsed_time": "17:09:07", "remaining_time": "1 day, 1:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7250, "total_steps": 17941, "loss": 1.5516, "learning_rate": 6.635747786762113e-05, "epoch": 0.40410233543280755, "percentage": 40.41, "elapsed_time": "17:09:16", "remaining_time": "1 day, 1:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7251, "total_steps": 17941, "loss": 1.5581, "learning_rate": 6.63490633491747e-05, "epoch": 0.4041580736859707, "percentage": 40.42, "elapsed_time": "17:09:24", "remaining_time": "1 day, 1:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7252, "total_steps": 17941, "loss": 1.7449, "learning_rate": 6.63406483122313e-05, "epoch": 0.4042138119391338, "percentage": 40.42, "elapsed_time": "17:09:33", "remaining_time": "1 day, 1:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7253, "total_steps": 17941, "loss": 1.6806, "learning_rate": 6.633223275705781e-05, "epoch": 0.404269550192297, "percentage": 40.43, "elapsed_time": "17:09:41", "remaining_time": "1 day, 1:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7254, "total_steps": 17941, "loss": 1.742, "learning_rate": 6.632381668392111e-05, "epoch": 0.4043252884454601, "percentage": 40.43, "elapsed_time": "17:09:50", "remaining_time": "1 day, 1:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7255, "total_steps": 17941, "loss": 1.7586, "learning_rate": 6.631540009308813e-05, "epoch": 0.40438102669862325, "percentage": 40.44, "elapsed_time": "17:09:59", "remaining_time": "1 day, 1:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7256, "total_steps": 17941, "loss": 1.8601, "learning_rate": 6.630698298482578e-05, "epoch": 0.40443676495178643, "percentage": 40.44, "elapsed_time": "17:10:07", "remaining_time": "1 day, 1:16:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7257, "total_steps": 17941, "loss": 1.5131, "learning_rate": 6.629856535940101e-05, "epoch": 0.40449250320494956, "percentage": 40.45, "elapsed_time": "17:10:15", "remaining_time": "1 day, 1:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7258, "total_steps": 17941, "loss": 1.6167, "learning_rate": 6.629014721708076e-05, "epoch": 0.4045482414581127, "percentage": 40.45, "elapsed_time": "17:10:24", "remaining_time": "1 day, 1:16:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7259, "total_steps": 17941, "loss": 1.6698, "learning_rate": 6.628172855813203e-05, "epoch": 0.4046039797112759, "percentage": 40.46, "elapsed_time": "17:10:33", "remaining_time": "1 day, 1:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7260, "total_steps": 17941, "loss": 1.7449, "learning_rate": 6.627330938282182e-05, "epoch": 0.404659717964439, "percentage": 40.47, "elapsed_time": "17:10:41", "remaining_time": "1 day, 1:16:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7261, "total_steps": 17941, "loss": 1.6906, "learning_rate": 6.62648896914171e-05, "epoch": 0.40471545621760213, "percentage": 40.47, "elapsed_time": "17:10:49", "remaining_time": "1 day, 1:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7262, "total_steps": 17941, "loss": 1.651, "learning_rate": 6.62564694841849e-05, "epoch": 0.40477119447076526, "percentage": 40.48, "elapsed_time": "17:10:58", "remaining_time": "1 day, 1:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7263, "total_steps": 17941, "loss": 1.6232, "learning_rate": 6.624804876139227e-05, "epoch": 0.40482693272392845, "percentage": 40.48, "elapsed_time": "17:11:06", "remaining_time": "1 day, 1:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7264, "total_steps": 17941, "loss": 1.5745, "learning_rate": 6.623962752330627e-05, "epoch": 0.4048826709770916, "percentage": 40.49, "elapsed_time": "17:11:15", "remaining_time": "1 day, 1:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7265, "total_steps": 17941, "loss": 1.621, "learning_rate": 6.623120577019396e-05, "epoch": 0.4049384092302547, "percentage": 40.49, "elapsed_time": "17:11:23", "remaining_time": "1 day, 1:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7266, "total_steps": 17941, "loss": 1.8571, "learning_rate": 6.622278350232246e-05, "epoch": 0.4049941474834179, "percentage": 40.5, "elapsed_time": "17:11:32", "remaining_time": "1 day, 1:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7267, "total_steps": 17941, "loss": 1.5815, "learning_rate": 6.621436071995884e-05, "epoch": 0.405049885736581, "percentage": 40.5, "elapsed_time": "17:11:40", "remaining_time": "1 day, 1:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7268, "total_steps": 17941, "loss": 1.7069, "learning_rate": 6.620593742337022e-05, "epoch": 0.40510562398974415, "percentage": 40.51, "elapsed_time": "17:11:49", "remaining_time": "1 day, 1:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7269, "total_steps": 17941, "loss": 1.5408, "learning_rate": 6.619751361282377e-05, "epoch": 0.40516136224290733, "percentage": 40.52, "elapsed_time": "17:11:58", "remaining_time": "1 day, 1:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7270, "total_steps": 17941, "loss": 1.7405, "learning_rate": 6.618908928858663e-05, "epoch": 0.40521710049607046, "percentage": 40.52, "elapsed_time": "17:12:07", "remaining_time": "1 day, 1:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7271, "total_steps": 17941, "loss": 1.5968, "learning_rate": 6.618066445092595e-05, "epoch": 0.4052728387492336, "percentage": 40.53, "elapsed_time": "17:12:15", "remaining_time": "1 day, 1:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7272, "total_steps": 17941, "loss": 1.8194, "learning_rate": 6.617223910010896e-05, "epoch": 0.4053285770023967, "percentage": 40.53, "elapsed_time": "17:12:24", "remaining_time": "1 day, 1:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7273, "total_steps": 17941, "loss": 1.4983, "learning_rate": 6.61638132364028e-05, "epoch": 0.4053843152555599, "percentage": 40.54, "elapsed_time": "17:12:32", "remaining_time": "1 day, 1:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7274, "total_steps": 17941, "loss": 1.6838, "learning_rate": 6.615538686007476e-05, "epoch": 0.40544005350872303, "percentage": 40.54, "elapsed_time": "17:12:41", "remaining_time": "1 day, 1:14:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7275, "total_steps": 17941, "loss": 1.87, "learning_rate": 6.614695997139202e-05, "epoch": 0.40549579176188616, "percentage": 40.55, "elapsed_time": "17:12:49", "remaining_time": "1 day, 1:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7276, "total_steps": 17941, "loss": 1.839, "learning_rate": 6.613853257062186e-05, "epoch": 0.40555153001504934, "percentage": 40.56, "elapsed_time": "17:12:58", "remaining_time": "1 day, 1:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7277, "total_steps": 17941, "loss": 1.7833, "learning_rate": 6.613010465803153e-05, "epoch": 0.4056072682682125, "percentage": 40.56, "elapsed_time": "17:13:06", "remaining_time": "1 day, 1:13:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7278, "total_steps": 17941, "loss": 1.8361, "learning_rate": 6.612167623388834e-05, "epoch": 0.4056630065213756, "percentage": 40.57, "elapsed_time": "17:13:15", "remaining_time": "1 day, 1:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7279, "total_steps": 17941, "loss": 1.8218, "learning_rate": 6.611324729845958e-05, "epoch": 0.4057187447745388, "percentage": 40.57, "elapsed_time": "17:13:24", "remaining_time": "1 day, 1:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7280, "total_steps": 17941, "loss": 1.6214, "learning_rate": 6.610481785201254e-05, "epoch": 0.4057744830277019, "percentage": 40.58, "elapsed_time": "17:13:32", "remaining_time": "1 day, 1:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7281, "total_steps": 17941, "loss": 1.5644, "learning_rate": 6.60963878948146e-05, "epoch": 0.40583022128086504, "percentage": 40.58, "elapsed_time": "17:13:40", "remaining_time": "1 day, 1:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7282, "total_steps": 17941, "loss": 1.6407, "learning_rate": 6.608795742713306e-05, "epoch": 0.40588595953402823, "percentage": 40.59, "elapsed_time": "17:13:49", "remaining_time": "1 day, 1:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7283, "total_steps": 17941, "loss": 1.6906, "learning_rate": 6.607952644923534e-05, "epoch": 0.40594169778719136, "percentage": 40.59, "elapsed_time": "17:13:57", "remaining_time": "1 day, 1:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7284, "total_steps": 17941, "loss": 1.5545, "learning_rate": 6.607109496138877e-05, "epoch": 0.4059974360403545, "percentage": 40.6, "elapsed_time": "17:14:06", "remaining_time": "1 day, 1:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7285, "total_steps": 17941, "loss": 1.3279, "learning_rate": 6.606266296386078e-05, "epoch": 0.4060531742935176, "percentage": 40.61, "elapsed_time": "17:14:15", "remaining_time": "1 day, 1:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7286, "total_steps": 17941, "loss": 1.6515, "learning_rate": 6.605423045691875e-05, "epoch": 0.4061089125466808, "percentage": 40.61, "elapsed_time": "17:14:24", "remaining_time": "1 day, 1:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7287, "total_steps": 17941, "loss": 1.7375, "learning_rate": 6.604579744083015e-05, "epoch": 0.40616465079984393, "percentage": 40.62, "elapsed_time": "17:14:32", "remaining_time": "1 day, 1:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7288, "total_steps": 17941, "loss": 1.3345, "learning_rate": 6.60373639158624e-05, "epoch": 0.40622038905300706, "percentage": 40.62, "elapsed_time": "17:14:41", "remaining_time": "1 day, 1:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7289, "total_steps": 17941, "loss": 1.5881, "learning_rate": 6.602892988228299e-05, "epoch": 0.40627612730617024, "percentage": 40.63, "elapsed_time": "17:14:49", "remaining_time": "1 day, 1:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7290, "total_steps": 17941, "loss": 1.6593, "learning_rate": 6.602049534035937e-05, "epoch": 0.40633186555933337, "percentage": 40.63, "elapsed_time": "17:14:58", "remaining_time": "1 day, 1:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7291, "total_steps": 17941, "loss": 1.7801, "learning_rate": 6.601206029035904e-05, "epoch": 0.4063876038124965, "percentage": 40.64, "elapsed_time": "17:15:06", "remaining_time": "1 day, 1:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7292, "total_steps": 17941, "loss": 1.8566, "learning_rate": 6.60036247325495e-05, "epoch": 0.4064433420656597, "percentage": 40.64, "elapsed_time": "17:15:15", "remaining_time": "1 day, 1:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7293, "total_steps": 17941, "loss": 1.6081, "learning_rate": 6.599518866719831e-05, "epoch": 0.4064990803188228, "percentage": 40.65, "elapsed_time": "17:15:24", "remaining_time": "1 day, 1:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7294, "total_steps": 17941, "loss": 1.5883, "learning_rate": 6.5986752094573e-05, "epoch": 0.40655481857198594, "percentage": 40.66, "elapsed_time": "17:15:32", "remaining_time": "1 day, 1:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7295, "total_steps": 17941, "loss": 1.7286, "learning_rate": 6.59783150149411e-05, "epoch": 0.4066105568251491, "percentage": 40.66, "elapsed_time": "17:15:41", "remaining_time": "1 day, 1:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7296, "total_steps": 17941, "loss": 1.782, "learning_rate": 6.596987742857024e-05, "epoch": 0.40666629507831226, "percentage": 40.67, "elapsed_time": "17:15:49", "remaining_time": "1 day, 1:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7297, "total_steps": 17941, "loss": 1.6989, "learning_rate": 6.596143933572795e-05, "epoch": 0.4067220333314754, "percentage": 40.67, "elapsed_time": "17:15:58", "remaining_time": "1 day, 1:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7298, "total_steps": 17941, "loss": 1.7724, "learning_rate": 6.595300073668188e-05, "epoch": 0.4067777715846385, "percentage": 40.68, "elapsed_time": "17:16:06", "remaining_time": "1 day, 1:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7299, "total_steps": 17941, "loss": 1.7927, "learning_rate": 6.594456163169963e-05, "epoch": 0.4068335098378017, "percentage": 40.68, "elapsed_time": "17:16:14", "remaining_time": "1 day, 1:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7300, "total_steps": 17941, "loss": 1.9269, "learning_rate": 6.593612202104885e-05, "epoch": 0.40688924809096483, "percentage": 40.69, "elapsed_time": "17:16:23", "remaining_time": "1 day, 1:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7301, "total_steps": 17941, "loss": 1.6254, "learning_rate": 6.59276819049972e-05, "epoch": 0.40694498634412796, "percentage": 40.69, "elapsed_time": "17:16:32", "remaining_time": "1 day, 1:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7302, "total_steps": 17941, "loss": 2.2446, "learning_rate": 6.591924128381234e-05, "epoch": 0.40700072459729114, "percentage": 40.7, "elapsed_time": "17:16:41", "remaining_time": "1 day, 1:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7303, "total_steps": 17941, "loss": 1.7268, "learning_rate": 6.591080015776196e-05, "epoch": 0.40705646285045427, "percentage": 40.71, "elapsed_time": "17:16:50", "remaining_time": "1 day, 1:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7304, "total_steps": 17941, "loss": 1.5403, "learning_rate": 6.590235852711377e-05, "epoch": 0.4071122011036174, "percentage": 40.71, "elapsed_time": "17:16:58", "remaining_time": "1 day, 1:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7305, "total_steps": 17941, "loss": 1.7487, "learning_rate": 6.589391639213549e-05, "epoch": 0.4071679393567806, "percentage": 40.72, "elapsed_time": "17:17:07", "remaining_time": "1 day, 1:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7306, "total_steps": 17941, "loss": 1.8118, "learning_rate": 6.588547375309484e-05, "epoch": 0.4072236776099437, "percentage": 40.72, "elapsed_time": "17:17:15", "remaining_time": "1 day, 1:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7307, "total_steps": 17941, "loss": 1.7792, "learning_rate": 6.587703061025959e-05, "epoch": 0.40727941586310684, "percentage": 40.73, "elapsed_time": "17:17:24", "remaining_time": "1 day, 1:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7308, "total_steps": 17941, "loss": 1.8367, "learning_rate": 6.586858696389748e-05, "epoch": 0.40733515411626997, "percentage": 40.73, "elapsed_time": "17:17:32", "remaining_time": "1 day, 1:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7309, "total_steps": 17941, "loss": 1.8874, "learning_rate": 6.586014281427632e-05, "epoch": 0.40739089236943316, "percentage": 40.74, "elapsed_time": "17:17:41", "remaining_time": "1 day, 1:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7310, "total_steps": 17941, "loss": 1.6405, "learning_rate": 6.585169816166392e-05, "epoch": 0.4074466306225963, "percentage": 40.74, "elapsed_time": "17:17:49", "remaining_time": "1 day, 1:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7311, "total_steps": 17941, "loss": 1.7544, "learning_rate": 6.584325300632806e-05, "epoch": 0.4075023688757594, "percentage": 40.75, "elapsed_time": "17:17:58", "remaining_time": "1 day, 1:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7312, "total_steps": 17941, "loss": 1.6416, "learning_rate": 6.583480734853658e-05, "epoch": 0.4075581071289226, "percentage": 40.76, "elapsed_time": "17:18:06", "remaining_time": "1 day, 1:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7313, "total_steps": 17941, "loss": 1.7322, "learning_rate": 6.582636118855735e-05, "epoch": 0.4076138453820857, "percentage": 40.76, "elapsed_time": "17:18:15", "remaining_time": "1 day, 1:08:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7314, "total_steps": 17941, "loss": 1.7432, "learning_rate": 6.58179145266582e-05, "epoch": 0.40766958363524886, "percentage": 40.77, "elapsed_time": "17:18:23", "remaining_time": "1 day, 1:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7315, "total_steps": 17941, "loss": 1.6643, "learning_rate": 6.580946736310704e-05, "epoch": 0.40772532188841204, "percentage": 40.77, "elapsed_time": "17:18:32", "remaining_time": "1 day, 1:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7316, "total_steps": 17941, "loss": 1.8664, "learning_rate": 6.580101969817175e-05, "epoch": 0.40778106014157517, "percentage": 40.78, "elapsed_time": "17:18:40", "remaining_time": "1 day, 1:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7317, "total_steps": 17941, "loss": 1.8217, "learning_rate": 6.579257153212024e-05, "epoch": 0.4078367983947383, "percentage": 40.78, "elapsed_time": "17:18:49", "remaining_time": "1 day, 1:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7318, "total_steps": 17941, "loss": 1.5422, "learning_rate": 6.578412286522044e-05, "epoch": 0.4078925366479015, "percentage": 40.79, "elapsed_time": "17:18:57", "remaining_time": "1 day, 1:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7319, "total_steps": 17941, "loss": 1.753, "learning_rate": 6.57756736977403e-05, "epoch": 0.4079482749010646, "percentage": 40.79, "elapsed_time": "17:19:06", "remaining_time": "1 day, 1:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7320, "total_steps": 17941, "loss": 1.5805, "learning_rate": 6.576722402994775e-05, "epoch": 0.40800401315422774, "percentage": 40.8, "elapsed_time": "17:19:14", "remaining_time": "1 day, 1:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7321, "total_steps": 17941, "loss": 1.742, "learning_rate": 6.575877386211077e-05, "epoch": 0.40805975140739087, "percentage": 40.81, "elapsed_time": "17:19:23", "remaining_time": "1 day, 1:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7322, "total_steps": 17941, "loss": 1.7166, "learning_rate": 6.57503231944974e-05, "epoch": 0.40811548966055405, "percentage": 40.81, "elapsed_time": "17:19:31", "remaining_time": "1 day, 1:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7323, "total_steps": 17941, "loss": 1.8698, "learning_rate": 6.574187202737558e-05, "epoch": 0.4081712279137172, "percentage": 40.82, "elapsed_time": "17:19:40", "remaining_time": "1 day, 1:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7324, "total_steps": 17941, "loss": 1.5871, "learning_rate": 6.573342036101339e-05, "epoch": 0.4082269661668803, "percentage": 40.82, "elapsed_time": "17:19:48", "remaining_time": "1 day, 1:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7325, "total_steps": 17941, "loss": 1.6091, "learning_rate": 6.572496819567882e-05, "epoch": 0.4082827044200435, "percentage": 40.83, "elapsed_time": "17:19:57", "remaining_time": "1 day, 1:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7326, "total_steps": 17941, "loss": 1.9233, "learning_rate": 6.571651553163994e-05, "epoch": 0.4083384426732066, "percentage": 40.83, "elapsed_time": "17:20:05", "remaining_time": "1 day, 1:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7327, "total_steps": 17941, "loss": 1.681, "learning_rate": 6.570806236916481e-05, "epoch": 0.40839418092636975, "percentage": 40.84, "elapsed_time": "17:20:14", "remaining_time": "1 day, 1:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7328, "total_steps": 17941, "loss": 1.8081, "learning_rate": 6.569960870852156e-05, "epoch": 0.40844991917953294, "percentage": 40.84, "elapsed_time": "17:20:22", "remaining_time": "1 day, 1:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7329, "total_steps": 17941, "loss": 1.7268, "learning_rate": 6.569115454997823e-05, "epoch": 0.40850565743269607, "percentage": 40.85, "elapsed_time": "17:20:31", "remaining_time": "1 day, 1:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7330, "total_steps": 17941, "loss": 1.9007, "learning_rate": 6.568269989380296e-05, "epoch": 0.4085613956858592, "percentage": 40.86, "elapsed_time": "17:20:39", "remaining_time": "1 day, 1:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7331, "total_steps": 17941, "loss": 1.8163, "learning_rate": 6.56742447402639e-05, "epoch": 0.4086171339390223, "percentage": 40.86, "elapsed_time": "17:20:48", "remaining_time": "1 day, 1:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7332, "total_steps": 17941, "loss": 1.6564, "learning_rate": 6.566578908962918e-05, "epoch": 0.4086728721921855, "percentage": 40.87, "elapsed_time": "17:20:56", "remaining_time": "1 day, 1:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7333, "total_steps": 17941, "loss": 1.3752, "learning_rate": 6.565733294216697e-05, "epoch": 0.40872861044534864, "percentage": 40.87, "elapsed_time": "17:21:05", "remaining_time": "1 day, 1:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7334, "total_steps": 17941, "loss": 1.629, "learning_rate": 6.564887629814543e-05, "epoch": 0.40878434869851177, "percentage": 40.88, "elapsed_time": "17:21:13", "remaining_time": "1 day, 1:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7335, "total_steps": 17941, "loss": 1.6818, "learning_rate": 6.56404191578328e-05, "epoch": 0.40884008695167495, "percentage": 40.88, "elapsed_time": "17:21:22", "remaining_time": "1 day, 1:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7336, "total_steps": 17941, "loss": 1.6562, "learning_rate": 6.563196152149725e-05, "epoch": 0.4088958252048381, "percentage": 40.89, "elapsed_time": "17:21:30", "remaining_time": "1 day, 1:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7337, "total_steps": 17941, "loss": 1.6497, "learning_rate": 6.562350338940704e-05, "epoch": 0.4089515634580012, "percentage": 40.9, "elapsed_time": "17:21:39", "remaining_time": "1 day, 1:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7338, "total_steps": 17941, "loss": 1.5777, "learning_rate": 6.561504476183037e-05, "epoch": 0.4090073017111644, "percentage": 40.9, "elapsed_time": "17:21:47", "remaining_time": "1 day, 1:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7339, "total_steps": 17941, "loss": 1.6048, "learning_rate": 6.560658563903553e-05, "epoch": 0.4090630399643275, "percentage": 40.91, "elapsed_time": "17:21:56", "remaining_time": "1 day, 1:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7340, "total_steps": 17941, "loss": 1.85, "learning_rate": 6.559812602129078e-05, "epoch": 0.40911877821749065, "percentage": 40.91, "elapsed_time": "17:22:04", "remaining_time": "1 day, 1:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7341, "total_steps": 17941, "loss": 1.7366, "learning_rate": 6.558966590886443e-05, "epoch": 0.40917451647065384, "percentage": 40.92, "elapsed_time": "17:22:14", "remaining_time": "1 day, 1:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7342, "total_steps": 17941, "loss": 1.5962, "learning_rate": 6.558120530202476e-05, "epoch": 0.40923025472381697, "percentage": 40.92, "elapsed_time": "17:22:22", "remaining_time": "1 day, 1:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7343, "total_steps": 17941, "loss": 1.6842, "learning_rate": 6.55727442010401e-05, "epoch": 0.4092859929769801, "percentage": 40.93, "elapsed_time": "17:22:30", "remaining_time": "1 day, 1:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7344, "total_steps": 17941, "loss": 1.8824, "learning_rate": 6.55642826061788e-05, "epoch": 0.4093417312301432, "percentage": 40.93, "elapsed_time": "17:22:39", "remaining_time": "1 day, 1:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7345, "total_steps": 17941, "loss": 1.7393, "learning_rate": 6.55558205177092e-05, "epoch": 0.4093974694833064, "percentage": 40.94, "elapsed_time": "17:22:48", "remaining_time": "1 day, 1:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7346, "total_steps": 17941, "loss": 1.6012, "learning_rate": 6.554735793589967e-05, "epoch": 0.40945320773646954, "percentage": 40.95, "elapsed_time": "17:22:56", "remaining_time": "1 day, 1:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7347, "total_steps": 17941, "loss": 1.6051, "learning_rate": 6.553889486101857e-05, "epoch": 0.40950894598963267, "percentage": 40.95, "elapsed_time": "17:23:05", "remaining_time": "1 day, 1:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7348, "total_steps": 17941, "loss": 1.6571, "learning_rate": 6.553043129333436e-05, "epoch": 0.40956468424279585, "percentage": 40.96, "elapsed_time": "17:23:13", "remaining_time": "1 day, 1:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7349, "total_steps": 17941, "loss": 1.6247, "learning_rate": 6.55219672331154e-05, "epoch": 0.409620422495959, "percentage": 40.96, "elapsed_time": "17:23:22", "remaining_time": "1 day, 1:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7350, "total_steps": 17941, "loss": 1.7125, "learning_rate": 6.551350268063015e-05, "epoch": 0.4096761607491221, "percentage": 40.97, "elapsed_time": "17:23:31", "remaining_time": "1 day, 1:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7351, "total_steps": 17941, "loss": 1.9143, "learning_rate": 6.550503763614702e-05, "epoch": 0.4097318990022853, "percentage": 40.97, "elapsed_time": "17:23:39", "remaining_time": "1 day, 1:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7352, "total_steps": 17941, "loss": 1.4884, "learning_rate": 6.549657209993452e-05, "epoch": 0.4097876372554484, "percentage": 40.98, "elapsed_time": "17:23:47", "remaining_time": "1 day, 1:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7353, "total_steps": 17941, "loss": 1.6739, "learning_rate": 6.548810607226109e-05, "epoch": 0.40984337550861155, "percentage": 40.98, "elapsed_time": "17:23:56", "remaining_time": "1 day, 1:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7354, "total_steps": 17941, "loss": 1.8902, "learning_rate": 6.547963955339526e-05, "epoch": 0.4098991137617747, "percentage": 40.99, "elapsed_time": "17:24:04", "remaining_time": "1 day, 1:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7355, "total_steps": 17941, "loss": 1.8688, "learning_rate": 6.547117254360549e-05, "epoch": 0.40995485201493786, "percentage": 41.0, "elapsed_time": "17:24:14", "remaining_time": "1 day, 1:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7356, "total_steps": 17941, "loss": 1.7046, "learning_rate": 6.546270504316033e-05, "epoch": 0.410010590268101, "percentage": 41.0, "elapsed_time": "17:24:22", "remaining_time": "1 day, 1:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7357, "total_steps": 17941, "loss": 1.6008, "learning_rate": 6.545423705232834e-05, "epoch": 0.4100663285212641, "percentage": 41.01, "elapsed_time": "17:24:30", "remaining_time": "1 day, 1:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7358, "total_steps": 17941, "loss": 1.806, "learning_rate": 6.544576857137804e-05, "epoch": 0.4101220667744273, "percentage": 41.01, "elapsed_time": "17:24:39", "remaining_time": "1 day, 1:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7359, "total_steps": 17941, "loss": 1.8252, "learning_rate": 6.543729960057803e-05, "epoch": 0.41017780502759044, "percentage": 41.02, "elapsed_time": "17:24:47", "remaining_time": "1 day, 1:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7360, "total_steps": 17941, "loss": 1.6653, "learning_rate": 6.542883014019686e-05, "epoch": 0.41023354328075357, "percentage": 41.02, "elapsed_time": "17:24:56", "remaining_time": "1 day, 1:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7361, "total_steps": 17941, "loss": 1.7503, "learning_rate": 6.542036019050318e-05, "epoch": 0.41028928153391675, "percentage": 41.03, "elapsed_time": "17:25:04", "remaining_time": "1 day, 1:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7362, "total_steps": 17941, "loss": 2.0138, "learning_rate": 6.541188975176557e-05, "epoch": 0.4103450197870799, "percentage": 41.03, "elapsed_time": "17:25:13", "remaining_time": "1 day, 1:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7363, "total_steps": 17941, "loss": 1.8193, "learning_rate": 6.540341882425267e-05, "epoch": 0.410400758040243, "percentage": 41.04, "elapsed_time": "17:25:21", "remaining_time": "1 day, 1:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7364, "total_steps": 17941, "loss": 1.6905, "learning_rate": 6.539494740823313e-05, "epoch": 0.4104564962934062, "percentage": 41.05, "elapsed_time": "17:25:30", "remaining_time": "1 day, 1:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7365, "total_steps": 17941, "loss": 1.5966, "learning_rate": 6.538647550397563e-05, "epoch": 0.4105122345465693, "percentage": 41.05, "elapsed_time": "17:25:38", "remaining_time": "1 day, 1:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7366, "total_steps": 17941, "loss": 1.9665, "learning_rate": 6.537800311174882e-05, "epoch": 0.41056797279973245, "percentage": 41.06, "elapsed_time": "17:25:47", "remaining_time": "1 day, 1:01:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7367, "total_steps": 17941, "loss": 1.7119, "learning_rate": 6.536953023182143e-05, "epoch": 0.4106237110528956, "percentage": 41.06, "elapsed_time": "17:25:55", "remaining_time": "1 day, 1:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7368, "total_steps": 17941, "loss": 1.8307, "learning_rate": 6.536105686446214e-05, "epoch": 0.41067944930605876, "percentage": 41.07, "elapsed_time": "17:26:04", "remaining_time": "1 day, 1:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7369, "total_steps": 17941, "loss": 1.6834, "learning_rate": 6.535258300993969e-05, "epoch": 0.4107351875592219, "percentage": 41.07, "elapsed_time": "17:26:12", "remaining_time": "1 day, 1:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7370, "total_steps": 17941, "loss": 1.7639, "learning_rate": 6.534410866852283e-05, "epoch": 0.410790925812385, "percentage": 41.08, "elapsed_time": "17:26:21", "remaining_time": "1 day, 1:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7371, "total_steps": 17941, "loss": 1.68, "learning_rate": 6.533563384048029e-05, "epoch": 0.4108466640655482, "percentage": 41.08, "elapsed_time": "17:26:29", "remaining_time": "1 day, 1:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7372, "total_steps": 17941, "loss": 1.6856, "learning_rate": 6.532715852608087e-05, "epoch": 0.41090240231871134, "percentage": 41.09, "elapsed_time": "17:26:38", "remaining_time": "1 day, 1:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7373, "total_steps": 17941, "loss": 1.6829, "learning_rate": 6.531868272559333e-05, "epoch": 0.41095814057187446, "percentage": 41.1, "elapsed_time": "17:26:46", "remaining_time": "1 day, 1:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7374, "total_steps": 17941, "loss": 1.666, "learning_rate": 6.531020643928649e-05, "epoch": 0.41101387882503765, "percentage": 41.1, "elapsed_time": "17:26:55", "remaining_time": "1 day, 1:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7375, "total_steps": 17941, "loss": 1.5504, "learning_rate": 6.530172966742918e-05, "epoch": 0.4110696170782008, "percentage": 41.11, "elapsed_time": "17:27:04", "remaining_time": "1 day, 1:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7376, "total_steps": 17941, "loss": 1.8604, "learning_rate": 6.529325241029022e-05, "epoch": 0.4111253553313639, "percentage": 41.11, "elapsed_time": "17:27:12", "remaining_time": "1 day, 0:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7377, "total_steps": 17941, "loss": 1.5969, "learning_rate": 6.528477466813845e-05, "epoch": 0.41118109358452704, "percentage": 41.12, "elapsed_time": "17:27:20", "remaining_time": "1 day, 0:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7378, "total_steps": 17941, "loss": 1.5824, "learning_rate": 6.527629644124273e-05, "epoch": 0.4112368318376902, "percentage": 41.12, "elapsed_time": "17:27:29", "remaining_time": "1 day, 0:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7379, "total_steps": 17941, "loss": 1.9316, "learning_rate": 6.526781772987197e-05, "epoch": 0.41129257009085335, "percentage": 41.13, "elapsed_time": "17:27:37", "remaining_time": "1 day, 0:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7380, "total_steps": 17941, "loss": 1.6927, "learning_rate": 6.525933853429505e-05, "epoch": 0.4113483083440165, "percentage": 41.13, "elapsed_time": "17:27:46", "remaining_time": "1 day, 0:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7381, "total_steps": 17941, "loss": 1.7149, "learning_rate": 6.525085885478089e-05, "epoch": 0.41140404659717966, "percentage": 41.14, "elapsed_time": "17:27:54", "remaining_time": "1 day, 0:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7382, "total_steps": 17941, "loss": 1.6511, "learning_rate": 6.524237869159838e-05, "epoch": 0.4114597848503428, "percentage": 41.15, "elapsed_time": "17:28:03", "remaining_time": "1 day, 0:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7383, "total_steps": 17941, "loss": 1.5401, "learning_rate": 6.523389804501651e-05, "epoch": 0.4115155231035059, "percentage": 41.15, "elapsed_time": "17:28:11", "remaining_time": "1 day, 0:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7384, "total_steps": 17941, "loss": 1.6796, "learning_rate": 6.52254169153042e-05, "epoch": 0.4115712613566691, "percentage": 41.16, "elapsed_time": "17:28:20", "remaining_time": "1 day, 0:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7385, "total_steps": 17941, "loss": 1.7729, "learning_rate": 6.521693530273045e-05, "epoch": 0.41162699960983223, "percentage": 41.16, "elapsed_time": "17:28:28", "remaining_time": "1 day, 0:58:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7386, "total_steps": 17941, "loss": 1.6136, "learning_rate": 6.520845320756421e-05, "epoch": 0.41168273786299536, "percentage": 41.17, "elapsed_time": "17:28:37", "remaining_time": "1 day, 0:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7387, "total_steps": 17941, "loss": 1.5817, "learning_rate": 6.519997063007452e-05, "epoch": 0.41173847611615855, "percentage": 41.17, "elapsed_time": "17:28:45", "remaining_time": "1 day, 0:58:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7388, "total_steps": 17941, "loss": 1.6962, "learning_rate": 6.51914875705304e-05, "epoch": 0.4117942143693217, "percentage": 41.18, "elapsed_time": "17:28:55", "remaining_time": "1 day, 0:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7389, "total_steps": 17941, "loss": 2.035, "learning_rate": 6.518300402920084e-05, "epoch": 0.4118499526224848, "percentage": 41.18, "elapsed_time": "17:29:03", "remaining_time": "1 day, 0:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7390, "total_steps": 17941, "loss": 1.1806, "learning_rate": 6.517452000635493e-05, "epoch": 0.41190569087564793, "percentage": 41.19, "elapsed_time": "17:29:12", "remaining_time": "1 day, 0:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7391, "total_steps": 17941, "loss": 1.7513, "learning_rate": 6.516603550226171e-05, "epoch": 0.4119614291288111, "percentage": 41.2, "elapsed_time": "17:29:20", "remaining_time": "1 day, 0:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7392, "total_steps": 17941, "loss": 1.8616, "learning_rate": 6.515755051719026e-05, "epoch": 0.41201716738197425, "percentage": 41.2, "elapsed_time": "17:29:29", "remaining_time": "1 day, 0:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7393, "total_steps": 17941, "loss": 1.7594, "learning_rate": 6.51490650514097e-05, "epoch": 0.4120729056351374, "percentage": 41.21, "elapsed_time": "17:29:37", "remaining_time": "1 day, 0:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7394, "total_steps": 17941, "loss": 1.5641, "learning_rate": 6.514057910518913e-05, "epoch": 0.41212864388830056, "percentage": 41.21, "elapsed_time": "17:29:46", "remaining_time": "1 day, 0:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7395, "total_steps": 17941, "loss": 1.6398, "learning_rate": 6.513209267879765e-05, "epoch": 0.4121843821414637, "percentage": 41.22, "elapsed_time": "17:29:54", "remaining_time": "1 day, 0:57:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7396, "total_steps": 17941, "loss": 1.4485, "learning_rate": 6.512360577250443e-05, "epoch": 0.4122401203946268, "percentage": 41.22, "elapsed_time": "17:30:02", "remaining_time": "1 day, 0:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7397, "total_steps": 17941, "loss": 1.6851, "learning_rate": 6.511511838657859e-05, "epoch": 0.41229585864779, "percentage": 41.23, "elapsed_time": "17:30:11", "remaining_time": "1 day, 0:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7398, "total_steps": 17941, "loss": 1.6724, "learning_rate": 6.510663052128934e-05, "epoch": 0.41235159690095313, "percentage": 41.24, "elapsed_time": "17:30:20", "remaining_time": "1 day, 0:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7399, "total_steps": 17941, "loss": 1.7999, "learning_rate": 6.509814217690582e-05, "epoch": 0.41240733515411626, "percentage": 41.24, "elapsed_time": "17:30:28", "remaining_time": "1 day, 0:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7400, "total_steps": 17941, "loss": 1.5216, "learning_rate": 6.508965335369729e-05, "epoch": 0.4124630734072794, "percentage": 41.25, "elapsed_time": "17:30:37", "remaining_time": "1 day, 0:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7401, "total_steps": 17941, "loss": 1.5396, "learning_rate": 6.508116405193292e-05, "epoch": 0.4125188116604426, "percentage": 41.25, "elapsed_time": "17:30:45", "remaining_time": "1 day, 0:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7402, "total_steps": 17941, "loss": 1.7238, "learning_rate": 6.507267427188197e-05, "epoch": 0.4125745499136057, "percentage": 41.26, "elapsed_time": "17:30:54", "remaining_time": "1 day, 0:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7403, "total_steps": 17941, "loss": 1.7004, "learning_rate": 6.506418401381365e-05, "epoch": 0.41263028816676883, "percentage": 41.26, "elapsed_time": "17:31:02", "remaining_time": "1 day, 0:56:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7404, "total_steps": 17941, "loss": 1.5875, "learning_rate": 6.505569327799726e-05, "epoch": 0.412686026419932, "percentage": 41.27, "elapsed_time": "17:31:11", "remaining_time": "1 day, 0:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7405, "total_steps": 17941, "loss": 1.806, "learning_rate": 6.504720206470205e-05, "epoch": 0.41274176467309515, "percentage": 41.27, "elapsed_time": "17:31:19", "remaining_time": "1 day, 0:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7406, "total_steps": 17941, "loss": 1.6241, "learning_rate": 6.503871037419731e-05, "epoch": 0.4127975029262583, "percentage": 41.28, "elapsed_time": "17:31:28", "remaining_time": "1 day, 0:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7407, "total_steps": 17941, "loss": 1.5105, "learning_rate": 6.50302182067524e-05, "epoch": 0.41285324117942146, "percentage": 41.29, "elapsed_time": "17:31:36", "remaining_time": "1 day, 0:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7408, "total_steps": 17941, "loss": 1.6661, "learning_rate": 6.502172556263656e-05, "epoch": 0.4129089794325846, "percentage": 41.29, "elapsed_time": "17:31:45", "remaining_time": "1 day, 0:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7409, "total_steps": 17941, "loss": 1.5414, "learning_rate": 6.501323244211919e-05, "epoch": 0.4129647176857477, "percentage": 41.3, "elapsed_time": "17:31:53", "remaining_time": "1 day, 0:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7410, "total_steps": 17941, "loss": 1.7312, "learning_rate": 6.500473884546962e-05, "epoch": 0.4130204559389109, "percentage": 41.3, "elapsed_time": "17:32:02", "remaining_time": "1 day, 0:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7411, "total_steps": 17941, "loss": 1.4628, "learning_rate": 6.499624477295722e-05, "epoch": 0.41307619419207403, "percentage": 41.31, "elapsed_time": "17:32:10", "remaining_time": "1 day, 0:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7412, "total_steps": 17941, "loss": 1.7568, "learning_rate": 6.498775022485134e-05, "epoch": 0.41313193244523716, "percentage": 41.31, "elapsed_time": "17:32:19", "remaining_time": "1 day, 0:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7413, "total_steps": 17941, "loss": 1.8805, "learning_rate": 6.497925520142143e-05, "epoch": 0.4131876706984003, "percentage": 41.32, "elapsed_time": "17:32:27", "remaining_time": "1 day, 0:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7414, "total_steps": 17941, "loss": 1.8406, "learning_rate": 6.497075970293688e-05, "epoch": 0.4132434089515635, "percentage": 41.32, "elapsed_time": "17:32:36", "remaining_time": "1 day, 0:54:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7415, "total_steps": 17941, "loss": 1.8577, "learning_rate": 6.496226372966711e-05, "epoch": 0.4132991472047266, "percentage": 41.33, "elapsed_time": "17:32:44", "remaining_time": "1 day, 0:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7416, "total_steps": 17941, "loss": 1.5441, "learning_rate": 6.495376728188159e-05, "epoch": 0.41335488545788973, "percentage": 41.34, "elapsed_time": "17:32:53", "remaining_time": "1 day, 0:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7417, "total_steps": 17941, "loss": 1.7383, "learning_rate": 6.494527035984974e-05, "epoch": 0.4134106237110529, "percentage": 41.34, "elapsed_time": "17:33:01", "remaining_time": "1 day, 0:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7418, "total_steps": 17941, "loss": 1.7542, "learning_rate": 6.493677296384106e-05, "epoch": 0.41346636196421604, "percentage": 41.35, "elapsed_time": "17:33:09", "remaining_time": "1 day, 0:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7419, "total_steps": 17941, "loss": 1.887, "learning_rate": 6.492827509412501e-05, "epoch": 0.4135221002173792, "percentage": 41.35, "elapsed_time": "17:33:18", "remaining_time": "1 day, 0:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7420, "total_steps": 17941, "loss": 1.6247, "learning_rate": 6.491977675097114e-05, "epoch": 0.41357783847054236, "percentage": 41.36, "elapsed_time": "17:33:27", "remaining_time": "1 day, 0:53:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7421, "total_steps": 17941, "loss": 1.7428, "learning_rate": 6.491127793464893e-05, "epoch": 0.4136335767237055, "percentage": 41.36, "elapsed_time": "17:33:36", "remaining_time": "1 day, 0:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7422, "total_steps": 17941, "loss": 1.6937, "learning_rate": 6.490277864542792e-05, "epoch": 0.4136893149768686, "percentage": 41.37, "elapsed_time": "17:33:44", "remaining_time": "1 day, 0:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7423, "total_steps": 17941, "loss": 1.7254, "learning_rate": 6.489427888357765e-05, "epoch": 0.41374505323003175, "percentage": 41.37, "elapsed_time": "17:33:53", "remaining_time": "1 day, 0:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7424, "total_steps": 17941, "loss": 1.6893, "learning_rate": 6.488577864936771e-05, "epoch": 0.41380079148319493, "percentage": 41.38, "elapsed_time": "17:34:01", "remaining_time": "1 day, 0:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7425, "total_steps": 17941, "loss": 1.5928, "learning_rate": 6.487727794306765e-05, "epoch": 0.41385652973635806, "percentage": 41.39, "elapsed_time": "17:34:09", "remaining_time": "1 day, 0:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7426, "total_steps": 17941, "loss": 1.5923, "learning_rate": 6.48687767649471e-05, "epoch": 0.4139122679895212, "percentage": 41.39, "elapsed_time": "17:34:18", "remaining_time": "1 day, 0:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7427, "total_steps": 17941, "loss": 1.5783, "learning_rate": 6.48602751152756e-05, "epoch": 0.41396800624268437, "percentage": 41.4, "elapsed_time": "17:34:26", "remaining_time": "1 day, 0:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7428, "total_steps": 17941, "loss": 1.7081, "learning_rate": 6.485177299432284e-05, "epoch": 0.4140237444958475, "percentage": 41.4, "elapsed_time": "17:34:35", "remaining_time": "1 day, 0:52:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7429, "total_steps": 17941, "loss": 1.8141, "learning_rate": 6.484327040235844e-05, "epoch": 0.41407948274901063, "percentage": 41.41, "elapsed_time": "17:34:43", "remaining_time": "1 day, 0:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7430, "total_steps": 17941, "loss": 1.8114, "learning_rate": 6.483476733965202e-05, "epoch": 0.4141352210021738, "percentage": 41.41, "elapsed_time": "17:34:52", "remaining_time": "1 day, 0:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7431, "total_steps": 17941, "loss": 1.8538, "learning_rate": 6.48262638064733e-05, "epoch": 0.41419095925533694, "percentage": 41.42, "elapsed_time": "17:35:01", "remaining_time": "1 day, 0:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7432, "total_steps": 17941, "loss": 1.8671, "learning_rate": 6.48177598030919e-05, "epoch": 0.4142466975085001, "percentage": 41.42, "elapsed_time": "17:35:09", "remaining_time": "1 day, 0:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7433, "total_steps": 17941, "loss": 1.6247, "learning_rate": 6.480925532977758e-05, "epoch": 0.41430243576166326, "percentage": 41.43, "elapsed_time": "17:35:18", "remaining_time": "1 day, 0:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7434, "total_steps": 17941, "loss": 1.6946, "learning_rate": 6.480075038680002e-05, "epoch": 0.4143581740148264, "percentage": 41.44, "elapsed_time": "17:35:26", "remaining_time": "1 day, 0:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7435, "total_steps": 17941, "loss": 1.9345, "learning_rate": 6.479224497442897e-05, "epoch": 0.4144139122679895, "percentage": 41.44, "elapsed_time": "17:35:35", "remaining_time": "1 day, 0:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7436, "total_steps": 17941, "loss": 1.8108, "learning_rate": 6.478373909293412e-05, "epoch": 0.41446965052115264, "percentage": 41.45, "elapsed_time": "17:35:44", "remaining_time": "1 day, 0:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7437, "total_steps": 17941, "loss": 1.6404, "learning_rate": 6.477523274258528e-05, "epoch": 0.41452538877431583, "percentage": 41.45, "elapsed_time": "17:35:52", "remaining_time": "1 day, 0:51:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7438, "total_steps": 17941, "loss": 1.8287, "learning_rate": 6.47667259236522e-05, "epoch": 0.41458112702747896, "percentage": 41.46, "elapsed_time": "17:36:01", "remaining_time": "1 day, 0:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7439, "total_steps": 17941, "loss": 1.8535, "learning_rate": 6.475821863640467e-05, "epoch": 0.4146368652806421, "percentage": 41.46, "elapsed_time": "17:36:10", "remaining_time": "1 day, 0:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7440, "total_steps": 17941, "loss": 1.3973, "learning_rate": 6.474971088111248e-05, "epoch": 0.41469260353380527, "percentage": 41.47, "elapsed_time": "17:36:18", "remaining_time": "1 day, 0:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7441, "total_steps": 17941, "loss": 1.5271, "learning_rate": 6.474120265804549e-05, "epoch": 0.4147483417869684, "percentage": 41.47, "elapsed_time": "17:36:27", "remaining_time": "1 day, 0:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7442, "total_steps": 17941, "loss": 1.6953, "learning_rate": 6.473269396747346e-05, "epoch": 0.41480408004013153, "percentage": 41.48, "elapsed_time": "17:36:35", "remaining_time": "1 day, 0:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7443, "total_steps": 17941, "loss": 1.7807, "learning_rate": 6.47241848096663e-05, "epoch": 0.4148598182932947, "percentage": 41.49, "elapsed_time": "17:36:44", "remaining_time": "1 day, 0:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7444, "total_steps": 17941, "loss": 2.0551, "learning_rate": 6.471567518489383e-05, "epoch": 0.41491555654645784, "percentage": 41.49, "elapsed_time": "17:36:53", "remaining_time": "1 day, 0:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7445, "total_steps": 17941, "loss": 1.6525, "learning_rate": 6.470716509342594e-05, "epoch": 0.41497129479962097, "percentage": 41.5, "elapsed_time": "17:37:02", "remaining_time": "1 day, 0:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7446, "total_steps": 17941, "loss": 1.7753, "learning_rate": 6.469865453553254e-05, "epoch": 0.4150270330527841, "percentage": 41.5, "elapsed_time": "17:37:10", "remaining_time": "1 day, 0:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7447, "total_steps": 17941, "loss": 1.6718, "learning_rate": 6.46901435114835e-05, "epoch": 0.4150827713059473, "percentage": 41.51, "elapsed_time": "17:37:19", "remaining_time": "1 day, 0:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7448, "total_steps": 17941, "loss": 1.7607, "learning_rate": 6.468163202154877e-05, "epoch": 0.4151385095591104, "percentage": 41.51, "elapsed_time": "17:37:27", "remaining_time": "1 day, 0:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7449, "total_steps": 17941, "loss": 1.8854, "learning_rate": 6.467312006599828e-05, "epoch": 0.41519424781227354, "percentage": 41.52, "elapsed_time": "17:37:36", "remaining_time": "1 day, 0:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7450, "total_steps": 17941, "loss": 1.6298, "learning_rate": 6.466460764510196e-05, "epoch": 0.4152499860654367, "percentage": 41.52, "elapsed_time": "17:37:44", "remaining_time": "1 day, 0:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7451, "total_steps": 17941, "loss": 1.5961, "learning_rate": 6.465609475912977e-05, "epoch": 0.41530572431859986, "percentage": 41.53, "elapsed_time": "17:37:53", "remaining_time": "1 day, 0:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7452, "total_steps": 17941, "loss": 1.6091, "learning_rate": 6.464758140835173e-05, "epoch": 0.415361462571763, "percentage": 41.54, "elapsed_time": "17:38:02", "remaining_time": "1 day, 0:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7453, "total_steps": 17941, "loss": 1.6807, "learning_rate": 6.463906759303779e-05, "epoch": 0.41541720082492617, "percentage": 41.54, "elapsed_time": "17:38:11", "remaining_time": "1 day, 0:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7454, "total_steps": 17941, "loss": 1.8693, "learning_rate": 6.463055331345798e-05, "epoch": 0.4154729390780893, "percentage": 41.55, "elapsed_time": "17:38:19", "remaining_time": "1 day, 0:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7455, "total_steps": 17941, "loss": 1.5473, "learning_rate": 6.462203856988233e-05, "epoch": 0.4155286773312524, "percentage": 41.55, "elapsed_time": "17:38:28", "remaining_time": "1 day, 0:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7456, "total_steps": 17941, "loss": 1.5523, "learning_rate": 6.461352336258088e-05, "epoch": 0.4155844155844156, "percentage": 41.56, "elapsed_time": "17:38:37", "remaining_time": "1 day, 0:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7457, "total_steps": 17941, "loss": 1.6515, "learning_rate": 6.460500769182365e-05, "epoch": 0.41564015383757874, "percentage": 41.56, "elapsed_time": "17:38:46", "remaining_time": "1 day, 0:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7458, "total_steps": 17941, "loss": 1.6962, "learning_rate": 6.459649155788075e-05, "epoch": 0.41569589209074187, "percentage": 41.57, "elapsed_time": "17:38:54", "remaining_time": "1 day, 0:48:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7459, "total_steps": 17941, "loss": 1.5808, "learning_rate": 6.458797496102222e-05, "epoch": 0.415751630343905, "percentage": 41.58, "elapsed_time": "17:39:03", "remaining_time": "1 day, 0:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7460, "total_steps": 17941, "loss": 1.6652, "learning_rate": 6.45794579015182e-05, "epoch": 0.4158073685970682, "percentage": 41.58, "elapsed_time": "17:39:11", "remaining_time": "1 day, 0:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7461, "total_steps": 17941, "loss": 1.5447, "learning_rate": 6.457094037963877e-05, "epoch": 0.4158631068502313, "percentage": 41.59, "elapsed_time": "17:39:20", "remaining_time": "1 day, 0:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7462, "total_steps": 17941, "loss": 1.8373, "learning_rate": 6.456242239565405e-05, "epoch": 0.41591884510339444, "percentage": 41.59, "elapsed_time": "17:39:28", "remaining_time": "1 day, 0:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7463, "total_steps": 17941, "loss": 1.7338, "learning_rate": 6.455390394983422e-05, "epoch": 0.4159745833565576, "percentage": 41.6, "elapsed_time": "17:39:37", "remaining_time": "1 day, 0:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7464, "total_steps": 17941, "loss": 1.5552, "learning_rate": 6.454538504244938e-05, "epoch": 0.41603032160972075, "percentage": 41.6, "elapsed_time": "17:39:45", "remaining_time": "1 day, 0:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7465, "total_steps": 17941, "loss": 1.692, "learning_rate": 6.453686567376976e-05, "epoch": 0.4160860598628839, "percentage": 41.61, "elapsed_time": "17:39:54", "remaining_time": "1 day, 0:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7466, "total_steps": 17941, "loss": 1.6676, "learning_rate": 6.45283458440655e-05, "epoch": 0.41614179811604707, "percentage": 41.61, "elapsed_time": "17:40:03", "remaining_time": "1 day, 0:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7467, "total_steps": 17941, "loss": 1.6982, "learning_rate": 6.451982555360682e-05, "epoch": 0.4161975363692102, "percentage": 41.62, "elapsed_time": "17:40:12", "remaining_time": "1 day, 0:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7468, "total_steps": 17941, "loss": 1.762, "learning_rate": 6.451130480266395e-05, "epoch": 0.4162532746223733, "percentage": 41.63, "elapsed_time": "17:40:20", "remaining_time": "1 day, 0:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7469, "total_steps": 17941, "loss": 1.5914, "learning_rate": 6.450278359150708e-05, "epoch": 0.41630901287553645, "percentage": 41.63, "elapsed_time": "17:40:29", "remaining_time": "1 day, 0:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7470, "total_steps": 17941, "loss": 1.909, "learning_rate": 6.449426192040649e-05, "epoch": 0.41636475112869964, "percentage": 41.64, "elapsed_time": "17:40:38", "remaining_time": "1 day, 0:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7471, "total_steps": 17941, "loss": 1.8037, "learning_rate": 6.448573978963239e-05, "epoch": 0.41642048938186277, "percentage": 41.64, "elapsed_time": "17:40:47", "remaining_time": "1 day, 0:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7472, "total_steps": 17941, "loss": 1.5707, "learning_rate": 6.44772171994551e-05, "epoch": 0.4164762276350259, "percentage": 41.65, "elapsed_time": "17:40:55", "remaining_time": "1 day, 0:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7473, "total_steps": 17941, "loss": 1.6062, "learning_rate": 6.446869415014488e-05, "epoch": 0.4165319658881891, "percentage": 41.65, "elapsed_time": "17:41:04", "remaining_time": "1 day, 0:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7474, "total_steps": 17941, "loss": 1.7973, "learning_rate": 6.446017064197205e-05, "epoch": 0.4165877041413522, "percentage": 41.66, "elapsed_time": "17:41:13", "remaining_time": "1 day, 0:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7475, "total_steps": 17941, "loss": 1.751, "learning_rate": 6.445164667520691e-05, "epoch": 0.41664344239451534, "percentage": 41.66, "elapsed_time": "17:41:21", "remaining_time": "1 day, 0:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7476, "total_steps": 17941, "loss": 1.5348, "learning_rate": 6.44431222501198e-05, "epoch": 0.4166991806476785, "percentage": 41.67, "elapsed_time": "17:41:30", "remaining_time": "1 day, 0:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7477, "total_steps": 17941, "loss": 1.7648, "learning_rate": 6.443459736698105e-05, "epoch": 0.41675491890084165, "percentage": 41.68, "elapsed_time": "17:41:38", "remaining_time": "1 day, 0:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7478, "total_steps": 17941, "loss": 1.5702, "learning_rate": 6.442607202606104e-05, "epoch": 0.4168106571540048, "percentage": 41.68, "elapsed_time": "17:41:47", "remaining_time": "1 day, 0:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7479, "total_steps": 17941, "loss": 1.5624, "learning_rate": 6.441754622763015e-05, "epoch": 0.41686639540716797, "percentage": 41.69, "elapsed_time": "17:41:55", "remaining_time": "1 day, 0:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7480, "total_steps": 17941, "loss": 1.8265, "learning_rate": 6.440901997195871e-05, "epoch": 0.4169221336603311, "percentage": 41.69, "elapsed_time": "17:42:04", "remaining_time": "1 day, 0:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7481, "total_steps": 17941, "loss": 1.6908, "learning_rate": 6.440049325931721e-05, "epoch": 0.4169778719134942, "percentage": 41.7, "elapsed_time": "17:42:12", "remaining_time": "1 day, 0:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7482, "total_steps": 17941, "loss": 1.8279, "learning_rate": 6.4391966089976e-05, "epoch": 0.41703361016665735, "percentage": 41.7, "elapsed_time": "17:42:21", "remaining_time": "1 day, 0:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7483, "total_steps": 17941, "loss": 1.4909, "learning_rate": 6.438343846420556e-05, "epoch": 0.41708934841982054, "percentage": 41.71, "elapsed_time": "17:42:30", "remaining_time": "1 day, 0:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7484, "total_steps": 17941, "loss": 1.6886, "learning_rate": 6.437491038227628e-05, "epoch": 0.41714508667298367, "percentage": 41.71, "elapsed_time": "17:42:38", "remaining_time": "1 day, 0:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7485, "total_steps": 17941, "loss": 1.5501, "learning_rate": 6.43663818444587e-05, "epoch": 0.4172008249261468, "percentage": 41.72, "elapsed_time": "17:42:47", "remaining_time": "1 day, 0:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7486, "total_steps": 17941, "loss": 1.5227, "learning_rate": 6.435785285102321e-05, "epoch": 0.41725656317931, "percentage": 41.73, "elapsed_time": "17:42:55", "remaining_time": "1 day, 0:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7487, "total_steps": 17941, "loss": 1.8644, "learning_rate": 6.434932340224036e-05, "epoch": 0.4173123014324731, "percentage": 41.73, "elapsed_time": "17:43:04", "remaining_time": "1 day, 0:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7488, "total_steps": 17941, "loss": 1.823, "learning_rate": 6.434079349838062e-05, "epoch": 0.41736803968563624, "percentage": 41.74, "elapsed_time": "17:43:12", "remaining_time": "1 day, 0:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7489, "total_steps": 17941, "loss": 1.6917, "learning_rate": 6.433226313971455e-05, "epoch": 0.4174237779387994, "percentage": 41.74, "elapsed_time": "17:43:21", "remaining_time": "1 day, 0:44:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7490, "total_steps": 17941, "loss": 1.8103, "learning_rate": 6.432373232651261e-05, "epoch": 0.41747951619196255, "percentage": 41.75, "elapsed_time": "17:43:29", "remaining_time": "1 day, 0:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7491, "total_steps": 17941, "loss": 1.6457, "learning_rate": 6.431520105904543e-05, "epoch": 0.4175352544451257, "percentage": 41.75, "elapsed_time": "17:43:38", "remaining_time": "1 day, 0:43:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7492, "total_steps": 17941, "loss": 1.7308, "learning_rate": 6.430666933758353e-05, "epoch": 0.4175909926982888, "percentage": 41.76, "elapsed_time": "17:43:47", "remaining_time": "1 day, 0:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7493, "total_steps": 17941, "loss": 1.5346, "learning_rate": 6.429813716239747e-05, "epoch": 0.417646730951452, "percentage": 41.76, "elapsed_time": "17:43:55", "remaining_time": "1 day, 0:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7494, "total_steps": 17941, "loss": 1.541, "learning_rate": 6.42896045337579e-05, "epoch": 0.4177024692046151, "percentage": 41.77, "elapsed_time": "17:44:04", "remaining_time": "1 day, 0:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7495, "total_steps": 17941, "loss": 1.6209, "learning_rate": 6.428107145193535e-05, "epoch": 0.41775820745777825, "percentage": 41.78, "elapsed_time": "17:44:13", "remaining_time": "1 day, 0:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7496, "total_steps": 17941, "loss": 1.6333, "learning_rate": 6.427253791720051e-05, "epoch": 0.41781394571094144, "percentage": 41.78, "elapsed_time": "17:44:21", "remaining_time": "1 day, 0:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7497, "total_steps": 17941, "loss": 1.4312, "learning_rate": 6.426400392982396e-05, "epoch": 0.41786968396410457, "percentage": 41.79, "elapsed_time": "17:44:30", "remaining_time": "1 day, 0:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7498, "total_steps": 17941, "loss": 1.4918, "learning_rate": 6.425546949007639e-05, "epoch": 0.4179254222172677, "percentage": 41.79, "elapsed_time": "17:44:38", "remaining_time": "1 day, 0:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7499, "total_steps": 17941, "loss": 1.6224, "learning_rate": 6.424693459822842e-05, "epoch": 0.4179811604704309, "percentage": 41.8, "elapsed_time": "17:44:46", "remaining_time": "1 day, 0:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7500, "total_steps": 17941, "loss": 1.815, "learning_rate": 6.423839925455077e-05, "epoch": 0.418036898723594, "percentage": 41.8, "elapsed_time": "17:44:55", "remaining_time": "1 day, 0:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7501, "total_steps": 17941, "loss": 1.6608, "learning_rate": 6.422986345931411e-05, "epoch": 0.41809263697675714, "percentage": 41.81, "elapsed_time": "17:45:03", "remaining_time": "1 day, 0:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7502, "total_steps": 17941, "loss": 1.5651, "learning_rate": 6.422132721278915e-05, "epoch": 0.4181483752299203, "percentage": 41.81, "elapsed_time": "17:45:12", "remaining_time": "1 day, 0:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7503, "total_steps": 17941, "loss": 1.6941, "learning_rate": 6.421279051524658e-05, "epoch": 0.41820411348308345, "percentage": 41.82, "elapsed_time": "17:45:20", "remaining_time": "1 day, 0:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7504, "total_steps": 17941, "loss": 1.8122, "learning_rate": 6.420425336695719e-05, "epoch": 0.4182598517362466, "percentage": 41.83, "elapsed_time": "17:45:28", "remaining_time": "1 day, 0:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7505, "total_steps": 17941, "loss": 1.59, "learning_rate": 6.419571576819168e-05, "epoch": 0.4183155899894097, "percentage": 41.83, "elapsed_time": "17:45:37", "remaining_time": "1 day, 0:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7506, "total_steps": 17941, "loss": 1.6675, "learning_rate": 6.418717771922084e-05, "epoch": 0.4183713282425729, "percentage": 41.84, "elapsed_time": "17:45:46", "remaining_time": "1 day, 0:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7507, "total_steps": 17941, "loss": 1.9184, "learning_rate": 6.417863922031544e-05, "epoch": 0.418427066495736, "percentage": 41.84, "elapsed_time": "17:45:54", "remaining_time": "1 day, 0:41:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7508, "total_steps": 17941, "loss": 1.7789, "learning_rate": 6.417010027174627e-05, "epoch": 0.41848280474889915, "percentage": 41.85, "elapsed_time": "17:46:02", "remaining_time": "1 day, 0:41:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7509, "total_steps": 17941, "loss": 1.6246, "learning_rate": 6.416156087378415e-05, "epoch": 0.41853854300206234, "percentage": 41.85, "elapsed_time": "17:46:11", "remaining_time": "1 day, 0:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7510, "total_steps": 17941, "loss": 1.5967, "learning_rate": 6.415302102669987e-05, "epoch": 0.41859428125522546, "percentage": 41.86, "elapsed_time": "17:46:19", "remaining_time": "1 day, 0:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7511, "total_steps": 17941, "loss": 1.6613, "learning_rate": 6.414448073076429e-05, "epoch": 0.4186500195083886, "percentage": 41.87, "elapsed_time": "17:46:28", "remaining_time": "1 day, 0:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7512, "total_steps": 17941, "loss": 1.709, "learning_rate": 6.413593998624824e-05, "epoch": 0.4187057577615518, "percentage": 41.87, "elapsed_time": "17:46:36", "remaining_time": "1 day, 0:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7513, "total_steps": 17941, "loss": 1.6281, "learning_rate": 6.41273987934226e-05, "epoch": 0.4187614960147149, "percentage": 41.88, "elapsed_time": "17:46:46", "remaining_time": "1 day, 0:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7514, "total_steps": 17941, "loss": 1.7274, "learning_rate": 6.411885715255823e-05, "epoch": 0.41881723426787804, "percentage": 41.88, "elapsed_time": "17:46:54", "remaining_time": "1 day, 0:40:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7515, "total_steps": 17941, "loss": 1.6704, "learning_rate": 6.411031506392605e-05, "epoch": 0.41887297252104116, "percentage": 41.89, "elapsed_time": "17:47:03", "remaining_time": "1 day, 0:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7516, "total_steps": 17941, "loss": 1.7526, "learning_rate": 6.410177252779692e-05, "epoch": 0.41892871077420435, "percentage": 41.89, "elapsed_time": "17:47:11", "remaining_time": "1 day, 0:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7517, "total_steps": 17941, "loss": 1.5793, "learning_rate": 6.409322954444179e-05, "epoch": 0.4189844490273675, "percentage": 41.9, "elapsed_time": "17:47:19", "remaining_time": "1 day, 0:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7518, "total_steps": 17941, "loss": 1.8319, "learning_rate": 6.408468611413159e-05, "epoch": 0.4190401872805306, "percentage": 41.9, "elapsed_time": "17:47:28", "remaining_time": "1 day, 0:39:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7519, "total_steps": 17941, "loss": 1.6506, "learning_rate": 6.407614223713727e-05, "epoch": 0.4190959255336938, "percentage": 41.91, "elapsed_time": "17:47:37", "remaining_time": "1 day, 0:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7520, "total_steps": 17941, "loss": 1.5807, "learning_rate": 6.40675979137298e-05, "epoch": 0.4191516637868569, "percentage": 41.92, "elapsed_time": "17:47:45", "remaining_time": "1 day, 0:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7521, "total_steps": 17941, "loss": 1.6839, "learning_rate": 6.405905314418013e-05, "epoch": 0.41920740204002005, "percentage": 41.92, "elapsed_time": "17:47:53", "remaining_time": "1 day, 0:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7522, "total_steps": 17941, "loss": 1.5602, "learning_rate": 6.405050792875926e-05, "epoch": 0.41926314029318323, "percentage": 41.93, "elapsed_time": "17:48:02", "remaining_time": "1 day, 0:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7523, "total_steps": 17941, "loss": 1.5204, "learning_rate": 6.40419622677382e-05, "epoch": 0.41931887854634636, "percentage": 41.93, "elapsed_time": "17:48:11", "remaining_time": "1 day, 0:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7524, "total_steps": 17941, "loss": 1.7654, "learning_rate": 6.403341616138797e-05, "epoch": 0.4193746167995095, "percentage": 41.94, "elapsed_time": "17:48:19", "remaining_time": "1 day, 0:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7525, "total_steps": 17941, "loss": 1.7341, "learning_rate": 6.40248696099796e-05, "epoch": 0.4194303550526727, "percentage": 41.94, "elapsed_time": "17:48:28", "remaining_time": "1 day, 0:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7526, "total_steps": 17941, "loss": 1.3932, "learning_rate": 6.401632261378414e-05, "epoch": 0.4194860933058358, "percentage": 41.95, "elapsed_time": "17:48:36", "remaining_time": "1 day, 0:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7527, "total_steps": 17941, "loss": 1.9211, "learning_rate": 6.400777517307265e-05, "epoch": 0.41954183155899893, "percentage": 41.95, "elapsed_time": "17:48:44", "remaining_time": "1 day, 0:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7528, "total_steps": 17941, "loss": 1.848, "learning_rate": 6.39992272881162e-05, "epoch": 0.41959756981216206, "percentage": 41.96, "elapsed_time": "17:48:53", "remaining_time": "1 day, 0:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7529, "total_steps": 17941, "loss": 1.6233, "learning_rate": 6.399067895918587e-05, "epoch": 0.41965330806532525, "percentage": 41.97, "elapsed_time": "17:49:02", "remaining_time": "1 day, 0:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7530, "total_steps": 17941, "loss": 1.578, "learning_rate": 6.39821301865528e-05, "epoch": 0.4197090463184884, "percentage": 41.97, "elapsed_time": "17:49:10", "remaining_time": "1 day, 0:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7531, "total_steps": 17941, "loss": 1.6923, "learning_rate": 6.397358097048806e-05, "epoch": 0.4197647845716515, "percentage": 41.98, "elapsed_time": "17:49:19", "remaining_time": "1 day, 0:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7532, "total_steps": 17941, "loss": 1.7314, "learning_rate": 6.39650313112628e-05, "epoch": 0.4198205228248147, "percentage": 41.98, "elapsed_time": "17:49:27", "remaining_time": "1 day, 0:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7533, "total_steps": 17941, "loss": 1.6396, "learning_rate": 6.39564812091482e-05, "epoch": 0.4198762610779778, "percentage": 41.99, "elapsed_time": "17:49:36", "remaining_time": "1 day, 0:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7534, "total_steps": 17941, "loss": 1.8865, "learning_rate": 6.394793066441534e-05, "epoch": 0.41993199933114095, "percentage": 41.99, "elapsed_time": "17:49:44", "remaining_time": "1 day, 0:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7535, "total_steps": 17941, "loss": 1.8735, "learning_rate": 6.393937967733548e-05, "epoch": 0.41998773758430413, "percentage": 42.0, "elapsed_time": "17:49:52", "remaining_time": "1 day, 0:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7536, "total_steps": 17941, "loss": 1.635, "learning_rate": 6.393082824817974e-05, "epoch": 0.42004347583746726, "percentage": 42.0, "elapsed_time": "17:50:01", "remaining_time": "1 day, 0:37:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7537, "total_steps": 17941, "loss": 1.797, "learning_rate": 6.392227637721937e-05, "epoch": 0.4200992140906304, "percentage": 42.01, "elapsed_time": "17:50:10", "remaining_time": "1 day, 0:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7538, "total_steps": 17941, "loss": 1.6705, "learning_rate": 6.391372406472557e-05, "epoch": 0.4201549523437935, "percentage": 42.02, "elapsed_time": "17:50:18", "remaining_time": "1 day, 0:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7539, "total_steps": 17941, "loss": 1.7877, "learning_rate": 6.390517131096955e-05, "epoch": 0.4202106905969567, "percentage": 42.02, "elapsed_time": "17:50:27", "remaining_time": "1 day, 0:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7540, "total_steps": 17941, "loss": 1.5672, "learning_rate": 6.389661811622258e-05, "epoch": 0.42026642885011983, "percentage": 42.03, "elapsed_time": "17:50:35", "remaining_time": "1 day, 0:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7541, "total_steps": 17941, "loss": 1.8186, "learning_rate": 6.388806448075591e-05, "epoch": 0.42032216710328296, "percentage": 42.03, "elapsed_time": "17:50:44", "remaining_time": "1 day, 0:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7542, "total_steps": 17941, "loss": 1.5539, "learning_rate": 6.38795104048408e-05, "epoch": 0.42037790535644615, "percentage": 42.04, "elapsed_time": "17:50:52", "remaining_time": "1 day, 0:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7543, "total_steps": 17941, "loss": 1.6383, "learning_rate": 6.387095588874854e-05, "epoch": 0.4204336436096093, "percentage": 42.04, "elapsed_time": "17:51:01", "remaining_time": "1 day, 0:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7544, "total_steps": 17941, "loss": 1.9338, "learning_rate": 6.386240093275044e-05, "epoch": 0.4204893818627724, "percentage": 42.05, "elapsed_time": "17:51:09", "remaining_time": "1 day, 0:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7545, "total_steps": 17941, "loss": 1.5479, "learning_rate": 6.385384553711779e-05, "epoch": 0.4205451201159356, "percentage": 42.05, "elapsed_time": "17:51:18", "remaining_time": "1 day, 0:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7546, "total_steps": 17941, "loss": 1.6119, "learning_rate": 6.384528970212196e-05, "epoch": 0.4206008583690987, "percentage": 42.06, "elapsed_time": "17:51:26", "remaining_time": "1 day, 0:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7547, "total_steps": 17941, "loss": 1.7555, "learning_rate": 6.383673342803424e-05, "epoch": 0.42065659662226185, "percentage": 42.07, "elapsed_time": "17:51:35", "remaining_time": "1 day, 0:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7548, "total_steps": 17941, "loss": 1.629, "learning_rate": 6.382817671512603e-05, "epoch": 0.42071233487542503, "percentage": 42.07, "elapsed_time": "17:51:43", "remaining_time": "1 day, 0:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7549, "total_steps": 17941, "loss": 2.0066, "learning_rate": 6.381961956366865e-05, "epoch": 0.42076807312858816, "percentage": 42.08, "elapsed_time": "17:51:52", "remaining_time": "1 day, 0:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7550, "total_steps": 17941, "loss": 1.7497, "learning_rate": 6.381106197393353e-05, "epoch": 0.4208238113817513, "percentage": 42.08, "elapsed_time": "17:52:00", "remaining_time": "1 day, 0:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7551, "total_steps": 17941, "loss": 1.4505, "learning_rate": 6.380250394619205e-05, "epoch": 0.4208795496349144, "percentage": 42.09, "elapsed_time": "17:52:09", "remaining_time": "1 day, 0:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7552, "total_steps": 17941, "loss": 1.7164, "learning_rate": 6.379394548071563e-05, "epoch": 0.4209352878880776, "percentage": 42.09, "elapsed_time": "17:52:17", "remaining_time": "1 day, 0:35:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7553, "total_steps": 17941, "loss": 1.4521, "learning_rate": 6.378538657777565e-05, "epoch": 0.42099102614124073, "percentage": 42.1, "elapsed_time": "17:52:26", "remaining_time": "1 day, 0:34:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7554, "total_steps": 17941, "loss": 1.6832, "learning_rate": 6.37768272376436e-05, "epoch": 0.42104676439440386, "percentage": 42.1, "elapsed_time": "17:52:34", "remaining_time": "1 day, 0:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7555, "total_steps": 17941, "loss": 1.5916, "learning_rate": 6.376826746059092e-05, "epoch": 0.42110250264756705, "percentage": 42.11, "elapsed_time": "17:52:42", "remaining_time": "1 day, 0:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7556, "total_steps": 17941, "loss": 1.5985, "learning_rate": 6.375970724688906e-05, "epoch": 0.4211582409007302, "percentage": 42.12, "elapsed_time": "17:52:51", "remaining_time": "1 day, 0:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7557, "total_steps": 17941, "loss": 1.5822, "learning_rate": 6.375114659680951e-05, "epoch": 0.4212139791538933, "percentage": 42.12, "elapsed_time": "17:53:00", "remaining_time": "1 day, 0:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7558, "total_steps": 17941, "loss": 1.7155, "learning_rate": 6.374258551062378e-05, "epoch": 0.4212697174070565, "percentage": 42.13, "elapsed_time": "17:53:08", "remaining_time": "1 day, 0:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7559, "total_steps": 17941, "loss": 1.7239, "learning_rate": 6.373402398860336e-05, "epoch": 0.4213254556602196, "percentage": 42.13, "elapsed_time": "17:53:17", "remaining_time": "1 day, 0:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7560, "total_steps": 17941, "loss": 1.8782, "learning_rate": 6.372546203101977e-05, "epoch": 0.42138119391338275, "percentage": 42.14, "elapsed_time": "17:53:26", "remaining_time": "1 day, 0:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7561, "total_steps": 17941, "loss": 1.798, "learning_rate": 6.371689963814455e-05, "epoch": 0.4214369321665459, "percentage": 42.14, "elapsed_time": "17:53:34", "remaining_time": "1 day, 0:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7562, "total_steps": 17941, "loss": 1.679, "learning_rate": 6.370833681024924e-05, "epoch": 0.42149267041970906, "percentage": 42.15, "elapsed_time": "17:53:42", "remaining_time": "1 day, 0:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7563, "total_steps": 17941, "loss": 1.6172, "learning_rate": 6.369977354760541e-05, "epoch": 0.4215484086728722, "percentage": 42.15, "elapsed_time": "17:53:51", "remaining_time": "1 day, 0:33:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7564, "total_steps": 17941, "loss": 1.8897, "learning_rate": 6.369120985048464e-05, "epoch": 0.4216041469260353, "percentage": 42.16, "elapsed_time": "17:53:59", "remaining_time": "1 day, 0:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7565, "total_steps": 17941, "loss": 1.9296, "learning_rate": 6.368264571915854e-05, "epoch": 0.4216598851791985, "percentage": 42.17, "elapsed_time": "17:54:08", "remaining_time": "1 day, 0:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7566, "total_steps": 17941, "loss": 1.8127, "learning_rate": 6.367408115389868e-05, "epoch": 0.42171562343236163, "percentage": 42.17, "elapsed_time": "17:54:16", "remaining_time": "1 day, 0:33:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7567, "total_steps": 17941, "loss": 1.4419, "learning_rate": 6.366551615497669e-05, "epoch": 0.42177136168552476, "percentage": 42.18, "elapsed_time": "17:54:25", "remaining_time": "1 day, 0:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7568, "total_steps": 17941, "loss": 1.5106, "learning_rate": 6.36569507226642e-05, "epoch": 0.42182709993868794, "percentage": 42.18, "elapsed_time": "17:54:33", "remaining_time": "1 day, 0:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7569, "total_steps": 17941, "loss": 1.6104, "learning_rate": 6.364838485723286e-05, "epoch": 0.4218828381918511, "percentage": 42.19, "elapsed_time": "17:54:43", "remaining_time": "1 day, 0:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7570, "total_steps": 17941, "loss": 1.8112, "learning_rate": 6.363981855895433e-05, "epoch": 0.4219385764450142, "percentage": 42.19, "elapsed_time": "17:54:52", "remaining_time": "1 day, 0:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7571, "total_steps": 17941, "loss": 1.668, "learning_rate": 6.363125182810028e-05, "epoch": 0.4219943146981774, "percentage": 42.2, "elapsed_time": "17:55:00", "remaining_time": "1 day, 0:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7572, "total_steps": 17941, "loss": 1.477, "learning_rate": 6.36226846649424e-05, "epoch": 0.4220500529513405, "percentage": 42.21, "elapsed_time": "17:55:09", "remaining_time": "1 day, 0:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7573, "total_steps": 17941, "loss": 1.6127, "learning_rate": 6.361411706975237e-05, "epoch": 0.42210579120450364, "percentage": 42.21, "elapsed_time": "17:55:17", "remaining_time": "1 day, 0:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7574, "total_steps": 17941, "loss": 1.7687, "learning_rate": 6.360554904280196e-05, "epoch": 0.4221615294576668, "percentage": 42.22, "elapsed_time": "17:55:26", "remaining_time": "1 day, 0:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7575, "total_steps": 17941, "loss": 1.7282, "learning_rate": 6.359698058436282e-05, "epoch": 0.42221726771082996, "percentage": 42.22, "elapsed_time": "17:55:34", "remaining_time": "1 day, 0:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7576, "total_steps": 17941, "loss": 1.6214, "learning_rate": 6.358841169470676e-05, "epoch": 0.4222730059639931, "percentage": 42.23, "elapsed_time": "17:55:42", "remaining_time": "1 day, 0:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7577, "total_steps": 17941, "loss": 1.6966, "learning_rate": 6.35798423741055e-05, "epoch": 0.4223287442171562, "percentage": 42.23, "elapsed_time": "17:55:51", "remaining_time": "1 day, 0:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7578, "total_steps": 17941, "loss": 1.6683, "learning_rate": 6.357127262283081e-05, "epoch": 0.4223844824703194, "percentage": 42.24, "elapsed_time": "17:56:00", "remaining_time": "1 day, 0:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7579, "total_steps": 17941, "loss": 1.3579, "learning_rate": 6.356270244115448e-05, "epoch": 0.42244022072348253, "percentage": 42.24, "elapsed_time": "17:56:09", "remaining_time": "1 day, 0:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7580, "total_steps": 17941, "loss": 1.7506, "learning_rate": 6.355413182934831e-05, "epoch": 0.42249595897664566, "percentage": 42.25, "elapsed_time": "17:56:17", "remaining_time": "1 day, 0:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7581, "total_steps": 17941, "loss": 1.5443, "learning_rate": 6.35455607876841e-05, "epoch": 0.42255169722980884, "percentage": 42.26, "elapsed_time": "17:56:26", "remaining_time": "1 day, 0:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7582, "total_steps": 17941, "loss": 1.7318, "learning_rate": 6.353698931643368e-05, "epoch": 0.42260743548297197, "percentage": 42.26, "elapsed_time": "17:56:35", "remaining_time": "1 day, 0:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7583, "total_steps": 17941, "loss": 1.9499, "learning_rate": 6.352841741586888e-05, "epoch": 0.4226631737361351, "percentage": 42.27, "elapsed_time": "17:56:43", "remaining_time": "1 day, 0:30:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7584, "total_steps": 17941, "loss": 1.6598, "learning_rate": 6.351984508626155e-05, "epoch": 0.42271891198929823, "percentage": 42.27, "elapsed_time": "17:56:52", "remaining_time": "1 day, 0:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7585, "total_steps": 17941, "loss": 1.9022, "learning_rate": 6.351127232788357e-05, "epoch": 0.4227746502424614, "percentage": 42.28, "elapsed_time": "17:57:00", "remaining_time": "1 day, 0:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7586, "total_steps": 17941, "loss": 1.8523, "learning_rate": 6.350269914100681e-05, "epoch": 0.42283038849562454, "percentage": 42.28, "elapsed_time": "17:57:09", "remaining_time": "1 day, 0:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7587, "total_steps": 17941, "loss": 1.7423, "learning_rate": 6.349412552590317e-05, "epoch": 0.42288612674878767, "percentage": 42.29, "elapsed_time": "17:57:17", "remaining_time": "1 day, 0:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7588, "total_steps": 17941, "loss": 1.6669, "learning_rate": 6.348555148284452e-05, "epoch": 0.42294186500195086, "percentage": 42.29, "elapsed_time": "17:57:26", "remaining_time": "1 day, 0:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7589, "total_steps": 17941, "loss": 1.8138, "learning_rate": 6.347697701210281e-05, "epoch": 0.422997603255114, "percentage": 42.3, "elapsed_time": "17:57:34", "remaining_time": "1 day, 0:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7590, "total_steps": 17941, "loss": 1.5228, "learning_rate": 6.346840211394998e-05, "epoch": 0.4230533415082771, "percentage": 42.31, "elapsed_time": "17:57:42", "remaining_time": "1 day, 0:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7591, "total_steps": 17941, "loss": 1.8378, "learning_rate": 6.345982678865795e-05, "epoch": 0.4231090797614403, "percentage": 42.31, "elapsed_time": "17:57:51", "remaining_time": "1 day, 0:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7592, "total_steps": 17941, "loss": 1.9561, "learning_rate": 6.345125103649869e-05, "epoch": 0.4231648180146034, "percentage": 42.32, "elapsed_time": "17:58:00", "remaining_time": "1 day, 0:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7593, "total_steps": 17941, "loss": 1.6172, "learning_rate": 6.344267485774417e-05, "epoch": 0.42322055626776656, "percentage": 42.32, "elapsed_time": "17:58:08", "remaining_time": "1 day, 0:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7594, "total_steps": 17941, "loss": 1.7064, "learning_rate": 6.34340982526664e-05, "epoch": 0.42327629452092974, "percentage": 42.33, "elapsed_time": "17:58:17", "remaining_time": "1 day, 0:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7595, "total_steps": 17941, "loss": 1.5869, "learning_rate": 6.342552122153734e-05, "epoch": 0.42333203277409287, "percentage": 42.33, "elapsed_time": "17:58:26", "remaining_time": "1 day, 0:29:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7596, "total_steps": 17941, "loss": 1.4539, "learning_rate": 6.3416943764629e-05, "epoch": 0.423387771027256, "percentage": 42.34, "elapsed_time": "17:58:34", "remaining_time": "1 day, 0:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7597, "total_steps": 17941, "loss": 1.2324, "learning_rate": 6.340836588221347e-05, "epoch": 0.42344350928041913, "percentage": 42.34, "elapsed_time": "17:58:43", "remaining_time": "1 day, 0:28:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7598, "total_steps": 17941, "loss": 1.7336, "learning_rate": 6.339978757456274e-05, "epoch": 0.4234992475335823, "percentage": 42.35, "elapsed_time": "17:58:51", "remaining_time": "1 day, 0:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7599, "total_steps": 17941, "loss": 1.8399, "learning_rate": 6.339120884194886e-05, "epoch": 0.42355498578674544, "percentage": 42.36, "elapsed_time": "17:59:00", "remaining_time": "1 day, 0:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7600, "total_steps": 17941, "loss": 1.7355, "learning_rate": 6.338262968464394e-05, "epoch": 0.42361072403990857, "percentage": 42.36, "elapsed_time": "17:59:08", "remaining_time": "1 day, 0:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7601, "total_steps": 17941, "loss": 1.5466, "learning_rate": 6.337405010292e-05, "epoch": 0.42366646229307175, "percentage": 42.37, "elapsed_time": "17:59:17", "remaining_time": "1 day, 0:28:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7602, "total_steps": 17941, "loss": 1.894, "learning_rate": 6.336547009704919e-05, "epoch": 0.4237222005462349, "percentage": 42.37, "elapsed_time": "17:59:25", "remaining_time": "1 day, 0:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7603, "total_steps": 17941, "loss": 1.7874, "learning_rate": 6.335688966730358e-05, "epoch": 0.423777938799398, "percentage": 42.38, "elapsed_time": "17:59:34", "remaining_time": "1 day, 0:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7604, "total_steps": 17941, "loss": 1.4537, "learning_rate": 6.334830881395533e-05, "epoch": 0.4238336770525612, "percentage": 42.38, "elapsed_time": "17:59:42", "remaining_time": "1 day, 0:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7605, "total_steps": 17941, "loss": 1.6731, "learning_rate": 6.333972753727653e-05, "epoch": 0.4238894153057243, "percentage": 42.39, "elapsed_time": "17:59:51", "remaining_time": "1 day, 0:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7606, "total_steps": 17941, "loss": 2.0005, "learning_rate": 6.333114583753936e-05, "epoch": 0.42394515355888746, "percentage": 42.39, "elapsed_time": "17:59:59", "remaining_time": "1 day, 0:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7607, "total_steps": 17941, "loss": 1.7024, "learning_rate": 6.332256371501597e-05, "epoch": 0.4240008918120506, "percentage": 42.4, "elapsed_time": "18:00:08", "remaining_time": "1 day, 0:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7608, "total_steps": 17941, "loss": 1.4046, "learning_rate": 6.331398116997851e-05, "epoch": 0.42405663006521377, "percentage": 42.41, "elapsed_time": "18:00:16", "remaining_time": "1 day, 0:27:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7609, "total_steps": 17941, "loss": 1.7066, "learning_rate": 6.330539820269921e-05, "epoch": 0.4241123683183769, "percentage": 42.41, "elapsed_time": "18:00:25", "remaining_time": "1 day, 0:27:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7610, "total_steps": 17941, "loss": 1.7871, "learning_rate": 6.329681481345026e-05, "epoch": 0.42416810657154, "percentage": 42.42, "elapsed_time": "18:00:33", "remaining_time": "1 day, 0:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7611, "total_steps": 17941, "loss": 1.6782, "learning_rate": 6.328823100250386e-05, "epoch": 0.4242238448247032, "percentage": 42.42, "elapsed_time": "18:00:43", "remaining_time": "1 day, 0:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7612, "total_steps": 17941, "loss": 1.6405, "learning_rate": 6.327964677013224e-05, "epoch": 0.42427958307786634, "percentage": 42.43, "elapsed_time": "18:00:51", "remaining_time": "1 day, 0:26:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7613, "total_steps": 17941, "loss": 1.798, "learning_rate": 6.327106211660769e-05, "epoch": 0.42433532133102947, "percentage": 42.43, "elapsed_time": "18:01:00", "remaining_time": "1 day, 0:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7614, "total_steps": 17941, "loss": 1.6055, "learning_rate": 6.326247704220239e-05, "epoch": 0.42439105958419265, "percentage": 42.44, "elapsed_time": "18:01:09", "remaining_time": "1 day, 0:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7615, "total_steps": 17941, "loss": 1.7596, "learning_rate": 6.325389154718865e-05, "epoch": 0.4244467978373558, "percentage": 42.44, "elapsed_time": "18:01:17", "remaining_time": "1 day, 0:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7616, "total_steps": 17941, "loss": 1.6401, "learning_rate": 6.324530563183875e-05, "epoch": 0.4245025360905189, "percentage": 42.45, "elapsed_time": "18:01:26", "remaining_time": "1 day, 0:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7617, "total_steps": 17941, "loss": 1.868, "learning_rate": 6.323671929642498e-05, "epoch": 0.4245582743436821, "percentage": 42.46, "elapsed_time": "18:01:34", "remaining_time": "1 day, 0:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7618, "total_steps": 17941, "loss": 1.715, "learning_rate": 6.322813254121964e-05, "epoch": 0.4246140125968452, "percentage": 42.46, "elapsed_time": "18:01:43", "remaining_time": "1 day, 0:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7619, "total_steps": 17941, "loss": 1.5837, "learning_rate": 6.321954536649508e-05, "epoch": 0.42466975085000835, "percentage": 42.47, "elapsed_time": "18:01:51", "remaining_time": "1 day, 0:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7620, "total_steps": 17941, "loss": 1.7406, "learning_rate": 6.32109577725236e-05, "epoch": 0.4247254891031715, "percentage": 42.47, "elapsed_time": "18:02:00", "remaining_time": "1 day, 0:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7621, "total_steps": 17941, "loss": 1.6099, "learning_rate": 6.320236975957757e-05, "epoch": 0.42478122735633467, "percentage": 42.48, "elapsed_time": "18:02:08", "remaining_time": "1 day, 0:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7622, "total_steps": 17941, "loss": 1.5277, "learning_rate": 6.319378132792935e-05, "epoch": 0.4248369656094978, "percentage": 42.48, "elapsed_time": "18:02:17", "remaining_time": "1 day, 0:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7623, "total_steps": 17941, "loss": 1.7702, "learning_rate": 6.318519247785131e-05, "epoch": 0.4248927038626609, "percentage": 42.49, "elapsed_time": "18:02:25", "remaining_time": "1 day, 0:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7624, "total_steps": 17941, "loss": 1.6098, "learning_rate": 6.317660320961585e-05, "epoch": 0.4249484421158241, "percentage": 42.49, "elapsed_time": "18:02:34", "remaining_time": "1 day, 0:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7625, "total_steps": 17941, "loss": 1.6451, "learning_rate": 6.316801352349534e-05, "epoch": 0.42500418036898724, "percentage": 42.5, "elapsed_time": "18:02:42", "remaining_time": "1 day, 0:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7626, "total_steps": 17941, "loss": 1.9987, "learning_rate": 6.315942341976223e-05, "epoch": 0.42505991862215037, "percentage": 42.51, "elapsed_time": "18:02:51", "remaining_time": "1 day, 0:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7627, "total_steps": 17941, "loss": 1.6352, "learning_rate": 6.315083289868892e-05, "epoch": 0.42511565687531355, "percentage": 42.51, "elapsed_time": "18:02:59", "remaining_time": "1 day, 0:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7628, "total_steps": 17941, "loss": 1.8757, "learning_rate": 6.314224196054787e-05, "epoch": 0.4251713951284767, "percentage": 42.52, "elapsed_time": "18:03:07", "remaining_time": "1 day, 0:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7629, "total_steps": 17941, "loss": 2.0665, "learning_rate": 6.313365060561153e-05, "epoch": 0.4252271333816398, "percentage": 42.52, "elapsed_time": "18:03:16", "remaining_time": "1 day, 0:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7630, "total_steps": 17941, "loss": 1.6602, "learning_rate": 6.312505883415238e-05, "epoch": 0.42528287163480294, "percentage": 42.53, "elapsed_time": "18:03:25", "remaining_time": "1 day, 0:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7631, "total_steps": 17941, "loss": 1.7241, "learning_rate": 6.311646664644288e-05, "epoch": 0.4253386098879661, "percentage": 42.53, "elapsed_time": "18:03:33", "remaining_time": "1 day, 0:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7632, "total_steps": 17941, "loss": 1.7581, "learning_rate": 6.310787404275553e-05, "epoch": 0.42539434814112925, "percentage": 42.54, "elapsed_time": "18:03:42", "remaining_time": "1 day, 0:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7633, "total_steps": 17941, "loss": 1.7147, "learning_rate": 6.309928102336284e-05, "epoch": 0.4254500863942924, "percentage": 42.55, "elapsed_time": "18:03:50", "remaining_time": "1 day, 0:23:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7634, "total_steps": 17941, "loss": 1.6103, "learning_rate": 6.309068758853732e-05, "epoch": 0.42550582464745557, "percentage": 42.55, "elapsed_time": "18:03:58", "remaining_time": "1 day, 0:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7635, "total_steps": 17941, "loss": 1.6947, "learning_rate": 6.308209373855154e-05, "epoch": 0.4255615629006187, "percentage": 42.56, "elapsed_time": "18:04:07", "remaining_time": "1 day, 0:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7636, "total_steps": 17941, "loss": 1.6384, "learning_rate": 6.3073499473678e-05, "epoch": 0.4256173011537818, "percentage": 42.56, "elapsed_time": "18:04:16", "remaining_time": "1 day, 0:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7637, "total_steps": 17941, "loss": 1.5643, "learning_rate": 6.30649047941893e-05, "epoch": 0.425673039406945, "percentage": 42.57, "elapsed_time": "18:04:24", "remaining_time": "1 day, 0:23:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7638, "total_steps": 17941, "loss": 1.5257, "learning_rate": 6.305630970035796e-05, "epoch": 0.42572877766010814, "percentage": 42.57, "elapsed_time": "18:04:33", "remaining_time": "1 day, 0:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7639, "total_steps": 17941, "loss": 1.8738, "learning_rate": 6.304771419245663e-05, "epoch": 0.42578451591327127, "percentage": 42.58, "elapsed_time": "18:04:41", "remaining_time": "1 day, 0:22:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7640, "total_steps": 17941, "loss": 1.8562, "learning_rate": 6.303911827075786e-05, "epoch": 0.42584025416643445, "percentage": 42.58, "elapsed_time": "18:04:50", "remaining_time": "1 day, 0:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7641, "total_steps": 17941, "loss": 1.7146, "learning_rate": 6.303052193553429e-05, "epoch": 0.4258959924195976, "percentage": 42.59, "elapsed_time": "18:04:58", "remaining_time": "1 day, 0:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7642, "total_steps": 17941, "loss": 1.7639, "learning_rate": 6.302192518705853e-05, "epoch": 0.4259517306727607, "percentage": 42.6, "elapsed_time": "18:05:07", "remaining_time": "1 day, 0:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7643, "total_steps": 17941, "loss": 1.5804, "learning_rate": 6.301332802560325e-05, "epoch": 0.42600746892592384, "percentage": 42.6, "elapsed_time": "18:05:16", "remaining_time": "1 day, 0:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7644, "total_steps": 17941, "loss": 1.4344, "learning_rate": 6.300473045144107e-05, "epoch": 0.426063207179087, "percentage": 42.61, "elapsed_time": "18:05:25", "remaining_time": "1 day, 0:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7645, "total_steps": 17941, "loss": 1.6573, "learning_rate": 6.299613246484464e-05, "epoch": 0.42611894543225015, "percentage": 42.61, "elapsed_time": "18:05:33", "remaining_time": "1 day, 0:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7646, "total_steps": 17941, "loss": 1.5995, "learning_rate": 6.298753406608668e-05, "epoch": 0.4261746836854133, "percentage": 42.62, "elapsed_time": "18:05:42", "remaining_time": "1 day, 0:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7647, "total_steps": 17941, "loss": 1.7107, "learning_rate": 6.297893525543986e-05, "epoch": 0.42623042193857646, "percentage": 42.62, "elapsed_time": "18:05:50", "remaining_time": "1 day, 0:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7648, "total_steps": 17941, "loss": 1.6734, "learning_rate": 6.297033603317689e-05, "epoch": 0.4262861601917396, "percentage": 42.63, "elapsed_time": "18:06:00", "remaining_time": "1 day, 0:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7649, "total_steps": 17941, "loss": 1.64, "learning_rate": 6.296173639957045e-05, "epoch": 0.4263418984449027, "percentage": 42.63, "elapsed_time": "18:06:08", "remaining_time": "1 day, 0:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7650, "total_steps": 17941, "loss": 1.3837, "learning_rate": 6.295313635489335e-05, "epoch": 0.4263976366980659, "percentage": 42.64, "elapsed_time": "18:06:16", "remaining_time": "1 day, 0:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7651, "total_steps": 17941, "loss": 1.6142, "learning_rate": 6.294453589941826e-05, "epoch": 0.42645337495122904, "percentage": 42.65, "elapsed_time": "18:06:25", "remaining_time": "1 day, 0:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7652, "total_steps": 17941, "loss": 1.7297, "learning_rate": 6.2935935033418e-05, "epoch": 0.42650911320439217, "percentage": 42.65, "elapsed_time": "18:06:33", "remaining_time": "1 day, 0:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7653, "total_steps": 17941, "loss": 1.7119, "learning_rate": 6.292733375716526e-05, "epoch": 0.4265648514575553, "percentage": 42.66, "elapsed_time": "18:06:42", "remaining_time": "1 day, 0:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7654, "total_steps": 17941, "loss": 1.6478, "learning_rate": 6.291873207093287e-05, "epoch": 0.4266205897107185, "percentage": 42.66, "elapsed_time": "18:06:50", "remaining_time": "1 day, 0:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7655, "total_steps": 17941, "loss": 1.8439, "learning_rate": 6.291012997499362e-05, "epoch": 0.4266763279638816, "percentage": 42.67, "elapsed_time": "18:06:59", "remaining_time": "1 day, 0:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7656, "total_steps": 17941, "loss": 1.6251, "learning_rate": 6.290152746962034e-05, "epoch": 0.42673206621704474, "percentage": 42.67, "elapsed_time": "18:07:07", "remaining_time": "1 day, 0:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7657, "total_steps": 17941, "loss": 1.6364, "learning_rate": 6.289292455508582e-05, "epoch": 0.4267878044702079, "percentage": 42.68, "elapsed_time": "18:07:16", "remaining_time": "1 day, 0:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7658, "total_steps": 17941, "loss": 1.4855, "learning_rate": 6.28843212316629e-05, "epoch": 0.42684354272337105, "percentage": 42.68, "elapsed_time": "18:07:24", "remaining_time": "1 day, 0:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7659, "total_steps": 17941, "loss": 1.6034, "learning_rate": 6.287571749962444e-05, "epoch": 0.4268992809765342, "percentage": 42.69, "elapsed_time": "18:07:33", "remaining_time": "1 day, 0:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7660, "total_steps": 17941, "loss": 2.0333, "learning_rate": 6.286711335924326e-05, "epoch": 0.42695501922969736, "percentage": 42.7, "elapsed_time": "18:07:41", "remaining_time": "1 day, 0:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7661, "total_steps": 17941, "loss": 1.7037, "learning_rate": 6.28585088107923e-05, "epoch": 0.4270107574828605, "percentage": 42.7, "elapsed_time": "18:07:50", "remaining_time": "1 day, 0:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7662, "total_steps": 17941, "loss": 1.5226, "learning_rate": 6.284990385454439e-05, "epoch": 0.4270664957360236, "percentage": 42.71, "elapsed_time": "18:07:58", "remaining_time": "1 day, 0:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7663, "total_steps": 17941, "loss": 1.6186, "learning_rate": 6.284129849077247e-05, "epoch": 0.4271222339891868, "percentage": 42.71, "elapsed_time": "18:08:07", "remaining_time": "1 day, 0:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7664, "total_steps": 17941, "loss": 1.7211, "learning_rate": 6.283269271974941e-05, "epoch": 0.42717797224234993, "percentage": 42.72, "elapsed_time": "18:08:15", "remaining_time": "1 day, 0:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7665, "total_steps": 17941, "loss": 1.6978, "learning_rate": 6.282408654174818e-05, "epoch": 0.42723371049551306, "percentage": 42.72, "elapsed_time": "18:08:24", "remaining_time": "1 day, 0:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7666, "total_steps": 17941, "loss": 1.5544, "learning_rate": 6.281547995704168e-05, "epoch": 0.4272894487486762, "percentage": 42.73, "elapsed_time": "18:08:32", "remaining_time": "1 day, 0:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7667, "total_steps": 17941, "loss": 1.697, "learning_rate": 6.280687296590287e-05, "epoch": 0.4273451870018394, "percentage": 42.73, "elapsed_time": "18:08:41", "remaining_time": "1 day, 0:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7668, "total_steps": 17941, "loss": 1.6596, "learning_rate": 6.279826556860472e-05, "epoch": 0.4274009252550025, "percentage": 42.74, "elapsed_time": "18:08:49", "remaining_time": "1 day, 0:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7669, "total_steps": 17941, "loss": 1.7029, "learning_rate": 6.278965776542021e-05, "epoch": 0.42745666350816564, "percentage": 42.75, "elapsed_time": "18:08:57", "remaining_time": "1 day, 0:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7670, "total_steps": 17941, "loss": 1.7344, "learning_rate": 6.278104955662234e-05, "epoch": 0.4275124017613288, "percentage": 42.75, "elapsed_time": "18:09:06", "remaining_time": "1 day, 0:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7671, "total_steps": 17941, "loss": 1.7182, "learning_rate": 6.277244094248407e-05, "epoch": 0.42756814001449195, "percentage": 42.76, "elapsed_time": "18:09:14", "remaining_time": "1 day, 0:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7672, "total_steps": 17941, "loss": 1.7045, "learning_rate": 6.276383192327846e-05, "epoch": 0.4276238782676551, "percentage": 42.76, "elapsed_time": "18:09:23", "remaining_time": "1 day, 0:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7673, "total_steps": 17941, "loss": 1.5657, "learning_rate": 6.27552224992785e-05, "epoch": 0.42767961652081826, "percentage": 42.77, "elapsed_time": "18:09:31", "remaining_time": "1 day, 0:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7674, "total_steps": 17941, "loss": 1.701, "learning_rate": 6.274661267075728e-05, "epoch": 0.4277353547739814, "percentage": 42.77, "elapsed_time": "18:09:40", "remaining_time": "1 day, 0:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7675, "total_steps": 17941, "loss": 1.804, "learning_rate": 6.27380024379878e-05, "epoch": 0.4277910930271445, "percentage": 42.78, "elapsed_time": "18:09:48", "remaining_time": "1 day, 0:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7676, "total_steps": 17941, "loss": 1.7744, "learning_rate": 6.272939180124317e-05, "epoch": 0.42784683128030765, "percentage": 42.78, "elapsed_time": "18:09:57", "remaining_time": "1 day, 0:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7677, "total_steps": 17941, "loss": 1.9837, "learning_rate": 6.272078076079644e-05, "epoch": 0.42790256953347083, "percentage": 42.79, "elapsed_time": "18:10:05", "remaining_time": "1 day, 0:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7678, "total_steps": 17941, "loss": 1.8042, "learning_rate": 6.27121693169207e-05, "epoch": 0.42795830778663396, "percentage": 42.8, "elapsed_time": "18:10:14", "remaining_time": "1 day, 0:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7679, "total_steps": 17941, "loss": 1.6222, "learning_rate": 6.270355746988908e-05, "epoch": 0.4280140460397971, "percentage": 42.8, "elapsed_time": "18:10:22", "remaining_time": "1 day, 0:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7680, "total_steps": 17941, "loss": 1.6313, "learning_rate": 6.269494521997467e-05, "epoch": 0.4280697842929603, "percentage": 42.81, "elapsed_time": "18:10:31", "remaining_time": "1 day, 0:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7681, "total_steps": 17941, "loss": 1.7364, "learning_rate": 6.268633256745063e-05, "epoch": 0.4281255225461234, "percentage": 42.81, "elapsed_time": "18:10:39", "remaining_time": "1 day, 0:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7682, "total_steps": 17941, "loss": 1.8938, "learning_rate": 6.267771951259009e-05, "epoch": 0.42818126079928653, "percentage": 42.82, "elapsed_time": "18:10:48", "remaining_time": "1 day, 0:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7683, "total_steps": 17941, "loss": 1.706, "learning_rate": 6.26691060556662e-05, "epoch": 0.4282369990524497, "percentage": 42.82, "elapsed_time": "18:10:56", "remaining_time": "1 day, 0:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7684, "total_steps": 17941, "loss": 1.6015, "learning_rate": 6.266049219695211e-05, "epoch": 0.42829273730561285, "percentage": 42.83, "elapsed_time": "18:11:05", "remaining_time": "1 day, 0:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7685, "total_steps": 17941, "loss": 1.9252, "learning_rate": 6.265187793672105e-05, "epoch": 0.428348475558776, "percentage": 42.83, "elapsed_time": "18:11:13", "remaining_time": "1 day, 0:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7686, "total_steps": 17941, "loss": 1.7076, "learning_rate": 6.264326327524617e-05, "epoch": 0.42840421381193916, "percentage": 42.84, "elapsed_time": "18:11:23", "remaining_time": "1 day, 0:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7687, "total_steps": 17941, "loss": 1.8343, "learning_rate": 6.263464821280071e-05, "epoch": 0.4284599520651023, "percentage": 42.85, "elapsed_time": "18:11:31", "remaining_time": "1 day, 0:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7688, "total_steps": 17941, "loss": 1.5771, "learning_rate": 6.262603274965786e-05, "epoch": 0.4285156903182654, "percentage": 42.85, "elapsed_time": "18:11:39", "remaining_time": "1 day, 0:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7689, "total_steps": 17941, "loss": 1.6646, "learning_rate": 6.261741688609087e-05, "epoch": 0.42857142857142855, "percentage": 42.86, "elapsed_time": "18:11:48", "remaining_time": "1 day, 0:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7690, "total_steps": 17941, "loss": 1.8235, "learning_rate": 6.260880062237299e-05, "epoch": 0.42862716682459173, "percentage": 42.86, "elapsed_time": "18:11:57", "remaining_time": "1 day, 0:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7691, "total_steps": 17941, "loss": 1.7776, "learning_rate": 6.260018395877747e-05, "epoch": 0.42868290507775486, "percentage": 42.87, "elapsed_time": "18:12:06", "remaining_time": "1 day, 0:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7692, "total_steps": 17941, "loss": 1.5817, "learning_rate": 6.259156689557757e-05, "epoch": 0.428738643330918, "percentage": 42.87, "elapsed_time": "18:12:14", "remaining_time": "1 day, 0:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7693, "total_steps": 17941, "loss": 1.6236, "learning_rate": 6.258294943304656e-05, "epoch": 0.4287943815840812, "percentage": 42.88, "elapsed_time": "18:12:23", "remaining_time": "1 day, 0:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7694, "total_steps": 17941, "loss": 1.8114, "learning_rate": 6.257433157145779e-05, "epoch": 0.4288501198372443, "percentage": 42.89, "elapsed_time": "18:12:31", "remaining_time": "1 day, 0:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7695, "total_steps": 17941, "loss": 1.7796, "learning_rate": 6.256571331108454e-05, "epoch": 0.42890585809040743, "percentage": 42.89, "elapsed_time": "18:12:40", "remaining_time": "1 day, 0:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7696, "total_steps": 17941, "loss": 1.4089, "learning_rate": 6.25570946522001e-05, "epoch": 0.4289615963435706, "percentage": 42.9, "elapsed_time": "18:12:48", "remaining_time": "1 day, 0:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7697, "total_steps": 17941, "loss": 1.8332, "learning_rate": 6.254847559507783e-05, "epoch": 0.42901733459673375, "percentage": 42.9, "elapsed_time": "18:12:57", "remaining_time": "1 day, 0:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7698, "total_steps": 17941, "loss": 1.7905, "learning_rate": 6.253985613999111e-05, "epoch": 0.4290730728498969, "percentage": 42.91, "elapsed_time": "18:13:05", "remaining_time": "1 day, 0:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7699, "total_steps": 17941, "loss": 1.7185, "learning_rate": 6.253123628721324e-05, "epoch": 0.42912881110306, "percentage": 42.91, "elapsed_time": "18:13:14", "remaining_time": "1 day, 0:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7700, "total_steps": 17941, "loss": 1.6092, "learning_rate": 6.252261603701762e-05, "epoch": 0.4291845493562232, "percentage": 42.92, "elapsed_time": "18:13:23", "remaining_time": "1 day, 0:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7701, "total_steps": 17941, "loss": 1.6353, "learning_rate": 6.251399538967764e-05, "epoch": 0.4292402876093863, "percentage": 42.92, "elapsed_time": "18:13:31", "remaining_time": "1 day, 0:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7702, "total_steps": 17941, "loss": 1.5933, "learning_rate": 6.250537434546668e-05, "epoch": 0.42929602586254945, "percentage": 42.93, "elapsed_time": "18:13:40", "remaining_time": "1 day, 0:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7703, "total_steps": 17941, "loss": 1.5875, "learning_rate": 6.249675290465817e-05, "epoch": 0.42935176411571263, "percentage": 42.94, "elapsed_time": "18:13:48", "remaining_time": "1 day, 0:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7704, "total_steps": 17941, "loss": 1.4277, "learning_rate": 6.248813106752551e-05, "epoch": 0.42940750236887576, "percentage": 42.94, "elapsed_time": "18:13:57", "remaining_time": "1 day, 0:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7705, "total_steps": 17941, "loss": 1.667, "learning_rate": 6.247950883434214e-05, "epoch": 0.4294632406220389, "percentage": 42.95, "elapsed_time": "18:14:05", "remaining_time": "1 day, 0:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7706, "total_steps": 17941, "loss": 1.6387, "learning_rate": 6.24708862053815e-05, "epoch": 0.4295189788752021, "percentage": 42.95, "elapsed_time": "18:14:14", "remaining_time": "1 day, 0:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7707, "total_steps": 17941, "loss": 1.5703, "learning_rate": 6.246226318091708e-05, "epoch": 0.4295747171283652, "percentage": 42.96, "elapsed_time": "18:14:22", "remaining_time": "1 day, 0:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7708, "total_steps": 17941, "loss": 1.4084, "learning_rate": 6.245363976122232e-05, "epoch": 0.42963045538152833, "percentage": 42.96, "elapsed_time": "18:14:31", "remaining_time": "1 day, 0:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7709, "total_steps": 17941, "loss": 1.6056, "learning_rate": 6.244501594657073e-05, "epoch": 0.4296861936346915, "percentage": 42.97, "elapsed_time": "18:14:39", "remaining_time": "1 day, 0:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7710, "total_steps": 17941, "loss": 1.3122, "learning_rate": 6.243639173723577e-05, "epoch": 0.42974193188785464, "percentage": 42.97, "elapsed_time": "18:14:48", "remaining_time": "1 day, 0:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7711, "total_steps": 17941, "loss": 1.5922, "learning_rate": 6.2427767133491e-05, "epoch": 0.4297976701410178, "percentage": 42.98, "elapsed_time": "18:14:56", "remaining_time": "1 day, 0:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7712, "total_steps": 17941, "loss": 1.7423, "learning_rate": 6.241914213560988e-05, "epoch": 0.4298534083941809, "percentage": 42.99, "elapsed_time": "18:15:05", "remaining_time": "1 day, 0:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7713, "total_steps": 17941, "loss": 1.4298, "learning_rate": 6.241051674386602e-05, "epoch": 0.4299091466473441, "percentage": 42.99, "elapsed_time": "18:15:14", "remaining_time": "1 day, 0:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7714, "total_steps": 17941, "loss": 1.6772, "learning_rate": 6.24018909585329e-05, "epoch": 0.4299648849005072, "percentage": 43.0, "elapsed_time": "18:15:23", "remaining_time": "1 day, 0:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7715, "total_steps": 17941, "loss": 1.7007, "learning_rate": 6.239326477988413e-05, "epoch": 0.43002062315367034, "percentage": 43.0, "elapsed_time": "18:15:31", "remaining_time": "1 day, 0:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7716, "total_steps": 17941, "loss": 1.5829, "learning_rate": 6.238463820819325e-05, "epoch": 0.43007636140683353, "percentage": 43.01, "elapsed_time": "18:15:40", "remaining_time": "1 day, 0:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7717, "total_steps": 17941, "loss": 1.7885, "learning_rate": 6.237601124373385e-05, "epoch": 0.43013209965999666, "percentage": 43.01, "elapsed_time": "18:15:48", "remaining_time": "1 day, 0:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7718, "total_steps": 17941, "loss": 1.7993, "learning_rate": 6.236738388677952e-05, "epoch": 0.4301878379131598, "percentage": 43.02, "elapsed_time": "18:15:57", "remaining_time": "1 day, 0:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7719, "total_steps": 17941, "loss": 1.8437, "learning_rate": 6.23587561376039e-05, "epoch": 0.43024357616632297, "percentage": 43.02, "elapsed_time": "18:16:05", "remaining_time": "1 day, 0:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7720, "total_steps": 17941, "loss": 1.7246, "learning_rate": 6.235012799648057e-05, "epoch": 0.4302993144194861, "percentage": 43.03, "elapsed_time": "18:16:13", "remaining_time": "1 day, 0:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7721, "total_steps": 17941, "loss": 1.7322, "learning_rate": 6.23414994636832e-05, "epoch": 0.43035505267264923, "percentage": 43.04, "elapsed_time": "18:16:22", "remaining_time": "1 day, 0:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7722, "total_steps": 17941, "loss": 1.6743, "learning_rate": 6.233287053948543e-05, "epoch": 0.43041079092581236, "percentage": 43.04, "elapsed_time": "18:16:30", "remaining_time": "1 day, 0:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7723, "total_steps": 17941, "loss": 1.5439, "learning_rate": 6.23242412241609e-05, "epoch": 0.43046652917897554, "percentage": 43.05, "elapsed_time": "18:16:39", "remaining_time": "1 day, 0:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7724, "total_steps": 17941, "loss": 2.0254, "learning_rate": 6.23156115179833e-05, "epoch": 0.43052226743213867, "percentage": 43.05, "elapsed_time": "18:16:47", "remaining_time": "1 day, 0:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7725, "total_steps": 17941, "loss": 1.6787, "learning_rate": 6.230698142122629e-05, "epoch": 0.4305780056853018, "percentage": 43.06, "elapsed_time": "18:16:56", "remaining_time": "1 day, 0:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7726, "total_steps": 17941, "loss": 1.711, "learning_rate": 6.229835093416361e-05, "epoch": 0.430633743938465, "percentage": 43.06, "elapsed_time": "18:17:04", "remaining_time": "1 day, 0:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7727, "total_steps": 17941, "loss": 1.5921, "learning_rate": 6.228972005706893e-05, "epoch": 0.4306894821916281, "percentage": 43.07, "elapsed_time": "18:17:13", "remaining_time": "1 day, 0:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7728, "total_steps": 17941, "loss": 1.5798, "learning_rate": 6.228108879021599e-05, "epoch": 0.43074522044479124, "percentage": 43.07, "elapsed_time": "18:17:21", "remaining_time": "1 day, 0:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7729, "total_steps": 17941, "loss": 2.0899, "learning_rate": 6.22724571338785e-05, "epoch": 0.43080095869795443, "percentage": 43.08, "elapsed_time": "18:17:30", "remaining_time": "1 day, 0:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7730, "total_steps": 17941, "loss": 1.6937, "learning_rate": 6.226382508833026e-05, "epoch": 0.43085669695111756, "percentage": 43.09, "elapsed_time": "18:17:38", "remaining_time": "1 day, 0:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7731, "total_steps": 17941, "loss": 1.7363, "learning_rate": 6.225519265384495e-05, "epoch": 0.4309124352042807, "percentage": 43.09, "elapsed_time": "18:17:47", "remaining_time": "1 day, 0:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7732, "total_steps": 17941, "loss": 1.6438, "learning_rate": 6.22465598306964e-05, "epoch": 0.43096817345744387, "percentage": 43.1, "elapsed_time": "18:17:55", "remaining_time": "1 day, 0:09:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7733, "total_steps": 17941, "loss": 1.6701, "learning_rate": 6.223792661915838e-05, "epoch": 0.431023911710607, "percentage": 43.1, "elapsed_time": "18:18:04", "remaining_time": "1 day, 0:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7734, "total_steps": 17941, "loss": 1.6195, "learning_rate": 6.222929301950466e-05, "epoch": 0.43107964996377013, "percentage": 43.11, "elapsed_time": "18:18:12", "remaining_time": "1 day, 0:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7735, "total_steps": 17941, "loss": 1.852, "learning_rate": 6.222065903200908e-05, "epoch": 0.43113538821693326, "percentage": 43.11, "elapsed_time": "18:18:21", "remaining_time": "1 day, 0:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7736, "total_steps": 17941, "loss": 1.9739, "learning_rate": 6.221202465694545e-05, "epoch": 0.43119112647009644, "percentage": 43.12, "elapsed_time": "18:18:29", "remaining_time": "1 day, 0:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7737, "total_steps": 17941, "loss": 1.5755, "learning_rate": 6.22033898945876e-05, "epoch": 0.43124686472325957, "percentage": 43.12, "elapsed_time": "18:18:38", "remaining_time": "1 day, 0:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7738, "total_steps": 17941, "loss": 1.7666, "learning_rate": 6.219475474520936e-05, "epoch": 0.4313026029764227, "percentage": 43.13, "elapsed_time": "18:18:46", "remaining_time": "1 day, 0:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7739, "total_steps": 17941, "loss": 1.6721, "learning_rate": 6.218611920908461e-05, "epoch": 0.4313583412295859, "percentage": 43.14, "elapsed_time": "18:18:55", "remaining_time": "1 day, 0:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7740, "total_steps": 17941, "loss": 1.635, "learning_rate": 6.21774832864872e-05, "epoch": 0.431414079482749, "percentage": 43.14, "elapsed_time": "18:19:04", "remaining_time": "1 day, 0:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7741, "total_steps": 17941, "loss": 1.7878, "learning_rate": 6.216884697769104e-05, "epoch": 0.43146981773591214, "percentage": 43.15, "elapsed_time": "18:19:12", "remaining_time": "1 day, 0:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7742, "total_steps": 17941, "loss": 1.817, "learning_rate": 6.216021028296999e-05, "epoch": 0.4315255559890753, "percentage": 43.15, "elapsed_time": "18:19:21", "remaining_time": "1 day, 0:08:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7743, "total_steps": 17941, "loss": 1.6086, "learning_rate": 6.215157320259798e-05, "epoch": 0.43158129424223846, "percentage": 43.16, "elapsed_time": "18:19:29", "remaining_time": "1 day, 0:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7744, "total_steps": 17941, "loss": 1.7647, "learning_rate": 6.214293573684889e-05, "epoch": 0.4316370324954016, "percentage": 43.16, "elapsed_time": "18:19:38", "remaining_time": "1 day, 0:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7745, "total_steps": 17941, "loss": 2.0043, "learning_rate": 6.21342978859967e-05, "epoch": 0.4316927707485647, "percentage": 43.17, "elapsed_time": "18:19:47", "remaining_time": "1 day, 0:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7746, "total_steps": 17941, "loss": 1.7955, "learning_rate": 6.212565965031532e-05, "epoch": 0.4317485090017279, "percentage": 43.17, "elapsed_time": "18:19:56", "remaining_time": "1 day, 0:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7747, "total_steps": 17941, "loss": 1.6242, "learning_rate": 6.211702103007871e-05, "epoch": 0.431804247254891, "percentage": 43.18, "elapsed_time": "18:20:04", "remaining_time": "1 day, 0:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7748, "total_steps": 17941, "loss": 1.5951, "learning_rate": 6.210838202556085e-05, "epoch": 0.43185998550805416, "percentage": 43.19, "elapsed_time": "18:20:13", "remaining_time": "1 day, 0:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7749, "total_steps": 17941, "loss": 1.849, "learning_rate": 6.209974263703569e-05, "epoch": 0.43191572376121734, "percentage": 43.19, "elapsed_time": "18:20:21", "remaining_time": "1 day, 0:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7750, "total_steps": 17941, "loss": 1.7899, "learning_rate": 6.209110286477727e-05, "epoch": 0.43197146201438047, "percentage": 43.2, "elapsed_time": "18:20:30", "remaining_time": "1 day, 0:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7751, "total_steps": 17941, "loss": 1.8588, "learning_rate": 6.208246270905952e-05, "epoch": 0.4320272002675436, "percentage": 43.2, "elapsed_time": "18:20:38", "remaining_time": "1 day, 0:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7752, "total_steps": 17941, "loss": 1.7115, "learning_rate": 6.207382217015655e-05, "epoch": 0.4320829385207068, "percentage": 43.21, "elapsed_time": "18:20:46", "remaining_time": "1 day, 0:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7753, "total_steps": 17941, "loss": 1.7556, "learning_rate": 6.206518124834231e-05, "epoch": 0.4321386767738699, "percentage": 43.21, "elapsed_time": "18:20:55", "remaining_time": "1 day, 0:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7754, "total_steps": 17941, "loss": 1.4447, "learning_rate": 6.205653994389087e-05, "epoch": 0.43219441502703304, "percentage": 43.22, "elapsed_time": "18:21:03", "remaining_time": "1 day, 0:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7755, "total_steps": 17941, "loss": 1.7097, "learning_rate": 6.204789825707626e-05, "epoch": 0.4322501532801962, "percentage": 43.23, "elapsed_time": "18:21:12", "remaining_time": "1 day, 0:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7756, "total_steps": 17941, "loss": 1.6242, "learning_rate": 6.203925618817258e-05, "epoch": 0.43230589153335935, "percentage": 43.23, "elapsed_time": "18:21:20", "remaining_time": "1 day, 0:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7757, "total_steps": 17941, "loss": 1.6055, "learning_rate": 6.203061373745388e-05, "epoch": 0.4323616297865225, "percentage": 43.24, "elapsed_time": "18:21:29", "remaining_time": "1 day, 0:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7758, "total_steps": 17941, "loss": 1.6537, "learning_rate": 6.202197090519428e-05, "epoch": 0.4324173680396856, "percentage": 43.24, "elapsed_time": "18:21:37", "remaining_time": "1 day, 0:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7759, "total_steps": 17941, "loss": 1.5895, "learning_rate": 6.201332769166782e-05, "epoch": 0.4324731062928488, "percentage": 43.25, "elapsed_time": "18:21:46", "remaining_time": "1 day, 0:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7760, "total_steps": 17941, "loss": 1.6663, "learning_rate": 6.200468409714866e-05, "epoch": 0.4325288445460119, "percentage": 43.25, "elapsed_time": "18:21:54", "remaining_time": "1 day, 0:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7761, "total_steps": 17941, "loss": 1.6446, "learning_rate": 6.199604012191093e-05, "epoch": 0.43258458279917505, "percentage": 43.26, "elapsed_time": "18:22:03", "remaining_time": "1 day, 0:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7762, "total_steps": 17941, "loss": 1.8155, "learning_rate": 6.198739576622872e-05, "epoch": 0.43264032105233824, "percentage": 43.26, "elapsed_time": "18:22:11", "remaining_time": "1 day, 0:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7763, "total_steps": 17941, "loss": 1.6124, "learning_rate": 6.197875103037623e-05, "epoch": 0.43269605930550137, "percentage": 43.27, "elapsed_time": "18:22:20", "remaining_time": "1 day, 0:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7764, "total_steps": 17941, "loss": 1.72, "learning_rate": 6.197010591462758e-05, "epoch": 0.4327517975586645, "percentage": 43.28, "elapsed_time": "18:22:29", "remaining_time": "1 day, 0:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7765, "total_steps": 17941, "loss": 1.6948, "learning_rate": 6.196146041925697e-05, "epoch": 0.4328075358118277, "percentage": 43.28, "elapsed_time": "18:22:37", "remaining_time": "1 day, 0:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7766, "total_steps": 17941, "loss": 1.5966, "learning_rate": 6.195281454453858e-05, "epoch": 0.4328632740649908, "percentage": 43.29, "elapsed_time": "18:22:45", "remaining_time": "1 day, 0:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7767, "total_steps": 17941, "loss": 1.8594, "learning_rate": 6.19441682907466e-05, "epoch": 0.43291901231815394, "percentage": 43.29, "elapsed_time": "18:22:54", "remaining_time": "1 day, 0:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7768, "total_steps": 17941, "loss": 1.707, "learning_rate": 6.193552165815525e-05, "epoch": 0.43297475057131707, "percentage": 43.3, "elapsed_time": "18:23:02", "remaining_time": "1 day, 0:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7769, "total_steps": 17941, "loss": 1.3713, "learning_rate": 6.192687464703873e-05, "epoch": 0.43303048882448025, "percentage": 43.3, "elapsed_time": "18:23:11", "remaining_time": "1 day, 0:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7770, "total_steps": 17941, "loss": 1.7667, "learning_rate": 6.191822725767129e-05, "epoch": 0.4330862270776434, "percentage": 43.31, "elapsed_time": "18:23:19", "remaining_time": "1 day, 0:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7771, "total_steps": 17941, "loss": 1.688, "learning_rate": 6.190957949032716e-05, "epoch": 0.4331419653308065, "percentage": 43.31, "elapsed_time": "18:23:28", "remaining_time": "1 day, 0:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7772, "total_steps": 17941, "loss": 1.6081, "learning_rate": 6.190093134528061e-05, "epoch": 0.4331977035839697, "percentage": 43.32, "elapsed_time": "18:23:37", "remaining_time": "1 day, 0:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7773, "total_steps": 17941, "loss": 1.7503, "learning_rate": 6.189228282280592e-05, "epoch": 0.4332534418371328, "percentage": 43.33, "elapsed_time": "18:23:45", "remaining_time": "1 day, 0:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7774, "total_steps": 17941, "loss": 1.7848, "learning_rate": 6.188363392317734e-05, "epoch": 0.43330918009029595, "percentage": 43.33, "elapsed_time": "18:23:54", "remaining_time": "1 day, 0:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7775, "total_steps": 17941, "loss": 1.8112, "learning_rate": 6.187498464666917e-05, "epoch": 0.43336491834345914, "percentage": 43.34, "elapsed_time": "18:24:02", "remaining_time": "1 day, 0:03:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7776, "total_steps": 17941, "loss": 1.5268, "learning_rate": 6.186633499355576e-05, "epoch": 0.43342065659662227, "percentage": 43.34, "elapsed_time": "18:24:11", "remaining_time": "1 day, 0:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7777, "total_steps": 17941, "loss": 1.6839, "learning_rate": 6.185768496411135e-05, "epoch": 0.4334763948497854, "percentage": 43.35, "elapsed_time": "18:24:19", "remaining_time": "1 day, 0:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7778, "total_steps": 17941, "loss": 1.592, "learning_rate": 6.184903455861032e-05, "epoch": 0.4335321331029486, "percentage": 43.35, "elapsed_time": "18:24:28", "remaining_time": "1 day, 0:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7779, "total_steps": 17941, "loss": 1.7992, "learning_rate": 6.1840383777327e-05, "epoch": 0.4335878713561117, "percentage": 43.36, "elapsed_time": "18:24:37", "remaining_time": "1 day, 0:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7780, "total_steps": 17941, "loss": 1.76, "learning_rate": 6.183173262053575e-05, "epoch": 0.43364360960927484, "percentage": 43.36, "elapsed_time": "18:24:45", "remaining_time": "1 day, 0:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7781, "total_steps": 17941, "loss": 1.5548, "learning_rate": 6.182308108851091e-05, "epoch": 0.43369934786243797, "percentage": 43.37, "elapsed_time": "18:24:54", "remaining_time": "1 day, 0:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7782, "total_steps": 17941, "loss": 1.4981, "learning_rate": 6.18144291815269e-05, "epoch": 0.43375508611560115, "percentage": 43.38, "elapsed_time": "18:25:02", "remaining_time": "1 day, 0:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7783, "total_steps": 17941, "loss": 1.6661, "learning_rate": 6.180577689985805e-05, "epoch": 0.4338108243687643, "percentage": 43.38, "elapsed_time": "18:25:11", "remaining_time": "1 day, 0:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7784, "total_steps": 17941, "loss": 1.6262, "learning_rate": 6.179712424377879e-05, "epoch": 0.4338665626219274, "percentage": 43.39, "elapsed_time": "18:25:19", "remaining_time": "1 day, 0:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7785, "total_steps": 17941, "loss": 1.9091, "learning_rate": 6.178847121356353e-05, "epoch": 0.4339223008750906, "percentage": 43.39, "elapsed_time": "18:25:28", "remaining_time": "1 day, 0:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7786, "total_steps": 17941, "loss": 1.7357, "learning_rate": 6.17798178094867e-05, "epoch": 0.4339780391282537, "percentage": 43.4, "elapsed_time": "18:25:37", "remaining_time": "1 day, 0:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7787, "total_steps": 17941, "loss": 1.6313, "learning_rate": 6.177116403182274e-05, "epoch": 0.43403377738141685, "percentage": 43.4, "elapsed_time": "18:25:45", "remaining_time": "1 day, 0:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7788, "total_steps": 17941, "loss": 1.605, "learning_rate": 6.176250988084608e-05, "epoch": 0.43408951563458004, "percentage": 43.41, "elapsed_time": "18:25:54", "remaining_time": "1 day, 0:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7789, "total_steps": 17941, "loss": 1.5072, "learning_rate": 6.17538553568312e-05, "epoch": 0.43414525388774317, "percentage": 43.41, "elapsed_time": "18:26:02", "remaining_time": "1 day, 0:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7790, "total_steps": 17941, "loss": 1.769, "learning_rate": 6.174520046005253e-05, "epoch": 0.4342009921409063, "percentage": 43.42, "elapsed_time": "18:26:11", "remaining_time": "1 day, 0:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7791, "total_steps": 17941, "loss": 1.6427, "learning_rate": 6.17365451907846e-05, "epoch": 0.4342567303940694, "percentage": 43.43, "elapsed_time": "18:26:19", "remaining_time": "1 day, 0:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7792, "total_steps": 17941, "loss": 1.7614, "learning_rate": 6.172788954930188e-05, "epoch": 0.4343124686472326, "percentage": 43.43, "elapsed_time": "18:26:28", "remaining_time": "1 day, 0:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7793, "total_steps": 17941, "loss": 1.7932, "learning_rate": 6.171923353587888e-05, "epoch": 0.43436820690039574, "percentage": 43.44, "elapsed_time": "18:26:37", "remaining_time": "1 day, 0:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7794, "total_steps": 17941, "loss": 1.5032, "learning_rate": 6.171057715079012e-05, "epoch": 0.43442394515355887, "percentage": 43.44, "elapsed_time": "18:26:46", "remaining_time": "1 day, 0:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7795, "total_steps": 17941, "loss": 1.7822, "learning_rate": 6.170192039431013e-05, "epoch": 0.43447968340672205, "percentage": 43.45, "elapsed_time": "18:26:54", "remaining_time": "1 day, 0:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7796, "total_steps": 17941, "loss": 1.4389, "learning_rate": 6.169326326671346e-05, "epoch": 0.4345354216598852, "percentage": 43.45, "elapsed_time": "18:27:03", "remaining_time": "1 day, 0:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7797, "total_steps": 17941, "loss": 1.6287, "learning_rate": 6.168460576827465e-05, "epoch": 0.4345911599130483, "percentage": 43.46, "elapsed_time": "18:27:11", "remaining_time": "1 day, 0:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7798, "total_steps": 17941, "loss": 1.9769, "learning_rate": 6.167594789926827e-05, "epoch": 0.4346468981662115, "percentage": 43.46, "elapsed_time": "18:27:20", "remaining_time": "1 day, 0:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7799, "total_steps": 17941, "loss": 1.8077, "learning_rate": 6.16672896599689e-05, "epoch": 0.4347026364193746, "percentage": 43.47, "elapsed_time": "18:27:28", "remaining_time": "1 day, 0:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7800, "total_steps": 17941, "loss": 1.7451, "learning_rate": 6.165863105065113e-05, "epoch": 0.43475837467253775, "percentage": 43.48, "elapsed_time": "18:27:37", "remaining_time": "1 day, 0:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7801, "total_steps": 17941, "loss": 1.809, "learning_rate": 6.164997207158954e-05, "epoch": 0.43481411292570094, "percentage": 43.48, "elapsed_time": "18:27:45", "remaining_time": "23:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7802, "total_steps": 17941, "loss": 1.7839, "learning_rate": 6.164131272305878e-05, "epoch": 0.43486985117886406, "percentage": 43.49, "elapsed_time": "18:27:54", "remaining_time": "23:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7803, "total_steps": 17941, "loss": 1.6121, "learning_rate": 6.163265300533345e-05, "epoch": 0.4349255894320272, "percentage": 43.49, "elapsed_time": "18:28:02", "remaining_time": "23:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7804, "total_steps": 17941, "loss": 1.7024, "learning_rate": 6.162399291868819e-05, "epoch": 0.4349813276851903, "percentage": 43.5, "elapsed_time": "18:28:10", "remaining_time": "23:59:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7805, "total_steps": 17941, "loss": 1.702, "learning_rate": 6.161533246339764e-05, "epoch": 0.4350370659383535, "percentage": 43.5, "elapsed_time": "18:28:19", "remaining_time": "23:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7806, "total_steps": 17941, "loss": 1.7928, "learning_rate": 6.160667163973648e-05, "epoch": 0.43509280419151664, "percentage": 43.51, "elapsed_time": "18:28:28", "remaining_time": "23:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7807, "total_steps": 17941, "loss": 1.7094, "learning_rate": 6.159801044797936e-05, "epoch": 0.43514854244467976, "percentage": 43.51, "elapsed_time": "18:28:36", "remaining_time": "23:59:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7808, "total_steps": 17941, "loss": 1.4788, "learning_rate": 6.158934888840095e-05, "epoch": 0.43520428069784295, "percentage": 43.52, "elapsed_time": "18:28:44", "remaining_time": "23:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7809, "total_steps": 17941, "loss": 1.789, "learning_rate": 6.158068696127601e-05, "epoch": 0.4352600189510061, "percentage": 43.53, "elapsed_time": "18:28:53", "remaining_time": "23:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7810, "total_steps": 17941, "loss": 1.7309, "learning_rate": 6.157202466687916e-05, "epoch": 0.4353157572041692, "percentage": 43.53, "elapsed_time": "18:29:01", "remaining_time": "23:58:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7811, "total_steps": 17941, "loss": 1.7018, "learning_rate": 6.156336200548517e-05, "epoch": 0.4353714954573324, "percentage": 43.54, "elapsed_time": "18:29:10", "remaining_time": "23:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7812, "total_steps": 17941, "loss": 1.6621, "learning_rate": 6.155469897736874e-05, "epoch": 0.4354272337104955, "percentage": 43.54, "elapsed_time": "18:29:18", "remaining_time": "23:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7813, "total_steps": 17941, "loss": 1.7123, "learning_rate": 6.154603558280466e-05, "epoch": 0.43548297196365865, "percentage": 43.55, "elapsed_time": "18:29:27", "remaining_time": "23:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7814, "total_steps": 17941, "loss": 1.7392, "learning_rate": 6.153737182206762e-05, "epoch": 0.4355387102168218, "percentage": 43.55, "elapsed_time": "18:29:35", "remaining_time": "23:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7815, "total_steps": 17941, "loss": 1.5766, "learning_rate": 6.152870769543245e-05, "epoch": 0.43559444846998496, "percentage": 43.56, "elapsed_time": "18:29:44", "remaining_time": "23:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7816, "total_steps": 17941, "loss": 1.6999, "learning_rate": 6.152004320317385e-05, "epoch": 0.4356501867231481, "percentage": 43.57, "elapsed_time": "18:29:53", "remaining_time": "23:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7817, "total_steps": 17941, "loss": 1.569, "learning_rate": 6.151137834556666e-05, "epoch": 0.4357059249763112, "percentage": 43.57, "elapsed_time": "18:30:02", "remaining_time": "23:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7818, "total_steps": 17941, "loss": 1.9939, "learning_rate": 6.150271312288566e-05, "epoch": 0.4357616632294744, "percentage": 43.58, "elapsed_time": "18:30:11", "remaining_time": "23:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7819, "total_steps": 17941, "loss": 1.7254, "learning_rate": 6.149404753540567e-05, "epoch": 0.43581740148263753, "percentage": 43.58, "elapsed_time": "18:30:20", "remaining_time": "23:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7820, "total_steps": 17941, "loss": 2.0098, "learning_rate": 6.14853815834015e-05, "epoch": 0.43587313973580066, "percentage": 43.59, "elapsed_time": "18:30:28", "remaining_time": "23:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7821, "total_steps": 17941, "loss": 2.1957, "learning_rate": 6.1476715267148e-05, "epoch": 0.43592887798896385, "percentage": 43.59, "elapsed_time": "18:30:36", "remaining_time": "23:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7822, "total_steps": 17941, "loss": 1.614, "learning_rate": 6.146804858692001e-05, "epoch": 0.435984616242127, "percentage": 43.6, "elapsed_time": "18:30:45", "remaining_time": "23:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7823, "total_steps": 17941, "loss": 1.5681, "learning_rate": 6.145938154299237e-05, "epoch": 0.4360403544952901, "percentage": 43.6, "elapsed_time": "18:30:53", "remaining_time": "23:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7824, "total_steps": 17941, "loss": 1.8961, "learning_rate": 6.145071413563996e-05, "epoch": 0.4360960927484533, "percentage": 43.61, "elapsed_time": "18:31:02", "remaining_time": "23:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7825, "total_steps": 17941, "loss": 1.7469, "learning_rate": 6.144204636513767e-05, "epoch": 0.4361518310016164, "percentage": 43.62, "elapsed_time": "18:31:10", "remaining_time": "23:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7826, "total_steps": 17941, "loss": 1.8796, "learning_rate": 6.143337823176038e-05, "epoch": 0.43620756925477955, "percentage": 43.62, "elapsed_time": "18:31:19", "remaining_time": "23:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7827, "total_steps": 17941, "loss": 1.8995, "learning_rate": 6.142470973578299e-05, "epoch": 0.4362633075079427, "percentage": 43.63, "elapsed_time": "18:31:27", "remaining_time": "23:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7828, "total_steps": 17941, "loss": 1.544, "learning_rate": 6.141604087748043e-05, "epoch": 0.43631904576110586, "percentage": 43.63, "elapsed_time": "18:31:36", "remaining_time": "23:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7829, "total_steps": 17941, "loss": 1.7948, "learning_rate": 6.14073716571276e-05, "epoch": 0.436374784014269, "percentage": 43.64, "elapsed_time": "18:31:45", "remaining_time": "23:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7830, "total_steps": 17941, "loss": 1.6391, "learning_rate": 6.139870207499945e-05, "epoch": 0.4364305222674321, "percentage": 43.64, "elapsed_time": "18:31:54", "remaining_time": "23:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7831, "total_steps": 17941, "loss": 1.7099, "learning_rate": 6.139003213137092e-05, "epoch": 0.4364862605205953, "percentage": 43.65, "elapsed_time": "18:32:02", "remaining_time": "23:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7832, "total_steps": 17941, "loss": 1.5748, "learning_rate": 6.1381361826517e-05, "epoch": 0.43654199877375843, "percentage": 43.65, "elapsed_time": "18:32:10", "remaining_time": "23:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7833, "total_steps": 17941, "loss": 1.6389, "learning_rate": 6.137269116071263e-05, "epoch": 0.43659773702692156, "percentage": 43.66, "elapsed_time": "18:32:19", "remaining_time": "23:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7834, "total_steps": 17941, "loss": 1.7916, "learning_rate": 6.13640201342328e-05, "epoch": 0.43665347528008475, "percentage": 43.67, "elapsed_time": "18:32:27", "remaining_time": "23:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7835, "total_steps": 17941, "loss": 1.6772, "learning_rate": 6.135534874735253e-05, "epoch": 0.4367092135332479, "percentage": 43.67, "elapsed_time": "18:32:36", "remaining_time": "23:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7836, "total_steps": 17941, "loss": 1.6905, "learning_rate": 6.134667700034678e-05, "epoch": 0.436764951786411, "percentage": 43.68, "elapsed_time": "18:32:45", "remaining_time": "23:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7837, "total_steps": 17941, "loss": 1.4808, "learning_rate": 6.13380048934906e-05, "epoch": 0.43682069003957413, "percentage": 43.68, "elapsed_time": "18:32:53", "remaining_time": "23:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7838, "total_steps": 17941, "loss": 1.4744, "learning_rate": 6.132933242705899e-05, "epoch": 0.4368764282927373, "percentage": 43.69, "elapsed_time": "18:33:01", "remaining_time": "23:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7839, "total_steps": 17941, "loss": 1.5957, "learning_rate": 6.132065960132705e-05, "epoch": 0.43693216654590045, "percentage": 43.69, "elapsed_time": "18:33:10", "remaining_time": "23:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7840, "total_steps": 17941, "loss": 1.7756, "learning_rate": 6.131198641656976e-05, "epoch": 0.4369879047990636, "percentage": 43.7, "elapsed_time": "18:33:18", "remaining_time": "23:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7841, "total_steps": 17941, "loss": 1.8239, "learning_rate": 6.130331287306224e-05, "epoch": 0.43704364305222676, "percentage": 43.7, "elapsed_time": "18:33:27", "remaining_time": "23:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7842, "total_steps": 17941, "loss": 1.5446, "learning_rate": 6.129463897107951e-05, "epoch": 0.4370993813053899, "percentage": 43.71, "elapsed_time": "18:33:35", "remaining_time": "23:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7843, "total_steps": 17941, "loss": 1.7479, "learning_rate": 6.128596471089669e-05, "epoch": 0.437155119558553, "percentage": 43.72, "elapsed_time": "18:33:44", "remaining_time": "23:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7844, "total_steps": 17941, "loss": 1.5951, "learning_rate": 6.127729009278889e-05, "epoch": 0.4372108578117162, "percentage": 43.72, "elapsed_time": "18:33:52", "remaining_time": "23:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7845, "total_steps": 17941, "loss": 1.7609, "learning_rate": 6.126861511703119e-05, "epoch": 0.43726659606487933, "percentage": 43.73, "elapsed_time": "18:34:01", "remaining_time": "23:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7846, "total_steps": 17941, "loss": 1.559, "learning_rate": 6.125993978389871e-05, "epoch": 0.43732233431804246, "percentage": 43.73, "elapsed_time": "18:34:09", "remaining_time": "23:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7847, "total_steps": 17941, "loss": 1.8498, "learning_rate": 6.12512640936666e-05, "epoch": 0.43737807257120564, "percentage": 43.74, "elapsed_time": "18:34:18", "remaining_time": "23:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7848, "total_steps": 17941, "loss": 1.6316, "learning_rate": 6.124258804660999e-05, "epoch": 0.4374338108243688, "percentage": 43.74, "elapsed_time": "18:34:26", "remaining_time": "23:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7849, "total_steps": 17941, "loss": 1.5648, "learning_rate": 6.123391164300404e-05, "epoch": 0.4374895490775319, "percentage": 43.75, "elapsed_time": "18:34:34", "remaining_time": "23:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7850, "total_steps": 17941, "loss": 1.6624, "learning_rate": 6.12252348831239e-05, "epoch": 0.43754528733069503, "percentage": 43.75, "elapsed_time": "18:34:43", "remaining_time": "23:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7851, "total_steps": 17941, "loss": 1.617, "learning_rate": 6.121655776724475e-05, "epoch": 0.4376010255838582, "percentage": 43.76, "elapsed_time": "18:34:51", "remaining_time": "23:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7852, "total_steps": 17941, "loss": 1.6805, "learning_rate": 6.120788029564181e-05, "epoch": 0.43765676383702135, "percentage": 43.77, "elapsed_time": "18:35:00", "remaining_time": "23:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7853, "total_steps": 17941, "loss": 1.51, "learning_rate": 6.119920246859024e-05, "epoch": 0.4377125020901845, "percentage": 43.77, "elapsed_time": "18:35:08", "remaining_time": "23:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7854, "total_steps": 17941, "loss": 1.9405, "learning_rate": 6.119052428636529e-05, "epoch": 0.43776824034334766, "percentage": 43.78, "elapsed_time": "18:35:17", "remaining_time": "23:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7855, "total_steps": 17941, "loss": 1.6922, "learning_rate": 6.118184574924212e-05, "epoch": 0.4378239785965108, "percentage": 43.78, "elapsed_time": "18:35:25", "remaining_time": "23:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7856, "total_steps": 17941, "loss": 1.7829, "learning_rate": 6.1173166857496e-05, "epoch": 0.4378797168496739, "percentage": 43.79, "elapsed_time": "18:35:34", "remaining_time": "23:52:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7857, "total_steps": 17941, "loss": 1.9078, "learning_rate": 6.116448761140218e-05, "epoch": 0.4379354551028371, "percentage": 43.79, "elapsed_time": "18:35:42", "remaining_time": "23:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7858, "total_steps": 17941, "loss": 1.4085, "learning_rate": 6.11558080112359e-05, "epoch": 0.43799119335600023, "percentage": 43.8, "elapsed_time": "18:35:50", "remaining_time": "23:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7859, "total_steps": 17941, "loss": 1.8526, "learning_rate": 6.114712805727244e-05, "epoch": 0.43804693160916336, "percentage": 43.8, "elapsed_time": "18:35:59", "remaining_time": "23:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7860, "total_steps": 17941, "loss": 1.6052, "learning_rate": 6.113844774978706e-05, "epoch": 0.4381026698623265, "percentage": 43.81, "elapsed_time": "18:36:07", "remaining_time": "23:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7861, "total_steps": 17941, "loss": 1.7706, "learning_rate": 6.112976708905508e-05, "epoch": 0.4381584081154897, "percentage": 43.82, "elapsed_time": "18:36:16", "remaining_time": "23:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7862, "total_steps": 17941, "loss": 1.6883, "learning_rate": 6.112108607535176e-05, "epoch": 0.4382141463686528, "percentage": 43.82, "elapsed_time": "18:36:24", "remaining_time": "23:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7863, "total_steps": 17941, "loss": 1.4164, "learning_rate": 6.111240470895245e-05, "epoch": 0.43826988462181593, "percentage": 43.83, "elapsed_time": "18:36:33", "remaining_time": "23:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7864, "total_steps": 17941, "loss": 1.7575, "learning_rate": 6.110372299013243e-05, "epoch": 0.4383256228749791, "percentage": 43.83, "elapsed_time": "18:36:41", "remaining_time": "23:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7865, "total_steps": 17941, "loss": 1.825, "learning_rate": 6.109504091916707e-05, "epoch": 0.43838136112814224, "percentage": 43.84, "elapsed_time": "18:36:50", "remaining_time": "23:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7866, "total_steps": 17941, "loss": 1.5657, "learning_rate": 6.108635849633169e-05, "epoch": 0.4384370993813054, "percentage": 43.84, "elapsed_time": "18:36:58", "remaining_time": "23:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7867, "total_steps": 17941, "loss": 2.019, "learning_rate": 6.107767572190168e-05, "epoch": 0.43849283763446856, "percentage": 43.85, "elapsed_time": "18:37:07", "remaining_time": "23:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7868, "total_steps": 17941, "loss": 1.5383, "learning_rate": 6.106899259615236e-05, "epoch": 0.4385485758876317, "percentage": 43.85, "elapsed_time": "18:37:15", "remaining_time": "23:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7869, "total_steps": 17941, "loss": 1.8226, "learning_rate": 6.106030911935913e-05, "epoch": 0.4386043141407948, "percentage": 43.86, "elapsed_time": "18:37:24", "remaining_time": "23:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7870, "total_steps": 17941, "loss": 1.8757, "learning_rate": 6.105162529179738e-05, "epoch": 0.438660052393958, "percentage": 43.87, "elapsed_time": "18:37:32", "remaining_time": "23:50:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7871, "total_steps": 17941, "loss": 1.6836, "learning_rate": 6.104294111374252e-05, "epoch": 0.43871579064712113, "percentage": 43.87, "elapsed_time": "18:37:40", "remaining_time": "23:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7872, "total_steps": 17941, "loss": 1.7928, "learning_rate": 6.103425658546995e-05, "epoch": 0.43877152890028426, "percentage": 43.88, "elapsed_time": "18:37:49", "remaining_time": "23:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7873, "total_steps": 17941, "loss": 1.7313, "learning_rate": 6.1025571707255104e-05, "epoch": 0.4388272671534474, "percentage": 43.88, "elapsed_time": "18:37:57", "remaining_time": "23:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7874, "total_steps": 17941, "loss": 1.7947, "learning_rate": 6.10168864793734e-05, "epoch": 0.43888300540661057, "percentage": 43.89, "elapsed_time": "18:38:06", "remaining_time": "23:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7875, "total_steps": 17941, "loss": 1.5192, "learning_rate": 6.100820090210028e-05, "epoch": 0.4389387436597737, "percentage": 43.89, "elapsed_time": "18:38:14", "remaining_time": "23:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7876, "total_steps": 17941, "loss": 1.5993, "learning_rate": 6.099951497571123e-05, "epoch": 0.43899448191293683, "percentage": 43.9, "elapsed_time": "18:38:23", "remaining_time": "23:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7877, "total_steps": 17941, "loss": 1.8421, "learning_rate": 6.099082870048168e-05, "epoch": 0.4390502201661, "percentage": 43.91, "elapsed_time": "18:38:31", "remaining_time": "23:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7878, "total_steps": 17941, "loss": 1.5466, "learning_rate": 6.098214207668713e-05, "epoch": 0.43910595841926314, "percentage": 43.91, "elapsed_time": "18:38:40", "remaining_time": "23:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7879, "total_steps": 17941, "loss": 1.8151, "learning_rate": 6.097345510460307e-05, "epoch": 0.43916169667242627, "percentage": 43.92, "elapsed_time": "18:38:49", "remaining_time": "23:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7880, "total_steps": 17941, "loss": 1.6425, "learning_rate": 6.0964767784504995e-05, "epoch": 0.43921743492558946, "percentage": 43.92, "elapsed_time": "18:38:57", "remaining_time": "23:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7881, "total_steps": 17941, "loss": 1.7276, "learning_rate": 6.09560801166684e-05, "epoch": 0.4392731731787526, "percentage": 43.93, "elapsed_time": "18:39:06", "remaining_time": "23:48:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7882, "total_steps": 17941, "loss": 1.7726, "learning_rate": 6.094739210136883e-05, "epoch": 0.4393289114319157, "percentage": 43.93, "elapsed_time": "18:39:14", "remaining_time": "23:48:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7883, "total_steps": 17941, "loss": 1.6228, "learning_rate": 6.093870373888181e-05, "epoch": 0.43938464968507884, "percentage": 43.94, "elapsed_time": "18:39:23", "remaining_time": "23:48:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7884, "total_steps": 17941, "loss": 1.7197, "learning_rate": 6.093001502948289e-05, "epoch": 0.439440387938242, "percentage": 43.94, "elapsed_time": "18:39:31", "remaining_time": "23:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7885, "total_steps": 17941, "loss": 1.5778, "learning_rate": 6.0921325973447604e-05, "epoch": 0.43949612619140516, "percentage": 43.95, "elapsed_time": "18:39:40", "remaining_time": "23:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7886, "total_steps": 17941, "loss": 1.7891, "learning_rate": 6.091263657105155e-05, "epoch": 0.4395518644445683, "percentage": 43.96, "elapsed_time": "18:39:49", "remaining_time": "23:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7887, "total_steps": 17941, "loss": 1.5781, "learning_rate": 6.090394682257029e-05, "epoch": 0.43960760269773147, "percentage": 43.96, "elapsed_time": "18:39:57", "remaining_time": "23:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7888, "total_steps": 17941, "loss": 1.683, "learning_rate": 6.08952567282794e-05, "epoch": 0.4396633409508946, "percentage": 43.97, "elapsed_time": "18:40:05", "remaining_time": "23:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7889, "total_steps": 17941, "loss": 1.5673, "learning_rate": 6.0886566288454496e-05, "epoch": 0.43971907920405773, "percentage": 43.97, "elapsed_time": "18:40:14", "remaining_time": "23:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7890, "total_steps": 17941, "loss": 1.7352, "learning_rate": 6.0877875503371176e-05, "epoch": 0.4397748174572209, "percentage": 43.98, "elapsed_time": "18:40:23", "remaining_time": "23:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7891, "total_steps": 17941, "loss": 1.7736, "learning_rate": 6.086918437330508e-05, "epoch": 0.43983055571038404, "percentage": 43.98, "elapsed_time": "18:40:31", "remaining_time": "23:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7892, "total_steps": 17941, "loss": 1.7542, "learning_rate": 6.086049289853182e-05, "epoch": 0.43988629396354717, "percentage": 43.99, "elapsed_time": "18:40:40", "remaining_time": "23:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7893, "total_steps": 17941, "loss": 1.7245, "learning_rate": 6.0851801079327056e-05, "epoch": 0.43994203221671035, "percentage": 43.99, "elapsed_time": "18:40:48", "remaining_time": "23:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7894, "total_steps": 17941, "loss": 1.4047, "learning_rate": 6.0843108915966415e-05, "epoch": 0.4399977704698735, "percentage": 44.0, "elapsed_time": "18:40:56", "remaining_time": "23:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7895, "total_steps": 17941, "loss": 2.0188, "learning_rate": 6.083441640872558e-05, "epoch": 0.4400535087230366, "percentage": 44.01, "elapsed_time": "18:41:05", "remaining_time": "23:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7896, "total_steps": 17941, "loss": 1.5408, "learning_rate": 6.082572355788023e-05, "epoch": 0.44010924697619974, "percentage": 44.01, "elapsed_time": "18:41:13", "remaining_time": "23:46:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7897, "total_steps": 17941, "loss": 2.0136, "learning_rate": 6.081703036370606e-05, "epoch": 0.4401649852293629, "percentage": 44.02, "elapsed_time": "18:41:22", "remaining_time": "23:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7898, "total_steps": 17941, "loss": 1.6615, "learning_rate": 6.080833682647874e-05, "epoch": 0.44022072348252606, "percentage": 44.02, "elapsed_time": "18:41:30", "remaining_time": "23:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7899, "total_steps": 17941, "loss": 1.5859, "learning_rate": 6.0799642946473986e-05, "epoch": 0.4402764617356892, "percentage": 44.03, "elapsed_time": "18:41:39", "remaining_time": "23:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7900, "total_steps": 17941, "loss": 1.7462, "learning_rate": 6.079094872396754e-05, "epoch": 0.44033219998885237, "percentage": 44.03, "elapsed_time": "18:41:47", "remaining_time": "23:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7901, "total_steps": 17941, "loss": 1.736, "learning_rate": 6.0782254159235116e-05, "epoch": 0.4403879382420155, "percentage": 44.04, "elapsed_time": "18:41:56", "remaining_time": "23:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7902, "total_steps": 17941, "loss": 1.372, "learning_rate": 6.0773559252552446e-05, "epoch": 0.4404436764951786, "percentage": 44.04, "elapsed_time": "18:42:04", "remaining_time": "23:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7903, "total_steps": 17941, "loss": 1.7732, "learning_rate": 6.0764864004195286e-05, "epoch": 0.4404994147483418, "percentage": 44.05, "elapsed_time": "18:42:12", "remaining_time": "23:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7904, "total_steps": 17941, "loss": 1.8002, "learning_rate": 6.075616841443943e-05, "epoch": 0.44055515300150494, "percentage": 44.06, "elapsed_time": "18:42:21", "remaining_time": "23:45:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7905, "total_steps": 17941, "loss": 1.7832, "learning_rate": 6.07474724835606e-05, "epoch": 0.44061089125466807, "percentage": 44.06, "elapsed_time": "18:42:29", "remaining_time": "23:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7906, "total_steps": 17941, "loss": 1.9006, "learning_rate": 6.0738776211834615e-05, "epoch": 0.4406666295078312, "percentage": 44.07, "elapsed_time": "18:42:38", "remaining_time": "23:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7907, "total_steps": 17941, "loss": 1.8046, "learning_rate": 6.073007959953726e-05, "epoch": 0.4407223677609944, "percentage": 44.07, "elapsed_time": "18:42:46", "remaining_time": "23:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7908, "total_steps": 17941, "loss": 1.8318, "learning_rate": 6.0721382646944326e-05, "epoch": 0.4407781060141575, "percentage": 44.08, "elapsed_time": "18:42:55", "remaining_time": "23:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7909, "total_steps": 17941, "loss": 1.4663, "learning_rate": 6.0712685354331654e-05, "epoch": 0.44083384426732064, "percentage": 44.08, "elapsed_time": "18:43:03", "remaining_time": "23:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7910, "total_steps": 17941, "loss": 1.6231, "learning_rate": 6.0703987721975076e-05, "epoch": 0.4408895825204838, "percentage": 44.09, "elapsed_time": "18:43:12", "remaining_time": "23:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7911, "total_steps": 17941, "loss": 1.6668, "learning_rate": 6.0695289750150394e-05, "epoch": 0.44094532077364695, "percentage": 44.09, "elapsed_time": "18:43:20", "remaining_time": "23:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7912, "total_steps": 17941, "loss": 1.7711, "learning_rate": 6.068659143913349e-05, "epoch": 0.4410010590268101, "percentage": 44.1, "elapsed_time": "18:43:29", "remaining_time": "23:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7913, "total_steps": 17941, "loss": 1.7025, "learning_rate": 6.0677892789200216e-05, "epoch": 0.44105679727997327, "percentage": 44.11, "elapsed_time": "18:43:37", "remaining_time": "23:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7914, "total_steps": 17941, "loss": 1.7495, "learning_rate": 6.066919380062643e-05, "epoch": 0.4411125355331364, "percentage": 44.11, "elapsed_time": "18:43:46", "remaining_time": "23:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7915, "total_steps": 17941, "loss": 1.5988, "learning_rate": 6.066049447368802e-05, "epoch": 0.4411682737862995, "percentage": 44.12, "elapsed_time": "18:43:54", "remaining_time": "23:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7916, "total_steps": 17941, "loss": 1.7006, "learning_rate": 6.065179480866089e-05, "epoch": 0.4412240120394627, "percentage": 44.12, "elapsed_time": "18:44:02", "remaining_time": "23:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7917, "total_steps": 17941, "loss": 1.6275, "learning_rate": 6.064309480582093e-05, "epoch": 0.44127975029262584, "percentage": 44.13, "elapsed_time": "18:44:11", "remaining_time": "23:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7918, "total_steps": 17941, "loss": 1.8278, "learning_rate": 6.0634394465444056e-05, "epoch": 0.44133548854578897, "percentage": 44.13, "elapsed_time": "18:44:19", "remaining_time": "23:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7919, "total_steps": 17941, "loss": 1.724, "learning_rate": 6.062569378780621e-05, "epoch": 0.4413912267989521, "percentage": 44.14, "elapsed_time": "18:44:28", "remaining_time": "23:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7920, "total_steps": 17941, "loss": 1.706, "learning_rate": 6.061699277318328e-05, "epoch": 0.4414469650521153, "percentage": 44.14, "elapsed_time": "18:44:36", "remaining_time": "23:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7921, "total_steps": 17941, "loss": 1.7118, "learning_rate": 6.060829142185125e-05, "epoch": 0.4415027033052784, "percentage": 44.15, "elapsed_time": "18:44:45", "remaining_time": "23:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7922, "total_steps": 17941, "loss": 1.908, "learning_rate": 6.059958973408607e-05, "epoch": 0.44155844155844154, "percentage": 44.16, "elapsed_time": "18:44:53", "remaining_time": "23:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7923, "total_steps": 17941, "loss": 1.7077, "learning_rate": 6.05908877101637e-05, "epoch": 0.4416141798116047, "percentage": 44.16, "elapsed_time": "18:45:02", "remaining_time": "23:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7924, "total_steps": 17941, "loss": 1.6519, "learning_rate": 6.058218535036013e-05, "epoch": 0.44166991806476785, "percentage": 44.17, "elapsed_time": "18:45:10", "remaining_time": "23:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7925, "total_steps": 17941, "loss": 1.4665, "learning_rate": 6.057348265495133e-05, "epoch": 0.441725656317931, "percentage": 44.17, "elapsed_time": "18:45:18", "remaining_time": "23:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7926, "total_steps": 17941, "loss": 1.6157, "learning_rate": 6.0564779624213316e-05, "epoch": 0.44178139457109417, "percentage": 44.18, "elapsed_time": "18:45:27", "remaining_time": "23:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7927, "total_steps": 17941, "loss": 1.5828, "learning_rate": 6.055607625842208e-05, "epoch": 0.4418371328242573, "percentage": 44.18, "elapsed_time": "18:45:35", "remaining_time": "23:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7928, "total_steps": 17941, "loss": 1.6772, "learning_rate": 6.0547372557853655e-05, "epoch": 0.4418928710774204, "percentage": 44.19, "elapsed_time": "18:45:44", "remaining_time": "23:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7929, "total_steps": 17941, "loss": 1.7394, "learning_rate": 6.053866852278406e-05, "epoch": 0.44194860933058355, "percentage": 44.19, "elapsed_time": "18:45:52", "remaining_time": "23:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7930, "total_steps": 17941, "loss": 1.8231, "learning_rate": 6.052996415348936e-05, "epoch": 0.44200434758374674, "percentage": 44.2, "elapsed_time": "18:46:01", "remaining_time": "23:41:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7931, "total_steps": 17941, "loss": 1.6415, "learning_rate": 6.052125945024558e-05, "epoch": 0.44206008583690987, "percentage": 44.21, "elapsed_time": "18:46:09", "remaining_time": "23:41:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7932, "total_steps": 17941, "loss": 1.5515, "learning_rate": 6.05125544133288e-05, "epoch": 0.442115824090073, "percentage": 44.21, "elapsed_time": "18:46:18", "remaining_time": "23:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7933, "total_steps": 17941, "loss": 1.7348, "learning_rate": 6.050384904301508e-05, "epoch": 0.4421715623432362, "percentage": 44.22, "elapsed_time": "18:46:26", "remaining_time": "23:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7934, "total_steps": 17941, "loss": 1.6601, "learning_rate": 6.049514333958052e-05, "epoch": 0.4422273005963993, "percentage": 44.22, "elapsed_time": "18:46:35", "remaining_time": "23:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7935, "total_steps": 17941, "loss": 1.5493, "learning_rate": 6.048643730330119e-05, "epoch": 0.44228303884956244, "percentage": 44.23, "elapsed_time": "18:46:43", "remaining_time": "23:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7936, "total_steps": 17941, "loss": 1.5092, "learning_rate": 6.0477730934453226e-05, "epoch": 0.4423387771027256, "percentage": 44.23, "elapsed_time": "18:46:52", "remaining_time": "23:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7937, "total_steps": 17941, "loss": 1.4483, "learning_rate": 6.046902423331271e-05, "epoch": 0.44239451535588875, "percentage": 44.24, "elapsed_time": "18:47:00", "remaining_time": "23:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7938, "total_steps": 17941, "loss": 1.6987, "learning_rate": 6.046031720015579e-05, "epoch": 0.4424502536090519, "percentage": 44.25, "elapsed_time": "18:47:09", "remaining_time": "23:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7939, "total_steps": 17941, "loss": 1.8988, "learning_rate": 6.045160983525859e-05, "epoch": 0.44250599186221506, "percentage": 44.25, "elapsed_time": "18:47:17", "remaining_time": "23:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7940, "total_steps": 17941, "loss": 1.696, "learning_rate": 6.044290213889727e-05, "epoch": 0.4425617301153782, "percentage": 44.26, "elapsed_time": "18:47:26", "remaining_time": "23:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7941, "total_steps": 17941, "loss": 1.5279, "learning_rate": 6.0434194111347985e-05, "epoch": 0.4426174683685413, "percentage": 44.26, "elapsed_time": "18:47:34", "remaining_time": "23:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7942, "total_steps": 17941, "loss": 1.7109, "learning_rate": 6.042548575288689e-05, "epoch": 0.44267320662170445, "percentage": 44.27, "elapsed_time": "18:47:43", "remaining_time": "23:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7943, "total_steps": 17941, "loss": 1.4709, "learning_rate": 6.0416777063790184e-05, "epoch": 0.44272894487486764, "percentage": 44.27, "elapsed_time": "18:47:51", "remaining_time": "23:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7944, "total_steps": 17941, "loss": 1.6943, "learning_rate": 6.040806804433403e-05, "epoch": 0.44278468312803076, "percentage": 44.28, "elapsed_time": "18:48:00", "remaining_time": "23:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7945, "total_steps": 17941, "loss": 1.3918, "learning_rate": 6.0399358694794647e-05, "epoch": 0.4428404213811939, "percentage": 44.28, "elapsed_time": "18:48:08", "remaining_time": "23:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7946, "total_steps": 17941, "loss": 1.8103, "learning_rate": 6.039064901544824e-05, "epoch": 0.4428961596343571, "percentage": 44.29, "elapsed_time": "18:48:17", "remaining_time": "23:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7947, "total_steps": 17941, "loss": 1.7597, "learning_rate": 6.038193900657102e-05, "epoch": 0.4429518978875202, "percentage": 44.3, "elapsed_time": "18:48:26", "remaining_time": "23:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7948, "total_steps": 17941, "loss": 1.7671, "learning_rate": 6.037322866843923e-05, "epoch": 0.44300763614068334, "percentage": 44.3, "elapsed_time": "18:48:34", "remaining_time": "23:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7949, "total_steps": 17941, "loss": 1.7487, "learning_rate": 6.036451800132912e-05, "epoch": 0.4430633743938465, "percentage": 44.31, "elapsed_time": "18:48:43", "remaining_time": "23:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7950, "total_steps": 17941, "loss": 1.7112, "learning_rate": 6.03558070055169e-05, "epoch": 0.44311911264700965, "percentage": 44.31, "elapsed_time": "18:48:52", "remaining_time": "23:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7951, "total_steps": 17941, "loss": 1.7736, "learning_rate": 6.0347095681278876e-05, "epoch": 0.4431748509001728, "percentage": 44.32, "elapsed_time": "18:49:00", "remaining_time": "23:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7952, "total_steps": 17941, "loss": 1.7693, "learning_rate": 6.033838402889131e-05, "epoch": 0.4432305891533359, "percentage": 44.32, "elapsed_time": "18:49:09", "remaining_time": "23:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7953, "total_steps": 17941, "loss": 1.6216, "learning_rate": 6.032967204863048e-05, "epoch": 0.4432863274064991, "percentage": 44.33, "elapsed_time": "18:49:17", "remaining_time": "23:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7954, "total_steps": 17941, "loss": 1.7631, "learning_rate": 6.0320959740772666e-05, "epoch": 0.4433420656596622, "percentage": 44.33, "elapsed_time": "18:49:26", "remaining_time": "23:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7955, "total_steps": 17941, "loss": 1.6809, "learning_rate": 6.031224710559419e-05, "epoch": 0.44339780391282535, "percentage": 44.34, "elapsed_time": "18:49:34", "remaining_time": "23:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7956, "total_steps": 17941, "loss": 1.5357, "learning_rate": 6.0303534143371374e-05, "epoch": 0.44345354216598853, "percentage": 44.35, "elapsed_time": "18:49:43", "remaining_time": "23:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7957, "total_steps": 17941, "loss": 1.6955, "learning_rate": 6.029482085438051e-05, "epoch": 0.44350928041915166, "percentage": 44.35, "elapsed_time": "18:49:51", "remaining_time": "23:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7958, "total_steps": 17941, "loss": 1.762, "learning_rate": 6.028610723889797e-05, "epoch": 0.4435650186723148, "percentage": 44.36, "elapsed_time": "18:49:59", "remaining_time": "23:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7959, "total_steps": 17941, "loss": 1.4594, "learning_rate": 6.027739329720006e-05, "epoch": 0.443620756925478, "percentage": 44.36, "elapsed_time": "18:50:08", "remaining_time": "23:37:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7960, "total_steps": 17941, "loss": 1.7942, "learning_rate": 6.026867902956317e-05, "epoch": 0.4436764951786411, "percentage": 44.37, "elapsed_time": "18:50:16", "remaining_time": "23:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7961, "total_steps": 17941, "loss": 1.6659, "learning_rate": 6.025996443626364e-05, "epoch": 0.44373223343180423, "percentage": 44.37, "elapsed_time": "18:50:25", "remaining_time": "23:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7962, "total_steps": 17941, "loss": 1.9042, "learning_rate": 6.0251249517577854e-05, "epoch": 0.4437879716849674, "percentage": 44.38, "elapsed_time": "18:50:34", "remaining_time": "23:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7963, "total_steps": 17941, "loss": 1.6772, "learning_rate": 6.024253427378222e-05, "epoch": 0.44384370993813055, "percentage": 44.38, "elapsed_time": "18:50:42", "remaining_time": "23:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7964, "total_steps": 17941, "loss": 1.5868, "learning_rate": 6.0233818705153114e-05, "epoch": 0.4438994481912937, "percentage": 44.39, "elapsed_time": "18:50:50", "remaining_time": "23:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7965, "total_steps": 17941, "loss": 1.6118, "learning_rate": 6.022510281196695e-05, "epoch": 0.4439551864444568, "percentage": 44.4, "elapsed_time": "18:50:59", "remaining_time": "23:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7966, "total_steps": 17941, "loss": 1.4902, "learning_rate": 6.021638659450013e-05, "epoch": 0.44401092469762, "percentage": 44.4, "elapsed_time": "18:51:07", "remaining_time": "23:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7967, "total_steps": 17941, "loss": 1.5573, "learning_rate": 6.020767005302909e-05, "epoch": 0.4440666629507831, "percentage": 44.41, "elapsed_time": "18:51:16", "remaining_time": "23:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7968, "total_steps": 17941, "loss": 1.9599, "learning_rate": 6.0198953187830277e-05, "epoch": 0.44412240120394625, "percentage": 44.41, "elapsed_time": "18:51:24", "remaining_time": "23:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7969, "total_steps": 17941, "loss": 1.7111, "learning_rate": 6.019023599918014e-05, "epoch": 0.44417813945710943, "percentage": 44.42, "elapsed_time": "18:51:33", "remaining_time": "23:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7970, "total_steps": 17941, "loss": 1.6214, "learning_rate": 6.018151848735511e-05, "epoch": 0.44423387771027256, "percentage": 44.42, "elapsed_time": "18:51:42", "remaining_time": "23:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7971, "total_steps": 17941, "loss": 1.8074, "learning_rate": 6.01728006526317e-05, "epoch": 0.4442896159634357, "percentage": 44.43, "elapsed_time": "18:51:50", "remaining_time": "23:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7972, "total_steps": 17941, "loss": 1.6405, "learning_rate": 6.0164082495286354e-05, "epoch": 0.4443453542165989, "percentage": 44.43, "elapsed_time": "18:51:59", "remaining_time": "23:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7973, "total_steps": 17941, "loss": 1.4973, "learning_rate": 6.015536401559556e-05, "epoch": 0.444401092469762, "percentage": 44.44, "elapsed_time": "18:52:08", "remaining_time": "23:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7974, "total_steps": 17941, "loss": 1.8733, "learning_rate": 6.014664521383584e-05, "epoch": 0.44445683072292513, "percentage": 44.45, "elapsed_time": "18:52:16", "remaining_time": "23:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7975, "total_steps": 17941, "loss": 1.6334, "learning_rate": 6.0137926090283694e-05, "epoch": 0.44451256897608826, "percentage": 44.45, "elapsed_time": "18:52:25", "remaining_time": "23:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7976, "total_steps": 17941, "loss": 1.7995, "learning_rate": 6.0129206645215655e-05, "epoch": 0.44456830722925145, "percentage": 44.46, "elapsed_time": "18:52:33", "remaining_time": "23:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7977, "total_steps": 17941, "loss": 1.8132, "learning_rate": 6.012048687890821e-05, "epoch": 0.4446240454824146, "percentage": 44.46, "elapsed_time": "18:52:43", "remaining_time": "23:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7978, "total_steps": 17941, "loss": 1.9482, "learning_rate": 6.011176679163796e-05, "epoch": 0.4446797837355777, "percentage": 44.47, "elapsed_time": "18:52:51", "remaining_time": "23:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7979, "total_steps": 17941, "loss": 1.8485, "learning_rate": 6.010304638368139e-05, "epoch": 0.4447355219887409, "percentage": 44.47, "elapsed_time": "18:53:00", "remaining_time": "23:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7980, "total_steps": 17941, "loss": 1.6343, "learning_rate": 6.009432565531511e-05, "epoch": 0.444791260241904, "percentage": 44.48, "elapsed_time": "18:53:08", "remaining_time": "23:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7981, "total_steps": 17941, "loss": 1.721, "learning_rate": 6.008560460681567e-05, "epoch": 0.44484699849506715, "percentage": 44.48, "elapsed_time": "18:53:17", "remaining_time": "23:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7982, "total_steps": 17941, "loss": 1.5152, "learning_rate": 6.007688323845966e-05, "epoch": 0.44490273674823033, "percentage": 44.49, "elapsed_time": "18:53:25", "remaining_time": "23:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7983, "total_steps": 17941, "loss": 1.7975, "learning_rate": 6.006816155052366e-05, "epoch": 0.44495847500139346, "percentage": 44.5, "elapsed_time": "18:53:34", "remaining_time": "23:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7984, "total_steps": 17941, "loss": 1.7401, "learning_rate": 6.005943954328429e-05, "epoch": 0.4450142132545566, "percentage": 44.5, "elapsed_time": "18:53:42", "remaining_time": "23:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7985, "total_steps": 17941, "loss": 1.5525, "learning_rate": 6.005071721701814e-05, "epoch": 0.4450699515077198, "percentage": 44.51, "elapsed_time": "18:53:50", "remaining_time": "23:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7986, "total_steps": 17941, "loss": 1.8248, "learning_rate": 6.004199457200184e-05, "epoch": 0.4451256897608829, "percentage": 44.51, "elapsed_time": "18:53:59", "remaining_time": "23:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7987, "total_steps": 17941, "loss": 1.5985, "learning_rate": 6.003327160851201e-05, "epoch": 0.44518142801404603, "percentage": 44.52, "elapsed_time": "18:54:07", "remaining_time": "23:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7988, "total_steps": 17941, "loss": 1.4312, "learning_rate": 6.002454832682532e-05, "epoch": 0.44523716626720916, "percentage": 44.52, "elapsed_time": "18:54:16", "remaining_time": "23:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7989, "total_steps": 17941, "loss": 1.6288, "learning_rate": 6.00158247272184e-05, "epoch": 0.44529290452037235, "percentage": 44.53, "elapsed_time": "18:54:24", "remaining_time": "23:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7990, "total_steps": 17941, "loss": 1.2663, "learning_rate": 6.00071008099679e-05, "epoch": 0.4453486427735355, "percentage": 44.53, "elapsed_time": "18:54:33", "remaining_time": "23:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7991, "total_steps": 17941, "loss": 1.8037, "learning_rate": 5.999837657535052e-05, "epoch": 0.4454043810266986, "percentage": 44.54, "elapsed_time": "18:54:41", "remaining_time": "23:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7992, "total_steps": 17941, "loss": 1.6298, "learning_rate": 5.998965202364294e-05, "epoch": 0.4454601192798618, "percentage": 44.55, "elapsed_time": "18:54:50", "remaining_time": "23:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7993, "total_steps": 17941, "loss": 1.6349, "learning_rate": 5.998092715512183e-05, "epoch": 0.4455158575330249, "percentage": 44.55, "elapsed_time": "18:54:58", "remaining_time": "23:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7994, "total_steps": 17941, "loss": 1.5642, "learning_rate": 5.9972201970063904e-05, "epoch": 0.44557159578618805, "percentage": 44.56, "elapsed_time": "18:55:06", "remaining_time": "23:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7995, "total_steps": 17941, "loss": 1.6421, "learning_rate": 5.996347646874587e-05, "epoch": 0.44562733403935123, "percentage": 44.56, "elapsed_time": "18:55:15", "remaining_time": "23:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7996, "total_steps": 17941, "loss": 1.6171, "learning_rate": 5.9954750651444455e-05, "epoch": 0.44568307229251436, "percentage": 44.57, "elapsed_time": "18:55:23", "remaining_time": "23:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7997, "total_steps": 17941, "loss": 1.6702, "learning_rate": 5.9946024518436406e-05, "epoch": 0.4457388105456775, "percentage": 44.57, "elapsed_time": "18:55:32", "remaining_time": "23:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7998, "total_steps": 17941, "loss": 1.4339, "learning_rate": 5.9937298069998424e-05, "epoch": 0.4457945487988406, "percentage": 44.58, "elapsed_time": "18:55:40", "remaining_time": "23:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7999, "total_steps": 17941, "loss": 1.738, "learning_rate": 5.99285713064073e-05, "epoch": 0.4458502870520038, "percentage": 44.59, "elapsed_time": "18:55:49", "remaining_time": "23:31:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8000, "total_steps": 17941, "loss": 1.4481, "learning_rate": 5.991984422793977e-05, "epoch": 0.44590602530516693, "percentage": 44.59, "elapsed_time": "18:55:57", "remaining_time": "23:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8001, "total_steps": 17941, "loss": 1.7051, "learning_rate": 5.9911116834872624e-05, "epoch": 0.44596176355833006, "percentage": 44.6, "elapsed_time": "18:56:06", "remaining_time": "23:31:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8002, "total_steps": 17941, "loss": 1.7542, "learning_rate": 5.990238912748265e-05, "epoch": 0.44601750181149324, "percentage": 44.6, "elapsed_time": "18:56:14", "remaining_time": "23:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8003, "total_steps": 17941, "loss": 1.8245, "learning_rate": 5.989366110604662e-05, "epoch": 0.4460732400646564, "percentage": 44.61, "elapsed_time": "18:56:23", "remaining_time": "23:31:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8004, "total_steps": 17941, "loss": 1.7637, "learning_rate": 5.988493277084134e-05, "epoch": 0.4461289783178195, "percentage": 44.61, "elapsed_time": "18:56:31", "remaining_time": "23:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8005, "total_steps": 17941, "loss": 1.6303, "learning_rate": 5.9876204122143634e-05, "epoch": 0.4461847165709827, "percentage": 44.62, "elapsed_time": "18:56:39", "remaining_time": "23:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8006, "total_steps": 17941, "loss": 1.8505, "learning_rate": 5.98674751602303e-05, "epoch": 0.4462404548241458, "percentage": 44.62, "elapsed_time": "18:56:48", "remaining_time": "23:30:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8007, "total_steps": 17941, "loss": 1.6483, "learning_rate": 5.985874588537819e-05, "epoch": 0.44629619307730894, "percentage": 44.63, "elapsed_time": "18:56:56", "remaining_time": "23:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8008, "total_steps": 17941, "loss": 1.5566, "learning_rate": 5.985001629786415e-05, "epoch": 0.44635193133047213, "percentage": 44.64, "elapsed_time": "18:57:05", "remaining_time": "23:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8009, "total_steps": 17941, "loss": 1.7409, "learning_rate": 5.9841286397965014e-05, "epoch": 0.44640766958363526, "percentage": 44.64, "elapsed_time": "18:57:13", "remaining_time": "23:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8010, "total_steps": 17941, "loss": 1.712, "learning_rate": 5.983255618595767e-05, "epoch": 0.4464634078367984, "percentage": 44.65, "elapsed_time": "18:57:22", "remaining_time": "23:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8011, "total_steps": 17941, "loss": 1.7699, "learning_rate": 5.982382566211895e-05, "epoch": 0.4465191460899615, "percentage": 44.65, "elapsed_time": "18:57:31", "remaining_time": "23:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8012, "total_steps": 17941, "loss": 1.862, "learning_rate": 5.981509482672576e-05, "epoch": 0.4465748843431247, "percentage": 44.66, "elapsed_time": "18:57:39", "remaining_time": "23:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8013, "total_steps": 17941, "loss": 1.5174, "learning_rate": 5.980636368005499e-05, "epoch": 0.44663062259628783, "percentage": 44.66, "elapsed_time": "18:57:48", "remaining_time": "23:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8014, "total_steps": 17941, "loss": 1.8425, "learning_rate": 5.979763222238354e-05, "epoch": 0.44668636084945096, "percentage": 44.67, "elapsed_time": "18:57:56", "remaining_time": "23:29:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8015, "total_steps": 17941, "loss": 1.7243, "learning_rate": 5.978890045398833e-05, "epoch": 0.44674209910261414, "percentage": 44.67, "elapsed_time": "18:58:05", "remaining_time": "23:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8016, "total_steps": 17941, "loss": 1.8003, "learning_rate": 5.978016837514625e-05, "epoch": 0.44679783735577727, "percentage": 44.68, "elapsed_time": "18:58:13", "remaining_time": "23:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8017, "total_steps": 17941, "loss": 1.648, "learning_rate": 5.9771435986134274e-05, "epoch": 0.4468535756089404, "percentage": 44.69, "elapsed_time": "18:58:22", "remaining_time": "23:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8018, "total_steps": 17941, "loss": 1.5867, "learning_rate": 5.9762703287229304e-05, "epoch": 0.4469093138621036, "percentage": 44.69, "elapsed_time": "18:58:30", "remaining_time": "23:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8019, "total_steps": 17941, "loss": 1.656, "learning_rate": 5.975397027870831e-05, "epoch": 0.4469650521152667, "percentage": 44.7, "elapsed_time": "18:58:39", "remaining_time": "23:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8020, "total_steps": 17941, "loss": 1.6628, "learning_rate": 5.974523696084825e-05, "epoch": 0.44702079036842984, "percentage": 44.7, "elapsed_time": "18:58:48", "remaining_time": "23:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8021, "total_steps": 17941, "loss": 1.4316, "learning_rate": 5.97365033339261e-05, "epoch": 0.447076528621593, "percentage": 44.71, "elapsed_time": "18:58:56", "remaining_time": "23:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8022, "total_steps": 17941, "loss": 1.4696, "learning_rate": 5.972776939821883e-05, "epoch": 0.44713226687475616, "percentage": 44.71, "elapsed_time": "18:59:06", "remaining_time": "23:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8023, "total_steps": 17941, "loss": 1.7885, "learning_rate": 5.971903515400342e-05, "epoch": 0.4471880051279193, "percentage": 44.72, "elapsed_time": "18:59:15", "remaining_time": "23:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8024, "total_steps": 17941, "loss": 1.6956, "learning_rate": 5.971030060155689e-05, "epoch": 0.4472437433810824, "percentage": 44.72, "elapsed_time": "18:59:23", "remaining_time": "23:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8025, "total_steps": 17941, "loss": 1.5434, "learning_rate": 5.970156574115623e-05, "epoch": 0.4472994816342456, "percentage": 44.73, "elapsed_time": "18:59:31", "remaining_time": "23:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8026, "total_steps": 17941, "loss": 1.5207, "learning_rate": 5.969283057307847e-05, "epoch": 0.44735521988740873, "percentage": 44.74, "elapsed_time": "18:59:40", "remaining_time": "23:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8027, "total_steps": 17941, "loss": 1.6211, "learning_rate": 5.9684095097600645e-05, "epoch": 0.44741095814057186, "percentage": 44.74, "elapsed_time": "18:59:48", "remaining_time": "23:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8028, "total_steps": 17941, "loss": 1.7282, "learning_rate": 5.967535931499979e-05, "epoch": 0.44746669639373504, "percentage": 44.75, "elapsed_time": "18:59:57", "remaining_time": "23:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8029, "total_steps": 17941, "loss": 1.822, "learning_rate": 5.966662322555294e-05, "epoch": 0.44752243464689817, "percentage": 44.75, "elapsed_time": "19:00:05", "remaining_time": "23:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8030, "total_steps": 17941, "loss": 1.6235, "learning_rate": 5.965788682953717e-05, "epoch": 0.4475781729000613, "percentage": 44.76, "elapsed_time": "19:00:14", "remaining_time": "23:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8031, "total_steps": 17941, "loss": 1.8248, "learning_rate": 5.9649150127229534e-05, "epoch": 0.4476339111532245, "percentage": 44.76, "elapsed_time": "19:00:22", "remaining_time": "23:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8032, "total_steps": 17941, "loss": 1.5738, "learning_rate": 5.964041311890711e-05, "epoch": 0.4476896494063876, "percentage": 44.77, "elapsed_time": "19:00:31", "remaining_time": "23:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8033, "total_steps": 17941, "loss": 1.5644, "learning_rate": 5.9631675804846985e-05, "epoch": 0.44774538765955074, "percentage": 44.77, "elapsed_time": "19:00:39", "remaining_time": "23:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8034, "total_steps": 17941, "loss": 1.6785, "learning_rate": 5.962293818532628e-05, "epoch": 0.44780112591271387, "percentage": 44.78, "elapsed_time": "19:00:47", "remaining_time": "23:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8035, "total_steps": 17941, "loss": 1.7991, "learning_rate": 5.9614200260622066e-05, "epoch": 0.44785686416587706, "percentage": 44.79, "elapsed_time": "19:00:56", "remaining_time": "23:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8036, "total_steps": 17941, "loss": 1.6311, "learning_rate": 5.960546203101148e-05, "epoch": 0.4479126024190402, "percentage": 44.79, "elapsed_time": "19:01:04", "remaining_time": "23:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8037, "total_steps": 17941, "loss": 1.4416, "learning_rate": 5.959672349677163e-05, "epoch": 0.4479683406722033, "percentage": 44.8, "elapsed_time": "19:01:13", "remaining_time": "23:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8038, "total_steps": 17941, "loss": 1.8168, "learning_rate": 5.9587984658179676e-05, "epoch": 0.4480240789253665, "percentage": 44.8, "elapsed_time": "19:01:21", "remaining_time": "23:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8039, "total_steps": 17941, "loss": 1.6999, "learning_rate": 5.957924551551275e-05, "epoch": 0.4480798171785296, "percentage": 44.81, "elapsed_time": "19:01:30", "remaining_time": "23:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8040, "total_steps": 17941, "loss": 1.7066, "learning_rate": 5.9570506069048e-05, "epoch": 0.44813555543169276, "percentage": 44.81, "elapsed_time": "19:01:39", "remaining_time": "23:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8041, "total_steps": 17941, "loss": 1.6468, "learning_rate": 5.95617663190626e-05, "epoch": 0.44819129368485594, "percentage": 44.82, "elapsed_time": "19:01:48", "remaining_time": "23:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8042, "total_steps": 17941, "loss": 1.8804, "learning_rate": 5.955302626583374e-05, "epoch": 0.44824703193801907, "percentage": 44.82, "elapsed_time": "19:01:56", "remaining_time": "23:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8043, "total_steps": 17941, "loss": 1.4389, "learning_rate": 5.9544285909638566e-05, "epoch": 0.4483027701911822, "percentage": 44.83, "elapsed_time": "19:02:05", "remaining_time": "23:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8044, "total_steps": 17941, "loss": 1.9128, "learning_rate": 5.953554525075429e-05, "epoch": 0.4483585084443453, "percentage": 44.84, "elapsed_time": "19:02:13", "remaining_time": "23:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8045, "total_steps": 17941, "loss": 1.5926, "learning_rate": 5.952680428945812e-05, "epoch": 0.4484142466975085, "percentage": 44.84, "elapsed_time": "19:02:22", "remaining_time": "23:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8046, "total_steps": 17941, "loss": 1.6805, "learning_rate": 5.951806302602725e-05, "epoch": 0.44846998495067164, "percentage": 44.85, "elapsed_time": "19:02:30", "remaining_time": "23:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8047, "total_steps": 17941, "loss": 1.6863, "learning_rate": 5.950932146073893e-05, "epoch": 0.44852572320383477, "percentage": 44.85, "elapsed_time": "19:02:39", "remaining_time": "23:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8048, "total_steps": 17941, "loss": 1.695, "learning_rate": 5.950057959387038e-05, "epoch": 0.44858146145699795, "percentage": 44.86, "elapsed_time": "19:02:48", "remaining_time": "23:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8049, "total_steps": 17941, "loss": 1.3978, "learning_rate": 5.9491837425698816e-05, "epoch": 0.4486371997101611, "percentage": 44.86, "elapsed_time": "19:02:56", "remaining_time": "23:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8050, "total_steps": 17941, "loss": 1.3862, "learning_rate": 5.948309495650153e-05, "epoch": 0.4486929379633242, "percentage": 44.87, "elapsed_time": "19:03:05", "remaining_time": "23:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8051, "total_steps": 17941, "loss": 1.744, "learning_rate": 5.947435218655576e-05, "epoch": 0.4487486762164874, "percentage": 44.87, "elapsed_time": "19:03:13", "remaining_time": "23:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8052, "total_steps": 17941, "loss": 1.9782, "learning_rate": 5.946560911613877e-05, "epoch": 0.4488044144696505, "percentage": 44.88, "elapsed_time": "19:03:22", "remaining_time": "23:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8053, "total_steps": 17941, "loss": 1.6861, "learning_rate": 5.945686574552785e-05, "epoch": 0.44886015272281365, "percentage": 44.89, "elapsed_time": "19:03:30", "remaining_time": "23:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8054, "total_steps": 17941, "loss": 1.8577, "learning_rate": 5.944812207500029e-05, "epoch": 0.44891589097597684, "percentage": 44.89, "elapsed_time": "19:03:39", "remaining_time": "23:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8055, "total_steps": 17941, "loss": 1.8143, "learning_rate": 5.943937810483338e-05, "epoch": 0.44897162922913997, "percentage": 44.9, "elapsed_time": "19:03:47", "remaining_time": "23:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8056, "total_steps": 17941, "loss": 1.7183, "learning_rate": 5.943063383530444e-05, "epoch": 0.4490273674823031, "percentage": 44.9, "elapsed_time": "19:03:56", "remaining_time": "23:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8057, "total_steps": 17941, "loss": 1.5619, "learning_rate": 5.942188926669077e-05, "epoch": 0.4490831057354662, "percentage": 44.91, "elapsed_time": "19:04:04", "remaining_time": "23:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8058, "total_steps": 17941, "loss": 1.8049, "learning_rate": 5.941314439926969e-05, "epoch": 0.4491388439886294, "percentage": 44.91, "elapsed_time": "19:04:12", "remaining_time": "23:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8059, "total_steps": 17941, "loss": 1.9301, "learning_rate": 5.940439923331857e-05, "epoch": 0.44919458224179254, "percentage": 44.92, "elapsed_time": "19:04:21", "remaining_time": "23:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8060, "total_steps": 17941, "loss": 1.6145, "learning_rate": 5.939565376911475e-05, "epoch": 0.44925032049495567, "percentage": 44.93, "elapsed_time": "19:04:29", "remaining_time": "23:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8061, "total_steps": 17941, "loss": 1.7435, "learning_rate": 5.938690800693556e-05, "epoch": 0.44930605874811885, "percentage": 44.93, "elapsed_time": "19:04:38", "remaining_time": "23:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8062, "total_steps": 17941, "loss": 1.7497, "learning_rate": 5.937816194705838e-05, "epoch": 0.449361797001282, "percentage": 44.94, "elapsed_time": "19:04:46", "remaining_time": "23:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8063, "total_steps": 17941, "loss": 1.6565, "learning_rate": 5.936941558976058e-05, "epoch": 0.4494175352544451, "percentage": 44.94, "elapsed_time": "19:04:55", "remaining_time": "23:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8064, "total_steps": 17941, "loss": 1.6147, "learning_rate": 5.936066893531954e-05, "epoch": 0.4494732735076083, "percentage": 44.95, "elapsed_time": "19:05:03", "remaining_time": "23:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8065, "total_steps": 17941, "loss": 1.652, "learning_rate": 5.9351921984012657e-05, "epoch": 0.4495290117607714, "percentage": 44.95, "elapsed_time": "19:05:12", "remaining_time": "23:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8066, "total_steps": 17941, "loss": 1.7302, "learning_rate": 5.934317473611734e-05, "epoch": 0.44958475001393455, "percentage": 44.96, "elapsed_time": "19:05:20", "remaining_time": "23:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8067, "total_steps": 17941, "loss": 1.6976, "learning_rate": 5.9334427191911e-05, "epoch": 0.4496404882670977, "percentage": 44.96, "elapsed_time": "19:05:28", "remaining_time": "23:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8068, "total_steps": 17941, "loss": 1.5901, "learning_rate": 5.932567935167104e-05, "epoch": 0.44969622652026087, "percentage": 44.97, "elapsed_time": "19:05:37", "remaining_time": "23:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8069, "total_steps": 17941, "loss": 1.7005, "learning_rate": 5.931693121567492e-05, "epoch": 0.449751964773424, "percentage": 44.98, "elapsed_time": "19:05:45", "remaining_time": "23:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8070, "total_steps": 17941, "loss": 1.8827, "learning_rate": 5.930818278420005e-05, "epoch": 0.4498077030265871, "percentage": 44.98, "elapsed_time": "19:05:54", "remaining_time": "23:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8071, "total_steps": 17941, "loss": 1.6689, "learning_rate": 5.9299434057523894e-05, "epoch": 0.4498634412797503, "percentage": 44.99, "elapsed_time": "19:06:02", "remaining_time": "23:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8072, "total_steps": 17941, "loss": 1.1558, "learning_rate": 5.929068503592391e-05, "epoch": 0.44991917953291344, "percentage": 44.99, "elapsed_time": "19:06:11", "remaining_time": "23:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8073, "total_steps": 17941, "loss": 1.7916, "learning_rate": 5.9281935719677574e-05, "epoch": 0.44997491778607657, "percentage": 45.0, "elapsed_time": "19:06:19", "remaining_time": "23:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8074, "total_steps": 17941, "loss": 1.6458, "learning_rate": 5.927318610906234e-05, "epoch": 0.45003065603923975, "percentage": 45.0, "elapsed_time": "19:06:28", "remaining_time": "23:21:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8075, "total_steps": 17941, "loss": 1.754, "learning_rate": 5.9264436204355724e-05, "epoch": 0.4500863942924029, "percentage": 45.01, "elapsed_time": "19:06:36", "remaining_time": "23:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8076, "total_steps": 17941, "loss": 1.7992, "learning_rate": 5.92556860058352e-05, "epoch": 0.450142132545566, "percentage": 45.01, "elapsed_time": "19:06:44", "remaining_time": "23:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8077, "total_steps": 17941, "loss": 1.6756, "learning_rate": 5.9246935513778276e-05, "epoch": 0.4501978707987292, "percentage": 45.02, "elapsed_time": "19:06:53", "remaining_time": "23:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8078, "total_steps": 17941, "loss": 1.6423, "learning_rate": 5.923818472846248e-05, "epoch": 0.4502536090518923, "percentage": 45.03, "elapsed_time": "19:07:01", "remaining_time": "23:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8079, "total_steps": 17941, "loss": 1.7708, "learning_rate": 5.922943365016531e-05, "epoch": 0.45030934730505545, "percentage": 45.03, "elapsed_time": "19:07:10", "remaining_time": "23:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8080, "total_steps": 17941, "loss": 1.7107, "learning_rate": 5.922068227916433e-05, "epoch": 0.4503650855582186, "percentage": 45.04, "elapsed_time": "19:07:18", "remaining_time": "23:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8081, "total_steps": 17941, "loss": 1.801, "learning_rate": 5.9211930615737066e-05, "epoch": 0.45042082381138177, "percentage": 45.04, "elapsed_time": "19:07:27", "remaining_time": "23:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8082, "total_steps": 17941, "loss": 1.6317, "learning_rate": 5.920317866016108e-05, "epoch": 0.4504765620645449, "percentage": 45.05, "elapsed_time": "19:07:35", "remaining_time": "23:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8083, "total_steps": 17941, "loss": 1.6841, "learning_rate": 5.919442641271391e-05, "epoch": 0.450532300317708, "percentage": 45.05, "elapsed_time": "19:07:44", "remaining_time": "23:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8084, "total_steps": 17941, "loss": 1.3761, "learning_rate": 5.9185673873673154e-05, "epoch": 0.4505880385708712, "percentage": 45.06, "elapsed_time": "19:07:52", "remaining_time": "23:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8085, "total_steps": 17941, "loss": 1.9012, "learning_rate": 5.917692104331637e-05, "epoch": 0.45064377682403434, "percentage": 45.06, "elapsed_time": "19:08:01", "remaining_time": "23:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8086, "total_steps": 17941, "loss": 1.8825, "learning_rate": 5.916816792192116e-05, "epoch": 0.45069951507719747, "percentage": 45.07, "elapsed_time": "19:08:09", "remaining_time": "23:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8087, "total_steps": 17941, "loss": 1.6097, "learning_rate": 5.915941450976512e-05, "epoch": 0.45075525333036065, "percentage": 45.08, "elapsed_time": "19:08:18", "remaining_time": "23:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8088, "total_steps": 17941, "loss": 1.7299, "learning_rate": 5.9150660807125844e-05, "epoch": 0.4508109915835238, "percentage": 45.08, "elapsed_time": "19:08:26", "remaining_time": "23:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8089, "total_steps": 17941, "loss": 1.818, "learning_rate": 5.9141906814280975e-05, "epoch": 0.4508667298366869, "percentage": 45.09, "elapsed_time": "19:08:34", "remaining_time": "23:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8090, "total_steps": 17941, "loss": 1.8804, "learning_rate": 5.9133152531508106e-05, "epoch": 0.45092246808985004, "percentage": 45.09, "elapsed_time": "19:08:43", "remaining_time": "23:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8091, "total_steps": 17941, "loss": 1.6162, "learning_rate": 5.91243979590849e-05, "epoch": 0.4509782063430132, "percentage": 45.1, "elapsed_time": "19:08:52", "remaining_time": "23:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8092, "total_steps": 17941, "loss": 1.7833, "learning_rate": 5.911564309728899e-05, "epoch": 0.45103394459617635, "percentage": 45.1, "elapsed_time": "19:09:00", "remaining_time": "23:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8093, "total_steps": 17941, "loss": 1.5982, "learning_rate": 5.910688794639803e-05, "epoch": 0.4510896828493395, "percentage": 45.11, "elapsed_time": "19:09:09", "remaining_time": "23:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8094, "total_steps": 17941, "loss": 1.8386, "learning_rate": 5.909813250668967e-05, "epoch": 0.45114542110250266, "percentage": 45.11, "elapsed_time": "19:09:17", "remaining_time": "23:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8095, "total_steps": 17941, "loss": 1.748, "learning_rate": 5.9089376778441606e-05, "epoch": 0.4512011593556658, "percentage": 45.12, "elapsed_time": "19:09:26", "remaining_time": "23:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8096, "total_steps": 17941, "loss": 1.4871, "learning_rate": 5.908062076193149e-05, "epoch": 0.4512568976088289, "percentage": 45.13, "elapsed_time": "19:09:34", "remaining_time": "23:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8097, "total_steps": 17941, "loss": 1.4985, "learning_rate": 5.907186445743704e-05, "epoch": 0.4513126358619921, "percentage": 45.13, "elapsed_time": "19:09:42", "remaining_time": "23:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8098, "total_steps": 17941, "loss": 1.7953, "learning_rate": 5.9063107865235936e-05, "epoch": 0.45136837411515524, "percentage": 45.14, "elapsed_time": "19:09:51", "remaining_time": "23:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8099, "total_steps": 17941, "loss": 1.4848, "learning_rate": 5.90543509856059e-05, "epoch": 0.45142411236831836, "percentage": 45.14, "elapsed_time": "19:10:00", "remaining_time": "23:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8100, "total_steps": 17941, "loss": 1.8602, "learning_rate": 5.904559381882463e-05, "epoch": 0.45147985062148155, "percentage": 45.15, "elapsed_time": "19:10:09", "remaining_time": "23:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8101, "total_steps": 17941, "loss": 1.7242, "learning_rate": 5.9036836365169865e-05, "epoch": 0.4515355888746447, "percentage": 45.15, "elapsed_time": "19:10:18", "remaining_time": "23:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8102, "total_steps": 17941, "loss": 1.4976, "learning_rate": 5.9028078624919344e-05, "epoch": 0.4515913271278078, "percentage": 45.16, "elapsed_time": "19:10:26", "remaining_time": "23:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8103, "total_steps": 17941, "loss": 1.667, "learning_rate": 5.901932059835081e-05, "epoch": 0.45164706538097094, "percentage": 45.16, "elapsed_time": "19:10:34", "remaining_time": "23:16:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8104, "total_steps": 17941, "loss": 1.5909, "learning_rate": 5.9010562285742e-05, "epoch": 0.4517028036341341, "percentage": 45.17, "elapsed_time": "19:10:43", "remaining_time": "23:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8105, "total_steps": 17941, "loss": 1.6947, "learning_rate": 5.9001803687370696e-05, "epoch": 0.45175854188729725, "percentage": 45.18, "elapsed_time": "19:10:51", "remaining_time": "23:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8106, "total_steps": 17941, "loss": 1.4796, "learning_rate": 5.8993044803514674e-05, "epoch": 0.4518142801404604, "percentage": 45.18, "elapsed_time": "19:11:00", "remaining_time": "23:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8107, "total_steps": 17941, "loss": 1.8176, "learning_rate": 5.8984285634451695e-05, "epoch": 0.45187001839362356, "percentage": 45.19, "elapsed_time": "19:11:08", "remaining_time": "23:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8108, "total_steps": 17941, "loss": 1.6067, "learning_rate": 5.897552618045956e-05, "epoch": 0.4519257566467867, "percentage": 45.19, "elapsed_time": "19:11:17", "remaining_time": "23:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8109, "total_steps": 17941, "loss": 1.6761, "learning_rate": 5.896676644181607e-05, "epoch": 0.4519814948999498, "percentage": 45.2, "elapsed_time": "19:11:25", "remaining_time": "23:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8110, "total_steps": 17941, "loss": 1.8323, "learning_rate": 5.8958006418799005e-05, "epoch": 0.452037233153113, "percentage": 45.2, "elapsed_time": "19:11:34", "remaining_time": "23:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8111, "total_steps": 17941, "loss": 1.865, "learning_rate": 5.894924611168622e-05, "epoch": 0.45209297140627613, "percentage": 45.21, "elapsed_time": "19:11:42", "remaining_time": "23:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8112, "total_steps": 17941, "loss": 1.8, "learning_rate": 5.894048552075554e-05, "epoch": 0.45214870965943926, "percentage": 45.21, "elapsed_time": "19:11:50", "remaining_time": "23:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8113, "total_steps": 17941, "loss": 1.4806, "learning_rate": 5.893172464628477e-05, "epoch": 0.4522044479126024, "percentage": 45.22, "elapsed_time": "19:11:59", "remaining_time": "23:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8114, "total_steps": 17941, "loss": 1.7427, "learning_rate": 5.8922963488551775e-05, "epoch": 0.4522601861657656, "percentage": 45.23, "elapsed_time": "19:12:07", "remaining_time": "23:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8115, "total_steps": 17941, "loss": 1.8576, "learning_rate": 5.89142020478344e-05, "epoch": 0.4523159244189287, "percentage": 45.23, "elapsed_time": "19:12:16", "remaining_time": "23:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8116, "total_steps": 17941, "loss": 1.6966, "learning_rate": 5.890544032441051e-05, "epoch": 0.45237166267209183, "percentage": 45.24, "elapsed_time": "19:12:25", "remaining_time": "23:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8117, "total_steps": 17941, "loss": 1.639, "learning_rate": 5.889667831855797e-05, "epoch": 0.452427400925255, "percentage": 45.24, "elapsed_time": "19:12:33", "remaining_time": "23:14:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8118, "total_steps": 17941, "loss": 1.7707, "learning_rate": 5.888791603055467e-05, "epoch": 0.45248313917841815, "percentage": 45.25, "elapsed_time": "19:12:42", "remaining_time": "23:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8119, "total_steps": 17941, "loss": 1.8751, "learning_rate": 5.887915346067851e-05, "epoch": 0.4525388774315813, "percentage": 45.25, "elapsed_time": "19:12:50", "remaining_time": "23:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8120, "total_steps": 17941, "loss": 1.5854, "learning_rate": 5.8870390609207337e-05, "epoch": 0.45259461568474446, "percentage": 45.26, "elapsed_time": "19:12:59", "remaining_time": "23:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8121, "total_steps": 17941, "loss": 1.6138, "learning_rate": 5.886162747641912e-05, "epoch": 0.4526503539379076, "percentage": 45.27, "elapsed_time": "19:13:07", "remaining_time": "23:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8122, "total_steps": 17941, "loss": 1.4997, "learning_rate": 5.885286406259174e-05, "epoch": 0.4527060921910707, "percentage": 45.27, "elapsed_time": "19:13:15", "remaining_time": "23:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8123, "total_steps": 17941, "loss": 1.372, "learning_rate": 5.884410036800312e-05, "epoch": 0.4527618304442339, "percentage": 45.28, "elapsed_time": "19:13:24", "remaining_time": "23:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8124, "total_steps": 17941, "loss": 1.7398, "learning_rate": 5.883533639293119e-05, "epoch": 0.45281756869739703, "percentage": 45.28, "elapsed_time": "19:13:32", "remaining_time": "23:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8125, "total_steps": 17941, "loss": 1.8826, "learning_rate": 5.882657213765393e-05, "epoch": 0.45287330695056016, "percentage": 45.29, "elapsed_time": "19:13:41", "remaining_time": "23:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8126, "total_steps": 17941, "loss": 1.8187, "learning_rate": 5.881780760244926e-05, "epoch": 0.4529290452037233, "percentage": 45.29, "elapsed_time": "19:13:50", "remaining_time": "23:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8127, "total_steps": 17941, "loss": 1.5317, "learning_rate": 5.8809042787595135e-05, "epoch": 0.4529847834568865, "percentage": 45.3, "elapsed_time": "19:13:58", "remaining_time": "23:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8128, "total_steps": 17941, "loss": 1.9912, "learning_rate": 5.880027769336953e-05, "epoch": 0.4530405217100496, "percentage": 45.3, "elapsed_time": "19:14:06", "remaining_time": "23:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8129, "total_steps": 17941, "loss": 1.7771, "learning_rate": 5.879151232005044e-05, "epoch": 0.45309625996321273, "percentage": 45.31, "elapsed_time": "19:14:15", "remaining_time": "23:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8130, "total_steps": 17941, "loss": 1.9728, "learning_rate": 5.8782746667915824e-05, "epoch": 0.4531519982163759, "percentage": 45.32, "elapsed_time": "19:14:24", "remaining_time": "23:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8131, "total_steps": 17941, "loss": 1.7932, "learning_rate": 5.877398073724368e-05, "epoch": 0.45320773646953905, "percentage": 45.32, "elapsed_time": "19:14:32", "remaining_time": "23:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8132, "total_steps": 17941, "loss": 1.6562, "learning_rate": 5.876521452831205e-05, "epoch": 0.4532634747227022, "percentage": 45.33, "elapsed_time": "19:14:41", "remaining_time": "23:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8133, "total_steps": 17941, "loss": 1.6491, "learning_rate": 5.87564480413989e-05, "epoch": 0.45331921297586536, "percentage": 45.33, "elapsed_time": "19:14:49", "remaining_time": "23:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8134, "total_steps": 17941, "loss": 1.6799, "learning_rate": 5.8747681276782294e-05, "epoch": 0.4533749512290285, "percentage": 45.34, "elapsed_time": "19:14:58", "remaining_time": "23:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8135, "total_steps": 17941, "loss": 1.7299, "learning_rate": 5.8738914234740225e-05, "epoch": 0.4534306894821916, "percentage": 45.34, "elapsed_time": "19:15:07", "remaining_time": "23:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8136, "total_steps": 17941, "loss": 1.529, "learning_rate": 5.8730146915550745e-05, "epoch": 0.45348642773535475, "percentage": 45.35, "elapsed_time": "19:15:15", "remaining_time": "23:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8137, "total_steps": 17941, "loss": 1.7301, "learning_rate": 5.872137931949191e-05, "epoch": 0.45354216598851793, "percentage": 45.35, "elapsed_time": "19:15:24", "remaining_time": "23:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8138, "total_steps": 17941, "loss": 1.7159, "learning_rate": 5.871261144684177e-05, "epoch": 0.45359790424168106, "percentage": 45.36, "elapsed_time": "19:15:33", "remaining_time": "23:11:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8139, "total_steps": 17941, "loss": 1.6208, "learning_rate": 5.870384329787839e-05, "epoch": 0.4536536424948442, "percentage": 45.37, "elapsed_time": "19:15:41", "remaining_time": "23:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8140, "total_steps": 17941, "loss": 1.7554, "learning_rate": 5.8695074872879855e-05, "epoch": 0.4537093807480074, "percentage": 45.37, "elapsed_time": "19:15:50", "remaining_time": "23:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8141, "total_steps": 17941, "loss": 1.6493, "learning_rate": 5.868630617212424e-05, "epoch": 0.4537651190011705, "percentage": 45.38, "elapsed_time": "19:15:58", "remaining_time": "23:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8142, "total_steps": 17941, "loss": 1.8717, "learning_rate": 5.867753719588963e-05, "epoch": 0.45382085725433363, "percentage": 45.38, "elapsed_time": "19:16:07", "remaining_time": "23:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8143, "total_steps": 17941, "loss": 1.7959, "learning_rate": 5.8668767944454136e-05, "epoch": 0.4538765955074968, "percentage": 45.39, "elapsed_time": "19:16:15", "remaining_time": "23:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8144, "total_steps": 17941, "loss": 1.7492, "learning_rate": 5.865999841809586e-05, "epoch": 0.45393233376065995, "percentage": 45.39, "elapsed_time": "19:16:24", "remaining_time": "23:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8145, "total_steps": 17941, "loss": 1.7432, "learning_rate": 5.865122861709295e-05, "epoch": 0.4539880720138231, "percentage": 45.4, "elapsed_time": "19:16:33", "remaining_time": "23:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8146, "total_steps": 17941, "loss": 1.5536, "learning_rate": 5.864245854172349e-05, "epoch": 0.45404381026698626, "percentage": 45.4, "elapsed_time": "19:16:42", "remaining_time": "23:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8147, "total_steps": 17941, "loss": 1.5528, "learning_rate": 5.8633688192265645e-05, "epoch": 0.4540995485201494, "percentage": 45.41, "elapsed_time": "19:16:50", "remaining_time": "23:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8148, "total_steps": 17941, "loss": 1.5251, "learning_rate": 5.862491756899753e-05, "epoch": 0.4541552867733125, "percentage": 45.42, "elapsed_time": "19:16:59", "remaining_time": "23:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8149, "total_steps": 17941, "loss": 1.5709, "learning_rate": 5.8616146672197326e-05, "epoch": 0.45421102502647565, "percentage": 45.42, "elapsed_time": "19:17:07", "remaining_time": "23:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8150, "total_steps": 17941, "loss": 1.6585, "learning_rate": 5.8607375502143183e-05, "epoch": 0.45426676327963883, "percentage": 45.43, "elapsed_time": "19:17:16", "remaining_time": "23:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8151, "total_steps": 17941, "loss": 2.0239, "learning_rate": 5.859860405911328e-05, "epoch": 0.45432250153280196, "percentage": 45.43, "elapsed_time": "19:17:24", "remaining_time": "23:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8152, "total_steps": 17941, "loss": 1.5565, "learning_rate": 5.858983234338579e-05, "epoch": 0.4543782397859651, "percentage": 45.44, "elapsed_time": "19:17:33", "remaining_time": "23:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8153, "total_steps": 17941, "loss": 1.8482, "learning_rate": 5.858106035523888e-05, "epoch": 0.4544339780391283, "percentage": 45.44, "elapsed_time": "19:17:42", "remaining_time": "23:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8154, "total_steps": 17941, "loss": 1.6401, "learning_rate": 5.85722880949508e-05, "epoch": 0.4544897162922914, "percentage": 45.45, "elapsed_time": "19:17:50", "remaining_time": "23:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8155, "total_steps": 17941, "loss": 1.8876, "learning_rate": 5.8563515562799695e-05, "epoch": 0.45454545454545453, "percentage": 45.45, "elapsed_time": "19:17:59", "remaining_time": "23:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8156, "total_steps": 17941, "loss": 1.4215, "learning_rate": 5.855474275906381e-05, "epoch": 0.4546011927986177, "percentage": 45.46, "elapsed_time": "19:18:07", "remaining_time": "23:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8157, "total_steps": 17941, "loss": 1.8225, "learning_rate": 5.854596968402136e-05, "epoch": 0.45465693105178084, "percentage": 45.47, "elapsed_time": "19:18:16", "remaining_time": "23:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8158, "total_steps": 17941, "loss": 1.6582, "learning_rate": 5.8537196337950596e-05, "epoch": 0.454712669304944, "percentage": 45.47, "elapsed_time": "19:18:24", "remaining_time": "23:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8159, "total_steps": 17941, "loss": 1.6121, "learning_rate": 5.8528422721129726e-05, "epoch": 0.4547684075581071, "percentage": 45.48, "elapsed_time": "19:18:33", "remaining_time": "23:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8160, "total_steps": 17941, "loss": 1.5704, "learning_rate": 5.8519648833837013e-05, "epoch": 0.4548241458112703, "percentage": 45.48, "elapsed_time": "19:18:42", "remaining_time": "23:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8161, "total_steps": 17941, "loss": 1.918, "learning_rate": 5.851087467635071e-05, "epoch": 0.4548798840644334, "percentage": 45.49, "elapsed_time": "19:18:50", "remaining_time": "23:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8162, "total_steps": 17941, "loss": 1.7381, "learning_rate": 5.8502100248949085e-05, "epoch": 0.45493562231759654, "percentage": 45.49, "elapsed_time": "19:18:59", "remaining_time": "23:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8163, "total_steps": 17941, "loss": 1.6602, "learning_rate": 5.8493325551910405e-05, "epoch": 0.45499136057075973, "percentage": 45.5, "elapsed_time": "19:19:07", "remaining_time": "23:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8164, "total_steps": 17941, "loss": 1.7762, "learning_rate": 5.848455058551298e-05, "epoch": 0.45504709882392286, "percentage": 45.5, "elapsed_time": "19:19:16", "remaining_time": "23:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8165, "total_steps": 17941, "loss": 1.8456, "learning_rate": 5.8475775350035056e-05, "epoch": 0.455102837077086, "percentage": 45.51, "elapsed_time": "19:19:24", "remaining_time": "23:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8166, "total_steps": 17941, "loss": 1.6512, "learning_rate": 5.846699984575497e-05, "epoch": 0.45515857533024917, "percentage": 45.52, "elapsed_time": "19:19:33", "remaining_time": "23:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8167, "total_steps": 17941, "loss": 1.675, "learning_rate": 5.8458224072951005e-05, "epoch": 0.4552143135834123, "percentage": 45.52, "elapsed_time": "19:19:41", "remaining_time": "23:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8168, "total_steps": 17941, "loss": 1.4973, "learning_rate": 5.844944803190149e-05, "epoch": 0.45527005183657543, "percentage": 45.53, "elapsed_time": "19:19:50", "remaining_time": "23:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8169, "total_steps": 17941, "loss": 1.6223, "learning_rate": 5.844067172288474e-05, "epoch": 0.4553257900897386, "percentage": 45.53, "elapsed_time": "19:19:59", "remaining_time": "23:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8170, "total_steps": 17941, "loss": 1.7822, "learning_rate": 5.843189514617911e-05, "epoch": 0.45538152834290174, "percentage": 45.54, "elapsed_time": "19:20:07", "remaining_time": "23:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8171, "total_steps": 17941, "loss": 1.7511, "learning_rate": 5.8423118302062915e-05, "epoch": 0.45543726659606487, "percentage": 45.54, "elapsed_time": "19:20:16", "remaining_time": "23:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8172, "total_steps": 17941, "loss": 1.6494, "learning_rate": 5.841434119081453e-05, "epoch": 0.455493004849228, "percentage": 45.55, "elapsed_time": "19:20:24", "remaining_time": "23:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8173, "total_steps": 17941, "loss": 1.6952, "learning_rate": 5.840556381271229e-05, "epoch": 0.4555487431023912, "percentage": 45.55, "elapsed_time": "19:20:33", "remaining_time": "23:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8174, "total_steps": 17941, "loss": 1.5907, "learning_rate": 5.839678616803458e-05, "epoch": 0.4556044813555543, "percentage": 45.56, "elapsed_time": "19:20:41", "remaining_time": "23:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8175, "total_steps": 17941, "loss": 1.6862, "learning_rate": 5.838800825705977e-05, "epoch": 0.45566021960871744, "percentage": 45.57, "elapsed_time": "19:20:50", "remaining_time": "23:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8176, "total_steps": 17941, "loss": 1.7354, "learning_rate": 5.837923008006623e-05, "epoch": 0.4557159578618806, "percentage": 45.57, "elapsed_time": "19:20:58", "remaining_time": "23:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8177, "total_steps": 17941, "loss": 1.7971, "learning_rate": 5.837045163733239e-05, "epoch": 0.45577169611504376, "percentage": 45.58, "elapsed_time": "19:21:07", "remaining_time": "23:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8178, "total_steps": 17941, "loss": 1.4939, "learning_rate": 5.8361672929136614e-05, "epoch": 0.4558274343682069, "percentage": 45.58, "elapsed_time": "19:21:15", "remaining_time": "23:06:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8179, "total_steps": 17941, "loss": 1.8816, "learning_rate": 5.835289395575731e-05, "epoch": 0.45588317262137007, "percentage": 45.59, "elapsed_time": "19:21:23", "remaining_time": "23:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8180, "total_steps": 17941, "loss": 1.6907, "learning_rate": 5.8344114717472943e-05, "epoch": 0.4559389108745332, "percentage": 45.59, "elapsed_time": "19:21:32", "remaining_time": "23:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8181, "total_steps": 17941, "loss": 1.6905, "learning_rate": 5.833533521456188e-05, "epoch": 0.4559946491276963, "percentage": 45.6, "elapsed_time": "19:21:40", "remaining_time": "23:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8182, "total_steps": 17941, "loss": 1.5996, "learning_rate": 5.832655544730259e-05, "epoch": 0.45605038738085946, "percentage": 45.61, "elapsed_time": "19:21:49", "remaining_time": "23:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8183, "total_steps": 17941, "loss": 1.6316, "learning_rate": 5.831777541597351e-05, "epoch": 0.45610612563402264, "percentage": 45.61, "elapsed_time": "19:21:57", "remaining_time": "23:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8184, "total_steps": 17941, "loss": 1.7246, "learning_rate": 5.8308995120853096e-05, "epoch": 0.45616186388718577, "percentage": 45.62, "elapsed_time": "19:22:06", "remaining_time": "23:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8185, "total_steps": 17941, "loss": 1.8438, "learning_rate": 5.830021456221979e-05, "epoch": 0.4562176021403489, "percentage": 45.62, "elapsed_time": "19:22:14", "remaining_time": "23:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8186, "total_steps": 17941, "loss": 1.2569, "learning_rate": 5.829143374035209e-05, "epoch": 0.4562733403935121, "percentage": 45.63, "elapsed_time": "19:22:22", "remaining_time": "23:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8187, "total_steps": 17941, "loss": 1.6355, "learning_rate": 5.8282652655528426e-05, "epoch": 0.4563290786466752, "percentage": 45.63, "elapsed_time": "19:22:31", "remaining_time": "23:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8188, "total_steps": 17941, "loss": 1.7473, "learning_rate": 5.827387130802733e-05, "epoch": 0.45638481689983834, "percentage": 45.64, "elapsed_time": "19:22:39", "remaining_time": "23:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8189, "total_steps": 17941, "loss": 1.817, "learning_rate": 5.826508969812726e-05, "epoch": 0.4564405551530015, "percentage": 45.64, "elapsed_time": "19:22:48", "remaining_time": "23:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8190, "total_steps": 17941, "loss": 1.8728, "learning_rate": 5.825630782610676e-05, "epoch": 0.45649629340616465, "percentage": 45.65, "elapsed_time": "19:22:56", "remaining_time": "23:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8191, "total_steps": 17941, "loss": 1.8616, "learning_rate": 5.82475256922443e-05, "epoch": 0.4565520316593278, "percentage": 45.66, "elapsed_time": "19:23:05", "remaining_time": "23:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8192, "total_steps": 17941, "loss": 1.7224, "learning_rate": 5.8238743296818396e-05, "epoch": 0.45660776991249097, "percentage": 45.66, "elapsed_time": "19:23:13", "remaining_time": "23:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8193, "total_steps": 17941, "loss": 1.556, "learning_rate": 5.8229960640107617e-05, "epoch": 0.4566635081656541, "percentage": 45.67, "elapsed_time": "19:23:22", "remaining_time": "23:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8194, "total_steps": 17941, "loss": 1.6086, "learning_rate": 5.822117772239045e-05, "epoch": 0.4567192464188172, "percentage": 45.67, "elapsed_time": "19:23:30", "remaining_time": "23:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8195, "total_steps": 17941, "loss": 1.5987, "learning_rate": 5.821239454394547e-05, "epoch": 0.45677498467198036, "percentage": 45.68, "elapsed_time": "19:23:38", "remaining_time": "23:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8196, "total_steps": 17941, "loss": 1.7936, "learning_rate": 5.8203611105051204e-05, "epoch": 0.45683072292514354, "percentage": 45.68, "elapsed_time": "19:23:47", "remaining_time": "23:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8197, "total_steps": 17941, "loss": 1.5304, "learning_rate": 5.819482740598624e-05, "epoch": 0.45688646117830667, "percentage": 45.69, "elapsed_time": "19:23:56", "remaining_time": "23:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8198, "total_steps": 17941, "loss": 1.6869, "learning_rate": 5.8186043447029125e-05, "epoch": 0.4569421994314698, "percentage": 45.69, "elapsed_time": "19:24:04", "remaining_time": "23:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8199, "total_steps": 17941, "loss": 1.7673, "learning_rate": 5.8177259228458444e-05, "epoch": 0.456997937684633, "percentage": 45.7, "elapsed_time": "19:24:13", "remaining_time": "23:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8200, "total_steps": 17941, "loss": 1.9119, "learning_rate": 5.816847475055277e-05, "epoch": 0.4570536759377961, "percentage": 45.71, "elapsed_time": "19:24:22", "remaining_time": "23:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8201, "total_steps": 17941, "loss": 1.5385, "learning_rate": 5.8159690013590695e-05, "epoch": 0.45710941419095924, "percentage": 45.71, "elapsed_time": "19:24:30", "remaining_time": "23:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8202, "total_steps": 17941, "loss": 1.5954, "learning_rate": 5.815090501785083e-05, "epoch": 0.4571651524441224, "percentage": 45.72, "elapsed_time": "19:24:39", "remaining_time": "23:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8203, "total_steps": 17941, "loss": 1.9886, "learning_rate": 5.814211976361179e-05, "epoch": 0.45722089069728555, "percentage": 45.72, "elapsed_time": "19:24:48", "remaining_time": "23:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8204, "total_steps": 17941, "loss": 1.6259, "learning_rate": 5.813333425115218e-05, "epoch": 0.4572766289504487, "percentage": 45.73, "elapsed_time": "19:24:56", "remaining_time": "23:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8205, "total_steps": 17941, "loss": 1.7129, "learning_rate": 5.812454848075063e-05, "epoch": 0.4573323672036118, "percentage": 45.73, "elapsed_time": "19:25:04", "remaining_time": "23:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8206, "total_steps": 17941, "loss": 1.7543, "learning_rate": 5.8115762452685774e-05, "epoch": 0.457388105456775, "percentage": 45.74, "elapsed_time": "19:25:13", "remaining_time": "23:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8207, "total_steps": 17941, "loss": 1.5619, "learning_rate": 5.810697616723624e-05, "epoch": 0.4574438437099381, "percentage": 45.74, "elapsed_time": "19:25:21", "remaining_time": "23:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8208, "total_steps": 17941, "loss": 1.5594, "learning_rate": 5.809818962468069e-05, "epoch": 0.45749958196310125, "percentage": 45.75, "elapsed_time": "19:25:30", "remaining_time": "23:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8209, "total_steps": 17941, "loss": 1.5727, "learning_rate": 5.8089402825297776e-05, "epoch": 0.45755532021626444, "percentage": 45.76, "elapsed_time": "19:25:38", "remaining_time": "23:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8210, "total_steps": 17941, "loss": 1.6845, "learning_rate": 5.80806157693662e-05, "epoch": 0.45761105846942757, "percentage": 45.76, "elapsed_time": "19:25:47", "remaining_time": "23:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8211, "total_steps": 17941, "loss": 1.8239, "learning_rate": 5.807182845716458e-05, "epoch": 0.4576667967225907, "percentage": 45.77, "elapsed_time": "19:25:55", "remaining_time": "23:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8212, "total_steps": 17941, "loss": 1.9671, "learning_rate": 5.8063040888971635e-05, "epoch": 0.4577225349757539, "percentage": 45.77, "elapsed_time": "19:26:04", "remaining_time": "23:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8213, "total_steps": 17941, "loss": 1.5801, "learning_rate": 5.8054253065066024e-05, "epoch": 0.457778273228917, "percentage": 45.78, "elapsed_time": "19:26:12", "remaining_time": "23:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8214, "total_steps": 17941, "loss": 1.5843, "learning_rate": 5.8045464985726474e-05, "epoch": 0.45783401148208014, "percentage": 45.78, "elapsed_time": "19:26:21", "remaining_time": "23:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8215, "total_steps": 17941, "loss": 1.9532, "learning_rate": 5.803667665123168e-05, "epoch": 0.4578897497352433, "percentage": 45.79, "elapsed_time": "19:26:29", "remaining_time": "23:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8216, "total_steps": 17941, "loss": 1.9501, "learning_rate": 5.802788806186038e-05, "epoch": 0.45794548798840645, "percentage": 45.79, "elapsed_time": "19:26:38", "remaining_time": "23:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8217, "total_steps": 17941, "loss": 1.7435, "learning_rate": 5.801909921789126e-05, "epoch": 0.4580012262415696, "percentage": 45.8, "elapsed_time": "19:26:46", "remaining_time": "23:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8218, "total_steps": 17941, "loss": 1.928, "learning_rate": 5.801031011960306e-05, "epoch": 0.4580569644947327, "percentage": 45.81, "elapsed_time": "19:26:55", "remaining_time": "23:00:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8219, "total_steps": 17941, "loss": 1.8, "learning_rate": 5.800152076727454e-05, "epoch": 0.4581127027478959, "percentage": 45.81, "elapsed_time": "19:27:03", "remaining_time": "23:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8220, "total_steps": 17941, "loss": 1.6805, "learning_rate": 5.799273116118443e-05, "epoch": 0.458168441001059, "percentage": 45.82, "elapsed_time": "19:27:12", "remaining_time": "23:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8221, "total_steps": 17941, "loss": 1.4218, "learning_rate": 5.798394130161149e-05, "epoch": 0.45822417925422215, "percentage": 45.82, "elapsed_time": "19:27:21", "remaining_time": "23:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8222, "total_steps": 17941, "loss": 1.7633, "learning_rate": 5.7975151188834475e-05, "epoch": 0.45827991750738534, "percentage": 45.83, "elapsed_time": "19:27:29", "remaining_time": "23:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8223, "total_steps": 17941, "loss": 2.0147, "learning_rate": 5.796636082313217e-05, "epoch": 0.45833565576054847, "percentage": 45.83, "elapsed_time": "19:27:38", "remaining_time": "22:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8224, "total_steps": 17941, "loss": 1.5335, "learning_rate": 5.795757020478334e-05, "epoch": 0.4583913940137116, "percentage": 45.84, "elapsed_time": "19:27:46", "remaining_time": "22:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8225, "total_steps": 17941, "loss": 1.778, "learning_rate": 5.794877933406679e-05, "epoch": 0.4584471322668748, "percentage": 45.84, "elapsed_time": "19:27:55", "remaining_time": "22:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8226, "total_steps": 17941, "loss": 1.678, "learning_rate": 5.79399882112613e-05, "epoch": 0.4585028705200379, "percentage": 45.85, "elapsed_time": "19:28:03", "remaining_time": "22:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8227, "total_steps": 17941, "loss": 1.5224, "learning_rate": 5.7931196836645675e-05, "epoch": 0.45855860877320104, "percentage": 45.86, "elapsed_time": "19:28:11", "remaining_time": "22:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8228, "total_steps": 17941, "loss": 1.9743, "learning_rate": 5.792240521049872e-05, "epoch": 0.45861434702636417, "percentage": 45.86, "elapsed_time": "19:28:20", "remaining_time": "22:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8229, "total_steps": 17941, "loss": 1.6526, "learning_rate": 5.791361333309926e-05, "epoch": 0.45867008527952735, "percentage": 45.87, "elapsed_time": "19:28:29", "remaining_time": "22:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8230, "total_steps": 17941, "loss": 1.7427, "learning_rate": 5.790482120472615e-05, "epoch": 0.4587258235326905, "percentage": 45.87, "elapsed_time": "19:28:38", "remaining_time": "22:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8231, "total_steps": 17941, "loss": 1.5028, "learning_rate": 5.789602882565818e-05, "epoch": 0.4587815617858536, "percentage": 45.88, "elapsed_time": "19:28:47", "remaining_time": "22:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8232, "total_steps": 17941, "loss": 1.6115, "learning_rate": 5.788723619617422e-05, "epoch": 0.4588373000390168, "percentage": 45.88, "elapsed_time": "19:28:55", "remaining_time": "22:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8233, "total_steps": 17941, "loss": 1.5789, "learning_rate": 5.787844331655311e-05, "epoch": 0.4588930382921799, "percentage": 45.89, "elapsed_time": "19:29:04", "remaining_time": "22:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8234, "total_steps": 17941, "loss": 1.66, "learning_rate": 5.786965018707371e-05, "epoch": 0.45894877654534305, "percentage": 45.89, "elapsed_time": "19:29:12", "remaining_time": "22:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8235, "total_steps": 17941, "loss": 1.9192, "learning_rate": 5.786085680801488e-05, "epoch": 0.45900451479850624, "percentage": 45.9, "elapsed_time": "19:29:20", "remaining_time": "22:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8236, "total_steps": 17941, "loss": 1.5435, "learning_rate": 5.785206317965553e-05, "epoch": 0.45906025305166936, "percentage": 45.91, "elapsed_time": "19:29:29", "remaining_time": "22:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8237, "total_steps": 17941, "loss": 1.2152, "learning_rate": 5.7843269302274506e-05, "epoch": 0.4591159913048325, "percentage": 45.91, "elapsed_time": "19:29:37", "remaining_time": "22:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8238, "total_steps": 17941, "loss": 1.6407, "learning_rate": 5.7834475176150715e-05, "epoch": 0.4591717295579957, "percentage": 45.92, "elapsed_time": "19:29:46", "remaining_time": "22:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8239, "total_steps": 17941, "loss": 1.8297, "learning_rate": 5.782568080156303e-05, "epoch": 0.4592274678111588, "percentage": 45.92, "elapsed_time": "19:29:54", "remaining_time": "22:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8240, "total_steps": 17941, "loss": 1.7981, "learning_rate": 5.781688617879039e-05, "epoch": 0.45928320606432194, "percentage": 45.93, "elapsed_time": "19:30:03", "remaining_time": "22:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8241, "total_steps": 17941, "loss": 1.6244, "learning_rate": 5.780809130811169e-05, "epoch": 0.45933894431748507, "percentage": 45.93, "elapsed_time": "19:30:11", "remaining_time": "22:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8242, "total_steps": 17941, "loss": 1.6348, "learning_rate": 5.779929618980586e-05, "epoch": 0.45939468257064825, "percentage": 45.94, "elapsed_time": "19:30:19", "remaining_time": "22:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8243, "total_steps": 17941, "loss": 1.7342, "learning_rate": 5.779050082415184e-05, "epoch": 0.4594504208238114, "percentage": 45.95, "elapsed_time": "19:30:28", "remaining_time": "22:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8244, "total_steps": 17941, "loss": 1.6838, "learning_rate": 5.778170521142854e-05, "epoch": 0.4595061590769745, "percentage": 45.95, "elapsed_time": "19:30:36", "remaining_time": "22:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8245, "total_steps": 17941, "loss": 1.72, "learning_rate": 5.777290935191493e-05, "epoch": 0.4595618973301377, "percentage": 45.96, "elapsed_time": "19:30:45", "remaining_time": "22:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8246, "total_steps": 17941, "loss": 1.6783, "learning_rate": 5.776411324588995e-05, "epoch": 0.4596176355833008, "percentage": 45.96, "elapsed_time": "19:30:54", "remaining_time": "22:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8247, "total_steps": 17941, "loss": 1.5248, "learning_rate": 5.775531689363256e-05, "epoch": 0.45967337383646395, "percentage": 45.97, "elapsed_time": "19:31:02", "remaining_time": "22:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8248, "total_steps": 17941, "loss": 1.5673, "learning_rate": 5.7746520295421736e-05, "epoch": 0.45972911208962713, "percentage": 45.97, "elapsed_time": "19:31:11", "remaining_time": "22:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8249, "total_steps": 17941, "loss": 1.9275, "learning_rate": 5.773772345153648e-05, "epoch": 0.45978485034279026, "percentage": 45.98, "elapsed_time": "19:31:19", "remaining_time": "22:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8250, "total_steps": 17941, "loss": 1.583, "learning_rate": 5.772892636225572e-05, "epoch": 0.4598405885959534, "percentage": 45.98, "elapsed_time": "19:31:28", "remaining_time": "22:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8251, "total_steps": 17941, "loss": 1.6752, "learning_rate": 5.7720129027858496e-05, "epoch": 0.4598963268491165, "percentage": 45.99, "elapsed_time": "19:31:36", "remaining_time": "22:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8252, "total_steps": 17941, "loss": 1.5191, "learning_rate": 5.771133144862377e-05, "epoch": 0.4599520651022797, "percentage": 46.0, "elapsed_time": "19:31:45", "remaining_time": "22:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8253, "total_steps": 17941, "loss": 1.7338, "learning_rate": 5.770253362483059e-05, "epoch": 0.46000780335544283, "percentage": 46.0, "elapsed_time": "19:31:53", "remaining_time": "22:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8254, "total_steps": 17941, "loss": 1.9825, "learning_rate": 5.769373555675794e-05, "epoch": 0.46006354160860596, "percentage": 46.01, "elapsed_time": "19:32:02", "remaining_time": "22:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8255, "total_steps": 17941, "loss": 1.8879, "learning_rate": 5.7684937244684856e-05, "epoch": 0.46011927986176915, "percentage": 46.01, "elapsed_time": "19:32:10", "remaining_time": "22:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8256, "total_steps": 17941, "loss": 1.5408, "learning_rate": 5.767613868889038e-05, "epoch": 0.4601750181149323, "percentage": 46.02, "elapsed_time": "19:32:18", "remaining_time": "22:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8257, "total_steps": 17941, "loss": 1.7434, "learning_rate": 5.766733988965354e-05, "epoch": 0.4602307563680954, "percentage": 46.02, "elapsed_time": "19:32:27", "remaining_time": "22:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8258, "total_steps": 17941, "loss": 1.7586, "learning_rate": 5.765854084725337e-05, "epoch": 0.4602864946212586, "percentage": 46.03, "elapsed_time": "19:32:35", "remaining_time": "22:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8259, "total_steps": 17941, "loss": 1.8, "learning_rate": 5.764974156196895e-05, "epoch": 0.4603422328744217, "percentage": 46.03, "elapsed_time": "19:32:44", "remaining_time": "22:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8260, "total_steps": 17941, "loss": 1.5867, "learning_rate": 5.764094203407933e-05, "epoch": 0.46039797112758485, "percentage": 46.04, "elapsed_time": "19:32:52", "remaining_time": "22:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8261, "total_steps": 17941, "loss": 1.8117, "learning_rate": 5.763214226386355e-05, "epoch": 0.46045370938074803, "percentage": 46.05, "elapsed_time": "19:33:01", "remaining_time": "22:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8262, "total_steps": 17941, "loss": 1.6466, "learning_rate": 5.7623342251600745e-05, "epoch": 0.46050944763391116, "percentage": 46.05, "elapsed_time": "19:33:09", "remaining_time": "22:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8263, "total_steps": 17941, "loss": 1.6135, "learning_rate": 5.761454199756996e-05, "epoch": 0.4605651858870743, "percentage": 46.06, "elapsed_time": "19:33:18", "remaining_time": "22:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8264, "total_steps": 17941, "loss": 1.6211, "learning_rate": 5.7605741502050314e-05, "epoch": 0.4606209241402374, "percentage": 46.06, "elapsed_time": "19:33:26", "remaining_time": "22:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8265, "total_steps": 17941, "loss": 1.795, "learning_rate": 5.759694076532087e-05, "epoch": 0.4606766623934006, "percentage": 46.07, "elapsed_time": "19:33:35", "remaining_time": "22:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8266, "total_steps": 17941, "loss": 1.4925, "learning_rate": 5.758813978766077e-05, "epoch": 0.46073240064656373, "percentage": 46.07, "elapsed_time": "19:33:43", "remaining_time": "22:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8267, "total_steps": 17941, "loss": 1.8677, "learning_rate": 5.75793385693491e-05, "epoch": 0.46078813889972686, "percentage": 46.08, "elapsed_time": "19:33:52", "remaining_time": "22:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8268, "total_steps": 17941, "loss": 1.7692, "learning_rate": 5.7570537110665026e-05, "epoch": 0.46084387715289005, "percentage": 46.08, "elapsed_time": "19:34:01", "remaining_time": "22:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8269, "total_steps": 17941, "loss": 1.8521, "learning_rate": 5.7561735411887644e-05, "epoch": 0.4608996154060532, "percentage": 46.09, "elapsed_time": "19:34:09", "remaining_time": "22:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8270, "total_steps": 17941, "loss": 1.8511, "learning_rate": 5.75529334732961e-05, "epoch": 0.4609553536592163, "percentage": 46.1, "elapsed_time": "19:34:17", "remaining_time": "22:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8271, "total_steps": 17941, "loss": 1.6472, "learning_rate": 5.754413129516956e-05, "epoch": 0.4610110919123795, "percentage": 46.1, "elapsed_time": "19:34:27", "remaining_time": "22:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8272, "total_steps": 17941, "loss": 1.5722, "learning_rate": 5.753532887778714e-05, "epoch": 0.4610668301655426, "percentage": 46.11, "elapsed_time": "19:34:35", "remaining_time": "22:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8273, "total_steps": 17941, "loss": 1.6829, "learning_rate": 5.7526526221428036e-05, "epoch": 0.46112256841870575, "percentage": 46.11, "elapsed_time": "19:34:44", "remaining_time": "22:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8274, "total_steps": 17941, "loss": 1.6583, "learning_rate": 5.751772332637137e-05, "epoch": 0.4611783066718689, "percentage": 46.12, "elapsed_time": "19:34:53", "remaining_time": "22:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8275, "total_steps": 17941, "loss": 1.7805, "learning_rate": 5.75089201928964e-05, "epoch": 0.46123404492503206, "percentage": 46.12, "elapsed_time": "19:35:01", "remaining_time": "22:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8276, "total_steps": 17941, "loss": 1.8315, "learning_rate": 5.750011682128222e-05, "epoch": 0.4612897831781952, "percentage": 46.13, "elapsed_time": "19:35:10", "remaining_time": "22:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8277, "total_steps": 17941, "loss": 1.6431, "learning_rate": 5.7491313211808095e-05, "epoch": 0.4613455214313583, "percentage": 46.13, "elapsed_time": "19:35:18", "remaining_time": "22:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8278, "total_steps": 17941, "loss": 1.9023, "learning_rate": 5.748250936475318e-05, "epoch": 0.4614012596845215, "percentage": 46.14, "elapsed_time": "19:35:27", "remaining_time": "22:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8279, "total_steps": 17941, "loss": 1.7468, "learning_rate": 5.747370528039668e-05, "epoch": 0.46145699793768463, "percentage": 46.15, "elapsed_time": "19:35:35", "remaining_time": "22:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8280, "total_steps": 17941, "loss": 1.7059, "learning_rate": 5.7464900959017844e-05, "epoch": 0.46151273619084776, "percentage": 46.15, "elapsed_time": "19:35:44", "remaining_time": "22:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8281, "total_steps": 17941, "loss": 1.8385, "learning_rate": 5.745609640089585e-05, "epoch": 0.46156847444401095, "percentage": 46.16, "elapsed_time": "19:35:52", "remaining_time": "22:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8282, "total_steps": 17941, "loss": 1.5585, "learning_rate": 5.744729160630998e-05, "epoch": 0.4616242126971741, "percentage": 46.16, "elapsed_time": "19:36:02", "remaining_time": "22:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8283, "total_steps": 17941, "loss": 1.6787, "learning_rate": 5.743848657553943e-05, "epoch": 0.4616799509503372, "percentage": 46.17, "elapsed_time": "19:36:10", "remaining_time": "22:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8284, "total_steps": 17941, "loss": 1.9457, "learning_rate": 5.742968130886346e-05, "epoch": 0.4617356892035004, "percentage": 46.17, "elapsed_time": "19:36:19", "remaining_time": "22:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8285, "total_steps": 17941, "loss": 1.7643, "learning_rate": 5.74208758065613e-05, "epoch": 0.4617914274566635, "percentage": 46.18, "elapsed_time": "19:36:27", "remaining_time": "22:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8286, "total_steps": 17941, "loss": 1.414, "learning_rate": 5.741207006891224e-05, "epoch": 0.46184716570982665, "percentage": 46.18, "elapsed_time": "19:36:36", "remaining_time": "22:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8287, "total_steps": 17941, "loss": 1.7004, "learning_rate": 5.740326409619552e-05, "epoch": 0.4619029039629898, "percentage": 46.19, "elapsed_time": "19:36:44", "remaining_time": "22:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8288, "total_steps": 17941, "loss": 1.7653, "learning_rate": 5.739445788869043e-05, "epoch": 0.46195864221615296, "percentage": 46.2, "elapsed_time": "19:36:52", "remaining_time": "22:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8289, "total_steps": 17941, "loss": 1.7572, "learning_rate": 5.738565144667626e-05, "epoch": 0.4620143804693161, "percentage": 46.2, "elapsed_time": "19:37:01", "remaining_time": "22:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8290, "total_steps": 17941, "loss": 1.8134, "learning_rate": 5.737684477043228e-05, "epoch": 0.4620701187224792, "percentage": 46.21, "elapsed_time": "19:37:10", "remaining_time": "22:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8291, "total_steps": 17941, "loss": 1.4841, "learning_rate": 5.736803786023779e-05, "epoch": 0.4621258569756424, "percentage": 46.21, "elapsed_time": "19:37:18", "remaining_time": "22:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8292, "total_steps": 17941, "loss": 1.9146, "learning_rate": 5.7359230716372105e-05, "epoch": 0.46218159522880553, "percentage": 46.22, "elapsed_time": "19:37:26", "remaining_time": "22:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8293, "total_steps": 17941, "loss": 1.6559, "learning_rate": 5.735042333911452e-05, "epoch": 0.46223733348196866, "percentage": 46.22, "elapsed_time": "19:37:35", "remaining_time": "22:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8294, "total_steps": 17941, "loss": 1.6659, "learning_rate": 5.734161572874437e-05, "epoch": 0.46229307173513184, "percentage": 46.23, "elapsed_time": "19:37:44", "remaining_time": "22:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8295, "total_steps": 17941, "loss": 1.7702, "learning_rate": 5.7332807885540976e-05, "epoch": 0.462348809988295, "percentage": 46.23, "elapsed_time": "19:37:52", "remaining_time": "22:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8296, "total_steps": 17941, "loss": 1.6766, "learning_rate": 5.7323999809783656e-05, "epoch": 0.4624045482414581, "percentage": 46.24, "elapsed_time": "19:38:00", "remaining_time": "22:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8297, "total_steps": 17941, "loss": 1.6475, "learning_rate": 5.731519150175179e-05, "epoch": 0.46246028649462123, "percentage": 46.25, "elapsed_time": "19:38:10", "remaining_time": "22:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8298, "total_steps": 17941, "loss": 1.643, "learning_rate": 5.730638296172467e-05, "epoch": 0.4625160247477844, "percentage": 46.25, "elapsed_time": "19:38:18", "remaining_time": "22:49:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8299, "total_steps": 17941, "loss": 1.5904, "learning_rate": 5.7297574189981705e-05, "epoch": 0.46257176300094754, "percentage": 46.26, "elapsed_time": "19:38:27", "remaining_time": "22:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8300, "total_steps": 17941, "loss": 1.6782, "learning_rate": 5.7288765186802204e-05, "epoch": 0.4626275012541107, "percentage": 46.26, "elapsed_time": "19:38:35", "remaining_time": "22:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8301, "total_steps": 17941, "loss": 1.7858, "learning_rate": 5.72799559524656e-05, "epoch": 0.46268323950727386, "percentage": 46.27, "elapsed_time": "19:38:44", "remaining_time": "22:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8302, "total_steps": 17941, "loss": 1.757, "learning_rate": 5.7271146487251224e-05, "epoch": 0.462738977760437, "percentage": 46.27, "elapsed_time": "19:38:53", "remaining_time": "22:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8303, "total_steps": 17941, "loss": 1.7816, "learning_rate": 5.726233679143849e-05, "epoch": 0.4627947160136001, "percentage": 46.28, "elapsed_time": "19:39:02", "remaining_time": "22:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8304, "total_steps": 17941, "loss": 1.742, "learning_rate": 5.725352686530676e-05, "epoch": 0.4628504542667633, "percentage": 46.29, "elapsed_time": "19:39:10", "remaining_time": "22:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8305, "total_steps": 17941, "loss": 1.7751, "learning_rate": 5.724471670913545e-05, "epoch": 0.46290619251992643, "percentage": 46.29, "elapsed_time": "19:39:19", "remaining_time": "22:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8306, "total_steps": 17941, "loss": 1.6988, "learning_rate": 5.7235906323203956e-05, "epoch": 0.46296193077308956, "percentage": 46.3, "elapsed_time": "19:39:27", "remaining_time": "22:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8307, "total_steps": 17941, "loss": 1.6722, "learning_rate": 5.7227095707791714e-05, "epoch": 0.46301766902625274, "percentage": 46.3, "elapsed_time": "19:39:36", "remaining_time": "22:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8308, "total_steps": 17941, "loss": 1.8056, "learning_rate": 5.721828486317814e-05, "epoch": 0.46307340727941587, "percentage": 46.31, "elapsed_time": "19:39:44", "remaining_time": "22:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8309, "total_steps": 17941, "loss": 1.4819, "learning_rate": 5.7209473789642644e-05, "epoch": 0.463129145532579, "percentage": 46.31, "elapsed_time": "19:39:53", "remaining_time": "22:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8310, "total_steps": 17941, "loss": 1.7022, "learning_rate": 5.720066248746468e-05, "epoch": 0.46318488378574213, "percentage": 46.32, "elapsed_time": "19:40:01", "remaining_time": "22:47:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8311, "total_steps": 17941, "loss": 1.5258, "learning_rate": 5.7191850956923675e-05, "epoch": 0.4632406220389053, "percentage": 46.32, "elapsed_time": "19:40:09", "remaining_time": "22:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8312, "total_steps": 17941, "loss": 1.7439, "learning_rate": 5.7183039198299105e-05, "epoch": 0.46329636029206844, "percentage": 46.33, "elapsed_time": "19:40:18", "remaining_time": "22:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8313, "total_steps": 17941, "loss": 1.8911, "learning_rate": 5.717422721187039e-05, "epoch": 0.46335209854523157, "percentage": 46.34, "elapsed_time": "19:40:26", "remaining_time": "22:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8314, "total_steps": 17941, "loss": 1.6547, "learning_rate": 5.7165414997917045e-05, "epoch": 0.46340783679839476, "percentage": 46.34, "elapsed_time": "19:40:35", "remaining_time": "22:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8315, "total_steps": 17941, "loss": 1.8988, "learning_rate": 5.715660255671848e-05, "epoch": 0.4634635750515579, "percentage": 46.35, "elapsed_time": "19:40:44", "remaining_time": "22:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8316, "total_steps": 17941, "loss": 1.8075, "learning_rate": 5.714778988855422e-05, "epoch": 0.463519313304721, "percentage": 46.35, "elapsed_time": "19:40:52", "remaining_time": "22:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8317, "total_steps": 17941, "loss": 1.6288, "learning_rate": 5.713897699370376e-05, "epoch": 0.4635750515578842, "percentage": 46.36, "elapsed_time": "19:41:00", "remaining_time": "22:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8318, "total_steps": 17941, "loss": 1.6575, "learning_rate": 5.713016387244656e-05, "epoch": 0.46363078981104733, "percentage": 46.36, "elapsed_time": "19:41:09", "remaining_time": "22:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8319, "total_steps": 17941, "loss": 1.7129, "learning_rate": 5.7121350525062126e-05, "epoch": 0.46368652806421046, "percentage": 46.37, "elapsed_time": "19:41:17", "remaining_time": "22:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8320, "total_steps": 17941, "loss": 1.7888, "learning_rate": 5.7112536951829975e-05, "epoch": 0.4637422663173736, "percentage": 46.37, "elapsed_time": "19:41:26", "remaining_time": "22:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8321, "total_steps": 17941, "loss": 1.6324, "learning_rate": 5.710372315302963e-05, "epoch": 0.46379800457053677, "percentage": 46.38, "elapsed_time": "19:41:35", "remaining_time": "22:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8322, "total_steps": 17941, "loss": 1.5484, "learning_rate": 5.70949091289406e-05, "epoch": 0.4638537428236999, "percentage": 46.39, "elapsed_time": "19:41:43", "remaining_time": "22:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8323, "total_steps": 17941, "loss": 1.5863, "learning_rate": 5.708609487984242e-05, "epoch": 0.46390948107686303, "percentage": 46.39, "elapsed_time": "19:41:52", "remaining_time": "22:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8324, "total_steps": 17941, "loss": 1.7411, "learning_rate": 5.707728040601462e-05, "epoch": 0.4639652193300262, "percentage": 46.4, "elapsed_time": "19:42:00", "remaining_time": "22:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8325, "total_steps": 17941, "loss": 1.6488, "learning_rate": 5.706846570773676e-05, "epoch": 0.46402095758318934, "percentage": 46.4, "elapsed_time": "19:42:09", "remaining_time": "22:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8326, "total_steps": 17941, "loss": 1.7995, "learning_rate": 5.7059650785288354e-05, "epoch": 0.46407669583635247, "percentage": 46.41, "elapsed_time": "19:42:17", "remaining_time": "22:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8327, "total_steps": 17941, "loss": 1.8457, "learning_rate": 5.705083563894902e-05, "epoch": 0.46413243408951566, "percentage": 46.41, "elapsed_time": "19:42:26", "remaining_time": "22:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8328, "total_steps": 17941, "loss": 1.665, "learning_rate": 5.7042020268998265e-05, "epoch": 0.4641881723426788, "percentage": 46.42, "elapsed_time": "19:42:34", "remaining_time": "22:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8329, "total_steps": 17941, "loss": 1.5915, "learning_rate": 5.703320467571569e-05, "epoch": 0.4642439105958419, "percentage": 46.42, "elapsed_time": "19:42:43", "remaining_time": "22:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8330, "total_steps": 17941, "loss": 1.6417, "learning_rate": 5.7024388859380875e-05, "epoch": 0.4642996488490051, "percentage": 46.43, "elapsed_time": "19:42:51", "remaining_time": "22:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8331, "total_steps": 17941, "loss": 1.8457, "learning_rate": 5.701557282027339e-05, "epoch": 0.4643553871021682, "percentage": 46.44, "elapsed_time": "19:43:00", "remaining_time": "22:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8332, "total_steps": 17941, "loss": 1.6806, "learning_rate": 5.700675655867285e-05, "epoch": 0.46441112535533136, "percentage": 46.44, "elapsed_time": "19:43:08", "remaining_time": "22:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8333, "total_steps": 17941, "loss": 1.5137, "learning_rate": 5.6997940074858835e-05, "epoch": 0.4644668636084945, "percentage": 46.45, "elapsed_time": "19:43:16", "remaining_time": "22:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8334, "total_steps": 17941, "loss": 1.737, "learning_rate": 5.698912336911097e-05, "epoch": 0.46452260186165767, "percentage": 46.45, "elapsed_time": "19:43:25", "remaining_time": "22:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8335, "total_steps": 17941, "loss": 1.5039, "learning_rate": 5.6980306441708854e-05, "epoch": 0.4645783401148208, "percentage": 46.46, "elapsed_time": "19:43:33", "remaining_time": "22:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8336, "total_steps": 17941, "loss": 1.7687, "learning_rate": 5.6971489292932126e-05, "epoch": 0.4646340783679839, "percentage": 46.46, "elapsed_time": "19:43:42", "remaining_time": "22:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8337, "total_steps": 17941, "loss": 1.8375, "learning_rate": 5.69626719230604e-05, "epoch": 0.4646898166211471, "percentage": 46.47, "elapsed_time": "19:43:50", "remaining_time": "22:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8338, "total_steps": 17941, "loss": 1.6076, "learning_rate": 5.6953854332373314e-05, "epoch": 0.46474555487431024, "percentage": 46.47, "elapsed_time": "19:43:59", "remaining_time": "22:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8339, "total_steps": 17941, "loss": 1.75, "learning_rate": 5.6945036521150495e-05, "epoch": 0.46480129312747337, "percentage": 46.48, "elapsed_time": "19:44:07", "remaining_time": "22:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8340, "total_steps": 17941, "loss": 1.753, "learning_rate": 5.693621848967163e-05, "epoch": 0.46485703138063655, "percentage": 46.49, "elapsed_time": "19:44:16", "remaining_time": "22:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8341, "total_steps": 17941, "loss": 1.845, "learning_rate": 5.6927400238216354e-05, "epoch": 0.4649127696337997, "percentage": 46.49, "elapsed_time": "19:44:24", "remaining_time": "22:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8342, "total_steps": 17941, "loss": 1.5699, "learning_rate": 5.6918581767064325e-05, "epoch": 0.4649685078869628, "percentage": 46.5, "elapsed_time": "19:44:33", "remaining_time": "22:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8343, "total_steps": 17941, "loss": 1.5899, "learning_rate": 5.690976307649523e-05, "epoch": 0.46502424614012594, "percentage": 46.5, "elapsed_time": "19:44:41", "remaining_time": "22:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8344, "total_steps": 17941, "loss": 1.7661, "learning_rate": 5.6900944166788725e-05, "epoch": 0.4650799843932891, "percentage": 46.51, "elapsed_time": "19:44:49", "remaining_time": "22:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8345, "total_steps": 17941, "loss": 1.5225, "learning_rate": 5.689212503822452e-05, "epoch": 0.46513572264645225, "percentage": 46.51, "elapsed_time": "19:44:58", "remaining_time": "22:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8346, "total_steps": 17941, "loss": 1.5896, "learning_rate": 5.688330569108228e-05, "epoch": 0.4651914608996154, "percentage": 46.52, "elapsed_time": "19:45:07", "remaining_time": "22:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8347, "total_steps": 17941, "loss": 1.5632, "learning_rate": 5.6874486125641726e-05, "epoch": 0.46524719915277857, "percentage": 46.52, "elapsed_time": "19:45:15", "remaining_time": "22:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8348, "total_steps": 17941, "loss": 1.679, "learning_rate": 5.686566634218254e-05, "epoch": 0.4653029374059417, "percentage": 46.53, "elapsed_time": "19:45:24", "remaining_time": "22:42:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8349, "total_steps": 17941, "loss": 2.0888, "learning_rate": 5.685684634098447e-05, "epoch": 0.4653586756591048, "percentage": 46.54, "elapsed_time": "19:45:32", "remaining_time": "22:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8350, "total_steps": 17941, "loss": 1.7972, "learning_rate": 5.684802612232719e-05, "epoch": 0.465414413912268, "percentage": 46.54, "elapsed_time": "19:45:41", "remaining_time": "22:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8351, "total_steps": 17941, "loss": 1.8225, "learning_rate": 5.683920568649047e-05, "epoch": 0.46547015216543114, "percentage": 46.55, "elapsed_time": "19:45:50", "remaining_time": "22:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8352, "total_steps": 17941, "loss": 1.6771, "learning_rate": 5.6830385033753995e-05, "epoch": 0.46552589041859427, "percentage": 46.55, "elapsed_time": "19:45:58", "remaining_time": "22:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8353, "total_steps": 17941, "loss": 1.3349, "learning_rate": 5.682156416439755e-05, "epoch": 0.46558162867175745, "percentage": 46.56, "elapsed_time": "19:46:07", "remaining_time": "22:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8354, "total_steps": 17941, "loss": 1.606, "learning_rate": 5.681274307870085e-05, "epoch": 0.4656373669249206, "percentage": 46.56, "elapsed_time": "19:46:15", "remaining_time": "22:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8355, "total_steps": 17941, "loss": 1.7091, "learning_rate": 5.680392177694366e-05, "epoch": 0.4656931051780837, "percentage": 46.57, "elapsed_time": "19:46:24", "remaining_time": "22:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8356, "total_steps": 17941, "loss": 1.7989, "learning_rate": 5.679510025940575e-05, "epoch": 0.46574884343124684, "percentage": 46.57, "elapsed_time": "19:46:32", "remaining_time": "22:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8357, "total_steps": 17941, "loss": 1.5115, "learning_rate": 5.6786278526366875e-05, "epoch": 0.46580458168441, "percentage": 46.58, "elapsed_time": "19:46:40", "remaining_time": "22:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8358, "total_steps": 17941, "loss": 1.5391, "learning_rate": 5.677745657810681e-05, "epoch": 0.46586031993757315, "percentage": 46.59, "elapsed_time": "19:46:49", "remaining_time": "22:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8359, "total_steps": 17941, "loss": 1.4878, "learning_rate": 5.6768634414905344e-05, "epoch": 0.4659160581907363, "percentage": 46.59, "elapsed_time": "19:46:58", "remaining_time": "22:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8360, "total_steps": 17941, "loss": 1.7812, "learning_rate": 5.675981203704226e-05, "epoch": 0.46597179644389947, "percentage": 46.6, "elapsed_time": "19:47:06", "remaining_time": "22:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8361, "total_steps": 17941, "loss": 1.6782, "learning_rate": 5.675098944479733e-05, "epoch": 0.4660275346970626, "percentage": 46.6, "elapsed_time": "19:47:15", "remaining_time": "22:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8362, "total_steps": 17941, "loss": 1.4408, "learning_rate": 5.67421666384504e-05, "epoch": 0.4660832729502257, "percentage": 46.61, "elapsed_time": "19:47:23", "remaining_time": "22:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8363, "total_steps": 17941, "loss": 1.6993, "learning_rate": 5.673334361828124e-05, "epoch": 0.4661390112033889, "percentage": 46.61, "elapsed_time": "19:47:32", "remaining_time": "22:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8364, "total_steps": 17941, "loss": 1.5929, "learning_rate": 5.672452038456969e-05, "epoch": 0.46619474945655204, "percentage": 46.62, "elapsed_time": "19:47:40", "remaining_time": "22:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8365, "total_steps": 17941, "loss": 1.5579, "learning_rate": 5.671569693759554e-05, "epoch": 0.46625048770971517, "percentage": 46.63, "elapsed_time": "19:47:49", "remaining_time": "22:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8366, "total_steps": 17941, "loss": 1.5625, "learning_rate": 5.670687327763866e-05, "epoch": 0.4663062259628783, "percentage": 46.63, "elapsed_time": "19:47:58", "remaining_time": "22:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8367, "total_steps": 17941, "loss": 1.6695, "learning_rate": 5.6698049404978845e-05, "epoch": 0.4663619642160415, "percentage": 46.64, "elapsed_time": "19:48:06", "remaining_time": "22:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8368, "total_steps": 17941, "loss": 1.884, "learning_rate": 5.6689225319895966e-05, "epoch": 0.4664177024692046, "percentage": 46.64, "elapsed_time": "19:48:15", "remaining_time": "22:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8369, "total_steps": 17941, "loss": 1.9091, "learning_rate": 5.668040102266987e-05, "epoch": 0.46647344072236774, "percentage": 46.65, "elapsed_time": "19:48:24", "remaining_time": "22:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8370, "total_steps": 17941, "loss": 1.7085, "learning_rate": 5.6671576513580385e-05, "epoch": 0.4665291789755309, "percentage": 46.65, "elapsed_time": "19:48:32", "remaining_time": "22:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8371, "total_steps": 17941, "loss": 1.5626, "learning_rate": 5.66627517929074e-05, "epoch": 0.46658491722869405, "percentage": 46.66, "elapsed_time": "19:48:41", "remaining_time": "22:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8372, "total_steps": 17941, "loss": 1.7621, "learning_rate": 5.665392686093076e-05, "epoch": 0.4666406554818572, "percentage": 46.66, "elapsed_time": "19:48:49", "remaining_time": "22:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8373, "total_steps": 17941, "loss": 1.9983, "learning_rate": 5.664510171793038e-05, "epoch": 0.46669639373502037, "percentage": 46.67, "elapsed_time": "19:48:57", "remaining_time": "22:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8374, "total_steps": 17941, "loss": 1.5046, "learning_rate": 5.6636276364186105e-05, "epoch": 0.4667521319881835, "percentage": 46.68, "elapsed_time": "19:49:06", "remaining_time": "22:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8375, "total_steps": 17941, "loss": 1.6931, "learning_rate": 5.6627450799977844e-05, "epoch": 0.4668078702413466, "percentage": 46.68, "elapsed_time": "19:49:14", "remaining_time": "22:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8376, "total_steps": 17941, "loss": 1.5232, "learning_rate": 5.661862502558547e-05, "epoch": 0.4668636084945098, "percentage": 46.69, "elapsed_time": "19:49:23", "remaining_time": "22:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8377, "total_steps": 17941, "loss": 1.8327, "learning_rate": 5.660979904128891e-05, "epoch": 0.46691934674767294, "percentage": 46.69, "elapsed_time": "19:49:31", "remaining_time": "22:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8378, "total_steps": 17941, "loss": 1.5354, "learning_rate": 5.660097284736805e-05, "epoch": 0.46697508500083607, "percentage": 46.7, "elapsed_time": "19:49:40", "remaining_time": "22:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8379, "total_steps": 17941, "loss": 1.4303, "learning_rate": 5.6592146444102826e-05, "epoch": 0.4670308232539992, "percentage": 46.7, "elapsed_time": "19:49:48", "remaining_time": "22:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8380, "total_steps": 17941, "loss": 1.9321, "learning_rate": 5.658331983177315e-05, "epoch": 0.4670865615071624, "percentage": 46.71, "elapsed_time": "19:49:57", "remaining_time": "22:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8381, "total_steps": 17941, "loss": 1.9125, "learning_rate": 5.657449301065895e-05, "epoch": 0.4671422997603255, "percentage": 46.71, "elapsed_time": "19:50:06", "remaining_time": "22:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8382, "total_steps": 17941, "loss": 1.6072, "learning_rate": 5.656566598104017e-05, "epoch": 0.46719803801348864, "percentage": 46.72, "elapsed_time": "19:50:14", "remaining_time": "22:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8383, "total_steps": 17941, "loss": 1.719, "learning_rate": 5.655683874319675e-05, "epoch": 0.4672537762666518, "percentage": 46.73, "elapsed_time": "19:50:22", "remaining_time": "22:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8384, "total_steps": 17941, "loss": 1.6492, "learning_rate": 5.6548011297408634e-05, "epoch": 0.46730951451981495, "percentage": 46.73, "elapsed_time": "19:50:32", "remaining_time": "22:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8385, "total_steps": 17941, "loss": 1.7208, "learning_rate": 5.653918364395575e-05, "epoch": 0.4673652527729781, "percentage": 46.74, "elapsed_time": "19:50:40", "remaining_time": "22:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8386, "total_steps": 17941, "loss": 1.6186, "learning_rate": 5.653035578311812e-05, "epoch": 0.46742099102614126, "percentage": 46.74, "elapsed_time": "19:50:49", "remaining_time": "22:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8387, "total_steps": 17941, "loss": 1.2929, "learning_rate": 5.652152771517566e-05, "epoch": 0.4674767292793044, "percentage": 46.75, "elapsed_time": "19:50:57", "remaining_time": "22:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8388, "total_steps": 17941, "loss": 1.7447, "learning_rate": 5.651269944040838e-05, "epoch": 0.4675324675324675, "percentage": 46.75, "elapsed_time": "19:51:06", "remaining_time": "22:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8389, "total_steps": 17941, "loss": 1.7896, "learning_rate": 5.650387095909623e-05, "epoch": 0.46758820578563065, "percentage": 46.76, "elapsed_time": "19:51:14", "remaining_time": "22:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8390, "total_steps": 17941, "loss": 1.5537, "learning_rate": 5.649504227151922e-05, "epoch": 0.46764394403879384, "percentage": 46.76, "elapsed_time": "19:51:23", "remaining_time": "22:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8391, "total_steps": 17941, "loss": 1.5894, "learning_rate": 5.648621337795733e-05, "epoch": 0.46769968229195696, "percentage": 46.77, "elapsed_time": "19:51:32", "remaining_time": "22:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8392, "total_steps": 17941, "loss": 1.8336, "learning_rate": 5.647738427869058e-05, "epoch": 0.4677554205451201, "percentage": 46.78, "elapsed_time": "19:51:40", "remaining_time": "22:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8393, "total_steps": 17941, "loss": 1.799, "learning_rate": 5.6468554973998955e-05, "epoch": 0.4678111587982833, "percentage": 46.78, "elapsed_time": "19:51:49", "remaining_time": "22:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8394, "total_steps": 17941, "loss": 1.7678, "learning_rate": 5.645972546416248e-05, "epoch": 0.4678668970514464, "percentage": 46.79, "elapsed_time": "19:51:57", "remaining_time": "22:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8395, "total_steps": 17941, "loss": 1.6982, "learning_rate": 5.6450895749461194e-05, "epoch": 0.46792263530460954, "percentage": 46.79, "elapsed_time": "19:52:06", "remaining_time": "22:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8396, "total_steps": 17941, "loss": 1.5794, "learning_rate": 5.64420658301751e-05, "epoch": 0.4679783735577727, "percentage": 46.8, "elapsed_time": "19:52:14", "remaining_time": "22:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8397, "total_steps": 17941, "loss": 1.4545, "learning_rate": 5.643323570658424e-05, "epoch": 0.46803411181093585, "percentage": 46.8, "elapsed_time": "19:52:23", "remaining_time": "22:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8398, "total_steps": 17941, "loss": 1.6886, "learning_rate": 5.642440537896863e-05, "epoch": 0.468089850064099, "percentage": 46.81, "elapsed_time": "19:52:32", "remaining_time": "22:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8399, "total_steps": 17941, "loss": 1.6932, "learning_rate": 5.6415574847608365e-05, "epoch": 0.46814558831726216, "percentage": 46.81, "elapsed_time": "19:52:41", "remaining_time": "22:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8400, "total_steps": 17941, "loss": 1.6357, "learning_rate": 5.640674411278345e-05, "epoch": 0.4682013265704253, "percentage": 46.82, "elapsed_time": "19:52:49", "remaining_time": "22:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8401, "total_steps": 17941, "loss": 1.4748, "learning_rate": 5.6397913174773986e-05, "epoch": 0.4682570648235884, "percentage": 46.83, "elapsed_time": "19:52:58", "remaining_time": "22:34:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8402, "total_steps": 17941, "loss": 1.6619, "learning_rate": 5.638908203386001e-05, "epoch": 0.46831280307675155, "percentage": 46.83, "elapsed_time": "19:53:07", "remaining_time": "22:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8403, "total_steps": 17941, "loss": 1.7486, "learning_rate": 5.638025069032159e-05, "epoch": 0.46836854132991473, "percentage": 46.84, "elapsed_time": "19:53:15", "remaining_time": "22:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8404, "total_steps": 17941, "loss": 1.6243, "learning_rate": 5.637141914443883e-05, "epoch": 0.46842427958307786, "percentage": 46.84, "elapsed_time": "19:53:23", "remaining_time": "22:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8405, "total_steps": 17941, "loss": 1.6984, "learning_rate": 5.6362587396491805e-05, "epoch": 0.468480017836241, "percentage": 46.85, "elapsed_time": "19:53:32", "remaining_time": "22:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8406, "total_steps": 17941, "loss": 1.6001, "learning_rate": 5.63537554467606e-05, "epoch": 0.4685357560894042, "percentage": 46.85, "elapsed_time": "19:53:41", "remaining_time": "22:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8407, "total_steps": 17941, "loss": 1.4702, "learning_rate": 5.634492329552531e-05, "epoch": 0.4685914943425673, "percentage": 46.86, "elapsed_time": "19:53:49", "remaining_time": "22:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8408, "total_steps": 17941, "loss": 1.8799, "learning_rate": 5.6336090943066063e-05, "epoch": 0.46864723259573043, "percentage": 46.86, "elapsed_time": "19:53:58", "remaining_time": "22:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8409, "total_steps": 17941, "loss": 1.7107, "learning_rate": 5.632725838966294e-05, "epoch": 0.4687029708488936, "percentage": 46.87, "elapsed_time": "19:54:06", "remaining_time": "22:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8410, "total_steps": 17941, "loss": 1.6502, "learning_rate": 5.631842563559608e-05, "epoch": 0.46875870910205675, "percentage": 46.88, "elapsed_time": "19:54:15", "remaining_time": "22:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8411, "total_steps": 17941, "loss": 1.6374, "learning_rate": 5.630959268114558e-05, "epoch": 0.4688144473552199, "percentage": 46.88, "elapsed_time": "19:54:23", "remaining_time": "22:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8412, "total_steps": 17941, "loss": 1.7209, "learning_rate": 5.630075952659162e-05, "epoch": 0.46887018560838306, "percentage": 46.89, "elapsed_time": "19:54:31", "remaining_time": "22:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8413, "total_steps": 17941, "loss": 1.7923, "learning_rate": 5.629192617221427e-05, "epoch": 0.4689259238615462, "percentage": 46.89, "elapsed_time": "19:54:41", "remaining_time": "22:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8414, "total_steps": 17941, "loss": 1.6201, "learning_rate": 5.6283092618293734e-05, "epoch": 0.4689816621147093, "percentage": 46.9, "elapsed_time": "19:54:49", "remaining_time": "22:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8415, "total_steps": 17941, "loss": 1.5646, "learning_rate": 5.627425886511012e-05, "epoch": 0.46903740036787245, "percentage": 46.9, "elapsed_time": "19:54:58", "remaining_time": "22:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8416, "total_steps": 17941, "loss": 1.7076, "learning_rate": 5.626542491294359e-05, "epoch": 0.46909313862103563, "percentage": 46.91, "elapsed_time": "19:55:06", "remaining_time": "22:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8417, "total_steps": 17941, "loss": 1.5801, "learning_rate": 5.6256590762074315e-05, "epoch": 0.46914887687419876, "percentage": 46.91, "elapsed_time": "19:55:15", "remaining_time": "22:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8418, "total_steps": 17941, "loss": 1.8075, "learning_rate": 5.624775641278247e-05, "epoch": 0.4692046151273619, "percentage": 46.92, "elapsed_time": "19:55:23", "remaining_time": "22:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8419, "total_steps": 17941, "loss": 1.8437, "learning_rate": 5.6238921865348204e-05, "epoch": 0.4692603533805251, "percentage": 46.93, "elapsed_time": "19:55:31", "remaining_time": "22:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8420, "total_steps": 17941, "loss": 1.7371, "learning_rate": 5.623008712005172e-05, "epoch": 0.4693160916336882, "percentage": 46.93, "elapsed_time": "19:55:40", "remaining_time": "22:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8421, "total_steps": 17941, "loss": 1.646, "learning_rate": 5.62212521771732e-05, "epoch": 0.46937182988685133, "percentage": 46.94, "elapsed_time": "19:55:48", "remaining_time": "22:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8422, "total_steps": 17941, "loss": 1.447, "learning_rate": 5.6212417036992826e-05, "epoch": 0.4694275681400145, "percentage": 46.94, "elapsed_time": "19:55:57", "remaining_time": "22:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8423, "total_steps": 17941, "loss": 1.729, "learning_rate": 5.620358169979082e-05, "epoch": 0.46948330639317765, "percentage": 46.95, "elapsed_time": "19:56:05", "remaining_time": "22:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8424, "total_steps": 17941, "loss": 1.5096, "learning_rate": 5.619474616584734e-05, "epoch": 0.4695390446463408, "percentage": 46.95, "elapsed_time": "19:56:14", "remaining_time": "22:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8425, "total_steps": 17941, "loss": 1.5803, "learning_rate": 5.618591043544266e-05, "epoch": 0.4695947828995039, "percentage": 46.96, "elapsed_time": "19:56:22", "remaining_time": "22:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8426, "total_steps": 17941, "loss": 1.6776, "learning_rate": 5.617707450885695e-05, "epoch": 0.4696505211526671, "percentage": 46.97, "elapsed_time": "19:56:30", "remaining_time": "22:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8427, "total_steps": 17941, "loss": 1.6402, "learning_rate": 5.6168238386370466e-05, "epoch": 0.4697062594058302, "percentage": 46.97, "elapsed_time": "19:56:39", "remaining_time": "22:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8428, "total_steps": 17941, "loss": 1.7642, "learning_rate": 5.615940206826341e-05, "epoch": 0.46976199765899335, "percentage": 46.98, "elapsed_time": "19:56:47", "remaining_time": "22:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8429, "total_steps": 17941, "loss": 1.7081, "learning_rate": 5.6150565554816035e-05, "epoch": 0.46981773591215653, "percentage": 46.98, "elapsed_time": "19:56:56", "remaining_time": "22:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8430, "total_steps": 17941, "loss": 1.7756, "learning_rate": 5.6141728846308586e-05, "epoch": 0.46987347416531966, "percentage": 46.99, "elapsed_time": "19:57:04", "remaining_time": "22:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8431, "total_steps": 17941, "loss": 1.5193, "learning_rate": 5.6132891943021304e-05, "epoch": 0.4699292124184828, "percentage": 46.99, "elapsed_time": "19:57:13", "remaining_time": "22:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8432, "total_steps": 17941, "loss": 1.5169, "learning_rate": 5.612405484523444e-05, "epoch": 0.469984950671646, "percentage": 47.0, "elapsed_time": "19:57:21", "remaining_time": "22:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8433, "total_steps": 17941, "loss": 1.6159, "learning_rate": 5.6115217553228274e-05, "epoch": 0.4700406889248091, "percentage": 47.0, "elapsed_time": "19:57:30", "remaining_time": "22:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8434, "total_steps": 17941, "loss": 1.6027, "learning_rate": 5.610638006728306e-05, "epoch": 0.47009642717797223, "percentage": 47.01, "elapsed_time": "19:57:38", "remaining_time": "22:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8435, "total_steps": 17941, "loss": 1.3854, "learning_rate": 5.609754238767907e-05, "epoch": 0.4701521654311354, "percentage": 47.02, "elapsed_time": "19:57:46", "remaining_time": "22:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8436, "total_steps": 17941, "loss": 1.6888, "learning_rate": 5.608870451469659e-05, "epoch": 0.47020790368429854, "percentage": 47.02, "elapsed_time": "19:57:55", "remaining_time": "22:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8437, "total_steps": 17941, "loss": 1.5963, "learning_rate": 5.607986644861588e-05, "epoch": 0.4702636419374617, "percentage": 47.03, "elapsed_time": "19:58:03", "remaining_time": "22:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8438, "total_steps": 17941, "loss": 1.7791, "learning_rate": 5.607102818971729e-05, "epoch": 0.4703193801906248, "percentage": 47.03, "elapsed_time": "19:58:12", "remaining_time": "22:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8439, "total_steps": 17941, "loss": 1.744, "learning_rate": 5.6062189738281056e-05, "epoch": 0.470375118443788, "percentage": 47.04, "elapsed_time": "19:58:20", "remaining_time": "22:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8440, "total_steps": 17941, "loss": 1.4963, "learning_rate": 5.6053351094587526e-05, "epoch": 0.4704308566969511, "percentage": 47.04, "elapsed_time": "19:58:30", "remaining_time": "22:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8441, "total_steps": 17941, "loss": 1.491, "learning_rate": 5.604451225891698e-05, "epoch": 0.47048659495011425, "percentage": 47.05, "elapsed_time": "19:58:39", "remaining_time": "22:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8442, "total_steps": 17941, "loss": 1.6241, "learning_rate": 5.603567323154975e-05, "epoch": 0.47054233320327743, "percentage": 47.05, "elapsed_time": "19:58:47", "remaining_time": "22:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8443, "total_steps": 17941, "loss": 1.6522, "learning_rate": 5.602683401276615e-05, "epoch": 0.47059807145644056, "percentage": 47.06, "elapsed_time": "19:58:56", "remaining_time": "22:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8444, "total_steps": 17941, "loss": 1.7361, "learning_rate": 5.601799460284654e-05, "epoch": 0.4706538097096037, "percentage": 47.07, "elapsed_time": "19:59:04", "remaining_time": "22:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8445, "total_steps": 17941, "loss": 1.6558, "learning_rate": 5.60091550020712e-05, "epoch": 0.47070954796276687, "percentage": 47.07, "elapsed_time": "19:59:12", "remaining_time": "22:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8446, "total_steps": 17941, "loss": 1.7492, "learning_rate": 5.60003152107205e-05, "epoch": 0.47076528621593, "percentage": 47.08, "elapsed_time": "19:59:21", "remaining_time": "22:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8447, "total_steps": 17941, "loss": 1.6956, "learning_rate": 5.599147522907481e-05, "epoch": 0.47082102446909313, "percentage": 47.08, "elapsed_time": "19:59:29", "remaining_time": "22:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8448, "total_steps": 17941, "loss": 1.5153, "learning_rate": 5.598263505741443e-05, "epoch": 0.47087676272225626, "percentage": 47.09, "elapsed_time": "19:59:38", "remaining_time": "22:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8449, "total_steps": 17941, "loss": 1.5719, "learning_rate": 5.597379469601978e-05, "epoch": 0.47093250097541944, "percentage": 47.09, "elapsed_time": "19:59:46", "remaining_time": "22:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8450, "total_steps": 17941, "loss": 1.7169, "learning_rate": 5.5964954145171145e-05, "epoch": 0.4709882392285826, "percentage": 47.1, "elapsed_time": "19:59:55", "remaining_time": "22:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8451, "total_steps": 17941, "loss": 1.6197, "learning_rate": 5.595611340514898e-05, "epoch": 0.4710439774817457, "percentage": 47.1, "elapsed_time": "20:00:03", "remaining_time": "22:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8452, "total_steps": 17941, "loss": 1.611, "learning_rate": 5.594727247623361e-05, "epoch": 0.4710997157349089, "percentage": 47.11, "elapsed_time": "20:00:12", "remaining_time": "22:27:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8453, "total_steps": 17941, "loss": 1.6694, "learning_rate": 5.593843135870545e-05, "epoch": 0.471155453988072, "percentage": 47.12, "elapsed_time": "20:00:20", "remaining_time": "22:27:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8454, "total_steps": 17941, "loss": 1.5342, "learning_rate": 5.592959005284485e-05, "epoch": 0.47121119224123514, "percentage": 47.12, "elapsed_time": "20:00:30", "remaining_time": "22:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8455, "total_steps": 17941, "loss": 1.7698, "learning_rate": 5.592074855893223e-05, "epoch": 0.47126693049439833, "percentage": 47.13, "elapsed_time": "20:00:38", "remaining_time": "22:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8456, "total_steps": 17941, "loss": 1.885, "learning_rate": 5.591190687724799e-05, "epoch": 0.47132266874756146, "percentage": 47.13, "elapsed_time": "20:00:46", "remaining_time": "22:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8457, "total_steps": 17941, "loss": 1.4436, "learning_rate": 5.590306500807253e-05, "epoch": 0.4713784070007246, "percentage": 47.14, "elapsed_time": "20:00:55", "remaining_time": "22:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8458, "total_steps": 17941, "loss": 1.6708, "learning_rate": 5.589422295168626e-05, "epoch": 0.47143414525388777, "percentage": 47.14, "elapsed_time": "20:01:03", "remaining_time": "22:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8459, "total_steps": 17941, "loss": 1.6496, "learning_rate": 5.5885380708369606e-05, "epoch": 0.4714898835070509, "percentage": 47.15, "elapsed_time": "20:01:12", "remaining_time": "22:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8460, "total_steps": 17941, "loss": 1.7612, "learning_rate": 5.5876538278403e-05, "epoch": 0.47154562176021403, "percentage": 47.15, "elapsed_time": "20:01:20", "remaining_time": "22:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8461, "total_steps": 17941, "loss": 1.9365, "learning_rate": 5.586769566206686e-05, "epoch": 0.47160136001337716, "percentage": 47.16, "elapsed_time": "20:01:29", "remaining_time": "22:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8462, "total_steps": 17941, "loss": 1.623, "learning_rate": 5.585885285964163e-05, "epoch": 0.47165709826654034, "percentage": 47.17, "elapsed_time": "20:01:37", "remaining_time": "22:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8463, "total_steps": 17941, "loss": 1.8284, "learning_rate": 5.5850009871407716e-05, "epoch": 0.47171283651970347, "percentage": 47.17, "elapsed_time": "20:01:46", "remaining_time": "22:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8464, "total_steps": 17941, "loss": 1.462, "learning_rate": 5.584116669764563e-05, "epoch": 0.4717685747728666, "percentage": 47.18, "elapsed_time": "20:01:54", "remaining_time": "22:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8465, "total_steps": 17941, "loss": 1.5878, "learning_rate": 5.583232333863577e-05, "epoch": 0.4718243130260298, "percentage": 47.18, "elapsed_time": "20:02:03", "remaining_time": "22:25:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8466, "total_steps": 17941, "loss": 1.6045, "learning_rate": 5.582347979465864e-05, "epoch": 0.4718800512791929, "percentage": 47.19, "elapsed_time": "20:02:11", "remaining_time": "22:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8467, "total_steps": 17941, "loss": 1.6802, "learning_rate": 5.581463606599467e-05, "epoch": 0.47193578953235604, "percentage": 47.19, "elapsed_time": "20:02:19", "remaining_time": "22:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8468, "total_steps": 17941, "loss": 1.6555, "learning_rate": 5.580579215292435e-05, "epoch": 0.4719915277855192, "percentage": 47.2, "elapsed_time": "20:02:28", "remaining_time": "22:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8469, "total_steps": 17941, "loss": 1.8245, "learning_rate": 5.5796948055728147e-05, "epoch": 0.47204726603868236, "percentage": 47.2, "elapsed_time": "20:02:36", "remaining_time": "22:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8470, "total_steps": 17941, "loss": 1.8156, "learning_rate": 5.578810377468656e-05, "epoch": 0.4721030042918455, "percentage": 47.21, "elapsed_time": "20:02:45", "remaining_time": "22:24:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8471, "total_steps": 17941, "loss": 1.6757, "learning_rate": 5.577925931008007e-05, "epoch": 0.4721587425450086, "percentage": 47.22, "elapsed_time": "20:02:53", "remaining_time": "22:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8472, "total_steps": 17941, "loss": 1.939, "learning_rate": 5.577041466218915e-05, "epoch": 0.4722144807981718, "percentage": 47.22, "elapsed_time": "20:03:02", "remaining_time": "22:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8473, "total_steps": 17941, "loss": 1.5016, "learning_rate": 5.576156983129435e-05, "epoch": 0.4722702190513349, "percentage": 47.23, "elapsed_time": "20:03:10", "remaining_time": "22:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8474, "total_steps": 17941, "loss": 1.5794, "learning_rate": 5.5752724817676125e-05, "epoch": 0.47232595730449806, "percentage": 47.23, "elapsed_time": "20:03:19", "remaining_time": "22:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8475, "total_steps": 17941, "loss": 1.5467, "learning_rate": 5.5743879621615026e-05, "epoch": 0.47238169555766124, "percentage": 47.24, "elapsed_time": "20:03:27", "remaining_time": "22:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8476, "total_steps": 17941, "loss": 1.6893, "learning_rate": 5.5735034243391537e-05, "epoch": 0.47243743381082437, "percentage": 47.24, "elapsed_time": "20:03:35", "remaining_time": "22:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8477, "total_steps": 17941, "loss": 1.6293, "learning_rate": 5.572618868328621e-05, "epoch": 0.4724931720639875, "percentage": 47.25, "elapsed_time": "20:03:44", "remaining_time": "22:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8478, "total_steps": 17941, "loss": 1.6616, "learning_rate": 5.5717342941579555e-05, "epoch": 0.4725489103171507, "percentage": 47.25, "elapsed_time": "20:03:52", "remaining_time": "22:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8479, "total_steps": 17941, "loss": 1.7797, "learning_rate": 5.570849701855213e-05, "epoch": 0.4726046485703138, "percentage": 47.26, "elapsed_time": "20:04:01", "remaining_time": "22:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8480, "total_steps": 17941, "loss": 1.6934, "learning_rate": 5.569965091448446e-05, "epoch": 0.47266038682347694, "percentage": 47.27, "elapsed_time": "20:04:09", "remaining_time": "22:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8481, "total_steps": 17941, "loss": 1.8593, "learning_rate": 5.5690804629657076e-05, "epoch": 0.4727161250766401, "percentage": 47.27, "elapsed_time": "20:04:18", "remaining_time": "22:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8482, "total_steps": 17941, "loss": 1.8292, "learning_rate": 5.568195816435057e-05, "epoch": 0.47277186332980325, "percentage": 47.28, "elapsed_time": "20:04:26", "remaining_time": "22:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8483, "total_steps": 17941, "loss": 1.6183, "learning_rate": 5.567311151884547e-05, "epoch": 0.4728276015829664, "percentage": 47.28, "elapsed_time": "20:04:35", "remaining_time": "22:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8484, "total_steps": 17941, "loss": 1.7618, "learning_rate": 5.566426469342235e-05, "epoch": 0.4728833398361295, "percentage": 47.29, "elapsed_time": "20:04:43", "remaining_time": "22:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8485, "total_steps": 17941, "loss": 1.6473, "learning_rate": 5.565541768836178e-05, "epoch": 0.4729390780892927, "percentage": 47.29, "elapsed_time": "20:04:52", "remaining_time": "22:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8486, "total_steps": 17941, "loss": 1.9419, "learning_rate": 5.564657050394434e-05, "epoch": 0.4729948163424558, "percentage": 47.3, "elapsed_time": "20:05:00", "remaining_time": "22:22:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8487, "total_steps": 17941, "loss": 1.6413, "learning_rate": 5.563772314045059e-05, "epoch": 0.47305055459561896, "percentage": 47.31, "elapsed_time": "20:05:08", "remaining_time": "22:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8488, "total_steps": 17941, "loss": 1.5344, "learning_rate": 5.562887559816116e-05, "epoch": 0.47310629284878214, "percentage": 47.31, "elapsed_time": "20:05:17", "remaining_time": "22:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8489, "total_steps": 17941, "loss": 1.6937, "learning_rate": 5.562002787735657e-05, "epoch": 0.47316203110194527, "percentage": 47.32, "elapsed_time": "20:05:25", "remaining_time": "22:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8490, "total_steps": 17941, "loss": 1.6869, "learning_rate": 5.561117997831751e-05, "epoch": 0.4732177693551084, "percentage": 47.32, "elapsed_time": "20:05:34", "remaining_time": "22:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8491, "total_steps": 17941, "loss": 1.3939, "learning_rate": 5.56023319013245e-05, "epoch": 0.4732735076082716, "percentage": 47.33, "elapsed_time": "20:05:42", "remaining_time": "22:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8492, "total_steps": 17941, "loss": 1.5309, "learning_rate": 5.559348364665822e-05, "epoch": 0.4733292458614347, "percentage": 47.33, "elapsed_time": "20:05:51", "remaining_time": "22:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8493, "total_steps": 17941, "loss": 1.5592, "learning_rate": 5.5584635214599225e-05, "epoch": 0.47338498411459784, "percentage": 47.34, "elapsed_time": "20:05:59", "remaining_time": "22:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8494, "total_steps": 17941, "loss": 1.5603, "learning_rate": 5.557578660542816e-05, "epoch": 0.47344072236776097, "percentage": 47.34, "elapsed_time": "20:06:08", "remaining_time": "22:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8495, "total_steps": 17941, "loss": 1.5251, "learning_rate": 5.5566937819425656e-05, "epoch": 0.47349646062092415, "percentage": 47.35, "elapsed_time": "20:06:16", "remaining_time": "22:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8496, "total_steps": 17941, "loss": 1.572, "learning_rate": 5.5558088856872346e-05, "epoch": 0.4735521988740873, "percentage": 47.36, "elapsed_time": "20:06:24", "remaining_time": "22:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8497, "total_steps": 17941, "loss": 1.5153, "learning_rate": 5.554923971804887e-05, "epoch": 0.4736079371272504, "percentage": 47.36, "elapsed_time": "20:06:33", "remaining_time": "22:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8498, "total_steps": 17941, "loss": 1.7534, "learning_rate": 5.554039040323586e-05, "epoch": 0.4736636753804136, "percentage": 47.37, "elapsed_time": "20:06:41", "remaining_time": "22:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8499, "total_steps": 17941, "loss": 1.6791, "learning_rate": 5.5531540912713974e-05, "epoch": 0.4737194136335767, "percentage": 47.37, "elapsed_time": "20:06:50", "remaining_time": "22:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8500, "total_steps": 17941, "loss": 1.7779, "learning_rate": 5.552269124676386e-05, "epoch": 0.47377515188673985, "percentage": 47.38, "elapsed_time": "20:06:58", "remaining_time": "22:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8501, "total_steps": 17941, "loss": 1.4377, "learning_rate": 5.551384140566618e-05, "epoch": 0.47383089013990304, "percentage": 47.38, "elapsed_time": "20:07:07", "remaining_time": "22:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8502, "total_steps": 17941, "loss": 1.8262, "learning_rate": 5.550499138970158e-05, "epoch": 0.47388662839306617, "percentage": 47.39, "elapsed_time": "20:07:15", "remaining_time": "22:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8503, "total_steps": 17941, "loss": 1.3705, "learning_rate": 5.5496141199150766e-05, "epoch": 0.4739423666462293, "percentage": 47.39, "elapsed_time": "20:07:24", "remaining_time": "22:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8504, "total_steps": 17941, "loss": 1.7927, "learning_rate": 5.548729083429439e-05, "epoch": 0.4739981048993925, "percentage": 47.4, "elapsed_time": "20:07:32", "remaining_time": "22:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8505, "total_steps": 17941, "loss": 1.7237, "learning_rate": 5.547844029541316e-05, "epoch": 0.4740538431525556, "percentage": 47.41, "elapsed_time": "20:07:41", "remaining_time": "22:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8506, "total_steps": 17941, "loss": 1.6761, "learning_rate": 5.546958958278773e-05, "epoch": 0.47410958140571874, "percentage": 47.41, "elapsed_time": "20:07:49", "remaining_time": "22:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8507, "total_steps": 17941, "loss": 1.7347, "learning_rate": 5.546073869669881e-05, "epoch": 0.47416531965888187, "percentage": 47.42, "elapsed_time": "20:07:58", "remaining_time": "22:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8508, "total_steps": 17941, "loss": 1.5048, "learning_rate": 5.5451887637427104e-05, "epoch": 0.47422105791204505, "percentage": 47.42, "elapsed_time": "20:08:06", "remaining_time": "22:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8509, "total_steps": 17941, "loss": 1.811, "learning_rate": 5.544303640525328e-05, "epoch": 0.4742767961652082, "percentage": 47.43, "elapsed_time": "20:08:15", "remaining_time": "22:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8510, "total_steps": 17941, "loss": 1.7104, "learning_rate": 5.5434185000458114e-05, "epoch": 0.4743325344183713, "percentage": 47.43, "elapsed_time": "20:08:23", "remaining_time": "22:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8511, "total_steps": 17941, "loss": 1.7893, "learning_rate": 5.5425333423322255e-05, "epoch": 0.4743882726715345, "percentage": 47.44, "elapsed_time": "20:08:32", "remaining_time": "22:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8512, "total_steps": 17941, "loss": 1.7735, "learning_rate": 5.5416481674126474e-05, "epoch": 0.4744440109246976, "percentage": 47.44, "elapsed_time": "20:08:41", "remaining_time": "22:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8513, "total_steps": 17941, "loss": 1.7249, "learning_rate": 5.540762975315147e-05, "epoch": 0.47449974917786075, "percentage": 47.45, "elapsed_time": "20:08:49", "remaining_time": "22:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8514, "total_steps": 17941, "loss": 1.7148, "learning_rate": 5.539877766067798e-05, "epoch": 0.47455548743102394, "percentage": 47.46, "elapsed_time": "20:08:57", "remaining_time": "22:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8515, "total_steps": 17941, "loss": 1.6184, "learning_rate": 5.538992539698672e-05, "epoch": 0.47461122568418707, "percentage": 47.46, "elapsed_time": "20:09:06", "remaining_time": "22:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8516, "total_steps": 17941, "loss": 1.6898, "learning_rate": 5.538107296235847e-05, "epoch": 0.4746669639373502, "percentage": 47.47, "elapsed_time": "20:09:14", "remaining_time": "22:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8517, "total_steps": 17941, "loss": 1.7039, "learning_rate": 5.5372220357073955e-05, "epoch": 0.4747227021905133, "percentage": 47.47, "elapsed_time": "20:09:23", "remaining_time": "22:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8518, "total_steps": 17941, "loss": 1.5221, "learning_rate": 5.536336758141394e-05, "epoch": 0.4747784404436765, "percentage": 47.48, "elapsed_time": "20:09:32", "remaining_time": "22:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8519, "total_steps": 17941, "loss": 1.7282, "learning_rate": 5.535451463565916e-05, "epoch": 0.47483417869683964, "percentage": 47.48, "elapsed_time": "20:09:40", "remaining_time": "22:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8520, "total_steps": 17941, "loss": 1.6662, "learning_rate": 5.5345661520090394e-05, "epoch": 0.47488991695000277, "percentage": 47.49, "elapsed_time": "20:09:48", "remaining_time": "22:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8521, "total_steps": 17941, "loss": 1.6679, "learning_rate": 5.533680823498844e-05, "epoch": 0.47494565520316595, "percentage": 47.49, "elapsed_time": "20:09:57", "remaining_time": "22:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8522, "total_steps": 17941, "loss": 1.769, "learning_rate": 5.5327954780634004e-05, "epoch": 0.4750013934563291, "percentage": 47.5, "elapsed_time": "20:10:06", "remaining_time": "22:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8523, "total_steps": 17941, "loss": 1.9089, "learning_rate": 5.531910115730794e-05, "epoch": 0.4750571317094922, "percentage": 47.51, "elapsed_time": "20:10:14", "remaining_time": "22:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8524, "total_steps": 17941, "loss": 1.7743, "learning_rate": 5.531024736529099e-05, "epoch": 0.4751128699626554, "percentage": 47.51, "elapsed_time": "20:10:23", "remaining_time": "22:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8525, "total_steps": 17941, "loss": 1.9673, "learning_rate": 5.5301393404863954e-05, "epoch": 0.4751686082158185, "percentage": 47.52, "elapsed_time": "20:10:31", "remaining_time": "22:17:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8526, "total_steps": 17941, "loss": 1.6666, "learning_rate": 5.529253927630762e-05, "epoch": 0.47522434646898165, "percentage": 47.52, "elapsed_time": "20:10:39", "remaining_time": "22:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8527, "total_steps": 17941, "loss": 1.678, "learning_rate": 5.5283684979902815e-05, "epoch": 0.47528008472214484, "percentage": 47.53, "elapsed_time": "20:10:48", "remaining_time": "22:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8528, "total_steps": 17941, "loss": 1.6429, "learning_rate": 5.5274830515930306e-05, "epoch": 0.47533582297530796, "percentage": 47.53, "elapsed_time": "20:10:56", "remaining_time": "22:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8529, "total_steps": 17941, "loss": 1.65, "learning_rate": 5.526597588467095e-05, "epoch": 0.4753915612284711, "percentage": 47.54, "elapsed_time": "20:11:05", "remaining_time": "22:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8530, "total_steps": 17941, "loss": 1.6486, "learning_rate": 5.525712108640553e-05, "epoch": 0.4754472994816342, "percentage": 47.54, "elapsed_time": "20:11:13", "remaining_time": "22:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8531, "total_steps": 17941, "loss": 1.5981, "learning_rate": 5.524826612141488e-05, "epoch": 0.4755030377347974, "percentage": 47.55, "elapsed_time": "20:11:22", "remaining_time": "22:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8532, "total_steps": 17941, "loss": 1.6958, "learning_rate": 5.523941098997983e-05, "epoch": 0.47555877598796054, "percentage": 47.56, "elapsed_time": "20:11:30", "remaining_time": "22:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8533, "total_steps": 17941, "loss": 1.7152, "learning_rate": 5.5230555692381214e-05, "epoch": 0.47561451424112366, "percentage": 47.56, "elapsed_time": "20:11:38", "remaining_time": "22:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8534, "total_steps": 17941, "loss": 1.5163, "learning_rate": 5.5221700228899866e-05, "epoch": 0.47567025249428685, "percentage": 47.57, "elapsed_time": "20:11:47", "remaining_time": "22:15:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8535, "total_steps": 17941, "loss": 1.6854, "learning_rate": 5.521284459981662e-05, "epoch": 0.47572599074745, "percentage": 47.57, "elapsed_time": "20:11:55", "remaining_time": "22:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8536, "total_steps": 17941, "loss": 1.6205, "learning_rate": 5.520398880541235e-05, "epoch": 0.4757817290006131, "percentage": 47.58, "elapsed_time": "20:12:04", "remaining_time": "22:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8537, "total_steps": 17941, "loss": 1.8303, "learning_rate": 5.519513284596789e-05, "epoch": 0.4758374672537763, "percentage": 47.58, "elapsed_time": "20:12:12", "remaining_time": "22:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8538, "total_steps": 17941, "loss": 1.5506, "learning_rate": 5.518627672176412e-05, "epoch": 0.4758932055069394, "percentage": 47.59, "elapsed_time": "20:12:21", "remaining_time": "22:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8539, "total_steps": 17941, "loss": 1.2786, "learning_rate": 5.5177420433081874e-05, "epoch": 0.47594894376010255, "percentage": 47.59, "elapsed_time": "20:12:29", "remaining_time": "22:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8540, "total_steps": 17941, "loss": 1.5573, "learning_rate": 5.516856398020205e-05, "epoch": 0.4760046820132657, "percentage": 47.6, "elapsed_time": "20:12:38", "remaining_time": "22:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8541, "total_steps": 17941, "loss": 1.7721, "learning_rate": 5.5159707363405485e-05, "epoch": 0.47606042026642886, "percentage": 47.61, "elapsed_time": "20:12:46", "remaining_time": "22:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8542, "total_steps": 17941, "loss": 1.4076, "learning_rate": 5.515085058297313e-05, "epoch": 0.476116158519592, "percentage": 47.61, "elapsed_time": "20:12:55", "remaining_time": "22:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8543, "total_steps": 17941, "loss": 1.7104, "learning_rate": 5.514199363918578e-05, "epoch": 0.4761718967727551, "percentage": 47.62, "elapsed_time": "20:13:03", "remaining_time": "22:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8544, "total_steps": 17941, "loss": 1.8326, "learning_rate": 5.51331365323244e-05, "epoch": 0.4762276350259183, "percentage": 47.62, "elapsed_time": "20:13:12", "remaining_time": "22:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8545, "total_steps": 17941, "loss": 1.6206, "learning_rate": 5.5124279262669856e-05, "epoch": 0.47628337327908143, "percentage": 47.63, "elapsed_time": "20:13:20", "remaining_time": "22:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8546, "total_steps": 17941, "loss": 1.7466, "learning_rate": 5.511542183050305e-05, "epoch": 0.47633911153224456, "percentage": 47.63, "elapsed_time": "20:13:29", "remaining_time": "22:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8547, "total_steps": 17941, "loss": 1.5614, "learning_rate": 5.5106564236104884e-05, "epoch": 0.47639484978540775, "percentage": 47.64, "elapsed_time": "20:13:37", "remaining_time": "22:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8548, "total_steps": 17941, "loss": 1.825, "learning_rate": 5.509770647975626e-05, "epoch": 0.4764505880385709, "percentage": 47.65, "elapsed_time": "20:13:45", "remaining_time": "22:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8549, "total_steps": 17941, "loss": 1.8289, "learning_rate": 5.508884856173813e-05, "epoch": 0.476506326291734, "percentage": 47.65, "elapsed_time": "20:13:54", "remaining_time": "22:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8550, "total_steps": 17941, "loss": 1.591, "learning_rate": 5.507999048233138e-05, "epoch": 0.4765620645448972, "percentage": 47.66, "elapsed_time": "20:14:02", "remaining_time": "22:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8551, "total_steps": 17941, "loss": 1.6152, "learning_rate": 5.507113224181696e-05, "epoch": 0.4766178027980603, "percentage": 47.66, "elapsed_time": "20:14:11", "remaining_time": "22:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8552, "total_steps": 17941, "loss": 1.7522, "learning_rate": 5.506227384047579e-05, "epoch": 0.47667354105122345, "percentage": 47.67, "elapsed_time": "20:14:19", "remaining_time": "22:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8553, "total_steps": 17941, "loss": 1.8002, "learning_rate": 5.50534152785888e-05, "epoch": 0.4767292793043866, "percentage": 47.67, "elapsed_time": "20:14:28", "remaining_time": "22:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8554, "total_steps": 17941, "loss": 1.7472, "learning_rate": 5.504455655643694e-05, "epoch": 0.47678501755754976, "percentage": 47.68, "elapsed_time": "20:14:36", "remaining_time": "22:12:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8555, "total_steps": 17941, "loss": 1.7638, "learning_rate": 5.503569767430118e-05, "epoch": 0.4768407558107129, "percentage": 47.68, "elapsed_time": "20:14:45", "remaining_time": "22:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8556, "total_steps": 17941, "loss": 1.7726, "learning_rate": 5.502683863246243e-05, "epoch": 0.476896494063876, "percentage": 47.69, "elapsed_time": "20:14:53", "remaining_time": "22:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8557, "total_steps": 17941, "loss": 1.5519, "learning_rate": 5.5017979431201675e-05, "epoch": 0.4769522323170392, "percentage": 47.7, "elapsed_time": "20:15:02", "remaining_time": "22:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8558, "total_steps": 17941, "loss": 1.6896, "learning_rate": 5.500912007079987e-05, "epoch": 0.47700797057020233, "percentage": 47.7, "elapsed_time": "20:15:10", "remaining_time": "22:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8559, "total_steps": 17941, "loss": 1.7455, "learning_rate": 5.5000260551537975e-05, "epoch": 0.47706370882336546, "percentage": 47.71, "elapsed_time": "20:15:19", "remaining_time": "22:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8560, "total_steps": 17941, "loss": 1.5399, "learning_rate": 5.499140087369697e-05, "epoch": 0.47711944707652865, "percentage": 47.71, "elapsed_time": "20:15:27", "remaining_time": "22:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8561, "total_steps": 17941, "loss": 1.5373, "learning_rate": 5.4982541037557823e-05, "epoch": 0.4771751853296918, "percentage": 47.72, "elapsed_time": "20:15:36", "remaining_time": "22:11:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8562, "total_steps": 17941, "loss": 1.2027, "learning_rate": 5.4973681043401534e-05, "epoch": 0.4772309235828549, "percentage": 47.72, "elapsed_time": "20:15:45", "remaining_time": "22:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8563, "total_steps": 17941, "loss": 1.9377, "learning_rate": 5.496482089150908e-05, "epoch": 0.47728666183601803, "percentage": 47.73, "elapsed_time": "20:15:53", "remaining_time": "22:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8564, "total_steps": 17941, "loss": 1.4814, "learning_rate": 5.495596058216147e-05, "epoch": 0.4773424000891812, "percentage": 47.73, "elapsed_time": "20:16:02", "remaining_time": "22:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8565, "total_steps": 17941, "loss": 1.6303, "learning_rate": 5.494710011563966e-05, "epoch": 0.47739813834234435, "percentage": 47.74, "elapsed_time": "20:16:10", "remaining_time": "22:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8566, "total_steps": 17941, "loss": 1.6204, "learning_rate": 5.49382394922247e-05, "epoch": 0.4774538765955075, "percentage": 47.75, "elapsed_time": "20:16:19", "remaining_time": "22:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8567, "total_steps": 17941, "loss": 1.5949, "learning_rate": 5.4929378712197556e-05, "epoch": 0.47750961484867066, "percentage": 47.75, "elapsed_time": "20:16:27", "remaining_time": "22:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8568, "total_steps": 17941, "loss": 1.7625, "learning_rate": 5.4920517775839276e-05, "epoch": 0.4775653531018338, "percentage": 47.76, "elapsed_time": "20:16:36", "remaining_time": "22:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8569, "total_steps": 17941, "loss": 1.7809, "learning_rate": 5.491165668343085e-05, "epoch": 0.4776210913549969, "percentage": 47.76, "elapsed_time": "20:16:44", "remaining_time": "22:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8570, "total_steps": 17941, "loss": 2.0053, "learning_rate": 5.4902795435253306e-05, "epoch": 0.4776768296081601, "percentage": 47.77, "elapsed_time": "20:16:53", "remaining_time": "22:10:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8571, "total_steps": 17941, "loss": 1.8136, "learning_rate": 5.489393403158769e-05, "epoch": 0.47773256786132323, "percentage": 47.77, "elapsed_time": "20:17:01", "remaining_time": "22:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8572, "total_steps": 17941, "loss": 1.9469, "learning_rate": 5.488507247271502e-05, "epoch": 0.47778830611448636, "percentage": 47.78, "elapsed_time": "20:17:10", "remaining_time": "22:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8573, "total_steps": 17941, "loss": 1.7089, "learning_rate": 5.487621075891632e-05, "epoch": 0.47784404436764955, "percentage": 47.78, "elapsed_time": "20:17:18", "remaining_time": "22:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8574, "total_steps": 17941, "loss": 1.8108, "learning_rate": 5.4867348890472646e-05, "epoch": 0.4778997826208127, "percentage": 47.79, "elapsed_time": "20:17:27", "remaining_time": "22:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8575, "total_steps": 17941, "loss": 1.5179, "learning_rate": 5.485848686766506e-05, "epoch": 0.4779555208739758, "percentage": 47.8, "elapsed_time": "20:17:35", "remaining_time": "22:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8576, "total_steps": 17941, "loss": 1.6112, "learning_rate": 5.484962469077458e-05, "epoch": 0.47801125912713893, "percentage": 47.8, "elapsed_time": "20:17:44", "remaining_time": "22:09:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8577, "total_steps": 17941, "loss": 1.6932, "learning_rate": 5.4840762360082286e-05, "epoch": 0.4780669973803021, "percentage": 47.81, "elapsed_time": "20:17:52", "remaining_time": "22:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8578, "total_steps": 17941, "loss": 1.7001, "learning_rate": 5.483189987586924e-05, "epoch": 0.47812273563346525, "percentage": 47.81, "elapsed_time": "20:18:00", "remaining_time": "22:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8579, "total_steps": 17941, "loss": 1.7767, "learning_rate": 5.4823037238416506e-05, "epoch": 0.4781784738866284, "percentage": 47.82, "elapsed_time": "20:18:09", "remaining_time": "22:09:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8580, "total_steps": 17941, "loss": 1.6749, "learning_rate": 5.481417444800512e-05, "epoch": 0.47823421213979156, "percentage": 47.82, "elapsed_time": "20:18:18", "remaining_time": "22:09:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8581, "total_steps": 17941, "loss": 1.723, "learning_rate": 5.480531150491622e-05, "epoch": 0.4782899503929547, "percentage": 47.83, "elapsed_time": "20:18:26", "remaining_time": "22:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8582, "total_steps": 17941, "loss": 1.8049, "learning_rate": 5.4796448409430845e-05, "epoch": 0.4783456886461178, "percentage": 47.83, "elapsed_time": "20:18:34", "remaining_time": "22:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8583, "total_steps": 17941, "loss": 1.979, "learning_rate": 5.478758516183009e-05, "epoch": 0.478401426899281, "percentage": 47.84, "elapsed_time": "20:18:43", "remaining_time": "22:08:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8584, "total_steps": 17941, "loss": 1.738, "learning_rate": 5.477872176239506e-05, "epoch": 0.47845716515244413, "percentage": 47.85, "elapsed_time": "20:18:51", "remaining_time": "22:08:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8585, "total_steps": 17941, "loss": 1.5133, "learning_rate": 5.4769858211406824e-05, "epoch": 0.47851290340560726, "percentage": 47.85, "elapsed_time": "20:19:00", "remaining_time": "22:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8586, "total_steps": 17941, "loss": 1.6054, "learning_rate": 5.4760994509146514e-05, "epoch": 0.4785686416587704, "percentage": 47.86, "elapsed_time": "20:19:08", "remaining_time": "22:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8587, "total_steps": 17941, "loss": 1.4712, "learning_rate": 5.475213065589518e-05, "epoch": 0.4786243799119336, "percentage": 47.86, "elapsed_time": "20:19:17", "remaining_time": "22:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8588, "total_steps": 17941, "loss": 1.4907, "learning_rate": 5.4743266651934e-05, "epoch": 0.4786801181650967, "percentage": 47.87, "elapsed_time": "20:19:25", "remaining_time": "22:08:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8589, "total_steps": 17941, "loss": 1.4832, "learning_rate": 5.4734402497544044e-05, "epoch": 0.47873585641825983, "percentage": 47.87, "elapsed_time": "20:19:34", "remaining_time": "22:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8590, "total_steps": 17941, "loss": 1.6588, "learning_rate": 5.472553819300645e-05, "epoch": 0.478791594671423, "percentage": 47.88, "elapsed_time": "20:19:42", "remaining_time": "22:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8591, "total_steps": 17941, "loss": 1.6905, "learning_rate": 5.471667373860234e-05, "epoch": 0.47884733292458614, "percentage": 47.88, "elapsed_time": "20:19:51", "remaining_time": "22:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8592, "total_steps": 17941, "loss": 1.7177, "learning_rate": 5.4707809134612844e-05, "epoch": 0.4789030711777493, "percentage": 47.89, "elapsed_time": "20:19:59", "remaining_time": "22:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8593, "total_steps": 17941, "loss": 1.8388, "learning_rate": 5.469894438131906e-05, "epoch": 0.47895880943091246, "percentage": 47.9, "elapsed_time": "20:20:08", "remaining_time": "22:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8594, "total_steps": 17941, "loss": 1.9354, "learning_rate": 5.469007947900219e-05, "epoch": 0.4790145476840756, "percentage": 47.9, "elapsed_time": "20:20:16", "remaining_time": "22:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8595, "total_steps": 17941, "loss": 1.6465, "learning_rate": 5.468121442794333e-05, "epoch": 0.4790702859372387, "percentage": 47.91, "elapsed_time": "20:20:25", "remaining_time": "22:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8596, "total_steps": 17941, "loss": 1.8636, "learning_rate": 5.467234922842363e-05, "epoch": 0.4791260241904019, "percentage": 47.91, "elapsed_time": "20:20:33", "remaining_time": "22:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8597, "total_steps": 17941, "loss": 1.7346, "learning_rate": 5.4663483880724275e-05, "epoch": 0.47918176244356503, "percentage": 47.92, "elapsed_time": "20:20:41", "remaining_time": "22:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8598, "total_steps": 17941, "loss": 1.8068, "learning_rate": 5.46546183851264e-05, "epoch": 0.47923750069672816, "percentage": 47.92, "elapsed_time": "20:20:50", "remaining_time": "22:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8599, "total_steps": 17941, "loss": 1.4534, "learning_rate": 5.464575274191116e-05, "epoch": 0.4792932389498913, "percentage": 47.93, "elapsed_time": "20:20:58", "remaining_time": "22:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8600, "total_steps": 17941, "loss": 1.5212, "learning_rate": 5.4636886951359726e-05, "epoch": 0.47934897720305447, "percentage": 47.93, "elapsed_time": "20:21:07", "remaining_time": "22:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8601, "total_steps": 17941, "loss": 1.6756, "learning_rate": 5.4628021013753284e-05, "epoch": 0.4794047154562176, "percentage": 47.94, "elapsed_time": "20:21:15", "remaining_time": "22:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8602, "total_steps": 17941, "loss": 1.7895, "learning_rate": 5.461915492937299e-05, "epoch": 0.47946045370938073, "percentage": 47.95, "elapsed_time": "20:21:24", "remaining_time": "22:06:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8603, "total_steps": 17941, "loss": 1.7024, "learning_rate": 5.461028869850004e-05, "epoch": 0.4795161919625439, "percentage": 47.95, "elapsed_time": "20:21:32", "remaining_time": "22:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8604, "total_steps": 17941, "loss": 1.7879, "learning_rate": 5.4601422321415606e-05, "epoch": 0.47957193021570704, "percentage": 47.96, "elapsed_time": "20:21:41", "remaining_time": "22:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8605, "total_steps": 17941, "loss": 1.6198, "learning_rate": 5.459255579840089e-05, "epoch": 0.47962766846887017, "percentage": 47.96, "elapsed_time": "20:21:50", "remaining_time": "22:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8606, "total_steps": 17941, "loss": 1.6159, "learning_rate": 5.458368912973707e-05, "epoch": 0.47968340672203336, "percentage": 47.97, "elapsed_time": "20:21:59", "remaining_time": "22:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8607, "total_steps": 17941, "loss": 1.6843, "learning_rate": 5.4574822315705366e-05, "epoch": 0.4797391449751965, "percentage": 47.97, "elapsed_time": "20:22:08", "remaining_time": "22:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8608, "total_steps": 17941, "loss": 1.8092, "learning_rate": 5.456595535658696e-05, "epoch": 0.4797948832283596, "percentage": 47.98, "elapsed_time": "20:22:16", "remaining_time": "22:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8609, "total_steps": 17941, "loss": 1.7726, "learning_rate": 5.455708825266308e-05, "epoch": 0.47985062148152274, "percentage": 47.99, "elapsed_time": "20:22:25", "remaining_time": "22:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8610, "total_steps": 17941, "loss": 1.7107, "learning_rate": 5.4548221004214936e-05, "epoch": 0.47990635973468593, "percentage": 47.99, "elapsed_time": "20:22:33", "remaining_time": "22:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8611, "total_steps": 17941, "loss": 1.5578, "learning_rate": 5.453935361152374e-05, "epoch": 0.47996209798784906, "percentage": 48.0, "elapsed_time": "20:22:41", "remaining_time": "22:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8612, "total_steps": 17941, "loss": 1.8959, "learning_rate": 5.45304860748707e-05, "epoch": 0.4800178362410122, "percentage": 48.0, "elapsed_time": "20:22:50", "remaining_time": "22:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8613, "total_steps": 17941, "loss": 1.9346, "learning_rate": 5.4521618394537056e-05, "epoch": 0.48007357449417537, "percentage": 48.01, "elapsed_time": "20:22:59", "remaining_time": "22:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8614, "total_steps": 17941, "loss": 1.6191, "learning_rate": 5.451275057080405e-05, "epoch": 0.4801293127473385, "percentage": 48.01, "elapsed_time": "20:23:07", "remaining_time": "22:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8615, "total_steps": 17941, "loss": 1.6555, "learning_rate": 5.4503882603952905e-05, "epoch": 0.48018505100050163, "percentage": 48.02, "elapsed_time": "20:23:16", "remaining_time": "22:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8616, "total_steps": 17941, "loss": 1.7481, "learning_rate": 5.449501449426487e-05, "epoch": 0.4802407892536648, "percentage": 48.02, "elapsed_time": "20:23:24", "remaining_time": "22:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8617, "total_steps": 17941, "loss": 1.7338, "learning_rate": 5.448614624202117e-05, "epoch": 0.48029652750682794, "percentage": 48.03, "elapsed_time": "20:23:33", "remaining_time": "22:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8618, "total_steps": 17941, "loss": 1.7127, "learning_rate": 5.447727784750308e-05, "epoch": 0.48035226575999107, "percentage": 48.04, "elapsed_time": "20:23:41", "remaining_time": "22:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8619, "total_steps": 17941, "loss": 1.733, "learning_rate": 5.446840931099182e-05, "epoch": 0.48040800401315426, "percentage": 48.04, "elapsed_time": "20:23:50", "remaining_time": "22:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8620, "total_steps": 17941, "loss": 1.5931, "learning_rate": 5.445954063276869e-05, "epoch": 0.4804637422663174, "percentage": 48.05, "elapsed_time": "20:23:58", "remaining_time": "22:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8621, "total_steps": 17941, "loss": 1.6994, "learning_rate": 5.445067181311492e-05, "epoch": 0.4805194805194805, "percentage": 48.05, "elapsed_time": "20:24:07", "remaining_time": "22:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8622, "total_steps": 17941, "loss": 1.5357, "learning_rate": 5.4441802852311795e-05, "epoch": 0.48057521877264364, "percentage": 48.06, "elapsed_time": "20:24:15", "remaining_time": "22:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8623, "total_steps": 17941, "loss": 1.5543, "learning_rate": 5.443293375064058e-05, "epoch": 0.4806309570258068, "percentage": 48.06, "elapsed_time": "20:24:24", "remaining_time": "22:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8624, "total_steps": 17941, "loss": 1.902, "learning_rate": 5.4424064508382556e-05, "epoch": 0.48068669527896996, "percentage": 48.07, "elapsed_time": "20:24:33", "remaining_time": "22:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8625, "total_steps": 17941, "loss": 1.7444, "learning_rate": 5.4415195125819e-05, "epoch": 0.4807424335321331, "percentage": 48.07, "elapsed_time": "20:24:41", "remaining_time": "22:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8626, "total_steps": 17941, "loss": 1.6553, "learning_rate": 5.440632560323118e-05, "epoch": 0.48079817178529627, "percentage": 48.08, "elapsed_time": "20:24:49", "remaining_time": "22:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8627, "total_steps": 17941, "loss": 1.3808, "learning_rate": 5.439745594090042e-05, "epoch": 0.4808539100384594, "percentage": 48.09, "elapsed_time": "20:24:58", "remaining_time": "22:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8628, "total_steps": 17941, "loss": 1.5705, "learning_rate": 5.438858613910799e-05, "epoch": 0.4809096482916225, "percentage": 48.09, "elapsed_time": "20:25:06", "remaining_time": "22:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8629, "total_steps": 17941, "loss": 1.9702, "learning_rate": 5.43797161981352e-05, "epoch": 0.4809653865447857, "percentage": 48.1, "elapsed_time": "20:25:15", "remaining_time": "22:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8630, "total_steps": 17941, "loss": 1.8149, "learning_rate": 5.4370846118263354e-05, "epoch": 0.48102112479794884, "percentage": 48.1, "elapsed_time": "20:25:24", "remaining_time": "22:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8631, "total_steps": 17941, "loss": 1.5798, "learning_rate": 5.436197589977374e-05, "epoch": 0.48107686305111197, "percentage": 48.11, "elapsed_time": "20:25:33", "remaining_time": "22:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8632, "total_steps": 17941, "loss": 1.6549, "learning_rate": 5.435310554294769e-05, "epoch": 0.4811326013042751, "percentage": 48.11, "elapsed_time": "20:25:41", "remaining_time": "22:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8633, "total_steps": 17941, "loss": 1.7124, "learning_rate": 5.434423504806651e-05, "epoch": 0.4811883395574383, "percentage": 48.12, "elapsed_time": "20:25:50", "remaining_time": "22:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8634, "total_steps": 17941, "loss": 1.568, "learning_rate": 5.433536441541152e-05, "epoch": 0.4812440778106014, "percentage": 48.12, "elapsed_time": "20:25:58", "remaining_time": "22:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8635, "total_steps": 17941, "loss": 1.4785, "learning_rate": 5.432649364526403e-05, "epoch": 0.48129981606376454, "percentage": 48.13, "elapsed_time": "20:26:07", "remaining_time": "22:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8636, "total_steps": 17941, "loss": 1.4929, "learning_rate": 5.4317622737905413e-05, "epoch": 0.4813555543169277, "percentage": 48.14, "elapsed_time": "20:26:15", "remaining_time": "22:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8637, "total_steps": 17941, "loss": 1.7861, "learning_rate": 5.4308751693616975e-05, "epoch": 0.48141129257009085, "percentage": 48.14, "elapsed_time": "20:26:24", "remaining_time": "22:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8638, "total_steps": 17941, "loss": 1.6655, "learning_rate": 5.429988051268006e-05, "epoch": 0.481467030823254, "percentage": 48.15, "elapsed_time": "20:26:32", "remaining_time": "22:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8639, "total_steps": 17941, "loss": 1.8461, "learning_rate": 5.429100919537597e-05, "epoch": 0.48152276907641717, "percentage": 48.15, "elapsed_time": "20:26:41", "remaining_time": "22:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8640, "total_steps": 17941, "loss": 1.9077, "learning_rate": 5.4282137741986125e-05, "epoch": 0.4815785073295803, "percentage": 48.16, "elapsed_time": "20:26:50", "remaining_time": "22:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8641, "total_steps": 17941, "loss": 1.6468, "learning_rate": 5.427326615279182e-05, "epoch": 0.4816342455827434, "percentage": 48.16, "elapsed_time": "20:26:58", "remaining_time": "22:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8642, "total_steps": 17941, "loss": 1.7315, "learning_rate": 5.426439442807444e-05, "epoch": 0.4816899838359066, "percentage": 48.17, "elapsed_time": "20:27:07", "remaining_time": "22:00:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8643, "total_steps": 17941, "loss": 1.8597, "learning_rate": 5.4255522568115314e-05, "epoch": 0.48174572208906974, "percentage": 48.17, "elapsed_time": "20:27:15", "remaining_time": "22:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8644, "total_steps": 17941, "loss": 1.4579, "learning_rate": 5.424665057319584e-05, "epoch": 0.48180146034223287, "percentage": 48.18, "elapsed_time": "20:27:24", "remaining_time": "22:00:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8645, "total_steps": 17941, "loss": 1.7045, "learning_rate": 5.4237778443597366e-05, "epoch": 0.481857198595396, "percentage": 48.19, "elapsed_time": "20:27:32", "remaining_time": "21:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8646, "total_steps": 17941, "loss": 1.7194, "learning_rate": 5.4228906179601256e-05, "epoch": 0.4819129368485592, "percentage": 48.19, "elapsed_time": "20:27:41", "remaining_time": "21:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8647, "total_steps": 17941, "loss": 1.8115, "learning_rate": 5.42200337814889e-05, "epoch": 0.4819686751017223, "percentage": 48.2, "elapsed_time": "20:27:49", "remaining_time": "21:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8648, "total_steps": 17941, "loss": 1.7122, "learning_rate": 5.421116124954169e-05, "epoch": 0.48202441335488544, "percentage": 48.2, "elapsed_time": "20:27:58", "remaining_time": "21:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8649, "total_steps": 17941, "loss": 1.6734, "learning_rate": 5.4202288584040996e-05, "epoch": 0.4820801516080486, "percentage": 48.21, "elapsed_time": "20:28:06", "remaining_time": "21:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8650, "total_steps": 17941, "loss": 1.9098, "learning_rate": 5.4193415785268195e-05, "epoch": 0.48213588986121175, "percentage": 48.21, "elapsed_time": "20:28:15", "remaining_time": "21:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8651, "total_steps": 17941, "loss": 1.5751, "learning_rate": 5.418454285350472e-05, "epoch": 0.4821916281143749, "percentage": 48.22, "elapsed_time": "20:28:23", "remaining_time": "21:59:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8652, "total_steps": 17941, "loss": 1.9574, "learning_rate": 5.4175669789031904e-05, "epoch": 0.48224736636753807, "percentage": 48.22, "elapsed_time": "20:28:32", "remaining_time": "21:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8653, "total_steps": 17941, "loss": 1.6274, "learning_rate": 5.4166796592131216e-05, "epoch": 0.4823031046207012, "percentage": 48.23, "elapsed_time": "20:28:40", "remaining_time": "21:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8654, "total_steps": 17941, "loss": 1.6101, "learning_rate": 5.415792326308403e-05, "epoch": 0.4823588428738643, "percentage": 48.24, "elapsed_time": "20:28:49", "remaining_time": "21:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8655, "total_steps": 17941, "loss": 1.7006, "learning_rate": 5.414904980217177e-05, "epoch": 0.48241458112702745, "percentage": 48.24, "elapsed_time": "20:28:57", "remaining_time": "21:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8656, "total_steps": 17941, "loss": 1.5782, "learning_rate": 5.414017620967582e-05, "epoch": 0.48247031938019064, "percentage": 48.25, "elapsed_time": "20:29:06", "remaining_time": "21:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8657, "total_steps": 17941, "loss": 1.8762, "learning_rate": 5.4131302485877635e-05, "epoch": 0.48252605763335377, "percentage": 48.25, "elapsed_time": "20:29:14", "remaining_time": "21:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8658, "total_steps": 17941, "loss": 1.6882, "learning_rate": 5.412242863105862e-05, "epoch": 0.4825817958865169, "percentage": 48.26, "elapsed_time": "20:29:22", "remaining_time": "21:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8659, "total_steps": 17941, "loss": 1.6909, "learning_rate": 5.41135546455002e-05, "epoch": 0.4826375341396801, "percentage": 48.26, "elapsed_time": "20:29:31", "remaining_time": "21:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8660, "total_steps": 17941, "loss": 1.8966, "learning_rate": 5.410468052948381e-05, "epoch": 0.4826932723928432, "percentage": 48.27, "elapsed_time": "20:29:39", "remaining_time": "21:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8661, "total_steps": 17941, "loss": 1.6114, "learning_rate": 5.409580628329088e-05, "epoch": 0.48274901064600634, "percentage": 48.27, "elapsed_time": "20:29:48", "remaining_time": "21:57:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8662, "total_steps": 17941, "loss": 1.4296, "learning_rate": 5.408693190720288e-05, "epoch": 0.4828047488991695, "percentage": 48.28, "elapsed_time": "20:29:56", "remaining_time": "21:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8663, "total_steps": 17941, "loss": 1.7761, "learning_rate": 5.40780574015012e-05, "epoch": 0.48286048715233265, "percentage": 48.29, "elapsed_time": "20:30:05", "remaining_time": "21:57:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8664, "total_steps": 17941, "loss": 1.7426, "learning_rate": 5.406918276646733e-05, "epoch": 0.4829162254054958, "percentage": 48.29, "elapsed_time": "20:30:13", "remaining_time": "21:57:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8665, "total_steps": 17941, "loss": 1.5949, "learning_rate": 5.40603080023827e-05, "epoch": 0.48297196365865896, "percentage": 48.3, "elapsed_time": "20:30:22", "remaining_time": "21:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8666, "total_steps": 17941, "loss": 1.9571, "learning_rate": 5.405143310952878e-05, "epoch": 0.4830277019118221, "percentage": 48.3, "elapsed_time": "20:30:30", "remaining_time": "21:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8667, "total_steps": 17941, "loss": 1.9154, "learning_rate": 5.4042558088187014e-05, "epoch": 0.4830834401649852, "percentage": 48.31, "elapsed_time": "20:30:39", "remaining_time": "21:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8668, "total_steps": 17941, "loss": 1.5508, "learning_rate": 5.40336829386389e-05, "epoch": 0.48313917841814835, "percentage": 48.31, "elapsed_time": "20:30:47", "remaining_time": "21:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8669, "total_steps": 17941, "loss": 1.5887, "learning_rate": 5.4024807661165855e-05, "epoch": 0.48319491667131154, "percentage": 48.32, "elapsed_time": "20:30:56", "remaining_time": "21:56:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8670, "total_steps": 17941, "loss": 1.5876, "learning_rate": 5.4015932256049386e-05, "epoch": 0.48325065492447467, "percentage": 48.33, "elapsed_time": "20:31:04", "remaining_time": "21:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8671, "total_steps": 17941, "loss": 1.8633, "learning_rate": 5.4007056723570956e-05, "epoch": 0.4833063931776378, "percentage": 48.33, "elapsed_time": "20:31:13", "remaining_time": "21:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8672, "total_steps": 17941, "loss": 1.7922, "learning_rate": 5.399818106401206e-05, "epoch": 0.483362131430801, "percentage": 48.34, "elapsed_time": "20:31:21", "remaining_time": "21:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8673, "total_steps": 17941, "loss": 1.7496, "learning_rate": 5.3989305277654156e-05, "epoch": 0.4834178696839641, "percentage": 48.34, "elapsed_time": "20:31:29", "remaining_time": "21:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8674, "total_steps": 17941, "loss": 1.6191, "learning_rate": 5.398042936477875e-05, "epoch": 0.48347360793712724, "percentage": 48.35, "elapsed_time": "20:31:38", "remaining_time": "21:55:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8675, "total_steps": 17941, "loss": 1.8695, "learning_rate": 5.397155332566736e-05, "epoch": 0.4835293461902904, "percentage": 48.35, "elapsed_time": "20:31:47", "remaining_time": "21:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8676, "total_steps": 17941, "loss": 1.5275, "learning_rate": 5.3962677160601426e-05, "epoch": 0.48358508444345355, "percentage": 48.36, "elapsed_time": "20:31:55", "remaining_time": "21:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8677, "total_steps": 17941, "loss": 1.4847, "learning_rate": 5.395380086986249e-05, "epoch": 0.4836408226966167, "percentage": 48.36, "elapsed_time": "20:32:04", "remaining_time": "21:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8678, "total_steps": 17941, "loss": 1.652, "learning_rate": 5.3944924453732014e-05, "epoch": 0.4836965609497798, "percentage": 48.37, "elapsed_time": "20:32:12", "remaining_time": "21:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8679, "total_steps": 17941, "loss": 1.356, "learning_rate": 5.3936047912491574e-05, "epoch": 0.483752299202943, "percentage": 48.38, "elapsed_time": "20:32:21", "remaining_time": "21:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8680, "total_steps": 17941, "loss": 1.7965, "learning_rate": 5.3927171246422615e-05, "epoch": 0.4838080374561061, "percentage": 48.38, "elapsed_time": "20:32:29", "remaining_time": "21:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8681, "total_steps": 17941, "loss": 1.6595, "learning_rate": 5.39182944558067e-05, "epoch": 0.48386377570926925, "percentage": 48.39, "elapsed_time": "20:32:38", "remaining_time": "21:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8682, "total_steps": 17941, "loss": 1.6973, "learning_rate": 5.390941754092532e-05, "epoch": 0.48391951396243243, "percentage": 48.39, "elapsed_time": "20:32:46", "remaining_time": "21:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8683, "total_steps": 17941, "loss": 1.6383, "learning_rate": 5.3900540502060015e-05, "epoch": 0.48397525221559556, "percentage": 48.4, "elapsed_time": "20:32:54", "remaining_time": "21:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8684, "total_steps": 17941, "loss": 1.73, "learning_rate": 5.3891663339492306e-05, "epoch": 0.4840309904687587, "percentage": 48.4, "elapsed_time": "20:33:03", "remaining_time": "21:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8685, "total_steps": 17941, "loss": 1.5295, "learning_rate": 5.388278605350372e-05, "epoch": 0.4840867287219219, "percentage": 48.41, "elapsed_time": "20:33:11", "remaining_time": "21:54:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8686, "total_steps": 17941, "loss": 1.6765, "learning_rate": 5.38739086443758e-05, "epoch": 0.484142466975085, "percentage": 48.41, "elapsed_time": "20:33:20", "remaining_time": "21:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8687, "total_steps": 17941, "loss": 1.5357, "learning_rate": 5.386503111239008e-05, "epoch": 0.48419820522824814, "percentage": 48.42, "elapsed_time": "20:33:28", "remaining_time": "21:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8688, "total_steps": 17941, "loss": 1.7396, "learning_rate": 5.385615345782813e-05, "epoch": 0.4842539434814113, "percentage": 48.43, "elapsed_time": "20:33:37", "remaining_time": "21:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8689, "total_steps": 17941, "loss": 1.7116, "learning_rate": 5.3847275680971454e-05, "epoch": 0.48430968173457445, "percentage": 48.43, "elapsed_time": "20:33:45", "remaining_time": "21:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8690, "total_steps": 17941, "loss": 1.6747, "learning_rate": 5.383839778210163e-05, "epoch": 0.4843654199877376, "percentage": 48.44, "elapsed_time": "20:33:54", "remaining_time": "21:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8691, "total_steps": 17941, "loss": 1.5563, "learning_rate": 5.38295197615002e-05, "epoch": 0.4844211582409007, "percentage": 48.44, "elapsed_time": "20:34:02", "remaining_time": "21:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8692, "total_steps": 17941, "loss": 2.1129, "learning_rate": 5.382064161944874e-05, "epoch": 0.4844768964940639, "percentage": 48.45, "elapsed_time": "20:34:11", "remaining_time": "21:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8693, "total_steps": 17941, "loss": 1.6652, "learning_rate": 5.3811763356228804e-05, "epoch": 0.484532634747227, "percentage": 48.45, "elapsed_time": "20:34:19", "remaining_time": "21:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8694, "total_steps": 17941, "loss": 1.7085, "learning_rate": 5.3802884972121955e-05, "epoch": 0.48458837300039015, "percentage": 48.46, "elapsed_time": "20:34:28", "remaining_time": "21:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8695, "total_steps": 17941, "loss": 1.7126, "learning_rate": 5.379400646740977e-05, "epoch": 0.48464411125355333, "percentage": 48.46, "elapsed_time": "20:34:36", "remaining_time": "21:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8696, "total_steps": 17941, "loss": 1.7257, "learning_rate": 5.3785127842373814e-05, "epoch": 0.48469984950671646, "percentage": 48.47, "elapsed_time": "20:34:45", "remaining_time": "21:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8697, "total_steps": 17941, "loss": 1.6778, "learning_rate": 5.3776249097295696e-05, "epoch": 0.4847555877598796, "percentage": 48.48, "elapsed_time": "20:34:53", "remaining_time": "21:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8698, "total_steps": 17941, "loss": 1.717, "learning_rate": 5.376737023245695e-05, "epoch": 0.4848113260130428, "percentage": 48.48, "elapsed_time": "20:35:02", "remaining_time": "21:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8699, "total_steps": 17941, "loss": 1.9998, "learning_rate": 5.375849124813919e-05, "epoch": 0.4848670642662059, "percentage": 48.49, "elapsed_time": "20:35:11", "remaining_time": "21:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8700, "total_steps": 17941, "loss": 1.9211, "learning_rate": 5.3749612144623995e-05, "epoch": 0.48492280251936903, "percentage": 48.49, "elapsed_time": "20:35:19", "remaining_time": "21:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8701, "total_steps": 17941, "loss": 1.7934, "learning_rate": 5.374073292219297e-05, "epoch": 0.48497854077253216, "percentage": 48.5, "elapsed_time": "20:35:28", "remaining_time": "21:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8702, "total_steps": 17941, "loss": 1.8932, "learning_rate": 5.3731853581127714e-05, "epoch": 0.48503427902569535, "percentage": 48.5, "elapsed_time": "20:35:36", "remaining_time": "21:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8703, "total_steps": 17941, "loss": 1.7465, "learning_rate": 5.3722974121709815e-05, "epoch": 0.4850900172788585, "percentage": 48.51, "elapsed_time": "20:35:44", "remaining_time": "21:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8704, "total_steps": 17941, "loss": 1.7025, "learning_rate": 5.371409454422087e-05, "epoch": 0.4851457555320216, "percentage": 48.51, "elapsed_time": "20:35:53", "remaining_time": "21:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8705, "total_steps": 17941, "loss": 1.6435, "learning_rate": 5.370521484894252e-05, "epoch": 0.4852014937851848, "percentage": 48.52, "elapsed_time": "20:36:02", "remaining_time": "21:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8706, "total_steps": 17941, "loss": 1.7067, "learning_rate": 5.3696335036156345e-05, "epoch": 0.4852572320383479, "percentage": 48.53, "elapsed_time": "20:36:10", "remaining_time": "21:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8707, "total_steps": 17941, "loss": 1.6528, "learning_rate": 5.368745510614399e-05, "epoch": 0.48531297029151105, "percentage": 48.53, "elapsed_time": "20:36:19", "remaining_time": "21:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8708, "total_steps": 17941, "loss": 1.8253, "learning_rate": 5.367857505918704e-05, "epoch": 0.48536870854467423, "percentage": 48.54, "elapsed_time": "20:36:27", "remaining_time": "21:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8709, "total_steps": 17941, "loss": 1.8483, "learning_rate": 5.3669694895567145e-05, "epoch": 0.48542444679783736, "percentage": 48.54, "elapsed_time": "20:36:36", "remaining_time": "21:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8710, "total_steps": 17941, "loss": 1.4705, "learning_rate": 5.366081461556593e-05, "epoch": 0.4854801850510005, "percentage": 48.55, "elapsed_time": "20:36:44", "remaining_time": "21:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8711, "total_steps": 17941, "loss": 1.4843, "learning_rate": 5.365193421946502e-05, "epoch": 0.4855359233041637, "percentage": 48.55, "elapsed_time": "20:36:52", "remaining_time": "21:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8712, "total_steps": 17941, "loss": 1.6045, "learning_rate": 5.3643053707546034e-05, "epoch": 0.4855916615573268, "percentage": 48.56, "elapsed_time": "20:37:01", "remaining_time": "21:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8713, "total_steps": 17941, "loss": 1.7184, "learning_rate": 5.363417308009062e-05, "epoch": 0.48564739981048993, "percentage": 48.56, "elapsed_time": "20:37:10", "remaining_time": "21:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8714, "total_steps": 17941, "loss": 1.6326, "learning_rate": 5.362529233738045e-05, "epoch": 0.48570313806365306, "percentage": 48.57, "elapsed_time": "20:37:18", "remaining_time": "21:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8715, "total_steps": 17941, "loss": 1.6036, "learning_rate": 5.361641147969713e-05, "epoch": 0.48575887631681625, "percentage": 48.58, "elapsed_time": "20:37:27", "remaining_time": "21:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8716, "total_steps": 17941, "loss": 1.8542, "learning_rate": 5.3607530507322334e-05, "epoch": 0.4858146145699794, "percentage": 48.58, "elapsed_time": "20:37:36", "remaining_time": "21:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8717, "total_steps": 17941, "loss": 1.6413, "learning_rate": 5.3598649420537675e-05, "epoch": 0.4858703528231425, "percentage": 48.59, "elapsed_time": "20:37:44", "remaining_time": "21:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8718, "total_steps": 17941, "loss": 1.7414, "learning_rate": 5.358976821962487e-05, "epoch": 0.4859260910763057, "percentage": 48.59, "elapsed_time": "20:37:53", "remaining_time": "21:49:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8719, "total_steps": 17941, "loss": 1.623, "learning_rate": 5.358088690486553e-05, "epoch": 0.4859818293294688, "percentage": 48.6, "elapsed_time": "20:38:01", "remaining_time": "21:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8720, "total_steps": 17941, "loss": 1.4861, "learning_rate": 5.357200547654134e-05, "epoch": 0.48603756758263195, "percentage": 48.6, "elapsed_time": "20:38:09", "remaining_time": "21:49:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8721, "total_steps": 17941, "loss": 1.763, "learning_rate": 5.356312393493396e-05, "epoch": 0.48609330583579513, "percentage": 48.61, "elapsed_time": "20:38:18", "remaining_time": "21:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8722, "total_steps": 17941, "loss": 1.4284, "learning_rate": 5.3554242280325064e-05, "epoch": 0.48614904408895826, "percentage": 48.61, "elapsed_time": "20:38:27", "remaining_time": "21:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8723, "total_steps": 17941, "loss": 1.8725, "learning_rate": 5.354536051299634e-05, "epoch": 0.4862047823421214, "percentage": 48.62, "elapsed_time": "20:38:35", "remaining_time": "21:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8724, "total_steps": 17941, "loss": 1.6673, "learning_rate": 5.353647863322943e-05, "epoch": 0.4862605205952845, "percentage": 48.63, "elapsed_time": "20:38:44", "remaining_time": "21:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8725, "total_steps": 17941, "loss": 1.7026, "learning_rate": 5.3527596641306034e-05, "epoch": 0.4863162588484477, "percentage": 48.63, "elapsed_time": "20:38:52", "remaining_time": "21:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8726, "total_steps": 17941, "loss": 1.3786, "learning_rate": 5.3518714537507855e-05, "epoch": 0.48637199710161083, "percentage": 48.64, "elapsed_time": "20:39:01", "remaining_time": "21:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8727, "total_steps": 17941, "loss": 1.5461, "learning_rate": 5.350983232211657e-05, "epoch": 0.48642773535477396, "percentage": 48.64, "elapsed_time": "20:39:09", "remaining_time": "21:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8728, "total_steps": 17941, "loss": 1.8215, "learning_rate": 5.350094999541385e-05, "epoch": 0.48648347360793714, "percentage": 48.65, "elapsed_time": "20:39:18", "remaining_time": "21:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8729, "total_steps": 17941, "loss": 1.6419, "learning_rate": 5.349206755768142e-05, "epoch": 0.4865392118611003, "percentage": 48.65, "elapsed_time": "20:39:26", "remaining_time": "21:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8730, "total_steps": 17941, "loss": 1.7303, "learning_rate": 5.3483185009200955e-05, "epoch": 0.4865949501142634, "percentage": 48.66, "elapsed_time": "20:39:35", "remaining_time": "21:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8731, "total_steps": 17941, "loss": 1.8506, "learning_rate": 5.347430235025419e-05, "epoch": 0.4866506883674266, "percentage": 48.67, "elapsed_time": "20:39:43", "remaining_time": "21:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8732, "total_steps": 17941, "loss": 1.4549, "learning_rate": 5.34654195811228e-05, "epoch": 0.4867064266205897, "percentage": 48.67, "elapsed_time": "20:39:52", "remaining_time": "21:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8733, "total_steps": 17941, "loss": 1.6001, "learning_rate": 5.345653670208851e-05, "epoch": 0.48676216487375285, "percentage": 48.68, "elapsed_time": "20:40:00", "remaining_time": "21:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8734, "total_steps": 17941, "loss": 1.7102, "learning_rate": 5.344765371343302e-05, "epoch": 0.48681790312691603, "percentage": 48.68, "elapsed_time": "20:40:08", "remaining_time": "21:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8735, "total_steps": 17941, "loss": 1.5661, "learning_rate": 5.343877061543806e-05, "epoch": 0.48687364138007916, "percentage": 48.69, "elapsed_time": "20:40:17", "remaining_time": "21:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8736, "total_steps": 17941, "loss": 1.9036, "learning_rate": 5.342988740838535e-05, "epoch": 0.4869293796332423, "percentage": 48.69, "elapsed_time": "20:40:25", "remaining_time": "21:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8737, "total_steps": 17941, "loss": 1.8516, "learning_rate": 5.342100409255659e-05, "epoch": 0.4869851178864054, "percentage": 48.7, "elapsed_time": "20:40:34", "remaining_time": "21:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8738, "total_steps": 17941, "loss": 1.5462, "learning_rate": 5.341212066823355e-05, "epoch": 0.4870408561395686, "percentage": 48.7, "elapsed_time": "20:40:43", "remaining_time": "21:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8739, "total_steps": 17941, "loss": 1.7118, "learning_rate": 5.340323713569792e-05, "epoch": 0.48709659439273173, "percentage": 48.71, "elapsed_time": "20:40:51", "remaining_time": "21:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8740, "total_steps": 17941, "loss": 1.8225, "learning_rate": 5.339435349523148e-05, "epoch": 0.48715233264589486, "percentage": 48.72, "elapsed_time": "20:40:59", "remaining_time": "21:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8741, "total_steps": 17941, "loss": 1.9512, "learning_rate": 5.33854697471159e-05, "epoch": 0.48720807089905804, "percentage": 48.72, "elapsed_time": "20:41:08", "remaining_time": "21:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8742, "total_steps": 17941, "loss": 1.6836, "learning_rate": 5.337658589163299e-05, "epoch": 0.4872638091522212, "percentage": 48.73, "elapsed_time": "20:41:17", "remaining_time": "21:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8743, "total_steps": 17941, "loss": 1.709, "learning_rate": 5.3367701929064426e-05, "epoch": 0.4873195474053843, "percentage": 48.73, "elapsed_time": "20:41:25", "remaining_time": "21:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8744, "total_steps": 17941, "loss": 1.5885, "learning_rate": 5.3358817859692025e-05, "epoch": 0.4873752856585475, "percentage": 48.74, "elapsed_time": "20:41:34", "remaining_time": "21:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8745, "total_steps": 17941, "loss": 1.6946, "learning_rate": 5.334993368379748e-05, "epoch": 0.4874310239117106, "percentage": 48.74, "elapsed_time": "20:41:42", "remaining_time": "21:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8746, "total_steps": 17941, "loss": 1.5776, "learning_rate": 5.3341049401662594e-05, "epoch": 0.48748676216487374, "percentage": 48.75, "elapsed_time": "20:41:51", "remaining_time": "21:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8747, "total_steps": 17941, "loss": 1.6057, "learning_rate": 5.333216501356909e-05, "epoch": 0.4875425004180369, "percentage": 48.75, "elapsed_time": "20:42:00", "remaining_time": "21:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8748, "total_steps": 17941, "loss": 1.7629, "learning_rate": 5.332328051979873e-05, "epoch": 0.48759823867120006, "percentage": 48.76, "elapsed_time": "20:42:08", "remaining_time": "21:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8749, "total_steps": 17941, "loss": 1.7972, "learning_rate": 5.3314395920633306e-05, "epoch": 0.4876539769243632, "percentage": 48.77, "elapsed_time": "20:42:17", "remaining_time": "21:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8750, "total_steps": 17941, "loss": 1.7521, "learning_rate": 5.330551121635454e-05, "epoch": 0.4877097151775263, "percentage": 48.77, "elapsed_time": "20:42:25", "remaining_time": "21:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8751, "total_steps": 17941, "loss": 1.4613, "learning_rate": 5.329662640724426e-05, "epoch": 0.4877654534306895, "percentage": 48.78, "elapsed_time": "20:42:34", "remaining_time": "21:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8752, "total_steps": 17941, "loss": 1.4367, "learning_rate": 5.32877414935842e-05, "epoch": 0.48782119168385263, "percentage": 48.78, "elapsed_time": "20:42:42", "remaining_time": "21:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8753, "total_steps": 17941, "loss": 1.649, "learning_rate": 5.3278856475656144e-05, "epoch": 0.48787692993701576, "percentage": 48.79, "elapsed_time": "20:42:51", "remaining_time": "21:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8754, "total_steps": 17941, "loss": 1.9406, "learning_rate": 5.326997135374189e-05, "epoch": 0.48793266819017894, "percentage": 48.79, "elapsed_time": "20:42:59", "remaining_time": "21:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8755, "total_steps": 17941, "loss": 1.6661, "learning_rate": 5.3261086128123206e-05, "epoch": 0.48798840644334207, "percentage": 48.8, "elapsed_time": "20:43:08", "remaining_time": "21:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8756, "total_steps": 17941, "loss": 1.9258, "learning_rate": 5.3252200799081875e-05, "epoch": 0.4880441446965052, "percentage": 48.8, "elapsed_time": "20:43:16", "remaining_time": "21:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8757, "total_steps": 17941, "loss": 1.6868, "learning_rate": 5.3243315366899694e-05, "epoch": 0.4880998829496684, "percentage": 48.81, "elapsed_time": "20:43:24", "remaining_time": "21:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8758, "total_steps": 17941, "loss": 1.4586, "learning_rate": 5.3234429831858466e-05, "epoch": 0.4881556212028315, "percentage": 48.82, "elapsed_time": "20:43:33", "remaining_time": "21:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8759, "total_steps": 17941, "loss": 1.6262, "learning_rate": 5.3225544194239984e-05, "epoch": 0.48821135945599464, "percentage": 48.82, "elapsed_time": "20:43:41", "remaining_time": "21:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8760, "total_steps": 17941, "loss": 1.5789, "learning_rate": 5.3216658454326043e-05, "epoch": 0.48826709770915777, "percentage": 48.83, "elapsed_time": "20:43:50", "remaining_time": "21:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8761, "total_steps": 17941, "loss": 1.8751, "learning_rate": 5.3207772612398444e-05, "epoch": 0.48832283596232096, "percentage": 48.83, "elapsed_time": "20:43:58", "remaining_time": "21:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8762, "total_steps": 17941, "loss": 1.5181, "learning_rate": 5.319888666873902e-05, "epoch": 0.4883785742154841, "percentage": 48.84, "elapsed_time": "20:44:07", "remaining_time": "21:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8763, "total_steps": 17941, "loss": 1.6698, "learning_rate": 5.319000062362953e-05, "epoch": 0.4884343124686472, "percentage": 48.84, "elapsed_time": "20:44:16", "remaining_time": "21:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8764, "total_steps": 17941, "loss": 1.6822, "learning_rate": 5.318111447735186e-05, "epoch": 0.4884900507218104, "percentage": 48.85, "elapsed_time": "20:44:24", "remaining_time": "21:43:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8765, "total_steps": 17941, "loss": 1.8201, "learning_rate": 5.317222823018775e-05, "epoch": 0.4885457889749735, "percentage": 48.85, "elapsed_time": "20:44:33", "remaining_time": "21:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8766, "total_steps": 17941, "loss": 1.705, "learning_rate": 5.316334188241908e-05, "epoch": 0.48860152722813666, "percentage": 48.86, "elapsed_time": "20:44:41", "remaining_time": "21:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8767, "total_steps": 17941, "loss": 1.7352, "learning_rate": 5.3154455434327634e-05, "epoch": 0.48865726548129984, "percentage": 48.87, "elapsed_time": "20:44:49", "remaining_time": "21:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8768, "total_steps": 17941, "loss": 1.7109, "learning_rate": 5.314556888619527e-05, "epoch": 0.48871300373446297, "percentage": 48.87, "elapsed_time": "20:44:59", "remaining_time": "21:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8769, "total_steps": 17941, "loss": 1.7114, "learning_rate": 5.313668223830378e-05, "epoch": 0.4887687419876261, "percentage": 48.88, "elapsed_time": "20:45:07", "remaining_time": "21:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8770, "total_steps": 17941, "loss": 1.5484, "learning_rate": 5.312779549093503e-05, "epoch": 0.4888244802407892, "percentage": 48.88, "elapsed_time": "20:45:16", "remaining_time": "21:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8771, "total_steps": 17941, "loss": 1.7072, "learning_rate": 5.3118908644370834e-05, "epoch": 0.4888802184939524, "percentage": 48.89, "elapsed_time": "20:45:24", "remaining_time": "21:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8772, "total_steps": 17941, "loss": 1.7843, "learning_rate": 5.3110021698893053e-05, "epoch": 0.48893595674711554, "percentage": 48.89, "elapsed_time": "20:45:32", "remaining_time": "21:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8773, "total_steps": 17941, "loss": 1.5887, "learning_rate": 5.310113465478351e-05, "epoch": 0.48899169500027867, "percentage": 48.9, "elapsed_time": "20:45:41", "remaining_time": "21:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8774, "total_steps": 17941, "loss": 1.5671, "learning_rate": 5.309224751232406e-05, "epoch": 0.48904743325344185, "percentage": 48.9, "elapsed_time": "20:45:49", "remaining_time": "21:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8775, "total_steps": 17941, "loss": 1.8061, "learning_rate": 5.308336027179655e-05, "epoch": 0.489103171506605, "percentage": 48.91, "elapsed_time": "20:45:58", "remaining_time": "21:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8776, "total_steps": 17941, "loss": 1.7021, "learning_rate": 5.307447293348281e-05, "epoch": 0.4891589097597681, "percentage": 48.92, "elapsed_time": "20:46:07", "remaining_time": "21:41:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8777, "total_steps": 17941, "loss": 1.5089, "learning_rate": 5.306558549766473e-05, "epoch": 0.4892146480129313, "percentage": 48.92, "elapsed_time": "20:46:15", "remaining_time": "21:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8778, "total_steps": 17941, "loss": 1.764, "learning_rate": 5.305669796462415e-05, "epoch": 0.4892703862660944, "percentage": 48.93, "elapsed_time": "20:46:24", "remaining_time": "21:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8779, "total_steps": 17941, "loss": 1.751, "learning_rate": 5.3047810334642935e-05, "epoch": 0.48932612451925755, "percentage": 48.93, "elapsed_time": "20:46:33", "remaining_time": "21:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8780, "total_steps": 17941, "loss": 1.7939, "learning_rate": 5.303892260800294e-05, "epoch": 0.48938186277242074, "percentage": 48.94, "elapsed_time": "20:46:41", "remaining_time": "21:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8781, "total_steps": 17941, "loss": 1.8436, "learning_rate": 5.303003478498605e-05, "epoch": 0.48943760102558387, "percentage": 48.94, "elapsed_time": "20:46:50", "remaining_time": "21:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8782, "total_steps": 17941, "loss": 1.7894, "learning_rate": 5.3021146865874117e-05, "epoch": 0.489493339278747, "percentage": 48.95, "elapsed_time": "20:46:58", "remaining_time": "21:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8783, "total_steps": 17941, "loss": 1.7486, "learning_rate": 5.301225885094902e-05, "epoch": 0.4895490775319101, "percentage": 48.95, "elapsed_time": "20:47:06", "remaining_time": "21:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8784, "total_steps": 17941, "loss": 1.7971, "learning_rate": 5.300337074049262e-05, "epoch": 0.4896048157850733, "percentage": 48.96, "elapsed_time": "20:47:15", "remaining_time": "21:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8785, "total_steps": 17941, "loss": 1.6085, "learning_rate": 5.299448253478683e-05, "epoch": 0.48966055403823644, "percentage": 48.97, "elapsed_time": "20:47:23", "remaining_time": "21:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8786, "total_steps": 17941, "loss": 1.8445, "learning_rate": 5.29855942341135e-05, "epoch": 0.48971629229139957, "percentage": 48.97, "elapsed_time": "20:47:32", "remaining_time": "21:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8787, "total_steps": 17941, "loss": 1.7854, "learning_rate": 5.297670583875454e-05, "epoch": 0.48977203054456275, "percentage": 48.98, "elapsed_time": "20:47:40", "remaining_time": "21:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8788, "total_steps": 17941, "loss": 1.4982, "learning_rate": 5.296781734899182e-05, "epoch": 0.4898277687977259, "percentage": 48.98, "elapsed_time": "20:47:49", "remaining_time": "21:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8789, "total_steps": 17941, "loss": 1.7415, "learning_rate": 5.295892876510723e-05, "epoch": 0.489883507050889, "percentage": 48.99, "elapsed_time": "20:47:57", "remaining_time": "21:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8790, "total_steps": 17941, "loss": 1.5488, "learning_rate": 5.295004008738268e-05, "epoch": 0.4899392453040522, "percentage": 48.99, "elapsed_time": "20:48:06", "remaining_time": "21:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8791, "total_steps": 17941, "loss": 1.7582, "learning_rate": 5.294115131610006e-05, "epoch": 0.4899949835572153, "percentage": 49.0, "elapsed_time": "20:48:14", "remaining_time": "21:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8792, "total_steps": 17941, "loss": 1.5738, "learning_rate": 5.293226245154127e-05, "epoch": 0.49005072181037845, "percentage": 49.01, "elapsed_time": "20:48:23", "remaining_time": "21:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8793, "total_steps": 17941, "loss": 1.7709, "learning_rate": 5.292337349398821e-05, "epoch": 0.4901064600635416, "percentage": 49.01, "elapsed_time": "20:48:31", "remaining_time": "21:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8794, "total_steps": 17941, "loss": 1.5022, "learning_rate": 5.291448444372279e-05, "epoch": 0.49016219831670477, "percentage": 49.02, "elapsed_time": "20:48:40", "remaining_time": "21:38:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8795, "total_steps": 17941, "loss": 1.7136, "learning_rate": 5.29055953010269e-05, "epoch": 0.4902179365698679, "percentage": 49.02, "elapsed_time": "20:48:48", "remaining_time": "21:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8796, "total_steps": 17941, "loss": 1.5791, "learning_rate": 5.289670606618248e-05, "epoch": 0.490273674823031, "percentage": 49.03, "elapsed_time": "20:48:56", "remaining_time": "21:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8797, "total_steps": 17941, "loss": 1.7905, "learning_rate": 5.288781673947143e-05, "epoch": 0.4903294130761942, "percentage": 49.03, "elapsed_time": "20:49:05", "remaining_time": "21:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8798, "total_steps": 17941, "loss": 1.7184, "learning_rate": 5.2878927321175676e-05, "epoch": 0.49038515132935734, "percentage": 49.04, "elapsed_time": "20:49:13", "remaining_time": "21:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8799, "total_steps": 17941, "loss": 1.5013, "learning_rate": 5.2870037811577125e-05, "epoch": 0.49044088958252047, "percentage": 49.04, "elapsed_time": "20:49:22", "remaining_time": "21:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8800, "total_steps": 17941, "loss": 1.7939, "learning_rate": 5.28611482109577e-05, "epoch": 0.49049662783568365, "percentage": 49.05, "elapsed_time": "20:49:30", "remaining_time": "21:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8801, "total_steps": 17941, "loss": 1.5717, "learning_rate": 5.2852258519599365e-05, "epoch": 0.4905523660888468, "percentage": 49.06, "elapsed_time": "20:49:39", "remaining_time": "21:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8802, "total_steps": 17941, "loss": 1.5725, "learning_rate": 5.284336873778398e-05, "epoch": 0.4906081043420099, "percentage": 49.06, "elapsed_time": "20:49:47", "remaining_time": "21:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8803, "total_steps": 17941, "loss": 1.5918, "learning_rate": 5.2834478865793545e-05, "epoch": 0.4906638425951731, "percentage": 49.07, "elapsed_time": "20:49:55", "remaining_time": "21:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8804, "total_steps": 17941, "loss": 1.7262, "learning_rate": 5.282558890390995e-05, "epoch": 0.4907195808483362, "percentage": 49.07, "elapsed_time": "20:50:05", "remaining_time": "21:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8805, "total_steps": 17941, "loss": 1.6374, "learning_rate": 5.281669885241517e-05, "epoch": 0.49077531910149935, "percentage": 49.08, "elapsed_time": "20:50:13", "remaining_time": "21:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8806, "total_steps": 17941, "loss": 1.7363, "learning_rate": 5.280780871159111e-05, "epoch": 0.4908310573546625, "percentage": 49.08, "elapsed_time": "20:50:22", "remaining_time": "21:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8807, "total_steps": 17941, "loss": 1.8078, "learning_rate": 5.279891848171974e-05, "epoch": 0.49088679560782567, "percentage": 49.09, "elapsed_time": "20:50:30", "remaining_time": "21:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8808, "total_steps": 17941, "loss": 1.5397, "learning_rate": 5.2790028163082985e-05, "epoch": 0.4909425338609888, "percentage": 49.09, "elapsed_time": "20:50:39", "remaining_time": "21:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8809, "total_steps": 17941, "loss": 1.6362, "learning_rate": 5.2781137755962794e-05, "epoch": 0.4909982721141519, "percentage": 49.1, "elapsed_time": "20:50:47", "remaining_time": "21:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8810, "total_steps": 17941, "loss": 1.765, "learning_rate": 5.2772247260641136e-05, "epoch": 0.4910540103673151, "percentage": 49.11, "elapsed_time": "20:50:56", "remaining_time": "21:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8811, "total_steps": 17941, "loss": 1.7014, "learning_rate": 5.276335667739998e-05, "epoch": 0.49110974862047824, "percentage": 49.11, "elapsed_time": "20:51:04", "remaining_time": "21:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8812, "total_steps": 17941, "loss": 1.7533, "learning_rate": 5.275446600652123e-05, "epoch": 0.49116548687364137, "percentage": 49.12, "elapsed_time": "20:51:14", "remaining_time": "21:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8813, "total_steps": 17941, "loss": 2.1051, "learning_rate": 5.2745575248286895e-05, "epoch": 0.49122122512680455, "percentage": 49.12, "elapsed_time": "20:51:22", "remaining_time": "21:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8814, "total_steps": 17941, "loss": 1.6069, "learning_rate": 5.273668440297892e-05, "epoch": 0.4912769633799677, "percentage": 49.13, "elapsed_time": "20:51:31", "remaining_time": "21:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8815, "total_steps": 17941, "loss": 1.4399, "learning_rate": 5.272779347087925e-05, "epoch": 0.4913327016331308, "percentage": 49.13, "elapsed_time": "20:51:39", "remaining_time": "21:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8816, "total_steps": 17941, "loss": 1.5401, "learning_rate": 5.27189024522699e-05, "epoch": 0.49138843988629394, "percentage": 49.14, "elapsed_time": "20:51:48", "remaining_time": "21:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8817, "total_steps": 17941, "loss": 1.6588, "learning_rate": 5.271001134743281e-05, "epoch": 0.4914441781394571, "percentage": 49.14, "elapsed_time": "20:51:56", "remaining_time": "21:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8818, "total_steps": 17941, "loss": 1.7393, "learning_rate": 5.270112015664997e-05, "epoch": 0.49149991639262025, "percentage": 49.15, "elapsed_time": "20:52:04", "remaining_time": "21:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8819, "total_steps": 17941, "loss": 1.6144, "learning_rate": 5.2692228880203333e-05, "epoch": 0.4915556546457834, "percentage": 49.16, "elapsed_time": "20:52:13", "remaining_time": "21:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8820, "total_steps": 17941, "loss": 1.6107, "learning_rate": 5.2683337518374906e-05, "epoch": 0.49161139289894656, "percentage": 49.16, "elapsed_time": "20:52:21", "remaining_time": "21:35:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8821, "total_steps": 17941, "loss": 1.5545, "learning_rate": 5.267444607144665e-05, "epoch": 0.4916671311521097, "percentage": 49.17, "elapsed_time": "20:52:30", "remaining_time": "21:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8822, "total_steps": 17941, "loss": 1.6128, "learning_rate": 5.2665554539700554e-05, "epoch": 0.4917228694052728, "percentage": 49.17, "elapsed_time": "20:52:39", "remaining_time": "21:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8823, "total_steps": 17941, "loss": 2.064, "learning_rate": 5.265666292341861e-05, "epoch": 0.491778607658436, "percentage": 49.18, "elapsed_time": "20:52:47", "remaining_time": "21:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8824, "total_steps": 17941, "loss": 1.2805, "learning_rate": 5.26477712228828e-05, "epoch": 0.49183434591159914, "percentage": 49.18, "elapsed_time": "20:52:56", "remaining_time": "21:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8825, "total_steps": 17941, "loss": 1.8211, "learning_rate": 5.2638879438375144e-05, "epoch": 0.49189008416476226, "percentage": 49.19, "elapsed_time": "20:53:04", "remaining_time": "21:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8826, "total_steps": 17941, "loss": 1.6321, "learning_rate": 5.2629987570177606e-05, "epoch": 0.49194582241792545, "percentage": 49.19, "elapsed_time": "20:53:13", "remaining_time": "21:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8827, "total_steps": 17941, "loss": 1.782, "learning_rate": 5.262109561857221e-05, "epoch": 0.4920015606710886, "percentage": 49.2, "elapsed_time": "20:53:22", "remaining_time": "21:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8828, "total_steps": 17941, "loss": 1.5132, "learning_rate": 5.261220358384091e-05, "epoch": 0.4920572989242517, "percentage": 49.21, "elapsed_time": "20:53:30", "remaining_time": "21:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8829, "total_steps": 17941, "loss": 1.4457, "learning_rate": 5.260331146626578e-05, "epoch": 0.49211303717741484, "percentage": 49.21, "elapsed_time": "20:53:38", "remaining_time": "21:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8830, "total_steps": 17941, "loss": 1.6268, "learning_rate": 5.259441926612877e-05, "epoch": 0.492168775430578, "percentage": 49.22, "elapsed_time": "20:53:48", "remaining_time": "21:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8831, "total_steps": 17941, "loss": 1.5747, "learning_rate": 5.2585526983711916e-05, "epoch": 0.49222451368374115, "percentage": 49.22, "elapsed_time": "20:53:56", "remaining_time": "21:33:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8832, "total_steps": 17941, "loss": 1.6989, "learning_rate": 5.2576634619297216e-05, "epoch": 0.4922802519369043, "percentage": 49.23, "elapsed_time": "20:54:05", "remaining_time": "21:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8833, "total_steps": 17941, "loss": 1.4546, "learning_rate": 5.256774217316669e-05, "epoch": 0.49233599019006746, "percentage": 49.23, "elapsed_time": "20:54:13", "remaining_time": "21:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8834, "total_steps": 17941, "loss": 1.6071, "learning_rate": 5.255884964560235e-05, "epoch": 0.4923917284432306, "percentage": 49.24, "elapsed_time": "20:54:22", "remaining_time": "21:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8835, "total_steps": 17941, "loss": 1.7096, "learning_rate": 5.254995703688621e-05, "epoch": 0.4924474666963937, "percentage": 49.24, "elapsed_time": "20:54:31", "remaining_time": "21:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8836, "total_steps": 17941, "loss": 1.6175, "learning_rate": 5.2541064347300306e-05, "epoch": 0.4925032049495569, "percentage": 49.25, "elapsed_time": "20:54:39", "remaining_time": "21:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8837, "total_steps": 17941, "loss": 1.2836, "learning_rate": 5.253217157712666e-05, "epoch": 0.49255894320272003, "percentage": 49.26, "elapsed_time": "20:54:47", "remaining_time": "21:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8838, "total_steps": 17941, "loss": 1.7038, "learning_rate": 5.2523278726647304e-05, "epoch": 0.49261468145588316, "percentage": 49.26, "elapsed_time": "20:54:56", "remaining_time": "21:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8839, "total_steps": 17941, "loss": 1.8079, "learning_rate": 5.251438579614425e-05, "epoch": 0.4926704197090463, "percentage": 49.27, "elapsed_time": "20:55:04", "remaining_time": "21:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8840, "total_steps": 17941, "loss": 1.8102, "learning_rate": 5.250549278589955e-05, "epoch": 0.4927261579622095, "percentage": 49.27, "elapsed_time": "20:55:13", "remaining_time": "21:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8841, "total_steps": 17941, "loss": 1.6611, "learning_rate": 5.249659969619519e-05, "epoch": 0.4927818962153726, "percentage": 49.28, "elapsed_time": "20:55:21", "remaining_time": "21:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8842, "total_steps": 17941, "loss": 1.5826, "learning_rate": 5.248770652731327e-05, "epoch": 0.49283763446853573, "percentage": 49.28, "elapsed_time": "20:55:30", "remaining_time": "21:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8843, "total_steps": 17941, "loss": 1.5787, "learning_rate": 5.247881327953581e-05, "epoch": 0.4928933727216989, "percentage": 49.29, "elapsed_time": "20:55:39", "remaining_time": "21:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8844, "total_steps": 17941, "loss": 1.7769, "learning_rate": 5.246991995314484e-05, "epoch": 0.49294911097486205, "percentage": 49.29, "elapsed_time": "20:55:47", "remaining_time": "21:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8845, "total_steps": 17941, "loss": 1.6973, "learning_rate": 5.24610265484224e-05, "epoch": 0.4930048492280252, "percentage": 49.3, "elapsed_time": "20:55:56", "remaining_time": "21:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8846, "total_steps": 17941, "loss": 1.4484, "learning_rate": 5.2452133065650565e-05, "epoch": 0.49306058748118836, "percentage": 49.31, "elapsed_time": "20:56:04", "remaining_time": "21:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8847, "total_steps": 17941, "loss": 1.7145, "learning_rate": 5.2443239505111354e-05, "epoch": 0.4931163257343515, "percentage": 49.31, "elapsed_time": "20:56:13", "remaining_time": "21:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8848, "total_steps": 17941, "loss": 1.5229, "learning_rate": 5.243434586708682e-05, "epoch": 0.4931720639875146, "percentage": 49.32, "elapsed_time": "20:56:21", "remaining_time": "21:31:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8849, "total_steps": 17941, "loss": 1.4448, "learning_rate": 5.2425452151859045e-05, "epoch": 0.4932278022406778, "percentage": 49.32, "elapsed_time": "20:56:29", "remaining_time": "21:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8850, "total_steps": 17941, "loss": 1.8291, "learning_rate": 5.241655835971006e-05, "epoch": 0.49328354049384093, "percentage": 49.33, "elapsed_time": "20:56:38", "remaining_time": "21:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8851, "total_steps": 17941, "loss": 1.53, "learning_rate": 5.240766449092194e-05, "epoch": 0.49333927874700406, "percentage": 49.33, "elapsed_time": "20:56:46", "remaining_time": "21:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8852, "total_steps": 17941, "loss": 1.7215, "learning_rate": 5.239877054577673e-05, "epoch": 0.4933950170001672, "percentage": 49.34, "elapsed_time": "20:56:55", "remaining_time": "21:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8853, "total_steps": 17941, "loss": 1.8231, "learning_rate": 5.2389876524556526e-05, "epoch": 0.4934507552533304, "percentage": 49.35, "elapsed_time": "20:57:03", "remaining_time": "21:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8854, "total_steps": 17941, "loss": 1.7529, "learning_rate": 5.2380982427543346e-05, "epoch": 0.4935064935064935, "percentage": 49.35, "elapsed_time": "20:57:12", "remaining_time": "21:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8855, "total_steps": 17941, "loss": 1.5894, "learning_rate": 5.23720882550193e-05, "epoch": 0.49356223175965663, "percentage": 49.36, "elapsed_time": "20:57:20", "remaining_time": "21:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8856, "total_steps": 17941, "loss": 1.811, "learning_rate": 5.2363194007266435e-05, "epoch": 0.4936179700128198, "percentage": 49.36, "elapsed_time": "20:57:29", "remaining_time": "21:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8857, "total_steps": 17941, "loss": 1.6787, "learning_rate": 5.2354299684566856e-05, "epoch": 0.49367370826598295, "percentage": 49.37, "elapsed_time": "20:57:37", "remaining_time": "21:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8858, "total_steps": 17941, "loss": 1.4917, "learning_rate": 5.2345405287202596e-05, "epoch": 0.4937294465191461, "percentage": 49.37, "elapsed_time": "20:57:46", "remaining_time": "21:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8859, "total_steps": 17941, "loss": 1.6775, "learning_rate": 5.233651081545577e-05, "epoch": 0.49378518477230926, "percentage": 49.38, "elapsed_time": "20:57:55", "remaining_time": "21:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8860, "total_steps": 17941, "loss": 1.6414, "learning_rate": 5.232761626960844e-05, "epoch": 0.4938409230254724, "percentage": 49.38, "elapsed_time": "20:58:03", "remaining_time": "21:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8861, "total_steps": 17941, "loss": 1.6513, "learning_rate": 5.231872164994268e-05, "epoch": 0.4938966612786355, "percentage": 49.39, "elapsed_time": "20:58:11", "remaining_time": "21:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8862, "total_steps": 17941, "loss": 1.7083, "learning_rate": 5.230982695674059e-05, "epoch": 0.49395239953179865, "percentage": 49.4, "elapsed_time": "20:58:20", "remaining_time": "21:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8863, "total_steps": 17941, "loss": 1.5971, "learning_rate": 5.230093219028427e-05, "epoch": 0.49400813778496183, "percentage": 49.4, "elapsed_time": "20:58:28", "remaining_time": "21:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8864, "total_steps": 17941, "loss": 1.5896, "learning_rate": 5.229203735085579e-05, "epoch": 0.49406387603812496, "percentage": 49.41, "elapsed_time": "20:58:37", "remaining_time": "21:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8865, "total_steps": 17941, "loss": 1.8503, "learning_rate": 5.2283142438737245e-05, "epoch": 0.4941196142912881, "percentage": 49.41, "elapsed_time": "20:58:45", "remaining_time": "21:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8866, "total_steps": 17941, "loss": 1.6416, "learning_rate": 5.227424745421074e-05, "epoch": 0.4941753525444513, "percentage": 49.42, "elapsed_time": "20:58:54", "remaining_time": "21:28:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8867, "total_steps": 17941, "loss": 1.3659, "learning_rate": 5.2265352397558354e-05, "epoch": 0.4942310907976144, "percentage": 49.42, "elapsed_time": "20:59:02", "remaining_time": "21:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8868, "total_steps": 17941, "loss": 1.5523, "learning_rate": 5.225645726906222e-05, "epoch": 0.49428682905077753, "percentage": 49.43, "elapsed_time": "20:59:10", "remaining_time": "21:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8869, "total_steps": 17941, "loss": 1.7921, "learning_rate": 5.224756206900439e-05, "epoch": 0.4943425673039407, "percentage": 49.43, "elapsed_time": "20:59:19", "remaining_time": "21:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8870, "total_steps": 17941, "loss": 1.6013, "learning_rate": 5.2238666797667026e-05, "epoch": 0.49439830555710385, "percentage": 49.44, "elapsed_time": "20:59:27", "remaining_time": "21:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8871, "total_steps": 17941, "loss": 1.4794, "learning_rate": 5.2229771455332176e-05, "epoch": 0.494454043810267, "percentage": 49.45, "elapsed_time": "20:59:36", "remaining_time": "21:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8872, "total_steps": 17941, "loss": 1.5029, "learning_rate": 5.2220876042281995e-05, "epoch": 0.49450978206343016, "percentage": 49.45, "elapsed_time": "20:59:44", "remaining_time": "21:27:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8873, "total_steps": 17941, "loss": 1.7888, "learning_rate": 5.2211980558798565e-05, "epoch": 0.4945655203165933, "percentage": 49.46, "elapsed_time": "20:59:54", "remaining_time": "21:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8874, "total_steps": 17941, "loss": 1.6931, "learning_rate": 5.220308500516401e-05, "epoch": 0.4946212585697564, "percentage": 49.46, "elapsed_time": "21:00:02", "remaining_time": "21:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8875, "total_steps": 17941, "loss": 1.6718, "learning_rate": 5.219418938166044e-05, "epoch": 0.49467699682291955, "percentage": 49.47, "elapsed_time": "21:00:10", "remaining_time": "21:27:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8876, "total_steps": 17941, "loss": 1.6968, "learning_rate": 5.218529368856997e-05, "epoch": 0.49473273507608273, "percentage": 49.47, "elapsed_time": "21:00:19", "remaining_time": "21:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8877, "total_steps": 17941, "loss": 1.5859, "learning_rate": 5.217639792617475e-05, "epoch": 0.49478847332924586, "percentage": 49.48, "elapsed_time": "21:00:27", "remaining_time": "21:27:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8878, "total_steps": 17941, "loss": 1.7858, "learning_rate": 5.216750209475685e-05, "epoch": 0.494844211582409, "percentage": 49.48, "elapsed_time": "21:00:36", "remaining_time": "21:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8879, "total_steps": 17941, "loss": 1.4827, "learning_rate": 5.2158606194598436e-05, "epoch": 0.4948999498355722, "percentage": 49.49, "elapsed_time": "21:00:45", "remaining_time": "21:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8880, "total_steps": 17941, "loss": 1.7799, "learning_rate": 5.214971022598162e-05, "epoch": 0.4949556880887353, "percentage": 49.5, "elapsed_time": "21:00:53", "remaining_time": "21:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8881, "total_steps": 17941, "loss": 1.6708, "learning_rate": 5.2140814189188514e-05, "epoch": 0.49501142634189843, "percentage": 49.5, "elapsed_time": "21:01:01", "remaining_time": "21:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8882, "total_steps": 17941, "loss": 1.6558, "learning_rate": 5.213191808450127e-05, "epoch": 0.4950671645950616, "percentage": 49.51, "elapsed_time": "21:01:10", "remaining_time": "21:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8883, "total_steps": 17941, "loss": 1.5644, "learning_rate": 5.212302191220203e-05, "epoch": 0.49512290284822474, "percentage": 49.51, "elapsed_time": "21:01:18", "remaining_time": "21:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8884, "total_steps": 17941, "loss": 1.7236, "learning_rate": 5.21141256725729e-05, "epoch": 0.4951786411013879, "percentage": 49.52, "elapsed_time": "21:01:27", "remaining_time": "21:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8885, "total_steps": 17941, "loss": 1.5429, "learning_rate": 5.210522936589604e-05, "epoch": 0.495234379354551, "percentage": 49.52, "elapsed_time": "21:01:36", "remaining_time": "21:25:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8886, "total_steps": 17941, "loss": 1.7254, "learning_rate": 5.209633299245357e-05, "epoch": 0.4952901176077142, "percentage": 49.53, "elapsed_time": "21:01:44", "remaining_time": "21:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8887, "total_steps": 17941, "loss": 1.4012, "learning_rate": 5.208743655252763e-05, "epoch": 0.4953458558608773, "percentage": 49.53, "elapsed_time": "21:01:53", "remaining_time": "21:25:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8888, "total_steps": 17941, "loss": 1.7249, "learning_rate": 5.207854004640038e-05, "epoch": 0.49540159411404044, "percentage": 49.54, "elapsed_time": "21:02:01", "remaining_time": "21:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8889, "total_steps": 17941, "loss": 1.6312, "learning_rate": 5.206964347435396e-05, "epoch": 0.49545733236720363, "percentage": 49.55, "elapsed_time": "21:02:10", "remaining_time": "21:25:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8890, "total_steps": 17941, "loss": 1.7241, "learning_rate": 5.206074683667053e-05, "epoch": 0.49551307062036676, "percentage": 49.55, "elapsed_time": "21:02:18", "remaining_time": "21:25:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8891, "total_steps": 17941, "loss": 1.6946, "learning_rate": 5.2051850133632206e-05, "epoch": 0.4955688088735299, "percentage": 49.56, "elapsed_time": "21:02:27", "remaining_time": "21:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8892, "total_steps": 17941, "loss": 1.503, "learning_rate": 5.204295336552117e-05, "epoch": 0.49562454712669307, "percentage": 49.56, "elapsed_time": "21:02:35", "remaining_time": "21:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8893, "total_steps": 17941, "loss": 1.5574, "learning_rate": 5.203405653261956e-05, "epoch": 0.4956802853798562, "percentage": 49.57, "elapsed_time": "21:02:44", "remaining_time": "21:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8894, "total_steps": 17941, "loss": 1.85, "learning_rate": 5.202515963520953e-05, "epoch": 0.49573602363301933, "percentage": 49.57, "elapsed_time": "21:02:52", "remaining_time": "21:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8895, "total_steps": 17941, "loss": 1.3931, "learning_rate": 5.2016262673573246e-05, "epoch": 0.4957917618861825, "percentage": 49.58, "elapsed_time": "21:03:01", "remaining_time": "21:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8896, "total_steps": 17941, "loss": 1.7307, "learning_rate": 5.200736564799288e-05, "epoch": 0.49584750013934564, "percentage": 49.58, "elapsed_time": "21:03:10", "remaining_time": "21:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8897, "total_steps": 17941, "loss": 1.4952, "learning_rate": 5.199846855875057e-05, "epoch": 0.49590323839250877, "percentage": 49.59, "elapsed_time": "21:03:18", "remaining_time": "21:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8898, "total_steps": 17941, "loss": 1.5023, "learning_rate": 5.19895714061285e-05, "epoch": 0.4959589766456719, "percentage": 49.6, "elapsed_time": "21:03:27", "remaining_time": "21:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8899, "total_steps": 17941, "loss": 1.7862, "learning_rate": 5.198067419040881e-05, "epoch": 0.4960147148988351, "percentage": 49.6, "elapsed_time": "21:03:35", "remaining_time": "21:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8900, "total_steps": 17941, "loss": 1.6099, "learning_rate": 5.197177691187368e-05, "epoch": 0.4960704531519982, "percentage": 49.61, "elapsed_time": "21:03:44", "remaining_time": "21:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8901, "total_steps": 17941, "loss": 1.5929, "learning_rate": 5.196287957080529e-05, "epoch": 0.49612619140516134, "percentage": 49.61, "elapsed_time": "21:03:53", "remaining_time": "21:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8902, "total_steps": 17941, "loss": 1.5723, "learning_rate": 5.195398216748579e-05, "epoch": 0.4961819296583245, "percentage": 49.62, "elapsed_time": "21:04:01", "remaining_time": "21:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8903, "total_steps": 17941, "loss": 1.6633, "learning_rate": 5.194508470219739e-05, "epoch": 0.49623766791148766, "percentage": 49.62, "elapsed_time": "21:04:09", "remaining_time": "21:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8904, "total_steps": 17941, "loss": 1.6933, "learning_rate": 5.193618717522224e-05, "epoch": 0.4962934061646508, "percentage": 49.63, "elapsed_time": "21:04:18", "remaining_time": "21:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8905, "total_steps": 17941, "loss": 1.8085, "learning_rate": 5.192728958684252e-05, "epoch": 0.49634914441781397, "percentage": 49.63, "elapsed_time": "21:04:26", "remaining_time": "21:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8906, "total_steps": 17941, "loss": 1.6682, "learning_rate": 5.1918391937340405e-05, "epoch": 0.4964048826709771, "percentage": 49.64, "elapsed_time": "21:04:35", "remaining_time": "21:22:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8907, "total_steps": 17941, "loss": 1.7887, "learning_rate": 5.190949422699808e-05, "epoch": 0.49646062092414023, "percentage": 49.65, "elapsed_time": "21:04:43", "remaining_time": "21:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8908, "total_steps": 17941, "loss": 1.6192, "learning_rate": 5.1900596456097736e-05, "epoch": 0.49651635917730336, "percentage": 49.65, "elapsed_time": "21:04:52", "remaining_time": "21:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8909, "total_steps": 17941, "loss": 1.482, "learning_rate": 5.189169862492156e-05, "epoch": 0.49657209743046654, "percentage": 49.66, "elapsed_time": "21:05:00", "remaining_time": "21:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8910, "total_steps": 17941, "loss": 1.5428, "learning_rate": 5.188280073375173e-05, "epoch": 0.49662783568362967, "percentage": 49.66, "elapsed_time": "21:05:08", "remaining_time": "21:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8911, "total_steps": 17941, "loss": 1.751, "learning_rate": 5.187390278287043e-05, "epoch": 0.4966835739367928, "percentage": 49.67, "elapsed_time": "21:05:17", "remaining_time": "21:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8912, "total_steps": 17941, "loss": 1.6317, "learning_rate": 5.1865004772559876e-05, "epoch": 0.496739312189956, "percentage": 49.67, "elapsed_time": "21:05:25", "remaining_time": "21:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8913, "total_steps": 17941, "loss": 1.382, "learning_rate": 5.1856106703102225e-05, "epoch": 0.4967950504431191, "percentage": 49.68, "elapsed_time": "21:05:34", "remaining_time": "21:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8914, "total_steps": 17941, "loss": 1.6059, "learning_rate": 5.18472085747797e-05, "epoch": 0.49685078869628224, "percentage": 49.69, "elapsed_time": "21:05:42", "remaining_time": "21:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8915, "total_steps": 17941, "loss": 1.7905, "learning_rate": 5.183831038787449e-05, "epoch": 0.4969065269494454, "percentage": 49.69, "elapsed_time": "21:05:51", "remaining_time": "21:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8916, "total_steps": 17941, "loss": 1.7827, "learning_rate": 5.18294121426688e-05, "epoch": 0.49696226520260856, "percentage": 49.7, "elapsed_time": "21:05:59", "remaining_time": "21:21:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8917, "total_steps": 17941, "loss": 1.5225, "learning_rate": 5.1820513839444804e-05, "epoch": 0.4970180034557717, "percentage": 49.7, "elapsed_time": "21:06:08", "remaining_time": "21:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8918, "total_steps": 17941, "loss": 1.584, "learning_rate": 5.181161547848474e-05, "epoch": 0.49707374170893487, "percentage": 49.71, "elapsed_time": "21:06:16", "remaining_time": "21:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8919, "total_steps": 17941, "loss": 1.7048, "learning_rate": 5.1802717060070795e-05, "epoch": 0.497129479962098, "percentage": 49.71, "elapsed_time": "21:06:25", "remaining_time": "21:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8920, "total_steps": 17941, "loss": 1.7254, "learning_rate": 5.1793818584485166e-05, "epoch": 0.4971852182152611, "percentage": 49.72, "elapsed_time": "21:06:33", "remaining_time": "21:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8921, "total_steps": 17941, "loss": 1.4276, "learning_rate": 5.178492005201007e-05, "epoch": 0.49724095646842426, "percentage": 49.72, "elapsed_time": "21:06:42", "remaining_time": "21:20:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8922, "total_steps": 17941, "loss": 1.7886, "learning_rate": 5.177602146292773e-05, "epoch": 0.49729669472158744, "percentage": 49.73, "elapsed_time": "21:06:50", "remaining_time": "21:20:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8923, "total_steps": 17941, "loss": 1.5135, "learning_rate": 5.176712281752033e-05, "epoch": 0.49735243297475057, "percentage": 49.74, "elapsed_time": "21:06:59", "remaining_time": "21:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8924, "total_steps": 17941, "loss": 1.284, "learning_rate": 5.17582241160701e-05, "epoch": 0.4974081712279137, "percentage": 49.74, "elapsed_time": "21:07:07", "remaining_time": "21:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8925, "total_steps": 17941, "loss": 1.5666, "learning_rate": 5.1749325358859255e-05, "epoch": 0.4974639094810769, "percentage": 49.75, "elapsed_time": "21:07:16", "remaining_time": "21:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8926, "total_steps": 17941, "loss": 1.7793, "learning_rate": 5.1740426546170003e-05, "epoch": 0.49751964773424, "percentage": 49.75, "elapsed_time": "21:07:24", "remaining_time": "21:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8927, "total_steps": 17941, "loss": 1.7579, "learning_rate": 5.1731527678284575e-05, "epoch": 0.49757538598740314, "percentage": 49.76, "elapsed_time": "21:07:33", "remaining_time": "21:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8928, "total_steps": 17941, "loss": 1.691, "learning_rate": 5.172262875548518e-05, "epoch": 0.4976311242405663, "percentage": 49.76, "elapsed_time": "21:07:41", "remaining_time": "21:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8929, "total_steps": 17941, "loss": 1.5507, "learning_rate": 5.171372977805405e-05, "epoch": 0.49768686249372945, "percentage": 49.77, "elapsed_time": "21:07:49", "remaining_time": "21:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8930, "total_steps": 17941, "loss": 1.8044, "learning_rate": 5.17048307462734e-05, "epoch": 0.4977426007468926, "percentage": 49.77, "elapsed_time": "21:07:58", "remaining_time": "21:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8931, "total_steps": 17941, "loss": 1.6068, "learning_rate": 5.169593166042547e-05, "epoch": 0.4977983390000557, "percentage": 49.78, "elapsed_time": "21:08:06", "remaining_time": "21:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8932, "total_steps": 17941, "loss": 1.6587, "learning_rate": 5.1687032520792464e-05, "epoch": 0.4978540772532189, "percentage": 49.79, "elapsed_time": "21:08:15", "remaining_time": "21:19:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8933, "total_steps": 17941, "loss": 1.7269, "learning_rate": 5.1678133327656616e-05, "epoch": 0.497909815506382, "percentage": 49.79, "elapsed_time": "21:08:23", "remaining_time": "21:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8934, "total_steps": 17941, "loss": 1.7147, "learning_rate": 5.166923408130016e-05, "epoch": 0.49796555375954515, "percentage": 49.8, "elapsed_time": "21:08:32", "remaining_time": "21:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8935, "total_steps": 17941, "loss": 1.5815, "learning_rate": 5.166033478200536e-05, "epoch": 0.49802129201270834, "percentage": 49.8, "elapsed_time": "21:08:40", "remaining_time": "21:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8936, "total_steps": 17941, "loss": 1.7004, "learning_rate": 5.1651435430054396e-05, "epoch": 0.49807703026587147, "percentage": 49.81, "elapsed_time": "21:08:49", "remaining_time": "21:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8937, "total_steps": 17941, "loss": 1.5522, "learning_rate": 5.164253602572954e-05, "epoch": 0.4981327685190346, "percentage": 49.81, "elapsed_time": "21:08:57", "remaining_time": "21:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8938, "total_steps": 17941, "loss": 1.6626, "learning_rate": 5.1633636569313014e-05, "epoch": 0.4981885067721978, "percentage": 49.82, "elapsed_time": "21:09:05", "remaining_time": "21:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8939, "total_steps": 17941, "loss": 1.5598, "learning_rate": 5.1624737061087056e-05, "epoch": 0.4982442450253609, "percentage": 49.82, "elapsed_time": "21:09:14", "remaining_time": "21:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8940, "total_steps": 17941, "loss": 1.6661, "learning_rate": 5.161583750133392e-05, "epoch": 0.49829998327852404, "percentage": 49.83, "elapsed_time": "21:09:23", "remaining_time": "21:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8941, "total_steps": 17941, "loss": 1.3436, "learning_rate": 5.160693789033583e-05, "epoch": 0.4983557215316872, "percentage": 49.84, "elapsed_time": "21:09:32", "remaining_time": "21:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8942, "total_steps": 17941, "loss": 1.5994, "learning_rate": 5.159803822837506e-05, "epoch": 0.49841145978485035, "percentage": 49.84, "elapsed_time": "21:09:40", "remaining_time": "21:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8943, "total_steps": 17941, "loss": 1.8826, "learning_rate": 5.1589138515733805e-05, "epoch": 0.4984671980380135, "percentage": 49.85, "elapsed_time": "21:09:49", "remaining_time": "21:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8944, "total_steps": 17941, "loss": 1.465, "learning_rate": 5.158023875269436e-05, "epoch": 0.4985229362911766, "percentage": 49.85, "elapsed_time": "21:09:57", "remaining_time": "21:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8945, "total_steps": 17941, "loss": 1.624, "learning_rate": 5.157133893953895e-05, "epoch": 0.4985786745443398, "percentage": 49.86, "elapsed_time": "21:10:05", "remaining_time": "21:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8946, "total_steps": 17941, "loss": 1.6433, "learning_rate": 5.156243907654983e-05, "epoch": 0.4986344127975029, "percentage": 49.86, "elapsed_time": "21:10:14", "remaining_time": "21:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8947, "total_steps": 17941, "loss": 1.7598, "learning_rate": 5.155353916400925e-05, "epoch": 0.49869015105066605, "percentage": 49.87, "elapsed_time": "21:10:22", "remaining_time": "21:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8948, "total_steps": 17941, "loss": 1.7002, "learning_rate": 5.154463920219947e-05, "epoch": 0.49874588930382924, "percentage": 49.87, "elapsed_time": "21:10:31", "remaining_time": "21:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8949, "total_steps": 17941, "loss": 1.5513, "learning_rate": 5.153573919140274e-05, "epoch": 0.49880162755699237, "percentage": 49.88, "elapsed_time": "21:10:39", "remaining_time": "21:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8950, "total_steps": 17941, "loss": 1.8855, "learning_rate": 5.1526839131901315e-05, "epoch": 0.4988573658101555, "percentage": 49.89, "elapsed_time": "21:10:48", "remaining_time": "21:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8951, "total_steps": 17941, "loss": 1.591, "learning_rate": 5.151793902397747e-05, "epoch": 0.4989131040633187, "percentage": 49.89, "elapsed_time": "21:10:56", "remaining_time": "21:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8952, "total_steps": 17941, "loss": 1.54, "learning_rate": 5.150903886791343e-05, "epoch": 0.4989688423164818, "percentage": 49.9, "elapsed_time": "21:11:04", "remaining_time": "21:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8953, "total_steps": 17941, "loss": 1.417, "learning_rate": 5.150013866399147e-05, "epoch": 0.49902458056964494, "percentage": 49.9, "elapsed_time": "21:11:13", "remaining_time": "21:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8954, "total_steps": 17941, "loss": 1.5283, "learning_rate": 5.149123841249387e-05, "epoch": 0.49908031882280807, "percentage": 49.91, "elapsed_time": "21:11:21", "remaining_time": "21:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8955, "total_steps": 17941, "loss": 1.9128, "learning_rate": 5.148233811370289e-05, "epoch": 0.49913605707597125, "percentage": 49.91, "elapsed_time": "21:11:30", "remaining_time": "21:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8956, "total_steps": 17941, "loss": 1.5466, "learning_rate": 5.1473437767900766e-05, "epoch": 0.4991917953291344, "percentage": 49.92, "elapsed_time": "21:11:39", "remaining_time": "21:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8957, "total_steps": 17941, "loss": 1.7227, "learning_rate": 5.1464537375369816e-05, "epoch": 0.4992475335822975, "percentage": 49.92, "elapsed_time": "21:11:48", "remaining_time": "21:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8958, "total_steps": 17941, "loss": 1.5488, "learning_rate": 5.145563693639226e-05, "epoch": 0.4993032718354607, "percentage": 49.93, "elapsed_time": "21:11:56", "remaining_time": "21:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8959, "total_steps": 17941, "loss": 1.6493, "learning_rate": 5.144673645125039e-05, "epoch": 0.4993590100886238, "percentage": 49.94, "elapsed_time": "21:12:05", "remaining_time": "21:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8960, "total_steps": 17941, "loss": 1.6502, "learning_rate": 5.143783592022646e-05, "epoch": 0.49941474834178695, "percentage": 49.94, "elapsed_time": "21:12:13", "remaining_time": "21:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8961, "total_steps": 17941, "loss": 1.389, "learning_rate": 5.142893534360278e-05, "epoch": 0.49947048659495014, "percentage": 49.95, "elapsed_time": "21:12:22", "remaining_time": "21:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8962, "total_steps": 17941, "loss": 1.882, "learning_rate": 5.1420034721661594e-05, "epoch": 0.49952622484811326, "percentage": 49.95, "elapsed_time": "21:12:30", "remaining_time": "21:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8963, "total_steps": 17941, "loss": 1.6304, "learning_rate": 5.1411134054685185e-05, "epoch": 0.4995819631012764, "percentage": 49.96, "elapsed_time": "21:12:39", "remaining_time": "21:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8964, "total_steps": 17941, "loss": 1.7474, "learning_rate": 5.140223334295584e-05, "epoch": 0.4996377013544396, "percentage": 49.96, "elapsed_time": "21:12:47", "remaining_time": "21:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8965, "total_steps": 17941, "loss": 1.7623, "learning_rate": 5.139333258675582e-05, "epoch": 0.4996934396076027, "percentage": 49.97, "elapsed_time": "21:12:56", "remaining_time": "21:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8966, "total_steps": 17941, "loss": 1.5633, "learning_rate": 5.138443178636742e-05, "epoch": 0.49974917786076584, "percentage": 49.97, "elapsed_time": "21:13:04", "remaining_time": "21:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8967, "total_steps": 17941, "loss": 1.6215, "learning_rate": 5.13755309420729e-05, "epoch": 0.49980491611392897, "percentage": 49.98, "elapsed_time": "21:13:13", "remaining_time": "21:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8968, "total_steps": 17941, "loss": 1.6782, "learning_rate": 5.1366630054154576e-05, "epoch": 0.49986065436709215, "percentage": 49.99, "elapsed_time": "21:13:21", "remaining_time": "21:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8969, "total_steps": 17941, "loss": 1.7972, "learning_rate": 5.1357729122894706e-05, "epoch": 0.4999163926202553, "percentage": 49.99, "elapsed_time": "21:13:30", "remaining_time": "21:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8970, "total_steps": 17941, "loss": 1.5217, "learning_rate": 5.134882814857559e-05, "epoch": 0.4999721308734184, "percentage": 50.0, "elapsed_time": "21:13:38", "remaining_time": "21:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8971, "total_steps": 17941, "loss": 1.7474, "learning_rate": 5.1339927131479503e-05, "epoch": 0.5000278691265816, "percentage": 50.0, "elapsed_time": "21:13:47", "remaining_time": "21:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8972, "total_steps": 17941, "loss": 1.7703, "learning_rate": 5.133102607188874e-05, "epoch": 0.5000836073797447, "percentage": 50.01, "elapsed_time": "21:13:55", "remaining_time": "21:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8973, "total_steps": 17941, "loss": 1.6809, "learning_rate": 5.132212497008559e-05, "epoch": 0.5001393456329079, "percentage": 50.01, "elapsed_time": "21:14:04", "remaining_time": "21:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8974, "total_steps": 17941, "loss": 1.6982, "learning_rate": 5.1313223826352365e-05, "epoch": 0.500195083886071, "percentage": 50.02, "elapsed_time": "21:14:12", "remaining_time": "21:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8975, "total_steps": 17941, "loss": 1.5646, "learning_rate": 5.1304322640971315e-05, "epoch": 0.5002508221392341, "percentage": 50.03, "elapsed_time": "21:14:20", "remaining_time": "21:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8976, "total_steps": 17941, "loss": 1.6019, "learning_rate": 5.1295421414224754e-05, "epoch": 0.5003065603923973, "percentage": 50.03, "elapsed_time": "21:14:29", "remaining_time": "21:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8977, "total_steps": 17941, "loss": 1.6455, "learning_rate": 5.128652014639499e-05, "epoch": 0.5003622986455605, "percentage": 50.04, "elapsed_time": "21:14:37", "remaining_time": "21:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8978, "total_steps": 17941, "loss": 1.5586, "learning_rate": 5.1277618837764294e-05, "epoch": 0.5004180368987236, "percentage": 50.04, "elapsed_time": "21:14:46", "remaining_time": "21:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8979, "total_steps": 17941, "loss": 1.8271, "learning_rate": 5.126871748861499e-05, "epoch": 0.5004737751518867, "percentage": 50.05, "elapsed_time": "21:14:54", "remaining_time": "21:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8980, "total_steps": 17941, "loss": 1.7673, "learning_rate": 5.125981609922935e-05, "epoch": 0.5005295134050499, "percentage": 50.05, "elapsed_time": "21:15:03", "remaining_time": "21:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8981, "total_steps": 17941, "loss": 1.5127, "learning_rate": 5.1250914669889714e-05, "epoch": 0.500585251658213, "percentage": 50.06, "elapsed_time": "21:15:12", "remaining_time": "21:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8982, "total_steps": 17941, "loss": 1.7471, "learning_rate": 5.124201320087833e-05, "epoch": 0.5006409899113762, "percentage": 50.06, "elapsed_time": "21:15:21", "remaining_time": "21:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8983, "total_steps": 17941, "loss": 1.6188, "learning_rate": 5.1233111692477555e-05, "epoch": 0.5006967281645394, "percentage": 50.07, "elapsed_time": "21:15:29", "remaining_time": "21:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8984, "total_steps": 17941, "loss": 1.6802, "learning_rate": 5.122421014496965e-05, "epoch": 0.5007524664177024, "percentage": 50.08, "elapsed_time": "21:15:37", "remaining_time": "21:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8985, "total_steps": 17941, "loss": 1.5793, "learning_rate": 5.1215308558636944e-05, "epoch": 0.5008082046708656, "percentage": 50.08, "elapsed_time": "21:15:46", "remaining_time": "21:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8986, "total_steps": 17941, "loss": 1.3947, "learning_rate": 5.1206406933761716e-05, "epoch": 0.5008639429240288, "percentage": 50.09, "elapsed_time": "21:15:55", "remaining_time": "21:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8987, "total_steps": 17941, "loss": 1.9244, "learning_rate": 5.119750527062632e-05, "epoch": 0.5009196811771919, "percentage": 50.09, "elapsed_time": "21:16:03", "remaining_time": "21:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8988, "total_steps": 17941, "loss": 1.6002, "learning_rate": 5.1188603569513025e-05, "epoch": 0.5009754194303551, "percentage": 50.1, "elapsed_time": "21:16:12", "remaining_time": "21:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8989, "total_steps": 17941, "loss": 1.8124, "learning_rate": 5.117970183070416e-05, "epoch": 0.5010311576835182, "percentage": 50.1, "elapsed_time": "21:16:20", "remaining_time": "21:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8990, "total_steps": 17941, "loss": 1.6561, "learning_rate": 5.1170800054482035e-05, "epoch": 0.5010868959366813, "percentage": 50.11, "elapsed_time": "21:16:29", "remaining_time": "21:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8991, "total_steps": 17941, "loss": 1.7734, "learning_rate": 5.116189824112896e-05, "epoch": 0.5011426341898445, "percentage": 50.11, "elapsed_time": "21:16:37", "remaining_time": "21:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8992, "total_steps": 17941, "loss": 1.4226, "learning_rate": 5.115299639092723e-05, "epoch": 0.5011983724430077, "percentage": 50.12, "elapsed_time": "21:16:46", "remaining_time": "21:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8993, "total_steps": 17941, "loss": 1.4967, "learning_rate": 5.114409450415919e-05, "epoch": 0.5012541106961708, "percentage": 50.13, "elapsed_time": "21:16:55", "remaining_time": "21:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8994, "total_steps": 17941, "loss": 1.6527, "learning_rate": 5.113519258110715e-05, "epoch": 0.501309848949334, "percentage": 50.13, "elapsed_time": "21:17:03", "remaining_time": "21:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8995, "total_steps": 17941, "loss": 1.7632, "learning_rate": 5.1126290622053405e-05, "epoch": 0.501365587202497, "percentage": 50.14, "elapsed_time": "21:17:11", "remaining_time": "21:10:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8996, "total_steps": 17941, "loss": 1.5339, "learning_rate": 5.1117388627280305e-05, "epoch": 0.5014213254556602, "percentage": 50.14, "elapsed_time": "21:17:20", "remaining_time": "21:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8997, "total_steps": 17941, "loss": 1.6767, "learning_rate": 5.1108486597070125e-05, "epoch": 0.5014770637088234, "percentage": 50.15, "elapsed_time": "21:17:28", "remaining_time": "21:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8998, "total_steps": 17941, "loss": 1.7141, "learning_rate": 5.109958453170524e-05, "epoch": 0.5015328019619865, "percentage": 50.15, "elapsed_time": "21:17:37", "remaining_time": "21:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8999, "total_steps": 17941, "loss": 1.393, "learning_rate": 5.109068243146793e-05, "epoch": 0.5015885402151496, "percentage": 50.16, "elapsed_time": "21:17:45", "remaining_time": "21:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9000, "total_steps": 17941, "loss": 1.8804, "learning_rate": 5.1081780296640535e-05, "epoch": 0.5016442784683128, "percentage": 50.16, "elapsed_time": "21:17:54", "remaining_time": "21:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9001, "total_steps": 17941, "loss": 1.6947, "learning_rate": 5.107287812750538e-05, "epoch": 0.5017000167214759, "percentage": 50.17, "elapsed_time": "21:18:03", "remaining_time": "21:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9002, "total_steps": 17941, "loss": 1.6008, "learning_rate": 5.106397592434478e-05, "epoch": 0.5017557549746391, "percentage": 50.18, "elapsed_time": "21:18:12", "remaining_time": "21:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9003, "total_steps": 17941, "loss": 1.6802, "learning_rate": 5.105507368744108e-05, "epoch": 0.5018114932278023, "percentage": 50.18, "elapsed_time": "21:18:20", "remaining_time": "21:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9004, "total_steps": 17941, "loss": 1.653, "learning_rate": 5.1046171417076584e-05, "epoch": 0.5018672314809653, "percentage": 50.19, "elapsed_time": "21:18:29", "remaining_time": "21:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9005, "total_steps": 17941, "loss": 1.7098, "learning_rate": 5.103726911353363e-05, "epoch": 0.5019229697341285, "percentage": 50.19, "elapsed_time": "21:18:38", "remaining_time": "21:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9006, "total_steps": 17941, "loss": 1.9008, "learning_rate": 5.1028366777094536e-05, "epoch": 0.5019787079872917, "percentage": 50.2, "elapsed_time": "21:18:46", "remaining_time": "21:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9007, "total_steps": 17941, "loss": 1.4168, "learning_rate": 5.101946440804166e-05, "epoch": 0.5020344462404548, "percentage": 50.2, "elapsed_time": "21:18:55", "remaining_time": "21:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9008, "total_steps": 17941, "loss": 1.7717, "learning_rate": 5.101056200665731e-05, "epoch": 0.502090184493618, "percentage": 50.21, "elapsed_time": "21:19:03", "remaining_time": "21:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9009, "total_steps": 17941, "loss": 1.4358, "learning_rate": 5.100165957322384e-05, "epoch": 0.5021459227467812, "percentage": 50.21, "elapsed_time": "21:19:12", "remaining_time": "21:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9010, "total_steps": 17941, "loss": 1.7202, "learning_rate": 5.099275710802355e-05, "epoch": 0.5022016609999442, "percentage": 50.22, "elapsed_time": "21:19:20", "remaining_time": "21:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9011, "total_steps": 17941, "loss": 1.8804, "learning_rate": 5.09838546113388e-05, "epoch": 0.5022573992531074, "percentage": 50.23, "elapsed_time": "21:19:29", "remaining_time": "21:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9012, "total_steps": 17941, "loss": 1.7409, "learning_rate": 5.097495208345191e-05, "epoch": 0.5023131375062706, "percentage": 50.23, "elapsed_time": "21:19:38", "remaining_time": "21:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9013, "total_steps": 17941, "loss": 1.6353, "learning_rate": 5.096604952464524e-05, "epoch": 0.5023688757594337, "percentage": 50.24, "elapsed_time": "21:19:46", "remaining_time": "21:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9014, "total_steps": 17941, "loss": 1.8436, "learning_rate": 5.095714693520111e-05, "epoch": 0.5024246140125969, "percentage": 50.24, "elapsed_time": "21:19:55", "remaining_time": "21:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9015, "total_steps": 17941, "loss": 1.5617, "learning_rate": 5.094824431540184e-05, "epoch": 0.50248035226576, "percentage": 50.25, "elapsed_time": "21:20:03", "remaining_time": "21:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9016, "total_steps": 17941, "loss": 1.7339, "learning_rate": 5.093934166552981e-05, "epoch": 0.5025360905189231, "percentage": 50.25, "elapsed_time": "21:20:12", "remaining_time": "21:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9017, "total_steps": 17941, "loss": 1.892, "learning_rate": 5.0930438985867326e-05, "epoch": 0.5025918287720863, "percentage": 50.26, "elapsed_time": "21:20:21", "remaining_time": "21:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9018, "total_steps": 17941, "loss": 1.6645, "learning_rate": 5.0921536276696745e-05, "epoch": 0.5026475670252494, "percentage": 50.26, "elapsed_time": "21:20:30", "remaining_time": "21:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9019, "total_steps": 17941, "loss": 1.8816, "learning_rate": 5.09126335383004e-05, "epoch": 0.5027033052784126, "percentage": 50.27, "elapsed_time": "21:20:39", "remaining_time": "21:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9020, "total_steps": 17941, "loss": 1.8134, "learning_rate": 5.090373077096067e-05, "epoch": 0.5027590435315757, "percentage": 50.28, "elapsed_time": "21:20:47", "remaining_time": "21:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9021, "total_steps": 17941, "loss": 1.625, "learning_rate": 5.089482797495984e-05, "epoch": 0.5028147817847388, "percentage": 50.28, "elapsed_time": "21:20:56", "remaining_time": "21:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9022, "total_steps": 17941, "loss": 1.8258, "learning_rate": 5.0885925150580295e-05, "epoch": 0.502870520037902, "percentage": 50.29, "elapsed_time": "21:21:04", "remaining_time": "21:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9023, "total_steps": 17941, "loss": 1.5994, "learning_rate": 5.0877022298104356e-05, "epoch": 0.5029262582910652, "percentage": 50.29, "elapsed_time": "21:21:12", "remaining_time": "21:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9024, "total_steps": 17941, "loss": 1.4209, "learning_rate": 5.08681194178144e-05, "epoch": 0.5029819965442283, "percentage": 50.3, "elapsed_time": "21:21:21", "remaining_time": "21:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9025, "total_steps": 17941, "loss": 2.1234, "learning_rate": 5.0859216509992743e-05, "epoch": 0.5030377347973914, "percentage": 50.3, "elapsed_time": "21:21:30", "remaining_time": "21:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9026, "total_steps": 17941, "loss": 1.6014, "learning_rate": 5.085031357492177e-05, "epoch": 0.5030934730505546, "percentage": 50.31, "elapsed_time": "21:21:38", "remaining_time": "21:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9027, "total_steps": 17941, "loss": 1.6218, "learning_rate": 5.0841410612883786e-05, "epoch": 0.5031492113037177, "percentage": 50.31, "elapsed_time": "21:21:47", "remaining_time": "21:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9028, "total_steps": 17941, "loss": 1.4808, "learning_rate": 5.083250762416116e-05, "epoch": 0.5032049495568809, "percentage": 50.32, "elapsed_time": "21:21:55", "remaining_time": "21:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9029, "total_steps": 17941, "loss": 1.7044, "learning_rate": 5.082360460903627e-05, "epoch": 0.5032606878100441, "percentage": 50.33, "elapsed_time": "21:22:04", "remaining_time": "21:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9030, "total_steps": 17941, "loss": 1.923, "learning_rate": 5.0814701567791436e-05, "epoch": 0.5033164260632071, "percentage": 50.33, "elapsed_time": "21:22:12", "remaining_time": "21:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9031, "total_steps": 17941, "loss": 1.888, "learning_rate": 5.0805798500709e-05, "epoch": 0.5033721643163703, "percentage": 50.34, "elapsed_time": "21:22:21", "remaining_time": "21:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9032, "total_steps": 17941, "loss": 1.7227, "learning_rate": 5.0796895408071344e-05, "epoch": 0.5034279025695335, "percentage": 50.34, "elapsed_time": "21:22:29", "remaining_time": "21:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9033, "total_steps": 17941, "loss": 1.7073, "learning_rate": 5.0787992290160827e-05, "epoch": 0.5034836408226966, "percentage": 50.35, "elapsed_time": "21:22:38", "remaining_time": "21:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9034, "total_steps": 17941, "loss": 1.6084, "learning_rate": 5.0779089147259774e-05, "epoch": 0.5035393790758598, "percentage": 50.35, "elapsed_time": "21:22:46", "remaining_time": "21:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9035, "total_steps": 17941, "loss": 1.6793, "learning_rate": 5.077018597965056e-05, "epoch": 0.503595117329023, "percentage": 50.36, "elapsed_time": "21:22:54", "remaining_time": "21:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9036, "total_steps": 17941, "loss": 1.6211, "learning_rate": 5.076128278761554e-05, "epoch": 0.503650855582186, "percentage": 50.37, "elapsed_time": "21:23:03", "remaining_time": "21:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9037, "total_steps": 17941, "loss": 1.5416, "learning_rate": 5.075237957143706e-05, "epoch": 0.5037065938353492, "percentage": 50.37, "elapsed_time": "21:23:12", "remaining_time": "21:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9038, "total_steps": 17941, "loss": 1.7137, "learning_rate": 5.0743476331397474e-05, "epoch": 0.5037623320885124, "percentage": 50.38, "elapsed_time": "21:23:20", "remaining_time": "21:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9039, "total_steps": 17941, "loss": 1.2725, "learning_rate": 5.073457306777919e-05, "epoch": 0.5038180703416755, "percentage": 50.38, "elapsed_time": "21:23:28", "remaining_time": "21:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9040, "total_steps": 17941, "loss": 1.7186, "learning_rate": 5.0725669780864505e-05, "epoch": 0.5038738085948387, "percentage": 50.39, "elapsed_time": "21:23:37", "remaining_time": "21:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9041, "total_steps": 17941, "loss": 1.5712, "learning_rate": 5.0716766470935806e-05, "epoch": 0.5039295468480017, "percentage": 50.39, "elapsed_time": "21:23:45", "remaining_time": "21:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9042, "total_steps": 17941, "loss": 1.4333, "learning_rate": 5.070786313827547e-05, "epoch": 0.5039852851011649, "percentage": 50.4, "elapsed_time": "21:23:54", "remaining_time": "21:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9043, "total_steps": 17941, "loss": 1.7388, "learning_rate": 5.069895978316582e-05, "epoch": 0.5040410233543281, "percentage": 50.4, "elapsed_time": "21:24:02", "remaining_time": "21:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9044, "total_steps": 17941, "loss": 1.5896, "learning_rate": 5.0690056405889255e-05, "epoch": 0.5040967616074912, "percentage": 50.41, "elapsed_time": "21:24:11", "remaining_time": "21:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9045, "total_steps": 17941, "loss": 1.4889, "learning_rate": 5.068115300672812e-05, "epoch": 0.5041524998606544, "percentage": 50.42, "elapsed_time": "21:24:19", "remaining_time": "21:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9046, "total_steps": 17941, "loss": 1.6881, "learning_rate": 5.0672249585964796e-05, "epoch": 0.5042082381138175, "percentage": 50.42, "elapsed_time": "21:24:28", "remaining_time": "21:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9047, "total_steps": 17941, "loss": 1.9196, "learning_rate": 5.0663346143881617e-05, "epoch": 0.5042639763669806, "percentage": 50.43, "elapsed_time": "21:24:36", "remaining_time": "21:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9048, "total_steps": 17941, "loss": 1.8109, "learning_rate": 5.065444268076097e-05, "epoch": 0.5043197146201438, "percentage": 50.43, "elapsed_time": "21:24:45", "remaining_time": "21:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9049, "total_steps": 17941, "loss": 1.7364, "learning_rate": 5.0645539196885214e-05, "epoch": 0.504375452873307, "percentage": 50.44, "elapsed_time": "21:24:53", "remaining_time": "21:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9050, "total_steps": 17941, "loss": 1.4389, "learning_rate": 5.0636635692536724e-05, "epoch": 0.5044311911264701, "percentage": 50.44, "elapsed_time": "21:25:02", "remaining_time": "21:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9051, "total_steps": 17941, "loss": 1.5368, "learning_rate": 5.062773216799786e-05, "epoch": 0.5044869293796332, "percentage": 50.45, "elapsed_time": "21:25:11", "remaining_time": "21:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9052, "total_steps": 17941, "loss": 1.561, "learning_rate": 5.0618828623550996e-05, "epoch": 0.5045426676327964, "percentage": 50.45, "elapsed_time": "21:25:19", "remaining_time": "21:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9053, "total_steps": 17941, "loss": 1.6605, "learning_rate": 5.060992505947849e-05, "epoch": 0.5045984058859595, "percentage": 50.46, "elapsed_time": "21:25:28", "remaining_time": "21:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9054, "total_steps": 17941, "loss": 1.6417, "learning_rate": 5.0601021476062714e-05, "epoch": 0.5046541441391227, "percentage": 50.47, "elapsed_time": "21:25:36", "remaining_time": "21:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9055, "total_steps": 17941, "loss": 1.8285, "learning_rate": 5.059211787358607e-05, "epoch": 0.5047098823922859, "percentage": 50.47, "elapsed_time": "21:25:45", "remaining_time": "21:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9056, "total_steps": 17941, "loss": 1.8365, "learning_rate": 5.058321425233087e-05, "epoch": 0.5047656206454489, "percentage": 50.48, "elapsed_time": "21:25:53", "remaining_time": "21:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9057, "total_steps": 17941, "loss": 1.7859, "learning_rate": 5.0574310612579515e-05, "epoch": 0.5048213588986121, "percentage": 50.48, "elapsed_time": "21:26:02", "remaining_time": "21:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9058, "total_steps": 17941, "loss": 1.6426, "learning_rate": 5.056540695461437e-05, "epoch": 0.5048770971517753, "percentage": 50.49, "elapsed_time": "21:26:10", "remaining_time": "21:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9059, "total_steps": 17941, "loss": 1.9062, "learning_rate": 5.0556503278717836e-05, "epoch": 0.5049328354049384, "percentage": 50.49, "elapsed_time": "21:26:18", "remaining_time": "21:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9060, "total_steps": 17941, "loss": 1.7185, "learning_rate": 5.0547599585172245e-05, "epoch": 0.5049885736581016, "percentage": 50.5, "elapsed_time": "21:26:27", "remaining_time": "21:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9061, "total_steps": 17941, "loss": 1.5759, "learning_rate": 5.053869587426e-05, "epoch": 0.5050443119112648, "percentage": 50.5, "elapsed_time": "21:26:35", "remaining_time": "21:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9062, "total_steps": 17941, "loss": 1.7592, "learning_rate": 5.052979214626346e-05, "epoch": 0.5051000501644278, "percentage": 50.51, "elapsed_time": "21:26:44", "remaining_time": "21:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9063, "total_steps": 17941, "loss": 1.4266, "learning_rate": 5.0520888401464994e-05, "epoch": 0.505155788417591, "percentage": 50.52, "elapsed_time": "21:26:52", "remaining_time": "21:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9064, "total_steps": 17941, "loss": 1.852, "learning_rate": 5.051198464014698e-05, "epoch": 0.5052115266707541, "percentage": 50.52, "elapsed_time": "21:27:01", "remaining_time": "21:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9065, "total_steps": 17941, "loss": 1.6573, "learning_rate": 5.0503080862591824e-05, "epoch": 0.5052672649239173, "percentage": 50.53, "elapsed_time": "21:27:09", "remaining_time": "21:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9066, "total_steps": 17941, "loss": 1.9084, "learning_rate": 5.049417706908185e-05, "epoch": 0.5053230031770805, "percentage": 50.53, "elapsed_time": "21:27:18", "remaining_time": "21:00:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9067, "total_steps": 17941, "loss": 1.6099, "learning_rate": 5.0485273259899465e-05, "epoch": 0.5053787414302435, "percentage": 50.54, "elapsed_time": "21:27:26", "remaining_time": "21:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9068, "total_steps": 17941, "loss": 1.7669, "learning_rate": 5.0476369435327066e-05, "epoch": 0.5054344796834067, "percentage": 50.54, "elapsed_time": "21:27:35", "remaining_time": "20:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9069, "total_steps": 17941, "loss": 1.6294, "learning_rate": 5.046746559564698e-05, "epoch": 0.5054902179365699, "percentage": 50.55, "elapsed_time": "21:27:43", "remaining_time": "20:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9070, "total_steps": 17941, "loss": 1.4943, "learning_rate": 5.045856174114161e-05, "epoch": 0.505545956189733, "percentage": 50.55, "elapsed_time": "21:27:51", "remaining_time": "20:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9071, "total_steps": 17941, "loss": 1.4914, "learning_rate": 5.044965787209333e-05, "epoch": 0.5056016944428962, "percentage": 50.56, "elapsed_time": "21:28:00", "remaining_time": "20:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9072, "total_steps": 17941, "loss": 1.5848, "learning_rate": 5.044075398878456e-05, "epoch": 0.5056574326960593, "percentage": 50.57, "elapsed_time": "21:28:08", "remaining_time": "20:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9073, "total_steps": 17941, "loss": 1.8014, "learning_rate": 5.0431850091497614e-05, "epoch": 0.5057131709492224, "percentage": 50.57, "elapsed_time": "21:28:17", "remaining_time": "20:59:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9074, "total_steps": 17941, "loss": 1.5506, "learning_rate": 5.042294618051492e-05, "epoch": 0.5057689092023856, "percentage": 50.58, "elapsed_time": "21:28:25", "remaining_time": "20:59:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9075, "total_steps": 17941, "loss": 1.7151, "learning_rate": 5.041404225611882e-05, "epoch": 0.5058246474555488, "percentage": 50.58, "elapsed_time": "21:28:34", "remaining_time": "20:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9076, "total_steps": 17941, "loss": 1.6034, "learning_rate": 5.040513831859172e-05, "epoch": 0.5058803857087119, "percentage": 50.59, "elapsed_time": "21:28:43", "remaining_time": "20:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9077, "total_steps": 17941, "loss": 1.7025, "learning_rate": 5.0396234368215986e-05, "epoch": 0.505936123961875, "percentage": 50.59, "elapsed_time": "21:28:51", "remaining_time": "20:58:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9078, "total_steps": 17941, "loss": 1.6266, "learning_rate": 5.0387330405274027e-05, "epoch": 0.5059918622150382, "percentage": 50.6, "elapsed_time": "21:29:00", "remaining_time": "20:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9079, "total_steps": 17941, "loss": 1.9665, "learning_rate": 5.0378426430048185e-05, "epoch": 0.5060476004682013, "percentage": 50.6, "elapsed_time": "21:29:08", "remaining_time": "20:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9080, "total_steps": 17941, "loss": 1.7505, "learning_rate": 5.036952244282087e-05, "epoch": 0.5061033387213645, "percentage": 50.61, "elapsed_time": "21:29:16", "remaining_time": "20:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9081, "total_steps": 17941, "loss": 1.3145, "learning_rate": 5.036061844387447e-05, "epoch": 0.5061590769745277, "percentage": 50.62, "elapsed_time": "21:29:25", "remaining_time": "20:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9082, "total_steps": 17941, "loss": 1.8727, "learning_rate": 5.035171443349135e-05, "epoch": 0.5062148152276907, "percentage": 50.62, "elapsed_time": "21:29:33", "remaining_time": "20:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9083, "total_steps": 17941, "loss": 1.8522, "learning_rate": 5.034281041195389e-05, "epoch": 0.5062705534808539, "percentage": 50.63, "elapsed_time": "21:29:42", "remaining_time": "20:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9084, "total_steps": 17941, "loss": 1.4206, "learning_rate": 5.0333906379544485e-05, "epoch": 0.5063262917340171, "percentage": 50.63, "elapsed_time": "21:29:50", "remaining_time": "20:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9085, "total_steps": 17941, "loss": 1.6741, "learning_rate": 5.0325002336545525e-05, "epoch": 0.5063820299871802, "percentage": 50.64, "elapsed_time": "21:29:59", "remaining_time": "20:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9086, "total_steps": 17941, "loss": 1.6622, "learning_rate": 5.031609828323938e-05, "epoch": 0.5064377682403434, "percentage": 50.64, "elapsed_time": "21:30:07", "remaining_time": "20:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9087, "total_steps": 17941, "loss": 1.6901, "learning_rate": 5.030719421990845e-05, "epoch": 0.5064935064935064, "percentage": 50.65, "elapsed_time": "21:30:16", "remaining_time": "20:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9088, "total_steps": 17941, "loss": 1.5533, "learning_rate": 5.029829014683509e-05, "epoch": 0.5065492447466696, "percentage": 50.65, "elapsed_time": "21:30:24", "remaining_time": "20:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9089, "total_steps": 17941, "loss": 2.0952, "learning_rate": 5.0289386064301715e-05, "epoch": 0.5066049829998328, "percentage": 50.66, "elapsed_time": "21:30:32", "remaining_time": "20:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9090, "total_steps": 17941, "loss": 1.5283, "learning_rate": 5.0280481972590696e-05, "epoch": 0.5066607212529959, "percentage": 50.67, "elapsed_time": "21:30:41", "remaining_time": "20:56:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9091, "total_steps": 17941, "loss": 1.5935, "learning_rate": 5.027157787198443e-05, "epoch": 0.5067164595061591, "percentage": 50.67, "elapsed_time": "21:30:49", "remaining_time": "20:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9092, "total_steps": 17941, "loss": 1.6714, "learning_rate": 5.0262673762765314e-05, "epoch": 0.5067721977593223, "percentage": 50.68, "elapsed_time": "21:30:58", "remaining_time": "20:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9093, "total_steps": 17941, "loss": 1.6966, "learning_rate": 5.0253769645215684e-05, "epoch": 0.5068279360124853, "percentage": 50.68, "elapsed_time": "21:31:06", "remaining_time": "20:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9094, "total_steps": 17941, "loss": 1.8099, "learning_rate": 5.024486551961799e-05, "epoch": 0.5068836742656485, "percentage": 50.69, "elapsed_time": "21:31:15", "remaining_time": "20:56:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9095, "total_steps": 17941, "loss": 1.8034, "learning_rate": 5.0235961386254584e-05, "epoch": 0.5069394125188117, "percentage": 50.69, "elapsed_time": "21:31:23", "remaining_time": "20:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9096, "total_steps": 17941, "loss": 1.761, "learning_rate": 5.022705724540785e-05, "epoch": 0.5069951507719748, "percentage": 50.7, "elapsed_time": "21:31:32", "remaining_time": "20:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9097, "total_steps": 17941, "loss": 1.5518, "learning_rate": 5.0218153097360174e-05, "epoch": 0.507050889025138, "percentage": 50.71, "elapsed_time": "21:31:41", "remaining_time": "20:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9098, "total_steps": 17941, "loss": 1.6151, "learning_rate": 5.0209248942393975e-05, "epoch": 0.5071066272783011, "percentage": 50.71, "elapsed_time": "21:31:50", "remaining_time": "20:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9099, "total_steps": 17941, "loss": 1.6079, "learning_rate": 5.020034478079161e-05, "epoch": 0.5071623655314642, "percentage": 50.72, "elapsed_time": "21:31:58", "remaining_time": "20:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9100, "total_steps": 17941, "loss": 1.4861, "learning_rate": 5.0191440612835484e-05, "epoch": 0.5072181037846274, "percentage": 50.72, "elapsed_time": "21:32:07", "remaining_time": "20:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9101, "total_steps": 17941, "loss": 1.6863, "learning_rate": 5.018253643880797e-05, "epoch": 0.5072738420377906, "percentage": 50.73, "elapsed_time": "21:32:15", "remaining_time": "20:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9102, "total_steps": 17941, "loss": 1.5901, "learning_rate": 5.017363225899147e-05, "epoch": 0.5073295802909537, "percentage": 50.73, "elapsed_time": "21:32:24", "remaining_time": "20:55:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9103, "total_steps": 17941, "loss": 1.6177, "learning_rate": 5.0164728073668354e-05, "epoch": 0.5073853185441168, "percentage": 50.74, "elapsed_time": "21:32:32", "remaining_time": "20:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9104, "total_steps": 17941, "loss": 1.5947, "learning_rate": 5.0155823883121025e-05, "epoch": 0.50744105679728, "percentage": 50.74, "elapsed_time": "21:32:41", "remaining_time": "20:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9105, "total_steps": 17941, "loss": 1.6997, "learning_rate": 5.014691968763189e-05, "epoch": 0.5074967950504431, "percentage": 50.75, "elapsed_time": "21:32:49", "remaining_time": "20:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9106, "total_steps": 17941, "loss": 1.7778, "learning_rate": 5.0138015487483305e-05, "epoch": 0.5075525333036063, "percentage": 50.76, "elapsed_time": "21:32:58", "remaining_time": "20:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9107, "total_steps": 17941, "loss": 1.6958, "learning_rate": 5.012911128295768e-05, "epoch": 0.5076082715567695, "percentage": 50.76, "elapsed_time": "21:33:06", "remaining_time": "20:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9108, "total_steps": 17941, "loss": 1.7133, "learning_rate": 5.012020707433739e-05, "epoch": 0.5076640098099325, "percentage": 50.77, "elapsed_time": "21:33:15", "remaining_time": "20:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9109, "total_steps": 17941, "loss": 1.3029, "learning_rate": 5.011130286190483e-05, "epoch": 0.5077197480630957, "percentage": 50.77, "elapsed_time": "21:33:23", "remaining_time": "20:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9110, "total_steps": 17941, "loss": 1.6388, "learning_rate": 5.0102398645942404e-05, "epoch": 0.5077754863162588, "percentage": 50.78, "elapsed_time": "21:33:31", "remaining_time": "20:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9111, "total_steps": 17941, "loss": 1.6256, "learning_rate": 5.009349442673249e-05, "epoch": 0.507831224569422, "percentage": 50.78, "elapsed_time": "21:33:40", "remaining_time": "20:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9112, "total_steps": 17941, "loss": 1.7203, "learning_rate": 5.008459020455747e-05, "epoch": 0.5078869628225852, "percentage": 50.79, "elapsed_time": "21:33:48", "remaining_time": "20:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9113, "total_steps": 17941, "loss": 1.6371, "learning_rate": 5.007568597969975e-05, "epoch": 0.5079427010757482, "percentage": 50.79, "elapsed_time": "21:33:57", "remaining_time": "20:53:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9114, "total_steps": 17941, "loss": 1.7731, "learning_rate": 5.00667817524417e-05, "epoch": 0.5079984393289114, "percentage": 50.8, "elapsed_time": "21:34:05", "remaining_time": "20:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9115, "total_steps": 17941, "loss": 1.7304, "learning_rate": 5.005787752306573e-05, "epoch": 0.5080541775820746, "percentage": 50.81, "elapsed_time": "21:34:14", "remaining_time": "20:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9116, "total_steps": 17941, "loss": 1.6358, "learning_rate": 5.0048973291854215e-05, "epoch": 0.5081099158352377, "percentage": 50.81, "elapsed_time": "21:34:22", "remaining_time": "20:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9117, "total_steps": 17941, "loss": 1.6261, "learning_rate": 5.004006905908956e-05, "epoch": 0.5081656540884009, "percentage": 50.82, "elapsed_time": "21:34:31", "remaining_time": "20:52:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9118, "total_steps": 17941, "loss": 1.7944, "learning_rate": 5.0031164825054154e-05, "epoch": 0.508221392341564, "percentage": 50.82, "elapsed_time": "21:34:39", "remaining_time": "20:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9119, "total_steps": 17941, "loss": 1.6483, "learning_rate": 5.0022260590030365e-05, "epoch": 0.5082771305947271, "percentage": 50.83, "elapsed_time": "21:34:48", "remaining_time": "20:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9120, "total_steps": 17941, "loss": 1.7028, "learning_rate": 5.0013356354300625e-05, "epoch": 0.5083328688478903, "percentage": 50.83, "elapsed_time": "21:34:56", "remaining_time": "20:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9121, "total_steps": 17941, "loss": 1.7512, "learning_rate": 5.000445211814727e-05, "epoch": 0.5083886071010535, "percentage": 50.84, "elapsed_time": "21:35:05", "remaining_time": "20:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9122, "total_steps": 17941, "loss": 1.6766, "learning_rate": 4.9995547881852745e-05, "epoch": 0.5084443453542166, "percentage": 50.84, "elapsed_time": "21:35:13", "remaining_time": "20:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9123, "total_steps": 17941, "loss": 1.3173, "learning_rate": 4.9986643645699387e-05, "epoch": 0.5085000836073797, "percentage": 50.85, "elapsed_time": "21:35:22", "remaining_time": "20:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9124, "total_steps": 17941, "loss": 1.7782, "learning_rate": 4.997773940996964e-05, "epoch": 0.5085558218605429, "percentage": 50.86, "elapsed_time": "21:35:30", "remaining_time": "20:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9125, "total_steps": 17941, "loss": 1.566, "learning_rate": 4.9968835174945864e-05, "epoch": 0.508611560113706, "percentage": 50.86, "elapsed_time": "21:35:38", "remaining_time": "20:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9126, "total_steps": 17941, "loss": 1.61, "learning_rate": 4.995993094091044e-05, "epoch": 0.5086672983668692, "percentage": 50.87, "elapsed_time": "21:35:47", "remaining_time": "20:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9127, "total_steps": 17941, "loss": 1.3672, "learning_rate": 4.995102670814579e-05, "epoch": 0.5087230366200324, "percentage": 50.87, "elapsed_time": "21:35:55", "remaining_time": "20:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9128, "total_steps": 17941, "loss": 1.8647, "learning_rate": 4.9942122476934286e-05, "epoch": 0.5087787748731954, "percentage": 50.88, "elapsed_time": "21:36:04", "remaining_time": "20:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9129, "total_steps": 17941, "loss": 1.4283, "learning_rate": 4.9933218247558316e-05, "epoch": 0.5088345131263586, "percentage": 50.88, "elapsed_time": "21:36:12", "remaining_time": "20:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9130, "total_steps": 17941, "loss": 1.7816, "learning_rate": 4.992431402030026e-05, "epoch": 0.5088902513795218, "percentage": 50.89, "elapsed_time": "21:36:21", "remaining_time": "20:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9131, "total_steps": 17941, "loss": 1.5547, "learning_rate": 4.9915409795442553e-05, "epoch": 0.5089459896326849, "percentage": 50.89, "elapsed_time": "21:36:29", "remaining_time": "20:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9132, "total_steps": 17941, "loss": 1.6848, "learning_rate": 4.990650557326752e-05, "epoch": 0.5090017278858481, "percentage": 50.9, "elapsed_time": "21:36:38", "remaining_time": "20:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9133, "total_steps": 17941, "loss": 1.5241, "learning_rate": 4.98976013540576e-05, "epoch": 0.5090574661390111, "percentage": 50.91, "elapsed_time": "21:36:46", "remaining_time": "20:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9134, "total_steps": 17941, "loss": 1.3605, "learning_rate": 4.988869713809518e-05, "epoch": 0.5091132043921743, "percentage": 50.91, "elapsed_time": "21:36:55", "remaining_time": "20:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9135, "total_steps": 17941, "loss": 1.663, "learning_rate": 4.9879792925662624e-05, "epoch": 0.5091689426453375, "percentage": 50.92, "elapsed_time": "21:37:03", "remaining_time": "20:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9136, "total_steps": 17941, "loss": 1.7112, "learning_rate": 4.987088871704234e-05, "epoch": 0.5092246808985006, "percentage": 50.92, "elapsed_time": "21:37:12", "remaining_time": "20:50:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9137, "total_steps": 17941, "loss": 1.5613, "learning_rate": 4.9861984512516706e-05, "epoch": 0.5092804191516638, "percentage": 50.93, "elapsed_time": "21:37:20", "remaining_time": "20:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9138, "total_steps": 17941, "loss": 1.7832, "learning_rate": 4.985308031236811e-05, "epoch": 0.509336157404827, "percentage": 50.93, "elapsed_time": "21:37:28", "remaining_time": "20:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9139, "total_steps": 17941, "loss": 1.6785, "learning_rate": 4.984417611687899e-05, "epoch": 0.50939189565799, "percentage": 50.94, "elapsed_time": "21:37:37", "remaining_time": "20:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9140, "total_steps": 17941, "loss": 1.6664, "learning_rate": 4.983527192633165e-05, "epoch": 0.5094476339111532, "percentage": 50.94, "elapsed_time": "21:37:45", "remaining_time": "20:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9141, "total_steps": 17941, "loss": 1.5922, "learning_rate": 4.982636774100855e-05, "epoch": 0.5095033721643164, "percentage": 50.95, "elapsed_time": "21:37:54", "remaining_time": "20:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9142, "total_steps": 17941, "loss": 1.51, "learning_rate": 4.981746356119204e-05, "epoch": 0.5095591104174795, "percentage": 50.96, "elapsed_time": "21:38:02", "remaining_time": "20:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9143, "total_steps": 17941, "loss": 1.661, "learning_rate": 4.980855938716454e-05, "epoch": 0.5096148486706427, "percentage": 50.96, "elapsed_time": "21:38:11", "remaining_time": "20:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9144, "total_steps": 17941, "loss": 1.5701, "learning_rate": 4.97996552192084e-05, "epoch": 0.5096705869238058, "percentage": 50.97, "elapsed_time": "21:38:19", "remaining_time": "20:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9145, "total_steps": 17941, "loss": 1.389, "learning_rate": 4.979075105760603e-05, "epoch": 0.5097263251769689, "percentage": 50.97, "elapsed_time": "21:38:28", "remaining_time": "20:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9146, "total_steps": 17941, "loss": 1.585, "learning_rate": 4.978184690263983e-05, "epoch": 0.5097820634301321, "percentage": 50.98, "elapsed_time": "21:38:36", "remaining_time": "20:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9147, "total_steps": 17941, "loss": 1.7289, "learning_rate": 4.9772942754592156e-05, "epoch": 0.5098378016832953, "percentage": 50.98, "elapsed_time": "21:38:45", "remaining_time": "20:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9148, "total_steps": 17941, "loss": 1.6774, "learning_rate": 4.976403861374545e-05, "epoch": 0.5098935399364584, "percentage": 50.99, "elapsed_time": "21:38:53", "remaining_time": "20:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9149, "total_steps": 17941, "loss": 1.4913, "learning_rate": 4.975513448038202e-05, "epoch": 0.5099492781896215, "percentage": 50.99, "elapsed_time": "21:39:01", "remaining_time": "20:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9150, "total_steps": 17941, "loss": 1.8086, "learning_rate": 4.974623035478432e-05, "epoch": 0.5100050164427847, "percentage": 51.0, "elapsed_time": "21:39:10", "remaining_time": "20:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9151, "total_steps": 17941, "loss": 1.48, "learning_rate": 4.9737326237234704e-05, "epoch": 0.5100607546959478, "percentage": 51.01, "elapsed_time": "21:39:18", "remaining_time": "20:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9152, "total_steps": 17941, "loss": 1.6754, "learning_rate": 4.972842212801557e-05, "epoch": 0.510116492949111, "percentage": 51.01, "elapsed_time": "21:39:27", "remaining_time": "20:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9153, "total_steps": 17941, "loss": 1.6418, "learning_rate": 4.9719518027409315e-05, "epoch": 0.5101722312022742, "percentage": 51.02, "elapsed_time": "21:39:35", "remaining_time": "20:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9154, "total_steps": 17941, "loss": 1.5825, "learning_rate": 4.9710613935698296e-05, "epoch": 0.5102279694554372, "percentage": 51.02, "elapsed_time": "21:39:44", "remaining_time": "20:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9155, "total_steps": 17941, "loss": 1.7214, "learning_rate": 4.970170985316493e-05, "epoch": 0.5102837077086004, "percentage": 51.03, "elapsed_time": "21:39:52", "remaining_time": "20:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9156, "total_steps": 17941, "loss": 1.6079, "learning_rate": 4.969280578009157e-05, "epoch": 0.5103394459617635, "percentage": 51.03, "elapsed_time": "21:40:01", "remaining_time": "20:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9157, "total_steps": 17941, "loss": 1.7796, "learning_rate": 4.9683901716760645e-05, "epoch": 0.5103951842149267, "percentage": 51.04, "elapsed_time": "21:40:10", "remaining_time": "20:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9158, "total_steps": 17941, "loss": 1.5331, "learning_rate": 4.967499766345449e-05, "epoch": 0.5104509224680899, "percentage": 51.05, "elapsed_time": "21:40:18", "remaining_time": "20:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9159, "total_steps": 17941, "loss": 1.5991, "learning_rate": 4.966609362045552e-05, "epoch": 0.510506660721253, "percentage": 51.05, "elapsed_time": "21:40:26", "remaining_time": "20:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9160, "total_steps": 17941, "loss": 1.6963, "learning_rate": 4.9657189588046125e-05, "epoch": 0.5105623989744161, "percentage": 51.06, "elapsed_time": "21:40:35", "remaining_time": "20:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9161, "total_steps": 17941, "loss": 1.4591, "learning_rate": 4.964828556650867e-05, "epoch": 0.5106181372275793, "percentage": 51.06, "elapsed_time": "21:40:43", "remaining_time": "20:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9162, "total_steps": 17941, "loss": 1.7269, "learning_rate": 4.9639381556125545e-05, "epoch": 0.5106738754807424, "percentage": 51.07, "elapsed_time": "21:40:52", "remaining_time": "20:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9163, "total_steps": 17941, "loss": 1.7202, "learning_rate": 4.963047755717914e-05, "epoch": 0.5107296137339056, "percentage": 51.07, "elapsed_time": "21:41:00", "remaining_time": "20:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9164, "total_steps": 17941, "loss": 1.543, "learning_rate": 4.962157356995181e-05, "epoch": 0.5107853519870688, "percentage": 51.08, "elapsed_time": "21:41:09", "remaining_time": "20:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9165, "total_steps": 17941, "loss": 1.506, "learning_rate": 4.9612669594725985e-05, "epoch": 0.5108410902402318, "percentage": 51.08, "elapsed_time": "21:41:17", "remaining_time": "20:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9166, "total_steps": 17941, "loss": 1.4054, "learning_rate": 4.960376563178402e-05, "epoch": 0.510896828493395, "percentage": 51.09, "elapsed_time": "21:41:26", "remaining_time": "20:45:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9167, "total_steps": 17941, "loss": 1.8014, "learning_rate": 4.95948616814083e-05, "epoch": 0.5109525667465582, "percentage": 51.1, "elapsed_time": "21:41:34", "remaining_time": "20:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9168, "total_steps": 17941, "loss": 1.6825, "learning_rate": 4.958595774388119e-05, "epoch": 0.5110083049997213, "percentage": 51.1, "elapsed_time": "21:41:42", "remaining_time": "20:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9169, "total_steps": 17941, "loss": 1.8822, "learning_rate": 4.9577053819485106e-05, "epoch": 0.5110640432528845, "percentage": 51.11, "elapsed_time": "21:41:51", "remaining_time": "20:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9170, "total_steps": 17941, "loss": 1.5337, "learning_rate": 4.95681499085024e-05, "epoch": 0.5111197815060476, "percentage": 51.11, "elapsed_time": "21:41:59", "remaining_time": "20:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9171, "total_steps": 17941, "loss": 1.6926, "learning_rate": 4.9559246011215445e-05, "epoch": 0.5111755197592107, "percentage": 51.12, "elapsed_time": "21:42:08", "remaining_time": "20:45:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9172, "total_steps": 17941, "loss": 1.8106, "learning_rate": 4.955034212790667e-05, "epoch": 0.5112312580123739, "percentage": 51.12, "elapsed_time": "21:42:16", "remaining_time": "20:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9173, "total_steps": 17941, "loss": 1.5418, "learning_rate": 4.954143825885839e-05, "epoch": 0.5112869962655371, "percentage": 51.13, "elapsed_time": "21:42:25", "remaining_time": "20:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9174, "total_steps": 17941, "loss": 1.7995, "learning_rate": 4.9532534404353045e-05, "epoch": 0.5113427345187002, "percentage": 51.13, "elapsed_time": "21:42:33", "remaining_time": "20:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9175, "total_steps": 17941, "loss": 1.7018, "learning_rate": 4.952363056467295e-05, "epoch": 0.5113984727718633, "percentage": 51.14, "elapsed_time": "21:42:42", "remaining_time": "20:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9176, "total_steps": 17941, "loss": 1.4375, "learning_rate": 4.951472674010054e-05, "epoch": 0.5114542110250265, "percentage": 51.15, "elapsed_time": "21:42:50", "remaining_time": "20:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9177, "total_steps": 17941, "loss": 1.856, "learning_rate": 4.9505822930918154e-05, "epoch": 0.5115099492781896, "percentage": 51.15, "elapsed_time": "21:42:59", "remaining_time": "20:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9178, "total_steps": 17941, "loss": 1.5449, "learning_rate": 4.9496919137408194e-05, "epoch": 0.5115656875313528, "percentage": 51.16, "elapsed_time": "21:43:07", "remaining_time": "20:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9179, "total_steps": 17941, "loss": 1.5744, "learning_rate": 4.948801535985302e-05, "epoch": 0.5116214257845159, "percentage": 51.16, "elapsed_time": "21:43:16", "remaining_time": "20:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9180, "total_steps": 17941, "loss": 1.5903, "learning_rate": 4.947911159853502e-05, "epoch": 0.511677164037679, "percentage": 51.17, "elapsed_time": "21:43:24", "remaining_time": "20:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9181, "total_steps": 17941, "loss": 1.6904, "learning_rate": 4.947020785373657e-05, "epoch": 0.5117329022908422, "percentage": 51.17, "elapsed_time": "21:43:33", "remaining_time": "20:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9182, "total_steps": 17941, "loss": 1.6402, "learning_rate": 4.9461304125740006e-05, "epoch": 0.5117886405440053, "percentage": 51.18, "elapsed_time": "21:43:41", "remaining_time": "20:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9183, "total_steps": 17941, "loss": 1.6268, "learning_rate": 4.945240041482777e-05, "epoch": 0.5118443787971685, "percentage": 51.18, "elapsed_time": "21:43:50", "remaining_time": "20:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9184, "total_steps": 17941, "loss": 1.7676, "learning_rate": 4.9443496721282176e-05, "epoch": 0.5119001170503317, "percentage": 51.19, "elapsed_time": "21:43:58", "remaining_time": "20:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9185, "total_steps": 17941, "loss": 1.787, "learning_rate": 4.943459304538562e-05, "epoch": 0.5119558553034947, "percentage": 51.2, "elapsed_time": "21:44:07", "remaining_time": "20:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9186, "total_steps": 17941, "loss": 1.4734, "learning_rate": 4.94256893874205e-05, "epoch": 0.5120115935566579, "percentage": 51.2, "elapsed_time": "21:44:15", "remaining_time": "20:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9187, "total_steps": 17941, "loss": 1.6512, "learning_rate": 4.941678574766915e-05, "epoch": 0.5120673318098211, "percentage": 51.21, "elapsed_time": "21:44:24", "remaining_time": "20:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9188, "total_steps": 17941, "loss": 1.6187, "learning_rate": 4.9407882126413964e-05, "epoch": 0.5121230700629842, "percentage": 51.21, "elapsed_time": "21:44:33", "remaining_time": "20:42:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9189, "total_steps": 17941, "loss": 1.7205, "learning_rate": 4.939897852393729e-05, "epoch": 0.5121788083161474, "percentage": 51.22, "elapsed_time": "21:44:42", "remaining_time": "20:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9190, "total_steps": 17941, "loss": 1.7667, "learning_rate": 4.939007494052153e-05, "epoch": 0.5122345465693106, "percentage": 51.22, "elapsed_time": "21:44:50", "remaining_time": "20:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9191, "total_steps": 17941, "loss": 1.6104, "learning_rate": 4.938117137644901e-05, "epoch": 0.5122902848224736, "percentage": 51.23, "elapsed_time": "21:44:59", "remaining_time": "20:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9192, "total_steps": 17941, "loss": 1.5063, "learning_rate": 4.937226783200214e-05, "epoch": 0.5123460230756368, "percentage": 51.23, "elapsed_time": "21:45:07", "remaining_time": "20:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9193, "total_steps": 17941, "loss": 1.8014, "learning_rate": 4.936336430746328e-05, "epoch": 0.5124017613288, "percentage": 51.24, "elapsed_time": "21:45:15", "remaining_time": "20:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9194, "total_steps": 17941, "loss": 2.0275, "learning_rate": 4.935446080311479e-05, "epoch": 0.5124574995819631, "percentage": 51.25, "elapsed_time": "21:45:24", "remaining_time": "20:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9195, "total_steps": 17941, "loss": 1.4672, "learning_rate": 4.934555731923905e-05, "epoch": 0.5125132378351263, "percentage": 51.25, "elapsed_time": "21:45:33", "remaining_time": "20:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9196, "total_steps": 17941, "loss": 1.9117, "learning_rate": 4.9336653856118395e-05, "epoch": 0.5125689760882894, "percentage": 51.26, "elapsed_time": "21:45:42", "remaining_time": "20:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9197, "total_steps": 17941, "loss": 1.7259, "learning_rate": 4.932775041403521e-05, "epoch": 0.5126247143414525, "percentage": 51.26, "elapsed_time": "21:45:50", "remaining_time": "20:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9198, "total_steps": 17941, "loss": 1.6182, "learning_rate": 4.93188469932719e-05, "epoch": 0.5126804525946157, "percentage": 51.27, "elapsed_time": "21:45:58", "remaining_time": "20:41:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9199, "total_steps": 17941, "loss": 1.6146, "learning_rate": 4.9309943594110743e-05, "epoch": 0.5127361908477789, "percentage": 51.27, "elapsed_time": "21:46:07", "remaining_time": "20:41:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9200, "total_steps": 17941, "loss": 1.5467, "learning_rate": 4.93010402168342e-05, "epoch": 0.512791929100942, "percentage": 51.28, "elapsed_time": "21:46:15", "remaining_time": "20:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9201, "total_steps": 17941, "loss": 1.7189, "learning_rate": 4.9292136861724544e-05, "epoch": 0.5128476673541051, "percentage": 51.28, "elapsed_time": "21:46:24", "remaining_time": "20:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9202, "total_steps": 17941, "loss": 1.6331, "learning_rate": 4.9283233529064205e-05, "epoch": 0.5129034056072682, "percentage": 51.29, "elapsed_time": "21:46:32", "remaining_time": "20:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9203, "total_steps": 17941, "loss": 1.3119, "learning_rate": 4.9274330219135506e-05, "epoch": 0.5129591438604314, "percentage": 51.3, "elapsed_time": "21:46:41", "remaining_time": "20:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9204, "total_steps": 17941, "loss": 1.7628, "learning_rate": 4.926542693222083e-05, "epoch": 0.5130148821135946, "percentage": 51.3, "elapsed_time": "21:46:49", "remaining_time": "20:40:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9205, "total_steps": 17941, "loss": 1.8385, "learning_rate": 4.925652366860253e-05, "epoch": 0.5130706203667577, "percentage": 51.31, "elapsed_time": "21:46:58", "remaining_time": "20:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9206, "total_steps": 17941, "loss": 1.5642, "learning_rate": 4.9247620428562954e-05, "epoch": 0.5131263586199208, "percentage": 51.31, "elapsed_time": "21:47:06", "remaining_time": "20:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9207, "total_steps": 17941, "loss": 1.5955, "learning_rate": 4.9238717212384485e-05, "epoch": 0.513182096873084, "percentage": 51.32, "elapsed_time": "21:47:14", "remaining_time": "20:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9208, "total_steps": 17941, "loss": 1.4373, "learning_rate": 4.922981402034945e-05, "epoch": 0.5132378351262471, "percentage": 51.32, "elapsed_time": "21:47:23", "remaining_time": "20:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9209, "total_steps": 17941, "loss": 1.5492, "learning_rate": 4.922091085274025e-05, "epoch": 0.5132935733794103, "percentage": 51.33, "elapsed_time": "21:47:31", "remaining_time": "20:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9210, "total_steps": 17941, "loss": 1.7274, "learning_rate": 4.9212007709839185e-05, "epoch": 0.5133493116325735, "percentage": 51.33, "elapsed_time": "21:47:40", "remaining_time": "20:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9211, "total_steps": 17941, "loss": 1.6216, "learning_rate": 4.9203104591928654e-05, "epoch": 0.5134050498857365, "percentage": 51.34, "elapsed_time": "21:47:48", "remaining_time": "20:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9212, "total_steps": 17941, "loss": 1.7127, "learning_rate": 4.919420149929101e-05, "epoch": 0.5134607881388997, "percentage": 51.35, "elapsed_time": "21:47:57", "remaining_time": "20:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9213, "total_steps": 17941, "loss": 1.8044, "learning_rate": 4.918529843220858e-05, "epoch": 0.5135165263920629, "percentage": 51.35, "elapsed_time": "21:48:05", "remaining_time": "20:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9214, "total_steps": 17941, "loss": 1.7176, "learning_rate": 4.917639539096375e-05, "epoch": 0.513572264645226, "percentage": 51.36, "elapsed_time": "21:48:14", "remaining_time": "20:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9215, "total_steps": 17941, "loss": 1.8507, "learning_rate": 4.9167492375838844e-05, "epoch": 0.5136280028983892, "percentage": 51.36, "elapsed_time": "21:48:23", "remaining_time": "20:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9216, "total_steps": 17941, "loss": 1.4948, "learning_rate": 4.915858938711624e-05, "epoch": 0.5136837411515524, "percentage": 51.37, "elapsed_time": "21:48:31", "remaining_time": "20:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9217, "total_steps": 17941, "loss": 1.7211, "learning_rate": 4.914968642507824e-05, "epoch": 0.5137394794047154, "percentage": 51.37, "elapsed_time": "21:48:40", "remaining_time": "20:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9218, "total_steps": 17941, "loss": 1.6642, "learning_rate": 4.9140783490007255e-05, "epoch": 0.5137952176578786, "percentage": 51.38, "elapsed_time": "21:48:49", "remaining_time": "20:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9219, "total_steps": 17941, "loss": 1.7359, "learning_rate": 4.9131880582185614e-05, "epoch": 0.5138509559110418, "percentage": 51.39, "elapsed_time": "21:48:57", "remaining_time": "20:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9220, "total_steps": 17941, "loss": 1.6898, "learning_rate": 4.912297770189565e-05, "epoch": 0.5139066941642049, "percentage": 51.39, "elapsed_time": "21:49:06", "remaining_time": "20:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9221, "total_steps": 17941, "loss": 1.6172, "learning_rate": 4.911407484941973e-05, "epoch": 0.513962432417368, "percentage": 51.4, "elapsed_time": "21:49:14", "remaining_time": "20:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9222, "total_steps": 17941, "loss": 1.6677, "learning_rate": 4.910517202504017e-05, "epoch": 0.5140181706705312, "percentage": 51.4, "elapsed_time": "21:49:22", "remaining_time": "20:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9223, "total_steps": 17941, "loss": 1.8476, "learning_rate": 4.909626922903934e-05, "epoch": 0.5140739089236943, "percentage": 51.41, "elapsed_time": "21:49:32", "remaining_time": "20:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9224, "total_steps": 17941, "loss": 1.9254, "learning_rate": 4.90873664616996e-05, "epoch": 0.5141296471768575, "percentage": 51.41, "elapsed_time": "21:49:40", "remaining_time": "20:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9225, "total_steps": 17941, "loss": 2.0271, "learning_rate": 4.907846372330325e-05, "epoch": 0.5141853854300206, "percentage": 51.42, "elapsed_time": "21:49:49", "remaining_time": "20:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9226, "total_steps": 17941, "loss": 1.8016, "learning_rate": 4.906956101413269e-05, "epoch": 0.5142411236831838, "percentage": 51.42, "elapsed_time": "21:49:57", "remaining_time": "20:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9227, "total_steps": 17941, "loss": 1.7529, "learning_rate": 4.90606583344702e-05, "epoch": 0.5142968619363469, "percentage": 51.43, "elapsed_time": "21:50:07", "remaining_time": "20:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9228, "total_steps": 17941, "loss": 1.7477, "learning_rate": 4.905175568459817e-05, "epoch": 0.51435260018951, "percentage": 51.44, "elapsed_time": "21:50:15", "remaining_time": "20:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9229, "total_steps": 17941, "loss": 1.627, "learning_rate": 4.904285306479891e-05, "epoch": 0.5144083384426732, "percentage": 51.44, "elapsed_time": "21:50:24", "remaining_time": "20:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9230, "total_steps": 17941, "loss": 1.459, "learning_rate": 4.903395047535477e-05, "epoch": 0.5144640766958364, "percentage": 51.45, "elapsed_time": "21:50:32", "remaining_time": "20:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9231, "total_steps": 17941, "loss": 1.6794, "learning_rate": 4.90250479165481e-05, "epoch": 0.5145198149489995, "percentage": 51.45, "elapsed_time": "21:50:41", "remaining_time": "20:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9232, "total_steps": 17941, "loss": 1.5589, "learning_rate": 4.901614538866121e-05, "epoch": 0.5145755532021626, "percentage": 51.46, "elapsed_time": "21:50:49", "remaining_time": "20:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9233, "total_steps": 17941, "loss": 1.9199, "learning_rate": 4.900724289197647e-05, "epoch": 0.5146312914553258, "percentage": 51.46, "elapsed_time": "21:50:57", "remaining_time": "20:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9234, "total_steps": 17941, "loss": 1.8075, "learning_rate": 4.899834042677617e-05, "epoch": 0.5146870297084889, "percentage": 51.47, "elapsed_time": "21:51:06", "remaining_time": "20:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9235, "total_steps": 17941, "loss": 1.4777, "learning_rate": 4.898943799334271e-05, "epoch": 0.5147427679616521, "percentage": 51.47, "elapsed_time": "21:51:14", "remaining_time": "20:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9236, "total_steps": 17941, "loss": 1.8581, "learning_rate": 4.8980535591958346e-05, "epoch": 0.5147985062148153, "percentage": 51.48, "elapsed_time": "21:51:23", "remaining_time": "20:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9237, "total_steps": 17941, "loss": 1.9628, "learning_rate": 4.897163322290546e-05, "epoch": 0.5148542444679783, "percentage": 51.49, "elapsed_time": "21:51:32", "remaining_time": "20:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9238, "total_steps": 17941, "loss": 1.5789, "learning_rate": 4.896273088646639e-05, "epoch": 0.5149099827211415, "percentage": 51.49, "elapsed_time": "21:51:40", "remaining_time": "20:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9239, "total_steps": 17941, "loss": 1.6334, "learning_rate": 4.8953828582923435e-05, "epoch": 0.5149657209743047, "percentage": 51.5, "elapsed_time": "21:51:49", "remaining_time": "20:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9240, "total_steps": 17941, "loss": 1.7236, "learning_rate": 4.894492631255895e-05, "epoch": 0.5150214592274678, "percentage": 51.5, "elapsed_time": "21:51:57", "remaining_time": "20:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9241, "total_steps": 17941, "loss": 1.8026, "learning_rate": 4.8936024075655234e-05, "epoch": 0.515077197480631, "percentage": 51.51, "elapsed_time": "21:52:06", "remaining_time": "20:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9242, "total_steps": 17941, "loss": 1.7085, "learning_rate": 4.892712187249465e-05, "epoch": 0.5151329357337942, "percentage": 51.51, "elapsed_time": "21:52:14", "remaining_time": "20:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9243, "total_steps": 17941, "loss": 1.8545, "learning_rate": 4.891821970335948e-05, "epoch": 0.5151886739869572, "percentage": 51.52, "elapsed_time": "21:52:23", "remaining_time": "20:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9244, "total_steps": 17941, "loss": 1.5689, "learning_rate": 4.8909317568532074e-05, "epoch": 0.5152444122401204, "percentage": 51.52, "elapsed_time": "21:52:31", "remaining_time": "20:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9245, "total_steps": 17941, "loss": 1.6177, "learning_rate": 4.890041546829478e-05, "epoch": 0.5153001504932836, "percentage": 51.53, "elapsed_time": "21:52:40", "remaining_time": "20:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9246, "total_steps": 17941, "loss": 1.6859, "learning_rate": 4.889151340292988e-05, "epoch": 0.5153558887464467, "percentage": 51.54, "elapsed_time": "21:52:48", "remaining_time": "20:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9247, "total_steps": 17941, "loss": 1.7225, "learning_rate": 4.888261137271972e-05, "epoch": 0.5154116269996099, "percentage": 51.54, "elapsed_time": "21:52:57", "remaining_time": "20:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9248, "total_steps": 17941, "loss": 1.8317, "learning_rate": 4.8873709377946607e-05, "epoch": 0.5154673652527729, "percentage": 51.55, "elapsed_time": "21:53:05", "remaining_time": "20:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9249, "total_steps": 17941, "loss": 1.3468, "learning_rate": 4.886480741889285e-05, "epoch": 0.5155231035059361, "percentage": 51.55, "elapsed_time": "21:53:14", "remaining_time": "20:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9250, "total_steps": 17941, "loss": 1.8712, "learning_rate": 4.8855905495840824e-05, "epoch": 0.5155788417590993, "percentage": 51.56, "elapsed_time": "21:53:22", "remaining_time": "20:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9251, "total_steps": 17941, "loss": 1.7937, "learning_rate": 4.8847003609072766e-05, "epoch": 0.5156345800122624, "percentage": 51.56, "elapsed_time": "21:53:30", "remaining_time": "20:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9252, "total_steps": 17941, "loss": 1.6511, "learning_rate": 4.883810175887106e-05, "epoch": 0.5156903182654256, "percentage": 51.57, "elapsed_time": "21:53:39", "remaining_time": "20:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9253, "total_steps": 17941, "loss": 1.6945, "learning_rate": 4.882919994551797e-05, "epoch": 0.5157460565185887, "percentage": 51.57, "elapsed_time": "21:53:47", "remaining_time": "20:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9254, "total_steps": 17941, "loss": 1.555, "learning_rate": 4.882029816929585e-05, "epoch": 0.5158017947717518, "percentage": 51.58, "elapsed_time": "21:53:56", "remaining_time": "20:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9255, "total_steps": 17941, "loss": 1.5392, "learning_rate": 4.881139643048698e-05, "epoch": 0.515857533024915, "percentage": 51.59, "elapsed_time": "21:54:04", "remaining_time": "20:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9256, "total_steps": 17941, "loss": 1.5023, "learning_rate": 4.8802494729373684e-05, "epoch": 0.5159132712780782, "percentage": 51.59, "elapsed_time": "21:54:13", "remaining_time": "20:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9257, "total_steps": 17941, "loss": 1.7664, "learning_rate": 4.879359306623829e-05, "epoch": 0.5159690095312413, "percentage": 51.6, "elapsed_time": "21:54:21", "remaining_time": "20:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9258, "total_steps": 17941, "loss": 1.7523, "learning_rate": 4.878469144136306e-05, "epoch": 0.5160247477844044, "percentage": 51.6, "elapsed_time": "21:54:30", "remaining_time": "20:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9259, "total_steps": 17941, "loss": 1.7377, "learning_rate": 4.8775789855030366e-05, "epoch": 0.5160804860375676, "percentage": 51.61, "elapsed_time": "21:54:38", "remaining_time": "20:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9260, "total_steps": 17941, "loss": 1.9714, "learning_rate": 4.876688830752245e-05, "epoch": 0.5161362242907307, "percentage": 51.61, "elapsed_time": "21:54:46", "remaining_time": "20:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9261, "total_steps": 17941, "loss": 1.5455, "learning_rate": 4.8757986799121685e-05, "epoch": 0.5161919625438939, "percentage": 51.62, "elapsed_time": "21:54:55", "remaining_time": "20:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9262, "total_steps": 17941, "loss": 1.547, "learning_rate": 4.87490853301103e-05, "epoch": 0.5162477007970571, "percentage": 51.62, "elapsed_time": "21:55:03", "remaining_time": "20:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9263, "total_steps": 17941, "loss": 1.7112, "learning_rate": 4.874018390077065e-05, "epoch": 0.5163034390502201, "percentage": 51.63, "elapsed_time": "21:55:12", "remaining_time": "20:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9264, "total_steps": 17941, "loss": 1.5646, "learning_rate": 4.8731282511385025e-05, "epoch": 0.5163591773033833, "percentage": 51.64, "elapsed_time": "21:55:20", "remaining_time": "20:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9265, "total_steps": 17941, "loss": 1.7205, "learning_rate": 4.872238116223571e-05, "epoch": 0.5164149155565465, "percentage": 51.64, "elapsed_time": "21:55:30", "remaining_time": "20:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9266, "total_steps": 17941, "loss": 1.641, "learning_rate": 4.871347985360503e-05, "epoch": 0.5164706538097096, "percentage": 51.65, "elapsed_time": "21:55:38", "remaining_time": "20:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9267, "total_steps": 17941, "loss": 1.7817, "learning_rate": 4.870457858577526e-05, "epoch": 0.5165263920628728, "percentage": 51.65, "elapsed_time": "21:55:47", "remaining_time": "20:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9268, "total_steps": 17941, "loss": 2.0283, "learning_rate": 4.869567735902871e-05, "epoch": 0.516582130316036, "percentage": 51.66, "elapsed_time": "21:55:55", "remaining_time": "20:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9269, "total_steps": 17941, "loss": 1.7466, "learning_rate": 4.8686776173647653e-05, "epoch": 0.516637868569199, "percentage": 51.66, "elapsed_time": "21:56:04", "remaining_time": "20:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9270, "total_steps": 17941, "loss": 1.4493, "learning_rate": 4.867787502991441e-05, "epoch": 0.5166936068223622, "percentage": 51.67, "elapsed_time": "21:56:12", "remaining_time": "20:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9271, "total_steps": 17941, "loss": 1.6095, "learning_rate": 4.866897392811126e-05, "epoch": 0.5167493450755253, "percentage": 51.67, "elapsed_time": "21:56:21", "remaining_time": "20:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9272, "total_steps": 17941, "loss": 1.6357, "learning_rate": 4.866007286852051e-05, "epoch": 0.5168050833286885, "percentage": 51.68, "elapsed_time": "21:56:29", "remaining_time": "20:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9273, "total_steps": 17941, "loss": 1.6251, "learning_rate": 4.865117185142443e-05, "epoch": 0.5168608215818516, "percentage": 51.69, "elapsed_time": "21:56:38", "remaining_time": "20:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9274, "total_steps": 17941, "loss": 1.6139, "learning_rate": 4.8642270877105305e-05, "epoch": 0.5169165598350147, "percentage": 51.69, "elapsed_time": "21:56:46", "remaining_time": "20:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9275, "total_steps": 17941, "loss": 1.7346, "learning_rate": 4.863336994584542e-05, "epoch": 0.5169722980881779, "percentage": 51.7, "elapsed_time": "21:56:55", "remaining_time": "20:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9276, "total_steps": 17941, "loss": 1.8586, "learning_rate": 4.8624469057927116e-05, "epoch": 0.5170280363413411, "percentage": 51.7, "elapsed_time": "21:57:04", "remaining_time": "20:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9277, "total_steps": 17941, "loss": 1.6571, "learning_rate": 4.861556821363259e-05, "epoch": 0.5170837745945042, "percentage": 51.71, "elapsed_time": "21:57:12", "remaining_time": "20:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9278, "total_steps": 17941, "loss": 1.6364, "learning_rate": 4.860666741324419e-05, "epoch": 0.5171395128476673, "percentage": 51.71, "elapsed_time": "21:57:21", "remaining_time": "20:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9279, "total_steps": 17941, "loss": 1.5787, "learning_rate": 4.8597766657044166e-05, "epoch": 0.5171952511008305, "percentage": 51.72, "elapsed_time": "21:57:29", "remaining_time": "20:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9280, "total_steps": 17941, "loss": 1.7362, "learning_rate": 4.8588865945314826e-05, "epoch": 0.5172509893539936, "percentage": 51.73, "elapsed_time": "21:57:38", "remaining_time": "20:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9281, "total_steps": 17941, "loss": 1.9419, "learning_rate": 4.857996527833841e-05, "epoch": 0.5173067276071568, "percentage": 51.73, "elapsed_time": "21:57:46", "remaining_time": "20:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9282, "total_steps": 17941, "loss": 1.8925, "learning_rate": 4.857106465639723e-05, "epoch": 0.51736246586032, "percentage": 51.74, "elapsed_time": "21:57:55", "remaining_time": "20:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9283, "total_steps": 17941, "loss": 1.5802, "learning_rate": 4.8562164079773545e-05, "epoch": 0.517418204113483, "percentage": 51.74, "elapsed_time": "21:58:03", "remaining_time": "20:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9284, "total_steps": 17941, "loss": 1.651, "learning_rate": 4.855326354874962e-05, "epoch": 0.5174739423666462, "percentage": 51.75, "elapsed_time": "21:58:12", "remaining_time": "20:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9285, "total_steps": 17941, "loss": 1.5509, "learning_rate": 4.8544363063607764e-05, "epoch": 0.5175296806198094, "percentage": 51.75, "elapsed_time": "21:58:20", "remaining_time": "20:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9286, "total_steps": 17941, "loss": 1.5164, "learning_rate": 4.8535462624630196e-05, "epoch": 0.5175854188729725, "percentage": 51.76, "elapsed_time": "21:58:29", "remaining_time": "20:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9287, "total_steps": 17941, "loss": 1.4815, "learning_rate": 4.852656223209925e-05, "epoch": 0.5176411571261357, "percentage": 51.76, "elapsed_time": "21:58:37", "remaining_time": "20:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9288, "total_steps": 17941, "loss": 1.6221, "learning_rate": 4.8517661886297124e-05, "epoch": 0.5176968953792989, "percentage": 51.77, "elapsed_time": "21:58:46", "remaining_time": "20:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9289, "total_steps": 17941, "loss": 1.5974, "learning_rate": 4.850876158750613e-05, "epoch": 0.5177526336324619, "percentage": 51.78, "elapsed_time": "21:58:55", "remaining_time": "20:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9290, "total_steps": 17941, "loss": 1.7308, "learning_rate": 4.849986133600854e-05, "epoch": 0.5178083718856251, "percentage": 51.78, "elapsed_time": "21:59:03", "remaining_time": "20:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9291, "total_steps": 17941, "loss": 1.828, "learning_rate": 4.849096113208658e-05, "epoch": 0.5178641101387883, "percentage": 51.79, "elapsed_time": "21:59:12", "remaining_time": "20:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9292, "total_steps": 17941, "loss": 1.7686, "learning_rate": 4.848206097602256e-05, "epoch": 0.5179198483919514, "percentage": 51.79, "elapsed_time": "21:59:20", "remaining_time": "20:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9293, "total_steps": 17941, "loss": 1.8687, "learning_rate": 4.8473160868098697e-05, "epoch": 0.5179755866451146, "percentage": 51.8, "elapsed_time": "21:59:29", "remaining_time": "20:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9294, "total_steps": 17941, "loss": 1.4875, "learning_rate": 4.8464260808597276e-05, "epoch": 0.5180313248982776, "percentage": 51.8, "elapsed_time": "21:59:37", "remaining_time": "20:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9295, "total_steps": 17941, "loss": 1.7863, "learning_rate": 4.8455360797800534e-05, "epoch": 0.5180870631514408, "percentage": 51.81, "elapsed_time": "21:59:46", "remaining_time": "20:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9296, "total_steps": 17941, "loss": 1.842, "learning_rate": 4.844646083599075e-05, "epoch": 0.518142801404604, "percentage": 51.81, "elapsed_time": "21:59:54", "remaining_time": "20:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9297, "total_steps": 17941, "loss": 1.4797, "learning_rate": 4.843756092345018e-05, "epoch": 0.5181985396577671, "percentage": 51.82, "elapsed_time": "22:00:03", "remaining_time": "20:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9298, "total_steps": 17941, "loss": 1.6694, "learning_rate": 4.8428661060461055e-05, "epoch": 0.5182542779109303, "percentage": 51.83, "elapsed_time": "22:00:12", "remaining_time": "20:27:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9299, "total_steps": 17941, "loss": 1.611, "learning_rate": 4.8419761247305655e-05, "epoch": 0.5183100161640934, "percentage": 51.83, "elapsed_time": "22:00:20", "remaining_time": "20:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9300, "total_steps": 17941, "loss": 1.4735, "learning_rate": 4.8410861484266206e-05, "epoch": 0.5183657544172565, "percentage": 51.84, "elapsed_time": "22:00:30", "remaining_time": "20:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9301, "total_steps": 17941, "loss": 1.5019, "learning_rate": 4.8401961771624946e-05, "epoch": 0.5184214926704197, "percentage": 51.84, "elapsed_time": "22:00:38", "remaining_time": "20:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9302, "total_steps": 17941, "loss": 1.7617, "learning_rate": 4.839306210966418e-05, "epoch": 0.5184772309235829, "percentage": 51.85, "elapsed_time": "22:00:46", "remaining_time": "20:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9303, "total_steps": 17941, "loss": 1.8268, "learning_rate": 4.838416249866608e-05, "epoch": 0.518532969176746, "percentage": 51.85, "elapsed_time": "22:00:55", "remaining_time": "20:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9304, "total_steps": 17941, "loss": 1.816, "learning_rate": 4.837526293891295e-05, "epoch": 0.5185887074299091, "percentage": 51.86, "elapsed_time": "22:01:03", "remaining_time": "20:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9305, "total_steps": 17941, "loss": 1.6345, "learning_rate": 4.8366363430687e-05, "epoch": 0.5186444456830723, "percentage": 51.86, "elapsed_time": "22:01:12", "remaining_time": "20:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9306, "total_steps": 17941, "loss": 1.5671, "learning_rate": 4.8357463974270474e-05, "epoch": 0.5187001839362354, "percentage": 51.87, "elapsed_time": "22:01:20", "remaining_time": "20:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9307, "total_steps": 17941, "loss": 1.5713, "learning_rate": 4.834856456994561e-05, "epoch": 0.5187559221893986, "percentage": 51.88, "elapsed_time": "22:01:29", "remaining_time": "20:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9308, "total_steps": 17941, "loss": 1.6636, "learning_rate": 4.8339665217994654e-05, "epoch": 0.5188116604425618, "percentage": 51.88, "elapsed_time": "22:01:38", "remaining_time": "20:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9309, "total_steps": 17941, "loss": 1.6706, "learning_rate": 4.833076591869984e-05, "epoch": 0.5188673986957248, "percentage": 51.89, "elapsed_time": "22:01:46", "remaining_time": "20:25:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9310, "total_steps": 17941, "loss": 1.6778, "learning_rate": 4.832186667234338e-05, "epoch": 0.518923136948888, "percentage": 51.89, "elapsed_time": "22:01:55", "remaining_time": "20:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9311, "total_steps": 17941, "loss": 1.7534, "learning_rate": 4.831296747920756e-05, "epoch": 0.5189788752020512, "percentage": 51.9, "elapsed_time": "22:02:03", "remaining_time": "20:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9312, "total_steps": 17941, "loss": 1.5795, "learning_rate": 4.8304068339574536e-05, "epoch": 0.5190346134552143, "percentage": 51.9, "elapsed_time": "22:02:11", "remaining_time": "20:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9313, "total_steps": 17941, "loss": 1.5837, "learning_rate": 4.829516925372662e-05, "epoch": 0.5190903517083775, "percentage": 51.91, "elapsed_time": "22:02:20", "remaining_time": "20:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9314, "total_steps": 17941, "loss": 1.3961, "learning_rate": 4.828627022194596e-05, "epoch": 0.5191460899615407, "percentage": 51.91, "elapsed_time": "22:02:28", "remaining_time": "20:24:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9315, "total_steps": 17941, "loss": 1.6917, "learning_rate": 4.827737124451482e-05, "epoch": 0.5192018282147037, "percentage": 51.92, "elapsed_time": "22:02:38", "remaining_time": "20:24:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9316, "total_steps": 17941, "loss": 1.4865, "learning_rate": 4.8268472321715437e-05, "epoch": 0.5192575664678669, "percentage": 51.93, "elapsed_time": "22:02:46", "remaining_time": "20:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9317, "total_steps": 17941, "loss": 1.6661, "learning_rate": 4.825957345383e-05, "epoch": 0.51931330472103, "percentage": 51.93, "elapsed_time": "22:02:54", "remaining_time": "20:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9318, "total_steps": 17941, "loss": 1.8197, "learning_rate": 4.8250674641140763e-05, "epoch": 0.5193690429741932, "percentage": 51.94, "elapsed_time": "22:03:03", "remaining_time": "20:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9319, "total_steps": 17941, "loss": 1.6962, "learning_rate": 4.8241775883929914e-05, "epoch": 0.5194247812273564, "percentage": 51.94, "elapsed_time": "22:03:12", "remaining_time": "20:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9320, "total_steps": 17941, "loss": 1.7966, "learning_rate": 4.82328771824797e-05, "epoch": 0.5194805194805194, "percentage": 51.95, "elapsed_time": "22:03:20", "remaining_time": "20:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9321, "total_steps": 17941, "loss": 1.7016, "learning_rate": 4.822397853707228e-05, "epoch": 0.5195362577336826, "percentage": 51.95, "elapsed_time": "22:03:29", "remaining_time": "20:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9322, "total_steps": 17941, "loss": 1.4905, "learning_rate": 4.821507994798993e-05, "epoch": 0.5195919959868458, "percentage": 51.96, "elapsed_time": "22:03:38", "remaining_time": "20:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9323, "total_steps": 17941, "loss": 1.6682, "learning_rate": 4.820618141551485e-05, "epoch": 0.5196477342400089, "percentage": 51.96, "elapsed_time": "22:03:46", "remaining_time": "20:23:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9324, "total_steps": 17941, "loss": 1.6271, "learning_rate": 4.819728293992922e-05, "epoch": 0.5197034724931721, "percentage": 51.97, "elapsed_time": "22:03:54", "remaining_time": "20:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9325, "total_steps": 17941, "loss": 1.8624, "learning_rate": 4.8188384521515276e-05, "epoch": 0.5197592107463352, "percentage": 51.98, "elapsed_time": "22:04:03", "remaining_time": "20:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9326, "total_steps": 17941, "loss": 1.6311, "learning_rate": 4.817948616055521e-05, "epoch": 0.5198149489994983, "percentage": 51.98, "elapsed_time": "22:04:11", "remaining_time": "20:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9327, "total_steps": 17941, "loss": 1.706, "learning_rate": 4.817058785733123e-05, "epoch": 0.5198706872526615, "percentage": 51.99, "elapsed_time": "22:04:20", "remaining_time": "20:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9328, "total_steps": 17941, "loss": 1.5919, "learning_rate": 4.8161689612125524e-05, "epoch": 0.5199264255058247, "percentage": 51.99, "elapsed_time": "22:04:28", "remaining_time": "20:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9329, "total_steps": 17941, "loss": 1.6905, "learning_rate": 4.8152791425220304e-05, "epoch": 0.5199821637589878, "percentage": 52.0, "elapsed_time": "22:04:37", "remaining_time": "20:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9330, "total_steps": 17941, "loss": 1.6947, "learning_rate": 4.814389329689778e-05, "epoch": 0.5200379020121509, "percentage": 52.0, "elapsed_time": "22:04:45", "remaining_time": "20:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9331, "total_steps": 17941, "loss": 1.6495, "learning_rate": 4.8134995227440136e-05, "epoch": 0.5200936402653141, "percentage": 52.01, "elapsed_time": "22:04:54", "remaining_time": "20:22:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9332, "total_steps": 17941, "loss": 1.6507, "learning_rate": 4.8126097217129576e-05, "epoch": 0.5201493785184772, "percentage": 52.01, "elapsed_time": "22:05:02", "remaining_time": "20:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9333, "total_steps": 17941, "loss": 1.6496, "learning_rate": 4.811719926624828e-05, "epoch": 0.5202051167716404, "percentage": 52.02, "elapsed_time": "22:05:11", "remaining_time": "20:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9334, "total_steps": 17941, "loss": 1.7513, "learning_rate": 4.8108301375078445e-05, "epoch": 0.5202608550248036, "percentage": 52.03, "elapsed_time": "22:05:19", "remaining_time": "20:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9335, "total_steps": 17941, "loss": 1.5815, "learning_rate": 4.809940354390227e-05, "epoch": 0.5203165932779666, "percentage": 52.03, "elapsed_time": "22:05:28", "remaining_time": "20:21:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9336, "total_steps": 17941, "loss": 1.8808, "learning_rate": 4.809050577300191e-05, "epoch": 0.5203723315311298, "percentage": 52.04, "elapsed_time": "22:05:36", "remaining_time": "20:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9337, "total_steps": 17941, "loss": 1.5373, "learning_rate": 4.8081608062659614e-05, "epoch": 0.520428069784293, "percentage": 52.04, "elapsed_time": "22:05:44", "remaining_time": "20:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9338, "total_steps": 17941, "loss": 1.7677, "learning_rate": 4.807271041315749e-05, "epoch": 0.5204838080374561, "percentage": 52.05, "elapsed_time": "22:05:53", "remaining_time": "20:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9339, "total_steps": 17941, "loss": 1.7192, "learning_rate": 4.806381282477778e-05, "epoch": 0.5205395462906193, "percentage": 52.05, "elapsed_time": "22:06:02", "remaining_time": "20:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9340, "total_steps": 17941, "loss": 1.6621, "learning_rate": 4.8054915297802616e-05, "epoch": 0.5205952845437823, "percentage": 52.06, "elapsed_time": "22:06:10", "remaining_time": "20:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9341, "total_steps": 17941, "loss": 1.8134, "learning_rate": 4.8046017832514206e-05, "epoch": 0.5206510227969455, "percentage": 52.07, "elapsed_time": "22:06:19", "remaining_time": "20:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9342, "total_steps": 17941, "loss": 1.811, "learning_rate": 4.803712042919473e-05, "epoch": 0.5207067610501087, "percentage": 52.07, "elapsed_time": "22:06:27", "remaining_time": "20:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9343, "total_steps": 17941, "loss": 1.6691, "learning_rate": 4.8028223088126336e-05, "epoch": 0.5207624993032718, "percentage": 52.08, "elapsed_time": "22:06:35", "remaining_time": "20:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9344, "total_steps": 17941, "loss": 1.8073, "learning_rate": 4.8019325809591216e-05, "epoch": 0.520818237556435, "percentage": 52.08, "elapsed_time": "22:06:44", "remaining_time": "20:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9345, "total_steps": 17941, "loss": 1.5679, "learning_rate": 4.8010428593871517e-05, "epoch": 0.5208739758095982, "percentage": 52.09, "elapsed_time": "22:06:52", "remaining_time": "20:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9346, "total_steps": 17941, "loss": 1.4528, "learning_rate": 4.8001531441249457e-05, "epoch": 0.5209297140627612, "percentage": 52.09, "elapsed_time": "22:07:01", "remaining_time": "20:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9347, "total_steps": 17941, "loss": 1.5618, "learning_rate": 4.7992634352007125e-05, "epoch": 0.5209854523159244, "percentage": 52.1, "elapsed_time": "22:07:09", "remaining_time": "20:20:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9348, "total_steps": 17941, "loss": 1.7091, "learning_rate": 4.7983737326426746e-05, "epoch": 0.5210411905690876, "percentage": 52.1, "elapsed_time": "22:07:18", "remaining_time": "20:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9349, "total_steps": 17941, "loss": 1.7043, "learning_rate": 4.7974840364790476e-05, "epoch": 0.5210969288222507, "percentage": 52.11, "elapsed_time": "22:07:26", "remaining_time": "20:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9350, "total_steps": 17941, "loss": 1.5431, "learning_rate": 4.7965943467380446e-05, "epoch": 0.5211526670754139, "percentage": 52.12, "elapsed_time": "22:07:35", "remaining_time": "20:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9351, "total_steps": 17941, "loss": 1.5314, "learning_rate": 4.7957046634478846e-05, "epoch": 0.521208405328577, "percentage": 52.12, "elapsed_time": "22:07:43", "remaining_time": "20:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9352, "total_steps": 17941, "loss": 1.9862, "learning_rate": 4.7948149866367806e-05, "epoch": 0.5212641435817401, "percentage": 52.13, "elapsed_time": "22:07:52", "remaining_time": "20:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9353, "total_steps": 17941, "loss": 1.6921, "learning_rate": 4.7939253163329496e-05, "epoch": 0.5213198818349033, "percentage": 52.13, "elapsed_time": "22:08:00", "remaining_time": "20:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9354, "total_steps": 17941, "loss": 1.5896, "learning_rate": 4.7930356525646046e-05, "epoch": 0.5213756200880665, "percentage": 52.14, "elapsed_time": "22:08:09", "remaining_time": "20:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9355, "total_steps": 17941, "loss": 1.7059, "learning_rate": 4.792145995359962e-05, "epoch": 0.5214313583412296, "percentage": 52.14, "elapsed_time": "22:08:17", "remaining_time": "20:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9356, "total_steps": 17941, "loss": 1.5835, "learning_rate": 4.791256344747238e-05, "epoch": 0.5214870965943927, "percentage": 52.15, "elapsed_time": "22:08:26", "remaining_time": "20:18:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9357, "total_steps": 17941, "loss": 1.5472, "learning_rate": 4.790366700754644e-05, "epoch": 0.5215428348475559, "percentage": 52.15, "elapsed_time": "22:08:35", "remaining_time": "20:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9358, "total_steps": 17941, "loss": 1.7969, "learning_rate": 4.789477063410399e-05, "epoch": 0.521598573100719, "percentage": 52.16, "elapsed_time": "22:08:43", "remaining_time": "20:18:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9359, "total_steps": 17941, "loss": 1.6338, "learning_rate": 4.788587432742711e-05, "epoch": 0.5216543113538822, "percentage": 52.17, "elapsed_time": "22:08:52", "remaining_time": "20:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9360, "total_steps": 17941, "loss": 1.7335, "learning_rate": 4.787697808779798e-05, "epoch": 0.5217100496070454, "percentage": 52.17, "elapsed_time": "22:09:00", "remaining_time": "20:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9361, "total_steps": 17941, "loss": 1.9916, "learning_rate": 4.7868081915498734e-05, "epoch": 0.5217657878602084, "percentage": 52.18, "elapsed_time": "22:09:09", "remaining_time": "20:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9362, "total_steps": 17941, "loss": 1.6839, "learning_rate": 4.785918581081148e-05, "epoch": 0.5218215261133716, "percentage": 52.18, "elapsed_time": "22:09:17", "remaining_time": "20:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9363, "total_steps": 17941, "loss": 1.6613, "learning_rate": 4.7850289774018404e-05, "epoch": 0.5218772643665347, "percentage": 52.19, "elapsed_time": "22:09:26", "remaining_time": "20:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9364, "total_steps": 17941, "loss": 1.4462, "learning_rate": 4.784139380540157e-05, "epoch": 0.5219330026196979, "percentage": 52.19, "elapsed_time": "22:09:34", "remaining_time": "20:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9365, "total_steps": 17941, "loss": 1.826, "learning_rate": 4.7832497905243164e-05, "epoch": 0.5219887408728611, "percentage": 52.2, "elapsed_time": "22:09:43", "remaining_time": "20:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9366, "total_steps": 17941, "loss": 1.6403, "learning_rate": 4.782360207382527e-05, "epoch": 0.5220444791260241, "percentage": 52.2, "elapsed_time": "22:09:51", "remaining_time": "20:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9367, "total_steps": 17941, "loss": 1.6031, "learning_rate": 4.781470631143003e-05, "epoch": 0.5221002173791873, "percentage": 52.21, "elapsed_time": "22:10:00", "remaining_time": "20:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9368, "total_steps": 17941, "loss": 1.7744, "learning_rate": 4.780581061833958e-05, "epoch": 0.5221559556323505, "percentage": 52.22, "elapsed_time": "22:10:08", "remaining_time": "20:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9369, "total_steps": 17941, "loss": 1.7062, "learning_rate": 4.7796914994836003e-05, "epoch": 0.5222116938855136, "percentage": 52.22, "elapsed_time": "22:10:16", "remaining_time": "20:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9370, "total_steps": 17941, "loss": 1.6158, "learning_rate": 4.778801944120146e-05, "epoch": 0.5222674321386768, "percentage": 52.23, "elapsed_time": "22:10:25", "remaining_time": "20:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9371, "total_steps": 17941, "loss": 1.8501, "learning_rate": 4.7779123957718016e-05, "epoch": 0.52232317039184, "percentage": 52.23, "elapsed_time": "22:10:33", "remaining_time": "20:16:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9372, "total_steps": 17941, "loss": 1.677, "learning_rate": 4.777022854466784e-05, "epoch": 0.522378908645003, "percentage": 52.24, "elapsed_time": "22:10:42", "remaining_time": "20:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9373, "total_steps": 17941, "loss": 1.6819, "learning_rate": 4.7761333202332986e-05, "epoch": 0.5224346468981662, "percentage": 52.24, "elapsed_time": "22:10:50", "remaining_time": "20:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9374, "total_steps": 17941, "loss": 1.8114, "learning_rate": 4.7752437930995605e-05, "epoch": 0.5224903851513294, "percentage": 52.25, "elapsed_time": "22:11:00", "remaining_time": "20:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9375, "total_steps": 17941, "loss": 1.6216, "learning_rate": 4.7743542730937794e-05, "epoch": 0.5225461234044925, "percentage": 52.25, "elapsed_time": "22:11:08", "remaining_time": "20:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9376, "total_steps": 17941, "loss": 1.5714, "learning_rate": 4.7734647602441644e-05, "epoch": 0.5226018616576557, "percentage": 52.26, "elapsed_time": "22:11:17", "remaining_time": "20:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9377, "total_steps": 17941, "loss": 1.7383, "learning_rate": 4.7725752545789276e-05, "epoch": 0.5226575999108188, "percentage": 52.27, "elapsed_time": "22:11:25", "remaining_time": "20:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9378, "total_steps": 17941, "loss": 1.4746, "learning_rate": 4.771685756126276e-05, "epoch": 0.5227133381639819, "percentage": 52.27, "elapsed_time": "22:11:33", "remaining_time": "20:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9379, "total_steps": 17941, "loss": 1.762, "learning_rate": 4.7707962649144225e-05, "epoch": 0.5227690764171451, "percentage": 52.28, "elapsed_time": "22:11:42", "remaining_time": "20:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9380, "total_steps": 17941, "loss": 1.6694, "learning_rate": 4.769906780971575e-05, "epoch": 0.5228248146703083, "percentage": 52.28, "elapsed_time": "22:11:51", "remaining_time": "20:15:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9381, "total_steps": 17941, "loss": 1.6952, "learning_rate": 4.769017304325941e-05, "epoch": 0.5228805529234714, "percentage": 52.29, "elapsed_time": "22:12:00", "remaining_time": "20:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9382, "total_steps": 17941, "loss": 1.8446, "learning_rate": 4.768127835005733e-05, "epoch": 0.5229362911766345, "percentage": 52.29, "elapsed_time": "22:12:08", "remaining_time": "20:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9383, "total_steps": 17941, "loss": 1.5253, "learning_rate": 4.767238373039157e-05, "epoch": 0.5229920294297977, "percentage": 52.3, "elapsed_time": "22:12:17", "remaining_time": "20:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9384, "total_steps": 17941, "loss": 1.7674, "learning_rate": 4.7663489184544246e-05, "epoch": 0.5230477676829608, "percentage": 52.3, "elapsed_time": "22:12:25", "remaining_time": "20:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9385, "total_steps": 17941, "loss": 1.6636, "learning_rate": 4.7654594712797415e-05, "epoch": 0.523103505936124, "percentage": 52.31, "elapsed_time": "22:12:33", "remaining_time": "20:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9386, "total_steps": 17941, "loss": 1.6065, "learning_rate": 4.7645700315433155e-05, "epoch": 0.523159244189287, "percentage": 52.32, "elapsed_time": "22:12:42", "remaining_time": "20:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9387, "total_steps": 17941, "loss": 1.8092, "learning_rate": 4.763680599273357e-05, "epoch": 0.5232149824424502, "percentage": 52.32, "elapsed_time": "22:12:50", "remaining_time": "20:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9388, "total_steps": 17941, "loss": 1.5921, "learning_rate": 4.76279117449807e-05, "epoch": 0.5232707206956134, "percentage": 52.33, "elapsed_time": "22:12:59", "remaining_time": "20:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9389, "total_steps": 17941, "loss": 1.7831, "learning_rate": 4.761901757245667e-05, "epoch": 0.5233264589487765, "percentage": 52.33, "elapsed_time": "22:13:08", "remaining_time": "20:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9390, "total_steps": 17941, "loss": 1.7594, "learning_rate": 4.7610123475443486e-05, "epoch": 0.5233821972019397, "percentage": 52.34, "elapsed_time": "22:13:17", "remaining_time": "20:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9391, "total_steps": 17941, "loss": 1.635, "learning_rate": 4.7601229454223275e-05, "epoch": 0.5234379354551029, "percentage": 52.34, "elapsed_time": "22:13:25", "remaining_time": "20:14:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9392, "total_steps": 17941, "loss": 1.6621, "learning_rate": 4.759233550907807e-05, "epoch": 0.5234936737082659, "percentage": 52.35, "elapsed_time": "22:13:33", "remaining_time": "20:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9393, "total_steps": 17941, "loss": 1.6687, "learning_rate": 4.7583441640289946e-05, "epoch": 0.5235494119614291, "percentage": 52.35, "elapsed_time": "22:13:42", "remaining_time": "20:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9394, "total_steps": 17941, "loss": 1.7393, "learning_rate": 4.757454784814097e-05, "epoch": 0.5236051502145923, "percentage": 52.36, "elapsed_time": "22:13:50", "remaining_time": "20:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9395, "total_steps": 17941, "loss": 1.7908, "learning_rate": 4.756565413291318e-05, "epoch": 0.5236608884677554, "percentage": 52.37, "elapsed_time": "22:13:59", "remaining_time": "20:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9396, "total_steps": 17941, "loss": 1.6024, "learning_rate": 4.755676049488867e-05, "epoch": 0.5237166267209186, "percentage": 52.37, "elapsed_time": "22:14:07", "remaining_time": "20:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9397, "total_steps": 17941, "loss": 1.7352, "learning_rate": 4.7547866934349447e-05, "epoch": 0.5237723649740817, "percentage": 52.38, "elapsed_time": "22:14:16", "remaining_time": "20:13:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9398, "total_steps": 17941, "loss": 1.6196, "learning_rate": 4.753897345157762e-05, "epoch": 0.5238281032272448, "percentage": 52.38, "elapsed_time": "22:14:24", "remaining_time": "20:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9399, "total_steps": 17941, "loss": 1.5433, "learning_rate": 4.753008004685517e-05, "epoch": 0.523883841480408, "percentage": 52.39, "elapsed_time": "22:14:33", "remaining_time": "20:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9400, "total_steps": 17941, "loss": 1.4725, "learning_rate": 4.752118672046419e-05, "epoch": 0.5239395797335712, "percentage": 52.39, "elapsed_time": "22:14:41", "remaining_time": "20:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9401, "total_steps": 17941, "loss": 1.6878, "learning_rate": 4.751229347268673e-05, "epoch": 0.5239953179867343, "percentage": 52.4, "elapsed_time": "22:14:50", "remaining_time": "20:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9402, "total_steps": 17941, "loss": 1.4368, "learning_rate": 4.750340030380481e-05, "epoch": 0.5240510562398975, "percentage": 52.41, "elapsed_time": "22:14:58", "remaining_time": "20:12:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9403, "total_steps": 17941, "loss": 1.8745, "learning_rate": 4.749450721410048e-05, "epoch": 0.5241067944930606, "percentage": 52.41, "elapsed_time": "22:15:07", "remaining_time": "20:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9404, "total_steps": 17941, "loss": 1.8433, "learning_rate": 4.748561420385577e-05, "epoch": 0.5241625327462237, "percentage": 52.42, "elapsed_time": "22:15:15", "remaining_time": "20:12:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9405, "total_steps": 17941, "loss": 1.6408, "learning_rate": 4.747672127335272e-05, "epoch": 0.5242182709993869, "percentage": 52.42, "elapsed_time": "22:15:23", "remaining_time": "20:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9406, "total_steps": 17941, "loss": 1.74, "learning_rate": 4.746782842287335e-05, "epoch": 0.5242740092525501, "percentage": 52.43, "elapsed_time": "22:15:32", "remaining_time": "20:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9407, "total_steps": 17941, "loss": 1.7131, "learning_rate": 4.7458935652699686e-05, "epoch": 0.5243297475057132, "percentage": 52.43, "elapsed_time": "22:15:41", "remaining_time": "20:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9408, "total_steps": 17941, "loss": 1.6917, "learning_rate": 4.7450042963113794e-05, "epoch": 0.5243854857588763, "percentage": 52.44, "elapsed_time": "22:15:49", "remaining_time": "20:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9409, "total_steps": 17941, "loss": 1.5985, "learning_rate": 4.744115035439766e-05, "epoch": 0.5244412240120394, "percentage": 52.44, "elapsed_time": "22:15:58", "remaining_time": "20:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9410, "total_steps": 17941, "loss": 1.3233, "learning_rate": 4.743225782683333e-05, "epoch": 0.5244969622652026, "percentage": 52.45, "elapsed_time": "22:16:06", "remaining_time": "20:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9411, "total_steps": 17941, "loss": 1.7022, "learning_rate": 4.74233653807028e-05, "epoch": 0.5245527005183658, "percentage": 52.46, "elapsed_time": "22:16:14", "remaining_time": "20:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9412, "total_steps": 17941, "loss": 1.5126, "learning_rate": 4.7414473016288096e-05, "epoch": 0.5246084387715289, "percentage": 52.46, "elapsed_time": "22:16:23", "remaining_time": "20:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9413, "total_steps": 17941, "loss": 1.736, "learning_rate": 4.740558073387124e-05, "epoch": 0.524664177024692, "percentage": 52.47, "elapsed_time": "22:16:32", "remaining_time": "20:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9414, "total_steps": 17941, "loss": 1.7664, "learning_rate": 4.7396688533734224e-05, "epoch": 0.5247199152778552, "percentage": 52.47, "elapsed_time": "22:16:40", "remaining_time": "20:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9415, "total_steps": 17941, "loss": 1.6379, "learning_rate": 4.7387796416159094e-05, "epoch": 0.5247756535310183, "percentage": 52.48, "elapsed_time": "22:16:49", "remaining_time": "20:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9416, "total_steps": 17941, "loss": 1.6248, "learning_rate": 4.7378904381427805e-05, "epoch": 0.5248313917841815, "percentage": 52.48, "elapsed_time": "22:16:57", "remaining_time": "20:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9417, "total_steps": 17941, "loss": 1.8269, "learning_rate": 4.7370012429822405e-05, "epoch": 0.5248871300373447, "percentage": 52.49, "elapsed_time": "22:17:05", "remaining_time": "20:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9418, "total_steps": 17941, "loss": 1.6686, "learning_rate": 4.736112056162486e-05, "epoch": 0.5249428682905077, "percentage": 52.49, "elapsed_time": "22:17:14", "remaining_time": "20:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9419, "total_steps": 17941, "loss": 1.6043, "learning_rate": 4.7352228777117195e-05, "epoch": 0.5249986065436709, "percentage": 52.5, "elapsed_time": "22:17:22", "remaining_time": "20:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9420, "total_steps": 17941, "loss": 1.3681, "learning_rate": 4.73433370765814e-05, "epoch": 0.5250543447968341, "percentage": 52.51, "elapsed_time": "22:17:31", "remaining_time": "20:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9421, "total_steps": 17941, "loss": 1.8752, "learning_rate": 4.733444546029946e-05, "epoch": 0.5251100830499972, "percentage": 52.51, "elapsed_time": "22:17:39", "remaining_time": "20:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9422, "total_steps": 17941, "loss": 1.6649, "learning_rate": 4.7325553928553375e-05, "epoch": 0.5251658213031604, "percentage": 52.52, "elapsed_time": "22:17:48", "remaining_time": "20:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9423, "total_steps": 17941, "loss": 0.7808, "learning_rate": 4.73166624816251e-05, "epoch": 0.5252215595563235, "percentage": 52.52, "elapsed_time": "22:17:56", "remaining_time": "20:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9424, "total_steps": 17941, "loss": 1.9264, "learning_rate": 4.7307771119796685e-05, "epoch": 0.5252772978094866, "percentage": 52.53, "elapsed_time": "22:18:05", "remaining_time": "20:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9425, "total_steps": 17941, "loss": 1.4697, "learning_rate": 4.729887984335004e-05, "epoch": 0.5253330360626498, "percentage": 52.53, "elapsed_time": "22:18:13", "remaining_time": "20:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9426, "total_steps": 17941, "loss": 1.7123, "learning_rate": 4.728998865256718e-05, "epoch": 0.525388774315813, "percentage": 52.54, "elapsed_time": "22:18:21", "remaining_time": "20:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9427, "total_steps": 17941, "loss": 1.6069, "learning_rate": 4.728109754773011e-05, "epoch": 0.5254445125689761, "percentage": 52.54, "elapsed_time": "22:18:30", "remaining_time": "20:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9428, "total_steps": 17941, "loss": 1.5449, "learning_rate": 4.727220652912074e-05, "epoch": 0.5255002508221392, "percentage": 52.55, "elapsed_time": "22:18:38", "remaining_time": "20:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9429, "total_steps": 17941, "loss": 1.3929, "learning_rate": 4.72633155970211e-05, "epoch": 0.5255559890753024, "percentage": 52.56, "elapsed_time": "22:18:47", "remaining_time": "20:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9430, "total_steps": 17941, "loss": 1.5311, "learning_rate": 4.725442475171312e-05, "epoch": 0.5256117273284655, "percentage": 52.56, "elapsed_time": "22:18:55", "remaining_time": "20:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9431, "total_steps": 17941, "loss": 1.8386, "learning_rate": 4.724553399347879e-05, "epoch": 0.5256674655816287, "percentage": 52.57, "elapsed_time": "22:19:04", "remaining_time": "20:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9432, "total_steps": 17941, "loss": 1.4743, "learning_rate": 4.723664332260004e-05, "epoch": 0.5257232038347918, "percentage": 52.57, "elapsed_time": "22:19:12", "remaining_time": "20:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9433, "total_steps": 17941, "loss": 1.5645, "learning_rate": 4.722775273935886e-05, "epoch": 0.525778942087955, "percentage": 52.58, "elapsed_time": "22:19:21", "remaining_time": "20:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9434, "total_steps": 17941, "loss": 1.8844, "learning_rate": 4.721886224403722e-05, "epoch": 0.5258346803411181, "percentage": 52.58, "elapsed_time": "22:19:30", "remaining_time": "20:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9435, "total_steps": 17941, "loss": 1.6094, "learning_rate": 4.720997183691703e-05, "epoch": 0.5258904185942812, "percentage": 52.59, "elapsed_time": "22:19:38", "remaining_time": "20:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9436, "total_steps": 17941, "loss": 1.6859, "learning_rate": 4.720108151828028e-05, "epoch": 0.5259461568474444, "percentage": 52.59, "elapsed_time": "22:19:46", "remaining_time": "20:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9437, "total_steps": 17941, "loss": 1.8112, "learning_rate": 4.71921912884089e-05, "epoch": 0.5260018951006076, "percentage": 52.6, "elapsed_time": "22:19:55", "remaining_time": "20:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9438, "total_steps": 17941, "loss": 1.783, "learning_rate": 4.7183301147584854e-05, "epoch": 0.5260576333537706, "percentage": 52.61, "elapsed_time": "22:20:03", "remaining_time": "20:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9439, "total_steps": 17941, "loss": 1.5162, "learning_rate": 4.717441109609006e-05, "epoch": 0.5261133716069338, "percentage": 52.61, "elapsed_time": "22:20:12", "remaining_time": "20:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9440, "total_steps": 17941, "loss": 1.5676, "learning_rate": 4.716552113420646e-05, "epoch": 0.526169109860097, "percentage": 52.62, "elapsed_time": "22:20:20", "remaining_time": "20:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9441, "total_steps": 17941, "loss": 1.812, "learning_rate": 4.715663126221603e-05, "epoch": 0.5262248481132601, "percentage": 52.62, "elapsed_time": "22:20:29", "remaining_time": "20:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9442, "total_steps": 17941, "loss": 1.8001, "learning_rate": 4.714774148040065e-05, "epoch": 0.5262805863664233, "percentage": 52.63, "elapsed_time": "22:20:37", "remaining_time": "20:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9443, "total_steps": 17941, "loss": 1.8504, "learning_rate": 4.713885178904231e-05, "epoch": 0.5263363246195865, "percentage": 52.63, "elapsed_time": "22:20:46", "remaining_time": "20:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9444, "total_steps": 17941, "loss": 1.7862, "learning_rate": 4.7129962188422886e-05, "epoch": 0.5263920628727495, "percentage": 52.64, "elapsed_time": "22:20:54", "remaining_time": "20:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9445, "total_steps": 17941, "loss": 1.6889, "learning_rate": 4.712107267882434e-05, "epoch": 0.5264478011259127, "percentage": 52.64, "elapsed_time": "22:21:03", "remaining_time": "20:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9446, "total_steps": 17941, "loss": 1.4817, "learning_rate": 4.7112183260528584e-05, "epoch": 0.5265035393790759, "percentage": 52.65, "elapsed_time": "22:21:12", "remaining_time": "20:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9447, "total_steps": 17941, "loss": 1.7066, "learning_rate": 4.710329393381753e-05, "epoch": 0.526559277632239, "percentage": 52.66, "elapsed_time": "22:21:20", "remaining_time": "20:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9448, "total_steps": 17941, "loss": 1.4955, "learning_rate": 4.709440469897312e-05, "epoch": 0.5266150158854022, "percentage": 52.66, "elapsed_time": "22:21:29", "remaining_time": "20:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9449, "total_steps": 17941, "loss": 1.6005, "learning_rate": 4.708551555627723e-05, "epoch": 0.5266707541385653, "percentage": 52.67, "elapsed_time": "22:21:37", "remaining_time": "20:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9450, "total_steps": 17941, "loss": 1.6138, "learning_rate": 4.707662650601182e-05, "epoch": 0.5267264923917284, "percentage": 52.67, "elapsed_time": "22:21:46", "remaining_time": "20:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9451, "total_steps": 17941, "loss": 1.8049, "learning_rate": 4.706773754845874e-05, "epoch": 0.5267822306448916, "percentage": 52.68, "elapsed_time": "22:21:54", "remaining_time": "20:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9452, "total_steps": 17941, "loss": 1.4986, "learning_rate": 4.705884868389994e-05, "epoch": 0.5268379688980548, "percentage": 52.68, "elapsed_time": "22:22:03", "remaining_time": "20:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9453, "total_steps": 17941, "loss": 1.6794, "learning_rate": 4.704995991261733e-05, "epoch": 0.5268937071512179, "percentage": 52.69, "elapsed_time": "22:22:12", "remaining_time": "20:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9454, "total_steps": 17941, "loss": 1.544, "learning_rate": 4.704107123489277e-05, "epoch": 0.526949445404381, "percentage": 52.69, "elapsed_time": "22:22:20", "remaining_time": "20:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9455, "total_steps": 17941, "loss": 1.556, "learning_rate": 4.70321826510082e-05, "epoch": 0.5270051836575441, "percentage": 52.7, "elapsed_time": "22:22:29", "remaining_time": "20:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9456, "total_steps": 17941, "loss": 1.5109, "learning_rate": 4.702329416124548e-05, "epoch": 0.5270609219107073, "percentage": 52.71, "elapsed_time": "22:22:38", "remaining_time": "20:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9457, "total_steps": 17941, "loss": 1.6984, "learning_rate": 4.701440576588652e-05, "epoch": 0.5271166601638705, "percentage": 52.71, "elapsed_time": "22:22:46", "remaining_time": "20:04:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9458, "total_steps": 17941, "loss": 1.6543, "learning_rate": 4.700551746521318e-05, "epoch": 0.5271723984170336, "percentage": 52.72, "elapsed_time": "22:22:54", "remaining_time": "20:04:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9459, "total_steps": 17941, "loss": 1.5402, "learning_rate": 4.699662925950738e-05, "epoch": 0.5272281366701967, "percentage": 52.72, "elapsed_time": "22:23:03", "remaining_time": "20:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9460, "total_steps": 17941, "loss": 1.6698, "learning_rate": 4.6987741149051e-05, "epoch": 0.5272838749233599, "percentage": 52.73, "elapsed_time": "22:23:11", "remaining_time": "20:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9461, "total_steps": 17941, "loss": 1.7072, "learning_rate": 4.69788531341259e-05, "epoch": 0.527339613176523, "percentage": 52.73, "elapsed_time": "22:23:20", "remaining_time": "20:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9462, "total_steps": 17941, "loss": 1.443, "learning_rate": 4.6969965215013964e-05, "epoch": 0.5273953514296862, "percentage": 52.74, "elapsed_time": "22:23:28", "remaining_time": "20:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9463, "total_steps": 17941, "loss": 1.498, "learning_rate": 4.696107739199707e-05, "epoch": 0.5274510896828494, "percentage": 52.75, "elapsed_time": "22:23:37", "remaining_time": "20:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9464, "total_steps": 17941, "loss": 1.7932, "learning_rate": 4.695218966535708e-05, "epoch": 0.5275068279360124, "percentage": 52.75, "elapsed_time": "22:23:45", "remaining_time": "20:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9465, "total_steps": 17941, "loss": 1.5405, "learning_rate": 4.6943302035375864e-05, "epoch": 0.5275625661891756, "percentage": 52.76, "elapsed_time": "22:23:54", "remaining_time": "20:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9466, "total_steps": 17941, "loss": 1.6725, "learning_rate": 4.693441450233527e-05, "epoch": 0.5276183044423388, "percentage": 52.76, "elapsed_time": "22:24:02", "remaining_time": "20:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9467, "total_steps": 17941, "loss": 1.7555, "learning_rate": 4.69255270665172e-05, "epoch": 0.5276740426955019, "percentage": 52.77, "elapsed_time": "22:24:10", "remaining_time": "20:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9468, "total_steps": 17941, "loss": 1.5811, "learning_rate": 4.6916639728203465e-05, "epoch": 0.5277297809486651, "percentage": 52.77, "elapsed_time": "22:24:19", "remaining_time": "20:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9469, "total_steps": 17941, "loss": 1.7571, "learning_rate": 4.6907752487675954e-05, "epoch": 0.5277855192018283, "percentage": 52.78, "elapsed_time": "22:24:27", "remaining_time": "20:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9470, "total_steps": 17941, "loss": 1.8604, "learning_rate": 4.68988653452165e-05, "epoch": 0.5278412574549913, "percentage": 52.78, "elapsed_time": "22:24:36", "remaining_time": "20:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9471, "total_steps": 17941, "loss": 1.7073, "learning_rate": 4.688997830110695e-05, "epoch": 0.5278969957081545, "percentage": 52.79, "elapsed_time": "22:24:44", "remaining_time": "20:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9472, "total_steps": 17941, "loss": 1.8051, "learning_rate": 4.688109135562918e-05, "epoch": 0.5279527339613177, "percentage": 52.8, "elapsed_time": "22:24:53", "remaining_time": "20:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9473, "total_steps": 17941, "loss": 1.4152, "learning_rate": 4.6872204509064984e-05, "epoch": 0.5280084722144808, "percentage": 52.8, "elapsed_time": "22:25:01", "remaining_time": "20:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9474, "total_steps": 17941, "loss": 1.8541, "learning_rate": 4.686331776169624e-05, "epoch": 0.528064210467644, "percentage": 52.81, "elapsed_time": "22:25:10", "remaining_time": "20:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9475, "total_steps": 17941, "loss": 1.5225, "learning_rate": 4.685443111380474e-05, "epoch": 0.5281199487208071, "percentage": 52.81, "elapsed_time": "22:25:18", "remaining_time": "20:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9476, "total_steps": 17941, "loss": 1.8114, "learning_rate": 4.6845544565672385e-05, "epoch": 0.5281756869739702, "percentage": 52.82, "elapsed_time": "22:25:26", "remaining_time": "20:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9477, "total_steps": 17941, "loss": 1.698, "learning_rate": 4.683665811758093e-05, "epoch": 0.5282314252271334, "percentage": 52.82, "elapsed_time": "22:25:35", "remaining_time": "20:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9478, "total_steps": 17941, "loss": 1.9423, "learning_rate": 4.6827771769812247e-05, "epoch": 0.5282871634802965, "percentage": 52.83, "elapsed_time": "22:25:43", "remaining_time": "20:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9479, "total_steps": 17941, "loss": 1.8993, "learning_rate": 4.681888552264816e-05, "epoch": 0.5283429017334597, "percentage": 52.83, "elapsed_time": "22:25:52", "remaining_time": "20:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9480, "total_steps": 17941, "loss": 1.4992, "learning_rate": 4.680999937637047e-05, "epoch": 0.5283986399866228, "percentage": 52.84, "elapsed_time": "22:26:00", "remaining_time": "20:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9481, "total_steps": 17941, "loss": 1.469, "learning_rate": 4.6801113331261e-05, "epoch": 0.5284543782397859, "percentage": 52.85, "elapsed_time": "22:26:09", "remaining_time": "20:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9482, "total_steps": 17941, "loss": 1.5147, "learning_rate": 4.679222738760156e-05, "epoch": 0.5285101164929491, "percentage": 52.85, "elapsed_time": "22:26:17", "remaining_time": "20:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9483, "total_steps": 17941, "loss": 1.7303, "learning_rate": 4.6783341545673975e-05, "epoch": 0.5285658547461123, "percentage": 52.86, "elapsed_time": "22:26:26", "remaining_time": "20:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9484, "total_steps": 17941, "loss": 1.4783, "learning_rate": 4.677445580576003e-05, "epoch": 0.5286215929992754, "percentage": 52.86, "elapsed_time": "22:26:34", "remaining_time": "20:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9485, "total_steps": 17941, "loss": 1.6925, "learning_rate": 4.676557016814154e-05, "epoch": 0.5286773312524385, "percentage": 52.87, "elapsed_time": "22:26:43", "remaining_time": "20:00:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9486, "total_steps": 17941, "loss": 1.562, "learning_rate": 4.675668463310032e-05, "epoch": 0.5287330695056017, "percentage": 52.87, "elapsed_time": "22:26:51", "remaining_time": "20:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9487, "total_steps": 17941, "loss": 1.8974, "learning_rate": 4.674779920091814e-05, "epoch": 0.5287888077587648, "percentage": 52.88, "elapsed_time": "22:26:59", "remaining_time": "20:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9488, "total_steps": 17941, "loss": 1.6163, "learning_rate": 4.673891387187682e-05, "epoch": 0.528844546011928, "percentage": 52.88, "elapsed_time": "22:27:08", "remaining_time": "20:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9489, "total_steps": 17941, "loss": 1.7773, "learning_rate": 4.673002864625813e-05, "epoch": 0.5289002842650912, "percentage": 52.89, "elapsed_time": "22:27:16", "remaining_time": "20:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9490, "total_steps": 17941, "loss": 1.6477, "learning_rate": 4.6721143524343874e-05, "epoch": 0.5289560225182542, "percentage": 52.9, "elapsed_time": "22:27:25", "remaining_time": "19:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9491, "total_steps": 17941, "loss": 1.3446, "learning_rate": 4.671225850641582e-05, "epoch": 0.5290117607714174, "percentage": 52.9, "elapsed_time": "22:27:33", "remaining_time": "19:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9492, "total_steps": 17941, "loss": 1.864, "learning_rate": 4.670337359275574e-05, "epoch": 0.5290674990245806, "percentage": 52.91, "elapsed_time": "22:27:42", "remaining_time": "19:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9493, "total_steps": 17941, "loss": 1.9024, "learning_rate": 4.6694488783645466e-05, "epoch": 0.5291232372777437, "percentage": 52.91, "elapsed_time": "22:27:50", "remaining_time": "19:59:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9494, "total_steps": 17941, "loss": 1.7019, "learning_rate": 4.6685604079366706e-05, "epoch": 0.5291789755309069, "percentage": 52.92, "elapsed_time": "22:27:59", "remaining_time": "19:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9495, "total_steps": 17941, "loss": 1.545, "learning_rate": 4.667671948020128e-05, "epoch": 0.52923471378407, "percentage": 52.92, "elapsed_time": "22:28:07", "remaining_time": "19:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9496, "total_steps": 17941, "loss": 1.4809, "learning_rate": 4.666783498643093e-05, "epoch": 0.5292904520372331, "percentage": 52.93, "elapsed_time": "22:28:15", "remaining_time": "19:59:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9497, "total_steps": 17941, "loss": 1.3123, "learning_rate": 4.665895059833741e-05, "epoch": 0.5293461902903963, "percentage": 52.93, "elapsed_time": "22:28:24", "remaining_time": "19:58:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9498, "total_steps": 17941, "loss": 1.5795, "learning_rate": 4.6650066316202525e-05, "epoch": 0.5294019285435595, "percentage": 52.94, "elapsed_time": "22:28:32", "remaining_time": "19:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9499, "total_steps": 17941, "loss": 1.7409, "learning_rate": 4.6641182140307986e-05, "epoch": 0.5294576667967226, "percentage": 52.95, "elapsed_time": "22:28:41", "remaining_time": "19:58:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9500, "total_steps": 17941, "loss": 1.5922, "learning_rate": 4.663229807093558e-05, "epoch": 0.5295134050498858, "percentage": 52.95, "elapsed_time": "22:28:49", "remaining_time": "19:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9501, "total_steps": 17941, "loss": 1.6494, "learning_rate": 4.662341410836703e-05, "epoch": 0.5295691433030488, "percentage": 52.96, "elapsed_time": "22:28:58", "remaining_time": "19:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9502, "total_steps": 17941, "loss": 1.5342, "learning_rate": 4.661453025288411e-05, "epoch": 0.529624881556212, "percentage": 52.96, "elapsed_time": "22:29:06", "remaining_time": "19:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9503, "total_steps": 17941, "loss": 1.6725, "learning_rate": 4.660564650476854e-05, "epoch": 0.5296806198093752, "percentage": 52.97, "elapsed_time": "22:29:15", "remaining_time": "19:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9504, "total_steps": 17941, "loss": 1.9948, "learning_rate": 4.6596762864302076e-05, "epoch": 0.5297363580625383, "percentage": 52.97, "elapsed_time": "22:29:23", "remaining_time": "19:57:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9505, "total_steps": 17941, "loss": 1.4934, "learning_rate": 4.658787933176646e-05, "epoch": 0.5297920963157015, "percentage": 52.98, "elapsed_time": "22:29:31", "remaining_time": "19:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9506, "total_steps": 17941, "loss": 1.627, "learning_rate": 4.657899590744341e-05, "epoch": 0.5298478345688646, "percentage": 52.98, "elapsed_time": "22:29:40", "remaining_time": "19:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9507, "total_steps": 17941, "loss": 1.5898, "learning_rate": 4.6570112591614664e-05, "epoch": 0.5299035728220277, "percentage": 52.99, "elapsed_time": "22:29:48", "remaining_time": "19:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9508, "total_steps": 17941, "loss": 1.4714, "learning_rate": 4.656122938456195e-05, "epoch": 0.5299593110751909, "percentage": 53.0, "elapsed_time": "22:29:57", "remaining_time": "19:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9509, "total_steps": 17941, "loss": 1.6165, "learning_rate": 4.6552346286567e-05, "epoch": 0.5300150493283541, "percentage": 53.0, "elapsed_time": "22:30:05", "remaining_time": "19:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9510, "total_steps": 17941, "loss": 1.8067, "learning_rate": 4.65434632979115e-05, "epoch": 0.5300707875815172, "percentage": 53.01, "elapsed_time": "22:30:14", "remaining_time": "19:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9511, "total_steps": 17941, "loss": 1.5718, "learning_rate": 4.6534580418877205e-05, "epoch": 0.5301265258346803, "percentage": 53.01, "elapsed_time": "22:30:23", "remaining_time": "19:56:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9512, "total_steps": 17941, "loss": 1.5877, "learning_rate": 4.652569764974582e-05, "epoch": 0.5301822640878435, "percentage": 53.02, "elapsed_time": "22:30:31", "remaining_time": "19:56:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9513, "total_steps": 17941, "loss": 1.7207, "learning_rate": 4.651681499079904e-05, "epoch": 0.5302380023410066, "percentage": 53.02, "elapsed_time": "22:30:39", "remaining_time": "19:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9514, "total_steps": 17941, "loss": 1.1782, "learning_rate": 4.6507932442318596e-05, "epoch": 0.5302937405941698, "percentage": 53.03, "elapsed_time": "22:30:48", "remaining_time": "19:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9515, "total_steps": 17941, "loss": 1.2772, "learning_rate": 4.649905000458616e-05, "epoch": 0.530349478847333, "percentage": 53.03, "elapsed_time": "22:30:56", "remaining_time": "19:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9516, "total_steps": 17941, "loss": 1.6083, "learning_rate": 4.6490167677883457e-05, "epoch": 0.530405217100496, "percentage": 53.04, "elapsed_time": "22:31:05", "remaining_time": "19:56:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9517, "total_steps": 17941, "loss": 1.687, "learning_rate": 4.648128546249216e-05, "epoch": 0.5304609553536592, "percentage": 53.05, "elapsed_time": "22:31:13", "remaining_time": "19:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9518, "total_steps": 17941, "loss": 1.5031, "learning_rate": 4.6472403358693964e-05, "epoch": 0.5305166936068224, "percentage": 53.05, "elapsed_time": "22:31:22", "remaining_time": "19:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9519, "total_steps": 17941, "loss": 1.7177, "learning_rate": 4.646352136677058e-05, "epoch": 0.5305724318599855, "percentage": 53.06, "elapsed_time": "22:31:30", "remaining_time": "19:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9520, "total_steps": 17941, "loss": 1.4941, "learning_rate": 4.645463948700368e-05, "epoch": 0.5306281701131487, "percentage": 53.06, "elapsed_time": "22:31:38", "remaining_time": "19:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9521, "total_steps": 17941, "loss": 1.5097, "learning_rate": 4.644575771967495e-05, "epoch": 0.5306839083663119, "percentage": 53.07, "elapsed_time": "22:31:47", "remaining_time": "19:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9522, "total_steps": 17941, "loss": 1.6904, "learning_rate": 4.6436876065066046e-05, "epoch": 0.5307396466194749, "percentage": 53.07, "elapsed_time": "22:31:55", "remaining_time": "19:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9523, "total_steps": 17941, "loss": 1.7481, "learning_rate": 4.642799452345867e-05, "epoch": 0.5307953848726381, "percentage": 53.08, "elapsed_time": "22:32:04", "remaining_time": "19:55:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9524, "total_steps": 17941, "loss": 1.8227, "learning_rate": 4.6419113095134485e-05, "epoch": 0.5308511231258012, "percentage": 53.09, "elapsed_time": "22:32:12", "remaining_time": "19:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9525, "total_steps": 17941, "loss": 1.5991, "learning_rate": 4.641023178037514e-05, "epoch": 0.5309068613789644, "percentage": 53.09, "elapsed_time": "22:32:21", "remaining_time": "19:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9526, "total_steps": 17941, "loss": 1.7392, "learning_rate": 4.6401350579462337e-05, "epoch": 0.5309625996321276, "percentage": 53.1, "elapsed_time": "22:32:29", "remaining_time": "19:54:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9527, "total_steps": 17941, "loss": 1.9319, "learning_rate": 4.6392469492677685e-05, "epoch": 0.5310183378852906, "percentage": 53.1, "elapsed_time": "22:32:38", "remaining_time": "19:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9528, "total_steps": 17941, "loss": 1.4941, "learning_rate": 4.63835885203029e-05, "epoch": 0.5310740761384538, "percentage": 53.11, "elapsed_time": "22:32:46", "remaining_time": "19:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9529, "total_steps": 17941, "loss": 1.8894, "learning_rate": 4.637470766261956e-05, "epoch": 0.531129814391617, "percentage": 53.11, "elapsed_time": "22:32:55", "remaining_time": "19:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9530, "total_steps": 17941, "loss": 1.5257, "learning_rate": 4.636582691990937e-05, "epoch": 0.5311855526447801, "percentage": 53.12, "elapsed_time": "22:33:03", "remaining_time": "19:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9531, "total_steps": 17941, "loss": 1.6217, "learning_rate": 4.6356946292453984e-05, "epoch": 0.5312412908979433, "percentage": 53.12, "elapsed_time": "22:33:12", "remaining_time": "19:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9532, "total_steps": 17941, "loss": 1.4773, "learning_rate": 4.6348065780535e-05, "epoch": 0.5312970291511064, "percentage": 53.13, "elapsed_time": "22:33:21", "remaining_time": "19:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9533, "total_steps": 17941, "loss": 1.5962, "learning_rate": 4.633918538443409e-05, "epoch": 0.5313527674042695, "percentage": 53.14, "elapsed_time": "22:33:29", "remaining_time": "19:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9534, "total_steps": 17941, "loss": 1.9244, "learning_rate": 4.633030510443287e-05, "epoch": 0.5314085056574327, "percentage": 53.14, "elapsed_time": "22:33:38", "remaining_time": "19:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9535, "total_steps": 17941, "loss": 1.5354, "learning_rate": 4.632142494081298e-05, "epoch": 0.5314642439105959, "percentage": 53.15, "elapsed_time": "22:33:46", "remaining_time": "19:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9536, "total_steps": 17941, "loss": 1.7756, "learning_rate": 4.631254489385602e-05, "epoch": 0.531519982163759, "percentage": 53.15, "elapsed_time": "22:33:54", "remaining_time": "19:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9537, "total_steps": 17941, "loss": 1.7578, "learning_rate": 4.630366496384365e-05, "epoch": 0.5315757204169221, "percentage": 53.16, "elapsed_time": "22:34:03", "remaining_time": "19:53:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9538, "total_steps": 17941, "loss": 1.8384, "learning_rate": 4.629478515105749e-05, "epoch": 0.5316314586700853, "percentage": 53.16, "elapsed_time": "22:34:11", "remaining_time": "19:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9539, "total_steps": 17941, "loss": 1.7661, "learning_rate": 4.6285905455779136e-05, "epoch": 0.5316871969232484, "percentage": 53.17, "elapsed_time": "22:34:20", "remaining_time": "19:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9540, "total_steps": 17941, "loss": 1.965, "learning_rate": 4.6277025878290204e-05, "epoch": 0.5317429351764116, "percentage": 53.17, "elapsed_time": "22:34:28", "remaining_time": "19:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9541, "total_steps": 17941, "loss": 1.7107, "learning_rate": 4.6268146418872305e-05, "epoch": 0.5317986734295748, "percentage": 53.18, "elapsed_time": "22:34:37", "remaining_time": "19:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9542, "total_steps": 17941, "loss": 1.7749, "learning_rate": 4.625926707780705e-05, "epoch": 0.5318544116827378, "percentage": 53.19, "elapsed_time": "22:34:46", "remaining_time": "19:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9543, "total_steps": 17941, "loss": 1.6059, "learning_rate": 4.625038785537602e-05, "epoch": 0.531910149935901, "percentage": 53.19, "elapsed_time": "22:34:55", "remaining_time": "19:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9544, "total_steps": 17941, "loss": 1.8484, "learning_rate": 4.6241508751860816e-05, "epoch": 0.5319658881890642, "percentage": 53.2, "elapsed_time": "22:35:04", "remaining_time": "19:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9545, "total_steps": 17941, "loss": 1.6221, "learning_rate": 4.623262976754307e-05, "epoch": 0.5320216264422273, "percentage": 53.2, "elapsed_time": "22:35:13", "remaining_time": "19:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9546, "total_steps": 17941, "loss": 1.6821, "learning_rate": 4.622375090270432e-05, "epoch": 0.5320773646953905, "percentage": 53.21, "elapsed_time": "22:35:22", "remaining_time": "19:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9547, "total_steps": 17941, "loss": 1.8067, "learning_rate": 4.621487215762619e-05, "epoch": 0.5321331029485535, "percentage": 53.21, "elapsed_time": "22:35:30", "remaining_time": "19:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9548, "total_steps": 17941, "loss": 1.4202, "learning_rate": 4.620599353259023e-05, "epoch": 0.5321888412017167, "percentage": 53.22, "elapsed_time": "22:35:39", "remaining_time": "19:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9549, "total_steps": 17941, "loss": 1.832, "learning_rate": 4.619711502787805e-05, "epoch": 0.5322445794548799, "percentage": 53.22, "elapsed_time": "22:35:47", "remaining_time": "19:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9550, "total_steps": 17941, "loss": 1.6861, "learning_rate": 4.618823664377121e-05, "epoch": 0.532300317708043, "percentage": 53.23, "elapsed_time": "22:35:56", "remaining_time": "19:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9551, "total_steps": 17941, "loss": 1.6477, "learning_rate": 4.6179358380551255e-05, "epoch": 0.5323560559612062, "percentage": 53.24, "elapsed_time": "22:36:04", "remaining_time": "19:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9552, "total_steps": 17941, "loss": 1.8258, "learning_rate": 4.617048023849981e-05, "epoch": 0.5324117942143693, "percentage": 53.24, "elapsed_time": "22:36:12", "remaining_time": "19:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9553, "total_steps": 17941, "loss": 2.1279, "learning_rate": 4.616160221789837e-05, "epoch": 0.5324675324675324, "percentage": 53.25, "elapsed_time": "22:36:22", "remaining_time": "19:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9554, "total_steps": 17941, "loss": 1.8833, "learning_rate": 4.615272431902857e-05, "epoch": 0.5325232707206956, "percentage": 53.25, "elapsed_time": "22:36:30", "remaining_time": "19:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9555, "total_steps": 17941, "loss": 1.5675, "learning_rate": 4.614384654217189e-05, "epoch": 0.5325790089738588, "percentage": 53.26, "elapsed_time": "22:36:39", "remaining_time": "19:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9556, "total_steps": 17941, "loss": 1.7209, "learning_rate": 4.6134968887609915e-05, "epoch": 0.5326347472270219, "percentage": 53.26, "elapsed_time": "22:36:47", "remaining_time": "19:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9557, "total_steps": 17941, "loss": 1.8778, "learning_rate": 4.6126091355624215e-05, "epoch": 0.532690485480185, "percentage": 53.27, "elapsed_time": "22:36:56", "remaining_time": "19:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9558, "total_steps": 17941, "loss": 1.6063, "learning_rate": 4.611721394649629e-05, "epoch": 0.5327462237333482, "percentage": 53.27, "elapsed_time": "22:37:04", "remaining_time": "19:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9559, "total_steps": 17941, "loss": 1.7225, "learning_rate": 4.610833666050771e-05, "epoch": 0.5328019619865113, "percentage": 53.28, "elapsed_time": "22:37:13", "remaining_time": "19:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9560, "total_steps": 17941, "loss": 1.6031, "learning_rate": 4.609945949794e-05, "epoch": 0.5328577002396745, "percentage": 53.29, "elapsed_time": "22:37:21", "remaining_time": "19:49:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9561, "total_steps": 17941, "loss": 1.519, "learning_rate": 4.60905824590747e-05, "epoch": 0.5329134384928377, "percentage": 53.29, "elapsed_time": "22:37:30", "remaining_time": "19:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9562, "total_steps": 17941, "loss": 1.5729, "learning_rate": 4.60817055441933e-05, "epoch": 0.5329691767460008, "percentage": 53.3, "elapsed_time": "22:37:39", "remaining_time": "19:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9563, "total_steps": 17941, "loss": 1.4728, "learning_rate": 4.607282875357738e-05, "epoch": 0.5330249149991639, "percentage": 53.3, "elapsed_time": "22:37:47", "remaining_time": "19:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9564, "total_steps": 17941, "loss": 1.4295, "learning_rate": 4.606395208750844e-05, "epoch": 0.5330806532523271, "percentage": 53.31, "elapsed_time": "22:37:56", "remaining_time": "19:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9565, "total_steps": 17941, "loss": 1.836, "learning_rate": 4.605507554626798e-05, "epoch": 0.5331363915054902, "percentage": 53.31, "elapsed_time": "22:38:05", "remaining_time": "19:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9566, "total_steps": 17941, "loss": 1.6115, "learning_rate": 4.6046199130137536e-05, "epoch": 0.5331921297586534, "percentage": 53.32, "elapsed_time": "22:38:13", "remaining_time": "19:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9567, "total_steps": 17941, "loss": 1.5308, "learning_rate": 4.6037322839398586e-05, "epoch": 0.5332478680118166, "percentage": 53.32, "elapsed_time": "22:38:22", "remaining_time": "19:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9568, "total_steps": 17941, "loss": 1.6254, "learning_rate": 4.602844667433267e-05, "epoch": 0.5333036062649796, "percentage": 53.33, "elapsed_time": "22:38:30", "remaining_time": "19:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9569, "total_steps": 17941, "loss": 1.7533, "learning_rate": 4.601957063522125e-05, "epoch": 0.5333593445181428, "percentage": 53.34, "elapsed_time": "22:38:39", "remaining_time": "19:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9570, "total_steps": 17941, "loss": 1.8627, "learning_rate": 4.601069472234584e-05, "epoch": 0.5334150827713059, "percentage": 53.34, "elapsed_time": "22:38:48", "remaining_time": "19:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9571, "total_steps": 17941, "loss": 1.8637, "learning_rate": 4.6001818935987954e-05, "epoch": 0.5334708210244691, "percentage": 53.35, "elapsed_time": "22:38:56", "remaining_time": "19:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9572, "total_steps": 17941, "loss": 1.8194, "learning_rate": 4.599294327642905e-05, "epoch": 0.5335265592776323, "percentage": 53.35, "elapsed_time": "22:39:04", "remaining_time": "19:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9573, "total_steps": 17941, "loss": 1.7858, "learning_rate": 4.598406774395063e-05, "epoch": 0.5335822975307953, "percentage": 53.36, "elapsed_time": "22:39:13", "remaining_time": "19:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9574, "total_steps": 17941, "loss": 1.8332, "learning_rate": 4.597519233883416e-05, "epoch": 0.5336380357839585, "percentage": 53.36, "elapsed_time": "22:39:21", "remaining_time": "19:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9575, "total_steps": 17941, "loss": 1.7374, "learning_rate": 4.596631706136113e-05, "epoch": 0.5336937740371217, "percentage": 53.37, "elapsed_time": "22:39:30", "remaining_time": "19:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9576, "total_steps": 17941, "loss": 1.6939, "learning_rate": 4.595744191181299e-05, "epoch": 0.5337495122902848, "percentage": 53.37, "elapsed_time": "22:39:38", "remaining_time": "19:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9577, "total_steps": 17941, "loss": 1.5649, "learning_rate": 4.5948566890471226e-05, "epoch": 0.533805250543448, "percentage": 53.38, "elapsed_time": "22:39:47", "remaining_time": "19:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9578, "total_steps": 17941, "loss": 1.6355, "learning_rate": 4.593969199761732e-05, "epoch": 0.5338609887966111, "percentage": 53.39, "elapsed_time": "22:39:55", "remaining_time": "19:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9579, "total_steps": 17941, "loss": 1.5703, "learning_rate": 4.593081723353267e-05, "epoch": 0.5339167270497742, "percentage": 53.39, "elapsed_time": "22:40:04", "remaining_time": "19:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9580, "total_steps": 17941, "loss": 1.6562, "learning_rate": 4.592194259849882e-05, "epoch": 0.5339724653029374, "percentage": 53.4, "elapsed_time": "22:40:12", "remaining_time": "19:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9581, "total_steps": 17941, "loss": 1.3497, "learning_rate": 4.591306809279714e-05, "epoch": 0.5340282035561006, "percentage": 53.4, "elapsed_time": "22:40:20", "remaining_time": "19:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9582, "total_steps": 17941, "loss": 1.6694, "learning_rate": 4.590419371670912e-05, "epoch": 0.5340839418092637, "percentage": 53.41, "elapsed_time": "22:40:29", "remaining_time": "19:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9583, "total_steps": 17941, "loss": 1.823, "learning_rate": 4.5895319470516204e-05, "epoch": 0.5341396800624268, "percentage": 53.41, "elapsed_time": "22:40:37", "remaining_time": "19:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9584, "total_steps": 17941, "loss": 1.6351, "learning_rate": 4.5886445354499814e-05, "epoch": 0.53419541831559, "percentage": 53.42, "elapsed_time": "22:40:46", "remaining_time": "19:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9585, "total_steps": 17941, "loss": 1.6793, "learning_rate": 4.58775713689414e-05, "epoch": 0.5342511565687531, "percentage": 53.43, "elapsed_time": "22:40:54", "remaining_time": "19:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9586, "total_steps": 17941, "loss": 1.5092, "learning_rate": 4.5868697514122384e-05, "epoch": 0.5343068948219163, "percentage": 53.43, "elapsed_time": "22:41:03", "remaining_time": "19:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9587, "total_steps": 17941, "loss": 1.7538, "learning_rate": 4.5859823790324194e-05, "epoch": 0.5343626330750795, "percentage": 53.44, "elapsed_time": "22:41:11", "remaining_time": "19:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9588, "total_steps": 17941, "loss": 1.7059, "learning_rate": 4.5850950197828247e-05, "epoch": 0.5344183713282425, "percentage": 53.44, "elapsed_time": "22:41:20", "remaining_time": "19:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9589, "total_steps": 17941, "loss": 1.9543, "learning_rate": 4.5842076736915974e-05, "epoch": 0.5344741095814057, "percentage": 53.45, "elapsed_time": "22:41:28", "remaining_time": "19:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9590, "total_steps": 17941, "loss": 1.5304, "learning_rate": 4.583320340786879e-05, "epoch": 0.5345298478345689, "percentage": 53.45, "elapsed_time": "22:41:37", "remaining_time": "19:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9591, "total_steps": 17941, "loss": 1.6066, "learning_rate": 4.58243302109681e-05, "epoch": 0.534585586087732, "percentage": 53.46, "elapsed_time": "22:41:45", "remaining_time": "19:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9592, "total_steps": 17941, "loss": 1.5607, "learning_rate": 4.581545714649531e-05, "epoch": 0.5346413243408952, "percentage": 53.46, "elapsed_time": "22:41:54", "remaining_time": "19:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9593, "total_steps": 17941, "loss": 1.5174, "learning_rate": 4.5806584214731816e-05, "epoch": 0.5346970625940582, "percentage": 53.47, "elapsed_time": "22:42:02", "remaining_time": "19:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9594, "total_steps": 17941, "loss": 1.5984, "learning_rate": 4.579771141595903e-05, "epoch": 0.5347528008472214, "percentage": 53.48, "elapsed_time": "22:42:11", "remaining_time": "19:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9595, "total_steps": 17941, "loss": 1.7833, "learning_rate": 4.578883875045833e-05, "epoch": 0.5348085391003846, "percentage": 53.48, "elapsed_time": "22:42:20", "remaining_time": "19:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9596, "total_steps": 17941, "loss": 1.8074, "learning_rate": 4.5779966218511094e-05, "epoch": 0.5348642773535477, "percentage": 53.49, "elapsed_time": "22:42:28", "remaining_time": "19:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9597, "total_steps": 17941, "loss": 1.6128, "learning_rate": 4.5771093820398756e-05, "epoch": 0.5349200156067109, "percentage": 53.49, "elapsed_time": "22:42:36", "remaining_time": "19:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9598, "total_steps": 17941, "loss": 1.9675, "learning_rate": 4.576222155640265e-05, "epoch": 0.5349757538598741, "percentage": 53.5, "elapsed_time": "22:42:45", "remaining_time": "19:44:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9599, "total_steps": 17941, "loss": 1.7877, "learning_rate": 4.5753349426804176e-05, "epoch": 0.5350314921130371, "percentage": 53.5, "elapsed_time": "22:42:53", "remaining_time": "19:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9600, "total_steps": 17941, "loss": 1.7376, "learning_rate": 4.574447743188469e-05, "epoch": 0.5350872303662003, "percentage": 53.51, "elapsed_time": "22:43:02", "remaining_time": "19:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9601, "total_steps": 17941, "loss": 1.5553, "learning_rate": 4.573560557192558e-05, "epoch": 0.5351429686193635, "percentage": 53.51, "elapsed_time": "22:43:10", "remaining_time": "19:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9602, "total_steps": 17941, "loss": 1.5464, "learning_rate": 4.572673384720819e-05, "epoch": 0.5351987068725266, "percentage": 53.52, "elapsed_time": "22:43:19", "remaining_time": "19:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9603, "total_steps": 17941, "loss": 1.7513, "learning_rate": 4.571786225801388e-05, "epoch": 0.5352544451256898, "percentage": 53.53, "elapsed_time": "22:43:28", "remaining_time": "19:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9604, "total_steps": 17941, "loss": 1.658, "learning_rate": 4.570899080462404e-05, "epoch": 0.5353101833788529, "percentage": 53.53, "elapsed_time": "22:43:36", "remaining_time": "19:43:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9605, "total_steps": 17941, "loss": 1.7345, "learning_rate": 4.570011948731996e-05, "epoch": 0.535365921632016, "percentage": 53.54, "elapsed_time": "22:43:45", "remaining_time": "19:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9606, "total_steps": 17941, "loss": 1.5001, "learning_rate": 4.569124830638304e-05, "epoch": 0.5354216598851792, "percentage": 53.54, "elapsed_time": "22:43:53", "remaining_time": "19:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9607, "total_steps": 17941, "loss": 1.8614, "learning_rate": 4.568237726209459e-05, "epoch": 0.5354773981383424, "percentage": 53.55, "elapsed_time": "22:44:02", "remaining_time": "19:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9608, "total_steps": 17941, "loss": 1.5247, "learning_rate": 4.567350635473596e-05, "epoch": 0.5355331363915055, "percentage": 53.55, "elapsed_time": "22:44:10", "remaining_time": "19:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9609, "total_steps": 17941, "loss": 1.4937, "learning_rate": 4.56646355845885e-05, "epoch": 0.5355888746446686, "percentage": 53.56, "elapsed_time": "22:44:19", "remaining_time": "19:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9610, "total_steps": 17941, "loss": 1.6458, "learning_rate": 4.565576495193351e-05, "epoch": 0.5356446128978318, "percentage": 53.56, "elapsed_time": "22:44:27", "remaining_time": "19:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9611, "total_steps": 17941, "loss": 1.6966, "learning_rate": 4.564689445705233e-05, "epoch": 0.5357003511509949, "percentage": 53.57, "elapsed_time": "22:44:36", "remaining_time": "19:42:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9612, "total_steps": 17941, "loss": 1.5728, "learning_rate": 4.563802410022627e-05, "epoch": 0.5357560894041581, "percentage": 53.58, "elapsed_time": "22:44:44", "remaining_time": "19:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9613, "total_steps": 17941, "loss": 1.5377, "learning_rate": 4.562915388173668e-05, "epoch": 0.5358118276573213, "percentage": 53.58, "elapsed_time": "22:44:52", "remaining_time": "19:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9614, "total_steps": 17941, "loss": 1.6114, "learning_rate": 4.562028380186481e-05, "epoch": 0.5358675659104843, "percentage": 53.59, "elapsed_time": "22:45:01", "remaining_time": "19:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9615, "total_steps": 17941, "loss": 1.2671, "learning_rate": 4.561141386089201e-05, "epoch": 0.5359233041636475, "percentage": 53.59, "elapsed_time": "22:45:09", "remaining_time": "19:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9616, "total_steps": 17941, "loss": 1.5903, "learning_rate": 4.560254405909959e-05, "epoch": 0.5359790424168106, "percentage": 53.6, "elapsed_time": "22:45:18", "remaining_time": "19:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9617, "total_steps": 17941, "loss": 1.5522, "learning_rate": 4.559367439676882e-05, "epoch": 0.5360347806699738, "percentage": 53.6, "elapsed_time": "22:45:26", "remaining_time": "19:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9618, "total_steps": 17941, "loss": 1.6349, "learning_rate": 4.558480487418102e-05, "epoch": 0.536090518923137, "percentage": 53.61, "elapsed_time": "22:45:35", "remaining_time": "19:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9619, "total_steps": 17941, "loss": 1.7025, "learning_rate": 4.557593549161746e-05, "epoch": 0.5361462571763, "percentage": 53.61, "elapsed_time": "22:45:43", "remaining_time": "19:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9620, "total_steps": 17941, "loss": 1.5889, "learning_rate": 4.556706624935944e-05, "epoch": 0.5362019954294632, "percentage": 53.62, "elapsed_time": "22:45:52", "remaining_time": "19:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9621, "total_steps": 17941, "loss": 1.5922, "learning_rate": 4.555819714768822e-05, "epoch": 0.5362577336826264, "percentage": 53.63, "elapsed_time": "22:46:01", "remaining_time": "19:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9622, "total_steps": 17941, "loss": 1.4581, "learning_rate": 4.554932818688508e-05, "epoch": 0.5363134719357895, "percentage": 53.63, "elapsed_time": "22:46:09", "remaining_time": "19:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9623, "total_steps": 17941, "loss": 1.8858, "learning_rate": 4.554045936723132e-05, "epoch": 0.5363692101889527, "percentage": 53.64, "elapsed_time": "22:46:18", "remaining_time": "19:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9624, "total_steps": 17941, "loss": 1.6621, "learning_rate": 4.553159068900818e-05, "epoch": 0.5364249484421159, "percentage": 53.64, "elapsed_time": "22:46:26", "remaining_time": "19:40:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9625, "total_steps": 17941, "loss": 1.6915, "learning_rate": 4.552272215249694e-05, "epoch": 0.5364806866952789, "percentage": 53.65, "elapsed_time": "22:46:35", "remaining_time": "19:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9626, "total_steps": 17941, "loss": 1.6064, "learning_rate": 4.551385375797884e-05, "epoch": 0.5365364249484421, "percentage": 53.65, "elapsed_time": "22:46:43", "remaining_time": "19:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9627, "total_steps": 17941, "loss": 1.721, "learning_rate": 4.5504985505735154e-05, "epoch": 0.5365921632016053, "percentage": 53.66, "elapsed_time": "22:46:52", "remaining_time": "19:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9628, "total_steps": 17941, "loss": 1.6382, "learning_rate": 4.5496117396047107e-05, "epoch": 0.5366479014547684, "percentage": 53.66, "elapsed_time": "22:47:00", "remaining_time": "19:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9629, "total_steps": 17941, "loss": 1.8254, "learning_rate": 4.5487249429195946e-05, "epoch": 0.5367036397079316, "percentage": 53.67, "elapsed_time": "22:47:09", "remaining_time": "19:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9630, "total_steps": 17941, "loss": 1.9322, "learning_rate": 4.5478381605462955e-05, "epoch": 0.5367593779610947, "percentage": 53.68, "elapsed_time": "22:47:17", "remaining_time": "19:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9631, "total_steps": 17941, "loss": 1.6886, "learning_rate": 4.54695139251293e-05, "epoch": 0.5368151162142578, "percentage": 53.68, "elapsed_time": "22:47:26", "remaining_time": "19:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9632, "total_steps": 17941, "loss": 1.6018, "learning_rate": 4.546064638847628e-05, "epoch": 0.536870854467421, "percentage": 53.69, "elapsed_time": "22:47:34", "remaining_time": "19:39:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9633, "total_steps": 17941, "loss": 1.6915, "learning_rate": 4.545177899578507e-05, "epoch": 0.5369265927205842, "percentage": 53.69, "elapsed_time": "22:47:43", "remaining_time": "19:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9634, "total_steps": 17941, "loss": 1.6215, "learning_rate": 4.544291174733692e-05, "epoch": 0.5369823309737473, "percentage": 53.7, "elapsed_time": "22:47:52", "remaining_time": "19:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9635, "total_steps": 17941, "loss": 1.5721, "learning_rate": 4.543404464341304e-05, "epoch": 0.5370380692269104, "percentage": 53.7, "elapsed_time": "22:48:00", "remaining_time": "19:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9636, "total_steps": 17941, "loss": 1.6407, "learning_rate": 4.5425177684294645e-05, "epoch": 0.5370938074800736, "percentage": 53.71, "elapsed_time": "22:48:08", "remaining_time": "19:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9637, "total_steps": 17941, "loss": 1.6858, "learning_rate": 4.541631087026294e-05, "epoch": 0.5371495457332367, "percentage": 53.71, "elapsed_time": "22:48:17", "remaining_time": "19:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9638, "total_steps": 17941, "loss": 1.4761, "learning_rate": 4.5407444201599115e-05, "epoch": 0.5372052839863999, "percentage": 53.72, "elapsed_time": "22:48:25", "remaining_time": "19:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9639, "total_steps": 17941, "loss": 1.6962, "learning_rate": 4.539857767858441e-05, "epoch": 0.537261022239563, "percentage": 53.73, "elapsed_time": "22:48:34", "remaining_time": "19:38:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9640, "total_steps": 17941, "loss": 1.5394, "learning_rate": 4.538971130149997e-05, "epoch": 0.5373167604927261, "percentage": 53.73, "elapsed_time": "22:48:43", "remaining_time": "19:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9641, "total_steps": 17941, "loss": 1.629, "learning_rate": 4.538084507062702e-05, "epoch": 0.5373724987458893, "percentage": 53.74, "elapsed_time": "22:48:51", "remaining_time": "19:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9642, "total_steps": 17941, "loss": 1.5614, "learning_rate": 4.537197898624673e-05, "epoch": 0.5374282369990524, "percentage": 53.74, "elapsed_time": "22:49:00", "remaining_time": "19:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9643, "total_steps": 17941, "loss": 1.532, "learning_rate": 4.536311304864028e-05, "epoch": 0.5374839752522156, "percentage": 53.75, "elapsed_time": "22:49:08", "remaining_time": "19:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9644, "total_steps": 17941, "loss": 1.5766, "learning_rate": 4.5354247258088854e-05, "epoch": 0.5375397135053788, "percentage": 53.75, "elapsed_time": "22:49:17", "remaining_time": "19:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9645, "total_steps": 17941, "loss": 1.727, "learning_rate": 4.534538161487362e-05, "epoch": 0.5375954517585418, "percentage": 53.76, "elapsed_time": "22:49:25", "remaining_time": "19:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9646, "total_steps": 17941, "loss": 1.6667, "learning_rate": 4.533651611927574e-05, "epoch": 0.537651190011705, "percentage": 53.77, "elapsed_time": "22:49:34", "remaining_time": "19:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9647, "total_steps": 17941, "loss": 1.6659, "learning_rate": 4.532765077157637e-05, "epoch": 0.5377069282648682, "percentage": 53.77, "elapsed_time": "22:49:42", "remaining_time": "19:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9648, "total_steps": 17941, "loss": 1.6792, "learning_rate": 4.5318785572056674e-05, "epoch": 0.5377626665180313, "percentage": 53.78, "elapsed_time": "22:49:50", "remaining_time": "19:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9649, "total_steps": 17941, "loss": 1.5461, "learning_rate": 4.530992052099782e-05, "epoch": 0.5378184047711945, "percentage": 53.78, "elapsed_time": "22:49:59", "remaining_time": "19:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9650, "total_steps": 17941, "loss": 1.6144, "learning_rate": 4.530105561868094e-05, "epoch": 0.5378741430243577, "percentage": 53.79, "elapsed_time": "22:50:08", "remaining_time": "19:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9651, "total_steps": 17941, "loss": 1.7566, "learning_rate": 4.529219086538718e-05, "epoch": 0.5379298812775207, "percentage": 53.79, "elapsed_time": "22:50:16", "remaining_time": "19:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9652, "total_steps": 17941, "loss": 1.6659, "learning_rate": 4.528332626139767e-05, "epoch": 0.5379856195306839, "percentage": 53.8, "elapsed_time": "22:50:25", "remaining_time": "19:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9653, "total_steps": 17941, "loss": 1.7152, "learning_rate": 4.527446180699356e-05, "epoch": 0.5380413577838471, "percentage": 53.8, "elapsed_time": "22:50:33", "remaining_time": "19:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9654, "total_steps": 17941, "loss": 1.7, "learning_rate": 4.526559750245597e-05, "epoch": 0.5380970960370102, "percentage": 53.81, "elapsed_time": "22:50:41", "remaining_time": "19:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9655, "total_steps": 17941, "loss": 1.5537, "learning_rate": 4.5256733348066e-05, "epoch": 0.5381528342901734, "percentage": 53.82, "elapsed_time": "22:50:51", "remaining_time": "19:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9656, "total_steps": 17941, "loss": 1.5007, "learning_rate": 4.524786934410483e-05, "epoch": 0.5382085725433365, "percentage": 53.82, "elapsed_time": "22:51:00", "remaining_time": "19:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9657, "total_steps": 17941, "loss": 1.7346, "learning_rate": 4.5239005490853505e-05, "epoch": 0.5382643107964996, "percentage": 53.83, "elapsed_time": "22:51:08", "remaining_time": "19:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9658, "total_steps": 17941, "loss": 1.5088, "learning_rate": 4.523014178859319e-05, "epoch": 0.5383200490496628, "percentage": 53.83, "elapsed_time": "22:51:17", "remaining_time": "19:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9659, "total_steps": 17941, "loss": 1.6899, "learning_rate": 4.522127823760495e-05, "epoch": 0.538375787302826, "percentage": 53.84, "elapsed_time": "22:51:25", "remaining_time": "19:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9660, "total_steps": 17941, "loss": 1.564, "learning_rate": 4.5212414838169905e-05, "epoch": 0.538431525555989, "percentage": 53.84, "elapsed_time": "22:51:34", "remaining_time": "19:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9661, "total_steps": 17941, "loss": 1.7485, "learning_rate": 4.520355159056917e-05, "epoch": 0.5384872638091522, "percentage": 53.85, "elapsed_time": "22:51:42", "remaining_time": "19:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9662, "total_steps": 17941, "loss": 1.4511, "learning_rate": 4.519468849508379e-05, "epoch": 0.5385430020623153, "percentage": 53.85, "elapsed_time": "22:51:51", "remaining_time": "19:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9663, "total_steps": 17941, "loss": 1.7853, "learning_rate": 4.5185825551994884e-05, "epoch": 0.5385987403154785, "percentage": 53.86, "elapsed_time": "22:52:00", "remaining_time": "19:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9664, "total_steps": 17941, "loss": 1.6016, "learning_rate": 4.5176962761583505e-05, "epoch": 0.5386544785686417, "percentage": 53.87, "elapsed_time": "22:52:08", "remaining_time": "19:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9665, "total_steps": 17941, "loss": 1.8608, "learning_rate": 4.5168100124130787e-05, "epoch": 0.5387102168218048, "percentage": 53.87, "elapsed_time": "22:52:17", "remaining_time": "19:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9666, "total_steps": 17941, "loss": 1.6971, "learning_rate": 4.515923763991772e-05, "epoch": 0.5387659550749679, "percentage": 53.88, "elapsed_time": "22:52:25", "remaining_time": "19:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9667, "total_steps": 17941, "loss": 2.0262, "learning_rate": 4.515037530922542e-05, "epoch": 0.5388216933281311, "percentage": 53.88, "elapsed_time": "22:52:34", "remaining_time": "19:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9668, "total_steps": 17941, "loss": 1.5727, "learning_rate": 4.5141513132334956e-05, "epoch": 0.5388774315812942, "percentage": 53.89, "elapsed_time": "22:52:42", "remaining_time": "19:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9669, "total_steps": 17941, "loss": 1.7543, "learning_rate": 4.513265110952736e-05, "epoch": 0.5389331698344574, "percentage": 53.89, "elapsed_time": "22:52:51", "remaining_time": "19:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9670, "total_steps": 17941, "loss": 1.7567, "learning_rate": 4.5123789241083696e-05, "epoch": 0.5389889080876206, "percentage": 53.9, "elapsed_time": "22:52:59", "remaining_time": "19:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9671, "total_steps": 17941, "loss": 1.8279, "learning_rate": 4.5114927527285e-05, "epoch": 0.5390446463407836, "percentage": 53.9, "elapsed_time": "22:53:07", "remaining_time": "19:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9672, "total_steps": 17941, "loss": 1.7168, "learning_rate": 4.510606596841233e-05, "epoch": 0.5391003845939468, "percentage": 53.91, "elapsed_time": "22:53:16", "remaining_time": "19:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9673, "total_steps": 17941, "loss": 1.8184, "learning_rate": 4.5097204564746705e-05, "epoch": 0.53915612284711, "percentage": 53.92, "elapsed_time": "22:53:25", "remaining_time": "19:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9674, "total_steps": 17941, "loss": 1.5677, "learning_rate": 4.5088343316569156e-05, "epoch": 0.5392118611002731, "percentage": 53.92, "elapsed_time": "22:53:33", "remaining_time": "19:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9675, "total_steps": 17941, "loss": 1.423, "learning_rate": 4.507948222416074e-05, "epoch": 0.5392675993534363, "percentage": 53.93, "elapsed_time": "22:53:42", "remaining_time": "19:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9676, "total_steps": 17941, "loss": 1.7762, "learning_rate": 4.507062128780245e-05, "epoch": 0.5393233376065995, "percentage": 53.93, "elapsed_time": "22:53:50", "remaining_time": "19:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9677, "total_steps": 17941, "loss": 1.5931, "learning_rate": 4.506176050777532e-05, "epoch": 0.5393790758597625, "percentage": 53.94, "elapsed_time": "22:53:58", "remaining_time": "19:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9678, "total_steps": 17941, "loss": 1.8376, "learning_rate": 4.505289988436034e-05, "epoch": 0.5394348141129257, "percentage": 53.94, "elapsed_time": "22:54:07", "remaining_time": "19:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9679, "total_steps": 17941, "loss": 1.695, "learning_rate": 4.504403941783855e-05, "epoch": 0.5394905523660889, "percentage": 53.95, "elapsed_time": "22:54:15", "remaining_time": "19:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9680, "total_steps": 17941, "loss": 1.7173, "learning_rate": 4.503517910849093e-05, "epoch": 0.539546290619252, "percentage": 53.95, "elapsed_time": "22:54:24", "remaining_time": "19:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9681, "total_steps": 17941, "loss": 1.3706, "learning_rate": 4.502631895659846e-05, "epoch": 0.5396020288724152, "percentage": 53.96, "elapsed_time": "22:54:33", "remaining_time": "19:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9682, "total_steps": 17941, "loss": 1.6029, "learning_rate": 4.501745896244219e-05, "epoch": 0.5396577671255783, "percentage": 53.97, "elapsed_time": "22:54:41", "remaining_time": "19:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9683, "total_steps": 17941, "loss": 1.8895, "learning_rate": 4.500859912630303e-05, "epoch": 0.5397135053787414, "percentage": 53.97, "elapsed_time": "22:54:50", "remaining_time": "19:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9684, "total_steps": 17941, "loss": 1.5352, "learning_rate": 4.499973944846204e-05, "epoch": 0.5397692436319046, "percentage": 53.98, "elapsed_time": "22:54:58", "remaining_time": "19:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9685, "total_steps": 17941, "loss": 1.5303, "learning_rate": 4.499087992920015e-05, "epoch": 0.5398249818850677, "percentage": 53.98, "elapsed_time": "22:55:07", "remaining_time": "19:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9686, "total_steps": 17941, "loss": 1.9174, "learning_rate": 4.4982020568798344e-05, "epoch": 0.5398807201382309, "percentage": 53.99, "elapsed_time": "22:55:15", "remaining_time": "19:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9687, "total_steps": 17941, "loss": 1.858, "learning_rate": 4.497316136753759e-05, "epoch": 0.539936458391394, "percentage": 53.99, "elapsed_time": "22:55:24", "remaining_time": "19:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9688, "total_steps": 17941, "loss": 1.6544, "learning_rate": 4.496430232569884e-05, "epoch": 0.5399921966445571, "percentage": 54.0, "elapsed_time": "22:55:32", "remaining_time": "19:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9689, "total_steps": 17941, "loss": 1.6606, "learning_rate": 4.4955443443563064e-05, "epoch": 0.5400479348977203, "percentage": 54.0, "elapsed_time": "22:55:41", "remaining_time": "19:31:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9690, "total_steps": 17941, "loss": 1.5377, "learning_rate": 4.49465847214112e-05, "epoch": 0.5401036731508835, "percentage": 54.01, "elapsed_time": "22:55:49", "remaining_time": "19:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9691, "total_steps": 17941, "loss": 1.6281, "learning_rate": 4.4937726159524235e-05, "epoch": 0.5401594114040466, "percentage": 54.02, "elapsed_time": "22:55:58", "remaining_time": "19:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9692, "total_steps": 17941, "loss": 1.6659, "learning_rate": 4.492886775818305e-05, "epoch": 0.5402151496572097, "percentage": 54.02, "elapsed_time": "22:56:06", "remaining_time": "19:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9693, "total_steps": 17941, "loss": 1.5169, "learning_rate": 4.492000951766862e-05, "epoch": 0.5402708879103729, "percentage": 54.03, "elapsed_time": "22:56:14", "remaining_time": "19:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9694, "total_steps": 17941, "loss": 1.4738, "learning_rate": 4.4911151438261885e-05, "epoch": 0.540326626163536, "percentage": 54.03, "elapsed_time": "22:56:23", "remaining_time": "19:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9695, "total_steps": 17941, "loss": 1.7376, "learning_rate": 4.4902293520243746e-05, "epoch": 0.5403823644166992, "percentage": 54.04, "elapsed_time": "22:56:31", "remaining_time": "19:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9696, "total_steps": 17941, "loss": 1.7419, "learning_rate": 4.489343576389514e-05, "epoch": 0.5404381026698624, "percentage": 54.04, "elapsed_time": "22:56:40", "remaining_time": "19:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9697, "total_steps": 17941, "loss": 1.4912, "learning_rate": 4.488457816949697e-05, "epoch": 0.5404938409230254, "percentage": 54.05, "elapsed_time": "22:56:48", "remaining_time": "19:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9698, "total_steps": 17941, "loss": 1.8182, "learning_rate": 4.487572073733017e-05, "epoch": 0.5405495791761886, "percentage": 54.05, "elapsed_time": "22:56:57", "remaining_time": "19:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9699, "total_steps": 17941, "loss": 1.7492, "learning_rate": 4.48668634676756e-05, "epoch": 0.5406053174293518, "percentage": 54.06, "elapsed_time": "22:57:05", "remaining_time": "19:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9700, "total_steps": 17941, "loss": 1.7785, "learning_rate": 4.4858006360814215e-05, "epoch": 0.5406610556825149, "percentage": 54.07, "elapsed_time": "22:57:14", "remaining_time": "19:30:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9701, "total_steps": 17941, "loss": 1.6768, "learning_rate": 4.484914941702689e-05, "epoch": 0.5407167939356781, "percentage": 54.07, "elapsed_time": "22:57:23", "remaining_time": "19:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9702, "total_steps": 17941, "loss": 1.6993, "learning_rate": 4.484029263659451e-05, "epoch": 0.5407725321888412, "percentage": 54.08, "elapsed_time": "22:57:31", "remaining_time": "19:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9703, "total_steps": 17941, "loss": 1.882, "learning_rate": 4.4831436019797976e-05, "epoch": 0.5408282704420043, "percentage": 54.08, "elapsed_time": "22:57:40", "remaining_time": "19:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9704, "total_steps": 17941, "loss": 1.8899, "learning_rate": 4.482257956691814e-05, "epoch": 0.5408840086951675, "percentage": 54.09, "elapsed_time": "22:57:49", "remaining_time": "19:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9705, "total_steps": 17941, "loss": 1.576, "learning_rate": 4.48137232782359e-05, "epoch": 0.5409397469483307, "percentage": 54.09, "elapsed_time": "22:57:57", "remaining_time": "19:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9706, "total_steps": 17941, "loss": 1.7682, "learning_rate": 4.480486715403212e-05, "epoch": 0.5409954852014938, "percentage": 54.1, "elapsed_time": "22:58:06", "remaining_time": "19:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9707, "total_steps": 17941, "loss": 1.8614, "learning_rate": 4.479601119458765e-05, "epoch": 0.541051223454657, "percentage": 54.11, "elapsed_time": "22:58:14", "remaining_time": "19:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9708, "total_steps": 17941, "loss": 1.9185, "learning_rate": 4.478715540018339e-05, "epoch": 0.54110696170782, "percentage": 54.11, "elapsed_time": "22:58:23", "remaining_time": "19:28:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9709, "total_steps": 17941, "loss": 1.5266, "learning_rate": 4.477829977110014e-05, "epoch": 0.5411626999609832, "percentage": 54.12, "elapsed_time": "22:58:31", "remaining_time": "19:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9710, "total_steps": 17941, "loss": 1.5938, "learning_rate": 4.4769444307618804e-05, "epoch": 0.5412184382141464, "percentage": 54.12, "elapsed_time": "22:58:40", "remaining_time": "19:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9711, "total_steps": 17941, "loss": 1.7021, "learning_rate": 4.476058901002018e-05, "epoch": 0.5412741764673095, "percentage": 54.13, "elapsed_time": "22:58:48", "remaining_time": "19:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9712, "total_steps": 17941, "loss": 1.7607, "learning_rate": 4.475173387858513e-05, "epoch": 0.5413299147204726, "percentage": 54.13, "elapsed_time": "22:58:57", "remaining_time": "19:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9713, "total_steps": 17941, "loss": 1.6063, "learning_rate": 4.4742878913594485e-05, "epoch": 0.5413856529736358, "percentage": 54.14, "elapsed_time": "22:59:05", "remaining_time": "19:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9714, "total_steps": 17941, "loss": 1.5175, "learning_rate": 4.4734024115329066e-05, "epoch": 0.5414413912267989, "percentage": 54.14, "elapsed_time": "22:59:14", "remaining_time": "19:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9715, "total_steps": 17941, "loss": 1.9511, "learning_rate": 4.4725169484069706e-05, "epoch": 0.5414971294799621, "percentage": 54.15, "elapsed_time": "22:59:22", "remaining_time": "19:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9716, "total_steps": 17941, "loss": 1.7098, "learning_rate": 4.47163150200972e-05, "epoch": 0.5415528677331253, "percentage": 54.16, "elapsed_time": "22:59:30", "remaining_time": "19:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9717, "total_steps": 17941, "loss": 1.6926, "learning_rate": 4.4707460723692396e-05, "epoch": 0.5416086059862883, "percentage": 54.16, "elapsed_time": "22:59:39", "remaining_time": "19:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9718, "total_steps": 17941, "loss": 1.5529, "learning_rate": 4.469860659513606e-05, "epoch": 0.5416643442394515, "percentage": 54.17, "elapsed_time": "22:59:47", "remaining_time": "19:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9719, "total_steps": 17941, "loss": 1.5383, "learning_rate": 4.468975263470902e-05, "epoch": 0.5417200824926147, "percentage": 54.17, "elapsed_time": "22:59:56", "remaining_time": "19:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9720, "total_steps": 17941, "loss": 1.437, "learning_rate": 4.468089884269207e-05, "epoch": 0.5417758207457778, "percentage": 54.18, "elapsed_time": "23:00:04", "remaining_time": "19:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9721, "total_steps": 17941, "loss": 1.5692, "learning_rate": 4.467204521936599e-05, "epoch": 0.541831558998941, "percentage": 54.18, "elapsed_time": "23:00:13", "remaining_time": "19:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9722, "total_steps": 17941, "loss": 1.7301, "learning_rate": 4.466319176501159e-05, "epoch": 0.5418872972521042, "percentage": 54.19, "elapsed_time": "23:00:21", "remaining_time": "19:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9723, "total_steps": 17941, "loss": 1.806, "learning_rate": 4.465433847990961e-05, "epoch": 0.5419430355052672, "percentage": 54.19, "elapsed_time": "23:00:30", "remaining_time": "19:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9724, "total_steps": 17941, "loss": 1.8704, "learning_rate": 4.464548536434086e-05, "epoch": 0.5419987737584304, "percentage": 54.2, "elapsed_time": "23:00:38", "remaining_time": "19:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9725, "total_steps": 17941, "loss": 1.5875, "learning_rate": 4.463663241858607e-05, "epoch": 0.5420545120115936, "percentage": 54.21, "elapsed_time": "23:00:46", "remaining_time": "19:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9726, "total_steps": 17941, "loss": 1.504, "learning_rate": 4.462777964292605e-05, "epoch": 0.5421102502647567, "percentage": 54.21, "elapsed_time": "23:00:55", "remaining_time": "19:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9727, "total_steps": 17941, "loss": 1.7438, "learning_rate": 4.461892703764154e-05, "epoch": 0.5421659885179199, "percentage": 54.22, "elapsed_time": "23:01:03", "remaining_time": "19:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9728, "total_steps": 17941, "loss": 1.8666, "learning_rate": 4.461007460301328e-05, "epoch": 0.542221726771083, "percentage": 54.22, "elapsed_time": "23:01:12", "remaining_time": "19:26:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9729, "total_steps": 17941, "loss": 1.456, "learning_rate": 4.4601222339322045e-05, "epoch": 0.5422774650242461, "percentage": 54.23, "elapsed_time": "23:01:20", "remaining_time": "19:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9730, "total_steps": 17941, "loss": 1.4502, "learning_rate": 4.459237024684855e-05, "epoch": 0.5423332032774093, "percentage": 54.23, "elapsed_time": "23:01:29", "remaining_time": "19:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9731, "total_steps": 17941, "loss": 1.9578, "learning_rate": 4.458351832587354e-05, "epoch": 0.5423889415305724, "percentage": 54.24, "elapsed_time": "23:01:37", "remaining_time": "19:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9732, "total_steps": 17941, "loss": 1.867, "learning_rate": 4.457466657667775e-05, "epoch": 0.5424446797837356, "percentage": 54.24, "elapsed_time": "23:01:46", "remaining_time": "19:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9733, "total_steps": 17941, "loss": 1.8218, "learning_rate": 4.456581499954189e-05, "epoch": 0.5425004180368987, "percentage": 54.25, "elapsed_time": "23:01:54", "remaining_time": "19:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9734, "total_steps": 17941, "loss": 1.7565, "learning_rate": 4.4556963594746724e-05, "epoch": 0.5425561562900618, "percentage": 54.26, "elapsed_time": "23:02:03", "remaining_time": "19:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9735, "total_steps": 17941, "loss": 1.5784, "learning_rate": 4.4548112362572915e-05, "epoch": 0.542611894543225, "percentage": 54.26, "elapsed_time": "23:02:11", "remaining_time": "19:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9736, "total_steps": 17941, "loss": 1.6293, "learning_rate": 4.45392613033012e-05, "epoch": 0.5426676327963882, "percentage": 54.27, "elapsed_time": "23:02:20", "remaining_time": "19:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9737, "total_steps": 17941, "loss": 1.8317, "learning_rate": 4.453041041721228e-05, "epoch": 0.5427233710495513, "percentage": 54.27, "elapsed_time": "23:02:28", "remaining_time": "19:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9738, "total_steps": 17941, "loss": 1.7089, "learning_rate": 4.452155970458686e-05, "epoch": 0.5427791093027144, "percentage": 54.28, "elapsed_time": "23:02:37", "remaining_time": "19:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9739, "total_steps": 17941, "loss": 1.7275, "learning_rate": 4.451270916570562e-05, "epoch": 0.5428348475558776, "percentage": 54.28, "elapsed_time": "23:02:45", "remaining_time": "19:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9740, "total_steps": 17941, "loss": 1.6992, "learning_rate": 4.450385880084924e-05, "epoch": 0.5428905858090407, "percentage": 54.29, "elapsed_time": "23:02:53", "remaining_time": "19:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9741, "total_steps": 17941, "loss": 1.6468, "learning_rate": 4.4495008610298435e-05, "epoch": 0.5429463240622039, "percentage": 54.29, "elapsed_time": "23:03:02", "remaining_time": "19:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9742, "total_steps": 17941, "loss": 1.7285, "learning_rate": 4.448615859433383e-05, "epoch": 0.5430020623153671, "percentage": 54.3, "elapsed_time": "23:03:10", "remaining_time": "19:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9743, "total_steps": 17941, "loss": 1.5839, "learning_rate": 4.447730875323617e-05, "epoch": 0.5430578005685301, "percentage": 54.31, "elapsed_time": "23:03:19", "remaining_time": "19:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9744, "total_steps": 17941, "loss": 1.8845, "learning_rate": 4.446845908728604e-05, "epoch": 0.5431135388216933, "percentage": 54.31, "elapsed_time": "23:03:27", "remaining_time": "19:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9745, "total_steps": 17941, "loss": 1.8191, "learning_rate": 4.445960959676414e-05, "epoch": 0.5431692770748565, "percentage": 54.32, "elapsed_time": "23:03:36", "remaining_time": "19:23:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9746, "total_steps": 17941, "loss": 1.8001, "learning_rate": 4.4450760281951134e-05, "epoch": 0.5432250153280196, "percentage": 54.32, "elapsed_time": "23:03:45", "remaining_time": "19:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9747, "total_steps": 17941, "loss": 1.8329, "learning_rate": 4.444191114312765e-05, "epoch": 0.5432807535811828, "percentage": 54.33, "elapsed_time": "23:03:53", "remaining_time": "19:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9748, "total_steps": 17941, "loss": 1.4827, "learning_rate": 4.4433062180574356e-05, "epoch": 0.543336491834346, "percentage": 54.33, "elapsed_time": "23:04:02", "remaining_time": "19:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9749, "total_steps": 17941, "loss": 1.5864, "learning_rate": 4.442421339457185e-05, "epoch": 0.543392230087509, "percentage": 54.34, "elapsed_time": "23:04:10", "remaining_time": "19:23:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9750, "total_steps": 17941, "loss": 1.5616, "learning_rate": 4.44153647854008e-05, "epoch": 0.5434479683406722, "percentage": 54.34, "elapsed_time": "23:04:18", "remaining_time": "19:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9751, "total_steps": 17941, "loss": 1.773, "learning_rate": 4.44065163533418e-05, "epoch": 0.5435037065938354, "percentage": 54.35, "elapsed_time": "23:04:27", "remaining_time": "19:22:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9752, "total_steps": 17941, "loss": 1.8526, "learning_rate": 4.43976680986755e-05, "epoch": 0.5435594448469985, "percentage": 54.36, "elapsed_time": "23:04:35", "remaining_time": "19:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9753, "total_steps": 17941, "loss": 1.5885, "learning_rate": 4.438882002168251e-05, "epoch": 0.5436151831001617, "percentage": 54.36, "elapsed_time": "23:04:44", "remaining_time": "19:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9754, "total_steps": 17941, "loss": 1.5476, "learning_rate": 4.437997212264343e-05, "epoch": 0.5436709213533247, "percentage": 54.37, "elapsed_time": "23:04:52", "remaining_time": "19:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9755, "total_steps": 17941, "loss": 1.8489, "learning_rate": 4.437112440183887e-05, "epoch": 0.5437266596064879, "percentage": 54.37, "elapsed_time": "23:05:01", "remaining_time": "19:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9756, "total_steps": 17941, "loss": 1.4991, "learning_rate": 4.436227685954942e-05, "epoch": 0.5437823978596511, "percentage": 54.38, "elapsed_time": "23:05:09", "remaining_time": "19:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9757, "total_steps": 17941, "loss": 1.6384, "learning_rate": 4.4353429496055685e-05, "epoch": 0.5438381361128142, "percentage": 54.38, "elapsed_time": "23:05:18", "remaining_time": "19:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9758, "total_steps": 17941, "loss": 1.5669, "learning_rate": 4.4344582311638234e-05, "epoch": 0.5438938743659774, "percentage": 54.39, "elapsed_time": "23:05:26", "remaining_time": "19:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9759, "total_steps": 17941, "loss": 1.8168, "learning_rate": 4.4335735306577645e-05, "epoch": 0.5439496126191405, "percentage": 54.39, "elapsed_time": "23:05:35", "remaining_time": "19:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9760, "total_steps": 17941, "loss": 1.449, "learning_rate": 4.432688848115455e-05, "epoch": 0.5440053508723036, "percentage": 54.4, "elapsed_time": "23:05:43", "remaining_time": "19:21:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9761, "total_steps": 17941, "loss": 1.7658, "learning_rate": 4.431804183564944e-05, "epoch": 0.5440610891254668, "percentage": 54.41, "elapsed_time": "23:05:52", "remaining_time": "19:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9762, "total_steps": 17941, "loss": 1.6033, "learning_rate": 4.430919537034293e-05, "epoch": 0.54411682737863, "percentage": 54.41, "elapsed_time": "23:06:00", "remaining_time": "19:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9763, "total_steps": 17941, "loss": 1.5546, "learning_rate": 4.430034908551556e-05, "epoch": 0.5441725656317931, "percentage": 54.42, "elapsed_time": "23:06:09", "remaining_time": "19:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9764, "total_steps": 17941, "loss": 1.6856, "learning_rate": 4.429150298144789e-05, "epoch": 0.5442283038849562, "percentage": 54.42, "elapsed_time": "23:06:17", "remaining_time": "19:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9765, "total_steps": 17941, "loss": 1.7699, "learning_rate": 4.428265705842045e-05, "epoch": 0.5442840421381194, "percentage": 54.43, "elapsed_time": "23:06:26", "remaining_time": "19:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9766, "total_steps": 17941, "loss": 1.5959, "learning_rate": 4.42738113167138e-05, "epoch": 0.5443397803912825, "percentage": 54.43, "elapsed_time": "23:06:34", "remaining_time": "19:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9767, "total_steps": 17941, "loss": 1.7393, "learning_rate": 4.426496575660848e-05, "epoch": 0.5443955186444457, "percentage": 54.44, "elapsed_time": "23:06:42", "remaining_time": "19:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9768, "total_steps": 17941, "loss": 1.7109, "learning_rate": 4.425612037838498e-05, "epoch": 0.5444512568976089, "percentage": 54.45, "elapsed_time": "23:06:51", "remaining_time": "19:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9769, "total_steps": 17941, "loss": 1.5678, "learning_rate": 4.424727518232389e-05, "epoch": 0.5445069951507719, "percentage": 54.45, "elapsed_time": "23:06:59", "remaining_time": "19:20:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9770, "total_steps": 17941, "loss": 1.6594, "learning_rate": 4.4238430168705655e-05, "epoch": 0.5445627334039351, "percentage": 54.46, "elapsed_time": "23:07:08", "remaining_time": "19:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9771, "total_steps": 17941, "loss": 1.6752, "learning_rate": 4.422958533781084e-05, "epoch": 0.5446184716570983, "percentage": 54.46, "elapsed_time": "23:07:16", "remaining_time": "19:19:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9772, "total_steps": 17941, "loss": 1.6174, "learning_rate": 4.422074068991994e-05, "epoch": 0.5446742099102614, "percentage": 54.47, "elapsed_time": "23:07:25", "remaining_time": "19:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9773, "total_steps": 17941, "loss": 1.666, "learning_rate": 4.4211896225313446e-05, "epoch": 0.5447299481634246, "percentage": 54.47, "elapsed_time": "23:07:33", "remaining_time": "19:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9774, "total_steps": 17941, "loss": 1.7369, "learning_rate": 4.420305194427186e-05, "epoch": 0.5447856864165878, "percentage": 54.48, "elapsed_time": "23:07:42", "remaining_time": "19:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9775, "total_steps": 17941, "loss": 1.6213, "learning_rate": 4.4194207847075655e-05, "epoch": 0.5448414246697508, "percentage": 54.48, "elapsed_time": "23:07:50", "remaining_time": "19:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9776, "total_steps": 17941, "loss": 1.8705, "learning_rate": 4.4185363934005346e-05, "epoch": 0.544897162922914, "percentage": 54.49, "elapsed_time": "23:07:59", "remaining_time": "19:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9777, "total_steps": 17941, "loss": 1.8517, "learning_rate": 4.417652020534137e-05, "epoch": 0.5449529011760771, "percentage": 54.5, "elapsed_time": "23:08:07", "remaining_time": "19:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9778, "total_steps": 17941, "loss": 1.4589, "learning_rate": 4.416767666136422e-05, "epoch": 0.5450086394292403, "percentage": 54.5, "elapsed_time": "23:08:17", "remaining_time": "19:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9779, "total_steps": 17941, "loss": 1.6545, "learning_rate": 4.415883330235438e-05, "epoch": 0.5450643776824035, "percentage": 54.51, "elapsed_time": "23:08:25", "remaining_time": "19:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9780, "total_steps": 17941, "loss": 1.951, "learning_rate": 4.4149990128592275e-05, "epoch": 0.5451201159355665, "percentage": 54.51, "elapsed_time": "23:08:34", "remaining_time": "19:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9781, "total_steps": 17941, "loss": 1.7445, "learning_rate": 4.41411471403584e-05, "epoch": 0.5451758541887297, "percentage": 54.52, "elapsed_time": "23:08:42", "remaining_time": "19:18:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9782, "total_steps": 17941, "loss": 1.8898, "learning_rate": 4.413230433793315e-05, "epoch": 0.5452315924418929, "percentage": 54.52, "elapsed_time": "23:08:50", "remaining_time": "19:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9783, "total_steps": 17941, "loss": 1.7319, "learning_rate": 4.4123461721597016e-05, "epoch": 0.545287330695056, "percentage": 54.53, "elapsed_time": "23:08:59", "remaining_time": "19:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9784, "total_steps": 17941, "loss": 1.7698, "learning_rate": 4.41146192916304e-05, "epoch": 0.5453430689482192, "percentage": 54.53, "elapsed_time": "23:09:07", "remaining_time": "19:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9785, "total_steps": 17941, "loss": 1.8118, "learning_rate": 4.4105777048313734e-05, "epoch": 0.5453988072013823, "percentage": 54.54, "elapsed_time": "23:09:16", "remaining_time": "19:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9786, "total_steps": 17941, "loss": 1.6101, "learning_rate": 4.409693499192748e-05, "epoch": 0.5454545454545454, "percentage": 54.55, "elapsed_time": "23:09:24", "remaining_time": "19:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9787, "total_steps": 17941, "loss": 1.55, "learning_rate": 4.408809312275202e-05, "epoch": 0.5455102837077086, "percentage": 54.55, "elapsed_time": "23:09:33", "remaining_time": "19:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9788, "total_steps": 17941, "loss": 1.7077, "learning_rate": 4.407925144106778e-05, "epoch": 0.5455660219608718, "percentage": 54.56, "elapsed_time": "23:09:42", "remaining_time": "19:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9789, "total_steps": 17941, "loss": 1.736, "learning_rate": 4.4070409947155164e-05, "epoch": 0.5456217602140349, "percentage": 54.56, "elapsed_time": "23:09:50", "remaining_time": "19:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9790, "total_steps": 17941, "loss": 1.5738, "learning_rate": 4.406156864129458e-05, "epoch": 0.545677498467198, "percentage": 54.57, "elapsed_time": "23:09:59", "remaining_time": "19:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9791, "total_steps": 17941, "loss": 1.6053, "learning_rate": 4.40527275237664e-05, "epoch": 0.5457332367203612, "percentage": 54.57, "elapsed_time": "23:10:07", "remaining_time": "19:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9792, "total_steps": 17941, "loss": 1.3866, "learning_rate": 4.404388659485102e-05, "epoch": 0.5457889749735243, "percentage": 54.58, "elapsed_time": "23:10:16", "remaining_time": "19:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9793, "total_steps": 17941, "loss": 1.8915, "learning_rate": 4.403504585482886e-05, "epoch": 0.5458447132266875, "percentage": 54.58, "elapsed_time": "23:10:24", "remaining_time": "19:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9794, "total_steps": 17941, "loss": 1.7637, "learning_rate": 4.402620530398024e-05, "epoch": 0.5459004514798507, "percentage": 54.59, "elapsed_time": "23:10:33", "remaining_time": "19:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9795, "total_steps": 17941, "loss": 1.6987, "learning_rate": 4.401736494258559e-05, "epoch": 0.5459561897330137, "percentage": 54.6, "elapsed_time": "23:10:41", "remaining_time": "19:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9796, "total_steps": 17941, "loss": 1.4462, "learning_rate": 4.400852477092521e-05, "epoch": 0.5460119279861769, "percentage": 54.6, "elapsed_time": "23:10:49", "remaining_time": "19:16:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9797, "total_steps": 17941, "loss": 1.5191, "learning_rate": 4.399968478927949e-05, "epoch": 0.5460676662393401, "percentage": 54.61, "elapsed_time": "23:10:58", "remaining_time": "19:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9798, "total_steps": 17941, "loss": 1.6671, "learning_rate": 4.399084499792882e-05, "epoch": 0.5461234044925032, "percentage": 54.61, "elapsed_time": "23:11:06", "remaining_time": "19:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9799, "total_steps": 17941, "loss": 1.6921, "learning_rate": 4.398200539715348e-05, "epoch": 0.5461791427456664, "percentage": 54.62, "elapsed_time": "23:11:15", "remaining_time": "19:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9800, "total_steps": 17941, "loss": 1.7919, "learning_rate": 4.397316598723385e-05, "epoch": 0.5462348809988294, "percentage": 54.62, "elapsed_time": "23:11:23", "remaining_time": "19:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9801, "total_steps": 17941, "loss": 1.8814, "learning_rate": 4.396432676845026e-05, "epoch": 0.5462906192519926, "percentage": 54.63, "elapsed_time": "23:11:32", "remaining_time": "19:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9802, "total_steps": 17941, "loss": 1.5737, "learning_rate": 4.395548774108304e-05, "epoch": 0.5463463575051558, "percentage": 54.63, "elapsed_time": "23:11:40", "remaining_time": "19:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9803, "total_steps": 17941, "loss": 1.6611, "learning_rate": 4.3946648905412486e-05, "epoch": 0.5464020957583189, "percentage": 54.64, "elapsed_time": "23:11:49", "remaining_time": "19:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9804, "total_steps": 17941, "loss": 1.7487, "learning_rate": 4.393781026171894e-05, "epoch": 0.5464578340114821, "percentage": 54.65, "elapsed_time": "23:11:57", "remaining_time": "19:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9805, "total_steps": 17941, "loss": 1.5144, "learning_rate": 4.392897181028273e-05, "epoch": 0.5465135722646453, "percentage": 54.65, "elapsed_time": "23:12:05", "remaining_time": "19:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9806, "total_steps": 17941, "loss": 1.4697, "learning_rate": 4.392013355138411e-05, "epoch": 0.5465693105178083, "percentage": 54.66, "elapsed_time": "23:12:14", "remaining_time": "19:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9807, "total_steps": 17941, "loss": 1.5778, "learning_rate": 4.391129548530343e-05, "epoch": 0.5466250487709715, "percentage": 54.66, "elapsed_time": "23:12:22", "remaining_time": "19:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9808, "total_steps": 17941, "loss": 1.692, "learning_rate": 4.390245761232094e-05, "epoch": 0.5466807870241347, "percentage": 54.67, "elapsed_time": "23:12:31", "remaining_time": "19:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9809, "total_steps": 17941, "loss": 1.6905, "learning_rate": 4.389361993271696e-05, "epoch": 0.5467365252772978, "percentage": 54.67, "elapsed_time": "23:12:39", "remaining_time": "19:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9810, "total_steps": 17941, "loss": 1.6399, "learning_rate": 4.388478244677174e-05, "epoch": 0.546792263530461, "percentage": 54.68, "elapsed_time": "23:12:48", "remaining_time": "19:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9811, "total_steps": 17941, "loss": 1.6705, "learning_rate": 4.387594515476555e-05, "epoch": 0.5468480017836241, "percentage": 54.68, "elapsed_time": "23:12:57", "remaining_time": "19:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9812, "total_steps": 17941, "loss": 1.2681, "learning_rate": 4.386710805697871e-05, "epoch": 0.5469037400367872, "percentage": 54.69, "elapsed_time": "23:13:05", "remaining_time": "19:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9813, "total_steps": 17941, "loss": 1.7306, "learning_rate": 4.385827115369142e-05, "epoch": 0.5469594782899504, "percentage": 54.7, "elapsed_time": "23:13:14", "remaining_time": "19:14:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9814, "total_steps": 17941, "loss": 1.7266, "learning_rate": 4.3849434445183977e-05, "epoch": 0.5470152165431136, "percentage": 54.7, "elapsed_time": "23:13:22", "remaining_time": "19:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9815, "total_steps": 17941, "loss": 1.7676, "learning_rate": 4.38405979317366e-05, "epoch": 0.5470709547962767, "percentage": 54.71, "elapsed_time": "23:13:31", "remaining_time": "19:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9816, "total_steps": 17941, "loss": 1.5504, "learning_rate": 4.383176161362956e-05, "epoch": 0.5471266930494398, "percentage": 54.71, "elapsed_time": "23:13:39", "remaining_time": "19:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9817, "total_steps": 17941, "loss": 1.5915, "learning_rate": 4.382292549114306e-05, "epoch": 0.547182431302603, "percentage": 54.72, "elapsed_time": "23:13:48", "remaining_time": "19:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9818, "total_steps": 17941, "loss": 1.7682, "learning_rate": 4.381408956455734e-05, "epoch": 0.5472381695557661, "percentage": 54.72, "elapsed_time": "23:13:56", "remaining_time": "19:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9819, "total_steps": 17941, "loss": 1.7587, "learning_rate": 4.380525383415267e-05, "epoch": 0.5472939078089293, "percentage": 54.73, "elapsed_time": "23:14:05", "remaining_time": "19:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9820, "total_steps": 17941, "loss": 1.8327, "learning_rate": 4.3796418300209194e-05, "epoch": 0.5473496460620925, "percentage": 54.73, "elapsed_time": "23:14:13", "remaining_time": "19:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9821, "total_steps": 17941, "loss": 1.7339, "learning_rate": 4.378758296300719e-05, "epoch": 0.5474053843152555, "percentage": 54.74, "elapsed_time": "23:14:21", "remaining_time": "19:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9822, "total_steps": 17941, "loss": 1.7792, "learning_rate": 4.377874782282681e-05, "epoch": 0.5474611225684187, "percentage": 54.75, "elapsed_time": "23:14:30", "remaining_time": "19:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9823, "total_steps": 17941, "loss": 1.5596, "learning_rate": 4.376991287994829e-05, "epoch": 0.5475168608215818, "percentage": 54.75, "elapsed_time": "23:14:38", "remaining_time": "19:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9824, "total_steps": 17941, "loss": 1.5048, "learning_rate": 4.376107813465181e-05, "epoch": 0.547572599074745, "percentage": 54.76, "elapsed_time": "23:14:47", "remaining_time": "19:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9825, "total_steps": 17941, "loss": 1.6238, "learning_rate": 4.3752243587217546e-05, "epoch": 0.5476283373279082, "percentage": 54.76, "elapsed_time": "23:14:55", "remaining_time": "19:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9826, "total_steps": 17941, "loss": 1.5942, "learning_rate": 4.37434092379257e-05, "epoch": 0.5476840755810712, "percentage": 54.77, "elapsed_time": "23:15:04", "remaining_time": "19:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9827, "total_steps": 17941, "loss": 1.6875, "learning_rate": 4.3734575087056425e-05, "epoch": 0.5477398138342344, "percentage": 54.77, "elapsed_time": "23:15:12", "remaining_time": "19:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9828, "total_steps": 17941, "loss": 1.4169, "learning_rate": 4.372574113488991e-05, "epoch": 0.5477955520873976, "percentage": 54.78, "elapsed_time": "23:15:21", "remaining_time": "19:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9829, "total_steps": 17941, "loss": 1.7524, "learning_rate": 4.371690738170628e-05, "epoch": 0.5478512903405607, "percentage": 54.79, "elapsed_time": "23:15:29", "remaining_time": "19:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9830, "total_steps": 17941, "loss": 1.859, "learning_rate": 4.370807382778573e-05, "epoch": 0.5479070285937239, "percentage": 54.79, "elapsed_time": "23:15:38", "remaining_time": "19:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9831, "total_steps": 17941, "loss": 1.4963, "learning_rate": 4.36992404734084e-05, "epoch": 0.547962766846887, "percentage": 54.8, "elapsed_time": "23:15:47", "remaining_time": "19:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9832, "total_steps": 17941, "loss": 1.4895, "learning_rate": 4.3690407318854416e-05, "epoch": 0.5480185051000501, "percentage": 54.8, "elapsed_time": "23:15:55", "remaining_time": "19:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9833, "total_steps": 17941, "loss": 1.6322, "learning_rate": 4.3681574364403936e-05, "epoch": 0.5480742433532133, "percentage": 54.81, "elapsed_time": "23:16:04", "remaining_time": "19:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9834, "total_steps": 17941, "loss": 1.5524, "learning_rate": 4.367274161033707e-05, "epoch": 0.5481299816063765, "percentage": 54.81, "elapsed_time": "23:16:12", "remaining_time": "19:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9835, "total_steps": 17941, "loss": 1.5659, "learning_rate": 4.366390905693396e-05, "epoch": 0.5481857198595396, "percentage": 54.82, "elapsed_time": "23:16:21", "remaining_time": "19:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9836, "total_steps": 17941, "loss": 1.5188, "learning_rate": 4.36550767044747e-05, "epoch": 0.5482414581127028, "percentage": 54.82, "elapsed_time": "23:16:29", "remaining_time": "19:10:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9837, "total_steps": 17941, "loss": 1.6353, "learning_rate": 4.36462445532394e-05, "epoch": 0.5482971963658659, "percentage": 54.83, "elapsed_time": "23:16:38", "remaining_time": "19:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9838, "total_steps": 17941, "loss": 1.6311, "learning_rate": 4.3637412603508206e-05, "epoch": 0.548352934619029, "percentage": 54.84, "elapsed_time": "23:16:46", "remaining_time": "19:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9839, "total_steps": 17941, "loss": 1.5426, "learning_rate": 4.3628580855561176e-05, "epoch": 0.5484086728721922, "percentage": 54.84, "elapsed_time": "23:16:55", "remaining_time": "19:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9840, "total_steps": 17941, "loss": 1.7261, "learning_rate": 4.361974930967842e-05, "epoch": 0.5484644111253554, "percentage": 54.85, "elapsed_time": "23:17:03", "remaining_time": "19:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9841, "total_steps": 17941, "loss": 1.6934, "learning_rate": 4.361091796614001e-05, "epoch": 0.5485201493785185, "percentage": 54.85, "elapsed_time": "23:17:12", "remaining_time": "19:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9842, "total_steps": 17941, "loss": 1.6504, "learning_rate": 4.360208682522603e-05, "epoch": 0.5485758876316816, "percentage": 54.86, "elapsed_time": "23:17:20", "remaining_time": "19:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9843, "total_steps": 17941, "loss": 1.5194, "learning_rate": 4.3593255887216555e-05, "epoch": 0.5486316258848448, "percentage": 54.86, "elapsed_time": "23:17:29", "remaining_time": "19:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9844, "total_steps": 17941, "loss": 1.7104, "learning_rate": 4.358442515239164e-05, "epoch": 0.5486873641380079, "percentage": 54.87, "elapsed_time": "23:17:37", "remaining_time": "19:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9845, "total_steps": 17941, "loss": 1.547, "learning_rate": 4.357559462103138e-05, "epoch": 0.5487431023911711, "percentage": 54.87, "elapsed_time": "23:17:46", "remaining_time": "19:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9846, "total_steps": 17941, "loss": 1.675, "learning_rate": 4.3566764293415776e-05, "epoch": 0.5487988406443342, "percentage": 54.88, "elapsed_time": "23:17:54", "remaining_time": "19:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9847, "total_steps": 17941, "loss": 1.6043, "learning_rate": 4.355793416982492e-05, "epoch": 0.5488545788974973, "percentage": 54.89, "elapsed_time": "23:18:03", "remaining_time": "19:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9848, "total_steps": 17941, "loss": 1.7647, "learning_rate": 4.354910425053881e-05, "epoch": 0.5489103171506605, "percentage": 54.89, "elapsed_time": "23:18:11", "remaining_time": "19:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9849, "total_steps": 17941, "loss": 1.5597, "learning_rate": 4.3540274535837524e-05, "epoch": 0.5489660554038236, "percentage": 54.9, "elapsed_time": "23:18:20", "remaining_time": "19:08:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9850, "total_steps": 17941, "loss": 1.6489, "learning_rate": 4.353144502600105e-05, "epoch": 0.5490217936569868, "percentage": 54.9, "elapsed_time": "23:18:28", "remaining_time": "19:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9851, "total_steps": 17941, "loss": 1.7917, "learning_rate": 4.3522615721309436e-05, "epoch": 0.54907753191015, "percentage": 54.91, "elapsed_time": "23:18:37", "remaining_time": "19:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9852, "total_steps": 17941, "loss": 1.7261, "learning_rate": 4.3513786622042685e-05, "epoch": 0.549133270163313, "percentage": 54.91, "elapsed_time": "23:18:46", "remaining_time": "19:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9853, "total_steps": 17941, "loss": 1.6477, "learning_rate": 4.35049577284808e-05, "epoch": 0.5491890084164762, "percentage": 54.92, "elapsed_time": "23:18:54", "remaining_time": "19:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9854, "total_steps": 17941, "loss": 1.5079, "learning_rate": 4.3496129040903795e-05, "epoch": 0.5492447466696394, "percentage": 54.92, "elapsed_time": "23:19:02", "remaining_time": "19:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9855, "total_steps": 17941, "loss": 1.6616, "learning_rate": 4.348730055959164e-05, "epoch": 0.5493004849228025, "percentage": 54.93, "elapsed_time": "23:19:11", "remaining_time": "19:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9856, "total_steps": 17941, "loss": 1.8967, "learning_rate": 4.3478472284824346e-05, "epoch": 0.5493562231759657, "percentage": 54.94, "elapsed_time": "23:19:19", "remaining_time": "19:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9857, "total_steps": 17941, "loss": 1.8138, "learning_rate": 4.3469644216881893e-05, "epoch": 0.5494119614291288, "percentage": 54.94, "elapsed_time": "23:19:28", "remaining_time": "19:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9858, "total_steps": 17941, "loss": 1.6882, "learning_rate": 4.346081635604425e-05, "epoch": 0.5494676996822919, "percentage": 54.95, "elapsed_time": "23:19:36", "remaining_time": "19:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9859, "total_steps": 17941, "loss": 1.8155, "learning_rate": 4.34519887025914e-05, "epoch": 0.5495234379354551, "percentage": 54.95, "elapsed_time": "23:19:45", "remaining_time": "19:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9860, "total_steps": 17941, "loss": 1.5754, "learning_rate": 4.3443161256803264e-05, "epoch": 0.5495791761886183, "percentage": 54.96, "elapsed_time": "23:19:54", "remaining_time": "19:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9861, "total_steps": 17941, "loss": 1.6735, "learning_rate": 4.343433401895984e-05, "epoch": 0.5496349144417814, "percentage": 54.96, "elapsed_time": "23:20:03", "remaining_time": "19:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9862, "total_steps": 17941, "loss": 1.5815, "learning_rate": 4.342550698934106e-05, "epoch": 0.5496906526949445, "percentage": 54.97, "elapsed_time": "23:20:12", "remaining_time": "19:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9863, "total_steps": 17941, "loss": 1.5027, "learning_rate": 4.3416680168226855e-05, "epoch": 0.5497463909481077, "percentage": 54.97, "elapsed_time": "23:20:21", "remaining_time": "19:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9864, "total_steps": 17941, "loss": 1.6578, "learning_rate": 4.340785355589718e-05, "epoch": 0.5498021292012708, "percentage": 54.98, "elapsed_time": "23:20:29", "remaining_time": "19:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9865, "total_steps": 17941, "loss": 1.4347, "learning_rate": 4.339902715263195e-05, "epoch": 0.549857867454434, "percentage": 54.99, "elapsed_time": "23:20:38", "remaining_time": "19:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9866, "total_steps": 17941, "loss": 1.6696, "learning_rate": 4.339020095871111e-05, "epoch": 0.5499136057075972, "percentage": 54.99, "elapsed_time": "23:20:46", "remaining_time": "19:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9867, "total_steps": 17941, "loss": 1.6238, "learning_rate": 4.338137497441454e-05, "epoch": 0.5499693439607602, "percentage": 55.0, "elapsed_time": "23:20:55", "remaining_time": "19:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9868, "total_steps": 17941, "loss": 1.6317, "learning_rate": 4.337254920002218e-05, "epoch": 0.5500250822139234, "percentage": 55.0, "elapsed_time": "23:21:03", "remaining_time": "19:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9869, "total_steps": 17941, "loss": 1.4349, "learning_rate": 4.336372363581391e-05, "epoch": 0.5500808204670865, "percentage": 55.01, "elapsed_time": "23:21:12", "remaining_time": "19:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9870, "total_steps": 17941, "loss": 1.4318, "learning_rate": 4.3354898282069624e-05, "epoch": 0.5501365587202497, "percentage": 55.01, "elapsed_time": "23:21:21", "remaining_time": "19:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9871, "total_steps": 17941, "loss": 1.7328, "learning_rate": 4.3346073139069245e-05, "epoch": 0.5501922969734129, "percentage": 55.02, "elapsed_time": "23:21:29", "remaining_time": "19:05:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9872, "total_steps": 17941, "loss": 1.6179, "learning_rate": 4.3337248207092604e-05, "epoch": 0.550248035226576, "percentage": 55.02, "elapsed_time": "23:21:38", "remaining_time": "19:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9873, "total_steps": 17941, "loss": 1.7354, "learning_rate": 4.332842348641962e-05, "epoch": 0.5503037734797391, "percentage": 55.03, "elapsed_time": "23:21:46", "remaining_time": "19:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9874, "total_steps": 17941, "loss": 1.4075, "learning_rate": 4.331959897733015e-05, "epoch": 0.5503595117329023, "percentage": 55.04, "elapsed_time": "23:21:55", "remaining_time": "19:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9875, "total_steps": 17941, "loss": 1.7368, "learning_rate": 4.3310774680104045e-05, "epoch": 0.5504152499860654, "percentage": 55.04, "elapsed_time": "23:22:03", "remaining_time": "19:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9876, "total_steps": 17941, "loss": 1.6125, "learning_rate": 4.330195059502116e-05, "epoch": 0.5504709882392286, "percentage": 55.05, "elapsed_time": "23:22:12", "remaining_time": "19:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9877, "total_steps": 17941, "loss": 1.5961, "learning_rate": 4.329312672236136e-05, "epoch": 0.5505267264923918, "percentage": 55.05, "elapsed_time": "23:22:20", "remaining_time": "19:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9878, "total_steps": 17941, "loss": 1.7871, "learning_rate": 4.328430306240447e-05, "epoch": 0.5505824647455548, "percentage": 55.06, "elapsed_time": "23:22:29", "remaining_time": "19:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9879, "total_steps": 17941, "loss": 1.6864, "learning_rate": 4.327547961543032e-05, "epoch": 0.550638202998718, "percentage": 55.06, "elapsed_time": "23:22:38", "remaining_time": "19:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9880, "total_steps": 17941, "loss": 1.503, "learning_rate": 4.3266656381718776e-05, "epoch": 0.5506939412518812, "percentage": 55.07, "elapsed_time": "23:22:46", "remaining_time": "19:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9881, "total_steps": 17941, "loss": 1.6596, "learning_rate": 4.325783336154961e-05, "epoch": 0.5507496795050443, "percentage": 55.07, "elapsed_time": "23:22:55", "remaining_time": "19:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9882, "total_steps": 17941, "loss": 1.5023, "learning_rate": 4.324901055520266e-05, "epoch": 0.5508054177582075, "percentage": 55.08, "elapsed_time": "23:23:03", "remaining_time": "19:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9883, "total_steps": 17941, "loss": 1.6991, "learning_rate": 4.324018796295776e-05, "epoch": 0.5508611560113706, "percentage": 55.09, "elapsed_time": "23:23:12", "remaining_time": "19:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9884, "total_steps": 17941, "loss": 1.5738, "learning_rate": 4.323136558509466e-05, "epoch": 0.5509168942645337, "percentage": 55.09, "elapsed_time": "23:23:20", "remaining_time": "19:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9885, "total_steps": 17941, "loss": 1.8939, "learning_rate": 4.3222543421893205e-05, "epoch": 0.5509726325176969, "percentage": 55.1, "elapsed_time": "23:23:29", "remaining_time": "19:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9886, "total_steps": 17941, "loss": 1.3017, "learning_rate": 4.3213721473633136e-05, "epoch": 0.5510283707708601, "percentage": 55.1, "elapsed_time": "23:23:37", "remaining_time": "19:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9887, "total_steps": 17941, "loss": 1.6982, "learning_rate": 4.320489974059426e-05, "epoch": 0.5510841090240232, "percentage": 55.11, "elapsed_time": "23:23:46", "remaining_time": "19:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9888, "total_steps": 17941, "loss": 1.75, "learning_rate": 4.3196078223056346e-05, "epoch": 0.5511398472771863, "percentage": 55.11, "elapsed_time": "23:23:54", "remaining_time": "19:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9889, "total_steps": 17941, "loss": 1.6721, "learning_rate": 4.3187256921299155e-05, "epoch": 0.5511955855303495, "percentage": 55.12, "elapsed_time": "23:24:02", "remaining_time": "19:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9890, "total_steps": 17941, "loss": 1.6611, "learning_rate": 4.317843583560246e-05, "epoch": 0.5512513237835126, "percentage": 55.13, "elapsed_time": "23:24:11", "remaining_time": "19:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9891, "total_steps": 17941, "loss": 1.5042, "learning_rate": 4.316961496624601e-05, "epoch": 0.5513070620366758, "percentage": 55.13, "elapsed_time": "23:24:20", "remaining_time": "19:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9892, "total_steps": 17941, "loss": 1.5001, "learning_rate": 4.316079431350956e-05, "epoch": 0.5513628002898389, "percentage": 55.14, "elapsed_time": "23:24:28", "remaining_time": "19:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9893, "total_steps": 17941, "loss": 1.3369, "learning_rate": 4.3151973877672815e-05, "epoch": 0.551418538543002, "percentage": 55.14, "elapsed_time": "23:24:36", "remaining_time": "19:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9894, "total_steps": 17941, "loss": 1.7525, "learning_rate": 4.314315365901555e-05, "epoch": 0.5514742767961652, "percentage": 55.15, "elapsed_time": "23:24:45", "remaining_time": "19:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9895, "total_steps": 17941, "loss": 1.7689, "learning_rate": 4.3134333657817464e-05, "epoch": 0.5515300150493283, "percentage": 55.15, "elapsed_time": "23:24:53", "remaining_time": "19:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9896, "total_steps": 17941, "loss": 1.8022, "learning_rate": 4.312551387435827e-05, "epoch": 0.5515857533024915, "percentage": 55.16, "elapsed_time": "23:25:02", "remaining_time": "19:02:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9897, "total_steps": 17941, "loss": 1.7209, "learning_rate": 4.311669430891773e-05, "epoch": 0.5516414915556547, "percentage": 55.16, "elapsed_time": "23:25:10", "remaining_time": "19:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9898, "total_steps": 17941, "loss": 1.6729, "learning_rate": 4.310787496177548e-05, "epoch": 0.5516972298088177, "percentage": 55.17, "elapsed_time": "23:25:19", "remaining_time": "19:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9899, "total_steps": 17941, "loss": 1.4496, "learning_rate": 4.309905583321128e-05, "epoch": 0.5517529680619809, "percentage": 55.18, "elapsed_time": "23:25:27", "remaining_time": "19:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9900, "total_steps": 17941, "loss": 1.5063, "learning_rate": 4.309023692350478e-05, "epoch": 0.5518087063151441, "percentage": 55.18, "elapsed_time": "23:25:36", "remaining_time": "19:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9901, "total_steps": 17941, "loss": 1.5095, "learning_rate": 4.3081418232935687e-05, "epoch": 0.5518644445683072, "percentage": 55.19, "elapsed_time": "23:25:44", "remaining_time": "19:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9902, "total_steps": 17941, "loss": 1.7476, "learning_rate": 4.3072599761783664e-05, "epoch": 0.5519201828214704, "percentage": 55.19, "elapsed_time": "23:25:53", "remaining_time": "19:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9903, "total_steps": 17941, "loss": 1.3913, "learning_rate": 4.306378151032838e-05, "epoch": 0.5519759210746336, "percentage": 55.2, "elapsed_time": "23:26:01", "remaining_time": "19:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9904, "total_steps": 17941, "loss": 1.6125, "learning_rate": 4.3054963478849517e-05, "epoch": 0.5520316593277966, "percentage": 55.2, "elapsed_time": "23:26:10", "remaining_time": "19:01:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9905, "total_steps": 17941, "loss": 1.8131, "learning_rate": 4.30461456676267e-05, "epoch": 0.5520873975809598, "percentage": 55.21, "elapsed_time": "23:26:18", "remaining_time": "19:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9906, "total_steps": 17941, "loss": 1.4352, "learning_rate": 4.303732807693963e-05, "epoch": 0.552143135834123, "percentage": 55.21, "elapsed_time": "23:26:27", "remaining_time": "19:00:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9907, "total_steps": 17941, "loss": 1.9657, "learning_rate": 4.3028510707067885e-05, "epoch": 0.5521988740872861, "percentage": 55.22, "elapsed_time": "23:26:35", "remaining_time": "19:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9908, "total_steps": 17941, "loss": 1.8648, "learning_rate": 4.3019693558291144e-05, "epoch": 0.5522546123404493, "percentage": 55.23, "elapsed_time": "23:26:44", "remaining_time": "19:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9909, "total_steps": 17941, "loss": 1.4133, "learning_rate": 4.301087663088904e-05, "epoch": 0.5523103505936124, "percentage": 55.23, "elapsed_time": "23:26:52", "remaining_time": "19:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9910, "total_steps": 17941, "loss": 1.8159, "learning_rate": 4.300205992514117e-05, "epoch": 0.5523660888467755, "percentage": 55.24, "elapsed_time": "23:27:01", "remaining_time": "19:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9911, "total_steps": 17941, "loss": 1.7179, "learning_rate": 4.299324344132717e-05, "epoch": 0.5524218270999387, "percentage": 55.24, "elapsed_time": "23:27:09", "remaining_time": "19:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9912, "total_steps": 17941, "loss": 1.6968, "learning_rate": 4.298442717972662e-05, "epoch": 0.5524775653531019, "percentage": 55.25, "elapsed_time": "23:27:17", "remaining_time": "18:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9913, "total_steps": 17941, "loss": 1.6225, "learning_rate": 4.297561114061915e-05, "epoch": 0.552533303606265, "percentage": 55.25, "elapsed_time": "23:27:26", "remaining_time": "18:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9914, "total_steps": 17941, "loss": 1.4759, "learning_rate": 4.2966795324284324e-05, "epoch": 0.5525890418594281, "percentage": 55.26, "elapsed_time": "23:27:34", "remaining_time": "18:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9915, "total_steps": 17941, "loss": 1.456, "learning_rate": 4.295797973100174e-05, "epoch": 0.5526447801125912, "percentage": 55.26, "elapsed_time": "23:27:43", "remaining_time": "18:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9916, "total_steps": 17941, "loss": 1.625, "learning_rate": 4.2949164361051e-05, "epoch": 0.5527005183657544, "percentage": 55.27, "elapsed_time": "23:27:52", "remaining_time": "18:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9917, "total_steps": 17941, "loss": 1.3695, "learning_rate": 4.294034921471164e-05, "epoch": 0.5527562566189176, "percentage": 55.28, "elapsed_time": "23:28:00", "remaining_time": "18:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9918, "total_steps": 17941, "loss": 1.748, "learning_rate": 4.2931534292263264e-05, "epoch": 0.5528119948720807, "percentage": 55.28, "elapsed_time": "23:28:09", "remaining_time": "18:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9919, "total_steps": 17941, "loss": 1.7037, "learning_rate": 4.292271959398539e-05, "epoch": 0.5528677331252438, "percentage": 55.29, "elapsed_time": "23:28:18", "remaining_time": "18:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9920, "total_steps": 17941, "loss": 1.9699, "learning_rate": 4.2913905120157596e-05, "epoch": 0.552923471378407, "percentage": 55.29, "elapsed_time": "23:28:26", "remaining_time": "18:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9921, "total_steps": 17941, "loss": 1.7382, "learning_rate": 4.290509087105942e-05, "epoch": 0.5529792096315701, "percentage": 55.3, "elapsed_time": "23:28:35", "remaining_time": "18:58:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9922, "total_steps": 17941, "loss": 1.5503, "learning_rate": 4.289627684697037e-05, "epoch": 0.5530349478847333, "percentage": 55.3, "elapsed_time": "23:28:43", "remaining_time": "18:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9923, "total_steps": 17941, "loss": 1.3335, "learning_rate": 4.288746304817004e-05, "epoch": 0.5530906861378965, "percentage": 55.31, "elapsed_time": "23:28:51", "remaining_time": "18:58:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9924, "total_steps": 17941, "loss": 1.9235, "learning_rate": 4.287864947493788e-05, "epoch": 0.5531464243910595, "percentage": 55.31, "elapsed_time": "23:29:00", "remaining_time": "18:58:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9925, "total_steps": 17941, "loss": 1.7431, "learning_rate": 4.286983612755345e-05, "epoch": 0.5532021626442227, "percentage": 55.32, "elapsed_time": "23:29:08", "remaining_time": "18:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9926, "total_steps": 17941, "loss": 1.6642, "learning_rate": 4.2861023006296245e-05, "epoch": 0.5532579008973859, "percentage": 55.33, "elapsed_time": "23:29:17", "remaining_time": "18:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9927, "total_steps": 17941, "loss": 1.5847, "learning_rate": 4.285221011144578e-05, "epoch": 0.553313639150549, "percentage": 55.33, "elapsed_time": "23:29:26", "remaining_time": "18:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9928, "total_steps": 17941, "loss": 1.6667, "learning_rate": 4.284339744328152e-05, "epoch": 0.5533693774037122, "percentage": 55.34, "elapsed_time": "23:29:34", "remaining_time": "18:57:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9929, "total_steps": 17941, "loss": 1.6661, "learning_rate": 4.283458500208297e-05, "epoch": 0.5534251156568754, "percentage": 55.34, "elapsed_time": "23:29:43", "remaining_time": "18:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9930, "total_steps": 17941, "loss": 1.57, "learning_rate": 4.282577278812962e-05, "epoch": 0.5534808539100384, "percentage": 55.35, "elapsed_time": "23:29:51", "remaining_time": "18:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9931, "total_steps": 17941, "loss": 1.6694, "learning_rate": 4.28169608017009e-05, "epoch": 0.5535365921632016, "percentage": 55.35, "elapsed_time": "23:29:59", "remaining_time": "18:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9932, "total_steps": 17941, "loss": 1.8431, "learning_rate": 4.2808149043076337e-05, "epoch": 0.5535923304163648, "percentage": 55.36, "elapsed_time": "23:30:08", "remaining_time": "18:57:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9933, "total_steps": 17941, "loss": 1.7697, "learning_rate": 4.279933751253533e-05, "epoch": 0.5536480686695279, "percentage": 55.36, "elapsed_time": "23:30:16", "remaining_time": "18:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9934, "total_steps": 17941, "loss": 1.6883, "learning_rate": 4.279052621035738e-05, "epoch": 0.553703806922691, "percentage": 55.37, "elapsed_time": "23:30:25", "remaining_time": "18:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9935, "total_steps": 17941, "loss": 1.88, "learning_rate": 4.2781715136821874e-05, "epoch": 0.5537595451758542, "percentage": 55.38, "elapsed_time": "23:30:34", "remaining_time": "18:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9936, "total_steps": 17941, "loss": 1.9303, "learning_rate": 4.277290429220829e-05, "epoch": 0.5538152834290173, "percentage": 55.38, "elapsed_time": "23:30:42", "remaining_time": "18:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9937, "total_steps": 17941, "loss": 1.7339, "learning_rate": 4.276409367679605e-05, "epoch": 0.5538710216821805, "percentage": 55.39, "elapsed_time": "23:30:51", "remaining_time": "18:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9938, "total_steps": 17941, "loss": 1.8366, "learning_rate": 4.275528329086457e-05, "epoch": 0.5539267599353436, "percentage": 55.39, "elapsed_time": "23:30:59", "remaining_time": "18:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9939, "total_steps": 17941, "loss": 1.5683, "learning_rate": 4.274647313469326e-05, "epoch": 0.5539824981885068, "percentage": 55.4, "elapsed_time": "23:31:08", "remaining_time": "18:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9940, "total_steps": 17941, "loss": 1.7331, "learning_rate": 4.273766320856152e-05, "epoch": 0.5540382364416699, "percentage": 55.4, "elapsed_time": "23:31:16", "remaining_time": "18:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9941, "total_steps": 17941, "loss": 1.6732, "learning_rate": 4.2728853512748774e-05, "epoch": 0.554093974694833, "percentage": 55.41, "elapsed_time": "23:31:25", "remaining_time": "18:55:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9942, "total_steps": 17941, "loss": 1.7369, "learning_rate": 4.272004404753441e-05, "epoch": 0.5541497129479962, "percentage": 55.41, "elapsed_time": "23:31:33", "remaining_time": "18:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9943, "total_steps": 17941, "loss": 1.5369, "learning_rate": 4.271123481319779e-05, "epoch": 0.5542054512011594, "percentage": 55.42, "elapsed_time": "23:31:42", "remaining_time": "18:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9944, "total_steps": 17941, "loss": 1.9257, "learning_rate": 4.2702425810018314e-05, "epoch": 0.5542611894543225, "percentage": 55.43, "elapsed_time": "23:31:50", "remaining_time": "18:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9945, "total_steps": 17941, "loss": 1.6092, "learning_rate": 4.269361703827533e-05, "epoch": 0.5543169277074856, "percentage": 55.43, "elapsed_time": "23:31:58", "remaining_time": "18:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9946, "total_steps": 17941, "loss": 1.5267, "learning_rate": 4.268480849824824e-05, "epoch": 0.5543726659606488, "percentage": 55.44, "elapsed_time": "23:32:07", "remaining_time": "18:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9947, "total_steps": 17941, "loss": 1.7716, "learning_rate": 4.2676000190216355e-05, "epoch": 0.5544284042138119, "percentage": 55.44, "elapsed_time": "23:32:15", "remaining_time": "18:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9948, "total_steps": 17941, "loss": 1.5671, "learning_rate": 4.266719211445903e-05, "epoch": 0.5544841424669751, "percentage": 55.45, "elapsed_time": "23:32:24", "remaining_time": "18:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9949, "total_steps": 17941, "loss": 1.68, "learning_rate": 4.265838427125565e-05, "epoch": 0.5545398807201383, "percentage": 55.45, "elapsed_time": "23:32:32", "remaining_time": "18:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9950, "total_steps": 17941, "loss": 1.6753, "learning_rate": 4.2649576660885484e-05, "epoch": 0.5545956189733013, "percentage": 55.46, "elapsed_time": "23:32:41", "remaining_time": "18:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9951, "total_steps": 17941, "loss": 1.4447, "learning_rate": 4.264076928362791e-05, "epoch": 0.5546513572264645, "percentage": 55.47, "elapsed_time": "23:32:49", "remaining_time": "18:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9952, "total_steps": 17941, "loss": 1.6929, "learning_rate": 4.2631962139762216e-05, "epoch": 0.5547070954796277, "percentage": 55.47, "elapsed_time": "23:32:58", "remaining_time": "18:54:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9953, "total_steps": 17941, "loss": 1.3731, "learning_rate": 4.262315522956774e-05, "epoch": 0.5547628337327908, "percentage": 55.48, "elapsed_time": "23:33:06", "remaining_time": "18:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9954, "total_steps": 17941, "loss": 1.4813, "learning_rate": 4.261434855332376e-05, "epoch": 0.554818571985954, "percentage": 55.48, "elapsed_time": "23:33:15", "remaining_time": "18:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9955, "total_steps": 17941, "loss": 1.7245, "learning_rate": 4.2605542111309574e-05, "epoch": 0.5548743102391172, "percentage": 55.49, "elapsed_time": "23:33:23", "remaining_time": "18:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9956, "total_steps": 17941, "loss": 1.6008, "learning_rate": 4.25967359038045e-05, "epoch": 0.5549300484922802, "percentage": 55.49, "elapsed_time": "23:33:32", "remaining_time": "18:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9957, "total_steps": 17941, "loss": 1.483, "learning_rate": 4.258792993108777e-05, "epoch": 0.5549857867454434, "percentage": 55.5, "elapsed_time": "23:33:41", "remaining_time": "18:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9958, "total_steps": 17941, "loss": 1.7526, "learning_rate": 4.257912419343872e-05, "epoch": 0.5550415249986066, "percentage": 55.5, "elapsed_time": "23:33:49", "remaining_time": "18:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9959, "total_steps": 17941, "loss": 1.593, "learning_rate": 4.257031869113656e-05, "epoch": 0.5550972632517697, "percentage": 55.51, "elapsed_time": "23:33:58", "remaining_time": "18:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9960, "total_steps": 17941, "loss": 1.6164, "learning_rate": 4.256151342446059e-05, "epoch": 0.5551530015049329, "percentage": 55.52, "elapsed_time": "23:34:06", "remaining_time": "18:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9961, "total_steps": 17941, "loss": 1.4945, "learning_rate": 4.255270839369003e-05, "epoch": 0.5552087397580959, "percentage": 55.52, "elapsed_time": "23:34:15", "remaining_time": "18:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9962, "total_steps": 17941, "loss": 1.7595, "learning_rate": 4.254390359910414e-05, "epoch": 0.5552644780112591, "percentage": 55.53, "elapsed_time": "23:34:23", "remaining_time": "18:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9963, "total_steps": 17941, "loss": 1.6638, "learning_rate": 4.2535099040982174e-05, "epoch": 0.5553202162644223, "percentage": 55.53, "elapsed_time": "23:34:32", "remaining_time": "18:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9964, "total_steps": 17941, "loss": 1.6403, "learning_rate": 4.252629471960332e-05, "epoch": 0.5553759545175854, "percentage": 55.54, "elapsed_time": "23:34:40", "remaining_time": "18:52:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9965, "total_steps": 17941, "loss": 1.7287, "learning_rate": 4.251749063524684e-05, "epoch": 0.5554316927707486, "percentage": 55.54, "elapsed_time": "23:34:49", "remaining_time": "18:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9966, "total_steps": 17941, "loss": 1.4819, "learning_rate": 4.2508686788191917e-05, "epoch": 0.5554874310239117, "percentage": 55.55, "elapsed_time": "23:34:57", "remaining_time": "18:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9967, "total_steps": 17941, "loss": 1.6855, "learning_rate": 4.249988317871777e-05, "epoch": 0.5555431692770748, "percentage": 55.55, "elapsed_time": "23:35:06", "remaining_time": "18:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9968, "total_steps": 17941, "loss": 1.6364, "learning_rate": 4.249107980710362e-05, "epoch": 0.555598907530238, "percentage": 55.56, "elapsed_time": "23:35:14", "remaining_time": "18:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9969, "total_steps": 17941, "loss": 1.6847, "learning_rate": 4.2482276673628626e-05, "epoch": 0.5556546457834012, "percentage": 55.57, "elapsed_time": "23:35:23", "remaining_time": "18:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9970, "total_steps": 17941, "loss": 1.5898, "learning_rate": 4.247347377857199e-05, "epoch": 0.5557103840365643, "percentage": 55.57, "elapsed_time": "23:35:31", "remaining_time": "18:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9971, "total_steps": 17941, "loss": 1.7209, "learning_rate": 4.2464671122212876e-05, "epoch": 0.5557661222897274, "percentage": 55.58, "elapsed_time": "23:35:40", "remaining_time": "18:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9972, "total_steps": 17941, "loss": 1.9442, "learning_rate": 4.245586870483047e-05, "epoch": 0.5558218605428906, "percentage": 55.58, "elapsed_time": "23:35:48", "remaining_time": "18:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9973, "total_steps": 17941, "loss": 1.6745, "learning_rate": 4.2447066526703914e-05, "epoch": 0.5558775987960537, "percentage": 55.59, "elapsed_time": "23:35:57", "remaining_time": "18:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9974, "total_steps": 17941, "loss": 1.7414, "learning_rate": 4.2438264588112354e-05, "epoch": 0.5559333370492169, "percentage": 55.59, "elapsed_time": "23:36:05", "remaining_time": "18:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9975, "total_steps": 17941, "loss": 1.654, "learning_rate": 4.242946288933499e-05, "epoch": 0.5559890753023801, "percentage": 55.6, "elapsed_time": "23:36:15", "remaining_time": "18:51:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9976, "total_steps": 17941, "loss": 1.8102, "learning_rate": 4.2420661430650895e-05, "epoch": 0.5560448135555431, "percentage": 55.6, "elapsed_time": "23:36:24", "remaining_time": "18:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9977, "total_steps": 17941, "loss": 1.6475, "learning_rate": 4.241186021233925e-05, "epoch": 0.5561005518087063, "percentage": 55.61, "elapsed_time": "23:36:32", "remaining_time": "18:50:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9978, "total_steps": 17941, "loss": 2.1339, "learning_rate": 4.240305923467914e-05, "epoch": 0.5561562900618695, "percentage": 55.62, "elapsed_time": "23:36:41", "remaining_time": "18:50:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9979, "total_steps": 17941, "loss": 1.6901, "learning_rate": 4.239425849794971e-05, "epoch": 0.5562120283150326, "percentage": 55.62, "elapsed_time": "23:36:50", "remaining_time": "18:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9980, "total_steps": 17941, "loss": 1.3724, "learning_rate": 4.238545800243005e-05, "epoch": 0.5562677665681958, "percentage": 55.63, "elapsed_time": "23:36:58", "remaining_time": "18:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9981, "total_steps": 17941, "loss": 1.6478, "learning_rate": 4.237665774839926e-05, "epoch": 0.556323504821359, "percentage": 55.63, "elapsed_time": "23:37:07", "remaining_time": "18:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9982, "total_steps": 17941, "loss": 1.8298, "learning_rate": 4.236785773613646e-05, "epoch": 0.556379243074522, "percentage": 55.64, "elapsed_time": "23:37:15", "remaining_time": "18:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9983, "total_steps": 17941, "loss": 1.5858, "learning_rate": 4.2359057965920684e-05, "epoch": 0.5564349813276852, "percentage": 55.64, "elapsed_time": "23:37:24", "remaining_time": "18:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9984, "total_steps": 17941, "loss": 1.7207, "learning_rate": 4.235025843803108e-05, "epoch": 0.5564907195808483, "percentage": 55.65, "elapsed_time": "23:37:32", "remaining_time": "18:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9985, "total_steps": 17941, "loss": 1.6093, "learning_rate": 4.234145915274663e-05, "epoch": 0.5565464578340115, "percentage": 55.65, "elapsed_time": "23:37:41", "remaining_time": "18:49:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9986, "total_steps": 17941, "loss": 1.6445, "learning_rate": 4.233266011034648e-05, "epoch": 0.5566021960871746, "percentage": 55.66, "elapsed_time": "23:37:49", "remaining_time": "18:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9987, "total_steps": 17941, "loss": 1.5421, "learning_rate": 4.232386131110963e-05, "epoch": 0.5566579343403377, "percentage": 55.67, "elapsed_time": "23:37:58", "remaining_time": "18:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9988, "total_steps": 17941, "loss": 1.7904, "learning_rate": 4.231506275531514e-05, "epoch": 0.5567136725935009, "percentage": 55.67, "elapsed_time": "23:38:06", "remaining_time": "18:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9989, "total_steps": 17941, "loss": 1.8607, "learning_rate": 4.230626444324207e-05, "epoch": 0.5567694108466641, "percentage": 55.68, "elapsed_time": "23:38:15", "remaining_time": "18:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9990, "total_steps": 17941, "loss": 1.6841, "learning_rate": 4.2297466375169425e-05, "epoch": 0.5568251490998272, "percentage": 55.68, "elapsed_time": "23:38:23", "remaining_time": "18:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9991, "total_steps": 17941, "loss": 1.5424, "learning_rate": 4.2288668551376246e-05, "epoch": 0.5568808873529904, "percentage": 55.69, "elapsed_time": "23:38:32", "remaining_time": "18:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9992, "total_steps": 17941, "loss": 1.7097, "learning_rate": 4.2279870972141516e-05, "epoch": 0.5569366256061535, "percentage": 55.69, "elapsed_time": "23:38:40", "remaining_time": "18:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9993, "total_steps": 17941, "loss": 1.6374, "learning_rate": 4.227107363774429e-05, "epoch": 0.5569923638593166, "percentage": 55.7, "elapsed_time": "23:38:49", "remaining_time": "18:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9994, "total_steps": 17941, "loss": 1.6, "learning_rate": 4.226227654846354e-05, "epoch": 0.5570481021124798, "percentage": 55.7, "elapsed_time": "23:38:57", "remaining_time": "18:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9995, "total_steps": 17941, "loss": 1.5008, "learning_rate": 4.2253479704578255e-05, "epoch": 0.557103840365643, "percentage": 55.71, "elapsed_time": "23:39:06", "remaining_time": "18:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9996, "total_steps": 17941, "loss": 1.6418, "learning_rate": 4.224468310636745e-05, "epoch": 0.557159578618806, "percentage": 55.72, "elapsed_time": "23:39:14", "remaining_time": "18:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9997, "total_steps": 17941, "loss": 1.8126, "learning_rate": 4.223588675411007e-05, "epoch": 0.5572153168719692, "percentage": 55.72, "elapsed_time": "23:39:23", "remaining_time": "18:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9998, "total_steps": 17941, "loss": 1.7107, "learning_rate": 4.222709064808509e-05, "epoch": 0.5572710551251324, "percentage": 55.73, "elapsed_time": "23:39:31", "remaining_time": "18:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9999, "total_steps": 17941, "loss": 1.6814, "learning_rate": 4.221829478857148e-05, "epoch": 0.5573267933782955, "percentage": 55.73, "elapsed_time": "23:39:40", "remaining_time": "18:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10000, "total_steps": 17941, "loss": 1.7406, "learning_rate": 4.220949917584817e-05, "epoch": 0.5573825316314587, "percentage": 55.74, "elapsed_time": "23:39:49", "remaining_time": "18:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10001, "total_steps": 17941, "loss": 1.6824, "learning_rate": 4.2200703810194155e-05, "epoch": 0.5574382698846219, "percentage": 55.74, "elapsed_time": "23:39:57", "remaining_time": "18:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10002, "total_steps": 17941, "loss": 1.6746, "learning_rate": 4.219190869188831e-05, "epoch": 0.5574940081377849, "percentage": 55.75, "elapsed_time": "23:40:06", "remaining_time": "18:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10003, "total_steps": 17941, "loss": 1.9145, "learning_rate": 4.2183113821209625e-05, "epoch": 0.5575497463909481, "percentage": 55.75, "elapsed_time": "23:40:14", "remaining_time": "18:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10004, "total_steps": 17941, "loss": 1.6127, "learning_rate": 4.2174319198436976e-05, "epoch": 0.5576054846441113, "percentage": 55.76, "elapsed_time": "23:40:23", "remaining_time": "18:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10005, "total_steps": 17941, "loss": 1.6454, "learning_rate": 4.216552482384931e-05, "epoch": 0.5576612228972744, "percentage": 55.77, "elapsed_time": "23:40:31", "remaining_time": "18:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10006, "total_steps": 17941, "loss": 1.7028, "learning_rate": 4.215673069772551e-05, "epoch": 0.5577169611504376, "percentage": 55.77, "elapsed_time": "23:40:40", "remaining_time": "18:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10007, "total_steps": 17941, "loss": 1.7396, "learning_rate": 4.214793682034448e-05, "epoch": 0.5577726994036006, "percentage": 55.78, "elapsed_time": "23:40:48", "remaining_time": "18:46:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10008, "total_steps": 17941, "loss": 1.9985, "learning_rate": 4.213914319198512e-05, "epoch": 0.5578284376567638, "percentage": 55.78, "elapsed_time": "23:40:57", "remaining_time": "18:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10009, "total_steps": 17941, "loss": 1.5067, "learning_rate": 4.213034981292629e-05, "epoch": 0.557884175909927, "percentage": 55.79, "elapsed_time": "23:41:05", "remaining_time": "18:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10010, "total_steps": 17941, "loss": 1.5677, "learning_rate": 4.212155668344691e-05, "epoch": 0.5579399141630901, "percentage": 55.79, "elapsed_time": "23:41:14", "remaining_time": "18:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10011, "total_steps": 17941, "loss": 1.5929, "learning_rate": 4.211276380382579e-05, "epoch": 0.5579956524162533, "percentage": 55.8, "elapsed_time": "23:41:22", "remaining_time": "18:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10012, "total_steps": 17941, "loss": 1.5922, "learning_rate": 4.210397117434183e-05, "epoch": 0.5580513906694164, "percentage": 55.81, "elapsed_time": "23:41:31", "remaining_time": "18:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10013, "total_steps": 17941, "loss": 1.6061, "learning_rate": 4.2095178795273864e-05, "epoch": 0.5581071289225795, "percentage": 55.81, "elapsed_time": "23:41:39", "remaining_time": "18:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10014, "total_steps": 17941, "loss": 1.6108, "learning_rate": 4.208638666690074e-05, "epoch": 0.5581628671757427, "percentage": 55.82, "elapsed_time": "23:41:48", "remaining_time": "18:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10015, "total_steps": 17941, "loss": 1.6811, "learning_rate": 4.207759478950129e-05, "epoch": 0.5582186054289059, "percentage": 55.82, "elapsed_time": "23:41:57", "remaining_time": "18:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10016, "total_steps": 17941, "loss": 1.5484, "learning_rate": 4.2068803163354344e-05, "epoch": 0.558274343682069, "percentage": 55.83, "elapsed_time": "23:42:05", "remaining_time": "18:45:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10017, "total_steps": 17941, "loss": 1.6159, "learning_rate": 4.206001178873872e-05, "epoch": 0.5583300819352321, "percentage": 55.83, "elapsed_time": "23:42:14", "remaining_time": "18:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10018, "total_steps": 17941, "loss": 1.7111, "learning_rate": 4.205122066593321e-05, "epoch": 0.5583858201883953, "percentage": 55.84, "elapsed_time": "23:42:23", "remaining_time": "18:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10019, "total_steps": 17941, "loss": 1.6692, "learning_rate": 4.204242979521665e-05, "epoch": 0.5584415584415584, "percentage": 55.84, "elapsed_time": "23:42:32", "remaining_time": "18:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10020, "total_steps": 17941, "loss": 1.5002, "learning_rate": 4.203363917686784e-05, "epoch": 0.5584972966947216, "percentage": 55.85, "elapsed_time": "23:42:41", "remaining_time": "18:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10021, "total_steps": 17941, "loss": 1.5218, "learning_rate": 4.202484881116553e-05, "epoch": 0.5585530349478848, "percentage": 55.86, "elapsed_time": "23:42:50", "remaining_time": "18:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10022, "total_steps": 17941, "loss": 1.6535, "learning_rate": 4.201605869838852e-05, "epoch": 0.5586087732010478, "percentage": 55.86, "elapsed_time": "23:42:58", "remaining_time": "18:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10023, "total_steps": 17941, "loss": 1.7252, "learning_rate": 4.2007268838815575e-05, "epoch": 0.558664511454211, "percentage": 55.87, "elapsed_time": "23:43:07", "remaining_time": "18:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10024, "total_steps": 17941, "loss": 1.7039, "learning_rate": 4.199847923272547e-05, "epoch": 0.5587202497073742, "percentage": 55.87, "elapsed_time": "23:43:16", "remaining_time": "18:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10025, "total_steps": 17941, "loss": 1.8148, "learning_rate": 4.198968988039695e-05, "epoch": 0.5587759879605373, "percentage": 55.88, "elapsed_time": "23:43:24", "remaining_time": "18:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10026, "total_steps": 17941, "loss": 1.6482, "learning_rate": 4.198090078210874e-05, "epoch": 0.5588317262137005, "percentage": 55.88, "elapsed_time": "23:43:33", "remaining_time": "18:43:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10027, "total_steps": 17941, "loss": 1.7497, "learning_rate": 4.1972111938139636e-05, "epoch": 0.5588874644668637, "percentage": 55.89, "elapsed_time": "23:43:41", "remaining_time": "18:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10028, "total_steps": 17941, "loss": 1.7287, "learning_rate": 4.196332334876831e-05, "epoch": 0.5589432027200267, "percentage": 55.89, "elapsed_time": "23:43:50", "remaining_time": "18:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10029, "total_steps": 17941, "loss": 1.8665, "learning_rate": 4.195453501427353e-05, "epoch": 0.5589989409731899, "percentage": 55.9, "elapsed_time": "23:43:58", "remaining_time": "18:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10030, "total_steps": 17941, "loss": 2.0083, "learning_rate": 4.194574693493398e-05, "epoch": 0.559054679226353, "percentage": 55.91, "elapsed_time": "23:44:07", "remaining_time": "18:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10031, "total_steps": 17941, "loss": 1.4786, "learning_rate": 4.19369591110284e-05, "epoch": 0.5591104174795162, "percentage": 55.91, "elapsed_time": "23:44:15", "remaining_time": "18:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10032, "total_steps": 17941, "loss": 1.5979, "learning_rate": 4.192817154283544e-05, "epoch": 0.5591661557326794, "percentage": 55.92, "elapsed_time": "23:44:24", "remaining_time": "18:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10033, "total_steps": 17941, "loss": 1.612, "learning_rate": 4.1919384230633804e-05, "epoch": 0.5592218939858424, "percentage": 55.92, "elapsed_time": "23:44:33", "remaining_time": "18:42:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10034, "total_steps": 17941, "loss": 1.1854, "learning_rate": 4.191059717470223e-05, "epoch": 0.5592776322390056, "percentage": 55.93, "elapsed_time": "23:44:41", "remaining_time": "18:42:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10035, "total_steps": 17941, "loss": 1.6482, "learning_rate": 4.19018103753193e-05, "epoch": 0.5593333704921688, "percentage": 55.93, "elapsed_time": "23:44:50", "remaining_time": "18:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10036, "total_steps": 17941, "loss": 1.5681, "learning_rate": 4.1893023832763786e-05, "epoch": 0.5593891087453319, "percentage": 55.94, "elapsed_time": "23:44:59", "remaining_time": "18:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10037, "total_steps": 17941, "loss": 1.5808, "learning_rate": 4.1884237547314244e-05, "epoch": 0.5594448469984951, "percentage": 55.94, "elapsed_time": "23:45:07", "remaining_time": "18:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10038, "total_steps": 17941, "loss": 1.4751, "learning_rate": 4.1875451519249386e-05, "epoch": 0.5595005852516582, "percentage": 55.95, "elapsed_time": "23:45:16", "remaining_time": "18:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10039, "total_steps": 17941, "loss": 1.4774, "learning_rate": 4.186666574884783e-05, "epoch": 0.5595563235048213, "percentage": 55.96, "elapsed_time": "23:45:25", "remaining_time": "18:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10040, "total_steps": 17941, "loss": 1.546, "learning_rate": 4.1857880236388217e-05, "epoch": 0.5596120617579845, "percentage": 55.96, "elapsed_time": "23:45:34", "remaining_time": "18:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10041, "total_steps": 17941, "loss": 1.7583, "learning_rate": 4.184909498214918e-05, "epoch": 0.5596678000111477, "percentage": 55.97, "elapsed_time": "23:45:43", "remaining_time": "18:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10042, "total_steps": 17941, "loss": 1.4077, "learning_rate": 4.1840309986409316e-05, "epoch": 0.5597235382643108, "percentage": 55.97, "elapsed_time": "23:45:51", "remaining_time": "18:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10043, "total_steps": 17941, "loss": 1.7512, "learning_rate": 4.1831525249447255e-05, "epoch": 0.559779276517474, "percentage": 55.98, "elapsed_time": "23:46:00", "remaining_time": "18:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10044, "total_steps": 17941, "loss": 1.8438, "learning_rate": 4.182274077154157e-05, "epoch": 0.5598350147706371, "percentage": 55.98, "elapsed_time": "23:46:09", "remaining_time": "18:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10045, "total_steps": 17941, "loss": 1.7325, "learning_rate": 4.181395655297088e-05, "epoch": 0.5598907530238002, "percentage": 55.99, "elapsed_time": "23:46:17", "remaining_time": "18:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10046, "total_steps": 17941, "loss": 1.662, "learning_rate": 4.180517259401377e-05, "epoch": 0.5599464912769634, "percentage": 55.99, "elapsed_time": "23:46:26", "remaining_time": "18:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10047, "total_steps": 17941, "loss": 1.7033, "learning_rate": 4.179638889494879e-05, "epoch": 0.5600022295301266, "percentage": 56.0, "elapsed_time": "23:46:34", "remaining_time": "18:40:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10048, "total_steps": 17941, "loss": 1.4528, "learning_rate": 4.1787605456054546e-05, "epoch": 0.5600579677832896, "percentage": 56.01, "elapsed_time": "23:46:43", "remaining_time": "18:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10049, "total_steps": 17941, "loss": 1.6722, "learning_rate": 4.177882227760956e-05, "epoch": 0.5601137060364528, "percentage": 56.01, "elapsed_time": "23:46:51", "remaining_time": "18:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10050, "total_steps": 17941, "loss": 1.534, "learning_rate": 4.17700393598924e-05, "epoch": 0.560169444289616, "percentage": 56.02, "elapsed_time": "23:47:00", "remaining_time": "18:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10051, "total_steps": 17941, "loss": 1.7221, "learning_rate": 4.176125670318161e-05, "epoch": 0.5602251825427791, "percentage": 56.02, "elapsed_time": "23:47:08", "remaining_time": "18:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10052, "total_steps": 17941, "loss": 1.4255, "learning_rate": 4.1752474307755706e-05, "epoch": 0.5602809207959423, "percentage": 56.03, "elapsed_time": "23:47:17", "remaining_time": "18:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10053, "total_steps": 17941, "loss": 1.6083, "learning_rate": 4.174369217389326e-05, "epoch": 0.5603366590491053, "percentage": 56.03, "elapsed_time": "23:47:25", "remaining_time": "18:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10054, "total_steps": 17941, "loss": 1.4492, "learning_rate": 4.173491030187274e-05, "epoch": 0.5603923973022685, "percentage": 56.04, "elapsed_time": "23:47:34", "remaining_time": "18:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10055, "total_steps": 17941, "loss": 1.9517, "learning_rate": 4.172612869197269e-05, "epoch": 0.5604481355554317, "percentage": 56.04, "elapsed_time": "23:47:42", "remaining_time": "18:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10056, "total_steps": 17941, "loss": 1.5612, "learning_rate": 4.171734734447158e-05, "epoch": 0.5605038738085948, "percentage": 56.05, "elapsed_time": "23:47:51", "remaining_time": "18:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10057, "total_steps": 17941, "loss": 1.6853, "learning_rate": 4.1708566259647944e-05, "epoch": 0.560559612061758, "percentage": 56.06, "elapsed_time": "23:47:59", "remaining_time": "18:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10058, "total_steps": 17941, "loss": 1.6625, "learning_rate": 4.1699785437780226e-05, "epoch": 0.5606153503149212, "percentage": 56.06, "elapsed_time": "23:48:08", "remaining_time": "18:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10059, "total_steps": 17941, "loss": 1.6534, "learning_rate": 4.169100487914691e-05, "epoch": 0.5606710885680842, "percentage": 56.07, "elapsed_time": "23:48:17", "remaining_time": "18:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10060, "total_steps": 17941, "loss": 1.7264, "learning_rate": 4.168222458402651e-05, "epoch": 0.5607268268212474, "percentage": 56.07, "elapsed_time": "23:48:25", "remaining_time": "18:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10061, "total_steps": 17941, "loss": 1.6749, "learning_rate": 4.167344455269741e-05, "epoch": 0.5607825650744106, "percentage": 56.08, "elapsed_time": "23:48:34", "remaining_time": "18:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10062, "total_steps": 17941, "loss": 1.5746, "learning_rate": 4.166466478543814e-05, "epoch": 0.5608383033275737, "percentage": 56.08, "elapsed_time": "23:48:43", "remaining_time": "18:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10063, "total_steps": 17941, "loss": 1.4935, "learning_rate": 4.1655885282527075e-05, "epoch": 0.5608940415807369, "percentage": 56.09, "elapsed_time": "23:48:51", "remaining_time": "18:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10064, "total_steps": 17941, "loss": 1.422, "learning_rate": 4.164710604424269e-05, "epoch": 0.5609497798339, "percentage": 56.09, "elapsed_time": "23:49:00", "remaining_time": "18:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10065, "total_steps": 17941, "loss": 1.7145, "learning_rate": 4.1638327070863404e-05, "epoch": 0.5610055180870631, "percentage": 56.1, "elapsed_time": "23:49:08", "remaining_time": "18:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10066, "total_steps": 17941, "loss": 1.565, "learning_rate": 4.162954836266762e-05, "epoch": 0.5610612563402263, "percentage": 56.11, "elapsed_time": "23:49:17", "remaining_time": "18:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10067, "total_steps": 17941, "loss": 1.653, "learning_rate": 4.1620769919933775e-05, "epoch": 0.5611169945933895, "percentage": 56.11, "elapsed_time": "23:49:25", "remaining_time": "18:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10068, "total_steps": 17941, "loss": 1.7342, "learning_rate": 4.161199174294025e-05, "epoch": 0.5611727328465526, "percentage": 56.12, "elapsed_time": "23:49:33", "remaining_time": "18:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10069, "total_steps": 17941, "loss": 1.7592, "learning_rate": 4.1603213831965435e-05, "epoch": 0.5612284710997157, "percentage": 56.12, "elapsed_time": "23:49:42", "remaining_time": "18:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10070, "total_steps": 17941, "loss": 1.6228, "learning_rate": 4.1594436187287714e-05, "epoch": 0.5612842093528789, "percentage": 56.13, "elapsed_time": "23:49:51", "remaining_time": "18:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10071, "total_steps": 17941, "loss": 1.789, "learning_rate": 4.15856588091855e-05, "epoch": 0.561339947606042, "percentage": 56.13, "elapsed_time": "23:49:59", "remaining_time": "18:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10072, "total_steps": 17941, "loss": 1.4986, "learning_rate": 4.157688169793709e-05, "epoch": 0.5613956858592052, "percentage": 56.14, "elapsed_time": "23:50:07", "remaining_time": "18:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10073, "total_steps": 17941, "loss": 1.326, "learning_rate": 4.15681048538209e-05, "epoch": 0.5614514241123684, "percentage": 56.15, "elapsed_time": "23:50:16", "remaining_time": "18:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10074, "total_steps": 17941, "loss": 2.1994, "learning_rate": 4.155932827711527e-05, "epoch": 0.5615071623655314, "percentage": 56.15, "elapsed_time": "23:50:24", "remaining_time": "18:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10075, "total_steps": 17941, "loss": 1.9845, "learning_rate": 4.155055196809852e-05, "epoch": 0.5615629006186946, "percentage": 56.16, "elapsed_time": "23:50:33", "remaining_time": "18:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10076, "total_steps": 17941, "loss": 1.6813, "learning_rate": 4.154177592704901e-05, "epoch": 0.5616186388718577, "percentage": 56.16, "elapsed_time": "23:50:41", "remaining_time": "18:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10077, "total_steps": 17941, "loss": 1.6458, "learning_rate": 4.153300015424505e-05, "epoch": 0.5616743771250209, "percentage": 56.17, "elapsed_time": "23:50:50", "remaining_time": "18:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10078, "total_steps": 17941, "loss": 1.4892, "learning_rate": 4.1524224649964935e-05, "epoch": 0.5617301153781841, "percentage": 56.17, "elapsed_time": "23:50:58", "remaining_time": "18:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10079, "total_steps": 17941, "loss": 1.5534, "learning_rate": 4.1515449414487034e-05, "epoch": 0.5617858536313471, "percentage": 56.18, "elapsed_time": "23:51:07", "remaining_time": "18:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10080, "total_steps": 17941, "loss": 1.7606, "learning_rate": 4.1506674448089586e-05, "epoch": 0.5618415918845103, "percentage": 56.18, "elapsed_time": "23:51:15", "remaining_time": "18:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10081, "total_steps": 17941, "loss": 1.7784, "learning_rate": 4.149789975105092e-05, "epoch": 0.5618973301376735, "percentage": 56.19, "elapsed_time": "23:51:24", "remaining_time": "18:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10082, "total_steps": 17941, "loss": 1.7375, "learning_rate": 4.1489125323649294e-05, "epoch": 0.5619530683908366, "percentage": 56.2, "elapsed_time": "23:51:32", "remaining_time": "18:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10083, "total_steps": 17941, "loss": 1.5098, "learning_rate": 4.1480351166163e-05, "epoch": 0.5620088066439998, "percentage": 56.2, "elapsed_time": "23:51:41", "remaining_time": "18:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10084, "total_steps": 17941, "loss": 1.6152, "learning_rate": 4.1471577278870285e-05, "epoch": 0.562064544897163, "percentage": 56.21, "elapsed_time": "23:51:49", "remaining_time": "18:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10085, "total_steps": 17941, "loss": 1.5779, "learning_rate": 4.14628036620494e-05, "epoch": 0.562120283150326, "percentage": 56.21, "elapsed_time": "23:51:59", "remaining_time": "18:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10086, "total_steps": 17941, "loss": 1.5938, "learning_rate": 4.145403031597865e-05, "epoch": 0.5621760214034892, "percentage": 56.22, "elapsed_time": "23:52:07", "remaining_time": "18:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10087, "total_steps": 17941, "loss": 1.5921, "learning_rate": 4.144525724093619e-05, "epoch": 0.5622317596566524, "percentage": 56.22, "elapsed_time": "23:52:16", "remaining_time": "18:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10088, "total_steps": 17941, "loss": 1.6272, "learning_rate": 4.143648443720033e-05, "epoch": 0.5622874979098155, "percentage": 56.23, "elapsed_time": "23:52:24", "remaining_time": "18:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10089, "total_steps": 17941, "loss": 1.9088, "learning_rate": 4.1427711905049215e-05, "epoch": 0.5623432361629787, "percentage": 56.23, "elapsed_time": "23:52:33", "remaining_time": "18:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10090, "total_steps": 17941, "loss": 1.6455, "learning_rate": 4.1418939644761125e-05, "epoch": 0.5623989744161418, "percentage": 56.24, "elapsed_time": "23:52:41", "remaining_time": "18:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10091, "total_steps": 17941, "loss": 1.71, "learning_rate": 4.141016765661423e-05, "epoch": 0.5624547126693049, "percentage": 56.25, "elapsed_time": "23:52:51", "remaining_time": "18:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10092, "total_steps": 17941, "loss": 1.6911, "learning_rate": 4.1401395940886725e-05, "epoch": 0.5625104509224681, "percentage": 56.25, "elapsed_time": "23:52:59", "remaining_time": "18:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10093, "total_steps": 17941, "loss": 1.7185, "learning_rate": 4.139262449785683e-05, "epoch": 0.5625661891756313, "percentage": 56.26, "elapsed_time": "23:53:08", "remaining_time": "18:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10094, "total_steps": 17941, "loss": 1.5143, "learning_rate": 4.1383853327802686e-05, "epoch": 0.5626219274287944, "percentage": 56.26, "elapsed_time": "23:53:16", "remaining_time": "18:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10095, "total_steps": 17941, "loss": 1.7856, "learning_rate": 4.137508243100249e-05, "epoch": 0.5626776656819575, "percentage": 56.27, "elapsed_time": "23:53:24", "remaining_time": "18:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10096, "total_steps": 17941, "loss": 1.7438, "learning_rate": 4.136631180773437e-05, "epoch": 0.5627334039351207, "percentage": 56.27, "elapsed_time": "23:53:33", "remaining_time": "18:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10097, "total_steps": 17941, "loss": 1.5218, "learning_rate": 4.1357541458276535e-05, "epoch": 0.5627891421882838, "percentage": 56.28, "elapsed_time": "23:53:41", "remaining_time": "18:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10098, "total_steps": 17941, "loss": 1.7985, "learning_rate": 4.134877138290706e-05, "epoch": 0.562844880441447, "percentage": 56.28, "elapsed_time": "23:53:50", "remaining_time": "18:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10099, "total_steps": 17941, "loss": 1.6318, "learning_rate": 4.134000158190413e-05, "epoch": 0.5629006186946102, "percentage": 56.29, "elapsed_time": "23:53:58", "remaining_time": "18:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10100, "total_steps": 17941, "loss": 1.5959, "learning_rate": 4.133123205554587e-05, "epoch": 0.5629563569477732, "percentage": 56.3, "elapsed_time": "23:54:07", "remaining_time": "18:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10101, "total_steps": 17941, "loss": 1.7061, "learning_rate": 4.132246280411038e-05, "epoch": 0.5630120952009364, "percentage": 56.3, "elapsed_time": "23:54:16", "remaining_time": "18:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10102, "total_steps": 17941, "loss": 1.5649, "learning_rate": 4.131369382787578e-05, "epoch": 0.5630678334540995, "percentage": 56.31, "elapsed_time": "23:54:24", "remaining_time": "18:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10103, "total_steps": 17941, "loss": 1.7403, "learning_rate": 4.130492512712016e-05, "epoch": 0.5631235717072627, "percentage": 56.31, "elapsed_time": "23:54:33", "remaining_time": "18:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10104, "total_steps": 17941, "loss": 1.4974, "learning_rate": 4.129615670212161e-05, "epoch": 0.5631793099604259, "percentage": 56.32, "elapsed_time": "23:54:42", "remaining_time": "18:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10105, "total_steps": 17941, "loss": 1.6699, "learning_rate": 4.1287388553158235e-05, "epoch": 0.5632350482135889, "percentage": 56.32, "elapsed_time": "23:54:50", "remaining_time": "18:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10106, "total_steps": 17941, "loss": 1.5078, "learning_rate": 4.1278620680508096e-05, "epoch": 0.5632907864667521, "percentage": 56.33, "elapsed_time": "23:55:00", "remaining_time": "18:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10107, "total_steps": 17941, "loss": 1.7493, "learning_rate": 4.126985308444927e-05, "epoch": 0.5633465247199153, "percentage": 56.33, "elapsed_time": "23:55:08", "remaining_time": "18:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10108, "total_steps": 17941, "loss": 1.5739, "learning_rate": 4.1261085765259786e-05, "epoch": 0.5634022629730784, "percentage": 56.34, "elapsed_time": "23:55:17", "remaining_time": "18:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10109, "total_steps": 17941, "loss": 1.6441, "learning_rate": 4.1252318723217724e-05, "epoch": 0.5634580012262416, "percentage": 56.35, "elapsed_time": "23:55:25", "remaining_time": "18:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10110, "total_steps": 17941, "loss": 1.5001, "learning_rate": 4.1243551958601103e-05, "epoch": 0.5635137394794048, "percentage": 56.35, "elapsed_time": "23:55:34", "remaining_time": "18:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10111, "total_steps": 17941, "loss": 1.6376, "learning_rate": 4.123478547168795e-05, "epoch": 0.5635694777325678, "percentage": 56.36, "elapsed_time": "23:55:42", "remaining_time": "18:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10112, "total_steps": 17941, "loss": 1.723, "learning_rate": 4.122601926275632e-05, "epoch": 0.563625215985731, "percentage": 56.36, "elapsed_time": "23:55:51", "remaining_time": "18:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10113, "total_steps": 17941, "loss": 1.4783, "learning_rate": 4.121725333208418e-05, "epoch": 0.5636809542388942, "percentage": 56.37, "elapsed_time": "23:56:00", "remaining_time": "18:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10114, "total_steps": 17941, "loss": 1.6867, "learning_rate": 4.1208487679949574e-05, "epoch": 0.5637366924920573, "percentage": 56.37, "elapsed_time": "23:56:09", "remaining_time": "18:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10115, "total_steps": 17941, "loss": 1.6556, "learning_rate": 4.119972230663047e-05, "epoch": 0.5637924307452205, "percentage": 56.38, "elapsed_time": "23:56:17", "remaining_time": "18:31:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10116, "total_steps": 17941, "loss": 1.4309, "learning_rate": 4.119095721240488e-05, "epoch": 0.5638481689983836, "percentage": 56.38, "elapsed_time": "23:56:26", "remaining_time": "18:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10117, "total_steps": 17941, "loss": 1.7376, "learning_rate": 4.118219239755076e-05, "epoch": 0.5639039072515467, "percentage": 56.39, "elapsed_time": "23:56:34", "remaining_time": "18:30:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10118, "total_steps": 17941, "loss": 1.6084, "learning_rate": 4.117342786234608e-05, "epoch": 0.5639596455047099, "percentage": 56.4, "elapsed_time": "23:56:44", "remaining_time": "18:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10119, "total_steps": 17941, "loss": 1.6276, "learning_rate": 4.116466360706881e-05, "epoch": 0.5640153837578731, "percentage": 56.4, "elapsed_time": "23:56:52", "remaining_time": "18:30:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10120, "total_steps": 17941, "loss": 1.7219, "learning_rate": 4.1155899631996883e-05, "epoch": 0.5640711220110362, "percentage": 56.41, "elapsed_time": "23:57:01", "remaining_time": "18:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10121, "total_steps": 17941, "loss": 1.6228, "learning_rate": 4.114713593740828e-05, "epoch": 0.5641268602641993, "percentage": 56.41, "elapsed_time": "23:57:09", "remaining_time": "18:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10122, "total_steps": 17941, "loss": 1.6936, "learning_rate": 4.113837252358089e-05, "epoch": 0.5641825985173625, "percentage": 56.42, "elapsed_time": "23:57:18", "remaining_time": "18:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10123, "total_steps": 17941, "loss": 1.7324, "learning_rate": 4.1129609390792675e-05, "epoch": 0.5642383367705256, "percentage": 56.42, "elapsed_time": "23:57:26", "remaining_time": "18:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10124, "total_steps": 17941, "loss": 1.5449, "learning_rate": 4.112084653932151e-05, "epoch": 0.5642940750236888, "percentage": 56.43, "elapsed_time": "23:57:35", "remaining_time": "18:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10125, "total_steps": 17941, "loss": 1.6333, "learning_rate": 4.111208396944533e-05, "epoch": 0.5643498132768519, "percentage": 56.43, "elapsed_time": "23:57:43", "remaining_time": "18:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10126, "total_steps": 17941, "loss": 1.7363, "learning_rate": 4.110332168144204e-05, "epoch": 0.564405551530015, "percentage": 56.44, "elapsed_time": "23:57:52", "remaining_time": "18:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10127, "total_steps": 17941, "loss": 1.4916, "learning_rate": 4.10945596755895e-05, "epoch": 0.5644612897831782, "percentage": 56.45, "elapsed_time": "23:58:00", "remaining_time": "18:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10128, "total_steps": 17941, "loss": 1.7816, "learning_rate": 4.108579795216562e-05, "epoch": 0.5645170280363413, "percentage": 56.45, "elapsed_time": "23:58:09", "remaining_time": "18:29:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10129, "total_steps": 17941, "loss": 1.6816, "learning_rate": 4.107703651144824e-05, "epoch": 0.5645727662895045, "percentage": 56.46, "elapsed_time": "23:58:17", "remaining_time": "18:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10130, "total_steps": 17941, "loss": 1.5643, "learning_rate": 4.106827535371523e-05, "epoch": 0.5646285045426677, "percentage": 56.46, "elapsed_time": "23:58:26", "remaining_time": "18:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10131, "total_steps": 17941, "loss": 1.8457, "learning_rate": 4.105951447924447e-05, "epoch": 0.5646842427958307, "percentage": 56.47, "elapsed_time": "23:58:34", "remaining_time": "18:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10132, "total_steps": 17941, "loss": 1.8374, "learning_rate": 4.105075388831378e-05, "epoch": 0.5647399810489939, "percentage": 56.47, "elapsed_time": "23:58:43", "remaining_time": "18:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10133, "total_steps": 17941, "loss": 1.9171, "learning_rate": 4.1041993581201e-05, "epoch": 0.5647957193021571, "percentage": 56.48, "elapsed_time": "23:58:51", "remaining_time": "18:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10134, "total_steps": 17941, "loss": 1.8695, "learning_rate": 4.103323355818395e-05, "epoch": 0.5648514575553202, "percentage": 56.49, "elapsed_time": "23:58:59", "remaining_time": "18:28:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10135, "total_steps": 17941, "loss": 1.5685, "learning_rate": 4.102447381954046e-05, "epoch": 0.5649071958084834, "percentage": 56.49, "elapsed_time": "23:59:08", "remaining_time": "18:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10136, "total_steps": 17941, "loss": 1.7752, "learning_rate": 4.1015714365548316e-05, "epoch": 0.5649629340616465, "percentage": 56.5, "elapsed_time": "23:59:17", "remaining_time": "18:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10137, "total_steps": 17941, "loss": 1.3801, "learning_rate": 4.1006955196485324e-05, "epoch": 0.5650186723148096, "percentage": 56.5, "elapsed_time": "23:59:25", "remaining_time": "18:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10138, "total_steps": 17941, "loss": 1.6352, "learning_rate": 4.099819631262931e-05, "epoch": 0.5650744105679728, "percentage": 56.51, "elapsed_time": "23:59:33", "remaining_time": "18:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10139, "total_steps": 17941, "loss": 1.7102, "learning_rate": 4.0989437714258e-05, "epoch": 0.565130148821136, "percentage": 56.51, "elapsed_time": "23:59:42", "remaining_time": "18:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10140, "total_steps": 17941, "loss": 1.7768, "learning_rate": 4.09806794016492e-05, "epoch": 0.5651858870742991, "percentage": 56.52, "elapsed_time": "23:59:50", "remaining_time": "18:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10141, "total_steps": 17941, "loss": 1.5619, "learning_rate": 4.097192137508066e-05, "epoch": 0.5652416253274622, "percentage": 56.52, "elapsed_time": "23:59:59", "remaining_time": "18:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10142, "total_steps": 17941, "loss": 1.5905, "learning_rate": 4.096316363483014e-05, "epoch": 0.5652973635806254, "percentage": 56.53, "elapsed_time": "1 day, 0:00:08", "remaining_time": "18:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10143, "total_steps": 17941, "loss": 1.5628, "learning_rate": 4.095440618117538e-05, "epoch": 0.5653531018337885, "percentage": 56.54, "elapsed_time": "1 day, 0:00:16", "remaining_time": "18:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10144, "total_steps": 17941, "loss": 1.7393, "learning_rate": 4.094564901439411e-05, "epoch": 0.5654088400869517, "percentage": 56.54, "elapsed_time": "1 day, 0:00:25", "remaining_time": "18:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10145, "total_steps": 17941, "loss": 1.6748, "learning_rate": 4.0936892134764076e-05, "epoch": 0.5654645783401149, "percentage": 56.55, "elapsed_time": "1 day, 0:00:33", "remaining_time": "18:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10146, "total_steps": 17941, "loss": 1.7082, "learning_rate": 4.0928135542562964e-05, "epoch": 0.565520316593278, "percentage": 56.55, "elapsed_time": "1 day, 0:00:42", "remaining_time": "18:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10147, "total_steps": 17941, "loss": 1.0838, "learning_rate": 4.0919379238068526e-05, "epoch": 0.5655760548464411, "percentage": 56.56, "elapsed_time": "1 day, 0:00:51", "remaining_time": "18:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10148, "total_steps": 17941, "loss": 1.552, "learning_rate": 4.0910623221558405e-05, "epoch": 0.5656317930996042, "percentage": 56.56, "elapsed_time": "1 day, 0:00:59", "remaining_time": "18:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10149, "total_steps": 17941, "loss": 1.8034, "learning_rate": 4.0901867493310354e-05, "epoch": 0.5656875313527674, "percentage": 56.57, "elapsed_time": "1 day, 0:01:08", "remaining_time": "18:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10150, "total_steps": 17941, "loss": 1.7206, "learning_rate": 4.089311205360199e-05, "epoch": 0.5657432696059306, "percentage": 56.57, "elapsed_time": "1 day, 0:01:16", "remaining_time": "18:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10151, "total_steps": 17941, "loss": 1.6696, "learning_rate": 4.0884356902711016e-05, "epoch": 0.5657990078590937, "percentage": 56.58, "elapsed_time": "1 day, 0:01:25", "remaining_time": "18:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10152, "total_steps": 17941, "loss": 1.6162, "learning_rate": 4.087560204091511e-05, "epoch": 0.5658547461122568, "percentage": 56.59, "elapsed_time": "1 day, 0:01:33", "remaining_time": "18:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10153, "total_steps": 17941, "loss": 1.9385, "learning_rate": 4.08668474684919e-05, "epoch": 0.56591048436542, "percentage": 56.59, "elapsed_time": "1 day, 0:01:42", "remaining_time": "18:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10154, "total_steps": 17941, "loss": 1.7144, "learning_rate": 4.085809318571905e-05, "epoch": 0.5659662226185831, "percentage": 56.6, "elapsed_time": "1 day, 0:01:50", "remaining_time": "18:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10155, "total_steps": 17941, "loss": 1.4162, "learning_rate": 4.084933919287417e-05, "epoch": 0.5660219608717463, "percentage": 56.6, "elapsed_time": "1 day, 0:01:59", "remaining_time": "18:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10156, "total_steps": 17941, "loss": 1.6541, "learning_rate": 4.084058549023488e-05, "epoch": 0.5660776991249095, "percentage": 56.61, "elapsed_time": "1 day, 0:02:07", "remaining_time": "18:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10157, "total_steps": 17941, "loss": 1.5955, "learning_rate": 4.0831832078078845e-05, "epoch": 0.5661334373780725, "percentage": 56.61, "elapsed_time": "1 day, 0:02:15", "remaining_time": "18:25:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10158, "total_steps": 17941, "loss": 1.9304, "learning_rate": 4.082307895668364e-05, "epoch": 0.5661891756312357, "percentage": 56.62, "elapsed_time": "1 day, 0:02:24", "remaining_time": "18:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10159, "total_steps": 17941, "loss": 1.91, "learning_rate": 4.0814326126326864e-05, "epoch": 0.5662449138843989, "percentage": 56.62, "elapsed_time": "1 day, 0:02:32", "remaining_time": "18:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10160, "total_steps": 17941, "loss": 1.848, "learning_rate": 4.080557358728609e-05, "epoch": 0.566300652137562, "percentage": 56.63, "elapsed_time": "1 day, 0:02:42", "remaining_time": "18:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10161, "total_steps": 17941, "loss": 1.6209, "learning_rate": 4.079682133983894e-05, "epoch": 0.5663563903907252, "percentage": 56.64, "elapsed_time": "1 day, 0:02:50", "remaining_time": "18:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10162, "total_steps": 17941, "loss": 1.4589, "learning_rate": 4.0788069384262946e-05, "epoch": 0.5664121286438883, "percentage": 56.64, "elapsed_time": "1 day, 0:02:59", "remaining_time": "18:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10163, "total_steps": 17941, "loss": 1.7792, "learning_rate": 4.077931772083566e-05, "epoch": 0.5664678668970514, "percentage": 56.65, "elapsed_time": "1 day, 0:03:07", "remaining_time": "18:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10164, "total_steps": 17941, "loss": 1.5378, "learning_rate": 4.0770566349834696e-05, "epoch": 0.5665236051502146, "percentage": 56.65, "elapsed_time": "1 day, 0:03:16", "remaining_time": "18:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10165, "total_steps": 17941, "loss": 1.543, "learning_rate": 4.076181527153753e-05, "epoch": 0.5665793434033778, "percentage": 56.66, "elapsed_time": "1 day, 0:03:24", "remaining_time": "18:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10166, "total_steps": 17941, "loss": 1.6944, "learning_rate": 4.0753064486221736e-05, "epoch": 0.5666350816565409, "percentage": 56.66, "elapsed_time": "1 day, 0:03:32", "remaining_time": "18:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10167, "total_steps": 17941, "loss": 1.6907, "learning_rate": 4.0744313994164804e-05, "epoch": 0.566690819909704, "percentage": 56.67, "elapsed_time": "1 day, 0:03:41", "remaining_time": "18:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10168, "total_steps": 17941, "loss": 1.6311, "learning_rate": 4.0735563795644294e-05, "epoch": 0.5667465581628672, "percentage": 56.67, "elapsed_time": "1 day, 0:03:49", "remaining_time": "18:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10169, "total_steps": 17941, "loss": 1.5288, "learning_rate": 4.072681389093767e-05, "epoch": 0.5668022964160303, "percentage": 56.68, "elapsed_time": "1 day, 0:03:58", "remaining_time": "18:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10170, "total_steps": 17941, "loss": 1.5348, "learning_rate": 4.071806428032244e-05, "epoch": 0.5668580346691935, "percentage": 56.69, "elapsed_time": "1 day, 0:04:06", "remaining_time": "18:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10171, "total_steps": 17941, "loss": 1.9325, "learning_rate": 4.07093149640761e-05, "epoch": 0.5669137729223566, "percentage": 56.69, "elapsed_time": "1 day, 0:04:15", "remaining_time": "18:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10172, "total_steps": 17941, "loss": 1.93, "learning_rate": 4.0700565942476104e-05, "epoch": 0.5669695111755197, "percentage": 56.7, "elapsed_time": "1 day, 0:04:24", "remaining_time": "18:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10173, "total_steps": 17941, "loss": 1.6544, "learning_rate": 4.069181721579997e-05, "epoch": 0.5670252494286829, "percentage": 56.7, "elapsed_time": "1 day, 0:04:32", "remaining_time": "18:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10174, "total_steps": 17941, "loss": 1.6509, "learning_rate": 4.068306878432509e-05, "epoch": 0.567080987681846, "percentage": 56.71, "elapsed_time": "1 day, 0:04:41", "remaining_time": "18:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10175, "total_steps": 17941, "loss": 2.02, "learning_rate": 4.067432064832898e-05, "epoch": 0.5671367259350092, "percentage": 56.71, "elapsed_time": "1 day, 0:04:49", "remaining_time": "18:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10176, "total_steps": 17941, "loss": 1.7404, "learning_rate": 4.066557280808901e-05, "epoch": 0.5671924641881724, "percentage": 56.72, "elapsed_time": "1 day, 0:04:59", "remaining_time": "18:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10177, "total_steps": 17941, "loss": 1.7042, "learning_rate": 4.065682526388266e-05, "epoch": 0.5672482024413354, "percentage": 56.72, "elapsed_time": "1 day, 0:05:07", "remaining_time": "18:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10178, "total_steps": 17941, "loss": 1.5399, "learning_rate": 4.064807801598735e-05, "epoch": 0.5673039406944986, "percentage": 56.73, "elapsed_time": "1 day, 0:05:15", "remaining_time": "18:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10179, "total_steps": 17941, "loss": 1.5696, "learning_rate": 4.063933106468047e-05, "epoch": 0.5673596789476618, "percentage": 56.74, "elapsed_time": "1 day, 0:05:24", "remaining_time": "18:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10180, "total_steps": 17941, "loss": 1.5354, "learning_rate": 4.063058441023944e-05, "epoch": 0.5674154172008249, "percentage": 56.74, "elapsed_time": "1 day, 0:05:33", "remaining_time": "18:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10181, "total_steps": 17941, "loss": 1.6381, "learning_rate": 4.062183805294164e-05, "epoch": 0.5674711554539881, "percentage": 56.75, "elapsed_time": "1 day, 0:05:41", "remaining_time": "18:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10182, "total_steps": 17941, "loss": 1.6276, "learning_rate": 4.0613091993064464e-05, "epoch": 0.5675268937071513, "percentage": 56.75, "elapsed_time": "1 day, 0:05:50", "remaining_time": "18:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10183, "total_steps": 17941, "loss": 1.7498, "learning_rate": 4.0604346230885257e-05, "epoch": 0.5675826319603143, "percentage": 56.76, "elapsed_time": "1 day, 0:05:58", "remaining_time": "18:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10184, "total_steps": 17941, "loss": 1.63, "learning_rate": 4.0595600766681425e-05, "epoch": 0.5676383702134775, "percentage": 56.76, "elapsed_time": "1 day, 0:06:07", "remaining_time": "18:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10185, "total_steps": 17941, "loss": 1.6698, "learning_rate": 4.0586855600730314e-05, "epoch": 0.5676941084666407, "percentage": 56.77, "elapsed_time": "1 day, 0:06:15", "remaining_time": "18:21:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10186, "total_steps": 17941, "loss": 1.4475, "learning_rate": 4.057811073330925e-05, "epoch": 0.5677498467198038, "percentage": 56.77, "elapsed_time": "1 day, 0:06:24", "remaining_time": "18:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10187, "total_steps": 17941, "loss": 1.5655, "learning_rate": 4.056936616469559e-05, "epoch": 0.567805584972967, "percentage": 56.78, "elapsed_time": "1 day, 0:06:32", "remaining_time": "18:21:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10188, "total_steps": 17941, "loss": 1.7327, "learning_rate": 4.056062189516664e-05, "epoch": 0.5678613232261301, "percentage": 56.79, "elapsed_time": "1 day, 0:06:41", "remaining_time": "18:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10189, "total_steps": 17941, "loss": 1.8365, "learning_rate": 4.055187792499971e-05, "epoch": 0.5679170614792932, "percentage": 56.79, "elapsed_time": "1 day, 0:06:49", "remaining_time": "18:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10190, "total_steps": 17941, "loss": 1.5606, "learning_rate": 4.054313425447217e-05, "epoch": 0.5679727997324564, "percentage": 56.8, "elapsed_time": "1 day, 0:06:58", "remaining_time": "18:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10191, "total_steps": 17941, "loss": 1.5273, "learning_rate": 4.053439088386124e-05, "epoch": 0.5680285379856196, "percentage": 56.8, "elapsed_time": "1 day, 0:07:06", "remaining_time": "18:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10192, "total_steps": 17941, "loss": 1.6909, "learning_rate": 4.0525647813444254e-05, "epoch": 0.5680842762387827, "percentage": 56.81, "elapsed_time": "1 day, 0:07:15", "remaining_time": "18:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10193, "total_steps": 17941, "loss": 1.8376, "learning_rate": 4.0516905043498474e-05, "epoch": 0.5681400144919458, "percentage": 56.81, "elapsed_time": "1 day, 0:07:23", "remaining_time": "18:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10194, "total_steps": 17941, "loss": 1.4, "learning_rate": 4.0508162574301195e-05, "epoch": 0.5681957527451089, "percentage": 56.82, "elapsed_time": "1 day, 0:07:31", "remaining_time": "18:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10195, "total_steps": 17941, "loss": 1.6005, "learning_rate": 4.049942040612964e-05, "epoch": 0.5682514909982721, "percentage": 56.83, "elapsed_time": "1 day, 0:07:40", "remaining_time": "18:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10196, "total_steps": 17941, "loss": 1.6205, "learning_rate": 4.049067853926108e-05, "epoch": 0.5683072292514353, "percentage": 56.83, "elapsed_time": "1 day, 0:07:48", "remaining_time": "18:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10197, "total_steps": 17941, "loss": 1.7273, "learning_rate": 4.048193697397276e-05, "epoch": 0.5683629675045984, "percentage": 56.84, "elapsed_time": "1 day, 0:07:57", "remaining_time": "18:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10198, "total_steps": 17941, "loss": 1.7355, "learning_rate": 4.0473195710541886e-05, "epoch": 0.5684187057577615, "percentage": 56.84, "elapsed_time": "1 day, 0:08:05", "remaining_time": "18:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10199, "total_steps": 17941, "loss": 1.8361, "learning_rate": 4.046445474924573e-05, "epoch": 0.5684744440109247, "percentage": 56.85, "elapsed_time": "1 day, 0:08:14", "remaining_time": "18:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10200, "total_steps": 17941, "loss": 1.6124, "learning_rate": 4.0455714090361446e-05, "epoch": 0.5685301822640878, "percentage": 56.85, "elapsed_time": "1 day, 0:08:22", "remaining_time": "18:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10201, "total_steps": 17941, "loss": 1.8331, "learning_rate": 4.044697373416628e-05, "epoch": 0.568585920517251, "percentage": 56.86, "elapsed_time": "1 day, 0:08:31", "remaining_time": "18:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10202, "total_steps": 17941, "loss": 1.7974, "learning_rate": 4.04382336809374e-05, "epoch": 0.5686416587704142, "percentage": 56.86, "elapsed_time": "1 day, 0:08:39", "remaining_time": "18:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10203, "total_steps": 17941, "loss": 1.7206, "learning_rate": 4.0429493930952e-05, "epoch": 0.5686973970235772, "percentage": 56.87, "elapsed_time": "1 day, 0:08:47", "remaining_time": "18:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10204, "total_steps": 17941, "loss": 1.6667, "learning_rate": 4.042075448448726e-05, "epoch": 0.5687531352767404, "percentage": 56.88, "elapsed_time": "1 day, 0:08:56", "remaining_time": "18:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10205, "total_steps": 17941, "loss": 1.5124, "learning_rate": 4.041201534182033e-05, "epoch": 0.5688088735299036, "percentage": 56.88, "elapsed_time": "1 day, 0:09:05", "remaining_time": "18:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10206, "total_steps": 17941, "loss": 1.756, "learning_rate": 4.040327650322838e-05, "epoch": 0.5688646117830667, "percentage": 56.89, "elapsed_time": "1 day, 0:09:14", "remaining_time": "18:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10207, "total_steps": 17941, "loss": 1.7316, "learning_rate": 4.039453796898853e-05, "epoch": 0.5689203500362299, "percentage": 56.89, "elapsed_time": "1 day, 0:09:22", "remaining_time": "18:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10208, "total_steps": 17941, "loss": 1.6193, "learning_rate": 4.038579973937796e-05, "epoch": 0.5689760882893931, "percentage": 56.9, "elapsed_time": "1 day, 0:09:31", "remaining_time": "18:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10209, "total_steps": 17941, "loss": 1.8098, "learning_rate": 4.037706181467373e-05, "epoch": 0.5690318265425561, "percentage": 56.9, "elapsed_time": "1 day, 0:09:39", "remaining_time": "18:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10210, "total_steps": 17941, "loss": 1.792, "learning_rate": 4.036832419515301e-05, "epoch": 0.5690875647957193, "percentage": 56.91, "elapsed_time": "1 day, 0:09:48", "remaining_time": "18:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10211, "total_steps": 17941, "loss": 1.716, "learning_rate": 4.03595868810929e-05, "epoch": 0.5691433030488825, "percentage": 56.91, "elapsed_time": "1 day, 0:09:56", "remaining_time": "18:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10212, "total_steps": 17941, "loss": 1.5782, "learning_rate": 4.035084987277048e-05, "epoch": 0.5691990413020456, "percentage": 56.92, "elapsed_time": "1 day, 0:10:04", "remaining_time": "18:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10213, "total_steps": 17941, "loss": 1.7408, "learning_rate": 4.034211317046285e-05, "epoch": 0.5692547795552088, "percentage": 56.93, "elapsed_time": "1 day, 0:10:13", "remaining_time": "18:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10214, "total_steps": 17941, "loss": 1.5208, "learning_rate": 4.033337677444707e-05, "epoch": 0.5693105178083719, "percentage": 56.93, "elapsed_time": "1 day, 0:10:21", "remaining_time": "18:17:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10215, "total_steps": 17941, "loss": 1.7486, "learning_rate": 4.0324640685000206e-05, "epoch": 0.569366256061535, "percentage": 56.94, "elapsed_time": "1 day, 0:10:30", "remaining_time": "18:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10216, "total_steps": 17941, "loss": 1.8807, "learning_rate": 4.0315904902399367e-05, "epoch": 0.5694219943146982, "percentage": 56.94, "elapsed_time": "1 day, 0:10:38", "remaining_time": "18:16:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10217, "total_steps": 17941, "loss": 1.7639, "learning_rate": 4.030716942692153e-05, "epoch": 0.5694777325678613, "percentage": 56.95, "elapsed_time": "1 day, 0:10:47", "remaining_time": "18:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10218, "total_steps": 17941, "loss": 1.52, "learning_rate": 4.0298434258843775e-05, "epoch": 0.5695334708210245, "percentage": 56.95, "elapsed_time": "1 day, 0:10:56", "remaining_time": "18:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10219, "total_steps": 17941, "loss": 1.7166, "learning_rate": 4.028969939844312e-05, "epoch": 0.5695892090741876, "percentage": 56.96, "elapsed_time": "1 day, 0:11:04", "remaining_time": "18:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10220, "total_steps": 17941, "loss": 1.7338, "learning_rate": 4.0280964845996597e-05, "epoch": 0.5696449473273507, "percentage": 56.96, "elapsed_time": "1 day, 0:11:12", "remaining_time": "18:16:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10221, "total_steps": 17941, "loss": 1.7374, "learning_rate": 4.027223060178119e-05, "epoch": 0.5697006855805139, "percentage": 56.97, "elapsed_time": "1 day, 0:11:21", "remaining_time": "18:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10222, "total_steps": 17941, "loss": 1.4187, "learning_rate": 4.0263496666073907e-05, "epoch": 0.5697564238336771, "percentage": 56.98, "elapsed_time": "1 day, 0:11:29", "remaining_time": "18:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10223, "total_steps": 17941, "loss": 1.4252, "learning_rate": 4.025476303915176e-05, "epoch": 0.5698121620868402, "percentage": 56.98, "elapsed_time": "1 day, 0:11:38", "remaining_time": "18:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10224, "total_steps": 17941, "loss": 1.8751, "learning_rate": 4.024602972129169e-05, "epoch": 0.5698679003400033, "percentage": 56.99, "elapsed_time": "1 day, 0:11:46", "remaining_time": "18:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10225, "total_steps": 17941, "loss": 1.7274, "learning_rate": 4.0237296712770714e-05, "epoch": 0.5699236385931665, "percentage": 56.99, "elapsed_time": "1 day, 0:11:55", "remaining_time": "18:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10226, "total_steps": 17941, "loss": 1.7434, "learning_rate": 4.022856401386573e-05, "epoch": 0.5699793768463296, "percentage": 57.0, "elapsed_time": "1 day, 0:12:04", "remaining_time": "18:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10227, "total_steps": 17941, "loss": 1.7, "learning_rate": 4.0219831624853754e-05, "epoch": 0.5700351150994928, "percentage": 57.0, "elapsed_time": "1 day, 0:12:13", "remaining_time": "18:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10228, "total_steps": 17941, "loss": 1.3809, "learning_rate": 4.021109954601169e-05, "epoch": 0.570090853352656, "percentage": 57.01, "elapsed_time": "1 day, 0:12:22", "remaining_time": "18:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10229, "total_steps": 17941, "loss": 1.7109, "learning_rate": 4.020236777761646e-05, "epoch": 0.570146591605819, "percentage": 57.01, "elapsed_time": "1 day, 0:12:31", "remaining_time": "18:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10230, "total_steps": 17941, "loss": 1.8791, "learning_rate": 4.0193636319945025e-05, "epoch": 0.5702023298589822, "percentage": 57.02, "elapsed_time": "1 day, 0:12:40", "remaining_time": "18:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10231, "total_steps": 17941, "loss": 1.904, "learning_rate": 4.018490517327425e-05, "epoch": 0.5702580681121454, "percentage": 57.03, "elapsed_time": "1 day, 0:12:48", "remaining_time": "18:14:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10232, "total_steps": 17941, "loss": 1.7688, "learning_rate": 4.0176174337881076e-05, "epoch": 0.5703138063653085, "percentage": 57.03, "elapsed_time": "1 day, 0:12:58", "remaining_time": "18:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10233, "total_steps": 17941, "loss": 1.7515, "learning_rate": 4.0167443814042344e-05, "epoch": 0.5703695446184717, "percentage": 57.04, "elapsed_time": "1 day, 0:13:07", "remaining_time": "18:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10234, "total_steps": 17941, "loss": 1.7589, "learning_rate": 4.0158713602035004e-05, "epoch": 0.5704252828716349, "percentage": 57.04, "elapsed_time": "1 day, 0:13:16", "remaining_time": "18:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10235, "total_steps": 17941, "loss": 1.7212, "learning_rate": 4.014998370213586e-05, "epoch": 0.5704810211247979, "percentage": 57.05, "elapsed_time": "1 day, 0:13:25", "remaining_time": "18:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10236, "total_steps": 17941, "loss": 1.6665, "learning_rate": 4.0141254114621815e-05, "epoch": 0.5705367593779611, "percentage": 57.05, "elapsed_time": "1 day, 0:13:34", "remaining_time": "18:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10237, "total_steps": 17941, "loss": 1.7351, "learning_rate": 4.0132524839769716e-05, "epoch": 0.5705924976311243, "percentage": 57.06, "elapsed_time": "1 day, 0:13:43", "remaining_time": "18:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10238, "total_steps": 17941, "loss": 1.6007, "learning_rate": 4.0123795877856385e-05, "epoch": 0.5706482358842874, "percentage": 57.06, "elapsed_time": "1 day, 0:13:52", "remaining_time": "18:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10239, "total_steps": 17941, "loss": 1.706, "learning_rate": 4.011506722915867e-05, "epoch": 0.5707039741374506, "percentage": 57.07, "elapsed_time": "1 day, 0:14:01", "remaining_time": "18:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10240, "total_steps": 17941, "loss": 1.9076, "learning_rate": 4.01063388939534e-05, "epoch": 0.5707597123906136, "percentage": 57.08, "elapsed_time": "1 day, 0:14:09", "remaining_time": "18:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10241, "total_steps": 17941, "loss": 1.3349, "learning_rate": 4.009761087251735e-05, "epoch": 0.5708154506437768, "percentage": 57.08, "elapsed_time": "1 day, 0:14:18", "remaining_time": "18:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10242, "total_steps": 17941, "loss": 1.7024, "learning_rate": 4.008888316512738e-05, "epoch": 0.57087118889694, "percentage": 57.09, "elapsed_time": "1 day, 0:14:27", "remaining_time": "18:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10243, "total_steps": 17941, "loss": 1.8915, "learning_rate": 4.0080155772060225e-05, "epoch": 0.5709269271501031, "percentage": 57.09, "elapsed_time": "1 day, 0:14:36", "remaining_time": "18:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10244, "total_steps": 17941, "loss": 1.6265, "learning_rate": 4.007142869359272e-05, "epoch": 0.5709826654032663, "percentage": 57.1, "elapsed_time": "1 day, 0:14:44", "remaining_time": "18:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10245, "total_steps": 17941, "loss": 1.6305, "learning_rate": 4.006270193000158e-05, "epoch": 0.5710384036564294, "percentage": 57.1, "elapsed_time": "1 day, 0:14:53", "remaining_time": "18:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10246, "total_steps": 17941, "loss": 1.7311, "learning_rate": 4.005397548156362e-05, "epoch": 0.5710941419095925, "percentage": 57.11, "elapsed_time": "1 day, 0:15:01", "remaining_time": "18:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10247, "total_steps": 17941, "loss": 1.7237, "learning_rate": 4.004524934855555e-05, "epoch": 0.5711498801627557, "percentage": 57.11, "elapsed_time": "1 day, 0:15:10", "remaining_time": "18:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10248, "total_steps": 17941, "loss": 1.6268, "learning_rate": 4.0036523531254136e-05, "epoch": 0.5712056184159189, "percentage": 57.12, "elapsed_time": "1 day, 0:15:18", "remaining_time": "18:12:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10249, "total_steps": 17941, "loss": 1.6511, "learning_rate": 4.0027798029936114e-05, "epoch": 0.571261356669082, "percentage": 57.13, "elapsed_time": "1 day, 0:15:27", "remaining_time": "18:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10250, "total_steps": 17941, "loss": 1.554, "learning_rate": 4.001907284487818e-05, "epoch": 0.5713170949222451, "percentage": 57.13, "elapsed_time": "1 day, 0:15:35", "remaining_time": "18:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10251, "total_steps": 17941, "loss": 1.6915, "learning_rate": 4.0010347976357085e-05, "epoch": 0.5713728331754083, "percentage": 57.14, "elapsed_time": "1 day, 0:15:44", "remaining_time": "18:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10252, "total_steps": 17941, "loss": 1.8803, "learning_rate": 4.000162342464948e-05, "epoch": 0.5714285714285714, "percentage": 57.14, "elapsed_time": "1 day, 0:15:52", "remaining_time": "18:11:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10253, "total_steps": 17941, "loss": 1.7181, "learning_rate": 3.9992899190032104e-05, "epoch": 0.5714843096817346, "percentage": 57.15, "elapsed_time": "1 day, 0:16:01", "remaining_time": "18:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10254, "total_steps": 17941, "loss": 1.8356, "learning_rate": 3.998417527278162e-05, "epoch": 0.5715400479348978, "percentage": 57.15, "elapsed_time": "1 day, 0:16:09", "remaining_time": "18:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10255, "total_steps": 17941, "loss": 1.6524, "learning_rate": 3.997545167317469e-05, "epoch": 0.5715957861880608, "percentage": 57.16, "elapsed_time": "1 day, 0:16:18", "remaining_time": "18:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10256, "total_steps": 17941, "loss": 1.4982, "learning_rate": 3.9966728391488e-05, "epoch": 0.571651524441224, "percentage": 57.17, "elapsed_time": "1 day, 0:16:27", "remaining_time": "18:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10257, "total_steps": 17941, "loss": 1.6855, "learning_rate": 3.995800542799818e-05, "epoch": 0.5717072626943872, "percentage": 57.17, "elapsed_time": "1 day, 0:16:35", "remaining_time": "18:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10258, "total_steps": 17941, "loss": 1.6136, "learning_rate": 3.9949282782981886e-05, "epoch": 0.5717630009475503, "percentage": 57.18, "elapsed_time": "1 day, 0:16:44", "remaining_time": "18:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10259, "total_steps": 17941, "loss": 1.8276, "learning_rate": 3.994056045671572e-05, "epoch": 0.5718187392007135, "percentage": 57.18, "elapsed_time": "1 day, 0:16:52", "remaining_time": "18:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10260, "total_steps": 17941, "loss": 1.8052, "learning_rate": 3.993183844947635e-05, "epoch": 0.5718744774538767, "percentage": 57.19, "elapsed_time": "1 day, 0:17:01", "remaining_time": "18:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10261, "total_steps": 17941, "loss": 1.7339, "learning_rate": 3.992311676154035e-05, "epoch": 0.5719302157070397, "percentage": 57.19, "elapsed_time": "1 day, 0:17:09", "remaining_time": "18:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10262, "total_steps": 17941, "loss": 1.593, "learning_rate": 3.991439539318434e-05, "epoch": 0.5719859539602029, "percentage": 57.2, "elapsed_time": "1 day, 0:17:18", "remaining_time": "18:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10263, "total_steps": 17941, "loss": 1.5935, "learning_rate": 3.99056743446849e-05, "epoch": 0.572041692213366, "percentage": 57.2, "elapsed_time": "1 day, 0:17:26", "remaining_time": "18:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10264, "total_steps": 17941, "loss": 1.7039, "learning_rate": 3.9896953616318614e-05, "epoch": 0.5720974304665292, "percentage": 57.21, "elapsed_time": "1 day, 0:17:35", "remaining_time": "18:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10265, "total_steps": 17941, "loss": 1.718, "learning_rate": 3.988823320836207e-05, "epoch": 0.5721531687196924, "percentage": 57.22, "elapsed_time": "1 day, 0:17:43", "remaining_time": "18:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10266, "total_steps": 17941, "loss": 1.6327, "learning_rate": 3.9879513121091795e-05, "epoch": 0.5722089069728554, "percentage": 57.22, "elapsed_time": "1 day, 0:17:52", "remaining_time": "18:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10267, "total_steps": 17941, "loss": 1.7032, "learning_rate": 3.987079335478435e-05, "epoch": 0.5722646452260186, "percentage": 57.23, "elapsed_time": "1 day, 0:18:00", "remaining_time": "18:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10268, "total_steps": 17941, "loss": 1.6994, "learning_rate": 3.986207390971631e-05, "epoch": 0.5723203834791818, "percentage": 57.23, "elapsed_time": "1 day, 0:18:09", "remaining_time": "18:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10269, "total_steps": 17941, "loss": 1.6933, "learning_rate": 3.985335478616415e-05, "epoch": 0.5723761217323449, "percentage": 57.24, "elapsed_time": "1 day, 0:18:17", "remaining_time": "18:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10270, "total_steps": 17941, "loss": 1.3312, "learning_rate": 3.984463598440444e-05, "epoch": 0.572431859985508, "percentage": 57.24, "elapsed_time": "1 day, 0:18:26", "remaining_time": "18:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10271, "total_steps": 17941, "loss": 1.5176, "learning_rate": 3.983591750471366e-05, "epoch": 0.5724875982386712, "percentage": 57.25, "elapsed_time": "1 day, 0:18:34", "remaining_time": "18:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10272, "total_steps": 17941, "loss": 1.6718, "learning_rate": 3.982719934736832e-05, "epoch": 0.5725433364918343, "percentage": 57.25, "elapsed_time": "1 day, 0:18:43", "remaining_time": "18:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10273, "total_steps": 17941, "loss": 1.6548, "learning_rate": 3.981848151264489e-05, "epoch": 0.5725990747449975, "percentage": 57.26, "elapsed_time": "1 day, 0:18:52", "remaining_time": "18:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10274, "total_steps": 17941, "loss": 1.6723, "learning_rate": 3.9809764000819875e-05, "epoch": 0.5726548129981607, "percentage": 57.27, "elapsed_time": "1 day, 0:19:00", "remaining_time": "18:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10275, "total_steps": 17941, "loss": 1.673, "learning_rate": 3.980104681216974e-05, "epoch": 0.5727105512513238, "percentage": 57.27, "elapsed_time": "1 day, 0:19:09", "remaining_time": "18:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10276, "total_steps": 17941, "loss": 1.2947, "learning_rate": 3.979232994697091e-05, "epoch": 0.5727662895044869, "percentage": 57.28, "elapsed_time": "1 day, 0:19:17", "remaining_time": "18:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10277, "total_steps": 17941, "loss": 1.6502, "learning_rate": 3.97836134054999e-05, "epoch": 0.5728220277576501, "percentage": 57.28, "elapsed_time": "1 day, 0:19:26", "remaining_time": "18:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10278, "total_steps": 17941, "loss": 1.8275, "learning_rate": 3.9774897188033064e-05, "epoch": 0.5728777660108132, "percentage": 57.29, "elapsed_time": "1 day, 0:19:34", "remaining_time": "18:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10279, "total_steps": 17941, "loss": 1.7393, "learning_rate": 3.97661812948469e-05, "epoch": 0.5729335042639764, "percentage": 57.29, "elapsed_time": "1 day, 0:19:43", "remaining_time": "18:08:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10280, "total_steps": 17941, "loss": 1.6816, "learning_rate": 3.975746572621778e-05, "epoch": 0.5729892425171396, "percentage": 57.3, "elapsed_time": "1 day, 0:19:51", "remaining_time": "18:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10281, "total_steps": 17941, "loss": 1.5666, "learning_rate": 3.9748750482422145e-05, "epoch": 0.5730449807703026, "percentage": 57.3, "elapsed_time": "1 day, 0:19:59", "remaining_time": "18:07:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10282, "total_steps": 17941, "loss": 1.611, "learning_rate": 3.974003556373637e-05, "epoch": 0.5731007190234658, "percentage": 57.31, "elapsed_time": "1 day, 0:20:08", "remaining_time": "18:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10283, "total_steps": 17941, "loss": 1.6061, "learning_rate": 3.973132097043685e-05, "epoch": 0.573156457276629, "percentage": 57.32, "elapsed_time": "1 day, 0:20:16", "remaining_time": "18:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10284, "total_steps": 17941, "loss": 1.7779, "learning_rate": 3.972260670279996e-05, "epoch": 0.5732121955297921, "percentage": 57.32, "elapsed_time": "1 day, 0:20:25", "remaining_time": "18:07:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10285, "total_steps": 17941, "loss": 1.6468, "learning_rate": 3.971389276110204e-05, "epoch": 0.5732679337829553, "percentage": 57.33, "elapsed_time": "1 day, 0:20:33", "remaining_time": "18:07:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10286, "total_steps": 17941, "loss": 1.6013, "learning_rate": 3.970517914561951e-05, "epoch": 0.5733236720361183, "percentage": 57.33, "elapsed_time": "1 day, 0:20:42", "remaining_time": "18:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10287, "total_steps": 17941, "loss": 1.7013, "learning_rate": 3.969646585662864e-05, "epoch": 0.5733794102892815, "percentage": 57.34, "elapsed_time": "1 day, 0:20:51", "remaining_time": "18:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10288, "total_steps": 17941, "loss": 1.7675, "learning_rate": 3.9687752894405804e-05, "epoch": 0.5734351485424447, "percentage": 57.34, "elapsed_time": "1 day, 0:20:59", "remaining_time": "18:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10289, "total_steps": 17941, "loss": 1.5965, "learning_rate": 3.9687752894405804e-05, "epoch": 0.5734908867956078, "percentage": 57.35, "elapsed_time": "1 day, 0:21:08", "remaining_time": "18:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10290, "total_steps": 17941, "loss": 1.6883, "learning_rate": 3.967904025922734e-05, "epoch": 0.573546625048771, "percentage": 57.35, "elapsed_time": "1 day, 0:21:16", "remaining_time": "18:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10291, "total_steps": 17941, "loss": 1.6156, "learning_rate": 3.9670327951369537e-05, "epoch": 0.5736023633019341, "percentage": 57.36, "elapsed_time": "1 day, 0:21:25", "remaining_time": "18:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10292, "total_steps": 17941, "loss": 1.6129, "learning_rate": 3.9661615971108706e-05, "epoch": 0.5736581015550972, "percentage": 57.37, "elapsed_time": "1 day, 0:21:33", "remaining_time": "18:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10293, "total_steps": 17941, "loss": 1.7097, "learning_rate": 3.965290431872113e-05, "epoch": 0.5737138398082604, "percentage": 57.37, "elapsed_time": "1 day, 0:21:42", "remaining_time": "18:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10294, "total_steps": 17941, "loss": 1.9848, "learning_rate": 3.9644192994483095e-05, "epoch": 0.5737695780614236, "percentage": 57.38, "elapsed_time": "1 day, 0:21:50", "remaining_time": "18:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10295, "total_steps": 17941, "loss": 1.7762, "learning_rate": 3.96354819986709e-05, "epoch": 0.5738253163145867, "percentage": 57.38, "elapsed_time": "1 day, 0:21:59", "remaining_time": "18:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10296, "total_steps": 17941, "loss": 1.5887, "learning_rate": 3.9626771331560766e-05, "epoch": 0.5738810545677498, "percentage": 57.39, "elapsed_time": "1 day, 0:22:07", "remaining_time": "18:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10297, "total_steps": 17941, "loss": 1.8988, "learning_rate": 3.961806099342899e-05, "epoch": 0.573936792820913, "percentage": 57.39, "elapsed_time": "1 day, 0:22:16", "remaining_time": "18:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10298, "total_steps": 17941, "loss": 1.7073, "learning_rate": 3.960935098455177e-05, "epoch": 0.5739925310740761, "percentage": 57.4, "elapsed_time": "1 day, 0:22:24", "remaining_time": "18:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10299, "total_steps": 17941, "loss": 1.5212, "learning_rate": 3.9600641305205365e-05, "epoch": 0.5740482693272393, "percentage": 57.4, "elapsed_time": "1 day, 0:22:33", "remaining_time": "18:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10300, "total_steps": 17941, "loss": 1.4532, "learning_rate": 3.959193195566598e-05, "epoch": 0.5741040075804025, "percentage": 57.41, "elapsed_time": "1 day, 0:22:41", "remaining_time": "18:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10301, "total_steps": 17941, "loss": 1.7352, "learning_rate": 3.958322293620982e-05, "epoch": 0.5741597458335655, "percentage": 57.42, "elapsed_time": "1 day, 0:22:50", "remaining_time": "18:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10302, "total_steps": 17941, "loss": 1.7068, "learning_rate": 3.957451424711312e-05, "epoch": 0.5742154840867287, "percentage": 57.42, "elapsed_time": "1 day, 0:22:58", "remaining_time": "18:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10303, "total_steps": 17941, "loss": 1.8338, "learning_rate": 3.956580588865202e-05, "epoch": 0.5742712223398919, "percentage": 57.43, "elapsed_time": "1 day, 0:23:07", "remaining_time": "18:04:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10304, "total_steps": 17941, "loss": 1.3051, "learning_rate": 3.955709786110274e-05, "epoch": 0.574326960593055, "percentage": 57.43, "elapsed_time": "1 day, 0:23:15", "remaining_time": "18:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10305, "total_steps": 17941, "loss": 1.4312, "learning_rate": 3.954839016474141e-05, "epoch": 0.5743826988462182, "percentage": 57.44, "elapsed_time": "1 day, 0:23:24", "remaining_time": "18:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10306, "total_steps": 17941, "loss": 1.6097, "learning_rate": 3.953968279984422e-05, "epoch": 0.5744384370993814, "percentage": 57.44, "elapsed_time": "1 day, 0:23:32", "remaining_time": "18:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10307, "total_steps": 17941, "loss": 1.7451, "learning_rate": 3.95309757666873e-05, "epoch": 0.5744941753525444, "percentage": 57.45, "elapsed_time": "1 day, 0:23:41", "remaining_time": "18:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10308, "total_steps": 17941, "loss": 1.8016, "learning_rate": 3.952226906554679e-05, "epoch": 0.5745499136057076, "percentage": 57.45, "elapsed_time": "1 day, 0:23:49", "remaining_time": "18:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10309, "total_steps": 17941, "loss": 1.6584, "learning_rate": 3.9513562696698826e-05, "epoch": 0.5746056518588707, "percentage": 57.46, "elapsed_time": "1 day, 0:23:58", "remaining_time": "18:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10310, "total_steps": 17941, "loss": 1.5651, "learning_rate": 3.9504856660419495e-05, "epoch": 0.5746613901120339, "percentage": 57.47, "elapsed_time": "1 day, 0:24:06", "remaining_time": "18:03:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10311, "total_steps": 17941, "loss": 1.7212, "learning_rate": 3.949615095698494e-05, "epoch": 0.5747171283651971, "percentage": 57.47, "elapsed_time": "1 day, 0:24:15", "remaining_time": "18:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10312, "total_steps": 17941, "loss": 1.3938, "learning_rate": 3.948744558667121e-05, "epoch": 0.5747728666183601, "percentage": 57.48, "elapsed_time": "1 day, 0:24:23", "remaining_time": "18:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10313, "total_steps": 17941, "loss": 1.6182, "learning_rate": 3.9478740549754444e-05, "epoch": 0.5748286048715233, "percentage": 57.48, "elapsed_time": "1 day, 0:24:32", "remaining_time": "18:03:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10314, "total_steps": 17941, "loss": 1.5559, "learning_rate": 3.947003584651065e-05, "epoch": 0.5748843431246865, "percentage": 57.49, "elapsed_time": "1 day, 0:24:40", "remaining_time": "18:03:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10315, "total_steps": 17941, "loss": 1.8528, "learning_rate": 3.946133147721594e-05, "epoch": 0.5749400813778496, "percentage": 57.49, "elapsed_time": "1 day, 0:24:49", "remaining_time": "18:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10316, "total_steps": 17941, "loss": 1.3252, "learning_rate": 3.945262744214636e-05, "epoch": 0.5749958196310128, "percentage": 57.5, "elapsed_time": "1 day, 0:24:58", "remaining_time": "18:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10317, "total_steps": 17941, "loss": 1.6752, "learning_rate": 3.9443923741577935e-05, "epoch": 0.575051557884176, "percentage": 57.51, "elapsed_time": "1 day, 0:25:06", "remaining_time": "18:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10318, "total_steps": 17941, "loss": 1.8702, "learning_rate": 3.943522037578671e-05, "epoch": 0.575107296137339, "percentage": 57.51, "elapsed_time": "1 day, 0:25:15", "remaining_time": "18:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10319, "total_steps": 17941, "loss": 1.7431, "learning_rate": 3.942651734504869e-05, "epoch": 0.5751630343905022, "percentage": 57.52, "elapsed_time": "1 day, 0:25:24", "remaining_time": "18:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10320, "total_steps": 17941, "loss": 1.7095, "learning_rate": 3.9417814649639893e-05, "epoch": 0.5752187726436654, "percentage": 57.52, "elapsed_time": "1 day, 0:25:32", "remaining_time": "18:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10321, "total_steps": 17941, "loss": 1.7306, "learning_rate": 3.9409112289836305e-05, "epoch": 0.5752745108968285, "percentage": 57.53, "elapsed_time": "1 day, 0:25:40", "remaining_time": "18:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10322, "total_steps": 17941, "loss": 1.5845, "learning_rate": 3.9400410265913936e-05, "epoch": 0.5753302491499916, "percentage": 57.53, "elapsed_time": "1 day, 0:25:49", "remaining_time": "18:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10323, "total_steps": 17941, "loss": 1.7804, "learning_rate": 3.939170857814876e-05, "epoch": 0.5753859874031548, "percentage": 57.54, "elapsed_time": "1 day, 0:25:57", "remaining_time": "18:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10324, "total_steps": 17941, "loss": 1.6929, "learning_rate": 3.9383007226816726e-05, "epoch": 0.5754417256563179, "percentage": 57.54, "elapsed_time": "1 day, 0:26:06", "remaining_time": "18:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10325, "total_steps": 17941, "loss": 1.7542, "learning_rate": 3.937430621219382e-05, "epoch": 0.5754974639094811, "percentage": 57.55, "elapsed_time": "1 day, 0:26:14", "remaining_time": "18:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10326, "total_steps": 17941, "loss": 1.7471, "learning_rate": 3.936560553455595e-05, "epoch": 0.5755532021626443, "percentage": 57.56, "elapsed_time": "1 day, 0:26:23", "remaining_time": "18:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10327, "total_steps": 17941, "loss": 1.7389, "learning_rate": 3.935690519417906e-05, "epoch": 0.5756089404158073, "percentage": 57.56, "elapsed_time": "1 day, 0:26:32", "remaining_time": "18:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10328, "total_steps": 17941, "loss": 1.6225, "learning_rate": 3.934820519133912e-05, "epoch": 0.5756646786689705, "percentage": 57.57, "elapsed_time": "1 day, 0:26:40", "remaining_time": "18:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10329, "total_steps": 17941, "loss": 1.1692, "learning_rate": 3.933950552631198e-05, "epoch": 0.5757204169221337, "percentage": 57.57, "elapsed_time": "1 day, 0:26:49", "remaining_time": "18:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10330, "total_steps": 17941, "loss": 1.697, "learning_rate": 3.9330806199373595e-05, "epoch": 0.5757761551752968, "percentage": 57.58, "elapsed_time": "1 day, 0:26:58", "remaining_time": "18:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10331, "total_steps": 17941, "loss": 1.6768, "learning_rate": 3.9322107210799795e-05, "epoch": 0.57583189342846, "percentage": 57.58, "elapsed_time": "1 day, 0:27:07", "remaining_time": "18:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10332, "total_steps": 17941, "loss": 1.7127, "learning_rate": 3.931340856086652e-05, "epoch": 0.575887631681623, "percentage": 57.59, "elapsed_time": "1 day, 0:27:15", "remaining_time": "18:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10333, "total_steps": 17941, "loss": 1.7439, "learning_rate": 3.930471024984961e-05, "epoch": 0.5759433699347862, "percentage": 57.59, "elapsed_time": "1 day, 0:27:24", "remaining_time": "18:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10334, "total_steps": 17941, "loss": 1.622, "learning_rate": 3.929601227802494e-05, "epoch": 0.5759991081879494, "percentage": 57.6, "elapsed_time": "1 day, 0:27:32", "remaining_time": "18:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10335, "total_steps": 17941, "loss": 1.5308, "learning_rate": 3.928731464566836e-05, "epoch": 0.5760548464411125, "percentage": 57.61, "elapsed_time": "1 day, 0:27:41", "remaining_time": "18:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10336, "total_steps": 17941, "loss": 1.7297, "learning_rate": 3.927861735305568e-05, "epoch": 0.5761105846942757, "percentage": 57.61, "elapsed_time": "1 day, 0:27:49", "remaining_time": "17:59:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10337, "total_steps": 17941, "loss": 1.8108, "learning_rate": 3.926992040046277e-05, "epoch": 0.5761663229474389, "percentage": 57.62, "elapsed_time": "1 day, 0:27:58", "remaining_time": "17:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10338, "total_steps": 17941, "loss": 1.4936, "learning_rate": 3.926122378816539e-05, "epoch": 0.5762220612006019, "percentage": 57.62, "elapsed_time": "1 day, 0:28:06", "remaining_time": "17:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10339, "total_steps": 17941, "loss": 1.5076, "learning_rate": 3.925252751643942e-05, "epoch": 0.5762777994537651, "percentage": 57.63, "elapsed_time": "1 day, 0:28:15", "remaining_time": "17:59:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10340, "total_steps": 17941, "loss": 1.7351, "learning_rate": 3.924383158556059e-05, "epoch": 0.5763335377069283, "percentage": 57.63, "elapsed_time": "1 day, 0:28:23", "remaining_time": "17:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10341, "total_steps": 17941, "loss": 1.6554, "learning_rate": 3.9235135995804705e-05, "epoch": 0.5763892759600914, "percentage": 57.64, "elapsed_time": "1 day, 0:28:32", "remaining_time": "17:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10342, "total_steps": 17941, "loss": 1.624, "learning_rate": 3.9226440747447565e-05, "epoch": 0.5764450142132546, "percentage": 57.64, "elapsed_time": "1 day, 0:28:40", "remaining_time": "17:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10343, "total_steps": 17941, "loss": 1.5321, "learning_rate": 3.9217745840764895e-05, "epoch": 0.5765007524664177, "percentage": 57.65, "elapsed_time": "1 day, 0:28:49", "remaining_time": "17:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10344, "total_steps": 17941, "loss": 1.5408, "learning_rate": 3.920905127603247e-05, "epoch": 0.5765564907195808, "percentage": 57.66, "elapsed_time": "1 day, 0:28:57", "remaining_time": "17:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10345, "total_steps": 17941, "loss": 1.587, "learning_rate": 3.920035705352602e-05, "epoch": 0.576612228972744, "percentage": 57.66, "elapsed_time": "1 day, 0:29:06", "remaining_time": "17:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10346, "total_steps": 17941, "loss": 1.7007, "learning_rate": 3.9191663173521284e-05, "epoch": 0.5766679672259072, "percentage": 57.67, "elapsed_time": "1 day, 0:29:14", "remaining_time": "17:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10347, "total_steps": 17941, "loss": 1.7961, "learning_rate": 3.918296963629395e-05, "epoch": 0.5767237054790703, "percentage": 57.67, "elapsed_time": "1 day, 0:29:23", "remaining_time": "17:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10348, "total_steps": 17941, "loss": 1.5591, "learning_rate": 3.9174276442119766e-05, "epoch": 0.5767794437322334, "percentage": 57.68, "elapsed_time": "1 day, 0:29:31", "remaining_time": "17:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10349, "total_steps": 17941, "loss": 1.6161, "learning_rate": 3.916558359127443e-05, "epoch": 0.5768351819853966, "percentage": 57.68, "elapsed_time": "1 day, 0:29:40", "remaining_time": "17:58:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10350, "total_steps": 17941, "loss": 1.6975, "learning_rate": 3.9156891084033596e-05, "epoch": 0.5768909202385597, "percentage": 57.69, "elapsed_time": "1 day, 0:29:48", "remaining_time": "17:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10351, "total_steps": 17941, "loss": 1.7234, "learning_rate": 3.9148198920672975e-05, "epoch": 0.5769466584917229, "percentage": 57.69, "elapsed_time": "1 day, 0:29:57", "remaining_time": "17:57:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10352, "total_steps": 17941, "loss": 1.5164, "learning_rate": 3.913950710146819e-05, "epoch": 0.5770023967448861, "percentage": 57.7, "elapsed_time": "1 day, 0:30:05", "remaining_time": "17:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10353, "total_steps": 17941, "loss": 1.7445, "learning_rate": 3.913081562669492e-05, "epoch": 0.5770581349980491, "percentage": 57.71, "elapsed_time": "1 day, 0:30:14", "remaining_time": "17:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10354, "total_steps": 17941, "loss": 1.5357, "learning_rate": 3.9122124496628836e-05, "epoch": 0.5771138732512123, "percentage": 57.71, "elapsed_time": "1 day, 0:30:22", "remaining_time": "17:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10355, "total_steps": 17941, "loss": 1.8522, "learning_rate": 3.911343371154551e-05, "epoch": 0.5771696115043754, "percentage": 57.72, "elapsed_time": "1 day, 0:30:31", "remaining_time": "17:57:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10356, "total_steps": 17941, "loss": 2.0213, "learning_rate": 3.9104743271720624e-05, "epoch": 0.5772253497575386, "percentage": 57.72, "elapsed_time": "1 day, 0:30:39", "remaining_time": "17:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10357, "total_steps": 17941, "loss": 1.8434, "learning_rate": 3.909605317742972e-05, "epoch": 0.5772810880107018, "percentage": 57.73, "elapsed_time": "1 day, 0:30:48", "remaining_time": "17:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10358, "total_steps": 17941, "loss": 1.5575, "learning_rate": 3.908736342894846e-05, "epoch": 0.5773368262638648, "percentage": 57.73, "elapsed_time": "1 day, 0:30:56", "remaining_time": "17:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10359, "total_steps": 17941, "loss": 1.6087, "learning_rate": 3.90786740265524e-05, "epoch": 0.577392564517028, "percentage": 57.74, "elapsed_time": "1 day, 0:31:05", "remaining_time": "17:56:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10360, "total_steps": 17941, "loss": 1.6299, "learning_rate": 3.9069984970517124e-05, "epoch": 0.5774483027701912, "percentage": 57.74, "elapsed_time": "1 day, 0:31:13", "remaining_time": "17:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10361, "total_steps": 17941, "loss": 1.7779, "learning_rate": 3.90612962611182e-05, "epoch": 0.5775040410233543, "percentage": 57.75, "elapsed_time": "1 day, 0:31:22", "remaining_time": "17:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10362, "total_steps": 17941, "loss": 1.4732, "learning_rate": 3.905260789863118e-05, "epoch": 0.5775597792765175, "percentage": 57.76, "elapsed_time": "1 day, 0:31:30", "remaining_time": "17:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10363, "total_steps": 17941, "loss": 1.7523, "learning_rate": 3.9043919883331615e-05, "epoch": 0.5776155175296807, "percentage": 57.76, "elapsed_time": "1 day, 0:31:39", "remaining_time": "17:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10364, "total_steps": 17941, "loss": 1.617, "learning_rate": 3.903523221549502e-05, "epoch": 0.5776712557828437, "percentage": 57.77, "elapsed_time": "1 day, 0:31:47", "remaining_time": "17:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10365, "total_steps": 17941, "loss": 2.0081, "learning_rate": 3.902654489539695e-05, "epoch": 0.5777269940360069, "percentage": 57.77, "elapsed_time": "1 day, 0:31:56", "remaining_time": "17:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10366, "total_steps": 17941, "loss": 1.6251, "learning_rate": 3.901785792331287e-05, "epoch": 0.5777827322891701, "percentage": 57.78, "elapsed_time": "1 day, 0:32:04", "remaining_time": "17:55:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10367, "total_steps": 17941, "loss": 1.6483, "learning_rate": 3.9009171299518324e-05, "epoch": 0.5778384705423332, "percentage": 57.78, "elapsed_time": "1 day, 0:32:13", "remaining_time": "17:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10368, "total_steps": 17941, "loss": 1.3879, "learning_rate": 3.9000485024288784e-05, "epoch": 0.5778942087954964, "percentage": 57.79, "elapsed_time": "1 day, 0:32:21", "remaining_time": "17:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10369, "total_steps": 17941, "loss": 1.548, "learning_rate": 3.899179909789972e-05, "epoch": 0.5779499470486595, "percentage": 57.79, "elapsed_time": "1 day, 0:32:30", "remaining_time": "17:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10370, "total_steps": 17941, "loss": 1.9616, "learning_rate": 3.898311352062662e-05, "epoch": 0.5780056853018226, "percentage": 57.8, "elapsed_time": "1 day, 0:32:39", "remaining_time": "17:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10371, "total_steps": 17941, "loss": 1.7795, "learning_rate": 3.8974428292744914e-05, "epoch": 0.5780614235549858, "percentage": 57.81, "elapsed_time": "1 day, 0:32:47", "remaining_time": "17:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10372, "total_steps": 17941, "loss": 1.6974, "learning_rate": 3.896574341453007e-05, "epoch": 0.578117161808149, "percentage": 57.81, "elapsed_time": "1 day, 0:32:56", "remaining_time": "17:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10373, "total_steps": 17941, "loss": 1.4682, "learning_rate": 3.895705888625748e-05, "epoch": 0.5781729000613121, "percentage": 57.82, "elapsed_time": "1 day, 0:33:05", "remaining_time": "17:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10374, "total_steps": 17941, "loss": 1.4336, "learning_rate": 3.894837470820262e-05, "epoch": 0.5782286383144752, "percentage": 57.82, "elapsed_time": "1 day, 0:33:14", "remaining_time": "17:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10375, "total_steps": 17941, "loss": 1.6593, "learning_rate": 3.8939690880640885e-05, "epoch": 0.5782843765676384, "percentage": 57.83, "elapsed_time": "1 day, 0:33:22", "remaining_time": "17:54:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10376, "total_steps": 17941, "loss": 1.6772, "learning_rate": 3.893100740384766e-05, "epoch": 0.5783401148208015, "percentage": 57.83, "elapsed_time": "1 day, 0:33:30", "remaining_time": "17:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10377, "total_steps": 17941, "loss": 1.7087, "learning_rate": 3.8922324278098356e-05, "epoch": 0.5783958530739647, "percentage": 57.84, "elapsed_time": "1 day, 0:33:39", "remaining_time": "17:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10378, "total_steps": 17941, "loss": 1.4623, "learning_rate": 3.891364150366832e-05, "epoch": 0.5784515913271278, "percentage": 57.85, "elapsed_time": "1 day, 0:33:47", "remaining_time": "17:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10379, "total_steps": 17941, "loss": 1.6518, "learning_rate": 3.890495908083293e-05, "epoch": 0.5785073295802909, "percentage": 57.85, "elapsed_time": "1 day, 0:33:56", "remaining_time": "17:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10380, "total_steps": 17941, "loss": 1.5737, "learning_rate": 3.889627700986759e-05, "epoch": 0.5785630678334541, "percentage": 57.86, "elapsed_time": "1 day, 0:34:04", "remaining_time": "17:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10381, "total_steps": 17941, "loss": 1.5644, "learning_rate": 3.8887595291047564e-05, "epoch": 0.5786188060866172, "percentage": 57.86, "elapsed_time": "1 day, 0:34:13", "remaining_time": "17:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10382, "total_steps": 17941, "loss": 1.8534, "learning_rate": 3.887891392464825e-05, "epoch": 0.5786745443397804, "percentage": 57.87, "elapsed_time": "1 day, 0:34:21", "remaining_time": "17:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10383, "total_steps": 17941, "loss": 1.8821, "learning_rate": 3.8870232910944924e-05, "epoch": 0.5787302825929436, "percentage": 57.87, "elapsed_time": "1 day, 0:34:30", "remaining_time": "17:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10384, "total_steps": 17941, "loss": 1.8454, "learning_rate": 3.886155225021294e-05, "epoch": 0.5787860208461066, "percentage": 57.88, "elapsed_time": "1 day, 0:34:38", "remaining_time": "17:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10385, "total_steps": 17941, "loss": 1.4968, "learning_rate": 3.885287194272757e-05, "epoch": 0.5788417590992698, "percentage": 57.88, "elapsed_time": "1 day, 0:34:47", "remaining_time": "17:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10386, "total_steps": 17941, "loss": 1.7601, "learning_rate": 3.884419198876411e-05, "epoch": 0.578897497352433, "percentage": 57.89, "elapsed_time": "1 day, 0:34:55", "remaining_time": "17:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10387, "total_steps": 17941, "loss": 1.7149, "learning_rate": 3.8835512388597836e-05, "epoch": 0.5789532356055961, "percentage": 57.9, "elapsed_time": "1 day, 0:35:05", "remaining_time": "17:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10388, "total_steps": 17941, "loss": 1.6867, "learning_rate": 3.8826833142504006e-05, "epoch": 0.5790089738587593, "percentage": 57.9, "elapsed_time": "1 day, 0:35:13", "remaining_time": "17:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10389, "total_steps": 17941, "loss": 1.6042, "learning_rate": 3.881815425075791e-05, "epoch": 0.5790647121119225, "percentage": 57.91, "elapsed_time": "1 day, 0:35:22", "remaining_time": "17:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10390, "total_steps": 17941, "loss": 1.7868, "learning_rate": 3.880947571363474e-05, "epoch": 0.5791204503650855, "percentage": 57.91, "elapsed_time": "1 day, 0:35:30", "remaining_time": "17:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10391, "total_steps": 17941, "loss": 1.8606, "learning_rate": 3.880079753140978e-05, "epoch": 0.5791761886182487, "percentage": 57.92, "elapsed_time": "1 day, 0:35:39", "remaining_time": "17:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10392, "total_steps": 17941, "loss": 1.5603, "learning_rate": 3.87921197043582e-05, "epoch": 0.5792319268714119, "percentage": 57.92, "elapsed_time": "1 day, 0:35:47", "remaining_time": "17:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10393, "total_steps": 17941, "loss": 1.9158, "learning_rate": 3.878344223275524e-05, "epoch": 0.579287665124575, "percentage": 57.93, "elapsed_time": "1 day, 0:35:56", "remaining_time": "17:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10394, "total_steps": 17941, "loss": 1.62, "learning_rate": 3.877476511687611e-05, "epoch": 0.5793434033777382, "percentage": 57.93, "elapsed_time": "1 day, 0:36:04", "remaining_time": "17:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10395, "total_steps": 17941, "loss": 1.5055, "learning_rate": 3.8766088356995976e-05, "epoch": 0.5793991416309013, "percentage": 57.94, "elapsed_time": "1 day, 0:36:13", "remaining_time": "17:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10396, "total_steps": 17941, "loss": 1.7256, "learning_rate": 3.875741195339003e-05, "epoch": 0.5794548798840644, "percentage": 57.95, "elapsed_time": "1 day, 0:36:21", "remaining_time": "17:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10397, "total_steps": 17941, "loss": 1.6768, "learning_rate": 3.874873590633341e-05, "epoch": 0.5795106181372276, "percentage": 57.95, "elapsed_time": "1 day, 0:36:30", "remaining_time": "17:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10398, "total_steps": 17941, "loss": 1.676, "learning_rate": 3.874006021610131e-05, "epoch": 0.5795663563903908, "percentage": 57.96, "elapsed_time": "1 day, 0:36:38", "remaining_time": "17:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10399, "total_steps": 17941, "loss": 1.5099, "learning_rate": 3.8731384882968824e-05, "epoch": 0.5796220946435539, "percentage": 57.96, "elapsed_time": "1 day, 0:36:46", "remaining_time": "17:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10400, "total_steps": 17941, "loss": 1.7212, "learning_rate": 3.872270990721112e-05, "epoch": 0.579677832896717, "percentage": 57.97, "elapsed_time": "1 day, 0:36:55", "remaining_time": "17:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10401, "total_steps": 17941, "loss": 1.66, "learning_rate": 3.8714035289103314e-05, "epoch": 0.5797335711498801, "percentage": 57.97, "elapsed_time": "1 day, 0:37:04", "remaining_time": "17:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10402, "total_steps": 17941, "loss": 1.7655, "learning_rate": 3.8705361028920494e-05, "epoch": 0.5797893094030433, "percentage": 57.98, "elapsed_time": "1 day, 0:37:12", "remaining_time": "17:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10403, "total_steps": 17941, "loss": 1.5689, "learning_rate": 3.869668712693778e-05, "epoch": 0.5798450476562065, "percentage": 57.98, "elapsed_time": "1 day, 0:37:20", "remaining_time": "17:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10404, "total_steps": 17941, "loss": 1.6214, "learning_rate": 3.868801358343025e-05, "epoch": 0.5799007859093696, "percentage": 57.99, "elapsed_time": "1 day, 0:37:29", "remaining_time": "17:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10405, "total_steps": 17941, "loss": 1.5918, "learning_rate": 3.8679340398672953e-05, "epoch": 0.5799565241625327, "percentage": 58.0, "elapsed_time": "1 day, 0:37:37", "remaining_time": "17:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10406, "total_steps": 17941, "loss": 1.5958, "learning_rate": 3.867066757294101e-05, "epoch": 0.5800122624156959, "percentage": 58.0, "elapsed_time": "1 day, 0:37:46", "remaining_time": "17:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10407, "total_steps": 17941, "loss": 1.6475, "learning_rate": 3.866199510650941e-05, "epoch": 0.580068000668859, "percentage": 58.01, "elapsed_time": "1 day, 0:37:54", "remaining_time": "17:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10408, "total_steps": 17941, "loss": 1.6921, "learning_rate": 3.865332299965323e-05, "epoch": 0.5801237389220222, "percentage": 58.01, "elapsed_time": "1 day, 0:38:03", "remaining_time": "17:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10409, "total_steps": 17941, "loss": 1.5513, "learning_rate": 3.864465125264749e-05, "epoch": 0.5801794771751854, "percentage": 58.02, "elapsed_time": "1 day, 0:38:11", "remaining_time": "17:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10410, "total_steps": 17941, "loss": 1.6684, "learning_rate": 3.8635979865767205e-05, "epoch": 0.5802352154283484, "percentage": 58.02, "elapsed_time": "1 day, 0:38:20", "remaining_time": "17:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10411, "total_steps": 17941, "loss": 1.6376, "learning_rate": 3.862730883928738e-05, "epoch": 0.5802909536815116, "percentage": 58.03, "elapsed_time": "1 day, 0:38:29", "remaining_time": "17:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10412, "total_steps": 17941, "loss": 1.8236, "learning_rate": 3.8618638173483014e-05, "epoch": 0.5803466919346748, "percentage": 58.03, "elapsed_time": "1 day, 0:38:38", "remaining_time": "17:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10413, "total_steps": 17941, "loss": 1.4877, "learning_rate": 3.860996786862909e-05, "epoch": 0.5804024301878379, "percentage": 58.04, "elapsed_time": "1 day, 0:38:47", "remaining_time": "17:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10414, "total_steps": 17941, "loss": 1.6582, "learning_rate": 3.860129792500056e-05, "epoch": 0.5804581684410011, "percentage": 58.05, "elapsed_time": "1 day, 0:38:55", "remaining_time": "17:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10415, "total_steps": 17941, "loss": 1.6139, "learning_rate": 3.859262834287243e-05, "epoch": 0.5805139066941643, "percentage": 58.05, "elapsed_time": "1 day, 0:39:04", "remaining_time": "17:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10416, "total_steps": 17941, "loss": 1.6614, "learning_rate": 3.8583959122519585e-05, "epoch": 0.5805696449473273, "percentage": 58.06, "elapsed_time": "1 day, 0:39:12", "remaining_time": "17:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10417, "total_steps": 17941, "loss": 1.7069, "learning_rate": 3.8575290264217036e-05, "epoch": 0.5806253832004905, "percentage": 58.06, "elapsed_time": "1 day, 0:39:21", "remaining_time": "17:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10418, "total_steps": 17941, "loss": 1.604, "learning_rate": 3.8566621768239634e-05, "epoch": 0.5806811214536537, "percentage": 58.07, "elapsed_time": "1 day, 0:39:29", "remaining_time": "17:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10419, "total_steps": 17941, "loss": 1.9387, "learning_rate": 3.855795363486233e-05, "epoch": 0.5807368597068168, "percentage": 58.07, "elapsed_time": "1 day, 0:39:38", "remaining_time": "17:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10420, "total_steps": 17941, "loss": 1.8071, "learning_rate": 3.854928586436005e-05, "epoch": 0.58079259795998, "percentage": 58.08, "elapsed_time": "1 day, 0:39:46", "remaining_time": "17:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10421, "total_steps": 17941, "loss": 1.7062, "learning_rate": 3.854061845700764e-05, "epoch": 0.5808483362131431, "percentage": 58.08, "elapsed_time": "1 day, 0:39:55", "remaining_time": "17:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10422, "total_steps": 17941, "loss": 1.6668, "learning_rate": 3.853195141308001e-05, "epoch": 0.5809040744663062, "percentage": 58.09, "elapsed_time": "1 day, 0:40:03", "remaining_time": "17:47:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10423, "total_steps": 17941, "loss": 1.6721, "learning_rate": 3.852328473285201e-05, "epoch": 0.5809598127194694, "percentage": 58.1, "elapsed_time": "1 day, 0:40:12", "remaining_time": "17:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10424, "total_steps": 17941, "loss": 1.503, "learning_rate": 3.851461841659851e-05, "epoch": 0.5810155509726325, "percentage": 58.1, "elapsed_time": "1 day, 0:40:20", "remaining_time": "17:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10425, "total_steps": 17941, "loss": 1.6078, "learning_rate": 3.850595246459434e-05, "epoch": 0.5810712892257957, "percentage": 58.11, "elapsed_time": "1 day, 0:40:29", "remaining_time": "17:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10426, "total_steps": 17941, "loss": 1.4543, "learning_rate": 3.849728687711435e-05, "epoch": 0.5811270274789588, "percentage": 58.11, "elapsed_time": "1 day, 0:40:37", "remaining_time": "17:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10427, "total_steps": 17941, "loss": 1.4153, "learning_rate": 3.8488621654433356e-05, "epoch": 0.5811827657321219, "percentage": 58.12, "elapsed_time": "1 day, 0:40:46", "remaining_time": "17:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10428, "total_steps": 17941, "loss": 1.8426, "learning_rate": 3.8479956796826164e-05, "epoch": 0.5812385039852851, "percentage": 58.12, "elapsed_time": "1 day, 0:40:54", "remaining_time": "17:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10429, "total_steps": 17941, "loss": 1.9991, "learning_rate": 3.8471292304567586e-05, "epoch": 0.5812942422384483, "percentage": 58.13, "elapsed_time": "1 day, 0:41:03", "remaining_time": "17:46:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10430, "total_steps": 17941, "loss": 1.7196, "learning_rate": 3.8462628177932386e-05, "epoch": 0.5813499804916114, "percentage": 58.13, "elapsed_time": "1 day, 0:41:11", "remaining_time": "17:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10431, "total_steps": 17941, "loss": 1.6985, "learning_rate": 3.845396441719537e-05, "epoch": 0.5814057187447745, "percentage": 58.14, "elapsed_time": "1 day, 0:41:20", "remaining_time": "17:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10432, "total_steps": 17941, "loss": 1.729, "learning_rate": 3.844530102263126e-05, "epoch": 0.5814614569979377, "percentage": 58.15, "elapsed_time": "1 day, 0:41:28", "remaining_time": "17:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10433, "total_steps": 17941, "loss": 1.602, "learning_rate": 3.843663799451483e-05, "epoch": 0.5815171952511008, "percentage": 58.15, "elapsed_time": "1 day, 0:41:37", "remaining_time": "17:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10434, "total_steps": 17941, "loss": 1.6195, "learning_rate": 3.842797533312085e-05, "epoch": 0.581572933504264, "percentage": 58.16, "elapsed_time": "1 day, 0:41:45", "remaining_time": "17:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10435, "total_steps": 17941, "loss": 1.5695, "learning_rate": 3.841931303872401e-05, "epoch": 0.5816286717574272, "percentage": 58.16, "elapsed_time": "1 day, 0:41:54", "remaining_time": "17:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10436, "total_steps": 17941, "loss": 1.5744, "learning_rate": 3.841065111159905e-05, "epoch": 0.5816844100105902, "percentage": 58.17, "elapsed_time": "1 day, 0:42:02", "remaining_time": "17:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10437, "total_steps": 17941, "loss": 1.5559, "learning_rate": 3.8401989552020654e-05, "epoch": 0.5817401482637534, "percentage": 58.17, "elapsed_time": "1 day, 0:42:11", "remaining_time": "17:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10438, "total_steps": 17941, "loss": 1.5991, "learning_rate": 3.839332836026353e-05, "epoch": 0.5817958865169166, "percentage": 58.18, "elapsed_time": "1 day, 0:42:19", "remaining_time": "17:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10439, "total_steps": 17941, "loss": 1.3576, "learning_rate": 3.838466753660237e-05, "epoch": 0.5818516247700797, "percentage": 58.19, "elapsed_time": "1 day, 0:42:28", "remaining_time": "17:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10440, "total_steps": 17941, "loss": 1.7927, "learning_rate": 3.837600708131181e-05, "epoch": 0.5819073630232429, "percentage": 58.19, "elapsed_time": "1 day, 0:42:36", "remaining_time": "17:45:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10441, "total_steps": 17941, "loss": 1.6014, "learning_rate": 3.836734699466656e-05, "epoch": 0.581963101276406, "percentage": 58.2, "elapsed_time": "1 day, 0:42:45", "remaining_time": "17:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10442, "total_steps": 17941, "loss": 1.7221, "learning_rate": 3.835868727694122e-05, "epoch": 0.5820188395295691, "percentage": 58.2, "elapsed_time": "1 day, 0:42:53", "remaining_time": "17:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10443, "total_steps": 17941, "loss": 1.5634, "learning_rate": 3.835002792841047e-05, "epoch": 0.5820745777827323, "percentage": 58.21, "elapsed_time": "1 day, 0:43:02", "remaining_time": "17:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10444, "total_steps": 17941, "loss": 1.6135, "learning_rate": 3.834136894934888e-05, "epoch": 0.5821303160358955, "percentage": 58.21, "elapsed_time": "1 day, 0:43:10", "remaining_time": "17:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10445, "total_steps": 17941, "loss": 1.3717, "learning_rate": 3.833271034003111e-05, "epoch": 0.5821860542890586, "percentage": 58.22, "elapsed_time": "1 day, 0:43:19", "remaining_time": "17:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10446, "total_steps": 17941, "loss": 1.5761, "learning_rate": 3.832405210073174e-05, "epoch": 0.5822417925422217, "percentage": 58.22, "elapsed_time": "1 day, 0:43:27", "remaining_time": "17:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10447, "total_steps": 17941, "loss": 1.6861, "learning_rate": 3.831539423172536e-05, "epoch": 0.5822975307953848, "percentage": 58.23, "elapsed_time": "1 day, 0:43:35", "remaining_time": "17:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10448, "total_steps": 17941, "loss": 1.6967, "learning_rate": 3.8306736733286555e-05, "epoch": 0.582353269048548, "percentage": 58.24, "elapsed_time": "1 day, 0:43:44", "remaining_time": "17:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10449, "total_steps": 17941, "loss": 1.9025, "learning_rate": 3.829807960568988e-05, "epoch": 0.5824090073017112, "percentage": 58.24, "elapsed_time": "1 day, 0:43:53", "remaining_time": "17:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10450, "total_steps": 17941, "loss": 1.8112, "learning_rate": 3.8289422849209896e-05, "epoch": 0.5824647455548743, "percentage": 58.25, "elapsed_time": "1 day, 0:44:01", "remaining_time": "17:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10451, "total_steps": 17941, "loss": 1.5044, "learning_rate": 3.8280766464121134e-05, "epoch": 0.5825204838080374, "percentage": 58.25, "elapsed_time": "1 day, 0:44:09", "remaining_time": "17:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10452, "total_steps": 17941, "loss": 1.6428, "learning_rate": 3.827211045069813e-05, "epoch": 0.5825762220612006, "percentage": 58.26, "elapsed_time": "1 day, 0:44:18", "remaining_time": "17:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10453, "total_steps": 17941, "loss": 1.7481, "learning_rate": 3.826345480921542e-05, "epoch": 0.5826319603143637, "percentage": 58.26, "elapsed_time": "1 day, 0:44:26", "remaining_time": "17:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10454, "total_steps": 17941, "loss": 1.6192, "learning_rate": 3.825479953994748e-05, "epoch": 0.5826876985675269, "percentage": 58.27, "elapsed_time": "1 day, 0:44:35", "remaining_time": "17:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10455, "total_steps": 17941, "loss": 1.6705, "learning_rate": 3.824614464316883e-05, "epoch": 0.5827434368206901, "percentage": 58.27, "elapsed_time": "1 day, 0:44:44", "remaining_time": "17:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10456, "total_steps": 17941, "loss": 1.7806, "learning_rate": 3.8237490119153934e-05, "epoch": 0.5827991750738531, "percentage": 58.28, "elapsed_time": "1 day, 0:44:53", "remaining_time": "17:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10457, "total_steps": 17941, "loss": 1.5233, "learning_rate": 3.822883596817728e-05, "epoch": 0.5828549133270163, "percentage": 58.29, "elapsed_time": "1 day, 0:45:01", "remaining_time": "17:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10458, "total_steps": 17941, "loss": 1.6379, "learning_rate": 3.822018219051331e-05, "epoch": 0.5829106515801795, "percentage": 58.29, "elapsed_time": "1 day, 0:45:10", "remaining_time": "17:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10459, "total_steps": 17941, "loss": 1.5846, "learning_rate": 3.821152878643647e-05, "epoch": 0.5829663898333426, "percentage": 58.3, "elapsed_time": "1 day, 0:45:18", "remaining_time": "17:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10460, "total_steps": 17941, "loss": 1.5801, "learning_rate": 3.820287575622122e-05, "epoch": 0.5830221280865058, "percentage": 58.3, "elapsed_time": "1 day, 0:45:27", "remaining_time": "17:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10461, "total_steps": 17941, "loss": 1.6576, "learning_rate": 3.8194223100141965e-05, "epoch": 0.583077866339669, "percentage": 58.31, "elapsed_time": "1 day, 0:45:35", "remaining_time": "17:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10462, "total_steps": 17941, "loss": 1.8402, "learning_rate": 3.818557081847313e-05, "epoch": 0.583133604592832, "percentage": 58.31, "elapsed_time": "1 day, 0:45:45", "remaining_time": "17:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10463, "total_steps": 17941, "loss": 1.2378, "learning_rate": 3.81769189114891e-05, "epoch": 0.5831893428459952, "percentage": 58.32, "elapsed_time": "1 day, 0:45:53", "remaining_time": "17:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10464, "total_steps": 17941, "loss": 1.6343, "learning_rate": 3.8168267379464263e-05, "epoch": 0.5832450810991584, "percentage": 58.32, "elapsed_time": "1 day, 0:46:02", "remaining_time": "17:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10465, "total_steps": 17941, "loss": 1.6733, "learning_rate": 3.815961622267301e-05, "epoch": 0.5833008193523215, "percentage": 58.33, "elapsed_time": "1 day, 0:46:10", "remaining_time": "17:41:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10466, "total_steps": 17941, "loss": 1.6899, "learning_rate": 3.8150965441389674e-05, "epoch": 0.5833565576054847, "percentage": 58.34, "elapsed_time": "1 day, 0:46:19", "remaining_time": "17:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10467, "total_steps": 17941, "loss": 1.6729, "learning_rate": 3.814231503588867e-05, "epoch": 0.5834122958586478, "percentage": 58.34, "elapsed_time": "1 day, 0:46:27", "remaining_time": "17:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10468, "total_steps": 17941, "loss": 1.794, "learning_rate": 3.8133665006444255e-05, "epoch": 0.5834680341118109, "percentage": 58.35, "elapsed_time": "1 day, 0:46:36", "remaining_time": "17:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10469, "total_steps": 17941, "loss": 1.9005, "learning_rate": 3.812501535333083e-05, "epoch": 0.5835237723649741, "percentage": 58.35, "elapsed_time": "1 day, 0:46:44", "remaining_time": "17:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10470, "total_steps": 17941, "loss": 1.75, "learning_rate": 3.811636607682267e-05, "epoch": 0.5835795106181372, "percentage": 58.36, "elapsed_time": "1 day, 0:46:53", "remaining_time": "17:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10471, "total_steps": 17941, "loss": 1.83, "learning_rate": 3.810771717719409e-05, "epoch": 0.5836352488713004, "percentage": 58.36, "elapsed_time": "1 day, 0:47:01", "remaining_time": "17:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10472, "total_steps": 17941, "loss": 1.6382, "learning_rate": 3.80990686547194e-05, "epoch": 0.5836909871244635, "percentage": 58.37, "elapsed_time": "1 day, 0:47:10", "remaining_time": "17:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10473, "total_steps": 17941, "loss": 1.4951, "learning_rate": 3.809042050967285e-05, "epoch": 0.5837467253776266, "percentage": 58.37, "elapsed_time": "1 day, 0:47:18", "remaining_time": "17:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10474, "total_steps": 17941, "loss": 1.5714, "learning_rate": 3.808177274232873e-05, "epoch": 0.5838024636307898, "percentage": 58.38, "elapsed_time": "1 day, 0:47:27", "remaining_time": "17:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10475, "total_steps": 17941, "loss": 1.6896, "learning_rate": 3.807312535296127e-05, "epoch": 0.583858201883953, "percentage": 58.39, "elapsed_time": "1 day, 0:47:35", "remaining_time": "17:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10476, "total_steps": 17941, "loss": 1.6643, "learning_rate": 3.806447834184477e-05, "epoch": 0.5839139401371161, "percentage": 58.39, "elapsed_time": "1 day, 0:47:44", "remaining_time": "17:40:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10477, "total_steps": 17941, "loss": 1.6747, "learning_rate": 3.8055831709253396e-05, "epoch": 0.5839696783902792, "percentage": 58.4, "elapsed_time": "1 day, 0:47:53", "remaining_time": "17:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10478, "total_steps": 17941, "loss": 1.7009, "learning_rate": 3.804718545546142e-05, "epoch": 0.5840254166434424, "percentage": 58.4, "elapsed_time": "1 day, 0:48:01", "remaining_time": "17:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10479, "total_steps": 17941, "loss": 1.4489, "learning_rate": 3.803853958074303e-05, "epoch": 0.5840811548966055, "percentage": 58.41, "elapsed_time": "1 day, 0:48:10", "remaining_time": "17:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10480, "total_steps": 17941, "loss": 1.5598, "learning_rate": 3.802989408537242e-05, "epoch": 0.5841368931497687, "percentage": 58.41, "elapsed_time": "1 day, 0:48:18", "remaining_time": "17:39:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10481, "total_steps": 17941, "loss": 1.6924, "learning_rate": 3.802124896962379e-05, "epoch": 0.5841926314029319, "percentage": 58.42, "elapsed_time": "1 day, 0:48:27", "remaining_time": "17:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10482, "total_steps": 17941, "loss": 1.479, "learning_rate": 3.801260423377129e-05, "epoch": 0.584248369656095, "percentage": 58.42, "elapsed_time": "1 day, 0:48:35", "remaining_time": "17:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10483, "total_steps": 17941, "loss": 1.5304, "learning_rate": 3.8003959878089104e-05, "epoch": 0.5843041079092581, "percentage": 58.43, "elapsed_time": "1 day, 0:48:44", "remaining_time": "17:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10484, "total_steps": 17941, "loss": 1.4134, "learning_rate": 3.7995315902851354e-05, "epoch": 0.5843598461624213, "percentage": 58.44, "elapsed_time": "1 day, 0:48:52", "remaining_time": "17:39:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10485, "total_steps": 17941, "loss": 1.8024, "learning_rate": 3.798667230833218e-05, "epoch": 0.5844155844155844, "percentage": 58.44, "elapsed_time": "1 day, 0:49:01", "remaining_time": "17:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10486, "total_steps": 17941, "loss": 1.7916, "learning_rate": 3.797802909480574e-05, "epoch": 0.5844713226687476, "percentage": 58.45, "elapsed_time": "1 day, 0:49:09", "remaining_time": "17:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10487, "total_steps": 17941, "loss": 1.6446, "learning_rate": 3.796938626254612e-05, "epoch": 0.5845270609219108, "percentage": 58.45, "elapsed_time": "1 day, 0:49:18", "remaining_time": "17:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10488, "total_steps": 17941, "loss": 1.5499, "learning_rate": 3.796074381182743e-05, "epoch": 0.5845827991750738, "percentage": 58.46, "elapsed_time": "1 day, 0:49:26", "remaining_time": "17:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10489, "total_steps": 17941, "loss": 1.661, "learning_rate": 3.795210174292374e-05, "epoch": 0.584638537428237, "percentage": 58.46, "elapsed_time": "1 day, 0:49:35", "remaining_time": "17:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10490, "total_steps": 17941, "loss": 1.9696, "learning_rate": 3.794346005610914e-05, "epoch": 0.5846942756814002, "percentage": 58.47, "elapsed_time": "1 day, 0:49:43", "remaining_time": "17:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10491, "total_steps": 17941, "loss": 1.6024, "learning_rate": 3.7934818751657706e-05, "epoch": 0.5847500139345633, "percentage": 58.48, "elapsed_time": "1 day, 0:49:52", "remaining_time": "17:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10492, "total_steps": 17941, "loss": 1.5879, "learning_rate": 3.792617782984346e-05, "epoch": 0.5848057521877265, "percentage": 58.48, "elapsed_time": "1 day, 0:50:01", "remaining_time": "17:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10493, "total_steps": 17941, "loss": 1.5693, "learning_rate": 3.791753729094048e-05, "epoch": 0.5848614904408895, "percentage": 58.49, "elapsed_time": "1 day, 0:50:09", "remaining_time": "17:37:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10494, "total_steps": 17941, "loss": 1.7629, "learning_rate": 3.790889713522274e-05, "epoch": 0.5849172286940527, "percentage": 58.49, "elapsed_time": "1 day, 0:50:18", "remaining_time": "17:37:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10495, "total_steps": 17941, "loss": 1.8306, "learning_rate": 3.7900257362964314e-05, "epoch": 0.5849729669472159, "percentage": 58.5, "elapsed_time": "1 day, 0:50:26", "remaining_time": "17:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10496, "total_steps": 17941, "loss": 1.6657, "learning_rate": 3.7891617974439165e-05, "epoch": 0.585028705200379, "percentage": 58.5, "elapsed_time": "1 day, 0:50:35", "remaining_time": "17:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10497, "total_steps": 17941, "loss": 1.6045, "learning_rate": 3.7882978969921296e-05, "epoch": 0.5850844434535422, "percentage": 58.51, "elapsed_time": "1 day, 0:50:44", "remaining_time": "17:37:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10498, "total_steps": 17941, "loss": 1.6769, "learning_rate": 3.78743403496847e-05, "epoch": 0.5851401817067053, "percentage": 58.51, "elapsed_time": "1 day, 0:50:52", "remaining_time": "17:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10499, "total_steps": 17941, "loss": 1.5448, "learning_rate": 3.7865702114003314e-05, "epoch": 0.5851959199598684, "percentage": 58.52, "elapsed_time": "1 day, 0:51:01", "remaining_time": "17:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10500, "total_steps": 17941, "loss": 1.8509, "learning_rate": 3.785706426315113e-05, "epoch": 0.5852516582130316, "percentage": 58.53, "elapsed_time": "1 day, 0:51:10", "remaining_time": "17:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10501, "total_steps": 17941, "loss": 1.856, "learning_rate": 3.7848426797402034e-05, "epoch": 0.5853073964661948, "percentage": 58.53, "elapsed_time": "1 day, 0:51:18", "remaining_time": "17:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10502, "total_steps": 17941, "loss": 1.6842, "learning_rate": 3.783978971703003e-05, "epoch": 0.5853631347193579, "percentage": 58.54, "elapsed_time": "1 day, 0:51:27", "remaining_time": "17:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10503, "total_steps": 17941, "loss": 1.8741, "learning_rate": 3.783115302230897e-05, "epoch": 0.585418872972521, "percentage": 58.54, "elapsed_time": "1 day, 0:51:35", "remaining_time": "17:36:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10504, "total_steps": 17941, "loss": 1.669, "learning_rate": 3.7822516713512795e-05, "epoch": 0.5854746112256842, "percentage": 58.55, "elapsed_time": "1 day, 0:51:44", "remaining_time": "17:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10505, "total_steps": 17941, "loss": 1.7707, "learning_rate": 3.78138807909154e-05, "epoch": 0.5855303494788473, "percentage": 58.55, "elapsed_time": "1 day, 0:51:52", "remaining_time": "17:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10506, "total_steps": 17941, "loss": 2.0792, "learning_rate": 3.7805245254790646e-05, "epoch": 0.5855860877320105, "percentage": 58.56, "elapsed_time": "1 day, 0:52:01", "remaining_time": "17:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10507, "total_steps": 17941, "loss": 1.7686, "learning_rate": 3.779661010541242e-05, "epoch": 0.5856418259851737, "percentage": 58.56, "elapsed_time": "1 day, 0:52:10", "remaining_time": "17:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10508, "total_steps": 17941, "loss": 1.751, "learning_rate": 3.778797534305456e-05, "epoch": 0.5856975642383367, "percentage": 58.57, "elapsed_time": "1 day, 0:52:18", "remaining_time": "17:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10509, "total_steps": 17941, "loss": 1.7072, "learning_rate": 3.777934096799094e-05, "epoch": 0.5857533024914999, "percentage": 58.58, "elapsed_time": "1 day, 0:52:27", "remaining_time": "17:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10510, "total_steps": 17941, "loss": 1.4512, "learning_rate": 3.777070698049535e-05, "epoch": 0.5858090407446631, "percentage": 58.58, "elapsed_time": "1 day, 0:52:35", "remaining_time": "17:35:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10511, "total_steps": 17941, "loss": 1.6386, "learning_rate": 3.7762073380841634e-05, "epoch": 0.5858647789978262, "percentage": 58.59, "elapsed_time": "1 day, 0:52:44", "remaining_time": "17:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10512, "total_steps": 17941, "loss": 1.4614, "learning_rate": 3.775344016930361e-05, "epoch": 0.5859205172509894, "percentage": 58.59, "elapsed_time": "1 day, 0:52:52", "remaining_time": "17:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10513, "total_steps": 17941, "loss": 1.3026, "learning_rate": 3.774480734615506e-05, "epoch": 0.5859762555041526, "percentage": 58.6, "elapsed_time": "1 day, 0:53:01", "remaining_time": "17:34:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10514, "total_steps": 17941, "loss": 1.664, "learning_rate": 3.7736174911669776e-05, "epoch": 0.5860319937573156, "percentage": 58.6, "elapsed_time": "1 day, 0:53:09", "remaining_time": "17:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10515, "total_steps": 17941, "loss": 1.7944, "learning_rate": 3.77275428661215e-05, "epoch": 0.5860877320104788, "percentage": 58.61, "elapsed_time": "1 day, 0:53:18", "remaining_time": "17:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10516, "total_steps": 17941, "loss": 1.6576, "learning_rate": 3.7718911209784026e-05, "epoch": 0.5861434702636419, "percentage": 58.61, "elapsed_time": "1 day, 0:53:27", "remaining_time": "17:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10517, "total_steps": 17941, "loss": 1.968, "learning_rate": 3.771027994293109e-05, "epoch": 0.5861992085168051, "percentage": 58.62, "elapsed_time": "1 day, 0:53:35", "remaining_time": "17:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10518, "total_steps": 17941, "loss": 1.754, "learning_rate": 3.7701649065836394e-05, "epoch": 0.5862549467699683, "percentage": 58.63, "elapsed_time": "1 day, 0:53:44", "remaining_time": "17:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10519, "total_steps": 17941, "loss": 1.4775, "learning_rate": 3.769301857877372e-05, "epoch": 0.5863106850231313, "percentage": 58.63, "elapsed_time": "1 day, 0:53:53", "remaining_time": "17:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10520, "total_steps": 17941, "loss": 1.6659, "learning_rate": 3.768438848201671e-05, "epoch": 0.5863664232762945, "percentage": 58.64, "elapsed_time": "1 day, 0:54:02", "remaining_time": "17:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10521, "total_steps": 17941, "loss": 1.6178, "learning_rate": 3.767575877583912e-05, "epoch": 0.5864221615294577, "percentage": 58.64, "elapsed_time": "1 day, 0:54:10", "remaining_time": "17:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10522, "total_steps": 17941, "loss": 1.5179, "learning_rate": 3.7667129460514585e-05, "epoch": 0.5864778997826208, "percentage": 58.65, "elapsed_time": "1 day, 0:54:18", "remaining_time": "17:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10523, "total_steps": 17941, "loss": 1.6504, "learning_rate": 3.76585005363168e-05, "epoch": 0.586533638035784, "percentage": 58.65, "elapsed_time": "1 day, 0:54:27", "remaining_time": "17:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10524, "total_steps": 17941, "loss": 1.468, "learning_rate": 3.764987200351944e-05, "epoch": 0.5865893762889471, "percentage": 58.66, "elapsed_time": "1 day, 0:54:35", "remaining_time": "17:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10525, "total_steps": 17941, "loss": 1.6458, "learning_rate": 3.764124386239611e-05, "epoch": 0.5866451145421102, "percentage": 58.66, "elapsed_time": "1 day, 0:54:44", "remaining_time": "17:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10526, "total_steps": 17941, "loss": 1.7088, "learning_rate": 3.7632616113220495e-05, "epoch": 0.5867008527952734, "percentage": 58.67, "elapsed_time": "1 day, 0:54:53", "remaining_time": "17:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10527, "total_steps": 17941, "loss": 1.5763, "learning_rate": 3.762398875626616e-05, "epoch": 0.5867565910484366, "percentage": 58.68, "elapsed_time": "1 day, 0:55:01", "remaining_time": "17:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10528, "total_steps": 17941, "loss": 1.639, "learning_rate": 3.761536179180678e-05, "epoch": 0.5868123293015997, "percentage": 58.68, "elapsed_time": "1 day, 0:55:10", "remaining_time": "17:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10529, "total_steps": 17941, "loss": 1.6822, "learning_rate": 3.760673522011588e-05, "epoch": 0.5868680675547628, "percentage": 58.69, "elapsed_time": "1 day, 0:55:18", "remaining_time": "17:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10530, "total_steps": 17941, "loss": 1.7807, "learning_rate": 3.7598109041467094e-05, "epoch": 0.586923805807926, "percentage": 58.69, "elapsed_time": "1 day, 0:55:27", "remaining_time": "17:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10531, "total_steps": 17941, "loss": 1.6093, "learning_rate": 3.758948325613399e-05, "epoch": 0.5869795440610891, "percentage": 58.7, "elapsed_time": "1 day, 0:55:35", "remaining_time": "17:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10532, "total_steps": 17941, "loss": 1.6115, "learning_rate": 3.758085786439011e-05, "epoch": 0.5870352823142523, "percentage": 58.7, "elapsed_time": "1 day, 0:55:44", "remaining_time": "17:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10533, "total_steps": 17941, "loss": 1.6165, "learning_rate": 3.757223286650902e-05, "epoch": 0.5870910205674155, "percentage": 58.71, "elapsed_time": "1 day, 0:55:53", "remaining_time": "17:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10534, "total_steps": 17941, "loss": 1.7445, "learning_rate": 3.756360826276424e-05, "epoch": 0.5871467588205785, "percentage": 58.71, "elapsed_time": "1 day, 0:56:01", "remaining_time": "17:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10535, "total_steps": 17941, "loss": 1.6591, "learning_rate": 3.75549840534293e-05, "epoch": 0.5872024970737417, "percentage": 58.72, "elapsed_time": "1 day, 0:56:09", "remaining_time": "17:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10536, "total_steps": 17941, "loss": 1.6325, "learning_rate": 3.7546360238777694e-05, "epoch": 0.5872582353269049, "percentage": 58.73, "elapsed_time": "1 day, 0:56:19", "remaining_time": "17:31:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10537, "total_steps": 17941, "loss": 1.6007, "learning_rate": 3.753773681908292e-05, "epoch": 0.587313973580068, "percentage": 58.73, "elapsed_time": "1 day, 0:56:27", "remaining_time": "17:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10538, "total_steps": 17941, "loss": 1.6943, "learning_rate": 3.75291137946185e-05, "epoch": 0.5873697118332312, "percentage": 58.74, "elapsed_time": "1 day, 0:56:36", "remaining_time": "17:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10539, "total_steps": 17941, "loss": 1.538, "learning_rate": 3.7520491165657875e-05, "epoch": 0.5874254500863942, "percentage": 58.74, "elapsed_time": "1 day, 0:56:44", "remaining_time": "17:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10540, "total_steps": 17941, "loss": 1.7185, "learning_rate": 3.751186893247452e-05, "epoch": 0.5874811883395574, "percentage": 58.75, "elapsed_time": "1 day, 0:56:53", "remaining_time": "17:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10541, "total_steps": 17941, "loss": 1.6519, "learning_rate": 3.750324709534185e-05, "epoch": 0.5875369265927206, "percentage": 58.75, "elapsed_time": "1 day, 0:57:01", "remaining_time": "17:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10542, "total_steps": 17941, "loss": 1.783, "learning_rate": 3.749462565453333e-05, "epoch": 0.5875926648458837, "percentage": 58.76, "elapsed_time": "1 day, 0:57:10", "remaining_time": "17:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10543, "total_steps": 17941, "loss": 1.4267, "learning_rate": 3.748600461032238e-05, "epoch": 0.5876484030990469, "percentage": 58.76, "elapsed_time": "1 day, 0:57:18", "remaining_time": "17:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10544, "total_steps": 17941, "loss": 1.6198, "learning_rate": 3.7477383962982374e-05, "epoch": 0.58770414135221, "percentage": 58.77, "elapsed_time": "1 day, 0:57:27", "remaining_time": "17:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10545, "total_steps": 17941, "loss": 1.501, "learning_rate": 3.746876371278678e-05, "epoch": 0.5877598796053731, "percentage": 58.78, "elapsed_time": "1 day, 0:57:35", "remaining_time": "17:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10546, "total_steps": 17941, "loss": 1.7348, "learning_rate": 3.74601438600089e-05, "epoch": 0.5878156178585363, "percentage": 58.78, "elapsed_time": "1 day, 0:57:44", "remaining_time": "17:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10547, "total_steps": 17941, "loss": 1.6013, "learning_rate": 3.745152440492217e-05, "epoch": 0.5878713561116995, "percentage": 58.79, "elapsed_time": "1 day, 0:57:52", "remaining_time": "17:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10548, "total_steps": 17941, "loss": 1.5797, "learning_rate": 3.744290534779991e-05, "epoch": 0.5879270943648626, "percentage": 58.79, "elapsed_time": "1 day, 0:58:01", "remaining_time": "17:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10549, "total_steps": 17941, "loss": 1.6181, "learning_rate": 3.7434286688915474e-05, "epoch": 0.5879828326180258, "percentage": 58.8, "elapsed_time": "1 day, 0:58:09", "remaining_time": "17:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10550, "total_steps": 17941, "loss": 1.7129, "learning_rate": 3.742566842854222e-05, "epoch": 0.5880385708711889, "percentage": 58.8, "elapsed_time": "1 day, 0:58:18", "remaining_time": "17:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10551, "total_steps": 17941, "loss": 1.8679, "learning_rate": 3.741705056695344e-05, "epoch": 0.588094309124352, "percentage": 58.81, "elapsed_time": "1 day, 0:58:26", "remaining_time": "17:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10552, "total_steps": 17941, "loss": 1.2723, "learning_rate": 3.7408433104422455e-05, "epoch": 0.5881500473775152, "percentage": 58.82, "elapsed_time": "1 day, 0:58:35", "remaining_time": "17:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10553, "total_steps": 17941, "loss": 1.8093, "learning_rate": 3.739981604122254e-05, "epoch": 0.5882057856306784, "percentage": 58.82, "elapsed_time": "1 day, 0:58:43", "remaining_time": "17:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10554, "total_steps": 17941, "loss": 1.7748, "learning_rate": 3.739119937762703e-05, "epoch": 0.5882615238838415, "percentage": 58.83, "elapsed_time": "1 day, 0:58:52", "remaining_time": "17:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10555, "total_steps": 17941, "loss": 1.874, "learning_rate": 3.738258311390913e-05, "epoch": 0.5883172621370046, "percentage": 58.83, "elapsed_time": "1 day, 0:59:00", "remaining_time": "17:28:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10556, "total_steps": 17941, "loss": 1.7739, "learning_rate": 3.737396725034214e-05, "epoch": 0.5883730003901678, "percentage": 58.84, "elapsed_time": "1 day, 0:59:09", "remaining_time": "17:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10557, "total_steps": 17941, "loss": 1.3497, "learning_rate": 3.7365351787199305e-05, "epoch": 0.5884287386433309, "percentage": 58.84, "elapsed_time": "1 day, 0:59:17", "remaining_time": "17:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10558, "total_steps": 17941, "loss": 1.5436, "learning_rate": 3.7356736724753834e-05, "epoch": 0.5884844768964941, "percentage": 58.85, "elapsed_time": "1 day, 0:59:26", "remaining_time": "17:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10559, "total_steps": 17941, "loss": 1.5924, "learning_rate": 3.734812206327897e-05, "epoch": 0.5885402151496573, "percentage": 58.85, "elapsed_time": "1 day, 0:59:34", "remaining_time": "17:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10560, "total_steps": 17941, "loss": 1.9695, "learning_rate": 3.73395078030479e-05, "epoch": 0.5885959534028203, "percentage": 58.86, "elapsed_time": "1 day, 0:59:43", "remaining_time": "17:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10561, "total_steps": 17941, "loss": 1.5767, "learning_rate": 3.733089394433383e-05, "epoch": 0.5886516916559835, "percentage": 58.87, "elapsed_time": "1 day, 0:59:51", "remaining_time": "17:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10562, "total_steps": 17941, "loss": 1.6256, "learning_rate": 3.732228048740992e-05, "epoch": 0.5887074299091466, "percentage": 58.87, "elapsed_time": "1 day, 1:00:00", "remaining_time": "17:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10563, "total_steps": 17941, "loss": 1.7033, "learning_rate": 3.731366743254937e-05, "epoch": 0.5887631681623098, "percentage": 58.88, "elapsed_time": "1 day, 1:00:08", "remaining_time": "17:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10564, "total_steps": 17941, "loss": 1.8645, "learning_rate": 3.730505478002533e-05, "epoch": 0.588818906415473, "percentage": 58.88, "elapsed_time": "1 day, 1:00:17", "remaining_time": "17:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10565, "total_steps": 17941, "loss": 1.6798, "learning_rate": 3.7296442530110934e-05, "epoch": 0.588874644668636, "percentage": 58.89, "elapsed_time": "1 day, 1:00:25", "remaining_time": "17:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10566, "total_steps": 17941, "loss": 1.9067, "learning_rate": 3.728783068307931e-05, "epoch": 0.5889303829217992, "percentage": 58.89, "elapsed_time": "1 day, 1:00:34", "remaining_time": "17:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10567, "total_steps": 17941, "loss": 1.7204, "learning_rate": 3.727921923920358e-05, "epoch": 0.5889861211749624, "percentage": 58.9, "elapsed_time": "1 day, 1:00:42", "remaining_time": "17:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10568, "total_steps": 17941, "loss": 1.8126, "learning_rate": 3.7270608198756854e-05, "epoch": 0.5890418594281255, "percentage": 58.9, "elapsed_time": "1 day, 1:00:51", "remaining_time": "17:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10569, "total_steps": 17941, "loss": 1.5697, "learning_rate": 3.726199756201221e-05, "epoch": 0.5890975976812887, "percentage": 58.91, "elapsed_time": "1 day, 1:00:59", "remaining_time": "17:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10570, "total_steps": 17941, "loss": 1.6158, "learning_rate": 3.7253387329242726e-05, "epoch": 0.5891533359344518, "percentage": 58.92, "elapsed_time": "1 day, 1:01:08", "remaining_time": "17:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10571, "total_steps": 17941, "loss": 1.6502, "learning_rate": 3.7244777500721504e-05, "epoch": 0.5892090741876149, "percentage": 58.92, "elapsed_time": "1 day, 1:01:16", "remaining_time": "17:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10572, "total_steps": 17941, "loss": 1.9357, "learning_rate": 3.723616807672155e-05, "epoch": 0.5892648124407781, "percentage": 58.93, "elapsed_time": "1 day, 1:01:25", "remaining_time": "17:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10573, "total_steps": 17941, "loss": 1.7127, "learning_rate": 3.722755905751594e-05, "epoch": 0.5893205506939413, "percentage": 58.93, "elapsed_time": "1 day, 1:01:33", "remaining_time": "17:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10574, "total_steps": 17941, "loss": 1.6027, "learning_rate": 3.7218950443377676e-05, "epoch": 0.5893762889471044, "percentage": 58.94, "elapsed_time": "1 day, 1:01:42", "remaining_time": "17:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10575, "total_steps": 17941, "loss": 1.8543, "learning_rate": 3.7210342234579785e-05, "epoch": 0.5894320272002675, "percentage": 58.94, "elapsed_time": "1 day, 1:01:50", "remaining_time": "17:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10576, "total_steps": 17941, "loss": 1.6043, "learning_rate": 3.720173443139528e-05, "epoch": 0.5894877654534307, "percentage": 58.95, "elapsed_time": "1 day, 1:01:58", "remaining_time": "17:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10577, "total_steps": 17941, "loss": 1.4774, "learning_rate": 3.7193127034097144e-05, "epoch": 0.5895435037065938, "percentage": 58.95, "elapsed_time": "1 day, 1:02:07", "remaining_time": "17:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10578, "total_steps": 17941, "loss": 1.8391, "learning_rate": 3.718452004295835e-05, "epoch": 0.589599241959757, "percentage": 58.96, "elapsed_time": "1 day, 1:02:16", "remaining_time": "17:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10579, "total_steps": 17941, "loss": 1.8092, "learning_rate": 3.717591345825183e-05, "epoch": 0.5896549802129202, "percentage": 58.97, "elapsed_time": "1 day, 1:02:24", "remaining_time": "17:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10580, "total_steps": 17941, "loss": 1.5544, "learning_rate": 3.7167307280250607e-05, "epoch": 0.5897107184660833, "percentage": 58.97, "elapsed_time": "1 day, 1:02:33", "remaining_time": "17:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10581, "total_steps": 17941, "loss": 1.8257, "learning_rate": 3.7158701509227544e-05, "epoch": 0.5897664567192464, "percentage": 58.98, "elapsed_time": "1 day, 1:02:42", "remaining_time": "17:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10582, "total_steps": 17941, "loss": 1.8018, "learning_rate": 3.715009614545561e-05, "epoch": 0.5898221949724096, "percentage": 58.98, "elapsed_time": "1 day, 1:02:50", "remaining_time": "17:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10583, "total_steps": 17941, "loss": 1.6239, "learning_rate": 3.714149118920772e-05, "epoch": 0.5898779332255727, "percentage": 58.99, "elapsed_time": "1 day, 1:02:59", "remaining_time": "17:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10584, "total_steps": 17941, "loss": 1.7372, "learning_rate": 3.713288664075674e-05, "epoch": 0.5899336714787359, "percentage": 58.99, "elapsed_time": "1 day, 1:03:07", "remaining_time": "17:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10585, "total_steps": 17941, "loss": 1.7206, "learning_rate": 3.7124282500375597e-05, "epoch": 0.589989409731899, "percentage": 59.0, "elapsed_time": "1 day, 1:03:16", "remaining_time": "17:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10586, "total_steps": 17941, "loss": 1.8214, "learning_rate": 3.711567876833712e-05, "epoch": 0.5900451479850621, "percentage": 59.0, "elapsed_time": "1 day, 1:03:24", "remaining_time": "17:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10587, "total_steps": 17941, "loss": 1.9289, "learning_rate": 3.710707544491421e-05, "epoch": 0.5901008862382253, "percentage": 59.01, "elapsed_time": "1 day, 1:03:33", "remaining_time": "17:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10588, "total_steps": 17941, "loss": 1.6522, "learning_rate": 3.709847253037967e-05, "epoch": 0.5901566244913884, "percentage": 59.02, "elapsed_time": "1 day, 1:03:41", "remaining_time": "17:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10589, "total_steps": 17941, "loss": 1.7481, "learning_rate": 3.7089870025006374e-05, "epoch": 0.5902123627445516, "percentage": 59.02, "elapsed_time": "1 day, 1:03:50", "remaining_time": "17:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10590, "total_steps": 17941, "loss": 1.4827, "learning_rate": 3.708126792906714e-05, "epoch": 0.5902681009977148, "percentage": 59.03, "elapsed_time": "1 day, 1:03:58", "remaining_time": "17:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10591, "total_steps": 17941, "loss": 1.6345, "learning_rate": 3.707266624283475e-05, "epoch": 0.5903238392508778, "percentage": 59.03, "elapsed_time": "1 day, 1:04:07", "remaining_time": "17:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10592, "total_steps": 17941, "loss": 1.675, "learning_rate": 3.706406496658204e-05, "epoch": 0.590379577504041, "percentage": 59.04, "elapsed_time": "1 day, 1:04:15", "remaining_time": "17:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10593, "total_steps": 17941, "loss": 1.6043, "learning_rate": 3.705546410058175e-05, "epoch": 0.5904353157572042, "percentage": 59.04, "elapsed_time": "1 day, 1:04:24", "remaining_time": "17:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10594, "total_steps": 17941, "loss": 1.799, "learning_rate": 3.704686364510667e-05, "epoch": 0.5904910540103673, "percentage": 59.05, "elapsed_time": "1 day, 1:04:32", "remaining_time": "17:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10595, "total_steps": 17941, "loss": 1.6559, "learning_rate": 3.703826360042954e-05, "epoch": 0.5905467922635305, "percentage": 59.05, "elapsed_time": "1 day, 1:04:41", "remaining_time": "17:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10596, "total_steps": 17941, "loss": 1.7088, "learning_rate": 3.702966396682312e-05, "epoch": 0.5906025305166936, "percentage": 59.06, "elapsed_time": "1 day, 1:04:49", "remaining_time": "17:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10597, "total_steps": 17941, "loss": 1.845, "learning_rate": 3.702106474456016e-05, "epoch": 0.5906582687698567, "percentage": 59.07, "elapsed_time": "1 day, 1:04:58", "remaining_time": "17:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10598, "total_steps": 17941, "loss": 1.6807, "learning_rate": 3.701246593391332e-05, "epoch": 0.5907140070230199, "percentage": 59.07, "elapsed_time": "1 day, 1:05:06", "remaining_time": "17:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10599, "total_steps": 17941, "loss": 1.6427, "learning_rate": 3.7003867535155365e-05, "epoch": 0.5907697452761831, "percentage": 59.08, "elapsed_time": "1 day, 1:05:15", "remaining_time": "17:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10600, "total_steps": 17941, "loss": 1.7423, "learning_rate": 3.699526954855895e-05, "epoch": 0.5908254835293462, "percentage": 59.08, "elapsed_time": "1 day, 1:05:23", "remaining_time": "17:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10601, "total_steps": 17941, "loss": 1.5484, "learning_rate": 3.6986671974396755e-05, "epoch": 0.5908812217825093, "percentage": 59.09, "elapsed_time": "1 day, 1:05:32", "remaining_time": "17:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10602, "total_steps": 17941, "loss": 1.694, "learning_rate": 3.697807481294146e-05, "epoch": 0.5909369600356725, "percentage": 59.09, "elapsed_time": "1 day, 1:05:40", "remaining_time": "17:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10603, "total_steps": 17941, "loss": 1.7923, "learning_rate": 3.696947806446571e-05, "epoch": 0.5909926982888356, "percentage": 59.1, "elapsed_time": "1 day, 1:05:49", "remaining_time": "17:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10604, "total_steps": 17941, "loss": 1.506, "learning_rate": 3.696088172924215e-05, "epoch": 0.5910484365419988, "percentage": 59.1, "elapsed_time": "1 day, 1:05:57", "remaining_time": "17:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10605, "total_steps": 17941, "loss": 1.6042, "learning_rate": 3.695228580754337e-05, "epoch": 0.591104174795162, "percentage": 59.11, "elapsed_time": "1 day, 1:06:06", "remaining_time": "17:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10606, "total_steps": 17941, "loss": 1.5731, "learning_rate": 3.6943690299642055e-05, "epoch": 0.591159913048325, "percentage": 59.12, "elapsed_time": "1 day, 1:06:14", "remaining_time": "17:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10607, "total_steps": 17941, "loss": 1.3331, "learning_rate": 3.693509520581072e-05, "epoch": 0.5912156513014882, "percentage": 59.12, "elapsed_time": "1 day, 1:06:23", "remaining_time": "17:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10608, "total_steps": 17941, "loss": 1.7033, "learning_rate": 3.6926500526322e-05, "epoch": 0.5912713895546513, "percentage": 59.13, "elapsed_time": "1 day, 1:06:31", "remaining_time": "17:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10609, "total_steps": 17941, "loss": 1.8765, "learning_rate": 3.6917906261448473e-05, "epoch": 0.5913271278078145, "percentage": 59.13, "elapsed_time": "1 day, 1:06:40", "remaining_time": "17:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10610, "total_steps": 17941, "loss": 1.6823, "learning_rate": 3.6909312411462675e-05, "epoch": 0.5913828660609777, "percentage": 59.14, "elapsed_time": "1 day, 1:06:49", "remaining_time": "17:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10611, "total_steps": 17941, "loss": 1.6476, "learning_rate": 3.6900718976637174e-05, "epoch": 0.5914386043141407, "percentage": 59.14, "elapsed_time": "1 day, 1:06:57", "remaining_time": "17:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10612, "total_steps": 17941, "loss": 1.7493, "learning_rate": 3.6892125957244484e-05, "epoch": 0.5914943425673039, "percentage": 59.15, "elapsed_time": "1 day, 1:07:05", "remaining_time": "17:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10613, "total_steps": 17941, "loss": 1.5932, "learning_rate": 3.688353335355714e-05, "epoch": 0.5915500808204671, "percentage": 59.16, "elapsed_time": "1 day, 1:07:14", "remaining_time": "17:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10614, "total_steps": 17941, "loss": 1.6508, "learning_rate": 3.687494116584763e-05, "epoch": 0.5916058190736302, "percentage": 59.16, "elapsed_time": "1 day, 1:07:22", "remaining_time": "17:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10615, "total_steps": 17941, "loss": 1.6409, "learning_rate": 3.6866349394388465e-05, "epoch": 0.5916615573267934, "percentage": 59.17, "elapsed_time": "1 day, 1:07:31", "remaining_time": "17:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10616, "total_steps": 17941, "loss": 1.6912, "learning_rate": 3.6857758039452135e-05, "epoch": 0.5917172955799566, "percentage": 59.17, "elapsed_time": "1 day, 1:07:39", "remaining_time": "17:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10617, "total_steps": 17941, "loss": 1.646, "learning_rate": 3.6849167101311086e-05, "epoch": 0.5917730338331196, "percentage": 59.18, "elapsed_time": "1 day, 1:07:48", "remaining_time": "17:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10618, "total_steps": 17941, "loss": 1.5624, "learning_rate": 3.68405765802378e-05, "epoch": 0.5918287720862828, "percentage": 59.18, "elapsed_time": "1 day, 1:07:56", "remaining_time": "17:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10619, "total_steps": 17941, "loss": 1.7411, "learning_rate": 3.683198647650468e-05, "epoch": 0.591884510339446, "percentage": 59.19, "elapsed_time": "1 day, 1:08:05", "remaining_time": "17:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10620, "total_steps": 17941, "loss": 1.6677, "learning_rate": 3.6823396790384176e-05, "epoch": 0.5919402485926091, "percentage": 59.19, "elapsed_time": "1 day, 1:08:13", "remaining_time": "17:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10621, "total_steps": 17941, "loss": 1.6784, "learning_rate": 3.681480752214871e-05, "epoch": 0.5919959868457723, "percentage": 59.2, "elapsed_time": "1 day, 1:08:22", "remaining_time": "17:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10622, "total_steps": 17941, "loss": 2.0557, "learning_rate": 3.6806218672070644e-05, "epoch": 0.5920517250989354, "percentage": 59.21, "elapsed_time": "1 day, 1:08:30", "remaining_time": "17:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10623, "total_steps": 17941, "loss": 1.637, "learning_rate": 3.6797630240422445e-05, "epoch": 0.5921074633520985, "percentage": 59.21, "elapsed_time": "1 day, 1:08:39", "remaining_time": "17:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10624, "total_steps": 17941, "loss": 1.6871, "learning_rate": 3.67890422274764e-05, "epoch": 0.5921632016052617, "percentage": 59.22, "elapsed_time": "1 day, 1:08:47", "remaining_time": "17:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10625, "total_steps": 17941, "loss": 1.5928, "learning_rate": 3.678045463350493e-05, "epoch": 0.5922189398584249, "percentage": 59.22, "elapsed_time": "1 day, 1:08:56", "remaining_time": "17:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10626, "total_steps": 17941, "loss": 1.5871, "learning_rate": 3.677186745878036e-05, "epoch": 0.592274678111588, "percentage": 59.23, "elapsed_time": "1 day, 1:09:05", "remaining_time": "17:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10627, "total_steps": 17941, "loss": 1.5642, "learning_rate": 3.676328070357503e-05, "epoch": 0.5923304163647511, "percentage": 59.23, "elapsed_time": "1 day, 1:09:14", "remaining_time": "17:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10628, "total_steps": 17941, "loss": 1.711, "learning_rate": 3.6754694368161264e-05, "epoch": 0.5923861546179143, "percentage": 59.24, "elapsed_time": "1 day, 1:09:22", "remaining_time": "17:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10629, "total_steps": 17941, "loss": 1.2255, "learning_rate": 3.6746108452811344e-05, "epoch": 0.5924418928710774, "percentage": 59.24, "elapsed_time": "1 day, 1:09:30", "remaining_time": "17:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10630, "total_steps": 17941, "loss": 1.5926, "learning_rate": 3.6737522957797635e-05, "epoch": 0.5924976311242406, "percentage": 59.25, "elapsed_time": "1 day, 1:09:39", "remaining_time": "17:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10631, "total_steps": 17941, "loss": 2.0771, "learning_rate": 3.6728937883392326e-05, "epoch": 0.5925533693774037, "percentage": 59.26, "elapsed_time": "1 day, 1:09:48", "remaining_time": "17:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10632, "total_steps": 17941, "loss": 1.7859, "learning_rate": 3.672035322986777e-05, "epoch": 0.5926091076305668, "percentage": 59.26, "elapsed_time": "1 day, 1:09:56", "remaining_time": "17:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10633, "total_steps": 17941, "loss": 1.6532, "learning_rate": 3.671176899749614e-05, "epoch": 0.59266484588373, "percentage": 59.27, "elapsed_time": "1 day, 1:10:05", "remaining_time": "17:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10634, "total_steps": 17941, "loss": 1.5604, "learning_rate": 3.670318518654975e-05, "epoch": 0.5927205841368931, "percentage": 59.27, "elapsed_time": "1 day, 1:10:13", "remaining_time": "17:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10635, "total_steps": 17941, "loss": 1.6858, "learning_rate": 3.66946017973008e-05, "epoch": 0.5927763223900563, "percentage": 59.28, "elapsed_time": "1 day, 1:10:22", "remaining_time": "17:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10636, "total_steps": 17941, "loss": 1.4864, "learning_rate": 3.668601883002149e-05, "epoch": 0.5928320606432195, "percentage": 59.28, "elapsed_time": "1 day, 1:10:30", "remaining_time": "17:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10637, "total_steps": 17941, "loss": 1.7848, "learning_rate": 3.667743628498406e-05, "epoch": 0.5928877988963825, "percentage": 59.29, "elapsed_time": "1 day, 1:10:38", "remaining_time": "17:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10638, "total_steps": 17941, "loss": 1.7601, "learning_rate": 3.6668854162460667e-05, "epoch": 0.5929435371495457, "percentage": 59.29, "elapsed_time": "1 day, 1:10:47", "remaining_time": "17:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10639, "total_steps": 17941, "loss": 1.8047, "learning_rate": 3.666027246272349e-05, "epoch": 0.5929992754027089, "percentage": 59.3, "elapsed_time": "1 day, 1:10:56", "remaining_time": "17:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10640, "total_steps": 17941, "loss": 1.6072, "learning_rate": 3.665169118604468e-05, "epoch": 0.593055013655872, "percentage": 59.31, "elapsed_time": "1 day, 1:11:04", "remaining_time": "17:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10641, "total_steps": 17941, "loss": 1.768, "learning_rate": 3.6643110332696404e-05, "epoch": 0.5931107519090352, "percentage": 59.31, "elapsed_time": "1 day, 1:11:12", "remaining_time": "17:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10642, "total_steps": 17941, "loss": 1.7465, "learning_rate": 3.663452990295081e-05, "epoch": 0.5931664901621984, "percentage": 59.32, "elapsed_time": "1 day, 1:11:21", "remaining_time": "17:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10643, "total_steps": 17941, "loss": 1.5842, "learning_rate": 3.662594989707999e-05, "epoch": 0.5932222284153614, "percentage": 59.32, "elapsed_time": "1 day, 1:11:29", "remaining_time": "17:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10644, "total_steps": 17941, "loss": 2.1065, "learning_rate": 3.661737031535608e-05, "epoch": 0.5932779666685246, "percentage": 59.33, "elapsed_time": "1 day, 1:11:38", "remaining_time": "17:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10645, "total_steps": 17941, "loss": 1.6108, "learning_rate": 3.660879115805114e-05, "epoch": 0.5933337049216878, "percentage": 59.33, "elapsed_time": "1 day, 1:11:46", "remaining_time": "17:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10646, "total_steps": 17941, "loss": 1.6259, "learning_rate": 3.6600212425437275e-05, "epoch": 0.5933894431748509, "percentage": 59.34, "elapsed_time": "1 day, 1:11:55", "remaining_time": "17:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10647, "total_steps": 17941, "loss": 1.5076, "learning_rate": 3.659163411778654e-05, "epoch": 0.5934451814280141, "percentage": 59.34, "elapsed_time": "1 day, 1:12:03", "remaining_time": "17:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10648, "total_steps": 17941, "loss": 1.8803, "learning_rate": 3.658305623537098e-05, "epoch": 0.5935009196811772, "percentage": 59.35, "elapsed_time": "1 day, 1:12:12", "remaining_time": "17:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10649, "total_steps": 17941, "loss": 1.4336, "learning_rate": 3.6574478778462676e-05, "epoch": 0.5935566579343403, "percentage": 59.36, "elapsed_time": "1 day, 1:12:20", "remaining_time": "17:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10650, "total_steps": 17941, "loss": 1.5946, "learning_rate": 3.6565901747333616e-05, "epoch": 0.5936123961875035, "percentage": 59.36, "elapsed_time": "1 day, 1:12:29", "remaining_time": "17:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10651, "total_steps": 17941, "loss": 1.9025, "learning_rate": 3.655732514225584e-05, "epoch": 0.5936681344406667, "percentage": 59.37, "elapsed_time": "1 day, 1:12:37", "remaining_time": "17:15:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10652, "total_steps": 17941, "loss": 1.5769, "learning_rate": 3.654874896350132e-05, "epoch": 0.5937238726938298, "percentage": 59.37, "elapsed_time": "1 day, 1:12:46", "remaining_time": "17:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10653, "total_steps": 17941, "loss": 1.5514, "learning_rate": 3.654017321134206e-05, "epoch": 0.5937796109469929, "percentage": 59.38, "elapsed_time": "1 day, 1:12:54", "remaining_time": "17:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10654, "total_steps": 17941, "loss": 1.4165, "learning_rate": 3.653159788605004e-05, "epoch": 0.593835349200156, "percentage": 59.38, "elapsed_time": "1 day, 1:13:03", "remaining_time": "17:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10655, "total_steps": 17941, "loss": 1.4697, "learning_rate": 3.652302298789718e-05, "epoch": 0.5938910874533192, "percentage": 59.39, "elapsed_time": "1 day, 1:13:12", "remaining_time": "17:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10656, "total_steps": 17941, "loss": 1.6819, "learning_rate": 3.65144485171555e-05, "epoch": 0.5939468257064824, "percentage": 59.39, "elapsed_time": "1 day, 1:13:21", "remaining_time": "17:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10657, "total_steps": 17941, "loss": 1.8052, "learning_rate": 3.6505874474096844e-05, "epoch": 0.5940025639596455, "percentage": 59.4, "elapsed_time": "1 day, 1:13:29", "remaining_time": "17:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10658, "total_steps": 17941, "loss": 2.0106, "learning_rate": 3.649730085899321e-05, "epoch": 0.5940583022128086, "percentage": 59.41, "elapsed_time": "1 day, 1:13:38", "remaining_time": "17:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10659, "total_steps": 17941, "loss": 1.3272, "learning_rate": 3.648872767211643e-05, "epoch": 0.5941140404659718, "percentage": 59.41, "elapsed_time": "1 day, 1:13:46", "remaining_time": "17:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10660, "total_steps": 17941, "loss": 1.6486, "learning_rate": 3.648015491373845e-05, "epoch": 0.5941697787191349, "percentage": 59.42, "elapsed_time": "1 day, 1:13:55", "remaining_time": "17:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10661, "total_steps": 17941, "loss": 1.6681, "learning_rate": 3.6471582584131135e-05, "epoch": 0.5942255169722981, "percentage": 59.42, "elapsed_time": "1 day, 1:14:03", "remaining_time": "17:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10662, "total_steps": 17941, "loss": 1.7256, "learning_rate": 3.6463010683566336e-05, "epoch": 0.5942812552254613, "percentage": 59.43, "elapsed_time": "1 day, 1:14:12", "remaining_time": "17:13:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10663, "total_steps": 17941, "loss": 1.5431, "learning_rate": 3.645443921231592e-05, "epoch": 0.5943369934786243, "percentage": 59.43, "elapsed_time": "1 day, 1:14:20", "remaining_time": "17:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10664, "total_steps": 17941, "loss": 1.6071, "learning_rate": 3.644586817065171e-05, "epoch": 0.5943927317317875, "percentage": 59.44, "elapsed_time": "1 day, 1:14:29", "remaining_time": "17:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10665, "total_steps": 17941, "loss": 1.6828, "learning_rate": 3.643729755884554e-05, "epoch": 0.5944484699849507, "percentage": 59.44, "elapsed_time": "1 day, 1:14:38", "remaining_time": "17:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10666, "total_steps": 17941, "loss": 1.4355, "learning_rate": 3.6428727377169195e-05, "epoch": 0.5945042082381138, "percentage": 59.45, "elapsed_time": "1 day, 1:14:46", "remaining_time": "17:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10667, "total_steps": 17941, "loss": 1.8823, "learning_rate": 3.642015762589451e-05, "epoch": 0.594559946491277, "percentage": 59.46, "elapsed_time": "1 day, 1:14:55", "remaining_time": "17:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10668, "total_steps": 17941, "loss": 1.6855, "learning_rate": 3.6411588305293255e-05, "epoch": 0.5946156847444402, "percentage": 59.46, "elapsed_time": "1 day, 1:15:04", "remaining_time": "17:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10669, "total_steps": 17941, "loss": 1.6565, "learning_rate": 3.640301941563717e-05, "epoch": 0.5946714229976032, "percentage": 59.47, "elapsed_time": "1 day, 1:15:13", "remaining_time": "17:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10670, "total_steps": 17941, "loss": 1.7644, "learning_rate": 3.639445095719807e-05, "epoch": 0.5947271612507664, "percentage": 59.47, "elapsed_time": "1 day, 1:15:22", "remaining_time": "17:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10671, "total_steps": 17941, "loss": 1.595, "learning_rate": 3.638588293024763e-05, "epoch": 0.5947828995039296, "percentage": 59.48, "elapsed_time": "1 day, 1:15:31", "remaining_time": "17:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10672, "total_steps": 17941, "loss": 1.7064, "learning_rate": 3.637731533505762e-05, "epoch": 0.5948386377570927, "percentage": 59.48, "elapsed_time": "1 day, 1:15:39", "remaining_time": "17:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10673, "total_steps": 17941, "loss": 1.6056, "learning_rate": 3.6368748171899734e-05, "epoch": 0.5948943760102559, "percentage": 59.49, "elapsed_time": "1 day, 1:15:47", "remaining_time": "17:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10674, "total_steps": 17941, "loss": 1.6079, "learning_rate": 3.636018144104567e-05, "epoch": 0.594950114263419, "percentage": 59.5, "elapsed_time": "1 day, 1:15:56", "remaining_time": "17:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10675, "total_steps": 17941, "loss": 1.7554, "learning_rate": 3.6351615142767146e-05, "epoch": 0.5950058525165821, "percentage": 59.5, "elapsed_time": "1 day, 1:16:04", "remaining_time": "17:11:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10676, "total_steps": 17941, "loss": 1.6637, "learning_rate": 3.634304927733581e-05, "epoch": 0.5950615907697453, "percentage": 59.51, "elapsed_time": "1 day, 1:16:13", "remaining_time": "17:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10677, "total_steps": 17941, "loss": 1.4985, "learning_rate": 3.633448384502333e-05, "epoch": 0.5951173290229084, "percentage": 59.51, "elapsed_time": "1 day, 1:16:22", "remaining_time": "17:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10678, "total_steps": 17941, "loss": 1.5359, "learning_rate": 3.632591884610133e-05, "epoch": 0.5951730672760716, "percentage": 59.52, "elapsed_time": "1 day, 1:16:30", "remaining_time": "17:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10679, "total_steps": 17941, "loss": 1.9455, "learning_rate": 3.631735428084148e-05, "epoch": 0.5952288055292347, "percentage": 59.52, "elapsed_time": "1 day, 1:16:39", "remaining_time": "17:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10680, "total_steps": 17941, "loss": 1.5867, "learning_rate": 3.630879014951536e-05, "epoch": 0.5952845437823978, "percentage": 59.53, "elapsed_time": "1 day, 1:16:47", "remaining_time": "17:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10681, "total_steps": 17941, "loss": 1.6271, "learning_rate": 3.6300226452394584e-05, "epoch": 0.595340282035561, "percentage": 59.53, "elapsed_time": "1 day, 1:16:55", "remaining_time": "17:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10682, "total_steps": 17941, "loss": 1.7173, "learning_rate": 3.629166318975078e-05, "epoch": 0.5953960202887242, "percentage": 59.54, "elapsed_time": "1 day, 1:17:04", "remaining_time": "17:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10683, "total_steps": 17941, "loss": 1.7909, "learning_rate": 3.628310036185546e-05, "epoch": 0.5954517585418873, "percentage": 59.55, "elapsed_time": "1 day, 1:17:12", "remaining_time": "17:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10684, "total_steps": 17941, "loss": 1.6348, "learning_rate": 3.6274537968980255e-05, "epoch": 0.5955074967950504, "percentage": 59.55, "elapsed_time": "1 day, 1:17:21", "remaining_time": "17:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10685, "total_steps": 17941, "loss": 1.7643, "learning_rate": 3.6265976011396655e-05, "epoch": 0.5955632350482136, "percentage": 59.56, "elapsed_time": "1 day, 1:17:29", "remaining_time": "17:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10686, "total_steps": 17941, "loss": 1.5047, "learning_rate": 3.625741448937622e-05, "epoch": 0.5956189733013767, "percentage": 59.56, "elapsed_time": "1 day, 1:17:38", "remaining_time": "17:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10687, "total_steps": 17941, "loss": 1.7784, "learning_rate": 3.6248853403190484e-05, "epoch": 0.5956747115545399, "percentage": 59.57, "elapsed_time": "1 day, 1:17:46", "remaining_time": "17:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10688, "total_steps": 17941, "loss": 1.6646, "learning_rate": 3.624029275311094e-05, "epoch": 0.5957304498077031, "percentage": 59.57, "elapsed_time": "1 day, 1:17:55", "remaining_time": "17:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10689, "total_steps": 17941, "loss": 1.8714, "learning_rate": 3.6231732539409095e-05, "epoch": 0.5957861880608661, "percentage": 59.58, "elapsed_time": "1 day, 1:18:03", "remaining_time": "17:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10690, "total_steps": 17941, "loss": 1.7925, "learning_rate": 3.6223172762356404e-05, "epoch": 0.5958419263140293, "percentage": 59.58, "elapsed_time": "1 day, 1:18:12", "remaining_time": "17:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10691, "total_steps": 17941, "loss": 1.5877, "learning_rate": 3.621461342222436e-05, "epoch": 0.5958976645671925, "percentage": 59.59, "elapsed_time": "1 day, 1:18:20", "remaining_time": "17:09:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10692, "total_steps": 17941, "loss": 2.0101, "learning_rate": 3.62060545192844e-05, "epoch": 0.5959534028203556, "percentage": 59.6, "elapsed_time": "1 day, 1:18:29", "remaining_time": "17:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10693, "total_steps": 17941, "loss": 1.8824, "learning_rate": 3.6197496053807954e-05, "epoch": 0.5960091410735188, "percentage": 59.6, "elapsed_time": "1 day, 1:18:37", "remaining_time": "17:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10694, "total_steps": 17941, "loss": 1.8954, "learning_rate": 3.6188938026066476e-05, "epoch": 0.596064879326682, "percentage": 59.61, "elapsed_time": "1 day, 1:18:46", "remaining_time": "17:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10695, "total_steps": 17941, "loss": 1.8127, "learning_rate": 3.618038043633135e-05, "epoch": 0.596120617579845, "percentage": 59.61, "elapsed_time": "1 day, 1:18:55", "remaining_time": "17:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10696, "total_steps": 17941, "loss": 1.7617, "learning_rate": 3.617182328487399e-05, "epoch": 0.5961763558330082, "percentage": 59.62, "elapsed_time": "1 day, 1:19:04", "remaining_time": "17:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10697, "total_steps": 17941, "loss": 1.7745, "learning_rate": 3.616326657196577e-05, "epoch": 0.5962320940861714, "percentage": 59.62, "elapsed_time": "1 day, 1:19:12", "remaining_time": "17:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10698, "total_steps": 17941, "loss": 1.7582, "learning_rate": 3.615471029787807e-05, "epoch": 0.5962878323393345, "percentage": 59.63, "elapsed_time": "1 day, 1:19:21", "remaining_time": "17:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10699, "total_steps": 17941, "loss": 1.7778, "learning_rate": 3.614615446288222e-05, "epoch": 0.5963435705924977, "percentage": 59.63, "elapsed_time": "1 day, 1:19:29", "remaining_time": "17:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10700, "total_steps": 17941, "loss": 1.4981, "learning_rate": 3.6137599067249566e-05, "epoch": 0.5963993088456607, "percentage": 59.64, "elapsed_time": "1 day, 1:19:38", "remaining_time": "17:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10701, "total_steps": 17941, "loss": 1.7714, "learning_rate": 3.612904411125147e-05, "epoch": 0.5964550470988239, "percentage": 59.65, "elapsed_time": "1 day, 1:19:46", "remaining_time": "17:08:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10702, "total_steps": 17941, "loss": 1.5728, "learning_rate": 3.6120489595159214e-05, "epoch": 0.5965107853519871, "percentage": 59.65, "elapsed_time": "1 day, 1:19:55", "remaining_time": "17:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10703, "total_steps": 17941, "loss": 1.6069, "learning_rate": 3.611193551924411e-05, "epoch": 0.5965665236051502, "percentage": 59.66, "elapsed_time": "1 day, 1:20:03", "remaining_time": "17:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10704, "total_steps": 17941, "loss": 1.4952, "learning_rate": 3.610338188377743e-05, "epoch": 0.5966222618583134, "percentage": 59.66, "elapsed_time": "1 day, 1:20:12", "remaining_time": "17:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10705, "total_steps": 17941, "loss": 1.8509, "learning_rate": 3.609482868903046e-05, "epoch": 0.5966780001114765, "percentage": 59.67, "elapsed_time": "1 day, 1:20:21", "remaining_time": "17:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10706, "total_steps": 17941, "loss": 1.5773, "learning_rate": 3.6086275935274446e-05, "epoch": 0.5967337383646396, "percentage": 59.67, "elapsed_time": "1 day, 1:20:29", "remaining_time": "17:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10707, "total_steps": 17941, "loss": 1.5693, "learning_rate": 3.607772362278063e-05, "epoch": 0.5967894766178028, "percentage": 59.68, "elapsed_time": "1 day, 1:20:37", "remaining_time": "17:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10708, "total_steps": 17941, "loss": 1.5673, "learning_rate": 3.606917175182027e-05, "epoch": 0.596845214870966, "percentage": 59.68, "elapsed_time": "1 day, 1:20:46", "remaining_time": "17:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10709, "total_steps": 17941, "loss": 1.8263, "learning_rate": 3.606062032266453e-05, "epoch": 0.596900953124129, "percentage": 59.69, "elapsed_time": "1 day, 1:20:55", "remaining_time": "17:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10710, "total_steps": 17941, "loss": 1.4876, "learning_rate": 3.605206933558467e-05, "epoch": 0.5969566913772922, "percentage": 59.7, "elapsed_time": "1 day, 1:21:03", "remaining_time": "17:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10711, "total_steps": 17941, "loss": 1.5723, "learning_rate": 3.6043518790851824e-05, "epoch": 0.5970124296304554, "percentage": 59.7, "elapsed_time": "1 day, 1:21:12", "remaining_time": "17:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10712, "total_steps": 17941, "loss": 1.6389, "learning_rate": 3.60349686887372e-05, "epoch": 0.5970681678836185, "percentage": 59.71, "elapsed_time": "1 day, 1:21:21", "remaining_time": "17:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10713, "total_steps": 17941, "loss": 1.7281, "learning_rate": 3.602641902951196e-05, "epoch": 0.5971239061367817, "percentage": 59.71, "elapsed_time": "1 day, 1:21:29", "remaining_time": "17:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10714, "total_steps": 17941, "loss": 1.7753, "learning_rate": 3.601786981344722e-05, "epoch": 0.5971796443899449, "percentage": 59.72, "elapsed_time": "1 day, 1:21:38", "remaining_time": "17:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10715, "total_steps": 17941, "loss": 1.75, "learning_rate": 3.600932104081414e-05, "epoch": 0.5972353826431079, "percentage": 59.72, "elapsed_time": "1 day, 1:21:46", "remaining_time": "17:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10716, "total_steps": 17941, "loss": 1.7143, "learning_rate": 3.6000772711883805e-05, "epoch": 0.5972911208962711, "percentage": 59.73, "elapsed_time": "1 day, 1:21:55", "remaining_time": "17:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10717, "total_steps": 17941, "loss": 1.831, "learning_rate": 3.599222482692737e-05, "epoch": 0.5973468591494343, "percentage": 59.73, "elapsed_time": "1 day, 1:22:03", "remaining_time": "17:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10718, "total_steps": 17941, "loss": 1.6298, "learning_rate": 3.598367738621586e-05, "epoch": 0.5974025974025974, "percentage": 59.74, "elapsed_time": "1 day, 1:22:12", "remaining_time": "17:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10719, "total_steps": 17941, "loss": 1.4701, "learning_rate": 3.5975130390020396e-05, "epoch": 0.5974583356557606, "percentage": 59.75, "elapsed_time": "1 day, 1:22:20", "remaining_time": "17:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10720, "total_steps": 17941, "loss": 1.5741, "learning_rate": 3.596658383861203e-05, "epoch": 0.5975140739089237, "percentage": 59.75, "elapsed_time": "1 day, 1:22:29", "remaining_time": "17:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10721, "total_steps": 17941, "loss": 1.737, "learning_rate": 3.5958037732261804e-05, "epoch": 0.5975698121620868, "percentage": 59.76, "elapsed_time": "1 day, 1:22:37", "remaining_time": "17:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10722, "total_steps": 17941, "loss": 1.5736, "learning_rate": 3.594949207124075e-05, "epoch": 0.59762555041525, "percentage": 59.76, "elapsed_time": "1 day, 1:22:45", "remaining_time": "17:05:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10723, "total_steps": 17941, "loss": 1.5723, "learning_rate": 3.594094685581989e-05, "epoch": 0.5976812886684131, "percentage": 59.77, "elapsed_time": "1 day, 1:22:54", "remaining_time": "17:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10724, "total_steps": 17941, "loss": 1.5994, "learning_rate": 3.5932402086270225e-05, "epoch": 0.5977370269215763, "percentage": 59.77, "elapsed_time": "1 day, 1:23:02", "remaining_time": "17:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10725, "total_steps": 17941, "loss": 1.9002, "learning_rate": 3.592385776286274e-05, "epoch": 0.5977927651747394, "percentage": 59.78, "elapsed_time": "1 day, 1:23:11", "remaining_time": "17:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10726, "total_steps": 17941, "loss": 1.4599, "learning_rate": 3.5915313885868405e-05, "epoch": 0.5978485034279025, "percentage": 59.78, "elapsed_time": "1 day, 1:23:19", "remaining_time": "17:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10727, "total_steps": 17941, "loss": 1.4763, "learning_rate": 3.590677045555822e-05, "epoch": 0.5979042416810657, "percentage": 59.79, "elapsed_time": "1 day, 1:23:28", "remaining_time": "17:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10728, "total_steps": 17941, "loss": 1.6913, "learning_rate": 3.589822747220308e-05, "epoch": 0.5979599799342289, "percentage": 59.8, "elapsed_time": "1 day, 1:23:36", "remaining_time": "17:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10729, "total_steps": 17941, "loss": 1.6534, "learning_rate": 3.588968493607398e-05, "epoch": 0.598015718187392, "percentage": 59.8, "elapsed_time": "1 day, 1:23:45", "remaining_time": "17:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10730, "total_steps": 17941, "loss": 1.6151, "learning_rate": 3.588114284744177e-05, "epoch": 0.5980714564405551, "percentage": 59.81, "elapsed_time": "1 day, 1:23:53", "remaining_time": "17:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10731, "total_steps": 17941, "loss": 1.4861, "learning_rate": 3.587260120657742e-05, "epoch": 0.5981271946937183, "percentage": 59.81, "elapsed_time": "1 day, 1:24:02", "remaining_time": "17:03:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10732, "total_steps": 17941, "loss": 1.984, "learning_rate": 3.5864060013751775e-05, "epoch": 0.5981829329468814, "percentage": 59.82, "elapsed_time": "1 day, 1:24:10", "remaining_time": "17:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10733, "total_steps": 17941, "loss": 2.0094, "learning_rate": 3.585551926923572e-05, "epoch": 0.5982386712000446, "percentage": 59.82, "elapsed_time": "1 day, 1:24:19", "remaining_time": "17:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10734, "total_steps": 17941, "loss": 1.6148, "learning_rate": 3.5846978973300146e-05, "epoch": 0.5982944094532078, "percentage": 59.83, "elapsed_time": "1 day, 1:24:27", "remaining_time": "17:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10735, "total_steps": 17941, "loss": 1.6965, "learning_rate": 3.5838439126215863e-05, "epoch": 0.5983501477063708, "percentage": 59.84, "elapsed_time": "1 day, 1:24:36", "remaining_time": "17:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10736, "total_steps": 17941, "loss": 1.5948, "learning_rate": 3.582989972825374e-05, "epoch": 0.598405885959534, "percentage": 59.84, "elapsed_time": "1 day, 1:24:44", "remaining_time": "17:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10737, "total_steps": 17941, "loss": 1.8262, "learning_rate": 3.5821360779684564e-05, "epoch": 0.5984616242126972, "percentage": 59.85, "elapsed_time": "1 day, 1:24:53", "remaining_time": "17:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10738, "total_steps": 17941, "loss": 1.9408, "learning_rate": 3.581282228077916e-05, "epoch": 0.5985173624658603, "percentage": 59.85, "elapsed_time": "1 day, 1:25:01", "remaining_time": "17:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10739, "total_steps": 17941, "loss": 1.7485, "learning_rate": 3.580428423180833e-05, "epoch": 0.5985731007190235, "percentage": 59.86, "elapsed_time": "1 day, 1:25:10", "remaining_time": "17:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10740, "total_steps": 17941, "loss": 1.5062, "learning_rate": 3.5795746633042825e-05, "epoch": 0.5986288389721867, "percentage": 59.86, "elapsed_time": "1 day, 1:25:18", "remaining_time": "17:02:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10741, "total_steps": 17941, "loss": 1.6942, "learning_rate": 3.578720948475343e-05, "epoch": 0.5986845772253497, "percentage": 59.87, "elapsed_time": "1 day, 1:25:27", "remaining_time": "17:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10742, "total_steps": 17941, "loss": 1.5236, "learning_rate": 3.5778672787210866e-05, "epoch": 0.5987403154785129, "percentage": 59.87, "elapsed_time": "1 day, 1:25:35", "remaining_time": "17:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10743, "total_steps": 17941, "loss": 1.7426, "learning_rate": 3.5770136540685915e-05, "epoch": 0.5987960537316761, "percentage": 59.88, "elapsed_time": "1 day, 1:25:44", "remaining_time": "17:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10744, "total_steps": 17941, "loss": 1.724, "learning_rate": 3.576160074544923e-05, "epoch": 0.5988517919848392, "percentage": 59.89, "elapsed_time": "1 day, 1:25:53", "remaining_time": "17:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10745, "total_steps": 17941, "loss": 1.6856, "learning_rate": 3.575306540177157e-05, "epoch": 0.5989075302380024, "percentage": 59.89, "elapsed_time": "1 day, 1:26:01", "remaining_time": "17:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10746, "total_steps": 17941, "loss": 1.6754, "learning_rate": 3.5744530509923624e-05, "epoch": 0.5989632684911654, "percentage": 59.9, "elapsed_time": "1 day, 1:26:10", "remaining_time": "17:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10747, "total_steps": 17941, "loss": 1.4265, "learning_rate": 3.5735996070176036e-05, "epoch": 0.5990190067443286, "percentage": 59.9, "elapsed_time": "1 day, 1:26:18", "remaining_time": "17:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10748, "total_steps": 17941, "loss": 1.6428, "learning_rate": 3.57274620827995e-05, "epoch": 0.5990747449974918, "percentage": 59.91, "elapsed_time": "1 day, 1:26:27", "remaining_time": "17:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10749, "total_steps": 17941, "loss": 1.5636, "learning_rate": 3.571892854806464e-05, "epoch": 0.5991304832506549, "percentage": 59.91, "elapsed_time": "1 day, 1:26:35", "remaining_time": "17:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10750, "total_steps": 17941, "loss": 1.6054, "learning_rate": 3.5710395466242126e-05, "epoch": 0.5991862215038181, "percentage": 59.92, "elapsed_time": "1 day, 1:26:44", "remaining_time": "17:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10751, "total_steps": 17941, "loss": 1.753, "learning_rate": 3.570186283760254e-05, "epoch": 0.5992419597569812, "percentage": 59.92, "elapsed_time": "1 day, 1:26:52", "remaining_time": "17:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10752, "total_steps": 17941, "loss": 1.4766, "learning_rate": 3.569333066241648e-05, "epoch": 0.5992976980101443, "percentage": 59.93, "elapsed_time": "1 day, 1:27:00", "remaining_time": "17:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10753, "total_steps": 17941, "loss": 1.5641, "learning_rate": 3.568479894095458e-05, "epoch": 0.5993534362633075, "percentage": 59.94, "elapsed_time": "1 day, 1:27:09", "remaining_time": "17:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10754, "total_steps": 17941, "loss": 1.528, "learning_rate": 3.567626767348739e-05, "epoch": 0.5994091745164707, "percentage": 59.94, "elapsed_time": "1 day, 1:27:18", "remaining_time": "17:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10755, "total_steps": 17941, "loss": 1.8203, "learning_rate": 3.5667736860285485e-05, "epoch": 0.5994649127696338, "percentage": 59.95, "elapsed_time": "1 day, 1:27:26", "remaining_time": "17:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10756, "total_steps": 17941, "loss": 1.6485, "learning_rate": 3.5659206501619385e-05, "epoch": 0.599520651022797, "percentage": 59.95, "elapsed_time": "1 day, 1:27:34", "remaining_time": "17:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10757, "total_steps": 17941, "loss": 1.7586, "learning_rate": 3.565067659775966e-05, "epoch": 0.5995763892759601, "percentage": 59.96, "elapsed_time": "1 day, 1:27:43", "remaining_time": "17:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10758, "total_steps": 17941, "loss": 1.607, "learning_rate": 3.56421471489768e-05, "epoch": 0.5996321275291232, "percentage": 59.96, "elapsed_time": "1 day, 1:27:51", "remaining_time": "17:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10759, "total_steps": 17941, "loss": 1.7169, "learning_rate": 3.563361815554131e-05, "epoch": 0.5996878657822864, "percentage": 59.97, "elapsed_time": "1 day, 1:28:00", "remaining_time": "16:59:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10760, "total_steps": 17941, "loss": 1.5978, "learning_rate": 3.5625089617723716e-05, "epoch": 0.5997436040354496, "percentage": 59.97, "elapsed_time": "1 day, 1:28:09", "remaining_time": "16:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10761, "total_steps": 17941, "loss": 1.8016, "learning_rate": 3.5616561535794445e-05, "epoch": 0.5997993422886126, "percentage": 59.98, "elapsed_time": "1 day, 1:28:18", "remaining_time": "16:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10762, "total_steps": 17941, "loss": 1.6588, "learning_rate": 3.5608033910023995e-05, "epoch": 0.5998550805417758, "percentage": 59.99, "elapsed_time": "1 day, 1:28:26", "remaining_time": "16:59:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10763, "total_steps": 17941, "loss": 1.8786, "learning_rate": 3.55995067406828e-05, "epoch": 0.599910818794939, "percentage": 59.99, "elapsed_time": "1 day, 1:28:35", "remaining_time": "16:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10764, "total_steps": 17941, "loss": 1.7054, "learning_rate": 3.5590980028041274e-05, "epoch": 0.5999665570481021, "percentage": 60.0, "elapsed_time": "1 day, 1:28:44", "remaining_time": "16:59:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10765, "total_steps": 17941, "loss": 1.4711, "learning_rate": 3.558245377236987e-05, "epoch": 0.6000222953012653, "percentage": 60.0, "elapsed_time": "1 day, 1:28:53", "remaining_time": "16:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10766, "total_steps": 17941, "loss": 1.6006, "learning_rate": 3.557392797393896e-05, "epoch": 0.6000780335544285, "percentage": 60.01, "elapsed_time": "1 day, 1:29:01", "remaining_time": "16:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10767, "total_steps": 17941, "loss": 1.7297, "learning_rate": 3.556540263301896e-05, "epoch": 0.6001337718075915, "percentage": 60.01, "elapsed_time": "1 day, 1:29:10", "remaining_time": "16:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10768, "total_steps": 17941, "loss": 1.684, "learning_rate": 3.55568777498802e-05, "epoch": 0.6001895100607547, "percentage": 60.02, "elapsed_time": "1 day, 1:29:18", "remaining_time": "16:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10769, "total_steps": 17941, "loss": 1.5644, "learning_rate": 3.554835332479311e-05, "epoch": 0.6002452483139178, "percentage": 60.02, "elapsed_time": "1 day, 1:29:27", "remaining_time": "16:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10770, "total_steps": 17941, "loss": 1.7492, "learning_rate": 3.553982935802795e-05, "epoch": 0.600300986567081, "percentage": 60.03, "elapsed_time": "1 day, 1:29:35", "remaining_time": "16:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10771, "total_steps": 17941, "loss": 1.7471, "learning_rate": 3.5531305849855115e-05, "epoch": 0.6003567248202442, "percentage": 60.04, "elapsed_time": "1 day, 1:29:44", "remaining_time": "16:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10772, "total_steps": 17941, "loss": 1.6402, "learning_rate": 3.552278280054491e-05, "epoch": 0.6004124630734072, "percentage": 60.04, "elapsed_time": "1 day, 1:29:53", "remaining_time": "16:58:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10773, "total_steps": 17941, "loss": 1.5077, "learning_rate": 3.551426021036761e-05, "epoch": 0.6004682013265704, "percentage": 60.05, "elapsed_time": "1 day, 1:30:01", "remaining_time": "16:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10774, "total_steps": 17941, "loss": 1.8933, "learning_rate": 3.550573807959353e-05, "epoch": 0.6005239395797336, "percentage": 60.05, "elapsed_time": "1 day, 1:30:10", "remaining_time": "16:57:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10775, "total_steps": 17941, "loss": 1.5747, "learning_rate": 3.549721640849293e-05, "epoch": 0.6005796778328967, "percentage": 60.06, "elapsed_time": "1 day, 1:30:18", "remaining_time": "16:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10776, "total_steps": 17941, "loss": 1.7253, "learning_rate": 3.548869519733606e-05, "epoch": 0.6006354160860599, "percentage": 60.06, "elapsed_time": "1 day, 1:30:27", "remaining_time": "16:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10777, "total_steps": 17941, "loss": 1.6655, "learning_rate": 3.5480174446393175e-05, "epoch": 0.600691154339223, "percentage": 60.07, "elapsed_time": "1 day, 1:30:36", "remaining_time": "16:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10778, "total_steps": 17941, "loss": 1.3522, "learning_rate": 3.5471654155934485e-05, "epoch": 0.6007468925923861, "percentage": 60.07, "elapsed_time": "1 day, 1:30:44", "remaining_time": "16:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10779, "total_steps": 17941, "loss": 1.8613, "learning_rate": 3.546313432623025e-05, "epoch": 0.6008026308455493, "percentage": 60.08, "elapsed_time": "1 day, 1:30:53", "remaining_time": "16:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10780, "total_steps": 17941, "loss": 1.6849, "learning_rate": 3.545461495755061e-05, "epoch": 0.6008583690987125, "percentage": 60.09, "elapsed_time": "1 day, 1:31:01", "remaining_time": "16:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10781, "total_steps": 17941, "loss": 1.7203, "learning_rate": 3.54460960501658e-05, "epoch": 0.6009141073518756, "percentage": 60.09, "elapsed_time": "1 day, 1:31:10", "remaining_time": "16:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10782, "total_steps": 17941, "loss": 1.4293, "learning_rate": 3.5437577604345964e-05, "epoch": 0.6009698456050387, "percentage": 60.1, "elapsed_time": "1 day, 1:31:18", "remaining_time": "16:56:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10783, "total_steps": 17941, "loss": 1.7313, "learning_rate": 3.542905962036126e-05, "epoch": 0.6010255838582019, "percentage": 60.1, "elapsed_time": "1 day, 1:31:27", "remaining_time": "16:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10784, "total_steps": 17941, "loss": 1.7252, "learning_rate": 3.542054209848182e-05, "epoch": 0.601081322111365, "percentage": 60.11, "elapsed_time": "1 day, 1:31:36", "remaining_time": "16:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10785, "total_steps": 17941, "loss": 1.7057, "learning_rate": 3.5412025038977774e-05, "epoch": 0.6011370603645282, "percentage": 60.11, "elapsed_time": "1 day, 1:31:45", "remaining_time": "16:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10786, "total_steps": 17941, "loss": 1.813, "learning_rate": 3.540350844211927e-05, "epoch": 0.6011927986176914, "percentage": 60.12, "elapsed_time": "1 day, 1:31:54", "remaining_time": "16:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10787, "total_steps": 17941, "loss": 1.765, "learning_rate": 3.539499230817634e-05, "epoch": 0.6012485368708544, "percentage": 60.12, "elapsed_time": "1 day, 1:32:02", "remaining_time": "16:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10788, "total_steps": 17941, "loss": 1.6828, "learning_rate": 3.538647663741913e-05, "epoch": 0.6013042751240176, "percentage": 60.13, "elapsed_time": "1 day, 1:32:12", "remaining_time": "16:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10789, "total_steps": 17941, "loss": 1.8815, "learning_rate": 3.5377961430117665e-05, "epoch": 0.6013600133771808, "percentage": 60.14, "elapsed_time": "1 day, 1:32:20", "remaining_time": "16:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10790, "total_steps": 17941, "loss": 1.8932, "learning_rate": 3.5369446686542016e-05, "epoch": 0.6014157516303439, "percentage": 60.14, "elapsed_time": "1 day, 1:32:29", "remaining_time": "16:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10791, "total_steps": 17941, "loss": 1.8328, "learning_rate": 3.5360932406962214e-05, "epoch": 0.6014714898835071, "percentage": 60.15, "elapsed_time": "1 day, 1:32:37", "remaining_time": "16:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10792, "total_steps": 17941, "loss": 1.4607, "learning_rate": 3.5352418591648285e-05, "epoch": 0.6015272281366701, "percentage": 60.15, "elapsed_time": "1 day, 1:32:46", "remaining_time": "16:55:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10793, "total_steps": 17941, "loss": 1.7778, "learning_rate": 3.534390524087024e-05, "epoch": 0.6015829663898333, "percentage": 60.16, "elapsed_time": "1 day, 1:32:54", "remaining_time": "16:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10794, "total_steps": 17941, "loss": 1.6689, "learning_rate": 3.5335392354898055e-05, "epoch": 0.6016387046429965, "percentage": 60.16, "elapsed_time": "1 day, 1:33:03", "remaining_time": "16:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10795, "total_steps": 17941, "loss": 1.6137, "learning_rate": 3.532687993400175e-05, "epoch": 0.6016944428961596, "percentage": 60.17, "elapsed_time": "1 day, 1:33:12", "remaining_time": "16:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10796, "total_steps": 17941, "loss": 1.5538, "learning_rate": 3.5318367978451234e-05, "epoch": 0.6017501811493228, "percentage": 60.18, "elapsed_time": "1 day, 1:33:20", "remaining_time": "16:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10797, "total_steps": 17941, "loss": 1.7932, "learning_rate": 3.530985648851649e-05, "epoch": 0.601805919402486, "percentage": 60.18, "elapsed_time": "1 day, 1:33:29", "remaining_time": "16:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10798, "total_steps": 17941, "loss": 1.7293, "learning_rate": 3.530134546446747e-05, "epoch": 0.601861657655649, "percentage": 60.19, "elapsed_time": "1 day, 1:33:37", "remaining_time": "16:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10799, "total_steps": 17941, "loss": 1.6503, "learning_rate": 3.529283490657406e-05, "epoch": 0.6019173959088122, "percentage": 60.19, "elapsed_time": "1 day, 1:33:46", "remaining_time": "16:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10800, "total_steps": 17941, "loss": 1.7405, "learning_rate": 3.5284324815106184e-05, "epoch": 0.6019731341619754, "percentage": 60.2, "elapsed_time": "1 day, 1:33:54", "remaining_time": "16:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10801, "total_steps": 17941, "loss": 1.9516, "learning_rate": 3.527581519033372e-05, "epoch": 0.6020288724151385, "percentage": 60.2, "elapsed_time": "1 day, 1:34:03", "remaining_time": "16:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10802, "total_steps": 17941, "loss": 1.518, "learning_rate": 3.5267306032526556e-05, "epoch": 0.6020846106683017, "percentage": 60.21, "elapsed_time": "1 day, 1:34:11", "remaining_time": "16:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10803, "total_steps": 17941, "loss": 1.9563, "learning_rate": 3.525879734195453e-05, "epoch": 0.6021403489214648, "percentage": 60.21, "elapsed_time": "1 day, 1:34:20", "remaining_time": "16:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10804, "total_steps": 17941, "loss": 1.4931, "learning_rate": 3.525028911888751e-05, "epoch": 0.6021960871746279, "percentage": 60.22, "elapsed_time": "1 day, 1:34:28", "remaining_time": "16:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10805, "total_steps": 17941, "loss": 1.6004, "learning_rate": 3.5241781363595344e-05, "epoch": 0.6022518254277911, "percentage": 60.23, "elapsed_time": "1 day, 1:34:37", "remaining_time": "16:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10806, "total_steps": 17941, "loss": 1.5503, "learning_rate": 3.523327407634781e-05, "epoch": 0.6023075636809543, "percentage": 60.23, "elapsed_time": "1 day, 1:34:45", "remaining_time": "16:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10807, "total_steps": 17941, "loss": 1.8868, "learning_rate": 3.5224767257414734e-05, "epoch": 0.6023633019341174, "percentage": 60.24, "elapsed_time": "1 day, 1:34:54", "remaining_time": "16:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10808, "total_steps": 17941, "loss": 1.7416, "learning_rate": 3.521626090706589e-05, "epoch": 0.6024190401872805, "percentage": 60.24, "elapsed_time": "1 day, 1:35:02", "remaining_time": "16:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10809, "total_steps": 17941, "loss": 1.6226, "learning_rate": 3.5207755025571066e-05, "epoch": 0.6024747784404437, "percentage": 60.25, "elapsed_time": "1 day, 1:35:11", "remaining_time": "16:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10810, "total_steps": 17941, "loss": 1.5139, "learning_rate": 3.519924961319999e-05, "epoch": 0.6025305166936068, "percentage": 60.25, "elapsed_time": "1 day, 1:35:19", "remaining_time": "16:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10811, "total_steps": 17941, "loss": 1.5466, "learning_rate": 3.519074467022241e-05, "epoch": 0.60258625494677, "percentage": 60.26, "elapsed_time": "1 day, 1:35:28", "remaining_time": "16:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10812, "total_steps": 17941, "loss": 1.5498, "learning_rate": 3.518224019690811e-05, "epoch": 0.6026419931999332, "percentage": 60.26, "elapsed_time": "1 day, 1:35:36", "remaining_time": "16:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10813, "total_steps": 17941, "loss": 1.5064, "learning_rate": 3.517373619352672e-05, "epoch": 0.6026977314530962, "percentage": 60.27, "elapsed_time": "1 day, 1:35:45", "remaining_time": "16:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10814, "total_steps": 17941, "loss": 1.9771, "learning_rate": 3.516523266034799e-05, "epoch": 0.6027534697062594, "percentage": 60.28, "elapsed_time": "1 day, 1:35:53", "remaining_time": "16:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10815, "total_steps": 17941, "loss": 1.5936, "learning_rate": 3.515672959764158e-05, "epoch": 0.6028092079594225, "percentage": 60.28, "elapsed_time": "1 day, 1:36:02", "remaining_time": "16:52:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10816, "total_steps": 17941, "loss": 1.7219, "learning_rate": 3.514822700567718e-05, "epoch": 0.6028649462125857, "percentage": 60.29, "elapsed_time": "1 day, 1:36:10", "remaining_time": "16:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10817, "total_steps": 17941, "loss": 1.6883, "learning_rate": 3.5139724884724406e-05, "epoch": 0.6029206844657489, "percentage": 60.29, "elapsed_time": "1 day, 1:36:19", "remaining_time": "16:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10818, "total_steps": 17941, "loss": 1.8162, "learning_rate": 3.5131223235052927e-05, "epoch": 0.6029764227189119, "percentage": 60.3, "elapsed_time": "1 day, 1:36:27", "remaining_time": "16:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10819, "total_steps": 17941, "loss": 1.7268, "learning_rate": 3.512272205693236e-05, "epoch": 0.6030321609720751, "percentage": 60.3, "elapsed_time": "1 day, 1:36:36", "remaining_time": "16:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10820, "total_steps": 17941, "loss": 1.7887, "learning_rate": 3.511422135063229e-05, "epoch": 0.6030878992252383, "percentage": 60.31, "elapsed_time": "1 day, 1:36:44", "remaining_time": "16:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10821, "total_steps": 17941, "loss": 1.5031, "learning_rate": 3.5105721116422364e-05, "epoch": 0.6031436374784014, "percentage": 60.31, "elapsed_time": "1 day, 1:36:53", "remaining_time": "16:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10822, "total_steps": 17941, "loss": 1.486, "learning_rate": 3.509722135457209e-05, "epoch": 0.6031993757315646, "percentage": 60.32, "elapsed_time": "1 day, 1:37:02", "remaining_time": "16:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10823, "total_steps": 17941, "loss": 1.6346, "learning_rate": 3.5088722065351074e-05, "epoch": 0.6032551139847278, "percentage": 60.33, "elapsed_time": "1 day, 1:37:10", "remaining_time": "16:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10824, "total_steps": 17941, "loss": 1.6415, "learning_rate": 3.508022324902888e-05, "epoch": 0.6033108522378908, "percentage": 60.33, "elapsed_time": "1 day, 1:37:19", "remaining_time": "16:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10825, "total_steps": 17941, "loss": 1.8652, "learning_rate": 3.507172490587499e-05, "epoch": 0.603366590491054, "percentage": 60.34, "elapsed_time": "1 day, 1:37:27", "remaining_time": "16:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10826, "total_steps": 17941, "loss": 1.6726, "learning_rate": 3.5063227036158956e-05, "epoch": 0.6034223287442172, "percentage": 60.34, "elapsed_time": "1 day, 1:37:36", "remaining_time": "16:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10827, "total_steps": 17941, "loss": 1.6772, "learning_rate": 3.5054729640150274e-05, "epoch": 0.6034780669973803, "percentage": 60.35, "elapsed_time": "1 day, 1:37:44", "remaining_time": "16:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10828, "total_steps": 17941, "loss": 1.714, "learning_rate": 3.504623271811843e-05, "epoch": 0.6035338052505435, "percentage": 60.35, "elapsed_time": "1 day, 1:37:53", "remaining_time": "16:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10829, "total_steps": 17941, "loss": 1.6752, "learning_rate": 3.5037736270332886e-05, "epoch": 0.6035895435037066, "percentage": 60.36, "elapsed_time": "1 day, 1:38:02", "remaining_time": "16:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10830, "total_steps": 17941, "loss": 1.3809, "learning_rate": 3.502924029706312e-05, "epoch": 0.6036452817568697, "percentage": 60.36, "elapsed_time": "1 day, 1:38:10", "remaining_time": "16:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10831, "total_steps": 17941, "loss": 1.6847, "learning_rate": 3.502074479857858e-05, "epoch": 0.6037010200100329, "percentage": 60.37, "elapsed_time": "1 day, 1:38:19", "remaining_time": "16:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10832, "total_steps": 17941, "loss": 1.7664, "learning_rate": 3.501224977514867e-05, "epoch": 0.6037567582631961, "percentage": 60.38, "elapsed_time": "1 day, 1:38:27", "remaining_time": "16:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10833, "total_steps": 17941, "loss": 1.631, "learning_rate": 3.500375522704281e-05, "epoch": 0.6038124965163592, "percentage": 60.38, "elapsed_time": "1 day, 1:38:36", "remaining_time": "16:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10834, "total_steps": 17941, "loss": 1.6952, "learning_rate": 3.49952611545304e-05, "epoch": 0.6038682347695223, "percentage": 60.39, "elapsed_time": "1 day, 1:38:44", "remaining_time": "16:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10835, "total_steps": 17941, "loss": 1.5307, "learning_rate": 3.498676755788083e-05, "epoch": 0.6039239730226855, "percentage": 60.39, "elapsed_time": "1 day, 1:38:53", "remaining_time": "16:49:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10836, "total_steps": 17941, "loss": 1.4216, "learning_rate": 3.497827443736344e-05, "epoch": 0.6039797112758486, "percentage": 60.4, "elapsed_time": "1 day, 1:39:01", "remaining_time": "16:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10837, "total_steps": 17941, "loss": 1.7554, "learning_rate": 3.496978179324761e-05, "epoch": 0.6040354495290118, "percentage": 60.4, "elapsed_time": "1 day, 1:39:09", "remaining_time": "16:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10838, "total_steps": 17941, "loss": 1.677, "learning_rate": 3.49612896258027e-05, "epoch": 0.6040911877821749, "percentage": 60.41, "elapsed_time": "1 day, 1:39:18", "remaining_time": "16:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10839, "total_steps": 17941, "loss": 1.8422, "learning_rate": 3.4952797935297955e-05, "epoch": 0.604146926035338, "percentage": 60.41, "elapsed_time": "1 day, 1:39:27", "remaining_time": "16:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10840, "total_steps": 17941, "loss": 1.6821, "learning_rate": 3.494430672200276e-05, "epoch": 0.6042026642885012, "percentage": 60.42, "elapsed_time": "1 day, 1:39:35", "remaining_time": "16:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10841, "total_steps": 17941, "loss": 1.635, "learning_rate": 3.493581598618636e-05, "epoch": 0.6042584025416643, "percentage": 60.43, "elapsed_time": "1 day, 1:39:44", "remaining_time": "16:48:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10842, "total_steps": 17941, "loss": 1.7191, "learning_rate": 3.4927325728118055e-05, "epoch": 0.6043141407948275, "percentage": 60.43, "elapsed_time": "1 day, 1:39:52", "remaining_time": "16:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10843, "total_steps": 17941, "loss": 1.637, "learning_rate": 3.491883594806709e-05, "epoch": 0.6043698790479907, "percentage": 60.44, "elapsed_time": "1 day, 1:40:01", "remaining_time": "16:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10844, "total_steps": 17941, "loss": 1.6545, "learning_rate": 3.4910346646302716e-05, "epoch": 0.6044256173011537, "percentage": 60.44, "elapsed_time": "1 day, 1:40:09", "remaining_time": "16:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10845, "total_steps": 17941, "loss": 1.7508, "learning_rate": 3.4901857823094184e-05, "epoch": 0.6044813555543169, "percentage": 60.45, "elapsed_time": "1 day, 1:40:18", "remaining_time": "16:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10846, "total_steps": 17941, "loss": 1.5451, "learning_rate": 3.489336947871067e-05, "epoch": 0.6045370938074801, "percentage": 60.45, "elapsed_time": "1 day, 1:40:26", "remaining_time": "16:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10847, "total_steps": 17941, "loss": 1.4548, "learning_rate": 3.488488161342143e-05, "epoch": 0.6045928320606432, "percentage": 60.46, "elapsed_time": "1 day, 1:40:35", "remaining_time": "16:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10848, "total_steps": 17941, "loss": 1.926, "learning_rate": 3.487639422749559e-05, "epoch": 0.6046485703138064, "percentage": 60.46, "elapsed_time": "1 day, 1:40:44", "remaining_time": "16:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10849, "total_steps": 17941, "loss": 1.8622, "learning_rate": 3.486790732120235e-05, "epoch": 0.6047043085669696, "percentage": 60.47, "elapsed_time": "1 day, 1:40:52", "remaining_time": "16:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10850, "total_steps": 17941, "loss": 1.6005, "learning_rate": 3.485942089481089e-05, "epoch": 0.6047600468201326, "percentage": 60.48, "elapsed_time": "1 day, 1:41:00", "remaining_time": "16:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10851, "total_steps": 17941, "loss": 1.6028, "learning_rate": 3.4850934948590295e-05, "epoch": 0.6048157850732958, "percentage": 60.48, "elapsed_time": "1 day, 1:41:10", "remaining_time": "16:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10852, "total_steps": 17941, "loss": 1.8607, "learning_rate": 3.484244948280974e-05, "epoch": 0.604871523326459, "percentage": 60.49, "elapsed_time": "1 day, 1:41:18", "remaining_time": "16:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10853, "total_steps": 17941, "loss": 1.6398, "learning_rate": 3.4833964497738305e-05, "epoch": 0.6049272615796221, "percentage": 60.49, "elapsed_time": "1 day, 1:41:27", "remaining_time": "16:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10854, "total_steps": 17941, "loss": 1.6174, "learning_rate": 3.482547999364509e-05, "epoch": 0.6049829998327853, "percentage": 60.5, "elapsed_time": "1 day, 1:41:35", "remaining_time": "16:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10855, "total_steps": 17941, "loss": 1.742, "learning_rate": 3.481699597079916e-05, "epoch": 0.6050387380859484, "percentage": 60.5, "elapsed_time": "1 day, 1:41:44", "remaining_time": "16:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10856, "total_steps": 17941, "loss": 1.626, "learning_rate": 3.480851242946961e-05, "epoch": 0.6050944763391115, "percentage": 60.51, "elapsed_time": "1 day, 1:41:52", "remaining_time": "16:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10857, "total_steps": 17941, "loss": 1.4834, "learning_rate": 3.4800029369925476e-05, "epoch": 0.6051502145922747, "percentage": 60.52, "elapsed_time": "1 day, 1:42:01", "remaining_time": "16:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10858, "total_steps": 17941, "loss": 1.9472, "learning_rate": 3.4791546792435785e-05, "epoch": 0.6052059528454379, "percentage": 60.52, "elapsed_time": "1 day, 1:42:09", "remaining_time": "16:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10859, "total_steps": 17941, "loss": 1.8025, "learning_rate": 3.478306469726957e-05, "epoch": 0.605261691098601, "percentage": 60.53, "elapsed_time": "1 day, 1:42:18", "remaining_time": "16:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10860, "total_steps": 17941, "loss": 1.7116, "learning_rate": 3.4774583084695804e-05, "epoch": 0.6053174293517641, "percentage": 60.53, "elapsed_time": "1 day, 1:42:26", "remaining_time": "16:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10861, "total_steps": 17941, "loss": 1.5637, "learning_rate": 3.476610195498351e-05, "epoch": 0.6053731676049272, "percentage": 60.54, "elapsed_time": "1 day, 1:42:35", "remaining_time": "16:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10862, "total_steps": 17941, "loss": 1.7162, "learning_rate": 3.4757621308401625e-05, "epoch": 0.6054289058580904, "percentage": 60.54, "elapsed_time": "1 day, 1:42:43", "remaining_time": "16:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10863, "total_steps": 17941, "loss": 1.8017, "learning_rate": 3.474914114521912e-05, "epoch": 0.6054846441112536, "percentage": 60.55, "elapsed_time": "1 day, 1:42:52", "remaining_time": "16:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10864, "total_steps": 17941, "loss": 1.5233, "learning_rate": 3.474066146570496e-05, "epoch": 0.6055403823644167, "percentage": 60.55, "elapsed_time": "1 day, 1:43:01", "remaining_time": "16:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10865, "total_steps": 17941, "loss": 1.7133, "learning_rate": 3.4732182270128026e-05, "epoch": 0.6055961206175798, "percentage": 60.56, "elapsed_time": "1 day, 1:43:09", "remaining_time": "16:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10866, "total_steps": 17941, "loss": 1.6873, "learning_rate": 3.472370355875727e-05, "epoch": 0.605651858870743, "percentage": 60.57, "elapsed_time": "1 day, 1:43:17", "remaining_time": "16:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10867, "total_steps": 17941, "loss": 1.4978, "learning_rate": 3.471522533186157e-05, "epoch": 0.6057075971239061, "percentage": 60.57, "elapsed_time": "1 day, 1:43:26", "remaining_time": "16:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10868, "total_steps": 17941, "loss": 1.7908, "learning_rate": 3.470674758970981e-05, "epoch": 0.6057633353770693, "percentage": 60.58, "elapsed_time": "1 day, 1:43:35", "remaining_time": "16:44:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10869, "total_steps": 17941, "loss": 1.8559, "learning_rate": 3.4698270332570835e-05, "epoch": 0.6058190736302325, "percentage": 60.58, "elapsed_time": "1 day, 1:43:43", "remaining_time": "16:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10870, "total_steps": 17941, "loss": 1.8091, "learning_rate": 3.468979356071351e-05, "epoch": 0.6058748118833955, "percentage": 60.59, "elapsed_time": "1 day, 1:43:52", "remaining_time": "16:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10871, "total_steps": 17941, "loss": 1.6181, "learning_rate": 3.468131727440669e-05, "epoch": 0.6059305501365587, "percentage": 60.59, "elapsed_time": "1 day, 1:44:00", "remaining_time": "16:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10872, "total_steps": 17941, "loss": 1.8721, "learning_rate": 3.467284147391914e-05, "epoch": 0.6059862883897219, "percentage": 60.6, "elapsed_time": "1 day, 1:44:09", "remaining_time": "16:44:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10873, "total_steps": 17941, "loss": 1.3427, "learning_rate": 3.466436615951973e-05, "epoch": 0.606042026642885, "percentage": 60.6, "elapsed_time": "1 day, 1:44:17", "remaining_time": "16:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10874, "total_steps": 17941, "loss": 1.6981, "learning_rate": 3.465589133147718e-05, "epoch": 0.6060977648960482, "percentage": 60.61, "elapsed_time": "1 day, 1:44:26", "remaining_time": "16:43:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10875, "total_steps": 17941, "loss": 1.3025, "learning_rate": 3.464741699006031e-05, "epoch": 0.6061535031492113, "percentage": 60.62, "elapsed_time": "1 day, 1:44:34", "remaining_time": "16:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10876, "total_steps": 17941, "loss": 1.5597, "learning_rate": 3.4638943135537864e-05, "epoch": 0.6062092414023744, "percentage": 60.62, "elapsed_time": "1 day, 1:44:43", "remaining_time": "16:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10877, "total_steps": 17941, "loss": 1.6599, "learning_rate": 3.463046976817857e-05, "epoch": 0.6062649796555376, "percentage": 60.63, "elapsed_time": "1 day, 1:44:51", "remaining_time": "16:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10878, "total_steps": 17941, "loss": 1.7096, "learning_rate": 3.462199688825119e-05, "epoch": 0.6063207179087008, "percentage": 60.63, "elapsed_time": "1 day, 1:45:00", "remaining_time": "16:43:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10879, "total_steps": 17941, "loss": 1.6227, "learning_rate": 3.461352449602439e-05, "epoch": 0.6063764561618639, "percentage": 60.64, "elapsed_time": "1 day, 1:45:08", "remaining_time": "16:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10880, "total_steps": 17941, "loss": 1.9214, "learning_rate": 3.4605052591766884e-05, "epoch": 0.606432194415027, "percentage": 60.64, "elapsed_time": "1 day, 1:45:17", "remaining_time": "16:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10881, "total_steps": 17941, "loss": 1.6082, "learning_rate": 3.459658117574733e-05, "epoch": 0.6064879326681902, "percentage": 60.65, "elapsed_time": "1 day, 1:45:25", "remaining_time": "16:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10882, "total_steps": 17941, "loss": 1.5039, "learning_rate": 3.458811024823444e-05, "epoch": 0.6065436709213533, "percentage": 60.65, "elapsed_time": "1 day, 1:45:34", "remaining_time": "16:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10883, "total_steps": 17941, "loss": 1.5629, "learning_rate": 3.4579639809496835e-05, "epoch": 0.6065994091745165, "percentage": 60.66, "elapsed_time": "1 day, 1:45:43", "remaining_time": "16:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10884, "total_steps": 17941, "loss": 1.5471, "learning_rate": 3.4571169859803135e-05, "epoch": 0.6066551474276796, "percentage": 60.67, "elapsed_time": "1 day, 1:45:51", "remaining_time": "16:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10885, "total_steps": 17941, "loss": 1.7089, "learning_rate": 3.4562700399421985e-05, "epoch": 0.6067108856808427, "percentage": 60.67, "elapsed_time": "1 day, 1:46:00", "remaining_time": "16:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10886, "total_steps": 17941, "loss": 1.7032, "learning_rate": 3.455423142862196e-05, "epoch": 0.6067666239340059, "percentage": 60.68, "elapsed_time": "1 day, 1:46:08", "remaining_time": "16:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10887, "total_steps": 17941, "loss": 1.6528, "learning_rate": 3.4545762947671676e-05, "epoch": 0.606822362187169, "percentage": 60.68, "elapsed_time": "1 day, 1:46:17", "remaining_time": "16:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10888, "total_steps": 17941, "loss": 1.641, "learning_rate": 3.453729495683967e-05, "epoch": 0.6068781004403322, "percentage": 60.69, "elapsed_time": "1 day, 1:46:25", "remaining_time": "16:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10889, "total_steps": 17941, "loss": 1.77, "learning_rate": 3.4528827456394506e-05, "epoch": 0.6069338386934954, "percentage": 60.69, "elapsed_time": "1 day, 1:46:34", "remaining_time": "16:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10890, "total_steps": 17941, "loss": 1.7991, "learning_rate": 3.452036044660476e-05, "epoch": 0.6069895769466584, "percentage": 60.7, "elapsed_time": "1 day, 1:46:42", "remaining_time": "16:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10891, "total_steps": 17941, "loss": 1.592, "learning_rate": 3.451189392773891e-05, "epoch": 0.6070453151998216, "percentage": 60.7, "elapsed_time": "1 day, 1:46:51", "remaining_time": "16:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10892, "total_steps": 17941, "loss": 1.4394, "learning_rate": 3.45034279000655e-05, "epoch": 0.6071010534529848, "percentage": 60.71, "elapsed_time": "1 day, 1:46:59", "remaining_time": "16:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10893, "total_steps": 17941, "loss": 1.7956, "learning_rate": 3.449496236385298e-05, "epoch": 0.6071567917061479, "percentage": 60.72, "elapsed_time": "1 day, 1:47:08", "remaining_time": "16:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10894, "total_steps": 17941, "loss": 1.6404, "learning_rate": 3.448649731936988e-05, "epoch": 0.6072125299593111, "percentage": 60.72, "elapsed_time": "1 day, 1:47:16", "remaining_time": "16:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10895, "total_steps": 17941, "loss": 1.6412, "learning_rate": 3.4478032766884615e-05, "epoch": 0.6072682682124743, "percentage": 60.73, "elapsed_time": "1 day, 1:47:25", "remaining_time": "16:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10896, "total_steps": 17941, "loss": 1.699, "learning_rate": 3.446956870666565e-05, "epoch": 0.6073240064656373, "percentage": 60.73, "elapsed_time": "1 day, 1:47:33", "remaining_time": "16:40:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10897, "total_steps": 17941, "loss": 1.6323, "learning_rate": 3.446110513898143e-05, "epoch": 0.6073797447188005, "percentage": 60.74, "elapsed_time": "1 day, 1:47:42", "remaining_time": "16:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10898, "total_steps": 17941, "loss": 1.727, "learning_rate": 3.445264206410034e-05, "epoch": 0.6074354829719637, "percentage": 60.74, "elapsed_time": "1 day, 1:47:50", "remaining_time": "16:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10899, "total_steps": 17941, "loss": 1.4174, "learning_rate": 3.444417948229083e-05, "epoch": 0.6074912212251268, "percentage": 60.75, "elapsed_time": "1 day, 1:47:59", "remaining_time": "16:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10900, "total_steps": 17941, "loss": 1.7969, "learning_rate": 3.443571739382121e-05, "epoch": 0.60754695947829, "percentage": 60.75, "elapsed_time": "1 day, 1:48:07", "remaining_time": "16:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10901, "total_steps": 17941, "loss": 1.7629, "learning_rate": 3.44272557989599e-05, "epoch": 0.6076026977314531, "percentage": 60.76, "elapsed_time": "1 day, 1:48:16", "remaining_time": "16:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10902, "total_steps": 17941, "loss": 1.6894, "learning_rate": 3.4418794697975254e-05, "epoch": 0.6076584359846162, "percentage": 60.77, "elapsed_time": "1 day, 1:48:24", "remaining_time": "16:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10903, "total_steps": 17941, "loss": 1.6697, "learning_rate": 3.4410334091135586e-05, "epoch": 0.6077141742377794, "percentage": 60.77, "elapsed_time": "1 day, 1:48:33", "remaining_time": "16:39:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10904, "total_steps": 17941, "loss": 1.7436, "learning_rate": 3.440187397870923e-05, "epoch": 0.6077699124909426, "percentage": 60.78, "elapsed_time": "1 day, 1:48:41", "remaining_time": "16:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10905, "total_steps": 17941, "loss": 1.921, "learning_rate": 3.4393414360964486e-05, "epoch": 0.6078256507441057, "percentage": 60.78, "elapsed_time": "1 day, 1:48:50", "remaining_time": "16:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10906, "total_steps": 17941, "loss": 1.5432, "learning_rate": 3.438495523816966e-05, "epoch": 0.6078813889972688, "percentage": 60.79, "elapsed_time": "1 day, 1:48:58", "remaining_time": "16:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10907, "total_steps": 17941, "loss": 1.4088, "learning_rate": 3.437649661059298e-05, "epoch": 0.6079371272504319, "percentage": 60.79, "elapsed_time": "1 day, 1:49:07", "remaining_time": "16:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10908, "total_steps": 17941, "loss": 1.964, "learning_rate": 3.436803847850275e-05, "epoch": 0.6079928655035951, "percentage": 60.8, "elapsed_time": "1 day, 1:49:15", "remaining_time": "16:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10909, "total_steps": 17941, "loss": 1.8181, "learning_rate": 3.4359580842167205e-05, "epoch": 0.6080486037567583, "percentage": 60.8, "elapsed_time": "1 day, 1:49:24", "remaining_time": "16:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10910, "total_steps": 17941, "loss": 1.5749, "learning_rate": 3.435112370185456e-05, "epoch": 0.6081043420099214, "percentage": 60.81, "elapsed_time": "1 day, 1:49:32", "remaining_time": "16:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10911, "total_steps": 17941, "loss": 1.5584, "learning_rate": 3.434266705783305e-05, "epoch": 0.6081600802630845, "percentage": 60.82, "elapsed_time": "1 day, 1:49:41", "remaining_time": "16:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10912, "total_steps": 17941, "loss": 1.4784, "learning_rate": 3.4334210910370833e-05, "epoch": 0.6082158185162477, "percentage": 60.82, "elapsed_time": "1 day, 1:49:49", "remaining_time": "16:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10913, "total_steps": 17941, "loss": 1.748, "learning_rate": 3.4325755259736114e-05, "epoch": 0.6082715567694108, "percentage": 60.83, "elapsed_time": "1 day, 1:49:58", "remaining_time": "16:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10914, "total_steps": 17941, "loss": 1.4765, "learning_rate": 3.4317300106197045e-05, "epoch": 0.608327295022574, "percentage": 60.83, "elapsed_time": "1 day, 1:50:06", "remaining_time": "16:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10915, "total_steps": 17941, "loss": 1.5289, "learning_rate": 3.430884545002178e-05, "epoch": 0.6083830332757372, "percentage": 60.84, "elapsed_time": "1 day, 1:50:15", "remaining_time": "16:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10916, "total_steps": 17941, "loss": 1.7349, "learning_rate": 3.430039129147846e-05, "epoch": 0.6084387715289002, "percentage": 60.84, "elapsed_time": "1 day, 1:50:23", "remaining_time": "16:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10917, "total_steps": 17941, "loss": 1.8119, "learning_rate": 3.4291937630835184e-05, "epoch": 0.6084945097820634, "percentage": 60.85, "elapsed_time": "1 day, 1:50:32", "remaining_time": "16:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10918, "total_steps": 17941, "loss": 1.4698, "learning_rate": 3.428348446836008e-05, "epoch": 0.6085502480352266, "percentage": 60.86, "elapsed_time": "1 day, 1:50:40", "remaining_time": "16:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10919, "total_steps": 17941, "loss": 1.7174, "learning_rate": 3.42750318043212e-05, "epoch": 0.6086059862883897, "percentage": 60.86, "elapsed_time": "1 day, 1:50:49", "remaining_time": "16:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10920, "total_steps": 17941, "loss": 1.7808, "learning_rate": 3.4266579638986637e-05, "epoch": 0.6086617245415529, "percentage": 60.87, "elapsed_time": "1 day, 1:50:57", "remaining_time": "16:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10921, "total_steps": 17941, "loss": 1.5736, "learning_rate": 3.4258127972624423e-05, "epoch": 0.6087174627947161, "percentage": 60.87, "elapsed_time": "1 day, 1:51:06", "remaining_time": "16:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10922, "total_steps": 17941, "loss": 1.3187, "learning_rate": 3.424967680550261e-05, "epoch": 0.6087732010478791, "percentage": 60.88, "elapsed_time": "1 day, 1:51:15", "remaining_time": "16:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10923, "total_steps": 17941, "loss": 1.6827, "learning_rate": 3.424122613788923e-05, "epoch": 0.6088289393010423, "percentage": 60.88, "elapsed_time": "1 day, 1:51:23", "remaining_time": "16:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10924, "total_steps": 17941, "loss": 1.548, "learning_rate": 3.423277597005226e-05, "epoch": 0.6088846775542055, "percentage": 60.89, "elapsed_time": "1 day, 1:51:32", "remaining_time": "16:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10925, "total_steps": 17941, "loss": 1.7789, "learning_rate": 3.422432630225974e-05, "epoch": 0.6089404158073686, "percentage": 60.89, "elapsed_time": "1 day, 1:51:40", "remaining_time": "16:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10926, "total_steps": 17941, "loss": 1.6069, "learning_rate": 3.421587713477957e-05, "epoch": 0.6089961540605318, "percentage": 60.9, "elapsed_time": "1 day, 1:51:49", "remaining_time": "16:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10927, "total_steps": 17941, "loss": 1.4861, "learning_rate": 3.4207428467879774e-05, "epoch": 0.6090518923136949, "percentage": 60.91, "elapsed_time": "1 day, 1:51:57", "remaining_time": "16:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10928, "total_steps": 17941, "loss": 1.5054, "learning_rate": 3.419898030182825e-05, "epoch": 0.609107630566858, "percentage": 60.91, "elapsed_time": "1 day, 1:52:06", "remaining_time": "16:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10929, "total_steps": 17941, "loss": 1.9566, "learning_rate": 3.4190532636892955e-05, "epoch": 0.6091633688200212, "percentage": 60.92, "elapsed_time": "1 day, 1:52:14", "remaining_time": "16:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10930, "total_steps": 17941, "loss": 1.4754, "learning_rate": 3.418208547334181e-05, "epoch": 0.6092191070731843, "percentage": 60.92, "elapsed_time": "1 day, 1:52:23", "remaining_time": "16:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10931, "total_steps": 17941, "loss": 1.4885, "learning_rate": 3.417363881144267e-05, "epoch": 0.6092748453263475, "percentage": 60.93, "elapsed_time": "1 day, 1:52:31", "remaining_time": "16:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10932, "total_steps": 17941, "loss": 1.5243, "learning_rate": 3.416519265146343e-05, "epoch": 0.6093305835795106, "percentage": 60.93, "elapsed_time": "1 day, 1:52:40", "remaining_time": "16:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10933, "total_steps": 17941, "loss": 1.5245, "learning_rate": 3.415674699367195e-05, "epoch": 0.6093863218326737, "percentage": 60.94, "elapsed_time": "1 day, 1:52:48", "remaining_time": "16:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10934, "total_steps": 17941, "loss": 1.6732, "learning_rate": 3.414830183833608e-05, "epoch": 0.6094420600858369, "percentage": 60.94, "elapsed_time": "1 day, 1:52:57", "remaining_time": "16:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10935, "total_steps": 17941, "loss": 1.6273, "learning_rate": 3.413985718572368e-05, "epoch": 0.6094977983390001, "percentage": 60.95, "elapsed_time": "1 day, 1:53:05", "remaining_time": "16:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10936, "total_steps": 17941, "loss": 1.7216, "learning_rate": 3.413141303610252e-05, "epoch": 0.6095535365921632, "percentage": 60.96, "elapsed_time": "1 day, 1:53:14", "remaining_time": "16:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10937, "total_steps": 17941, "loss": 1.6605, "learning_rate": 3.412296938974043e-05, "epoch": 0.6096092748453263, "percentage": 60.96, "elapsed_time": "1 day, 1:53:22", "remaining_time": "16:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10938, "total_steps": 17941, "loss": 1.6557, "learning_rate": 3.4114526246905176e-05, "epoch": 0.6096650130984895, "percentage": 60.97, "elapsed_time": "1 day, 1:53:31", "remaining_time": "16:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10939, "total_steps": 17941, "loss": 1.6936, "learning_rate": 3.410608360786454e-05, "epoch": 0.6097207513516526, "percentage": 60.97, "elapsed_time": "1 day, 1:53:40", "remaining_time": "16:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10940, "total_steps": 17941, "loss": 1.5873, "learning_rate": 3.4097641472886245e-05, "epoch": 0.6097764896048158, "percentage": 60.98, "elapsed_time": "1 day, 1:53:48", "remaining_time": "16:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10941, "total_steps": 17941, "loss": 1.636, "learning_rate": 3.408919984223804e-05, "epoch": 0.609832227857979, "percentage": 60.98, "elapsed_time": "1 day, 1:53:56", "remaining_time": "16:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10942, "total_steps": 17941, "loss": 1.5813, "learning_rate": 3.408075871618767e-05, "epoch": 0.609887966111142, "percentage": 60.99, "elapsed_time": "1 day, 1:54:05", "remaining_time": "16:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10943, "total_steps": 17941, "loss": 1.8607, "learning_rate": 3.407231809500281e-05, "epoch": 0.6099437043643052, "percentage": 60.99, "elapsed_time": "1 day, 1:54:13", "remaining_time": "16:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10944, "total_steps": 17941, "loss": 1.6621, "learning_rate": 3.406387797895116e-05, "epoch": 0.6099994426174684, "percentage": 61.0, "elapsed_time": "1 day, 1:54:22", "remaining_time": "16:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10945, "total_steps": 17941, "loss": 1.8064, "learning_rate": 3.405543836830038e-05, "epoch": 0.6100551808706315, "percentage": 61.01, "elapsed_time": "1 day, 1:54:30", "remaining_time": "16:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10946, "total_steps": 17941, "loss": 1.6508, "learning_rate": 3.404699926331814e-05, "epoch": 0.6101109191237947, "percentage": 61.01, "elapsed_time": "1 day, 1:54:39", "remaining_time": "16:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10947, "total_steps": 17941, "loss": 1.8309, "learning_rate": 3.403856066427207e-05, "epoch": 0.6101666573769579, "percentage": 61.02, "elapsed_time": "1 day, 1:54:47", "remaining_time": "16:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10948, "total_steps": 17941, "loss": 1.6079, "learning_rate": 3.403012257142977e-05, "epoch": 0.6102223956301209, "percentage": 61.02, "elapsed_time": "1 day, 1:54:56", "remaining_time": "16:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10949, "total_steps": 17941, "loss": 1.5691, "learning_rate": 3.4021684985058914e-05, "epoch": 0.6102781338832841, "percentage": 61.03, "elapsed_time": "1 day, 1:55:04", "remaining_time": "16:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10950, "total_steps": 17941, "loss": 1.7893, "learning_rate": 3.4013247905427e-05, "epoch": 0.6103338721364473, "percentage": 61.03, "elapsed_time": "1 day, 1:55:13", "remaining_time": "16:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10951, "total_steps": 17941, "loss": 1.708, "learning_rate": 3.4004811332801705e-05, "epoch": 0.6103896103896104, "percentage": 61.04, "elapsed_time": "1 day, 1:55:22", "remaining_time": "16:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10952, "total_steps": 17941, "loss": 1.9378, "learning_rate": 3.39963752674505e-05, "epoch": 0.6104453486427736, "percentage": 61.04, "elapsed_time": "1 day, 1:55:31", "remaining_time": "16:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10953, "total_steps": 17941, "loss": 1.7007, "learning_rate": 3.398793970964098e-05, "epoch": 0.6105010868959366, "percentage": 61.05, "elapsed_time": "1 day, 1:55:39", "remaining_time": "16:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10954, "total_steps": 17941, "loss": 1.6816, "learning_rate": 3.397950465964065e-05, "epoch": 0.6105568251490998, "percentage": 61.06, "elapsed_time": "1 day, 1:55:48", "remaining_time": "16:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10955, "total_steps": 17941, "loss": 1.8814, "learning_rate": 3.3971070117717016e-05, "epoch": 0.610612563402263, "percentage": 61.06, "elapsed_time": "1 day, 1:55:56", "remaining_time": "16:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10956, "total_steps": 17941, "loss": 1.7222, "learning_rate": 3.39626360841376e-05, "epoch": 0.6106683016554261, "percentage": 61.07, "elapsed_time": "1 day, 1:56:05", "remaining_time": "16:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10957, "total_steps": 17941, "loss": 1.6526, "learning_rate": 3.395420255916986e-05, "epoch": 0.6107240399085893, "percentage": 61.07, "elapsed_time": "1 day, 1:56:13", "remaining_time": "16:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10958, "total_steps": 17941, "loss": 1.5243, "learning_rate": 3.3945769543081264e-05, "epoch": 0.6107797781617524, "percentage": 61.08, "elapsed_time": "1 day, 1:56:23", "remaining_time": "16:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10959, "total_steps": 17941, "loss": 1.6196, "learning_rate": 3.3937337036139236e-05, "epoch": 0.6108355164149155, "percentage": 61.08, "elapsed_time": "1 day, 1:56:31", "remaining_time": "16:31:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10960, "total_steps": 17941, "loss": 1.5272, "learning_rate": 3.392890503861124e-05, "epoch": 0.6108912546680787, "percentage": 61.09, "elapsed_time": "1 day, 1:56:39", "remaining_time": "16:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10961, "total_steps": 17941, "loss": 1.6407, "learning_rate": 3.3920473550764676e-05, "epoch": 0.6109469929212419, "percentage": 61.09, "elapsed_time": "1 day, 1:56:48", "remaining_time": "16:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10962, "total_steps": 17941, "loss": 1.618, "learning_rate": 3.3912042572866934e-05, "epoch": 0.611002731174405, "percentage": 61.1, "elapsed_time": "1 day, 1:56:57", "remaining_time": "16:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10963, "total_steps": 17941, "loss": 1.7345, "learning_rate": 3.390361210518542e-05, "epoch": 0.6110584694275681, "percentage": 61.11, "elapsed_time": "1 day, 1:57:05", "remaining_time": "16:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10964, "total_steps": 17941, "loss": 1.5911, "learning_rate": 3.389518214798746e-05, "epoch": 0.6111142076807313, "percentage": 61.11, "elapsed_time": "1 day, 1:57:13", "remaining_time": "16:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10965, "total_steps": 17941, "loss": 1.4994, "learning_rate": 3.388675270154045e-05, "epoch": 0.6111699459338944, "percentage": 61.12, "elapsed_time": "1 day, 1:57:22", "remaining_time": "16:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10966, "total_steps": 17941, "loss": 1.5398, "learning_rate": 3.3878323766111675e-05, "epoch": 0.6112256841870576, "percentage": 61.12, "elapsed_time": "1 day, 1:57:31", "remaining_time": "16:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10967, "total_steps": 17941, "loss": 1.501, "learning_rate": 3.3869895341968463e-05, "epoch": 0.6112814224402208, "percentage": 61.13, "elapsed_time": "1 day, 1:57:39", "remaining_time": "16:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10968, "total_steps": 17941, "loss": 1.5948, "learning_rate": 3.386146742937815e-05, "epoch": 0.6113371606933838, "percentage": 61.13, "elapsed_time": "1 day, 1:57:47", "remaining_time": "16:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10969, "total_steps": 17941, "loss": 1.5442, "learning_rate": 3.385304002860799e-05, "epoch": 0.611392898946547, "percentage": 61.14, "elapsed_time": "1 day, 1:57:56", "remaining_time": "16:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10970, "total_steps": 17941, "loss": 1.743, "learning_rate": 3.384461313992526e-05, "epoch": 0.6114486371997102, "percentage": 61.14, "elapsed_time": "1 day, 1:58:04", "remaining_time": "16:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10971, "total_steps": 17941, "loss": 1.8001, "learning_rate": 3.38361867635972e-05, "epoch": 0.6115043754528733, "percentage": 61.15, "elapsed_time": "1 day, 1:58:13", "remaining_time": "16:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10972, "total_steps": 17941, "loss": 1.8217, "learning_rate": 3.382776089989107e-05, "epoch": 0.6115601137060365, "percentage": 61.16, "elapsed_time": "1 day, 1:58:22", "remaining_time": "16:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10973, "total_steps": 17941, "loss": 1.5457, "learning_rate": 3.3819335549074064e-05, "epoch": 0.6116158519591997, "percentage": 61.16, "elapsed_time": "1 day, 1:58:31", "remaining_time": "16:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10974, "total_steps": 17941, "loss": 1.571, "learning_rate": 3.3810910711413376e-05, "epoch": 0.6116715902123627, "percentage": 61.17, "elapsed_time": "1 day, 1:58:39", "remaining_time": "16:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10975, "total_steps": 17941, "loss": 1.579, "learning_rate": 3.380248638717625e-05, "epoch": 0.6117273284655259, "percentage": 61.17, "elapsed_time": "1 day, 1:58:48", "remaining_time": "16:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10976, "total_steps": 17941, "loss": 1.5398, "learning_rate": 3.379406257662977e-05, "epoch": 0.611783066718689, "percentage": 61.18, "elapsed_time": "1 day, 1:58:57", "remaining_time": "16:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10977, "total_steps": 17941, "loss": 1.7963, "learning_rate": 3.378563928004118e-05, "epoch": 0.6118388049718522, "percentage": 61.18, "elapsed_time": "1 day, 1:59:05", "remaining_time": "16:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10978, "total_steps": 17941, "loss": 1.7298, "learning_rate": 3.377721649767755e-05, "epoch": 0.6118945432250154, "percentage": 61.19, "elapsed_time": "1 day, 1:59:14", "remaining_time": "16:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10979, "total_steps": 17941, "loss": 1.6033, "learning_rate": 3.376879422980605e-05, "epoch": 0.6119502814781784, "percentage": 61.2, "elapsed_time": "1 day, 1:59:23", "remaining_time": "16:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10980, "total_steps": 17941, "loss": 1.5339, "learning_rate": 3.3760372476693744e-05, "epoch": 0.6120060197313416, "percentage": 61.2, "elapsed_time": "1 day, 1:59:32", "remaining_time": "16:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10981, "total_steps": 17941, "loss": 1.4833, "learning_rate": 3.375195123860774e-05, "epoch": 0.6120617579845048, "percentage": 61.21, "elapsed_time": "1 day, 1:59:40", "remaining_time": "16:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10982, "total_steps": 17941, "loss": 1.7522, "learning_rate": 3.374353051581513e-05, "epoch": 0.6121174962376679, "percentage": 61.21, "elapsed_time": "1 day, 1:59:48", "remaining_time": "16:28:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10983, "total_steps": 17941, "loss": 1.7102, "learning_rate": 3.373511030858292e-05, "epoch": 0.612173234490831, "percentage": 61.22, "elapsed_time": "1 day, 1:59:57", "remaining_time": "16:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10984, "total_steps": 17941, "loss": 1.6045, "learning_rate": 3.372669061717821e-05, "epoch": 0.6122289727439942, "percentage": 61.22, "elapsed_time": "1 day, 2:00:06", "remaining_time": "16:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10985, "total_steps": 17941, "loss": 1.7434, "learning_rate": 3.3718271441867964e-05, "epoch": 0.6122847109971573, "percentage": 61.23, "elapsed_time": "1 day, 2:00:14", "remaining_time": "16:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10986, "total_steps": 17941, "loss": 1.5278, "learning_rate": 3.370985278291923e-05, "epoch": 0.6123404492503205, "percentage": 61.23, "elapsed_time": "1 day, 2:00:23", "remaining_time": "16:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10987, "total_steps": 17941, "loss": 1.4593, "learning_rate": 3.3701434640599e-05, "epoch": 0.6123961875034837, "percentage": 61.24, "elapsed_time": "1 day, 2:00:31", "remaining_time": "16:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10988, "total_steps": 17941, "loss": 1.616, "learning_rate": 3.369301701517422e-05, "epoch": 0.6124519257566468, "percentage": 61.25, "elapsed_time": "1 day, 2:00:39", "remaining_time": "16:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10989, "total_steps": 17941, "loss": 1.7739, "learning_rate": 3.3684599906911885e-05, "epoch": 0.6125076640098099, "percentage": 61.25, "elapsed_time": "1 day, 2:00:48", "remaining_time": "16:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10990, "total_steps": 17941, "loss": 1.7103, "learning_rate": 3.36761833160789e-05, "epoch": 0.6125634022629731, "percentage": 61.26, "elapsed_time": "1 day, 2:00:56", "remaining_time": "16:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10991, "total_steps": 17941, "loss": 1.6394, "learning_rate": 3.3667767242942215e-05, "epoch": 0.6126191405161362, "percentage": 61.26, "elapsed_time": "1 day, 2:01:05", "remaining_time": "16:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10992, "total_steps": 17941, "loss": 1.6211, "learning_rate": 3.3659351687768714e-05, "epoch": 0.6126748787692994, "percentage": 61.27, "elapsed_time": "1 day, 2:01:13", "remaining_time": "16:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10993, "total_steps": 17941, "loss": 1.9074, "learning_rate": 3.3650936650825305e-05, "epoch": 0.6127306170224626, "percentage": 61.27, "elapsed_time": "1 day, 2:01:22", "remaining_time": "16:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10994, "total_steps": 17941, "loss": 1.7556, "learning_rate": 3.364252213237887e-05, "epoch": 0.6127863552756256, "percentage": 61.28, "elapsed_time": "1 day, 2:01:30", "remaining_time": "16:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10995, "total_steps": 17941, "loss": 1.6704, "learning_rate": 3.363410813269627e-05, "epoch": 0.6128420935287888, "percentage": 61.28, "elapsed_time": "1 day, 2:01:39", "remaining_time": "16:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10996, "total_steps": 17941, "loss": 1.629, "learning_rate": 3.362569465204434e-05, "epoch": 0.612897831781952, "percentage": 61.29, "elapsed_time": "1 day, 2:01:48", "remaining_time": "16:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10997, "total_steps": 17941, "loss": 1.5543, "learning_rate": 3.361728169068989e-05, "epoch": 0.6129535700351151, "percentage": 61.3, "elapsed_time": "1 day, 2:01:56", "remaining_time": "16:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10998, "total_steps": 17941, "loss": 1.484, "learning_rate": 3.360886924889977e-05, "epoch": 0.6130093082882783, "percentage": 61.3, "elapsed_time": "1 day, 2:02:05", "remaining_time": "16:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10999, "total_steps": 17941, "loss": 1.5407, "learning_rate": 3.360045732694074e-05, "epoch": 0.6130650465414413, "percentage": 61.31, "elapsed_time": "1 day, 2:02:13", "remaining_time": "16:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11000, "total_steps": 17941, "loss": 1.801, "learning_rate": 3.3592045925079575e-05, "epoch": 0.6131207847946045, "percentage": 61.31, "elapsed_time": "1 day, 2:02:23", "remaining_time": "16:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11001, "total_steps": 17941, "loss": 1.7198, "learning_rate": 3.3583635043583075e-05, "epoch": 0.6131765230477677, "percentage": 61.32, "elapsed_time": "1 day, 2:02:31", "remaining_time": "16:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11002, "total_steps": 17941, "loss": 1.8192, "learning_rate": 3.357522468271793e-05, "epoch": 0.6132322613009308, "percentage": 61.32, "elapsed_time": "1 day, 2:02:40", "remaining_time": "16:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11003, "total_steps": 17941, "loss": 1.5158, "learning_rate": 3.356681484275091e-05, "epoch": 0.613287999554094, "percentage": 61.33, "elapsed_time": "1 day, 2:02:48", "remaining_time": "16:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11004, "total_steps": 17941, "loss": 1.5025, "learning_rate": 3.3558405523948703e-05, "epoch": 0.6133437378072571, "percentage": 61.33, "elapsed_time": "1 day, 2:02:56", "remaining_time": "16:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11005, "total_steps": 17941, "loss": 1.4258, "learning_rate": 3.354999672657802e-05, "epoch": 0.6133994760604202, "percentage": 61.34, "elapsed_time": "1 day, 2:03:05", "remaining_time": "16:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11006, "total_steps": 17941, "loss": 1.5761, "learning_rate": 3.354158845090553e-05, "epoch": 0.6134552143135834, "percentage": 61.35, "elapsed_time": "1 day, 2:03:13", "remaining_time": "16:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11007, "total_steps": 17941, "loss": 1.8187, "learning_rate": 3.3533180697197886e-05, "epoch": 0.6135109525667466, "percentage": 61.35, "elapsed_time": "1 day, 2:03:22", "remaining_time": "16:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11008, "total_steps": 17941, "loss": 1.655, "learning_rate": 3.352477346572176e-05, "epoch": 0.6135666908199097, "percentage": 61.36, "elapsed_time": "1 day, 2:03:31", "remaining_time": "16:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11009, "total_steps": 17941, "loss": 1.7595, "learning_rate": 3.351636675674373e-05, "epoch": 0.6136224290730729, "percentage": 61.36, "elapsed_time": "1 day, 2:03:39", "remaining_time": "16:24:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11010, "total_steps": 17941, "loss": 1.7159, "learning_rate": 3.350796057053048e-05, "epoch": 0.613678167326236, "percentage": 61.37, "elapsed_time": "1 day, 2:03:47", "remaining_time": "16:24:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11011, "total_steps": 17941, "loss": 1.6548, "learning_rate": 3.349955490734854e-05, "epoch": 0.6137339055793991, "percentage": 61.37, "elapsed_time": "1 day, 2:03:56", "remaining_time": "16:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11012, "total_steps": 17941, "loss": 1.6303, "learning_rate": 3.349114976746451e-05, "epoch": 0.6137896438325623, "percentage": 61.38, "elapsed_time": "1 day, 2:04:05", "remaining_time": "16:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11013, "total_steps": 17941, "loss": 1.6347, "learning_rate": 3.348274515114498e-05, "epoch": 0.6138453820857255, "percentage": 61.38, "elapsed_time": "1 day, 2:04:13", "remaining_time": "16:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11014, "total_steps": 17941, "loss": 1.3515, "learning_rate": 3.3474341058656453e-05, "epoch": 0.6139011203388886, "percentage": 61.39, "elapsed_time": "1 day, 2:04:22", "remaining_time": "16:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11015, "total_steps": 17941, "loss": 1.8692, "learning_rate": 3.346593749026549e-05, "epoch": 0.6139568585920517, "percentage": 61.4, "elapsed_time": "1 day, 2:04:30", "remaining_time": "16:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11016, "total_steps": 17941, "loss": 1.6248, "learning_rate": 3.345753444623858e-05, "epoch": 0.6140125968452149, "percentage": 61.4, "elapsed_time": "1 day, 2:04:39", "remaining_time": "16:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11017, "total_steps": 17941, "loss": 1.6746, "learning_rate": 3.344913192684224e-05, "epoch": 0.614068335098378, "percentage": 61.41, "elapsed_time": "1 day, 2:04:47", "remaining_time": "16:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11018, "total_steps": 17941, "loss": 1.6177, "learning_rate": 3.344072993234292e-05, "epoch": 0.6141240733515412, "percentage": 61.41, "elapsed_time": "1 day, 2:04:56", "remaining_time": "16:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11019, "total_steps": 17941, "loss": 1.6588, "learning_rate": 3.343232846300709e-05, "epoch": 0.6141798116047044, "percentage": 61.42, "elapsed_time": "1 day, 2:05:05", "remaining_time": "16:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11020, "total_steps": 17941, "loss": 1.257, "learning_rate": 3.3423927519101225e-05, "epoch": 0.6142355498578674, "percentage": 61.42, "elapsed_time": "1 day, 2:05:13", "remaining_time": "16:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11021, "total_steps": 17941, "loss": 1.5108, "learning_rate": 3.3415527100891734e-05, "epoch": 0.6142912881110306, "percentage": 61.43, "elapsed_time": "1 day, 2:05:22", "remaining_time": "16:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11022, "total_steps": 17941, "loss": 1.8459, "learning_rate": 3.3407127208645026e-05, "epoch": 0.6143470263641937, "percentage": 61.43, "elapsed_time": "1 day, 2:05:30", "remaining_time": "16:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11023, "total_steps": 17941, "loss": 1.9795, "learning_rate": 3.33987278426275e-05, "epoch": 0.6144027646173569, "percentage": 61.44, "elapsed_time": "1 day, 2:05:39", "remaining_time": "16:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11024, "total_steps": 17941, "loss": 1.5239, "learning_rate": 3.339032900310554e-05, "epoch": 0.6144585028705201, "percentage": 61.45, "elapsed_time": "1 day, 2:05:47", "remaining_time": "16:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11025, "total_steps": 17941, "loss": 2.0899, "learning_rate": 3.338193069034549e-05, "epoch": 0.6145142411236831, "percentage": 61.45, "elapsed_time": "1 day, 2:05:56", "remaining_time": "16:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11026, "total_steps": 17941, "loss": 1.7312, "learning_rate": 3.33735329046137e-05, "epoch": 0.6145699793768463, "percentage": 61.46, "elapsed_time": "1 day, 2:06:04", "remaining_time": "16:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11027, "total_steps": 17941, "loss": 1.5185, "learning_rate": 3.336513564617654e-05, "epoch": 0.6146257176300095, "percentage": 61.46, "elapsed_time": "1 day, 2:06:13", "remaining_time": "16:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11028, "total_steps": 17941, "loss": 1.8831, "learning_rate": 3.3356738915300255e-05, "epoch": 0.6146814558831726, "percentage": 61.47, "elapsed_time": "1 day, 2:06:21", "remaining_time": "16:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11029, "total_steps": 17941, "loss": 1.7854, "learning_rate": 3.33483427122512e-05, "epoch": 0.6147371941363358, "percentage": 61.47, "elapsed_time": "1 day, 2:06:30", "remaining_time": "16:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11030, "total_steps": 17941, "loss": 1.5749, "learning_rate": 3.333994703729562e-05, "epoch": 0.614792932389499, "percentage": 61.48, "elapsed_time": "1 day, 2:06:38", "remaining_time": "16:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11031, "total_steps": 17941, "loss": 1.7339, "learning_rate": 3.333155189069978e-05, "epoch": 0.614848670642662, "percentage": 61.48, "elapsed_time": "1 day, 2:06:47", "remaining_time": "16:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11032, "total_steps": 17941, "loss": 1.6177, "learning_rate": 3.332315727272994e-05, "epoch": 0.6149044088958252, "percentage": 61.49, "elapsed_time": "1 day, 2:06:55", "remaining_time": "16:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11033, "total_steps": 17941, "loss": 1.8444, "learning_rate": 3.331476318365231e-05, "epoch": 0.6149601471489884, "percentage": 61.5, "elapsed_time": "1 day, 2:07:04", "remaining_time": "16:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11034, "total_steps": 17941, "loss": 1.5832, "learning_rate": 3.330636962373312e-05, "epoch": 0.6150158854021515, "percentage": 61.5, "elapsed_time": "1 day, 2:07:12", "remaining_time": "16:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11035, "total_steps": 17941, "loss": 1.7523, "learning_rate": 3.329797659323853e-05, "epoch": 0.6150716236553146, "percentage": 61.51, "elapsed_time": "1 day, 2:07:21", "remaining_time": "16:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11036, "total_steps": 17941, "loss": 1.5468, "learning_rate": 3.3289584092434785e-05, "epoch": 0.6151273619084778, "percentage": 61.51, "elapsed_time": "1 day, 2:07:29", "remaining_time": "16:20:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11037, "total_steps": 17941, "loss": 1.6177, "learning_rate": 3.328119212158797e-05, "epoch": 0.6151831001616409, "percentage": 61.52, "elapsed_time": "1 day, 2:07:38", "remaining_time": "16:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11038, "total_steps": 17941, "loss": 1.585, "learning_rate": 3.327280068096429e-05, "epoch": 0.6152388384148041, "percentage": 61.52, "elapsed_time": "1 day, 2:07:46", "remaining_time": "16:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11039, "total_steps": 17941, "loss": 1.5652, "learning_rate": 3.326440977082981e-05, "epoch": 0.6152945766679673, "percentage": 61.53, "elapsed_time": "1 day, 2:07:55", "remaining_time": "16:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11040, "total_steps": 17941, "loss": 1.6, "learning_rate": 3.325601939145069e-05, "epoch": 0.6153503149211303, "percentage": 61.54, "elapsed_time": "1 day, 2:08:03", "remaining_time": "16:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11041, "total_steps": 17941, "loss": 1.7046, "learning_rate": 3.3247629543093025e-05, "epoch": 0.6154060531742935, "percentage": 61.54, "elapsed_time": "1 day, 2:08:12", "remaining_time": "16:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11042, "total_steps": 17941, "loss": 1.7124, "learning_rate": 3.323924022602287e-05, "epoch": 0.6154617914274567, "percentage": 61.55, "elapsed_time": "1 day, 2:08:20", "remaining_time": "16:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11043, "total_steps": 17941, "loss": 1.4437, "learning_rate": 3.32308514405063e-05, "epoch": 0.6155175296806198, "percentage": 61.55, "elapsed_time": "1 day, 2:08:29", "remaining_time": "16:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11044, "total_steps": 17941, "loss": 1.809, "learning_rate": 3.322246318680934e-05, "epoch": 0.615573267933783, "percentage": 61.56, "elapsed_time": "1 day, 2:08:37", "remaining_time": "16:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11045, "total_steps": 17941, "loss": 1.6689, "learning_rate": 3.321407546519802e-05, "epoch": 0.615629006186946, "percentage": 61.56, "elapsed_time": "1 day, 2:08:46", "remaining_time": "16:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11046, "total_steps": 17941, "loss": 1.7449, "learning_rate": 3.320568827593837e-05, "epoch": 0.6156847444401092, "percentage": 61.57, "elapsed_time": "1 day, 2:08:54", "remaining_time": "16:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11047, "total_steps": 17941, "loss": 1.6372, "learning_rate": 3.319730161929637e-05, "epoch": 0.6157404826932724, "percentage": 61.57, "elapsed_time": "1 day, 2:09:03", "remaining_time": "16:19:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11048, "total_steps": 17941, "loss": 1.6837, "learning_rate": 3.318891549553801e-05, "epoch": 0.6157962209464355, "percentage": 61.58, "elapsed_time": "1 day, 2:09:11", "remaining_time": "16:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11049, "total_steps": 17941, "loss": 1.7888, "learning_rate": 3.318052990492921e-05, "epoch": 0.6158519591995987, "percentage": 61.59, "elapsed_time": "1 day, 2:09:20", "remaining_time": "16:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11050, "total_steps": 17941, "loss": 1.6178, "learning_rate": 3.317214484773596e-05, "epoch": 0.6159076974527619, "percentage": 61.59, "elapsed_time": "1 day, 2:09:28", "remaining_time": "16:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11051, "total_steps": 17941, "loss": 1.9799, "learning_rate": 3.316376032422415e-05, "epoch": 0.6159634357059249, "percentage": 61.6, "elapsed_time": "1 day, 2:09:37", "remaining_time": "16:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11052, "total_steps": 17941, "loss": 1.7318, "learning_rate": 3.315537633465968e-05, "epoch": 0.6160191739590881, "percentage": 61.6, "elapsed_time": "1 day, 2:09:45", "remaining_time": "16:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11053, "total_steps": 17941, "loss": 1.2948, "learning_rate": 3.3146992879308505e-05, "epoch": 0.6160749122122513, "percentage": 61.61, "elapsed_time": "1 day, 2:09:54", "remaining_time": "16:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11054, "total_steps": 17941, "loss": 1.7205, "learning_rate": 3.3138609958436414e-05, "epoch": 0.6161306504654144, "percentage": 61.61, "elapsed_time": "1 day, 2:10:02", "remaining_time": "16:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11055, "total_steps": 17941, "loss": 1.4926, "learning_rate": 3.3130227572309334e-05, "epoch": 0.6161863887185776, "percentage": 61.62, "elapsed_time": "1 day, 2:10:11", "remaining_time": "16:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11056, "total_steps": 17941, "loss": 1.5604, "learning_rate": 3.3121845721193065e-05, "epoch": 0.6162421269717407, "percentage": 61.62, "elapsed_time": "1 day, 2:10:19", "remaining_time": "16:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11057, "total_steps": 17941, "loss": 1.737, "learning_rate": 3.311346440535346e-05, "epoch": 0.6162978652249038, "percentage": 61.63, "elapsed_time": "1 day, 2:10:28", "remaining_time": "16:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11058, "total_steps": 17941, "loss": 1.2615, "learning_rate": 3.31050836250563e-05, "epoch": 0.616353603478067, "percentage": 61.64, "elapsed_time": "1 day, 2:10:36", "remaining_time": "16:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11059, "total_steps": 17941, "loss": 1.6531, "learning_rate": 3.3096703380567376e-05, "epoch": 0.6164093417312302, "percentage": 61.64, "elapsed_time": "1 day, 2:10:45", "remaining_time": "16:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11060, "total_steps": 17941, "loss": 1.7572, "learning_rate": 3.3088323672152474e-05, "epoch": 0.6164650799843933, "percentage": 61.65, "elapsed_time": "1 day, 2:10:53", "remaining_time": "16:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11061, "total_steps": 17941, "loss": 1.7705, "learning_rate": 3.307994450007733e-05, "epoch": 0.6165208182375564, "percentage": 61.65, "elapsed_time": "1 day, 2:11:02", "remaining_time": "16:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11062, "total_steps": 17941, "loss": 1.7726, "learning_rate": 3.3071565864607723e-05, "epoch": 0.6165765564907196, "percentage": 61.66, "elapsed_time": "1 day, 2:11:10", "remaining_time": "16:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11063, "total_steps": 17941, "loss": 1.4762, "learning_rate": 3.3063187766009316e-05, "epoch": 0.6166322947438827, "percentage": 61.66, "elapsed_time": "1 day, 2:11:19", "remaining_time": "16:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11064, "total_steps": 17941, "loss": 1.7204, "learning_rate": 3.305481020454787e-05, "epoch": 0.6166880329970459, "percentage": 61.67, "elapsed_time": "1 day, 2:11:27", "remaining_time": "16:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11065, "total_steps": 17941, "loss": 1.5623, "learning_rate": 3.304643318048903e-05, "epoch": 0.6167437712502091, "percentage": 61.67, "elapsed_time": "1 day, 2:11:36", "remaining_time": "16:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11066, "total_steps": 17941, "loss": 1.7162, "learning_rate": 3.303805669409848e-05, "epoch": 0.6167995095033721, "percentage": 61.68, "elapsed_time": "1 day, 2:11:45", "remaining_time": "16:16:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11067, "total_steps": 17941, "loss": 1.666, "learning_rate": 3.30296807456419e-05, "epoch": 0.6168552477565353, "percentage": 61.69, "elapsed_time": "1 day, 2:11:53", "remaining_time": "16:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11068, "total_steps": 17941, "loss": 1.3855, "learning_rate": 3.3021305335384886e-05, "epoch": 0.6169109860096984, "percentage": 61.69, "elapsed_time": "1 day, 2:12:01", "remaining_time": "16:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11069, "total_steps": 17941, "loss": 1.8732, "learning_rate": 3.3012930463593084e-05, "epoch": 0.6169667242628616, "percentage": 61.7, "elapsed_time": "1 day, 2:12:10", "remaining_time": "16:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11070, "total_steps": 17941, "loss": 1.5905, "learning_rate": 3.300455613053207e-05, "epoch": 0.6170224625160248, "percentage": 61.7, "elapsed_time": "1 day, 2:12:19", "remaining_time": "16:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11071, "total_steps": 17941, "loss": 1.5319, "learning_rate": 3.299618233646745e-05, "epoch": 0.6170782007691878, "percentage": 61.71, "elapsed_time": "1 day, 2:12:27", "remaining_time": "16:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11072, "total_steps": 17941, "loss": 1.7873, "learning_rate": 3.29878090816648e-05, "epoch": 0.617133939022351, "percentage": 61.71, "elapsed_time": "1 day, 2:12:36", "remaining_time": "16:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11073, "total_steps": 17941, "loss": 1.8069, "learning_rate": 3.297943636638965e-05, "epoch": 0.6171896772755142, "percentage": 61.72, "elapsed_time": "1 day, 2:12:44", "remaining_time": "16:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11074, "total_steps": 17941, "loss": 1.3797, "learning_rate": 3.297106419090754e-05, "epoch": 0.6172454155286773, "percentage": 61.72, "elapsed_time": "1 day, 2:12:53", "remaining_time": "16:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11075, "total_steps": 17941, "loss": 1.8426, "learning_rate": 3.296269255548399e-05, "epoch": 0.6173011537818405, "percentage": 61.73, "elapsed_time": "1 day, 2:13:01", "remaining_time": "16:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11076, "total_steps": 17941, "loss": 1.5177, "learning_rate": 3.2954321460384506e-05, "epoch": 0.6173568920350037, "percentage": 61.74, "elapsed_time": "1 day, 2:13:09", "remaining_time": "16:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11077, "total_steps": 17941, "loss": 1.641, "learning_rate": 3.294595090587455e-05, "epoch": 0.6174126302881667, "percentage": 61.74, "elapsed_time": "1 day, 2:13:18", "remaining_time": "16:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11078, "total_steps": 17941, "loss": 1.6019, "learning_rate": 3.293758089221959e-05, "epoch": 0.6174683685413299, "percentage": 61.75, "elapsed_time": "1 day, 2:13:26", "remaining_time": "16:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11079, "total_steps": 17941, "loss": 1.5064, "learning_rate": 3.292921141968511e-05, "epoch": 0.6175241067944931, "percentage": 61.75, "elapsed_time": "1 day, 2:13:35", "remaining_time": "16:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11080, "total_steps": 17941, "loss": 1.7632, "learning_rate": 3.292084248853649e-05, "epoch": 0.6175798450476562, "percentage": 61.76, "elapsed_time": "1 day, 2:13:44", "remaining_time": "16:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11081, "total_steps": 17941, "loss": 1.5724, "learning_rate": 3.291247409903919e-05, "epoch": 0.6176355833008194, "percentage": 61.76, "elapsed_time": "1 day, 2:13:52", "remaining_time": "16:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11082, "total_steps": 17941, "loss": 1.8628, "learning_rate": 3.290410625145857e-05, "epoch": 0.6176913215539825, "percentage": 61.77, "elapsed_time": "1 day, 2:14:00", "remaining_time": "16:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11083, "total_steps": 17941, "loss": 1.5649, "learning_rate": 3.289573894606003e-05, "epoch": 0.6177470598071456, "percentage": 61.77, "elapsed_time": "1 day, 2:14:09", "remaining_time": "16:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11084, "total_steps": 17941, "loss": 1.5843, "learning_rate": 3.288737218310892e-05, "epoch": 0.6178027980603088, "percentage": 61.78, "elapsed_time": "1 day, 2:14:17", "remaining_time": "16:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11085, "total_steps": 17941, "loss": 1.6214, "learning_rate": 3.287900596287059e-05, "epoch": 0.617858536313472, "percentage": 61.79, "elapsed_time": "1 day, 2:14:26", "remaining_time": "16:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11086, "total_steps": 17941, "loss": 1.9879, "learning_rate": 3.2870640285610375e-05, "epoch": 0.6179142745666351, "percentage": 61.79, "elapsed_time": "1 day, 2:14:34", "remaining_time": "16:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11087, "total_steps": 17941, "loss": 1.6907, "learning_rate": 3.286227515159357e-05, "epoch": 0.6179700128197982, "percentage": 61.8, "elapsed_time": "1 day, 2:14:43", "remaining_time": "16:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11088, "total_steps": 17941, "loss": 1.7293, "learning_rate": 3.28539105610855e-05, "epoch": 0.6180257510729614, "percentage": 61.8, "elapsed_time": "1 day, 2:14:51", "remaining_time": "16:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11089, "total_steps": 17941, "loss": 1.7966, "learning_rate": 3.284554651435138e-05, "epoch": 0.6180814893261245, "percentage": 61.81, "elapsed_time": "1 day, 2:15:00", "remaining_time": "16:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11090, "total_steps": 17941, "loss": 1.7938, "learning_rate": 3.2837183011656533e-05, "epoch": 0.6181372275792877, "percentage": 61.81, "elapsed_time": "1 day, 2:15:08", "remaining_time": "16:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11091, "total_steps": 17941, "loss": 1.6818, "learning_rate": 3.2828820053266176e-05, "epoch": 0.6181929658324508, "percentage": 61.82, "elapsed_time": "1 day, 2:15:17", "remaining_time": "16:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11092, "total_steps": 17941, "loss": 1.7102, "learning_rate": 3.2820457639445525e-05, "epoch": 0.6182487040856139, "percentage": 61.82, "elapsed_time": "1 day, 2:15:26", "remaining_time": "16:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11093, "total_steps": 17941, "loss": 1.7051, "learning_rate": 3.28120957704598e-05, "epoch": 0.6183044423387771, "percentage": 61.83, "elapsed_time": "1 day, 2:15:35", "remaining_time": "16:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11094, "total_steps": 17941, "loss": 1.6841, "learning_rate": 3.280373444657417e-05, "epoch": 0.6183601805919402, "percentage": 61.84, "elapsed_time": "1 day, 2:15:43", "remaining_time": "16:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11095, "total_steps": 17941, "loss": 2.0282, "learning_rate": 3.279537366805384e-05, "epoch": 0.6184159188451034, "percentage": 61.84, "elapsed_time": "1 day, 2:15:52", "remaining_time": "16:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11096, "total_steps": 17941, "loss": 1.6552, "learning_rate": 3.278701343516393e-05, "epoch": 0.6184716570982666, "percentage": 61.85, "elapsed_time": "1 day, 2:16:01", "remaining_time": "16:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11097, "total_steps": 17941, "loss": 1.7273, "learning_rate": 3.27786537481696e-05, "epoch": 0.6185273953514296, "percentage": 61.85, "elapsed_time": "1 day, 2:16:10", "remaining_time": "16:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11098, "total_steps": 17941, "loss": 1.6164, "learning_rate": 3.277029460733598e-05, "epoch": 0.6185831336045928, "percentage": 61.86, "elapsed_time": "1 day, 2:16:18", "remaining_time": "16:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11099, "total_steps": 17941, "loss": 1.9246, "learning_rate": 3.276193601292815e-05, "epoch": 0.618638871857756, "percentage": 61.86, "elapsed_time": "1 day, 2:16:26", "remaining_time": "16:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11100, "total_steps": 17941, "loss": 1.5328, "learning_rate": 3.275357796521121e-05, "epoch": 0.6186946101109191, "percentage": 61.87, "elapsed_time": "1 day, 2:16:35", "remaining_time": "16:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11101, "total_steps": 17941, "loss": 1.7782, "learning_rate": 3.274522046445021e-05, "epoch": 0.6187503483640823, "percentage": 61.88, "elapsed_time": "1 day, 2:16:43", "remaining_time": "16:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11102, "total_steps": 17941, "loss": 1.5018, "learning_rate": 3.273686351091023e-05, "epoch": 0.6188060866172455, "percentage": 61.88, "elapsed_time": "1 day, 2:16:52", "remaining_time": "16:11:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11103, "total_steps": 17941, "loss": 1.6596, "learning_rate": 3.272850710485628e-05, "epoch": 0.6188618248704085, "percentage": 61.89, "elapsed_time": "1 day, 2:17:01", "remaining_time": "16:11:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11104, "total_steps": 17941, "loss": 1.4884, "learning_rate": 3.2720151246553366e-05, "epoch": 0.6189175631235717, "percentage": 61.89, "elapsed_time": "1 day, 2:17:09", "remaining_time": "16:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11105, "total_steps": 17941, "loss": 1.5642, "learning_rate": 3.271179593626654e-05, "epoch": 0.6189733013767349, "percentage": 61.9, "elapsed_time": "1 day, 2:17:18", "remaining_time": "16:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11106, "total_steps": 17941, "loss": 1.7674, "learning_rate": 3.270344117426073e-05, "epoch": 0.619029039629898, "percentage": 61.9, "elapsed_time": "1 day, 2:17:27", "remaining_time": "16:10:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11107, "total_steps": 17941, "loss": 1.5923, "learning_rate": 3.269508696080093e-05, "epoch": 0.6190847778830612, "percentage": 61.91, "elapsed_time": "1 day, 2:17:35", "remaining_time": "16:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11108, "total_steps": 17941, "loss": 1.5301, "learning_rate": 3.268673329615207e-05, "epoch": 0.6191405161362243, "percentage": 61.91, "elapsed_time": "1 day, 2:17:44", "remaining_time": "16:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11109, "total_steps": 17941, "loss": 1.5344, "learning_rate": 3.267838018057909e-05, "epoch": 0.6191962543893874, "percentage": 61.92, "elapsed_time": "1 day, 2:17:53", "remaining_time": "16:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11110, "total_steps": 17941, "loss": 1.8432, "learning_rate": 3.2670027614346896e-05, "epoch": 0.6192519926425506, "percentage": 61.93, "elapsed_time": "1 day, 2:18:02", "remaining_time": "16:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11111, "total_steps": 17941, "loss": 1.6279, "learning_rate": 3.2661675597720384e-05, "epoch": 0.6193077308957138, "percentage": 61.93, "elapsed_time": "1 day, 2:18:11", "remaining_time": "16:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11112, "total_steps": 17941, "loss": 1.5426, "learning_rate": 3.265332413096444e-05, "epoch": 0.6193634691488769, "percentage": 61.94, "elapsed_time": "1 day, 2:18:19", "remaining_time": "16:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11113, "total_steps": 17941, "loss": 1.709, "learning_rate": 3.26449732143439e-05, "epoch": 0.61941920740204, "percentage": 61.94, "elapsed_time": "1 day, 2:18:28", "remaining_time": "16:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11114, "total_steps": 17941, "loss": 1.6154, "learning_rate": 3.263662284812365e-05, "epoch": 0.6194749456552031, "percentage": 61.95, "elapsed_time": "1 day, 2:18:37", "remaining_time": "16:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11115, "total_steps": 17941, "loss": 1.4069, "learning_rate": 3.262827303256846e-05, "epoch": 0.6195306839083663, "percentage": 61.95, "elapsed_time": "1 day, 2:18:45", "remaining_time": "16:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11116, "total_steps": 17941, "loss": 1.6916, "learning_rate": 3.261992376794318e-05, "epoch": 0.6195864221615295, "percentage": 61.96, "elapsed_time": "1 day, 2:18:54", "remaining_time": "16:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11117, "total_steps": 17941, "loss": 1.829, "learning_rate": 3.2611575054512584e-05, "epoch": 0.6196421604146926, "percentage": 61.96, "elapsed_time": "1 day, 2:19:02", "remaining_time": "16:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11118, "total_steps": 17941, "loss": 1.4311, "learning_rate": 3.2603226892541437e-05, "epoch": 0.6196978986678557, "percentage": 61.97, "elapsed_time": "1 day, 2:19:11", "remaining_time": "16:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11119, "total_steps": 17941, "loss": 1.7092, "learning_rate": 3.2594879282294524e-05, "epoch": 0.6197536369210189, "percentage": 61.98, "elapsed_time": "1 day, 2:19:19", "remaining_time": "16:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11120, "total_steps": 17941, "loss": 1.5921, "learning_rate": 3.258653222403654e-05, "epoch": 0.619809375174182, "percentage": 61.98, "elapsed_time": "1 day, 2:19:28", "remaining_time": "16:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11121, "total_steps": 17941, "loss": 1.6191, "learning_rate": 3.257818571803224e-05, "epoch": 0.6198651134273452, "percentage": 61.99, "elapsed_time": "1 day, 2:19:36", "remaining_time": "16:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11122, "total_steps": 17941, "loss": 1.3492, "learning_rate": 3.25698397645463e-05, "epoch": 0.6199208516805084, "percentage": 61.99, "elapsed_time": "1 day, 2:19:45", "remaining_time": "16:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11123, "total_steps": 17941, "loss": 1.7222, "learning_rate": 3.2561494363843416e-05, "epoch": 0.6199765899336714, "percentage": 62.0, "elapsed_time": "1 day, 2:19:53", "remaining_time": "16:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11124, "total_steps": 17941, "loss": 1.5677, "learning_rate": 3.255314951618827e-05, "epoch": 0.6200323281868346, "percentage": 62.0, "elapsed_time": "1 day, 2:20:02", "remaining_time": "16:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11125, "total_steps": 17941, "loss": 1.4315, "learning_rate": 3.2544805221845485e-05, "epoch": 0.6200880664399978, "percentage": 62.01, "elapsed_time": "1 day, 2:20:11", "remaining_time": "16:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11126, "total_steps": 17941, "loss": 1.4994, "learning_rate": 3.253646148107973e-05, "epoch": 0.6201438046931609, "percentage": 62.01, "elapsed_time": "1 day, 2:20:20", "remaining_time": "16:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11127, "total_steps": 17941, "loss": 1.4227, "learning_rate": 3.2528118294155576e-05, "epoch": 0.6201995429463241, "percentage": 62.02, "elapsed_time": "1 day, 2:20:29", "remaining_time": "16:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11128, "total_steps": 17941, "loss": 1.8407, "learning_rate": 3.251977566133766e-05, "epoch": 0.6202552811994873, "percentage": 62.03, "elapsed_time": "1 day, 2:20:37", "remaining_time": "16:07:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11129, "total_steps": 17941, "loss": 1.8582, "learning_rate": 3.251143358289053e-05, "epoch": 0.6203110194526503, "percentage": 62.03, "elapsed_time": "1 day, 2:20:46", "remaining_time": "16:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11130, "total_steps": 17941, "loss": 1.6491, "learning_rate": 3.2503092059078754e-05, "epoch": 0.6203667577058135, "percentage": 62.04, "elapsed_time": "1 day, 2:20:54", "remaining_time": "16:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11131, "total_steps": 17941, "loss": 1.6451, "learning_rate": 3.2494751090166907e-05, "epoch": 0.6204224959589767, "percentage": 62.04, "elapsed_time": "1 day, 2:21:03", "remaining_time": "16:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11132, "total_steps": 17941, "loss": 1.563, "learning_rate": 3.2486410676419467e-05, "epoch": 0.6204782342121398, "percentage": 62.05, "elapsed_time": "1 day, 2:21:12", "remaining_time": "16:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11133, "total_steps": 17941, "loss": 1.7636, "learning_rate": 3.247807081810099e-05, "epoch": 0.620533972465303, "percentage": 62.05, "elapsed_time": "1 day, 2:21:20", "remaining_time": "16:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11134, "total_steps": 17941, "loss": 1.6853, "learning_rate": 3.246973151547594e-05, "epoch": 0.6205897107184661, "percentage": 62.06, "elapsed_time": "1 day, 2:21:28", "remaining_time": "16:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11135, "total_steps": 17941, "loss": 1.7606, "learning_rate": 3.2461392768808796e-05, "epoch": 0.6206454489716292, "percentage": 62.06, "elapsed_time": "1 day, 2:21:37", "remaining_time": "16:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11136, "total_steps": 17941, "loss": 1.6584, "learning_rate": 3.245305457836402e-05, "epoch": 0.6207011872247924, "percentage": 62.07, "elapsed_time": "1 day, 2:21:45", "remaining_time": "16:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11137, "total_steps": 17941, "loss": 1.6822, "learning_rate": 3.244471694440604e-05, "epoch": 0.6207569254779555, "percentage": 62.08, "elapsed_time": "1 day, 2:21:54", "remaining_time": "16:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11138, "total_steps": 17941, "loss": 1.7112, "learning_rate": 3.243637986719929e-05, "epoch": 0.6208126637311187, "percentage": 62.08, "elapsed_time": "1 day, 2:22:03", "remaining_time": "16:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11139, "total_steps": 17941, "loss": 1.731, "learning_rate": 3.2428043347008154e-05, "epoch": 0.6208684019842818, "percentage": 62.09, "elapsed_time": "1 day, 2:22:12", "remaining_time": "16:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11140, "total_steps": 17941, "loss": 1.6321, "learning_rate": 3.241970738409707e-05, "epoch": 0.6209241402374449, "percentage": 62.09, "elapsed_time": "1 day, 2:22:20", "remaining_time": "16:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11141, "total_steps": 17941, "loss": 1.5864, "learning_rate": 3.241137197873032e-05, "epoch": 0.6209798784906081, "percentage": 62.1, "elapsed_time": "1 day, 2:22:29", "remaining_time": "16:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11142, "total_steps": 17941, "loss": 1.8697, "learning_rate": 3.2403037131172324e-05, "epoch": 0.6210356167437713, "percentage": 62.1, "elapsed_time": "1 day, 2:22:38", "remaining_time": "16:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11143, "total_steps": 17941, "loss": 1.7243, "learning_rate": 3.239470284168739e-05, "epoch": 0.6210913549969344, "percentage": 62.11, "elapsed_time": "1 day, 2:22:46", "remaining_time": "16:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11144, "total_steps": 17941, "loss": 1.953, "learning_rate": 3.238636911053984e-05, "epoch": 0.6211470932500975, "percentage": 62.11, "elapsed_time": "1 day, 2:22:55", "remaining_time": "16:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11145, "total_steps": 17941, "loss": 1.7371, "learning_rate": 3.237803593799397e-05, "epoch": 0.6212028315032607, "percentage": 62.12, "elapsed_time": "1 day, 2:23:03", "remaining_time": "16:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11146, "total_steps": 17941, "loss": 1.6465, "learning_rate": 3.2369703324314046e-05, "epoch": 0.6212585697564238, "percentage": 62.13, "elapsed_time": "1 day, 2:23:12", "remaining_time": "16:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11147, "total_steps": 17941, "loss": 1.7146, "learning_rate": 3.236137126976435e-05, "epoch": 0.621314308009587, "percentage": 62.13, "elapsed_time": "1 day, 2:23:20", "remaining_time": "16:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11148, "total_steps": 17941, "loss": 1.8071, "learning_rate": 3.23530397746091e-05, "epoch": 0.6213700462627502, "percentage": 62.14, "elapsed_time": "1 day, 2:23:29", "remaining_time": "16:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11149, "total_steps": 17941, "loss": 1.6476, "learning_rate": 3.234470883911255e-05, "epoch": 0.6214257845159132, "percentage": 62.14, "elapsed_time": "1 day, 2:23:37", "remaining_time": "16:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11150, "total_steps": 17941, "loss": 1.7425, "learning_rate": 3.2336378463538907e-05, "epoch": 0.6214815227690764, "percentage": 62.15, "elapsed_time": "1 day, 2:23:46", "remaining_time": "16:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11151, "total_steps": 17941, "loss": 1.5382, "learning_rate": 3.232804864815234e-05, "epoch": 0.6215372610222396, "percentage": 62.15, "elapsed_time": "1 day, 2:23:54", "remaining_time": "16:04:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11152, "total_steps": 17941, "loss": 1.5486, "learning_rate": 3.2319719393217055e-05, "epoch": 0.6215929992754027, "percentage": 62.16, "elapsed_time": "1 day, 2:24:03", "remaining_time": "16:04:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11153, "total_steps": 17941, "loss": 1.8761, "learning_rate": 3.231139069899717e-05, "epoch": 0.6216487375285659, "percentage": 62.16, "elapsed_time": "1 day, 2:24:11", "remaining_time": "16:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11154, "total_steps": 17941, "loss": 1.8006, "learning_rate": 3.230306256575685e-05, "epoch": 0.621704475781729, "percentage": 62.17, "elapsed_time": "1 day, 2:24:20", "remaining_time": "16:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11155, "total_steps": 17941, "loss": 1.681, "learning_rate": 3.2294734993760196e-05, "epoch": 0.6217602140348921, "percentage": 62.18, "elapsed_time": "1 day, 2:24:28", "remaining_time": "16:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11156, "total_steps": 17941, "loss": 1.6012, "learning_rate": 3.228640798327131e-05, "epoch": 0.6218159522880553, "percentage": 62.18, "elapsed_time": "1 day, 2:24:37", "remaining_time": "16:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11157, "total_steps": 17941, "loss": 1.8304, "learning_rate": 3.227808153455431e-05, "epoch": 0.6218716905412185, "percentage": 62.19, "elapsed_time": "1 day, 2:24:45", "remaining_time": "16:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11158, "total_steps": 17941, "loss": 1.699, "learning_rate": 3.226975564787322e-05, "epoch": 0.6219274287943816, "percentage": 62.19, "elapsed_time": "1 day, 2:24:54", "remaining_time": "16:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11159, "total_steps": 17941, "loss": 1.5854, "learning_rate": 3.226143032349211e-05, "epoch": 0.6219831670475447, "percentage": 62.2, "elapsed_time": "1 day, 2:25:02", "remaining_time": "16:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11160, "total_steps": 17941, "loss": 1.8011, "learning_rate": 3.225310556167501e-05, "epoch": 0.6220389053007078, "percentage": 62.2, "elapsed_time": "1 day, 2:25:11", "remaining_time": "16:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11161, "total_steps": 17941, "loss": 1.8349, "learning_rate": 3.2244781362685937e-05, "epoch": 0.622094643553871, "percentage": 62.21, "elapsed_time": "1 day, 2:25:20", "remaining_time": "16:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11162, "total_steps": 17941, "loss": 1.6352, "learning_rate": 3.223645772678887e-05, "epoch": 0.6221503818070342, "percentage": 62.22, "elapsed_time": "1 day, 2:25:28", "remaining_time": "16:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11163, "total_steps": 17941, "loss": 1.7301, "learning_rate": 3.2228134654247785e-05, "epoch": 0.6222061200601973, "percentage": 62.22, "elapsed_time": "1 day, 2:25:36", "remaining_time": "16:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11164, "total_steps": 17941, "loss": 1.939, "learning_rate": 3.2219812145326675e-05, "epoch": 0.6222618583133604, "percentage": 62.23, "elapsed_time": "1 day, 2:25:45", "remaining_time": "16:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11165, "total_steps": 17941, "loss": 1.5153, "learning_rate": 3.221149020028944e-05, "epoch": 0.6223175965665236, "percentage": 62.23, "elapsed_time": "1 day, 2:25:54", "remaining_time": "16:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11166, "total_steps": 17941, "loss": 1.7389, "learning_rate": 3.2203168819400045e-05, "epoch": 0.6223733348196867, "percentage": 62.24, "elapsed_time": "1 day, 2:26:03", "remaining_time": "16:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11167, "total_steps": 17941, "loss": 1.6778, "learning_rate": 3.219484800292234e-05, "epoch": 0.6224290730728499, "percentage": 62.24, "elapsed_time": "1 day, 2:26:11", "remaining_time": "16:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11168, "total_steps": 17941, "loss": 1.5979, "learning_rate": 3.2186527751120264e-05, "epoch": 0.6224848113260131, "percentage": 62.25, "elapsed_time": "1 day, 2:26:20", "remaining_time": "16:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11169, "total_steps": 17941, "loss": 1.6583, "learning_rate": 3.2178208064257666e-05, "epoch": 0.6225405495791762, "percentage": 62.25, "elapsed_time": "1 day, 2:26:28", "remaining_time": "16:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11170, "total_steps": 17941, "loss": 1.8095, "learning_rate": 3.2169888942598395e-05, "epoch": 0.6225962878323393, "percentage": 62.26, "elapsed_time": "1 day, 2:26:37", "remaining_time": "16:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11171, "total_steps": 17941, "loss": 1.7863, "learning_rate": 3.2161570386406305e-05, "epoch": 0.6226520260855025, "percentage": 62.27, "elapsed_time": "1 day, 2:26:46", "remaining_time": "16:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11172, "total_steps": 17941, "loss": 1.5287, "learning_rate": 3.2153252395945176e-05, "epoch": 0.6227077643386656, "percentage": 62.27, "elapsed_time": "1 day, 2:26:54", "remaining_time": "16:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11173, "total_steps": 17941, "loss": 1.5626, "learning_rate": 3.214493497147885e-05, "epoch": 0.6227635025918288, "percentage": 62.28, "elapsed_time": "1 day, 2:27:03", "remaining_time": "16:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11174, "total_steps": 17941, "loss": 1.3227, "learning_rate": 3.2136618113271055e-05, "epoch": 0.622819240844992, "percentage": 62.28, "elapsed_time": "1 day, 2:27:11", "remaining_time": "16:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11175, "total_steps": 17941, "loss": 1.4615, "learning_rate": 3.2128301821585616e-05, "epoch": 0.622874979098155, "percentage": 62.29, "elapsed_time": "1 day, 2:27:20", "remaining_time": "16:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11176, "total_steps": 17941, "loss": 1.5484, "learning_rate": 3.2119986096686215e-05, "epoch": 0.6229307173513182, "percentage": 62.29, "elapsed_time": "1 day, 2:27:28", "remaining_time": "16:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11177, "total_steps": 17941, "loss": 1.3652, "learning_rate": 3.211167093883661e-05, "epoch": 0.6229864556044814, "percentage": 62.3, "elapsed_time": "1 day, 2:27:37", "remaining_time": "16:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11178, "total_steps": 17941, "loss": 1.7177, "learning_rate": 3.2103356348300525e-05, "epoch": 0.6230421938576445, "percentage": 62.3, "elapsed_time": "1 day, 2:27:45", "remaining_time": "16:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11179, "total_steps": 17941, "loss": 1.6482, "learning_rate": 3.2095042325341626e-05, "epoch": 0.6230979321108077, "percentage": 62.31, "elapsed_time": "1 day, 2:27:54", "remaining_time": "16:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11180, "total_steps": 17941, "loss": 1.6545, "learning_rate": 3.2086728870223594e-05, "epoch": 0.6231536703639708, "percentage": 62.32, "elapsed_time": "1 day, 2:28:03", "remaining_time": "16:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11181, "total_steps": 17941, "loss": 1.9482, "learning_rate": 3.207841598321007e-05, "epoch": 0.6232094086171339, "percentage": 62.32, "elapsed_time": "1 day, 2:28:12", "remaining_time": "16:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11182, "total_steps": 17941, "loss": 1.4994, "learning_rate": 3.207010366456469e-05, "epoch": 0.6232651468702971, "percentage": 62.33, "elapsed_time": "1 day, 2:28:21", "remaining_time": "16:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11183, "total_steps": 17941, "loss": 1.6828, "learning_rate": 3.206179191455111e-05, "epoch": 0.6233208851234602, "percentage": 62.33, "elapsed_time": "1 day, 2:28:29", "remaining_time": "15:59:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11184, "total_steps": 17941, "loss": 1.66, "learning_rate": 3.2053480733432886e-05, "epoch": 0.6233766233766234, "percentage": 62.34, "elapsed_time": "1 day, 2:28:38", "remaining_time": "15:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11185, "total_steps": 17941, "loss": 1.7498, "learning_rate": 3.204517012147363e-05, "epoch": 0.6234323616297865, "percentage": 62.34, "elapsed_time": "1 day, 2:28:46", "remaining_time": "15:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11186, "total_steps": 17941, "loss": 1.7147, "learning_rate": 3.2036860078936886e-05, "epoch": 0.6234880998829496, "percentage": 62.35, "elapsed_time": "1 day, 2:28:55", "remaining_time": "15:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11187, "total_steps": 17941, "loss": 1.5002, "learning_rate": 3.2028550606086216e-05, "epoch": 0.6235438381361128, "percentage": 62.35, "elapsed_time": "1 day, 2:29:03", "remaining_time": "15:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11188, "total_steps": 17941, "loss": 1.6626, "learning_rate": 3.202024170318513e-05, "epoch": 0.623599576389276, "percentage": 62.36, "elapsed_time": "1 day, 2:29:12", "remaining_time": "15:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11189, "total_steps": 17941, "loss": 1.6432, "learning_rate": 3.201193337049714e-05, "epoch": 0.6236553146424391, "percentage": 62.37, "elapsed_time": "1 day, 2:29:20", "remaining_time": "15:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11190, "total_steps": 17941, "loss": 1.6593, "learning_rate": 3.2003625608285776e-05, "epoch": 0.6237110528956022, "percentage": 62.37, "elapsed_time": "1 day, 2:29:29", "remaining_time": "15:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11191, "total_steps": 17941, "loss": 1.7227, "learning_rate": 3.199531841681445e-05, "epoch": 0.6237667911487654, "percentage": 62.38, "elapsed_time": "1 day, 2:29:37", "remaining_time": "15:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11192, "total_steps": 17941, "loss": 1.663, "learning_rate": 3.198701179634668e-05, "epoch": 0.6238225294019285, "percentage": 62.38, "elapsed_time": "1 day, 2:29:46", "remaining_time": "15:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11193, "total_steps": 17941, "loss": 1.3727, "learning_rate": 3.197870574714584e-05, "epoch": 0.6238782676550917, "percentage": 62.39, "elapsed_time": "1 day, 2:29:54", "remaining_time": "15:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11194, "total_steps": 17941, "loss": 1.7794, "learning_rate": 3.197040026947541e-05, "epoch": 0.6239340059082549, "percentage": 62.39, "elapsed_time": "1 day, 2:30:03", "remaining_time": "15:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11195, "total_steps": 17941, "loss": 1.7328, "learning_rate": 3.196209536359874e-05, "epoch": 0.623989744161418, "percentage": 62.4, "elapsed_time": "1 day, 2:30:11", "remaining_time": "15:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11196, "total_steps": 17941, "loss": 1.621, "learning_rate": 3.195379102977925e-05, "epoch": 0.6240454824145811, "percentage": 62.4, "elapsed_time": "1 day, 2:30:20", "remaining_time": "15:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11197, "total_steps": 17941, "loss": 1.6368, "learning_rate": 3.19454872682803e-05, "epoch": 0.6241012206677443, "percentage": 62.41, "elapsed_time": "1 day, 2:30:28", "remaining_time": "15:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11198, "total_steps": 17941, "loss": 1.4724, "learning_rate": 3.193718407936521e-05, "epoch": 0.6241569589209074, "percentage": 62.42, "elapsed_time": "1 day, 2:30:37", "remaining_time": "15:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11199, "total_steps": 17941, "loss": 1.5669, "learning_rate": 3.192888146329734e-05, "epoch": 0.6242126971740706, "percentage": 62.42, "elapsed_time": "1 day, 2:30:45", "remaining_time": "15:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11200, "total_steps": 17941, "loss": 1.904, "learning_rate": 3.192057942033997e-05, "epoch": 0.6242684354272338, "percentage": 62.43, "elapsed_time": "1 day, 2:30:54", "remaining_time": "15:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11201, "total_steps": 17941, "loss": 1.4223, "learning_rate": 3.191227795075644e-05, "epoch": 0.6243241736803968, "percentage": 62.43, "elapsed_time": "1 day, 2:31:02", "remaining_time": "15:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11202, "total_steps": 17941, "loss": 1.6111, "learning_rate": 3.190397705480997e-05, "epoch": 0.62437991193356, "percentage": 62.44, "elapsed_time": "1 day, 2:31:12", "remaining_time": "15:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11203, "total_steps": 17941, "loss": 2.0359, "learning_rate": 3.189567673276385e-05, "epoch": 0.6244356501867232, "percentage": 62.44, "elapsed_time": "1 day, 2:31:20", "remaining_time": "15:57:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11204, "total_steps": 17941, "loss": 1.6094, "learning_rate": 3.1887376984881315e-05, "epoch": 0.6244913884398863, "percentage": 62.45, "elapsed_time": "1 day, 2:31:29", "remaining_time": "15:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11205, "total_steps": 17941, "loss": 1.581, "learning_rate": 3.187907781142556e-05, "epoch": 0.6245471266930495, "percentage": 62.45, "elapsed_time": "1 day, 2:31:38", "remaining_time": "15:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11206, "total_steps": 17941, "loss": 1.4707, "learning_rate": 3.187077921265983e-05, "epoch": 0.6246028649462125, "percentage": 62.46, "elapsed_time": "1 day, 2:31:46", "remaining_time": "15:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11207, "total_steps": 17941, "loss": 1.6216, "learning_rate": 3.186248118884726e-05, "epoch": 0.6246586031993757, "percentage": 62.47, "elapsed_time": "1 day, 2:31:55", "remaining_time": "15:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11208, "total_steps": 17941, "loss": 1.5112, "learning_rate": 3.185418374025104e-05, "epoch": 0.6247143414525389, "percentage": 62.47, "elapsed_time": "1 day, 2:32:03", "remaining_time": "15:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11209, "total_steps": 17941, "loss": 1.8131, "learning_rate": 3.184588686713432e-05, "epoch": 0.624770079705702, "percentage": 62.48, "elapsed_time": "1 day, 2:32:12", "remaining_time": "15:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11210, "total_steps": 17941, "loss": 1.6177, "learning_rate": 3.183759056976022e-05, "epoch": 0.6248258179588652, "percentage": 62.48, "elapsed_time": "1 day, 2:32:20", "remaining_time": "15:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11211, "total_steps": 17941, "loss": 1.8943, "learning_rate": 3.1829294848391867e-05, "epoch": 0.6248815562120283, "percentage": 62.49, "elapsed_time": "1 day, 2:32:29", "remaining_time": "15:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11212, "total_steps": 17941, "loss": 1.4587, "learning_rate": 3.182099970329232e-05, "epoch": 0.6249372944651914, "percentage": 62.49, "elapsed_time": "1 day, 2:32:38", "remaining_time": "15:55:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11213, "total_steps": 17941, "loss": 1.7161, "learning_rate": 3.181270513472469e-05, "epoch": 0.6249930327183546, "percentage": 62.5, "elapsed_time": "1 day, 2:32:46", "remaining_time": "15:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11214, "total_steps": 17941, "loss": 1.6094, "learning_rate": 3.1804411142952e-05, "epoch": 0.6250487709715178, "percentage": 62.5, "elapsed_time": "1 day, 2:32:56", "remaining_time": "15:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11215, "total_steps": 17941, "loss": 1.8517, "learning_rate": 3.179611772823729e-05, "epoch": 0.6251045092246809, "percentage": 62.51, "elapsed_time": "1 day, 2:33:05", "remaining_time": "15:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11216, "total_steps": 17941, "loss": 1.4891, "learning_rate": 3.178782489084362e-05, "epoch": 0.625160247477844, "percentage": 62.52, "elapsed_time": "1 day, 2:33:13", "remaining_time": "15:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11217, "total_steps": 17941, "loss": 1.5387, "learning_rate": 3.177953263103394e-05, "epoch": 0.6252159857310072, "percentage": 62.52, "elapsed_time": "1 day, 2:33:22", "remaining_time": "15:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11218, "total_steps": 17941, "loss": 1.8772, "learning_rate": 3.177124094907127e-05, "epoch": 0.6252717239841703, "percentage": 62.53, "elapsed_time": "1 day, 2:33:30", "remaining_time": "15:55:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11219, "total_steps": 17941, "loss": 1.6118, "learning_rate": 3.176294984521852e-05, "epoch": 0.6253274622373335, "percentage": 62.53, "elapsed_time": "1 day, 2:33:39", "remaining_time": "15:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11220, "total_steps": 17941, "loss": 1.5575, "learning_rate": 3.175465931973871e-05, "epoch": 0.6253832004904967, "percentage": 62.54, "elapsed_time": "1 day, 2:33:47", "remaining_time": "15:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11221, "total_steps": 17941, "loss": 1.8273, "learning_rate": 3.174636937289471e-05, "epoch": 0.6254389387436597, "percentage": 62.54, "elapsed_time": "1 day, 2:33:56", "remaining_time": "15:54:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11222, "total_steps": 17941, "loss": 1.7487, "learning_rate": 3.173808000494944e-05, "epoch": 0.6254946769968229, "percentage": 62.55, "elapsed_time": "1 day, 2:34:04", "remaining_time": "15:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11223, "total_steps": 17941, "loss": 1.7391, "learning_rate": 3.1729791216165814e-05, "epoch": 0.6255504152499861, "percentage": 62.56, "elapsed_time": "1 day, 2:34:13", "remaining_time": "15:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11224, "total_steps": 17941, "loss": 1.9217, "learning_rate": 3.172150300680669e-05, "epoch": 0.6256061535031492, "percentage": 62.56, "elapsed_time": "1 day, 2:34:21", "remaining_time": "15:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11225, "total_steps": 17941, "loss": 1.9327, "learning_rate": 3.171321537713491e-05, "epoch": 0.6256618917563124, "percentage": 62.57, "elapsed_time": "1 day, 2:34:29", "remaining_time": "15:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11226, "total_steps": 17941, "loss": 1.6966, "learning_rate": 3.1704928327413307e-05, "epoch": 0.6257176300094756, "percentage": 62.57, "elapsed_time": "1 day, 2:34:38", "remaining_time": "15:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11227, "total_steps": 17941, "loss": 1.664, "learning_rate": 3.169664185790474e-05, "epoch": 0.6257733682626386, "percentage": 62.58, "elapsed_time": "1 day, 2:34:46", "remaining_time": "15:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11228, "total_steps": 17941, "loss": 1.5542, "learning_rate": 3.1688355968871945e-05, "epoch": 0.6258291065158018, "percentage": 62.58, "elapsed_time": "1 day, 2:34:55", "remaining_time": "15:53:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11229, "total_steps": 17941, "loss": 1.6896, "learning_rate": 3.1680070660577746e-05, "epoch": 0.6258848447689649, "percentage": 62.59, "elapsed_time": "1 day, 2:35:03", "remaining_time": "15:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11230, "total_steps": 17941, "loss": 1.6811, "learning_rate": 3.1671785933284906e-05, "epoch": 0.6259405830221281, "percentage": 62.59, "elapsed_time": "1 day, 2:35:12", "remaining_time": "15:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11231, "total_steps": 17941, "loss": 1.7108, "learning_rate": 3.166350178725615e-05, "epoch": 0.6259963212752913, "percentage": 62.6, "elapsed_time": "1 day, 2:35:20", "remaining_time": "15:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11232, "total_steps": 17941, "loss": 1.6537, "learning_rate": 3.16552182227542e-05, "epoch": 0.6260520595284543, "percentage": 62.61, "elapsed_time": "1 day, 2:35:29", "remaining_time": "15:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11233, "total_steps": 17941, "loss": 1.5966, "learning_rate": 3.164693524004178e-05, "epoch": 0.6261077977816175, "percentage": 62.61, "elapsed_time": "1 day, 2:35:37", "remaining_time": "15:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11234, "total_steps": 17941, "loss": 1.8528, "learning_rate": 3.1638652839381544e-05, "epoch": 0.6261635360347807, "percentage": 62.62, "elapsed_time": "1 day, 2:35:46", "remaining_time": "15:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11235, "total_steps": 17941, "loss": 1.7224, "learning_rate": 3.1630371021036214e-05, "epoch": 0.6262192742879438, "percentage": 62.62, "elapsed_time": "1 day, 2:35:54", "remaining_time": "15:52:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11236, "total_steps": 17941, "loss": 1.5045, "learning_rate": 3.16220897852684e-05, "epoch": 0.626275012541107, "percentage": 62.63, "elapsed_time": "1 day, 2:36:03", "remaining_time": "15:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11237, "total_steps": 17941, "loss": 1.6119, "learning_rate": 3.1613809132340756e-05, "epoch": 0.6263307507942701, "percentage": 62.63, "elapsed_time": "1 day, 2:36:11", "remaining_time": "15:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11238, "total_steps": 17941, "loss": 1.7967, "learning_rate": 3.1605529062515884e-05, "epoch": 0.6263864890474332, "percentage": 62.64, "elapsed_time": "1 day, 2:36:20", "remaining_time": "15:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11239, "total_steps": 17941, "loss": 1.4543, "learning_rate": 3.1597249576056384e-05, "epoch": 0.6264422273005964, "percentage": 62.64, "elapsed_time": "1 day, 2:36:28", "remaining_time": "15:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11240, "total_steps": 17941, "loss": 1.6086, "learning_rate": 3.1588970673224826e-05, "epoch": 0.6264979655537596, "percentage": 62.65, "elapsed_time": "1 day, 2:36:36", "remaining_time": "15:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11241, "total_steps": 17941, "loss": 1.8036, "learning_rate": 3.158069235428377e-05, "epoch": 0.6265537038069227, "percentage": 62.66, "elapsed_time": "1 day, 2:36:45", "remaining_time": "15:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11242, "total_steps": 17941, "loss": 1.5898, "learning_rate": 3.157241461949578e-05, "epoch": 0.6266094420600858, "percentage": 62.66, "elapsed_time": "1 day, 2:36:53", "remaining_time": "15:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11243, "total_steps": 17941, "loss": 1.5166, "learning_rate": 3.1564137469123336e-05, "epoch": 0.626665180313249, "percentage": 62.67, "elapsed_time": "1 day, 2:37:02", "remaining_time": "15:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11244, "total_steps": 17941, "loss": 1.9267, "learning_rate": 3.155586090342898e-05, "epoch": 0.6267209185664121, "percentage": 62.67, "elapsed_time": "1 day, 2:37:10", "remaining_time": "15:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11245, "total_steps": 17941, "loss": 1.7181, "learning_rate": 3.1547584922675163e-05, "epoch": 0.6267766568195753, "percentage": 62.68, "elapsed_time": "1 day, 2:37:19", "remaining_time": "15:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11246, "total_steps": 17941, "loss": 1.7861, "learning_rate": 3.1539309527124394e-05, "epoch": 0.6268323950727385, "percentage": 62.68, "elapsed_time": "1 day, 2:37:27", "remaining_time": "15:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11247, "total_steps": 17941, "loss": 1.7002, "learning_rate": 3.153103471703907e-05, "epoch": 0.6268881333259015, "percentage": 62.69, "elapsed_time": "1 day, 2:37:36", "remaining_time": "15:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11248, "total_steps": 17941, "loss": 1.6348, "learning_rate": 3.1522760492681647e-05, "epoch": 0.6269438715790647, "percentage": 62.69, "elapsed_time": "1 day, 2:37:44", "remaining_time": "15:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11249, "total_steps": 17941, "loss": 1.6681, "learning_rate": 3.151448685431454e-05, "epoch": 0.6269996098322279, "percentage": 62.7, "elapsed_time": "1 day, 2:37:53", "remaining_time": "15:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11250, "total_steps": 17941, "loss": 1.6242, "learning_rate": 3.150621380220011e-05, "epoch": 0.627055348085391, "percentage": 62.71, "elapsed_time": "1 day, 2:38:01", "remaining_time": "15:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11251, "total_steps": 17941, "loss": 1.5461, "learning_rate": 3.149794133660079e-05, "epoch": 0.6271110863385542, "percentage": 62.71, "elapsed_time": "1 day, 2:38:09", "remaining_time": "15:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11252, "total_steps": 17941, "loss": 1.6535, "learning_rate": 3.148966945777886e-05, "epoch": 0.6271668245917172, "percentage": 62.72, "elapsed_time": "1 day, 2:38:18", "remaining_time": "15:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11253, "total_steps": 17941, "loss": 1.5138, "learning_rate": 3.148139816599672e-05, "epoch": 0.6272225628448804, "percentage": 62.72, "elapsed_time": "1 day, 2:38:26", "remaining_time": "15:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11254, "total_steps": 17941, "loss": 1.546, "learning_rate": 3.147312746151664e-05, "epoch": 0.6272783010980436, "percentage": 62.73, "elapsed_time": "1 day, 2:38:35", "remaining_time": "15:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11255, "total_steps": 17941, "loss": 1.6739, "learning_rate": 3.1464857344600935e-05, "epoch": 0.6273340393512067, "percentage": 62.73, "elapsed_time": "1 day, 2:38:43", "remaining_time": "15:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11256, "total_steps": 17941, "loss": 1.5668, "learning_rate": 3.145658781551191e-05, "epoch": 0.6273897776043699, "percentage": 62.74, "elapsed_time": "1 day, 2:38:52", "remaining_time": "15:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11257, "total_steps": 17941, "loss": 1.545, "learning_rate": 3.144831887451178e-05, "epoch": 0.627445515857533, "percentage": 62.74, "elapsed_time": "1 day, 2:39:00", "remaining_time": "15:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11258, "total_steps": 17941, "loss": 1.6925, "learning_rate": 3.144005052186283e-05, "epoch": 0.6275012541106961, "percentage": 62.75, "elapsed_time": "1 day, 2:39:09", "remaining_time": "15:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11259, "total_steps": 17941, "loss": 1.5535, "learning_rate": 3.1431782757827256e-05, "epoch": 0.6275569923638593, "percentage": 62.76, "elapsed_time": "1 day, 2:39:17", "remaining_time": "15:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11260, "total_steps": 17941, "loss": 1.5023, "learning_rate": 3.142351558266726e-05, "epoch": 0.6276127306170225, "percentage": 62.76, "elapsed_time": "1 day, 2:39:26", "remaining_time": "15:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11261, "total_steps": 17941, "loss": 1.4871, "learning_rate": 3.1415248996645056e-05, "epoch": 0.6276684688701856, "percentage": 62.77, "elapsed_time": "1 day, 2:39:34", "remaining_time": "15:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11262, "total_steps": 17941, "loss": 1.79, "learning_rate": 3.1406983000022795e-05, "epoch": 0.6277242071233488, "percentage": 62.77, "elapsed_time": "1 day, 2:39:42", "remaining_time": "15:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11263, "total_steps": 17941, "loss": 1.7054, "learning_rate": 3.1398717593062635e-05, "epoch": 0.6277799453765119, "percentage": 62.78, "elapsed_time": "1 day, 2:39:51", "remaining_time": "15:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11264, "total_steps": 17941, "loss": 1.7227, "learning_rate": 3.139045277602669e-05, "epoch": 0.627835683629675, "percentage": 62.78, "elapsed_time": "1 day, 2:39:59", "remaining_time": "15:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11265, "total_steps": 17941, "loss": 1.7799, "learning_rate": 3.138218854917709e-05, "epoch": 0.6278914218828382, "percentage": 62.79, "elapsed_time": "1 day, 2:40:08", "remaining_time": "15:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11266, "total_steps": 17941, "loss": 1.8094, "learning_rate": 3.137392491277592e-05, "epoch": 0.6279471601360014, "percentage": 62.79, "elapsed_time": "1 day, 2:40:16", "remaining_time": "15:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11267, "total_steps": 17941, "loss": 1.2856, "learning_rate": 3.1365661867085236e-05, "epoch": 0.6280028983891645, "percentage": 62.8, "elapsed_time": "1 day, 2:40:25", "remaining_time": "15:48:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11268, "total_steps": 17941, "loss": 1.8226, "learning_rate": 3.135739941236714e-05, "epoch": 0.6280586366423276, "percentage": 62.81, "elapsed_time": "1 day, 2:40:33", "remaining_time": "15:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11269, "total_steps": 17941, "loss": 1.4785, "learning_rate": 3.134913754888362e-05, "epoch": 0.6281143748954908, "percentage": 62.81, "elapsed_time": "1 day, 2:40:42", "remaining_time": "15:47:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11270, "total_steps": 17941, "loss": 1.7147, "learning_rate": 3.134087627689672e-05, "epoch": 0.6281701131486539, "percentage": 62.82, "elapsed_time": "1 day, 2:40:50", "remaining_time": "15:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11271, "total_steps": 17941, "loss": 1.6772, "learning_rate": 3.133261559666843e-05, "epoch": 0.6282258514018171, "percentage": 62.82, "elapsed_time": "1 day, 2:40:58", "remaining_time": "15:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11272, "total_steps": 17941, "loss": 1.5868, "learning_rate": 3.132435550846076e-05, "epoch": 0.6282815896549803, "percentage": 62.83, "elapsed_time": "1 day, 2:41:07", "remaining_time": "15:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11273, "total_steps": 17941, "loss": 1.8946, "learning_rate": 3.1316096012535626e-05, "epoch": 0.6283373279081433, "percentage": 62.83, "elapsed_time": "1 day, 2:41:15", "remaining_time": "15:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11274, "total_steps": 17941, "loss": 1.6757, "learning_rate": 3.130783710915498e-05, "epoch": 0.6283930661613065, "percentage": 62.84, "elapsed_time": "1 day, 2:41:24", "remaining_time": "15:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11275, "total_steps": 17941, "loss": 1.4474, "learning_rate": 3.129957879858078e-05, "epoch": 0.6284488044144696, "percentage": 62.84, "elapsed_time": "1 day, 2:41:33", "remaining_time": "15:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11276, "total_steps": 17941, "loss": 1.5844, "learning_rate": 3.1291321081074884e-05, "epoch": 0.6285045426676328, "percentage": 62.85, "elapsed_time": "1 day, 2:41:41", "remaining_time": "15:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11277, "total_steps": 17941, "loss": 1.4043, "learning_rate": 3.1283063956899244e-05, "epoch": 0.628560280920796, "percentage": 62.86, "elapsed_time": "1 day, 2:41:50", "remaining_time": "15:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11278, "total_steps": 17941, "loss": 1.7536, "learning_rate": 3.127480742631565e-05, "epoch": 0.628616019173959, "percentage": 62.86, "elapsed_time": "1 day, 2:41:58", "remaining_time": "15:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11279, "total_steps": 17941, "loss": 2.0976, "learning_rate": 3.126655148958602e-05, "epoch": 0.6286717574271222, "percentage": 62.87, "elapsed_time": "1 day, 2:42:07", "remaining_time": "15:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11280, "total_steps": 17941, "loss": 1.6716, "learning_rate": 3.125829614697213e-05, "epoch": 0.6287274956802854, "percentage": 62.87, "elapsed_time": "1 day, 2:42:16", "remaining_time": "15:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11281, "total_steps": 17941, "loss": 1.7497, "learning_rate": 3.125004139873582e-05, "epoch": 0.6287832339334485, "percentage": 62.88, "elapsed_time": "1 day, 2:42:24", "remaining_time": "15:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11282, "total_steps": 17941, "loss": 1.7312, "learning_rate": 3.1241787245138884e-05, "epoch": 0.6288389721866117, "percentage": 62.88, "elapsed_time": "1 day, 2:42:32", "remaining_time": "15:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11283, "total_steps": 17941, "loss": 1.5331, "learning_rate": 3.123353368644307e-05, "epoch": 0.6288947104397749, "percentage": 62.89, "elapsed_time": "1 day, 2:42:42", "remaining_time": "15:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11284, "total_steps": 17941, "loss": 1.6681, "learning_rate": 3.1225280722910175e-05, "epoch": 0.6289504486929379, "percentage": 62.9, "elapsed_time": "1 day, 2:42:50", "remaining_time": "15:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11285, "total_steps": 17941, "loss": 1.7812, "learning_rate": 3.12170283548019e-05, "epoch": 0.6290061869461011, "percentage": 62.9, "elapsed_time": "1 day, 2:42:59", "remaining_time": "15:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11286, "total_steps": 17941, "loss": 1.7624, "learning_rate": 3.120877658237998e-05, "epoch": 0.6290619251992643, "percentage": 62.91, "elapsed_time": "1 day, 2:43:08", "remaining_time": "15:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11287, "total_steps": 17941, "loss": 1.5895, "learning_rate": 3.120052540590609e-05, "epoch": 0.6291176634524274, "percentage": 62.91, "elapsed_time": "1 day, 2:43:16", "remaining_time": "15:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11288, "total_steps": 17941, "loss": 1.5756, "learning_rate": 3.1192274825641935e-05, "epoch": 0.6291734017055906, "percentage": 62.92, "elapsed_time": "1 day, 2:43:25", "remaining_time": "15:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11289, "total_steps": 17941, "loss": 1.9689, "learning_rate": 3.118402484184917e-05, "epoch": 0.6292291399587537, "percentage": 62.92, "elapsed_time": "1 day, 2:43:33", "remaining_time": "15:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11290, "total_steps": 17941, "loss": 1.422, "learning_rate": 3.1175775454789424e-05, "epoch": 0.6292848782119168, "percentage": 62.93, "elapsed_time": "1 day, 2:43:42", "remaining_time": "15:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11291, "total_steps": 17941, "loss": 1.5129, "learning_rate": 3.1167526664724346e-05, "epoch": 0.62934061646508, "percentage": 62.93, "elapsed_time": "1 day, 2:43:50", "remaining_time": "15:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11292, "total_steps": 17941, "loss": 1.5274, "learning_rate": 3.11592784719155e-05, "epoch": 0.6293963547182432, "percentage": 62.94, "elapsed_time": "1 day, 2:43:58", "remaining_time": "15:44:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11293, "total_steps": 17941, "loss": 1.7378, "learning_rate": 3.1151030876624486e-05, "epoch": 0.6294520929714063, "percentage": 62.95, "elapsed_time": "1 day, 2:44:07", "remaining_time": "15:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11294, "total_steps": 17941, "loss": 1.6353, "learning_rate": 3.1142783879112914e-05, "epoch": 0.6295078312245694, "percentage": 62.95, "elapsed_time": "1 day, 2:44:16", "remaining_time": "15:44:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11295, "total_steps": 17941, "loss": 1.6101, "learning_rate": 3.113453747964225e-05, "epoch": 0.6295635694777326, "percentage": 62.96, "elapsed_time": "1 day, 2:44:24", "remaining_time": "15:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11296, "total_steps": 17941, "loss": 1.6695, "learning_rate": 3.112629167847409e-05, "epoch": 0.6296193077308957, "percentage": 62.96, "elapsed_time": "1 day, 2:44:33", "remaining_time": "15:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11297, "total_steps": 17941, "loss": 1.4184, "learning_rate": 3.11180464758699e-05, "epoch": 0.6296750459840589, "percentage": 62.97, "elapsed_time": "1 day, 2:44:41", "remaining_time": "15:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11298, "total_steps": 17941, "loss": 1.7076, "learning_rate": 3.1109801872091205e-05, "epoch": 0.629730784237222, "percentage": 62.97, "elapsed_time": "1 day, 2:44:49", "remaining_time": "15:43:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11299, "total_steps": 17941, "loss": 1.8046, "learning_rate": 3.1101557867399444e-05, "epoch": 0.6297865224903851, "percentage": 62.98, "elapsed_time": "1 day, 2:44:58", "remaining_time": "15:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11300, "total_steps": 17941, "loss": 1.6712, "learning_rate": 3.109331446205608e-05, "epoch": 0.6298422607435483, "percentage": 62.98, "elapsed_time": "1 day, 2:45:06", "remaining_time": "15:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11301, "total_steps": 17941, "loss": 1.7935, "learning_rate": 3.108507165632256e-05, "epoch": 0.6298979989967114, "percentage": 62.99, "elapsed_time": "1 day, 2:45:15", "remaining_time": "15:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11302, "total_steps": 17941, "loss": 1.4931, "learning_rate": 3.1076829450460266e-05, "epoch": 0.6299537372498746, "percentage": 63.0, "elapsed_time": "1 day, 2:45:23", "remaining_time": "15:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11303, "total_steps": 17941, "loss": 1.5466, "learning_rate": 3.106858784473064e-05, "epoch": 0.6300094755030378, "percentage": 63.0, "elapsed_time": "1 day, 2:45:32", "remaining_time": "15:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11304, "total_steps": 17941, "loss": 1.5863, "learning_rate": 3.1060346839395e-05, "epoch": 0.6300652137562008, "percentage": 63.01, "elapsed_time": "1 day, 2:45:40", "remaining_time": "15:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11305, "total_steps": 17941, "loss": 1.5272, "learning_rate": 3.105210643471476e-05, "epoch": 0.630120952009364, "percentage": 63.01, "elapsed_time": "1 day, 2:45:49", "remaining_time": "15:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11306, "total_steps": 17941, "loss": 1.6595, "learning_rate": 3.10438666309512e-05, "epoch": 0.6301766902625272, "percentage": 63.02, "elapsed_time": "1 day, 2:45:57", "remaining_time": "15:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11307, "total_steps": 17941, "loss": 1.7253, "learning_rate": 3.103562742836569e-05, "epoch": 0.6302324285156903, "percentage": 63.02, "elapsed_time": "1 day, 2:46:06", "remaining_time": "15:42:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11308, "total_steps": 17941, "loss": 1.7749, "learning_rate": 3.1027388827219506e-05, "epoch": 0.6302881667688535, "percentage": 63.03, "elapsed_time": "1 day, 2:46:14", "remaining_time": "15:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11309, "total_steps": 17941, "loss": 1.6484, "learning_rate": 3.1019150827773925e-05, "epoch": 0.6303439050220166, "percentage": 63.03, "elapsed_time": "1 day, 2:46:23", "remaining_time": "15:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11310, "total_steps": 17941, "loss": 1.6021, "learning_rate": 3.1010913430290224e-05, "epoch": 0.6303996432751797, "percentage": 63.04, "elapsed_time": "1 day, 2:46:32", "remaining_time": "15:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11311, "total_steps": 17941, "loss": 1.3745, "learning_rate": 3.100267663502962e-05, "epoch": 0.6304553815283429, "percentage": 63.05, "elapsed_time": "1 day, 2:46:40", "remaining_time": "15:41:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11312, "total_steps": 17941, "loss": 1.6346, "learning_rate": 3.099444044225336e-05, "epoch": 0.6305111197815061, "percentage": 63.05, "elapsed_time": "1 day, 2:46:49", "remaining_time": "15:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11313, "total_steps": 17941, "loss": 1.7061, "learning_rate": 3.0986204852222626e-05, "epoch": 0.6305668580346692, "percentage": 63.06, "elapsed_time": "1 day, 2:46:57", "remaining_time": "15:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11314, "total_steps": 17941, "loss": 1.7118, "learning_rate": 3.097796986519863e-05, "epoch": 0.6306225962878323, "percentage": 63.06, "elapsed_time": "1 day, 2:47:06", "remaining_time": "15:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11315, "total_steps": 17941, "loss": 1.5219, "learning_rate": 3.096973548144252e-05, "epoch": 0.6306783345409955, "percentage": 63.07, "elapsed_time": "1 day, 2:47:14", "remaining_time": "15:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11316, "total_steps": 17941, "loss": 1.8662, "learning_rate": 3.096150170121545e-05, "epoch": 0.6307340727941586, "percentage": 63.07, "elapsed_time": "1 day, 2:47:23", "remaining_time": "15:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11317, "total_steps": 17941, "loss": 1.6059, "learning_rate": 3.0953268524778544e-05, "epoch": 0.6307898110473218, "percentage": 63.08, "elapsed_time": "1 day, 2:47:31", "remaining_time": "15:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11318, "total_steps": 17941, "loss": 1.7426, "learning_rate": 3.09450359523929e-05, "epoch": 0.630845549300485, "percentage": 63.08, "elapsed_time": "1 day, 2:47:39", "remaining_time": "15:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11319, "total_steps": 17941, "loss": 1.6988, "learning_rate": 3.093680398431962e-05, "epoch": 0.630901287553648, "percentage": 63.09, "elapsed_time": "1 day, 2:47:49", "remaining_time": "15:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11320, "total_steps": 17941, "loss": 1.6672, "learning_rate": 3.0928572620819786e-05, "epoch": 0.6309570258068112, "percentage": 63.1, "elapsed_time": "1 day, 2:47:57", "remaining_time": "15:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11321, "total_steps": 17941, "loss": 1.3523, "learning_rate": 3.092034186215441e-05, "epoch": 0.6310127640599743, "percentage": 63.1, "elapsed_time": "1 day, 2:48:05", "remaining_time": "15:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11322, "total_steps": 17941, "loss": 1.6872, "learning_rate": 3.091211170858457e-05, "epoch": 0.6310685023131375, "percentage": 63.11, "elapsed_time": "1 day, 2:48:14", "remaining_time": "15:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11323, "total_steps": 17941, "loss": 1.7043, "learning_rate": 3.0903882160371246e-05, "epoch": 0.6311242405663007, "percentage": 63.11, "elapsed_time": "1 day, 2:48:22", "remaining_time": "15:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11324, "total_steps": 17941, "loss": 1.7498, "learning_rate": 3.089565321777546e-05, "epoch": 0.6311799788194637, "percentage": 63.12, "elapsed_time": "1 day, 2:48:31", "remaining_time": "15:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11325, "total_steps": 17941, "loss": 1.6361, "learning_rate": 3.088742488105814e-05, "epoch": 0.6312357170726269, "percentage": 63.12, "elapsed_time": "1 day, 2:48:40", "remaining_time": "15:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11326, "total_steps": 17941, "loss": 1.707, "learning_rate": 3.0879197150480274e-05, "epoch": 0.6312914553257901, "percentage": 63.13, "elapsed_time": "1 day, 2:48:48", "remaining_time": "15:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11327, "total_steps": 17941, "loss": 1.8144, "learning_rate": 3.0870970026302813e-05, "epoch": 0.6313471935789532, "percentage": 63.13, "elapsed_time": "1 day, 2:48:57", "remaining_time": "15:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11328, "total_steps": 17941, "loss": 1.8036, "learning_rate": 3.0862743508786626e-05, "epoch": 0.6314029318321164, "percentage": 63.14, "elapsed_time": "1 day, 2:49:05", "remaining_time": "15:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11329, "total_steps": 17941, "loss": 1.666, "learning_rate": 3.0854517598192666e-05, "epoch": 0.6314586700852796, "percentage": 63.15, "elapsed_time": "1 day, 2:49:14", "remaining_time": "15:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11330, "total_steps": 17941, "loss": 1.6637, "learning_rate": 3.084629229478175e-05, "epoch": 0.6315144083384426, "percentage": 63.15, "elapsed_time": "1 day, 2:49:22", "remaining_time": "15:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11331, "total_steps": 17941, "loss": 1.597, "learning_rate": 3.083806759881479e-05, "epoch": 0.6315701465916058, "percentage": 63.16, "elapsed_time": "1 day, 2:49:31", "remaining_time": "15:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11332, "total_steps": 17941, "loss": 1.6464, "learning_rate": 3.0829843510552604e-05, "epoch": 0.631625884844769, "percentage": 63.16, "elapsed_time": "1 day, 2:49:39", "remaining_time": "15:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11333, "total_steps": 17941, "loss": 1.5438, "learning_rate": 3.0821620030256e-05, "epoch": 0.6316816230979321, "percentage": 63.17, "elapsed_time": "1 day, 2:49:47", "remaining_time": "15:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11334, "total_steps": 17941, "loss": 1.7269, "learning_rate": 3.0813397158185806e-05, "epoch": 0.6317373613510953, "percentage": 63.17, "elapsed_time": "1 day, 2:49:56", "remaining_time": "15:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11335, "total_steps": 17941, "loss": 1.6349, "learning_rate": 3.0805174894602775e-05, "epoch": 0.6317930996042584, "percentage": 63.18, "elapsed_time": "1 day, 2:50:04", "remaining_time": "15:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11336, "total_steps": 17941, "loss": 1.6013, "learning_rate": 3.0796953239767693e-05, "epoch": 0.6318488378574215, "percentage": 63.18, "elapsed_time": "1 day, 2:50:13", "remaining_time": "15:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11337, "total_steps": 17941, "loss": 1.7542, "learning_rate": 3.078873219394127e-05, "epoch": 0.6319045761105847, "percentage": 63.19, "elapsed_time": "1 day, 2:50:21", "remaining_time": "15:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11338, "total_steps": 17941, "loss": 1.8181, "learning_rate": 3.078051175738429e-05, "epoch": 0.6319603143637479, "percentage": 63.2, "elapsed_time": "1 day, 2:50:30", "remaining_time": "15:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11339, "total_steps": 17941, "loss": 1.6423, "learning_rate": 3.0772291930357386e-05, "epoch": 0.632016052616911, "percentage": 63.2, "elapsed_time": "1 day, 2:50:38", "remaining_time": "15:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11340, "total_steps": 17941, "loss": 1.5643, "learning_rate": 3.076407271312129e-05, "epoch": 0.6320717908700741, "percentage": 63.21, "elapsed_time": "1 day, 2:50:47", "remaining_time": "15:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11341, "total_steps": 17941, "loss": 1.609, "learning_rate": 3.075585410593666e-05, "epoch": 0.6321275291232373, "percentage": 63.21, "elapsed_time": "1 day, 2:50:55", "remaining_time": "15:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11342, "total_steps": 17941, "loss": 1.9504, "learning_rate": 3.074763610906413e-05, "epoch": 0.6321832673764004, "percentage": 63.22, "elapsed_time": "1 day, 2:51:03", "remaining_time": "15:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11343, "total_steps": 17941, "loss": 1.704, "learning_rate": 3.073941872276434e-05, "epoch": 0.6322390056295636, "percentage": 63.22, "elapsed_time": "1 day, 2:51:12", "remaining_time": "15:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11344, "total_steps": 17941, "loss": 1.8544, "learning_rate": 3.073120194729788e-05, "epoch": 0.6322947438827267, "percentage": 63.23, "elapsed_time": "1 day, 2:51:20", "remaining_time": "15:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11345, "total_steps": 17941, "loss": 1.6185, "learning_rate": 3.072298578292534e-05, "epoch": 0.6323504821358898, "percentage": 63.24, "elapsed_time": "1 day, 2:51:29", "remaining_time": "15:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11346, "total_steps": 17941, "loss": 1.764, "learning_rate": 3.071477022990734e-05, "epoch": 0.632406220389053, "percentage": 63.24, "elapsed_time": "1 day, 2:51:37", "remaining_time": "15:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11347, "total_steps": 17941, "loss": 1.6142, "learning_rate": 3.070655528850435e-05, "epoch": 0.6324619586422161, "percentage": 63.25, "elapsed_time": "1 day, 2:51:46", "remaining_time": "15:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11348, "total_steps": 17941, "loss": 1.6187, "learning_rate": 3.0698340958976943e-05, "epoch": 0.6325176968953793, "percentage": 63.25, "elapsed_time": "1 day, 2:51:54", "remaining_time": "15:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11349, "total_steps": 17941, "loss": 1.5745, "learning_rate": 3.069012724158563e-05, "epoch": 0.6325734351485425, "percentage": 63.26, "elapsed_time": "1 day, 2:52:03", "remaining_time": "15:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11350, "total_steps": 17941, "loss": 1.9964, "learning_rate": 3.068191413659091e-05, "epoch": 0.6326291734017055, "percentage": 63.26, "elapsed_time": "1 day, 2:52:11", "remaining_time": "15:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11351, "total_steps": 17941, "loss": 1.5707, "learning_rate": 3.067370164425322e-05, "epoch": 0.6326849116548687, "percentage": 63.27, "elapsed_time": "1 day, 2:52:20", "remaining_time": "15:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11352, "total_steps": 17941, "loss": 1.8577, "learning_rate": 3.066548976483304e-05, "epoch": 0.6327406499080319, "percentage": 63.27, "elapsed_time": "1 day, 2:52:28", "remaining_time": "15:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11353, "total_steps": 17941, "loss": 1.6431, "learning_rate": 3.06572784985908e-05, "epoch": 0.632796388161195, "percentage": 63.28, "elapsed_time": "1 day, 2:52:37", "remaining_time": "15:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11354, "total_steps": 17941, "loss": 1.5172, "learning_rate": 3.0649067845786895e-05, "epoch": 0.6328521264143582, "percentage": 63.29, "elapsed_time": "1 day, 2:52:45", "remaining_time": "15:35:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11355, "total_steps": 17941, "loss": 1.8141, "learning_rate": 3.0640857806681764e-05, "epoch": 0.6329078646675214, "percentage": 63.29, "elapsed_time": "1 day, 2:52:54", "remaining_time": "15:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11356, "total_steps": 17941, "loss": 1.679, "learning_rate": 3.0632648381535725e-05, "epoch": 0.6329636029206844, "percentage": 63.3, "elapsed_time": "1 day, 2:53:02", "remaining_time": "15:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11357, "total_steps": 17941, "loss": 1.5311, "learning_rate": 3.062443957060918e-05, "epoch": 0.6330193411738476, "percentage": 63.3, "elapsed_time": "1 day, 2:53:11", "remaining_time": "15:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11358, "total_steps": 17941, "loss": 1.6186, "learning_rate": 3.061623137416243e-05, "epoch": 0.6330750794270108, "percentage": 63.31, "elapsed_time": "1 day, 2:53:19", "remaining_time": "15:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11359, "total_steps": 17941, "loss": 1.7088, "learning_rate": 3.060802379245581e-05, "epoch": 0.6331308176801739, "percentage": 63.31, "elapsed_time": "1 day, 2:53:28", "remaining_time": "15:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11360, "total_steps": 17941, "loss": 1.5318, "learning_rate": 3.059981682574961e-05, "epoch": 0.6331865559333371, "percentage": 63.32, "elapsed_time": "1 day, 2:53:36", "remaining_time": "15:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11361, "total_steps": 17941, "loss": 1.5, "learning_rate": 3.059161047430411e-05, "epoch": 0.6332422941865002, "percentage": 63.32, "elapsed_time": "1 day, 2:53:45", "remaining_time": "15:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11362, "total_steps": 17941, "loss": 1.6703, "learning_rate": 3.058340473837958e-05, "epoch": 0.6332980324396633, "percentage": 63.33, "elapsed_time": "1 day, 2:53:53", "remaining_time": "15:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11363, "total_steps": 17941, "loss": 1.42, "learning_rate": 3.057519961823622e-05, "epoch": 0.6333537706928265, "percentage": 63.34, "elapsed_time": "1 day, 2:54:02", "remaining_time": "15:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11364, "total_steps": 17941, "loss": 1.8826, "learning_rate": 3.05669951141343e-05, "epoch": 0.6334095089459897, "percentage": 63.34, "elapsed_time": "1 day, 2:54:10", "remaining_time": "15:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11365, "total_steps": 17941, "loss": 1.7671, "learning_rate": 3.055879122633397e-05, "epoch": 0.6334652471991528, "percentage": 63.35, "elapsed_time": "1 day, 2:54:18", "remaining_time": "15:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11366, "total_steps": 17941, "loss": 1.7308, "learning_rate": 3.055058795509544e-05, "epoch": 0.6335209854523159, "percentage": 63.35, "elapsed_time": "1 day, 2:54:27", "remaining_time": "15:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11367, "total_steps": 17941, "loss": 1.8272, "learning_rate": 3.0542385300678875e-05, "epoch": 0.633576723705479, "percentage": 63.36, "elapsed_time": "1 day, 2:54:36", "remaining_time": "15:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11368, "total_steps": 17941, "loss": 1.3861, "learning_rate": 3.053418326334438e-05, "epoch": 0.6336324619586422, "percentage": 63.36, "elapsed_time": "1 day, 2:54:45", "remaining_time": "15:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11369, "total_steps": 17941, "loss": 2.0965, "learning_rate": 3.052598184335212e-05, "epoch": 0.6336882002118054, "percentage": 63.37, "elapsed_time": "1 day, 2:54:53", "remaining_time": "15:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11370, "total_steps": 17941, "loss": 1.5337, "learning_rate": 3.0517781040962163e-05, "epoch": 0.6337439384649685, "percentage": 63.37, "elapsed_time": "1 day, 2:55:02", "remaining_time": "15:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11371, "total_steps": 17941, "loss": 1.6827, "learning_rate": 3.0509580856434595e-05, "epoch": 0.6337996767181316, "percentage": 63.38, "elapsed_time": "1 day, 2:55:10", "remaining_time": "15:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11372, "total_steps": 17941, "loss": 1.6712, "learning_rate": 3.0501381290029506e-05, "epoch": 0.6338554149712948, "percentage": 63.39, "elapsed_time": "1 day, 2:55:18", "remaining_time": "15:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11373, "total_steps": 17941, "loss": 1.7436, "learning_rate": 3.049318234200689e-05, "epoch": 0.6339111532244579, "percentage": 63.39, "elapsed_time": "1 day, 2:55:27", "remaining_time": "15:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11374, "total_steps": 17941, "loss": 1.5253, "learning_rate": 3.048498401262683e-05, "epoch": 0.6339668914776211, "percentage": 63.4, "elapsed_time": "1 day, 2:55:35", "remaining_time": "15:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11375, "total_steps": 17941, "loss": 1.6458, "learning_rate": 3.0476786302149274e-05, "epoch": 0.6340226297307843, "percentage": 63.4, "elapsed_time": "1 day, 2:55:44", "remaining_time": "15:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11376, "total_steps": 17941, "loss": 1.8774, "learning_rate": 3.0468589210834237e-05, "epoch": 0.6340783679839473, "percentage": 63.41, "elapsed_time": "1 day, 2:55:52", "remaining_time": "15:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11377, "total_steps": 17941, "loss": 1.7102, "learning_rate": 3.046039273894167e-05, "epoch": 0.6341341062371105, "percentage": 63.41, "elapsed_time": "1 day, 2:56:01", "remaining_time": "15:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11378, "total_steps": 17941, "loss": 1.8709, "learning_rate": 3.045219688673152e-05, "epoch": 0.6341898444902737, "percentage": 63.42, "elapsed_time": "1 day, 2:56:09", "remaining_time": "15:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11379, "total_steps": 17941, "loss": 1.6028, "learning_rate": 3.044400165446372e-05, "epoch": 0.6342455827434368, "percentage": 63.42, "elapsed_time": "1 day, 2:56:18", "remaining_time": "15:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11380, "total_steps": 17941, "loss": 1.6706, "learning_rate": 3.043580704239815e-05, "epoch": 0.6343013209966, "percentage": 63.43, "elapsed_time": "1 day, 2:56:26", "remaining_time": "15:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11381, "total_steps": 17941, "loss": 1.3136, "learning_rate": 3.0427613050794745e-05, "epoch": 0.6343570592497632, "percentage": 63.44, "elapsed_time": "1 day, 2:56:35", "remaining_time": "15:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11382, "total_steps": 17941, "loss": 1.7069, "learning_rate": 3.0419419679913307e-05, "epoch": 0.6344127975029262, "percentage": 63.44, "elapsed_time": "1 day, 2:56:43", "remaining_time": "15:31:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11383, "total_steps": 17941, "loss": 1.9564, "learning_rate": 3.0411226930013735e-05, "epoch": 0.6344685357560894, "percentage": 63.45, "elapsed_time": "1 day, 2:56:52", "remaining_time": "15:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11384, "total_steps": 17941, "loss": 1.655, "learning_rate": 3.0403034801355828e-05, "epoch": 0.6345242740092526, "percentage": 63.45, "elapsed_time": "1 day, 2:57:00", "remaining_time": "15:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11385, "total_steps": 17941, "loss": 1.4787, "learning_rate": 3.0394843294199395e-05, "epoch": 0.6345800122624157, "percentage": 63.46, "elapsed_time": "1 day, 2:57:09", "remaining_time": "15:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11386, "total_steps": 17941, "loss": 1.6266, "learning_rate": 3.038665240880424e-05, "epoch": 0.6346357505155789, "percentage": 63.46, "elapsed_time": "1 day, 2:57:17", "remaining_time": "15:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11387, "total_steps": 17941, "loss": 1.8088, "learning_rate": 3.0378462145430102e-05, "epoch": 0.634691488768742, "percentage": 63.47, "elapsed_time": "1 day, 2:57:26", "remaining_time": "15:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11388, "total_steps": 17941, "loss": 1.5096, "learning_rate": 3.0370272504336762e-05, "epoch": 0.6347472270219051, "percentage": 63.47, "elapsed_time": "1 day, 2:57:34", "remaining_time": "15:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11389, "total_steps": 17941, "loss": 1.9104, "learning_rate": 3.0362083485783897e-05, "epoch": 0.6348029652750683, "percentage": 63.48, "elapsed_time": "1 day, 2:57:42", "remaining_time": "15:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11390, "total_steps": 17941, "loss": 1.8119, "learning_rate": 3.035389509003128e-05, "epoch": 0.6348587035282314, "percentage": 63.49, "elapsed_time": "1 day, 2:57:51", "remaining_time": "15:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11391, "total_steps": 17941, "loss": 1.7255, "learning_rate": 3.0345707317338545e-05, "epoch": 0.6349144417813946, "percentage": 63.49, "elapsed_time": "1 day, 2:57:59", "remaining_time": "15:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11392, "total_steps": 17941, "loss": 1.6893, "learning_rate": 3.0337520167965383e-05, "epoch": 0.6349701800345577, "percentage": 63.5, "elapsed_time": "1 day, 2:58:08", "remaining_time": "15:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11393, "total_steps": 17941, "loss": 1.6162, "learning_rate": 3.0329333642171454e-05, "epoch": 0.6350259182877208, "percentage": 63.5, "elapsed_time": "1 day, 2:58:16", "remaining_time": "15:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11394, "total_steps": 17941, "loss": 1.6565, "learning_rate": 3.032114774021636e-05, "epoch": 0.635081656540884, "percentage": 63.51, "elapsed_time": "1 day, 2:58:25", "remaining_time": "15:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11395, "total_steps": 17941, "loss": 1.6259, "learning_rate": 3.031296246235974e-05, "epoch": 0.6351373947940472, "percentage": 63.51, "elapsed_time": "1 day, 2:58:33", "remaining_time": "15:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11396, "total_steps": 17941, "loss": 1.8429, "learning_rate": 3.0304777808861152e-05, "epoch": 0.6351931330472103, "percentage": 63.52, "elapsed_time": "1 day, 2:58:42", "remaining_time": "15:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11397, "total_steps": 17941, "loss": 1.5404, "learning_rate": 3.0296593779980177e-05, "epoch": 0.6352488713003734, "percentage": 63.52, "elapsed_time": "1 day, 2:58:50", "remaining_time": "15:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11398, "total_steps": 17941, "loss": 1.6664, "learning_rate": 3.028841037597639e-05, "epoch": 0.6353046095535366, "percentage": 63.53, "elapsed_time": "1 day, 2:58:59", "remaining_time": "15:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11399, "total_steps": 17941, "loss": 1.4491, "learning_rate": 3.0280227597109272e-05, "epoch": 0.6353603478066997, "percentage": 63.54, "elapsed_time": "1 day, 2:59:07", "remaining_time": "15:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11400, "total_steps": 17941, "loss": 1.7172, "learning_rate": 3.0272045443638386e-05, "epoch": 0.6354160860598629, "percentage": 63.54, "elapsed_time": "1 day, 2:59:16", "remaining_time": "15:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11401, "total_steps": 17941, "loss": 1.6882, "learning_rate": 3.0263863915823182e-05, "epoch": 0.6354718243130261, "percentage": 63.55, "elapsed_time": "1 day, 2:59:24", "remaining_time": "15:28:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11402, "total_steps": 17941, "loss": 1.5914, "learning_rate": 3.0255683013923154e-05, "epoch": 0.6355275625661891, "percentage": 63.55, "elapsed_time": "1 day, 2:59:33", "remaining_time": "15:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11403, "total_steps": 17941, "loss": 1.5801, "learning_rate": 3.0247502738197735e-05, "epoch": 0.6355833008193523, "percentage": 63.56, "elapsed_time": "1 day, 2:59:42", "remaining_time": "15:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11404, "total_steps": 17941, "loss": 1.6125, "learning_rate": 3.0239323088906357e-05, "epoch": 0.6356390390725155, "percentage": 63.56, "elapsed_time": "1 day, 2:59:51", "remaining_time": "15:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11405, "total_steps": 17941, "loss": 1.8681, "learning_rate": 3.0231144066308463e-05, "epoch": 0.6356947773256786, "percentage": 63.57, "elapsed_time": "1 day, 2:59:59", "remaining_time": "15:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11406, "total_steps": 17941, "loss": 1.6304, "learning_rate": 3.0222965670663394e-05, "epoch": 0.6357505155788418, "percentage": 63.58, "elapsed_time": "1 day, 3:00:08", "remaining_time": "15:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11407, "total_steps": 17941, "loss": 1.6737, "learning_rate": 3.021478790223057e-05, "epoch": 0.635806253832005, "percentage": 63.58, "elapsed_time": "1 day, 3:00:17", "remaining_time": "15:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11408, "total_steps": 17941, "loss": 1.3904, "learning_rate": 3.0206610761269293e-05, "epoch": 0.635861992085168, "percentage": 63.59, "elapsed_time": "1 day, 3:00:25", "remaining_time": "15:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11409, "total_steps": 17941, "loss": 1.5715, "learning_rate": 3.0198434248038933e-05, "epoch": 0.6359177303383312, "percentage": 63.59, "elapsed_time": "1 day, 3:00:34", "remaining_time": "15:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11410, "total_steps": 17941, "loss": 1.5383, "learning_rate": 3.0190258362798783e-05, "epoch": 0.6359734685914944, "percentage": 63.6, "elapsed_time": "1 day, 3:00:42", "remaining_time": "15:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11411, "total_steps": 17941, "loss": 1.4719, "learning_rate": 3.0182083105808134e-05, "epoch": 0.6360292068446575, "percentage": 63.6, "elapsed_time": "1 day, 3:00:50", "remaining_time": "15:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11412, "total_steps": 17941, "loss": 1.7294, "learning_rate": 3.017390847732628e-05, "epoch": 0.6360849450978207, "percentage": 63.61, "elapsed_time": "1 day, 3:00:59", "remaining_time": "15:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11413, "total_steps": 17941, "loss": 1.6529, "learning_rate": 3.016573447761244e-05, "epoch": 0.6361406833509837, "percentage": 63.61, "elapsed_time": "1 day, 3:01:07", "remaining_time": "15:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11414, "total_steps": 17941, "loss": 1.3404, "learning_rate": 3.015756110692587e-05, "epoch": 0.6361964216041469, "percentage": 63.62, "elapsed_time": "1 day, 3:01:16", "remaining_time": "15:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11415, "total_steps": 17941, "loss": 1.726, "learning_rate": 3.0149388365525756e-05, "epoch": 0.6362521598573101, "percentage": 63.63, "elapsed_time": "1 day, 3:01:24", "remaining_time": "15:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11416, "total_steps": 17941, "loss": 1.7075, "learning_rate": 3.0141216253671334e-05, "epoch": 0.6363078981104732, "percentage": 63.63, "elapsed_time": "1 day, 3:01:33", "remaining_time": "15:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11417, "total_steps": 17941, "loss": 1.4312, "learning_rate": 3.013304477162171e-05, "epoch": 0.6363636363636364, "percentage": 63.64, "elapsed_time": "1 day, 3:01:41", "remaining_time": "15:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11418, "total_steps": 17941, "loss": 1.6381, "learning_rate": 3.0124873919636098e-05, "epoch": 0.6364193746167995, "percentage": 63.64, "elapsed_time": "1 day, 3:01:50", "remaining_time": "15:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11419, "total_steps": 17941, "loss": 1.669, "learning_rate": 3.0116703697973604e-05, "epoch": 0.6364751128699626, "percentage": 63.65, "elapsed_time": "1 day, 3:01:58", "remaining_time": "15:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11420, "total_steps": 17941, "loss": 1.7477, "learning_rate": 3.0108534106893336e-05, "epoch": 0.6365308511231258, "percentage": 63.65, "elapsed_time": "1 day, 3:02:07", "remaining_time": "15:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11421, "total_steps": 17941, "loss": 1.6329, "learning_rate": 3.01003651466544e-05, "epoch": 0.636586589376289, "percentage": 63.66, "elapsed_time": "1 day, 3:02:16", "remaining_time": "15:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11422, "total_steps": 17941, "loss": 1.65, "learning_rate": 3.009219681751585e-05, "epoch": 0.636642327629452, "percentage": 63.66, "elapsed_time": "1 day, 3:02:24", "remaining_time": "15:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11423, "total_steps": 17941, "loss": 1.6053, "learning_rate": 3.008402911973675e-05, "epoch": 0.6366980658826152, "percentage": 63.67, "elapsed_time": "1 day, 3:02:33", "remaining_time": "15:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11424, "total_steps": 17941, "loss": 1.4455, "learning_rate": 3.0075862053576115e-05, "epoch": 0.6367538041357784, "percentage": 63.68, "elapsed_time": "1 day, 3:02:41", "remaining_time": "15:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11425, "total_steps": 17941, "loss": 1.6209, "learning_rate": 3.006769561929298e-05, "epoch": 0.6368095423889415, "percentage": 63.68, "elapsed_time": "1 day, 3:02:50", "remaining_time": "15:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11426, "total_steps": 17941, "loss": 1.5629, "learning_rate": 3.005952981714633e-05, "epoch": 0.6368652806421047, "percentage": 63.69, "elapsed_time": "1 day, 3:02:58", "remaining_time": "15:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11427, "total_steps": 17941, "loss": 1.6286, "learning_rate": 3.0051364647395132e-05, "epoch": 0.6369210188952679, "percentage": 63.69, "elapsed_time": "1 day, 3:03:07", "remaining_time": "15:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11428, "total_steps": 17941, "loss": 1.3619, "learning_rate": 3.004320011029834e-05, "epoch": 0.6369767571484309, "percentage": 63.7, "elapsed_time": "1 day, 3:03:15", "remaining_time": "15:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11429, "total_steps": 17941, "loss": 1.8033, "learning_rate": 3.003503620611488e-05, "epoch": 0.6370324954015941, "percentage": 63.7, "elapsed_time": "1 day, 3:03:23", "remaining_time": "15:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11430, "total_steps": 17941, "loss": 1.7917, "learning_rate": 3.0026872935103658e-05, "epoch": 0.6370882336547573, "percentage": 63.71, "elapsed_time": "1 day, 3:03:32", "remaining_time": "15:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11431, "total_steps": 17941, "loss": 1.5718, "learning_rate": 3.00187102975236e-05, "epoch": 0.6371439719079204, "percentage": 63.71, "elapsed_time": "1 day, 3:03:40", "remaining_time": "15:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11432, "total_steps": 17941, "loss": 1.6192, "learning_rate": 3.0010548293633527e-05, "epoch": 0.6371997101610836, "percentage": 63.72, "elapsed_time": "1 day, 3:03:49", "remaining_time": "15:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11433, "total_steps": 17941, "loss": 1.7251, "learning_rate": 3.0002386923692344e-05, "epoch": 0.6372554484142468, "percentage": 63.73, "elapsed_time": "1 day, 3:03:57", "remaining_time": "15:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11434, "total_steps": 17941, "loss": 1.6958, "learning_rate": 2.9994226187958823e-05, "epoch": 0.6373111866674098, "percentage": 63.73, "elapsed_time": "1 day, 3:04:06", "remaining_time": "15:24:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11435, "total_steps": 17941, "loss": 1.688, "learning_rate": 2.9986066086691828e-05, "epoch": 0.637366924920573, "percentage": 63.74, "elapsed_time": "1 day, 3:04:14", "remaining_time": "15:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11436, "total_steps": 17941, "loss": 1.4879, "learning_rate": 2.997790662015012e-05, "epoch": 0.6374226631737361, "percentage": 63.74, "elapsed_time": "1 day, 3:04:23", "remaining_time": "15:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11437, "total_steps": 17941, "loss": 1.7174, "learning_rate": 2.9969747788592472e-05, "epoch": 0.6374784014268993, "percentage": 63.75, "elapsed_time": "1 day, 3:04:31", "remaining_time": "15:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11438, "total_steps": 17941, "loss": 1.6473, "learning_rate": 2.996158959227765e-05, "epoch": 0.6375341396800625, "percentage": 63.75, "elapsed_time": "1 day, 3:04:40", "remaining_time": "15:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11439, "total_steps": 17941, "loss": 1.8093, "learning_rate": 2.995343203146436e-05, "epoch": 0.6375898779332255, "percentage": 63.76, "elapsed_time": "1 day, 3:04:48", "remaining_time": "15:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11440, "total_steps": 17941, "loss": 1.5227, "learning_rate": 2.994527510641134e-05, "epoch": 0.6376456161863887, "percentage": 63.76, "elapsed_time": "1 day, 3:04:56", "remaining_time": "15:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11441, "total_steps": 17941, "loss": 1.5738, "learning_rate": 2.993711881737725e-05, "epoch": 0.6377013544395519, "percentage": 63.77, "elapsed_time": "1 day, 3:05:05", "remaining_time": "15:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11442, "total_steps": 17941, "loss": 1.6712, "learning_rate": 2.9928963164620806e-05, "epoch": 0.637757092692715, "percentage": 63.78, "elapsed_time": "1 day, 3:05:13", "remaining_time": "15:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11443, "total_steps": 17941, "loss": 1.3923, "learning_rate": 2.992080814840059e-05, "epoch": 0.6378128309458782, "percentage": 63.78, "elapsed_time": "1 day, 3:05:22", "remaining_time": "15:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11444, "total_steps": 17941, "loss": 1.7614, "learning_rate": 2.991265376897529e-05, "epoch": 0.6378685691990413, "percentage": 63.79, "elapsed_time": "1 day, 3:05:30", "remaining_time": "15:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11445, "total_steps": 17941, "loss": 1.6199, "learning_rate": 2.99045000266035e-05, "epoch": 0.6379243074522044, "percentage": 63.79, "elapsed_time": "1 day, 3:05:39", "remaining_time": "15:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11446, "total_steps": 17941, "loss": 1.9717, "learning_rate": 2.9896346921543796e-05, "epoch": 0.6379800457053676, "percentage": 63.8, "elapsed_time": "1 day, 3:05:48", "remaining_time": "15:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11447, "total_steps": 17941, "loss": 1.7399, "learning_rate": 2.9888194454054762e-05, "epoch": 0.6380357839585308, "percentage": 63.8, "elapsed_time": "1 day, 3:05:57", "remaining_time": "15:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11448, "total_steps": 17941, "loss": 1.7467, "learning_rate": 2.988004262439493e-05, "epoch": 0.6380915222116939, "percentage": 63.81, "elapsed_time": "1 day, 3:06:05", "remaining_time": "15:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11449, "total_steps": 17941, "loss": 1.8546, "learning_rate": 2.9871891432822858e-05, "epoch": 0.638147260464857, "percentage": 63.81, "elapsed_time": "1 day, 3:06:13", "remaining_time": "15:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11450, "total_steps": 17941, "loss": 1.5476, "learning_rate": 2.9863740879597006e-05, "epoch": 0.6382029987180202, "percentage": 63.82, "elapsed_time": "1 day, 3:06:22", "remaining_time": "15:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11451, "total_steps": 17941, "loss": 1.5871, "learning_rate": 2.98555909649759e-05, "epoch": 0.6382587369711833, "percentage": 63.83, "elapsed_time": "1 day, 3:06:30", "remaining_time": "15:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11452, "total_steps": 17941, "loss": 1.592, "learning_rate": 2.9847441689218014e-05, "epoch": 0.6383144752243465, "percentage": 63.83, "elapsed_time": "1 day, 3:06:39", "remaining_time": "15:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11453, "total_steps": 17941, "loss": 1.4722, "learning_rate": 2.9839293052581767e-05, "epoch": 0.6383702134775097, "percentage": 63.84, "elapsed_time": "1 day, 3:06:47", "remaining_time": "15:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11454, "total_steps": 17941, "loss": 1.5706, "learning_rate": 2.983114505532561e-05, "epoch": 0.6384259517306727, "percentage": 63.84, "elapsed_time": "1 day, 3:06:56", "remaining_time": "15:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11455, "total_steps": 17941, "loss": 1.6502, "learning_rate": 2.9822997697707927e-05, "epoch": 0.6384816899838359, "percentage": 63.85, "elapsed_time": "1 day, 3:07:04", "remaining_time": "15:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11456, "total_steps": 17941, "loss": 1.7896, "learning_rate": 2.981485097998711e-05, "epoch": 0.6385374282369991, "percentage": 63.85, "elapsed_time": "1 day, 3:07:13", "remaining_time": "15:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11457, "total_steps": 17941, "loss": 1.5343, "learning_rate": 2.9806704902421555e-05, "epoch": 0.6385931664901622, "percentage": 63.86, "elapsed_time": "1 day, 3:07:21", "remaining_time": "15:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11458, "total_steps": 17941, "loss": 1.6853, "learning_rate": 2.9798559465269564e-05, "epoch": 0.6386489047433254, "percentage": 63.86, "elapsed_time": "1 day, 3:07:30", "remaining_time": "15:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11459, "total_steps": 17941, "loss": 1.3626, "learning_rate": 2.9790414668789514e-05, "epoch": 0.6387046429964884, "percentage": 63.87, "elapsed_time": "1 day, 3:07:39", "remaining_time": "15:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11460, "total_steps": 17941, "loss": 1.7424, "learning_rate": 2.978227051323965e-05, "epoch": 0.6387603812496516, "percentage": 63.88, "elapsed_time": "1 day, 3:07:47", "remaining_time": "15:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11461, "total_steps": 17941, "loss": 1.586, "learning_rate": 2.9774126998878305e-05, "epoch": 0.6388161195028148, "percentage": 63.88, "elapsed_time": "1 day, 3:07:56", "remaining_time": "15:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11462, "total_steps": 17941, "loss": 1.7159, "learning_rate": 2.976598412596372e-05, "epoch": 0.6388718577559779, "percentage": 63.89, "elapsed_time": "1 day, 3:08:04", "remaining_time": "15:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11463, "total_steps": 17941, "loss": 1.1537, "learning_rate": 2.975784189475414e-05, "epoch": 0.6389275960091411, "percentage": 63.89, "elapsed_time": "1 day, 3:08:13", "remaining_time": "15:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11464, "total_steps": 17941, "loss": 1.8564, "learning_rate": 2.974970030550781e-05, "epoch": 0.6389833342623042, "percentage": 63.9, "elapsed_time": "1 day, 3:08:22", "remaining_time": "15:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11465, "total_steps": 17941, "loss": 1.474, "learning_rate": 2.9741559358482908e-05, "epoch": 0.6390390725154673, "percentage": 63.9, "elapsed_time": "1 day, 3:08:30", "remaining_time": "15:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11466, "total_steps": 17941, "loss": 1.6722, "learning_rate": 2.973341905393764e-05, "epoch": 0.6390948107686305, "percentage": 63.91, "elapsed_time": "1 day, 3:08:39", "remaining_time": "15:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11467, "total_steps": 17941, "loss": 1.499, "learning_rate": 2.972527939213013e-05, "epoch": 0.6391505490217937, "percentage": 63.92, "elapsed_time": "1 day, 3:08:47", "remaining_time": "15:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11468, "total_steps": 17941, "loss": 1.7276, "learning_rate": 2.9717140373318587e-05, "epoch": 0.6392062872749568, "percentage": 63.92, "elapsed_time": "1 day, 3:08:56", "remaining_time": "15:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11469, "total_steps": 17941, "loss": 1.7654, "learning_rate": 2.9709001997761053e-05, "epoch": 0.63926202552812, "percentage": 63.93, "elapsed_time": "1 day, 3:09:04", "remaining_time": "15:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11470, "total_steps": 17941, "loss": 1.634, "learning_rate": 2.970086426571569e-05, "epoch": 0.6393177637812831, "percentage": 63.93, "elapsed_time": "1 day, 3:09:12", "remaining_time": "15:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11471, "total_steps": 17941, "loss": 1.6631, "learning_rate": 2.969272717744057e-05, "epoch": 0.6393735020344462, "percentage": 63.94, "elapsed_time": "1 day, 3:09:21", "remaining_time": "15:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11472, "total_steps": 17941, "loss": 1.9441, "learning_rate": 2.9684590733193728e-05, "epoch": 0.6394292402876094, "percentage": 63.94, "elapsed_time": "1 day, 3:09:29", "remaining_time": "15:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11473, "total_steps": 17941, "loss": 1.5584, "learning_rate": 2.9676454933233238e-05, "epoch": 0.6394849785407726, "percentage": 63.95, "elapsed_time": "1 day, 3:09:38", "remaining_time": "15:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11474, "total_steps": 17941, "loss": 1.6103, "learning_rate": 2.9668319777817088e-05, "epoch": 0.6395407167939356, "percentage": 63.95, "elapsed_time": "1 day, 3:09:46", "remaining_time": "15:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11475, "total_steps": 17941, "loss": 1.7739, "learning_rate": 2.966018526720331e-05, "epoch": 0.6395964550470988, "percentage": 63.96, "elapsed_time": "1 day, 3:09:55", "remaining_time": "15:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11476, "total_steps": 17941, "loss": 1.8033, "learning_rate": 2.965205140164984e-05, "epoch": 0.639652193300262, "percentage": 63.97, "elapsed_time": "1 day, 3:10:04", "remaining_time": "15:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11477, "total_steps": 17941, "loss": 1.5886, "learning_rate": 2.9643918181414676e-05, "epoch": 0.6397079315534251, "percentage": 63.97, "elapsed_time": "1 day, 3:10:13", "remaining_time": "15:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11478, "total_steps": 17941, "loss": 1.3883, "learning_rate": 2.963578560675575e-05, "epoch": 0.6397636698065883, "percentage": 63.98, "elapsed_time": "1 day, 3:10:21", "remaining_time": "15:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11479, "total_steps": 17941, "loss": 1.764, "learning_rate": 2.962765367793096e-05, "epoch": 0.6398194080597515, "percentage": 63.98, "elapsed_time": "1 day, 3:10:30", "remaining_time": "15:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11480, "total_steps": 17941, "loss": 1.2644, "learning_rate": 2.9619522395198228e-05, "epoch": 0.6398751463129145, "percentage": 63.99, "elapsed_time": "1 day, 3:10:38", "remaining_time": "15:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11481, "total_steps": 17941, "loss": 1.6284, "learning_rate": 2.9611391758815416e-05, "epoch": 0.6399308845660777, "percentage": 63.99, "elapsed_time": "1 day, 3:10:47", "remaining_time": "15:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11482, "total_steps": 17941, "loss": 1.5244, "learning_rate": 2.9603261769040368e-05, "epoch": 0.6399866228192408, "percentage": 64.0, "elapsed_time": "1 day, 3:10:55", "remaining_time": "15:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11483, "total_steps": 17941, "loss": 1.662, "learning_rate": 2.9595132426130968e-05, "epoch": 0.640042361072404, "percentage": 64.0, "elapsed_time": "1 day, 3:11:03", "remaining_time": "15:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11484, "total_steps": 17941, "loss": 1.7329, "learning_rate": 2.9587003730344965e-05, "epoch": 0.6400980993255672, "percentage": 64.01, "elapsed_time": "1 day, 3:11:12", "remaining_time": "15:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11485, "total_steps": 17941, "loss": 1.5648, "learning_rate": 2.9578875681940223e-05, "epoch": 0.6401538375787302, "percentage": 64.02, "elapsed_time": "1 day, 3:11:20", "remaining_time": "15:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11486, "total_steps": 17941, "loss": 1.639, "learning_rate": 2.9570748281174443e-05, "epoch": 0.6402095758318934, "percentage": 64.02, "elapsed_time": "1 day, 3:11:29", "remaining_time": "15:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11487, "total_steps": 17941, "loss": 1.5573, "learning_rate": 2.9562621528305445e-05, "epoch": 0.6402653140850566, "percentage": 64.03, "elapsed_time": "1 day, 3:11:37", "remaining_time": "15:16:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11488, "total_steps": 17941, "loss": 1.6015, "learning_rate": 2.9554495423590924e-05, "epoch": 0.6403210523382197, "percentage": 64.03, "elapsed_time": "1 day, 3:11:46", "remaining_time": "15:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11489, "total_steps": 17941, "loss": 1.6447, "learning_rate": 2.9546369967288594e-05, "epoch": 0.6403767905913829, "percentage": 64.04, "elapsed_time": "1 day, 3:11:54", "remaining_time": "15:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11490, "total_steps": 17941, "loss": 1.5088, "learning_rate": 2.9538245159656174e-05, "epoch": 0.640432528844546, "percentage": 64.04, "elapsed_time": "1 day, 3:12:03", "remaining_time": "15:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11491, "total_steps": 17941, "loss": 1.6811, "learning_rate": 2.9530121000951294e-05, "epoch": 0.6404882670977091, "percentage": 64.05, "elapsed_time": "1 day, 3:12:11", "remaining_time": "15:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11492, "total_steps": 17941, "loss": 1.5924, "learning_rate": 2.952199749143165e-05, "epoch": 0.6405440053508723, "percentage": 64.05, "elapsed_time": "1 day, 3:12:19", "remaining_time": "15:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11493, "total_steps": 17941, "loss": 1.5902, "learning_rate": 2.9513874631354833e-05, "epoch": 0.6405997436040355, "percentage": 64.06, "elapsed_time": "1 day, 3:12:28", "remaining_time": "15:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11494, "total_steps": 17941, "loss": 1.4045, "learning_rate": 2.9505752420978495e-05, "epoch": 0.6406554818571986, "percentage": 64.07, "elapsed_time": "1 day, 3:12:36", "remaining_time": "15:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11495, "total_steps": 17941, "loss": 1.4327, "learning_rate": 2.9497630860560178e-05, "epoch": 0.6407112201103617, "percentage": 64.07, "elapsed_time": "1 day, 3:12:45", "remaining_time": "15:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11496, "total_steps": 17941, "loss": 1.5244, "learning_rate": 2.9489509950357476e-05, "epoch": 0.6407669583635249, "percentage": 64.08, "elapsed_time": "1 day, 3:12:53", "remaining_time": "15:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11497, "total_steps": 17941, "loss": 1.7219, "learning_rate": 2.9481389690627943e-05, "epoch": 0.640822696616688, "percentage": 64.08, "elapsed_time": "1 day, 3:13:02", "remaining_time": "15:15:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11498, "total_steps": 17941, "loss": 1.5458, "learning_rate": 2.947327008162909e-05, "epoch": 0.6408784348698512, "percentage": 64.09, "elapsed_time": "1 day, 3:13:10", "remaining_time": "15:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11499, "total_steps": 17941, "loss": 1.8704, "learning_rate": 2.946515112361844e-05, "epoch": 0.6409341731230144, "percentage": 64.09, "elapsed_time": "1 day, 3:13:19", "remaining_time": "15:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11500, "total_steps": 17941, "loss": 1.6822, "learning_rate": 2.945703281685346e-05, "epoch": 0.6409899113761774, "percentage": 64.1, "elapsed_time": "1 day, 3:13:27", "remaining_time": "15:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11501, "total_steps": 17941, "loss": 1.7695, "learning_rate": 2.944891516159163e-05, "epoch": 0.6410456496293406, "percentage": 64.1, "elapsed_time": "1 day, 3:13:36", "remaining_time": "15:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11502, "total_steps": 17941, "loss": 1.4151, "learning_rate": 2.9440798158090377e-05, "epoch": 0.6411013878825038, "percentage": 64.11, "elapsed_time": "1 day, 3:13:44", "remaining_time": "15:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11503, "total_steps": 17941, "loss": 1.7826, "learning_rate": 2.9432681806607143e-05, "epoch": 0.6411571261356669, "percentage": 64.12, "elapsed_time": "1 day, 3:13:53", "remaining_time": "15:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11504, "total_steps": 17941, "loss": 1.6817, "learning_rate": 2.9424566107399342e-05, "epoch": 0.6412128643888301, "percentage": 64.12, "elapsed_time": "1 day, 3:14:02", "remaining_time": "15:14:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11505, "total_steps": 17941, "loss": 1.7257, "learning_rate": 2.9416451060724325e-05, "epoch": 0.6412686026419931, "percentage": 64.13, "elapsed_time": "1 day, 3:14:10", "remaining_time": "15:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11506, "total_steps": 17941, "loss": 1.5757, "learning_rate": 2.9408336666839488e-05, "epoch": 0.6413243408951563, "percentage": 64.13, "elapsed_time": "1 day, 3:14:18", "remaining_time": "15:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11507, "total_steps": 17941, "loss": 1.8345, "learning_rate": 2.940022292600213e-05, "epoch": 0.6413800791483195, "percentage": 64.14, "elapsed_time": "1 day, 3:14:27", "remaining_time": "15:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11508, "total_steps": 17941, "loss": 1.7728, "learning_rate": 2.9392109838469594e-05, "epoch": 0.6414358174014826, "percentage": 64.14, "elapsed_time": "1 day, 3:14:35", "remaining_time": "15:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11509, "total_steps": 17941, "loss": 1.4375, "learning_rate": 2.938399740449922e-05, "epoch": 0.6414915556546458, "percentage": 64.15, "elapsed_time": "1 day, 3:14:44", "remaining_time": "15:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11510, "total_steps": 17941, "loss": 1.6464, "learning_rate": 2.937588562434821e-05, "epoch": 0.641547293907809, "percentage": 64.15, "elapsed_time": "1 day, 3:14:52", "remaining_time": "15:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11511, "total_steps": 17941, "loss": 1.8679, "learning_rate": 2.936777449827388e-05, "epoch": 0.641603032160972, "percentage": 64.16, "elapsed_time": "1 day, 3:15:01", "remaining_time": "15:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11512, "total_steps": 17941, "loss": 1.8918, "learning_rate": 2.935966402653344e-05, "epoch": 0.6416587704141352, "percentage": 64.17, "elapsed_time": "1 day, 3:15:10", "remaining_time": "15:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11513, "total_steps": 17941, "loss": 1.6716, "learning_rate": 2.9351554209384125e-05, "epoch": 0.6417145086672984, "percentage": 64.17, "elapsed_time": "1 day, 3:15:19", "remaining_time": "15:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11514, "total_steps": 17941, "loss": 1.7824, "learning_rate": 2.9343445047083117e-05, "epoch": 0.6417702469204615, "percentage": 64.18, "elapsed_time": "1 day, 3:15:27", "remaining_time": "15:12:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11515, "total_steps": 17941, "loss": 1.557, "learning_rate": 2.933533653988759e-05, "epoch": 0.6418259851736247, "percentage": 64.18, "elapsed_time": "1 day, 3:15:36", "remaining_time": "15:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11516, "total_steps": 17941, "loss": 1.498, "learning_rate": 2.932722868805472e-05, "epoch": 0.6418817234267878, "percentage": 64.19, "elapsed_time": "1 day, 3:15:44", "remaining_time": "15:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11517, "total_steps": 17941, "loss": 1.628, "learning_rate": 2.93191214918416e-05, "epoch": 0.6419374616799509, "percentage": 64.19, "elapsed_time": "1 day, 3:15:52", "remaining_time": "15:12:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11518, "total_steps": 17941, "loss": 1.5985, "learning_rate": 2.93110149515054e-05, "epoch": 0.6419931999331141, "percentage": 64.2, "elapsed_time": "1 day, 3:16:01", "remaining_time": "15:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11519, "total_steps": 17941, "loss": 1.5679, "learning_rate": 2.9302909067303152e-05, "epoch": 0.6420489381862773, "percentage": 64.2, "elapsed_time": "1 day, 3:16:09", "remaining_time": "15:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11520, "total_steps": 17941, "loss": 1.8117, "learning_rate": 2.929480383949198e-05, "epoch": 0.6421046764394404, "percentage": 64.21, "elapsed_time": "1 day, 3:16:18", "remaining_time": "15:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11521, "total_steps": 17941, "loss": 1.6363, "learning_rate": 2.9286699268328887e-05, "epoch": 0.6421604146926035, "percentage": 64.22, "elapsed_time": "1 day, 3:16:26", "remaining_time": "15:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11522, "total_steps": 17941, "loss": 1.7658, "learning_rate": 2.9278595354070937e-05, "epoch": 0.6422161529457667, "percentage": 64.22, "elapsed_time": "1 day, 3:16:35", "remaining_time": "15:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11523, "total_steps": 17941, "loss": 1.4656, "learning_rate": 2.9270492096975134e-05, "epoch": 0.6422718911989298, "percentage": 64.23, "elapsed_time": "1 day, 3:16:43", "remaining_time": "15:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11524, "total_steps": 17941, "loss": 1.5639, "learning_rate": 2.9262389497298454e-05, "epoch": 0.642327629452093, "percentage": 64.23, "elapsed_time": "1 day, 3:16:52", "remaining_time": "15:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11525, "total_steps": 17941, "loss": 1.9102, "learning_rate": 2.9254287555297876e-05, "epoch": 0.6423833677052562, "percentage": 64.24, "elapsed_time": "1 day, 3:17:00", "remaining_time": "15:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11526, "total_steps": 17941, "loss": 1.72, "learning_rate": 2.9246186271230337e-05, "epoch": 0.6424391059584192, "percentage": 64.24, "elapsed_time": "1 day, 3:17:09", "remaining_time": "15:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11527, "total_steps": 17941, "loss": 1.729, "learning_rate": 2.9238085645352776e-05, "epoch": 0.6424948442115824, "percentage": 64.25, "elapsed_time": "1 day, 3:17:17", "remaining_time": "15:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11528, "total_steps": 17941, "loss": 1.6568, "learning_rate": 2.9229985677922062e-05, "epoch": 0.6425505824647455, "percentage": 64.26, "elapsed_time": "1 day, 3:17:26", "remaining_time": "15:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11529, "total_steps": 17941, "loss": 1.4062, "learning_rate": 2.9221886369195116e-05, "epoch": 0.6426063207179087, "percentage": 64.26, "elapsed_time": "1 day, 3:17:34", "remaining_time": "15:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11530, "total_steps": 17941, "loss": 1.5071, "learning_rate": 2.9213787719428805e-05, "epoch": 0.6426620589710719, "percentage": 64.27, "elapsed_time": "1 day, 3:17:42", "remaining_time": "15:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11531, "total_steps": 17941, "loss": 1.572, "learning_rate": 2.9205689728879936e-05, "epoch": 0.6427177972242349, "percentage": 64.27, "elapsed_time": "1 day, 3:17:51", "remaining_time": "15:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11532, "total_steps": 17941, "loss": 1.3922, "learning_rate": 2.919759239780537e-05, "epoch": 0.6427735354773981, "percentage": 64.28, "elapsed_time": "1 day, 3:17:59", "remaining_time": "15:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11533, "total_steps": 17941, "loss": 1.6264, "learning_rate": 2.9189495726461868e-05, "epoch": 0.6428292737305613, "percentage": 64.28, "elapsed_time": "1 day, 3:18:08", "remaining_time": "15:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11534, "total_steps": 17941, "loss": 1.4878, "learning_rate": 2.918139971510624e-05, "epoch": 0.6428850119837244, "percentage": 64.29, "elapsed_time": "1 day, 3:18:16", "remaining_time": "15:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11535, "total_steps": 17941, "loss": 1.6821, "learning_rate": 2.917330436399522e-05, "epoch": 0.6429407502368876, "percentage": 64.29, "elapsed_time": "1 day, 3:18:25", "remaining_time": "15:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11536, "total_steps": 17941, "loss": 1.8271, "learning_rate": 2.9165209673385563e-05, "epoch": 0.6429964884900508, "percentage": 64.3, "elapsed_time": "1 day, 3:18:33", "remaining_time": "15:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11537, "total_steps": 17941, "loss": 1.4832, "learning_rate": 2.9157115643533993e-05, "epoch": 0.6430522267432138, "percentage": 64.31, "elapsed_time": "1 day, 3:18:42", "remaining_time": "15:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11538, "total_steps": 17941, "loss": 1.5079, "learning_rate": 2.914902227469718e-05, "epoch": 0.643107964996377, "percentage": 64.31, "elapsed_time": "1 day, 3:18:50", "remaining_time": "15:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11539, "total_steps": 17941, "loss": 1.5945, "learning_rate": 2.9140929567131815e-05, "epoch": 0.6431637032495402, "percentage": 64.32, "elapsed_time": "1 day, 3:18:58", "remaining_time": "15:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11540, "total_steps": 17941, "loss": 1.598, "learning_rate": 2.9132837521094535e-05, "epoch": 0.6432194415027033, "percentage": 64.32, "elapsed_time": "1 day, 3:19:07", "remaining_time": "15:09:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11541, "total_steps": 17941, "loss": 1.6551, "learning_rate": 2.9124746136841996e-05, "epoch": 0.6432751797558665, "percentage": 64.33, "elapsed_time": "1 day, 3:19:15", "remaining_time": "15:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11542, "total_steps": 17941, "loss": 1.5584, "learning_rate": 2.911665541463079e-05, "epoch": 0.6433309180090296, "percentage": 64.33, "elapsed_time": "1 day, 3:19:24", "remaining_time": "15:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11543, "total_steps": 17941, "loss": 1.7545, "learning_rate": 2.9108565354717522e-05, "epoch": 0.6433866562621927, "percentage": 64.34, "elapsed_time": "1 day, 3:19:32", "remaining_time": "15:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11544, "total_steps": 17941, "loss": 1.5668, "learning_rate": 2.910047595735877e-05, "epoch": 0.6434423945153559, "percentage": 64.34, "elapsed_time": "1 day, 3:19:41", "remaining_time": "15:08:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11545, "total_steps": 17941, "loss": 1.7969, "learning_rate": 2.9092387222811045e-05, "epoch": 0.6434981327685191, "percentage": 64.35, "elapsed_time": "1 day, 3:19:49", "remaining_time": "15:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11546, "total_steps": 17941, "loss": 1.7327, "learning_rate": 2.9084299151330906e-05, "epoch": 0.6435538710216822, "percentage": 64.36, "elapsed_time": "1 day, 3:19:58", "remaining_time": "15:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11547, "total_steps": 17941, "loss": 1.7837, "learning_rate": 2.9076211743174854e-05, "epoch": 0.6436096092748453, "percentage": 64.36, "elapsed_time": "1 day, 3:20:06", "remaining_time": "15:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11548, "total_steps": 17941, "loss": 1.6744, "learning_rate": 2.9068124998599362e-05, "epoch": 0.6436653475280085, "percentage": 64.37, "elapsed_time": "1 day, 3:20:15", "remaining_time": "15:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11549, "total_steps": 17941, "loss": 1.6584, "learning_rate": 2.9060038917860928e-05, "epoch": 0.6437210857811716, "percentage": 64.37, "elapsed_time": "1 day, 3:20:23", "remaining_time": "15:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11550, "total_steps": 17941, "loss": 1.6557, "learning_rate": 2.9051953501215928e-05, "epoch": 0.6437768240343348, "percentage": 64.38, "elapsed_time": "1 day, 3:20:32", "remaining_time": "15:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11551, "total_steps": 17941, "loss": 1.7061, "learning_rate": 2.9043868748920868e-05, "epoch": 0.6438325622874979, "percentage": 64.38, "elapsed_time": "1 day, 3:20:40", "remaining_time": "15:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11552, "total_steps": 17941, "loss": 1.7217, "learning_rate": 2.903578466123209e-05, "epoch": 0.643888300540661, "percentage": 64.39, "elapsed_time": "1 day, 3:20:48", "remaining_time": "15:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11553, "total_steps": 17941, "loss": 1.6482, "learning_rate": 2.902770123840599e-05, "epoch": 0.6439440387938242, "percentage": 64.39, "elapsed_time": "1 day, 3:20:57", "remaining_time": "15:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11554, "total_steps": 17941, "loss": 1.5762, "learning_rate": 2.901961848069894e-05, "epoch": 0.6439997770469873, "percentage": 64.4, "elapsed_time": "1 day, 3:21:05", "remaining_time": "15:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11555, "total_steps": 17941, "loss": 1.5193, "learning_rate": 2.9011536388367256e-05, "epoch": 0.6440555153001505, "percentage": 64.41, "elapsed_time": "1 day, 3:21:14", "remaining_time": "15:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11556, "total_steps": 17941, "loss": 1.6022, "learning_rate": 2.900345496166729e-05, "epoch": 0.6441112535533137, "percentage": 64.41, "elapsed_time": "1 day, 3:21:22", "remaining_time": "15:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11557, "total_steps": 17941, "loss": 1.748, "learning_rate": 2.8995374200855275e-05, "epoch": 0.6441669918064767, "percentage": 64.42, "elapsed_time": "1 day, 3:21:31", "remaining_time": "15:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11558, "total_steps": 17941, "loss": 1.4763, "learning_rate": 2.8987294106187567e-05, "epoch": 0.6442227300596399, "percentage": 64.42, "elapsed_time": "1 day, 3:21:39", "remaining_time": "15:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11559, "total_steps": 17941, "loss": 1.6101, "learning_rate": 2.8979214677920353e-05, "epoch": 0.6442784683128031, "percentage": 64.43, "elapsed_time": "1 day, 3:21:48", "remaining_time": "15:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11560, "total_steps": 17941, "loss": 1.7446, "learning_rate": 2.8971135916309895e-05, "epoch": 0.6443342065659662, "percentage": 64.43, "elapsed_time": "1 day, 3:21:56", "remaining_time": "15:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11561, "total_steps": 17941, "loss": 1.8012, "learning_rate": 2.8963057821612394e-05, "epoch": 0.6443899448191294, "percentage": 64.44, "elapsed_time": "1 day, 3:22:04", "remaining_time": "15:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11562, "total_steps": 17941, "loss": 1.4746, "learning_rate": 2.8954980394084046e-05, "epoch": 0.6444456830722926, "percentage": 64.44, "elapsed_time": "1 day, 3:22:13", "remaining_time": "15:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11563, "total_steps": 17941, "loss": 1.5389, "learning_rate": 2.8946903633981038e-05, "epoch": 0.6445014213254556, "percentage": 64.45, "elapsed_time": "1 day, 3:22:22", "remaining_time": "15:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11564, "total_steps": 17941, "loss": 1.9017, "learning_rate": 2.8938827541559482e-05, "epoch": 0.6445571595786188, "percentage": 64.46, "elapsed_time": "1 day, 3:22:30", "remaining_time": "15:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11565, "total_steps": 17941, "loss": 1.668, "learning_rate": 2.893075211707552e-05, "epoch": 0.644612897831782, "percentage": 64.46, "elapsed_time": "1 day, 3:22:39", "remaining_time": "15:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11566, "total_steps": 17941, "loss": 1.9912, "learning_rate": 2.8922677360785255e-05, "epoch": 0.6446686360849451, "percentage": 64.47, "elapsed_time": "1 day, 3:22:47", "remaining_time": "15:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11567, "total_steps": 17941, "loss": 1.4963, "learning_rate": 2.8914603272944784e-05, "epoch": 0.6447243743381083, "percentage": 64.47, "elapsed_time": "1 day, 3:22:55", "remaining_time": "15:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11568, "total_steps": 17941, "loss": 1.6432, "learning_rate": 2.890652985381015e-05, "epoch": 0.6447801125912714, "percentage": 64.48, "elapsed_time": "1 day, 3:23:05", "remaining_time": "15:05:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11569, "total_steps": 17941, "loss": 1.65, "learning_rate": 2.8898457103637412e-05, "epoch": 0.6448358508444345, "percentage": 64.48, "elapsed_time": "1 day, 3:23:13", "remaining_time": "15:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11570, "total_steps": 17941, "loss": 1.6351, "learning_rate": 2.8890385022682603e-05, "epoch": 0.6448915890975977, "percentage": 64.49, "elapsed_time": "1 day, 3:23:22", "remaining_time": "15:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11571, "total_steps": 17941, "loss": 2.0205, "learning_rate": 2.8882313611201684e-05, "epoch": 0.6449473273507609, "percentage": 64.49, "elapsed_time": "1 day, 3:23:30", "remaining_time": "15:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11572, "total_steps": 17941, "loss": 1.8547, "learning_rate": 2.887424286945065e-05, "epoch": 0.645003065603924, "percentage": 64.5, "elapsed_time": "1 day, 3:23:39", "remaining_time": "15:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11573, "total_steps": 17941, "loss": 1.733, "learning_rate": 2.8866172797685463e-05, "epoch": 0.6450588038570871, "percentage": 64.51, "elapsed_time": "1 day, 3:23:47", "remaining_time": "15:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11574, "total_steps": 17941, "loss": 1.7774, "learning_rate": 2.8858103396162055e-05, "epoch": 0.6451145421102502, "percentage": 64.51, "elapsed_time": "1 day, 3:23:56", "remaining_time": "15:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11575, "total_steps": 17941, "loss": 1.4179, "learning_rate": 2.8850034665136345e-05, "epoch": 0.6451702803634134, "percentage": 64.52, "elapsed_time": "1 day, 3:24:04", "remaining_time": "15:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11576, "total_steps": 17941, "loss": 1.7132, "learning_rate": 2.8841966604864218e-05, "epoch": 0.6452260186165766, "percentage": 64.52, "elapsed_time": "1 day, 3:24:13", "remaining_time": "15:04:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11577, "total_steps": 17941, "loss": 1.6576, "learning_rate": 2.8833899215601567e-05, "epoch": 0.6452817568697397, "percentage": 64.53, "elapsed_time": "1 day, 3:24:21", "remaining_time": "15:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11578, "total_steps": 17941, "loss": 1.5273, "learning_rate": 2.8825832497604215e-05, "epoch": 0.6453374951229028, "percentage": 64.53, "elapsed_time": "1 day, 3:24:29", "remaining_time": "15:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11579, "total_steps": 17941, "loss": 1.3098, "learning_rate": 2.8817766451127997e-05, "epoch": 0.645393233376066, "percentage": 64.54, "elapsed_time": "1 day, 3:24:38", "remaining_time": "15:03:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11580, "total_steps": 17941, "loss": 1.7311, "learning_rate": 2.880970107642873e-05, "epoch": 0.6454489716292291, "percentage": 64.54, "elapsed_time": "1 day, 3:24:46", "remaining_time": "15:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11581, "total_steps": 17941, "loss": 1.5223, "learning_rate": 2.8801636373762193e-05, "epoch": 0.6455047098823923, "percentage": 64.55, "elapsed_time": "1 day, 3:24:55", "remaining_time": "15:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11582, "total_steps": 17941, "loss": 1.7109, "learning_rate": 2.879357234338418e-05, "epoch": 0.6455604481355555, "percentage": 64.56, "elapsed_time": "1 day, 3:25:03", "remaining_time": "15:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11583, "total_steps": 17941, "loss": 1.811, "learning_rate": 2.878550898555036e-05, "epoch": 0.6456161863887185, "percentage": 64.56, "elapsed_time": "1 day, 3:25:12", "remaining_time": "15:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11584, "total_steps": 17941, "loss": 1.6823, "learning_rate": 2.8777446300516552e-05, "epoch": 0.6456719246418817, "percentage": 64.57, "elapsed_time": "1 day, 3:25:20", "remaining_time": "15:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11585, "total_steps": 17941, "loss": 1.576, "learning_rate": 2.876938428853839e-05, "epoch": 0.6457276628950449, "percentage": 64.57, "elapsed_time": "1 day, 3:25:29", "remaining_time": "15:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11586, "total_steps": 17941, "loss": 1.6211, "learning_rate": 2.8761322949871582e-05, "epoch": 0.645783401148208, "percentage": 64.58, "elapsed_time": "1 day, 3:25:37", "remaining_time": "15:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11587, "total_steps": 17941, "loss": 1.8955, "learning_rate": 2.8753262284771776e-05, "epoch": 0.6458391394013712, "percentage": 64.58, "elapsed_time": "1 day, 3:25:46", "remaining_time": "15:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11588, "total_steps": 17941, "loss": 1.6045, "learning_rate": 2.874520229349461e-05, "epoch": 0.6458948776545343, "percentage": 64.59, "elapsed_time": "1 day, 3:25:55", "remaining_time": "15:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11589, "total_steps": 17941, "loss": 1.3921, "learning_rate": 2.8737142976295723e-05, "epoch": 0.6459506159076974, "percentage": 64.6, "elapsed_time": "1 day, 3:26:03", "remaining_time": "15:02:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11590, "total_steps": 17941, "loss": 1.6893, "learning_rate": 2.8729084333430673e-05, "epoch": 0.6460063541608606, "percentage": 64.6, "elapsed_time": "1 day, 3:26:12", "remaining_time": "15:02:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11591, "total_steps": 17941, "loss": 1.6962, "learning_rate": 2.8721026365155046e-05, "epoch": 0.6460620924140238, "percentage": 64.61, "elapsed_time": "1 day, 3:26:20", "remaining_time": "15:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11592, "total_steps": 17941, "loss": 1.5756, "learning_rate": 2.8712969071724405e-05, "epoch": 0.6461178306671869, "percentage": 64.61, "elapsed_time": "1 day, 3:26:29", "remaining_time": "15:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11593, "total_steps": 17941, "loss": 1.5104, "learning_rate": 2.8704912453394266e-05, "epoch": 0.64617356892035, "percentage": 64.62, "elapsed_time": "1 day, 3:26:37", "remaining_time": "15:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11594, "total_steps": 17941, "loss": 1.6283, "learning_rate": 2.8696856510420146e-05, "epoch": 0.6462293071735132, "percentage": 64.62, "elapsed_time": "1 day, 3:26:46", "remaining_time": "15:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11595, "total_steps": 17941, "loss": 1.7311, "learning_rate": 2.8688801243057532e-05, "epoch": 0.6462850454266763, "percentage": 64.63, "elapsed_time": "1 day, 3:26:54", "remaining_time": "15:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11596, "total_steps": 17941, "loss": 1.695, "learning_rate": 2.868074665156191e-05, "epoch": 0.6463407836798395, "percentage": 64.63, "elapsed_time": "1 day, 3:27:03", "remaining_time": "15:01:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11597, "total_steps": 17941, "loss": 1.6918, "learning_rate": 2.867269273618869e-05, "epoch": 0.6463965219330026, "percentage": 64.64, "elapsed_time": "1 day, 3:27:12", "remaining_time": "15:01:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11598, "total_steps": 17941, "loss": 1.865, "learning_rate": 2.8664639497193303e-05, "epoch": 0.6464522601861658, "percentage": 64.65, "elapsed_time": "1 day, 3:27:20", "remaining_time": "15:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11599, "total_steps": 17941, "loss": 1.5144, "learning_rate": 2.865658693483116e-05, "epoch": 0.6465079984393289, "percentage": 64.65, "elapsed_time": "1 day, 3:27:29", "remaining_time": "15:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11600, "total_steps": 17941, "loss": 1.5973, "learning_rate": 2.8648535049357637e-05, "epoch": 0.646563736692492, "percentage": 64.66, "elapsed_time": "1 day, 3:27:37", "remaining_time": "15:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11601, "total_steps": 17941, "loss": 1.763, "learning_rate": 2.86404838410281e-05, "epoch": 0.6466194749456552, "percentage": 64.66, "elapsed_time": "1 day, 3:27:46", "remaining_time": "15:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11602, "total_steps": 17941, "loss": 1.5489, "learning_rate": 2.863243331009787e-05, "epoch": 0.6466752131988184, "percentage": 64.67, "elapsed_time": "1 day, 3:27:54", "remaining_time": "15:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11603, "total_steps": 17941, "loss": 1.8196, "learning_rate": 2.86243834568223e-05, "epoch": 0.6467309514519815, "percentage": 64.67, "elapsed_time": "1 day, 3:28:03", "remaining_time": "15:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11604, "total_steps": 17941, "loss": 1.7187, "learning_rate": 2.8616334281456643e-05, "epoch": 0.6467866897051446, "percentage": 64.68, "elapsed_time": "1 day, 3:28:11", "remaining_time": "15:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11605, "total_steps": 17941, "loss": 1.6422, "learning_rate": 2.8608285784256182e-05, "epoch": 0.6468424279583078, "percentage": 64.68, "elapsed_time": "1 day, 3:28:20", "remaining_time": "14:59:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11606, "total_steps": 17941, "loss": 1.6867, "learning_rate": 2.8600237965476172e-05, "epoch": 0.6468981662114709, "percentage": 64.69, "elapsed_time": "1 day, 3:28:28", "remaining_time": "14:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11607, "total_steps": 17941, "loss": 1.561, "learning_rate": 2.8592190825371845e-05, "epoch": 0.6469539044646341, "percentage": 64.7, "elapsed_time": "1 day, 3:28:36", "remaining_time": "14:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11608, "total_steps": 17941, "loss": 1.7218, "learning_rate": 2.8584144364198428e-05, "epoch": 0.6470096427177973, "percentage": 64.7, "elapsed_time": "1 day, 3:28:45", "remaining_time": "14:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11609, "total_steps": 17941, "loss": 1.5977, "learning_rate": 2.8576098582211054e-05, "epoch": 0.6470653809709603, "percentage": 64.71, "elapsed_time": "1 day, 3:28:53", "remaining_time": "14:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11610, "total_steps": 17941, "loss": 1.6856, "learning_rate": 2.856805347966496e-05, "epoch": 0.6471211192241235, "percentage": 64.71, "elapsed_time": "1 day, 3:29:02", "remaining_time": "14:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11611, "total_steps": 17941, "loss": 1.6719, "learning_rate": 2.8560009056815235e-05, "epoch": 0.6471768574772867, "percentage": 64.72, "elapsed_time": "1 day, 3:29:10", "remaining_time": "14:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11612, "total_steps": 17941, "loss": 1.5255, "learning_rate": 2.855196531391702e-05, "epoch": 0.6472325957304498, "percentage": 64.72, "elapsed_time": "1 day, 3:29:19", "remaining_time": "14:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11613, "total_steps": 17941, "loss": 1.543, "learning_rate": 2.8543922251225408e-05, "epoch": 0.647288333983613, "percentage": 64.73, "elapsed_time": "1 day, 3:29:27", "remaining_time": "14:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11614, "total_steps": 17941, "loss": 1.9824, "learning_rate": 2.8535879868995487e-05, "epoch": 0.6473440722367761, "percentage": 64.73, "elapsed_time": "1 day, 3:29:36", "remaining_time": "14:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11615, "total_steps": 17941, "loss": 1.9843, "learning_rate": 2.8527838167482336e-05, "epoch": 0.6473998104899392, "percentage": 64.74, "elapsed_time": "1 day, 3:29:44", "remaining_time": "14:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11616, "total_steps": 17941, "loss": 1.6633, "learning_rate": 2.851979714694094e-05, "epoch": 0.6474555487431024, "percentage": 64.75, "elapsed_time": "1 day, 3:29:53", "remaining_time": "14:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11617, "total_steps": 17941, "loss": 1.7438, "learning_rate": 2.8511756807626345e-05, "epoch": 0.6475112869962656, "percentage": 64.75, "elapsed_time": "1 day, 3:30:01", "remaining_time": "14:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11618, "total_steps": 17941, "loss": 1.4934, "learning_rate": 2.850371714979354e-05, "epoch": 0.6475670252494287, "percentage": 64.76, "elapsed_time": "1 day, 3:30:10", "remaining_time": "14:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11619, "total_steps": 17941, "loss": 1.7621, "learning_rate": 2.8495678173697494e-05, "epoch": 0.6476227635025918, "percentage": 64.76, "elapsed_time": "1 day, 3:30:18", "remaining_time": "14:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11620, "total_steps": 17941, "loss": 1.6058, "learning_rate": 2.8487639879593153e-05, "epoch": 0.6476785017557549, "percentage": 64.77, "elapsed_time": "1 day, 3:30:26", "remaining_time": "14:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11621, "total_steps": 17941, "loss": 1.8631, "learning_rate": 2.847960226773545e-05, "epoch": 0.6477342400089181, "percentage": 64.77, "elapsed_time": "1 day, 3:30:35", "remaining_time": "14:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11622, "total_steps": 17941, "loss": 1.5498, "learning_rate": 2.8471565338379313e-05, "epoch": 0.6477899782620813, "percentage": 64.78, "elapsed_time": "1 day, 3:30:43", "remaining_time": "14:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11623, "total_steps": 17941, "loss": 1.5045, "learning_rate": 2.8463529091779583e-05, "epoch": 0.6478457165152444, "percentage": 64.78, "elapsed_time": "1 day, 3:30:52", "remaining_time": "14:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11624, "total_steps": 17941, "loss": 1.606, "learning_rate": 2.8455493528191145e-05, "epoch": 0.6479014547684075, "percentage": 64.79, "elapsed_time": "1 day, 3:31:00", "remaining_time": "14:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11625, "total_steps": 17941, "loss": 1.7629, "learning_rate": 2.844745864786884e-05, "epoch": 0.6479571930215707, "percentage": 64.8, "elapsed_time": "1 day, 3:31:09", "remaining_time": "14:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11626, "total_steps": 17941, "loss": 1.644, "learning_rate": 2.8439424451067487e-05, "epoch": 0.6480129312747338, "percentage": 64.8, "elapsed_time": "1 day, 3:31:17", "remaining_time": "14:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11627, "total_steps": 17941, "loss": 1.6939, "learning_rate": 2.843139093804188e-05, "epoch": 0.648068669527897, "percentage": 64.81, "elapsed_time": "1 day, 3:31:26", "remaining_time": "14:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11628, "total_steps": 17941, "loss": 1.7068, "learning_rate": 2.8423358109046806e-05, "epoch": 0.6481244077810602, "percentage": 64.81, "elapsed_time": "1 day, 3:31:34", "remaining_time": "14:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11629, "total_steps": 17941, "loss": 1.6281, "learning_rate": 2.8415325964337026e-05, "epoch": 0.6481801460342232, "percentage": 64.82, "elapsed_time": "1 day, 3:31:42", "remaining_time": "14:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11630, "total_steps": 17941, "loss": 1.4476, "learning_rate": 2.8407294504167236e-05, "epoch": 0.6482358842873864, "percentage": 64.82, "elapsed_time": "1 day, 3:31:51", "remaining_time": "14:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11631, "total_steps": 17941, "loss": 1.7469, "learning_rate": 2.839926372879218e-05, "epoch": 0.6482916225405496, "percentage": 64.83, "elapsed_time": "1 day, 3:32:00", "remaining_time": "14:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11632, "total_steps": 17941, "loss": 1.635, "learning_rate": 2.839123363846653e-05, "epoch": 0.6483473607937127, "percentage": 64.83, "elapsed_time": "1 day, 3:32:08", "remaining_time": "14:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11633, "total_steps": 17941, "loss": 1.6089, "learning_rate": 2.838320423344496e-05, "epoch": 0.6484030990468759, "percentage": 64.84, "elapsed_time": "1 day, 3:32:17", "remaining_time": "14:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11634, "total_steps": 17941, "loss": 1.6684, "learning_rate": 2.8375175513982144e-05, "epoch": 0.6484588373000391, "percentage": 64.85, "elapsed_time": "1 day, 3:32:25", "remaining_time": "14:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11635, "total_steps": 17941, "loss": 1.6369, "learning_rate": 2.8367147480332635e-05, "epoch": 0.6485145755532021, "percentage": 64.85, "elapsed_time": "1 day, 3:32:34", "remaining_time": "14:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11636, "total_steps": 17941, "loss": 1.7348, "learning_rate": 2.8359120132751116e-05, "epoch": 0.6485703138063653, "percentage": 64.86, "elapsed_time": "1 day, 3:32:42", "remaining_time": "14:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11637, "total_steps": 17941, "loss": 1.5308, "learning_rate": 2.835109347149212e-05, "epoch": 0.6486260520595285, "percentage": 64.86, "elapsed_time": "1 day, 3:32:51", "remaining_time": "14:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11638, "total_steps": 17941, "loss": 1.6735, "learning_rate": 2.834306749681021e-05, "epoch": 0.6486817903126916, "percentage": 64.87, "elapsed_time": "1 day, 3:33:00", "remaining_time": "14:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11639, "total_steps": 17941, "loss": 1.3315, "learning_rate": 2.8335042208959932e-05, "epoch": 0.6487375285658548, "percentage": 64.87, "elapsed_time": "1 day, 3:33:08", "remaining_time": "14:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11640, "total_steps": 17941, "loss": 1.4162, "learning_rate": 2.8327017608195804e-05, "epoch": 0.6487932668190179, "percentage": 64.88, "elapsed_time": "1 day, 3:33:17", "remaining_time": "14:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11641, "total_steps": 17941, "loss": 1.407, "learning_rate": 2.831899369477233e-05, "epoch": 0.648849005072181, "percentage": 64.88, "elapsed_time": "1 day, 3:33:25", "remaining_time": "14:54:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11642, "total_steps": 17941, "loss": 1.4329, "learning_rate": 2.8310970468943947e-05, "epoch": 0.6489047433253442, "percentage": 64.89, "elapsed_time": "1 day, 3:33:34", "remaining_time": "14:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11643, "total_steps": 17941, "loss": 1.7362, "learning_rate": 2.830294793096513e-05, "epoch": 0.6489604815785073, "percentage": 64.9, "elapsed_time": "1 day, 3:33:42", "remaining_time": "14:54:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11644, "total_steps": 17941, "loss": 1.8945, "learning_rate": 2.8294926081090296e-05, "epoch": 0.6490162198316705, "percentage": 64.9, "elapsed_time": "1 day, 3:33:51", "remaining_time": "14:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11645, "total_steps": 17941, "loss": 1.6381, "learning_rate": 2.8286904919573858e-05, "epoch": 0.6490719580848336, "percentage": 64.91, "elapsed_time": "1 day, 3:33:59", "remaining_time": "14:54:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11646, "total_steps": 17941, "loss": 1.5749, "learning_rate": 2.8278884446670205e-05, "epoch": 0.6491276963379967, "percentage": 64.91, "elapsed_time": "1 day, 3:34:08", "remaining_time": "14:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11647, "total_steps": 17941, "loss": 1.6901, "learning_rate": 2.827086466263369e-05, "epoch": 0.6491834345911599, "percentage": 64.92, "elapsed_time": "1 day, 3:34:16", "remaining_time": "14:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11648, "total_steps": 17941, "loss": 1.588, "learning_rate": 2.8262845567718676e-05, "epoch": 0.6492391728443231, "percentage": 64.92, "elapsed_time": "1 day, 3:34:25", "remaining_time": "14:53:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11649, "total_steps": 17941, "loss": 1.5874, "learning_rate": 2.8254827162179453e-05, "epoch": 0.6492949110974862, "percentage": 64.93, "elapsed_time": "1 day, 3:34:34", "remaining_time": "14:53:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11650, "total_steps": 17941, "loss": 1.5423, "learning_rate": 2.8246809446270323e-05, "epoch": 0.6493506493506493, "percentage": 64.94, "elapsed_time": "1 day, 3:34:42", "remaining_time": "14:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11651, "total_steps": 17941, "loss": 1.4861, "learning_rate": 2.8238792420245564e-05, "epoch": 0.6494063876038125, "percentage": 64.94, "elapsed_time": "1 day, 3:34:51", "remaining_time": "14:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11652, "total_steps": 17941, "loss": 1.4421, "learning_rate": 2.823077608435944e-05, "epoch": 0.6494621258569756, "percentage": 64.95, "elapsed_time": "1 day, 3:34:59", "remaining_time": "14:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11653, "total_steps": 17941, "loss": 1.5598, "learning_rate": 2.822276043886617e-05, "epoch": 0.6495178641101388, "percentage": 64.95, "elapsed_time": "1 day, 3:35:07", "remaining_time": "14:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11654, "total_steps": 17941, "loss": 1.485, "learning_rate": 2.8214745484019972e-05, "epoch": 0.649573602363302, "percentage": 64.96, "elapsed_time": "1 day, 3:35:16", "remaining_time": "14:52:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11655, "total_steps": 17941, "loss": 1.4355, "learning_rate": 2.820673122007505e-05, "epoch": 0.649629340616465, "percentage": 64.96, "elapsed_time": "1 day, 3:35:24", "remaining_time": "14:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11656, "total_steps": 17941, "loss": 1.6034, "learning_rate": 2.8198717647285534e-05, "epoch": 0.6496850788696282, "percentage": 64.97, "elapsed_time": "1 day, 3:35:33", "remaining_time": "14:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11657, "total_steps": 17941, "loss": 1.7005, "learning_rate": 2.8190704765905573e-05, "epoch": 0.6497408171227914, "percentage": 64.97, "elapsed_time": "1 day, 3:35:41", "remaining_time": "14:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11658, "total_steps": 17941, "loss": 1.6823, "learning_rate": 2.8182692576189306e-05, "epoch": 0.6497965553759545, "percentage": 64.98, "elapsed_time": "1 day, 3:35:50", "remaining_time": "14:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11659, "total_steps": 17941, "loss": 1.6961, "learning_rate": 2.817468107839083e-05, "epoch": 0.6498522936291177, "percentage": 64.99, "elapsed_time": "1 day, 3:35:58", "remaining_time": "14:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11660, "total_steps": 17941, "loss": 1.6161, "learning_rate": 2.816667027276424e-05, "epoch": 0.6499080318822809, "percentage": 64.99, "elapsed_time": "1 day, 3:36:07", "remaining_time": "14:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11661, "total_steps": 17941, "loss": 1.6064, "learning_rate": 2.8158660159563527e-05, "epoch": 0.6499637701354439, "percentage": 65.0, "elapsed_time": "1 day, 3:36:15", "remaining_time": "14:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11662, "total_steps": 17941, "loss": 1.6869, "learning_rate": 2.815065073904281e-05, "epoch": 0.6500195083886071, "percentage": 65.0, "elapsed_time": "1 day, 3:36:24", "remaining_time": "14:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11663, "total_steps": 17941, "loss": 1.6542, "learning_rate": 2.8142642011456045e-05, "epoch": 0.6500752466417703, "percentage": 65.01, "elapsed_time": "1 day, 3:36:32", "remaining_time": "14:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11664, "total_steps": 17941, "loss": 1.6167, "learning_rate": 2.8134633977057235e-05, "epoch": 0.6501309848949334, "percentage": 65.01, "elapsed_time": "1 day, 3:36:40", "remaining_time": "14:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11665, "total_steps": 17941, "loss": 1.6651, "learning_rate": 2.812662663610035e-05, "epoch": 0.6501867231480966, "percentage": 65.02, "elapsed_time": "1 day, 3:36:49", "remaining_time": "14:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11666, "total_steps": 17941, "loss": 1.3785, "learning_rate": 2.8118619988839338e-05, "epoch": 0.6502424614012596, "percentage": 65.02, "elapsed_time": "1 day, 3:36:57", "remaining_time": "14:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11667, "total_steps": 17941, "loss": 1.5593, "learning_rate": 2.811061403552815e-05, "epoch": 0.6502981996544228, "percentage": 65.03, "elapsed_time": "1 day, 3:37:06", "remaining_time": "14:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11668, "total_steps": 17941, "loss": 1.7187, "learning_rate": 2.8102608776420614e-05, "epoch": 0.650353937907586, "percentage": 65.04, "elapsed_time": "1 day, 3:37:14", "remaining_time": "14:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11669, "total_steps": 17941, "loss": 1.5669, "learning_rate": 2.8094604211770693e-05, "epoch": 0.6504096761607491, "percentage": 65.04, "elapsed_time": "1 day, 3:37:23", "remaining_time": "14:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11670, "total_steps": 17941, "loss": 1.7421, "learning_rate": 2.8086600341832197e-05, "epoch": 0.6504654144139123, "percentage": 65.05, "elapsed_time": "1 day, 3:37:31", "remaining_time": "14:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11671, "total_steps": 17941, "loss": 1.4496, "learning_rate": 2.807859716685899e-05, "epoch": 0.6505211526670754, "percentage": 65.05, "elapsed_time": "1 day, 3:37:40", "remaining_time": "14:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11672, "total_steps": 17941, "loss": 1.5671, "learning_rate": 2.8070594687104835e-05, "epoch": 0.6505768909202385, "percentage": 65.06, "elapsed_time": "1 day, 3:37:48", "remaining_time": "14:50:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11673, "total_steps": 17941, "loss": 1.6659, "learning_rate": 2.806259290282357e-05, "epoch": 0.6506326291734017, "percentage": 65.06, "elapsed_time": "1 day, 3:37:56", "remaining_time": "14:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11674, "total_steps": 17941, "loss": 1.5014, "learning_rate": 2.8054591814268984e-05, "epoch": 0.6506883674265649, "percentage": 65.07, "elapsed_time": "1 day, 3:38:05", "remaining_time": "14:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11675, "total_steps": 17941, "loss": 1.7134, "learning_rate": 2.804659142169477e-05, "epoch": 0.650744105679728, "percentage": 65.07, "elapsed_time": "1 day, 3:38:14", "remaining_time": "14:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11676, "total_steps": 17941, "loss": 1.8295, "learning_rate": 2.803859172535468e-05, "epoch": 0.6507998439328911, "percentage": 65.08, "elapsed_time": "1 day, 3:38:23", "remaining_time": "14:49:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11677, "total_steps": 17941, "loss": 1.553, "learning_rate": 2.8030592725502412e-05, "epoch": 0.6508555821860543, "percentage": 65.09, "elapsed_time": "1 day, 3:38:31", "remaining_time": "14:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11678, "total_steps": 17941, "loss": 1.5796, "learning_rate": 2.8022594422391663e-05, "epoch": 0.6509113204392174, "percentage": 65.09, "elapsed_time": "1 day, 3:38:39", "remaining_time": "14:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11679, "total_steps": 17941, "loss": 1.6964, "learning_rate": 2.8014596816276073e-05, "epoch": 0.6509670586923806, "percentage": 65.1, "elapsed_time": "1 day, 3:38:48", "remaining_time": "14:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11680, "total_steps": 17941, "loss": 1.523, "learning_rate": 2.800659990740929e-05, "epoch": 0.6510227969455438, "percentage": 65.1, "elapsed_time": "1 day, 3:38:56", "remaining_time": "14:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11681, "total_steps": 17941, "loss": 1.385, "learning_rate": 2.7998603696044952e-05, "epoch": 0.6510785351987068, "percentage": 65.11, "elapsed_time": "1 day, 3:39:05", "remaining_time": "14:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11682, "total_steps": 17941, "loss": 1.4586, "learning_rate": 2.79906081824366e-05, "epoch": 0.65113427345187, "percentage": 65.11, "elapsed_time": "1 day, 3:39:13", "remaining_time": "14:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11683, "total_steps": 17941, "loss": 1.5598, "learning_rate": 2.798261336683784e-05, "epoch": 0.6511900117050332, "percentage": 65.12, "elapsed_time": "1 day, 3:39:22", "remaining_time": "14:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11684, "total_steps": 17941, "loss": 1.6281, "learning_rate": 2.7974619249502208e-05, "epoch": 0.6512457499581963, "percentage": 65.12, "elapsed_time": "1 day, 3:39:30", "remaining_time": "14:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11685, "total_steps": 17941, "loss": 1.6654, "learning_rate": 2.7966625830683235e-05, "epoch": 0.6513014882113595, "percentage": 65.13, "elapsed_time": "1 day, 3:39:39", "remaining_time": "14:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11686, "total_steps": 17941, "loss": 1.6944, "learning_rate": 2.7958633110634457e-05, "epoch": 0.6513572264645227, "percentage": 65.14, "elapsed_time": "1 day, 3:39:47", "remaining_time": "14:48:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11687, "total_steps": 17941, "loss": 1.3509, "learning_rate": 2.7950641089609274e-05, "epoch": 0.6514129647176857, "percentage": 65.14, "elapsed_time": "1 day, 3:39:56", "remaining_time": "14:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11688, "total_steps": 17941, "loss": 1.8239, "learning_rate": 2.7942649767861252e-05, "epoch": 0.6514687029708489, "percentage": 65.15, "elapsed_time": "1 day, 3:40:04", "remaining_time": "14:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11689, "total_steps": 17941, "loss": 1.7763, "learning_rate": 2.7934659145643747e-05, "epoch": 0.651524441224012, "percentage": 65.15, "elapsed_time": "1 day, 3:40:13", "remaining_time": "14:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11690, "total_steps": 17941, "loss": 1.5611, "learning_rate": 2.792666922321021e-05, "epoch": 0.6515801794771752, "percentage": 65.16, "elapsed_time": "1 day, 3:40:22", "remaining_time": "14:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11691, "total_steps": 17941, "loss": 1.6913, "learning_rate": 2.7918680000814025e-05, "epoch": 0.6516359177303384, "percentage": 65.16, "elapsed_time": "1 day, 3:40:30", "remaining_time": "14:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11692, "total_steps": 17941, "loss": 1.7309, "learning_rate": 2.7910691478708567e-05, "epoch": 0.6516916559835014, "percentage": 65.17, "elapsed_time": "1 day, 3:40:38", "remaining_time": "14:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11693, "total_steps": 17941, "loss": 1.9031, "learning_rate": 2.7902703657147206e-05, "epoch": 0.6517473942366646, "percentage": 65.17, "elapsed_time": "1 day, 3:40:47", "remaining_time": "14:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11694, "total_steps": 17941, "loss": 1.6664, "learning_rate": 2.789471653638321e-05, "epoch": 0.6518031324898278, "percentage": 65.18, "elapsed_time": "1 day, 3:40:55", "remaining_time": "14:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11695, "total_steps": 17941, "loss": 1.7134, "learning_rate": 2.7886730116669963e-05, "epoch": 0.6518588707429909, "percentage": 65.19, "elapsed_time": "1 day, 3:41:04", "remaining_time": "14:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11696, "total_steps": 17941, "loss": 1.6886, "learning_rate": 2.787874439826068e-05, "epoch": 0.651914608996154, "percentage": 65.19, "elapsed_time": "1 day, 3:41:13", "remaining_time": "14:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11697, "total_steps": 17941, "loss": 1.5477, "learning_rate": 2.7870759381408686e-05, "epoch": 0.6519703472493172, "percentage": 65.2, "elapsed_time": "1 day, 3:41:21", "remaining_time": "14:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11698, "total_steps": 17941, "loss": 1.5624, "learning_rate": 2.7862775066367124e-05, "epoch": 0.6520260855024803, "percentage": 65.2, "elapsed_time": "1 day, 3:41:30", "remaining_time": "14:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11699, "total_steps": 17941, "loss": 1.8036, "learning_rate": 2.7854791453389295e-05, "epoch": 0.6520818237556435, "percentage": 65.21, "elapsed_time": "1 day, 3:41:38", "remaining_time": "14:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11700, "total_steps": 17941, "loss": 1.639, "learning_rate": 2.7846808542728386e-05, "epoch": 0.6521375620088067, "percentage": 65.21, "elapsed_time": "1 day, 3:41:46", "remaining_time": "14:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11701, "total_steps": 17941, "loss": 1.553, "learning_rate": 2.783882633463753e-05, "epoch": 0.6521933002619698, "percentage": 65.22, "elapsed_time": "1 day, 3:41:55", "remaining_time": "14:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11702, "total_steps": 17941, "loss": 1.2438, "learning_rate": 2.7830844829369896e-05, "epoch": 0.6522490385151329, "percentage": 65.22, "elapsed_time": "1 day, 3:42:03", "remaining_time": "14:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11703, "total_steps": 17941, "loss": 1.5023, "learning_rate": 2.7822864027178596e-05, "epoch": 0.6523047767682961, "percentage": 65.23, "elapsed_time": "1 day, 3:42:12", "remaining_time": "14:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11704, "total_steps": 17941, "loss": 1.5908, "learning_rate": 2.781488392831676e-05, "epoch": 0.6523605150214592, "percentage": 65.24, "elapsed_time": "1 day, 3:42:20", "remaining_time": "14:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11705, "total_steps": 17941, "loss": 1.6314, "learning_rate": 2.7806904533037455e-05, "epoch": 0.6524162532746224, "percentage": 65.24, "elapsed_time": "1 day, 3:42:29", "remaining_time": "14:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11706, "total_steps": 17941, "loss": 1.4394, "learning_rate": 2.7798925841593743e-05, "epoch": 0.6524719915277856, "percentage": 65.25, "elapsed_time": "1 day, 3:42:38", "remaining_time": "14:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11707, "total_steps": 17941, "loss": 1.8412, "learning_rate": 2.779094785423868e-05, "epoch": 0.6525277297809486, "percentage": 65.25, "elapsed_time": "1 day, 3:42:46", "remaining_time": "14:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11708, "total_steps": 17941, "loss": 1.592, "learning_rate": 2.7782970571225243e-05, "epoch": 0.6525834680341118, "percentage": 65.26, "elapsed_time": "1 day, 3:42:55", "remaining_time": "14:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11709, "total_steps": 17941, "loss": 1.8748, "learning_rate": 2.777499399280645e-05, "epoch": 0.652639206287275, "percentage": 65.26, "elapsed_time": "1 day, 3:43:03", "remaining_time": "14:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11710, "total_steps": 17941, "loss": 1.5548, "learning_rate": 2.7767018119235262e-05, "epoch": 0.6526949445404381, "percentage": 65.27, "elapsed_time": "1 day, 3:43:12", "remaining_time": "14:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11711, "total_steps": 17941, "loss": 1.6619, "learning_rate": 2.7759042950764635e-05, "epoch": 0.6527506827936013, "percentage": 65.28, "elapsed_time": "1 day, 3:43:20", "remaining_time": "14:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11712, "total_steps": 17941, "loss": 1.5367, "learning_rate": 2.7751068487647508e-05, "epoch": 0.6528064210467643, "percentage": 65.28, "elapsed_time": "1 day, 3:43:29", "remaining_time": "14:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11713, "total_steps": 17941, "loss": 1.7765, "learning_rate": 2.774309473013673e-05, "epoch": 0.6528621592999275, "percentage": 65.29, "elapsed_time": "1 day, 3:43:37", "remaining_time": "14:44:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11714, "total_steps": 17941, "loss": 1.445, "learning_rate": 2.7735121678485265e-05, "epoch": 0.6529178975530907, "percentage": 65.29, "elapsed_time": "1 day, 3:43:46", "remaining_time": "14:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11715, "total_steps": 17941, "loss": 1.4578, "learning_rate": 2.7727149332945902e-05, "epoch": 0.6529736358062538, "percentage": 65.3, "elapsed_time": "1 day, 3:43:54", "remaining_time": "14:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11716, "total_steps": 17941, "loss": 1.2704, "learning_rate": 2.7719177693771505e-05, "epoch": 0.653029374059417, "percentage": 65.3, "elapsed_time": "1 day, 3:44:02", "remaining_time": "14:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11717, "total_steps": 17941, "loss": 1.5699, "learning_rate": 2.7711206761214882e-05, "epoch": 0.6530851123125802, "percentage": 65.31, "elapsed_time": "1 day, 3:44:11", "remaining_time": "14:44:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11718, "total_steps": 17941, "loss": 1.8262, "learning_rate": 2.770323653552883e-05, "epoch": 0.6531408505657432, "percentage": 65.31, "elapsed_time": "1 day, 3:44:19", "remaining_time": "14:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11719, "total_steps": 17941, "loss": 1.6857, "learning_rate": 2.769526701696613e-05, "epoch": 0.6531965888189064, "percentage": 65.32, "elapsed_time": "1 day, 3:44:28", "remaining_time": "14:43:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11720, "total_steps": 17941, "loss": 1.6479, "learning_rate": 2.7687298205779488e-05, "epoch": 0.6532523270720696, "percentage": 65.33, "elapsed_time": "1 day, 3:44:36", "remaining_time": "14:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11721, "total_steps": 17941, "loss": 1.5931, "learning_rate": 2.7679330102221684e-05, "epoch": 0.6533080653252327, "percentage": 65.33, "elapsed_time": "1 day, 3:44:44", "remaining_time": "14:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11722, "total_steps": 17941, "loss": 1.6227, "learning_rate": 2.7671362706545377e-05, "epoch": 0.6533638035783959, "percentage": 65.34, "elapsed_time": "1 day, 3:44:53", "remaining_time": "14:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11723, "total_steps": 17941, "loss": 1.6291, "learning_rate": 2.7663396019003275e-05, "epoch": 0.653419541831559, "percentage": 65.34, "elapsed_time": "1 day, 3:45:01", "remaining_time": "14:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11724, "total_steps": 17941, "loss": 1.3945, "learning_rate": 2.7655430039847986e-05, "epoch": 0.6534752800847221, "percentage": 65.35, "elapsed_time": "1 day, 3:45:10", "remaining_time": "14:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11725, "total_steps": 17941, "loss": 1.6416, "learning_rate": 2.7647464769332186e-05, "epoch": 0.6535310183378853, "percentage": 65.35, "elapsed_time": "1 day, 3:45:19", "remaining_time": "14:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11726, "total_steps": 17941, "loss": 1.5359, "learning_rate": 2.7639500207708513e-05, "epoch": 0.6535867565910485, "percentage": 65.36, "elapsed_time": "1 day, 3:45:27", "remaining_time": "14:42:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11727, "total_steps": 17941, "loss": 1.8041, "learning_rate": 2.7631536355229494e-05, "epoch": 0.6536424948442116, "percentage": 65.36, "elapsed_time": "1 day, 3:45:36", "remaining_time": "14:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11728, "total_steps": 17941, "loss": 1.3771, "learning_rate": 2.7623573212147723e-05, "epoch": 0.6536982330973747, "percentage": 65.37, "elapsed_time": "1 day, 3:45:44", "remaining_time": "14:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11729, "total_steps": 17941, "loss": 1.5428, "learning_rate": 2.7615610778715757e-05, "epoch": 0.6537539713505379, "percentage": 65.38, "elapsed_time": "1 day, 3:45:52", "remaining_time": "14:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11730, "total_steps": 17941, "loss": 1.7209, "learning_rate": 2.76076490551861e-05, "epoch": 0.653809709603701, "percentage": 65.38, "elapsed_time": "1 day, 3:46:01", "remaining_time": "14:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11731, "total_steps": 17941, "loss": 1.7189, "learning_rate": 2.7599688041811257e-05, "epoch": 0.6538654478568642, "percentage": 65.39, "elapsed_time": "1 day, 3:46:09", "remaining_time": "14:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11732, "total_steps": 17941, "loss": 1.6597, "learning_rate": 2.759172773884371e-05, "epoch": 0.6539211861100274, "percentage": 65.39, "elapsed_time": "1 day, 3:46:18", "remaining_time": "14:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11733, "total_steps": 17941, "loss": 1.5292, "learning_rate": 2.7583768146535925e-05, "epoch": 0.6539769243631904, "percentage": 65.4, "elapsed_time": "1 day, 3:46:26", "remaining_time": "14:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11734, "total_steps": 17941, "loss": 1.6176, "learning_rate": 2.7575809265140305e-05, "epoch": 0.6540326626163536, "percentage": 65.4, "elapsed_time": "1 day, 3:46:35", "remaining_time": "14:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11735, "total_steps": 17941, "loss": 1.7055, "learning_rate": 2.756785109490927e-05, "epoch": 0.6540884008695167, "percentage": 65.41, "elapsed_time": "1 day, 3:46:43", "remaining_time": "14:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11736, "total_steps": 17941, "loss": 1.5861, "learning_rate": 2.7559893636095212e-05, "epoch": 0.6541441391226799, "percentage": 65.41, "elapsed_time": "1 day, 3:46:52", "remaining_time": "14:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11737, "total_steps": 17941, "loss": 1.8638, "learning_rate": 2.755193688895049e-05, "epoch": 0.6541998773758431, "percentage": 65.42, "elapsed_time": "1 day, 3:47:00", "remaining_time": "14:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11738, "total_steps": 17941, "loss": 1.4608, "learning_rate": 2.754398085372747e-05, "epoch": 0.6542556156290061, "percentage": 65.43, "elapsed_time": "1 day, 3:47:09", "remaining_time": "14:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11739, "total_steps": 17941, "loss": 1.7498, "learning_rate": 2.7536025530678407e-05, "epoch": 0.6543113538821693, "percentage": 65.43, "elapsed_time": "1 day, 3:47:17", "remaining_time": "14:40:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11740, "total_steps": 17941, "loss": 1.4097, "learning_rate": 2.752807092005568e-05, "epoch": 0.6543670921353325, "percentage": 65.44, "elapsed_time": "1 day, 3:47:25", "remaining_time": "14:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11741, "total_steps": 17941, "loss": 1.6588, "learning_rate": 2.75201170221115e-05, "epoch": 0.6544228303884956, "percentage": 65.44, "elapsed_time": "1 day, 3:47:34", "remaining_time": "14:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11742, "total_steps": 17941, "loss": 1.8219, "learning_rate": 2.7512163837098155e-05, "epoch": 0.6544785686416588, "percentage": 65.45, "elapsed_time": "1 day, 3:47:42", "remaining_time": "14:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11743, "total_steps": 17941, "loss": 1.4547, "learning_rate": 2.750421136526785e-05, "epoch": 0.654534306894822, "percentage": 65.45, "elapsed_time": "1 day, 3:47:51", "remaining_time": "14:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11744, "total_steps": 17941, "loss": 1.6586, "learning_rate": 2.74962596068728e-05, "epoch": 0.654590045147985, "percentage": 65.46, "elapsed_time": "1 day, 3:48:00", "remaining_time": "14:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11745, "total_steps": 17941, "loss": 1.8293, "learning_rate": 2.748830856216521e-05, "epoch": 0.6546457834011482, "percentage": 65.46, "elapsed_time": "1 day, 3:48:08", "remaining_time": "14:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11746, "total_steps": 17941, "loss": 1.651, "learning_rate": 2.7480358231397184e-05, "epoch": 0.6547015216543114, "percentage": 65.47, "elapsed_time": "1 day, 3:48:17", "remaining_time": "14:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11747, "total_steps": 17941, "loss": 1.4241, "learning_rate": 2.747240861482093e-05, "epoch": 0.6547572599074745, "percentage": 65.48, "elapsed_time": "1 day, 3:48:25", "remaining_time": "14:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11748, "total_steps": 17941, "loss": 1.8573, "learning_rate": 2.7464459712688516e-05, "epoch": 0.6548129981606376, "percentage": 65.48, "elapsed_time": "1 day, 3:48:33", "remaining_time": "14:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11749, "total_steps": 17941, "loss": 1.7483, "learning_rate": 2.745651152525205e-05, "epoch": 0.6548687364138008, "percentage": 65.49, "elapsed_time": "1 day, 3:48:42", "remaining_time": "14:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11750, "total_steps": 17941, "loss": 1.5745, "learning_rate": 2.744856405276359e-05, "epoch": 0.6549244746669639, "percentage": 65.49, "elapsed_time": "1 day, 3:48:51", "remaining_time": "14:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11751, "total_steps": 17941, "loss": 1.6733, "learning_rate": 2.744061729547521e-05, "epoch": 0.6549802129201271, "percentage": 65.5, "elapsed_time": "1 day, 3:48:59", "remaining_time": "14:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11752, "total_steps": 17941, "loss": 1.6021, "learning_rate": 2.743267125363893e-05, "epoch": 0.6550359511732903, "percentage": 65.5, "elapsed_time": "1 day, 3:49:08", "remaining_time": "14:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11753, "total_steps": 17941, "loss": 1.5939, "learning_rate": 2.7424725927506722e-05, "epoch": 0.6550916894264533, "percentage": 65.51, "elapsed_time": "1 day, 3:49:16", "remaining_time": "14:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11754, "total_steps": 17941, "loss": 1.5034, "learning_rate": 2.741678131733058e-05, "epoch": 0.6551474276796165, "percentage": 65.51, "elapsed_time": "1 day, 3:49:24", "remaining_time": "14:38:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11755, "total_steps": 17941, "loss": 1.6453, "learning_rate": 2.740883742336247e-05, "epoch": 0.6552031659327797, "percentage": 65.52, "elapsed_time": "1 day, 3:49:33", "remaining_time": "14:38:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11756, "total_steps": 17941, "loss": 1.7042, "learning_rate": 2.7400894245854326e-05, "epoch": 0.6552589041859428, "percentage": 65.53, "elapsed_time": "1 day, 3:49:41", "remaining_time": "14:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11757, "total_steps": 17941, "loss": 1.5452, "learning_rate": 2.7392951785058046e-05, "epoch": 0.655314642439106, "percentage": 65.53, "elapsed_time": "1 day, 3:49:50", "remaining_time": "14:38:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11758, "total_steps": 17941, "loss": 1.7493, "learning_rate": 2.7385010041225534e-05, "epoch": 0.655370380692269, "percentage": 65.54, "elapsed_time": "1 day, 3:49:58", "remaining_time": "14:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11759, "total_steps": 17941, "loss": 1.3269, "learning_rate": 2.737706901460866e-05, "epoch": 0.6554261189454322, "percentage": 65.54, "elapsed_time": "1 day, 3:50:07", "remaining_time": "14:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11760, "total_steps": 17941, "loss": 1.7478, "learning_rate": 2.7369128705459246e-05, "epoch": 0.6554818571985954, "percentage": 65.55, "elapsed_time": "1 day, 3:50:15", "remaining_time": "14:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11761, "total_steps": 17941, "loss": 1.6844, "learning_rate": 2.736118911402912e-05, "epoch": 0.6555375954517585, "percentage": 65.55, "elapsed_time": "1 day, 3:50:24", "remaining_time": "14:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11762, "total_steps": 17941, "loss": 1.8216, "learning_rate": 2.735325024057007e-05, "epoch": 0.6555933337049217, "percentage": 65.56, "elapsed_time": "1 day, 3:50:32", "remaining_time": "14:37:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11763, "total_steps": 17941, "loss": 1.7156, "learning_rate": 2.7345312085333897e-05, "epoch": 0.6556490719580849, "percentage": 65.56, "elapsed_time": "1 day, 3:50:41", "remaining_time": "14:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11764, "total_steps": 17941, "loss": 1.7078, "learning_rate": 2.7337374648572354e-05, "epoch": 0.6557048102112479, "percentage": 65.57, "elapsed_time": "1 day, 3:50:50", "remaining_time": "14:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11765, "total_steps": 17941, "loss": 1.798, "learning_rate": 2.7329437930537115e-05, "epoch": 0.6557605484644111, "percentage": 65.58, "elapsed_time": "1 day, 3:50:59", "remaining_time": "14:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11766, "total_steps": 17941, "loss": 1.3555, "learning_rate": 2.7321501931479966e-05, "epoch": 0.6558162867175743, "percentage": 65.58, "elapsed_time": "1 day, 3:51:07", "remaining_time": "14:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11767, "total_steps": 17941, "loss": 1.4993, "learning_rate": 2.7313566651652532e-05, "epoch": 0.6558720249707374, "percentage": 65.59, "elapsed_time": "1 day, 3:51:16", "remaining_time": "14:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11768, "total_steps": 17941, "loss": 1.6846, "learning_rate": 2.7305632091306488e-05, "epoch": 0.6559277632239006, "percentage": 65.59, "elapsed_time": "1 day, 3:51:24", "remaining_time": "14:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11769, "total_steps": 17941, "loss": 1.7928, "learning_rate": 2.729769825069348e-05, "epoch": 0.6559835014770637, "percentage": 65.6, "elapsed_time": "1 day, 3:51:33", "remaining_time": "14:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11770, "total_steps": 17941, "loss": 1.6052, "learning_rate": 2.7289765130065126e-05, "epoch": 0.6560392397302268, "percentage": 65.6, "elapsed_time": "1 day, 3:51:41", "remaining_time": "14:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11771, "total_steps": 17941, "loss": 1.6509, "learning_rate": 2.728183272967303e-05, "epoch": 0.65609497798339, "percentage": 65.61, "elapsed_time": "1 day, 3:51:50", "remaining_time": "14:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11772, "total_steps": 17941, "loss": 1.7614, "learning_rate": 2.7273901049768697e-05, "epoch": 0.6561507162365532, "percentage": 65.62, "elapsed_time": "1 day, 3:51:58", "remaining_time": "14:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11773, "total_steps": 17941, "loss": 1.441, "learning_rate": 2.7265970090603764e-05, "epoch": 0.6562064544897163, "percentage": 65.62, "elapsed_time": "1 day, 3:52:07", "remaining_time": "14:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11774, "total_steps": 17941, "loss": 1.7769, "learning_rate": 2.725803985242969e-05, "epoch": 0.6562621927428794, "percentage": 65.63, "elapsed_time": "1 day, 3:52:15", "remaining_time": "14:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11775, "total_steps": 17941, "loss": 1.7925, "learning_rate": 2.7250110335497996e-05, "epoch": 0.6563179309960426, "percentage": 65.63, "elapsed_time": "1 day, 3:52:24", "remaining_time": "14:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11776, "total_steps": 17941, "loss": 1.8628, "learning_rate": 2.7242181540060163e-05, "epoch": 0.6563736692492057, "percentage": 65.64, "elapsed_time": "1 day, 3:52:32", "remaining_time": "14:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11777, "total_steps": 17941, "loss": 1.5689, "learning_rate": 2.7234253466367643e-05, "epoch": 0.6564294075023689, "percentage": 65.64, "elapsed_time": "1 day, 3:52:41", "remaining_time": "14:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11778, "total_steps": 17941, "loss": 1.5135, "learning_rate": 2.7226326114671895e-05, "epoch": 0.6564851457555321, "percentage": 65.65, "elapsed_time": "1 day, 3:52:49", "remaining_time": "14:35:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11779, "total_steps": 17941, "loss": 1.5069, "learning_rate": 2.7218399485224278e-05, "epoch": 0.6565408840086951, "percentage": 65.65, "elapsed_time": "1 day, 3:52:58", "remaining_time": "14:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11780, "total_steps": 17941, "loss": 1.6105, "learning_rate": 2.721047357827621e-05, "epoch": 0.6565966222618583, "percentage": 65.66, "elapsed_time": "1 day, 3:53:06", "remaining_time": "14:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11781, "total_steps": 17941, "loss": 1.7517, "learning_rate": 2.7202548394079037e-05, "epoch": 0.6566523605150214, "percentage": 65.67, "elapsed_time": "1 day, 3:53:15", "remaining_time": "14:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11782, "total_steps": 17941, "loss": 1.5322, "learning_rate": 2.7194623932884133e-05, "epoch": 0.6567080987681846, "percentage": 65.67, "elapsed_time": "1 day, 3:53:23", "remaining_time": "14:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11783, "total_steps": 17941, "loss": 1.6235, "learning_rate": 2.718670019494276e-05, "epoch": 0.6567638370213478, "percentage": 65.68, "elapsed_time": "1 day, 3:53:31", "remaining_time": "14:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11784, "total_steps": 17941, "loss": 1.6345, "learning_rate": 2.717877718050626e-05, "epoch": 0.6568195752745108, "percentage": 65.68, "elapsed_time": "1 day, 3:53:40", "remaining_time": "14:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11785, "total_steps": 17941, "loss": 1.7114, "learning_rate": 2.7170854889825914e-05, "epoch": 0.656875313527674, "percentage": 65.69, "elapsed_time": "1 day, 3:53:48", "remaining_time": "14:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11786, "total_steps": 17941, "loss": 1.7212, "learning_rate": 2.716293332315293e-05, "epoch": 0.6569310517808372, "percentage": 65.69, "elapsed_time": "1 day, 3:53:57", "remaining_time": "14:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11787, "total_steps": 17941, "loss": 1.6627, "learning_rate": 2.7155012480738546e-05, "epoch": 0.6569867900340003, "percentage": 65.7, "elapsed_time": "1 day, 3:54:06", "remaining_time": "14:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11788, "total_steps": 17941, "loss": 1.7468, "learning_rate": 2.714709236283397e-05, "epoch": 0.6570425282871635, "percentage": 65.7, "elapsed_time": "1 day, 3:54:14", "remaining_time": "14:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11789, "total_steps": 17941, "loss": 1.5715, "learning_rate": 2.7139172969690385e-05, "epoch": 0.6570982665403267, "percentage": 65.71, "elapsed_time": "1 day, 3:54:23", "remaining_time": "14:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11790, "total_steps": 17941, "loss": 1.6476, "learning_rate": 2.7131254301558965e-05, "epoch": 0.6571540047934897, "percentage": 65.72, "elapsed_time": "1 day, 3:54:32", "remaining_time": "14:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11791, "total_steps": 17941, "loss": 1.5052, "learning_rate": 2.7123336358690786e-05, "epoch": 0.6572097430466529, "percentage": 65.72, "elapsed_time": "1 day, 3:54:40", "remaining_time": "14:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11792, "total_steps": 17941, "loss": 1.673, "learning_rate": 2.711541914133704e-05, "epoch": 0.6572654812998161, "percentage": 65.73, "elapsed_time": "1 day, 3:54:49", "remaining_time": "14:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11793, "total_steps": 17941, "loss": 1.7664, "learning_rate": 2.710750264974875e-05, "epoch": 0.6573212195529792, "percentage": 65.73, "elapsed_time": "1 day, 3:54:57", "remaining_time": "14:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11794, "total_steps": 17941, "loss": 1.6937, "learning_rate": 2.7099586884177004e-05, "epoch": 0.6573769578061424, "percentage": 65.74, "elapsed_time": "1 day, 3:55:06", "remaining_time": "14:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11795, "total_steps": 17941, "loss": 1.6415, "learning_rate": 2.709167184487284e-05, "epoch": 0.6574326960593055, "percentage": 65.74, "elapsed_time": "1 day, 3:55:14", "remaining_time": "14:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11796, "total_steps": 17941, "loss": 2.0278, "learning_rate": 2.7083757532087285e-05, "epoch": 0.6574884343124686, "percentage": 65.75, "elapsed_time": "1 day, 3:55:24", "remaining_time": "14:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11797, "total_steps": 17941, "loss": 1.7187, "learning_rate": 2.7075843946071343e-05, "epoch": 0.6575441725656318, "percentage": 65.75, "elapsed_time": "1 day, 3:55:32", "remaining_time": "14:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11798, "total_steps": 17941, "loss": 1.5879, "learning_rate": 2.7067931087075936e-05, "epoch": 0.657599910818795, "percentage": 65.76, "elapsed_time": "1 day, 3:55:40", "remaining_time": "14:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11799, "total_steps": 17941, "loss": 1.6877, "learning_rate": 2.7060018955352094e-05, "epoch": 0.6576556490719581, "percentage": 65.77, "elapsed_time": "1 day, 3:55:49", "remaining_time": "14:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11800, "total_steps": 17941, "loss": 1.5547, "learning_rate": 2.7052107551150685e-05, "epoch": 0.6577113873251212, "percentage": 65.77, "elapsed_time": "1 day, 3:55:57", "remaining_time": "14:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11801, "total_steps": 17941, "loss": 1.5204, "learning_rate": 2.7044196874722627e-05, "epoch": 0.6577671255782844, "percentage": 65.78, "elapsed_time": "1 day, 3:56:06", "remaining_time": "14:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11802, "total_steps": 17941, "loss": 1.7442, "learning_rate": 2.7036286926318798e-05, "epoch": 0.6578228638314475, "percentage": 65.78, "elapsed_time": "1 day, 3:56:14", "remaining_time": "14:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11803, "total_steps": 17941, "loss": 1.4083, "learning_rate": 2.7028377706190068e-05, "epoch": 0.6578786020846107, "percentage": 65.79, "elapsed_time": "1 day, 3:56:23", "remaining_time": "14:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11804, "total_steps": 17941, "loss": 1.8607, "learning_rate": 2.7020469214587274e-05, "epoch": 0.6579343403377738, "percentage": 65.79, "elapsed_time": "1 day, 3:56:31", "remaining_time": "14:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11805, "total_steps": 17941, "loss": 1.6151, "learning_rate": 2.7012561451761203e-05, "epoch": 0.6579900785909369, "percentage": 65.8, "elapsed_time": "1 day, 3:56:40", "remaining_time": "14:31:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11806, "total_steps": 17941, "loss": 1.6476, "learning_rate": 2.700465441796266e-05, "epoch": 0.6580458168441001, "percentage": 65.8, "elapsed_time": "1 day, 3:56:48", "remaining_time": "14:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11807, "total_steps": 17941, "loss": 1.3972, "learning_rate": 2.6996748113442394e-05, "epoch": 0.6581015550972632, "percentage": 65.81, "elapsed_time": "1 day, 3:56:56", "remaining_time": "14:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11808, "total_steps": 17941, "loss": 1.597, "learning_rate": 2.6988842538451187e-05, "epoch": 0.6581572933504264, "percentage": 65.82, "elapsed_time": "1 day, 3:57:05", "remaining_time": "14:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11809, "total_steps": 17941, "loss": 1.5462, "learning_rate": 2.6980937693239695e-05, "epoch": 0.6582130316035896, "percentage": 65.82, "elapsed_time": "1 day, 3:57:13", "remaining_time": "14:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11810, "total_steps": 17941, "loss": 1.6007, "learning_rate": 2.697303357805866e-05, "epoch": 0.6582687698567526, "percentage": 65.83, "elapsed_time": "1 day, 3:57:22", "remaining_time": "14:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11811, "total_steps": 17941, "loss": 1.6685, "learning_rate": 2.696513019315877e-05, "epoch": 0.6583245081099158, "percentage": 65.83, "elapsed_time": "1 day, 3:57:30", "remaining_time": "14:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11812, "total_steps": 17941, "loss": 1.4725, "learning_rate": 2.6957227538790625e-05, "epoch": 0.658380246363079, "percentage": 65.84, "elapsed_time": "1 day, 3:57:39", "remaining_time": "14:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11813, "total_steps": 17941, "loss": 1.4386, "learning_rate": 2.694932561520488e-05, "epoch": 0.6584359846162421, "percentage": 65.84, "elapsed_time": "1 day, 3:57:49", "remaining_time": "14:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11814, "total_steps": 17941, "loss": 1.8516, "learning_rate": 2.694142442265212e-05, "epoch": 0.6584917228694053, "percentage": 65.85, "elapsed_time": "1 day, 3:57:57", "remaining_time": "14:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11815, "total_steps": 17941, "loss": 1.7817, "learning_rate": 2.6933523961382946e-05, "epoch": 0.6585474611225685, "percentage": 65.85, "elapsed_time": "1 day, 3:58:05", "remaining_time": "14:30:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11816, "total_steps": 17941, "loss": 1.6708, "learning_rate": 2.6925624231647916e-05, "epoch": 0.6586031993757315, "percentage": 65.86, "elapsed_time": "1 day, 3:58:14", "remaining_time": "14:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11817, "total_steps": 17941, "loss": 1.6924, "learning_rate": 2.691772523369752e-05, "epoch": 0.6586589376288947, "percentage": 65.87, "elapsed_time": "1 day, 3:58:23", "remaining_time": "14:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11818, "total_steps": 17941, "loss": 1.5783, "learning_rate": 2.6909826967782338e-05, "epoch": 0.6587146758820579, "percentage": 65.87, "elapsed_time": "1 day, 3:58:32", "remaining_time": "14:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11819, "total_steps": 17941, "loss": 1.5426, "learning_rate": 2.6901929434152802e-05, "epoch": 0.658770414135221, "percentage": 65.88, "elapsed_time": "1 day, 3:58:40", "remaining_time": "14:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11820, "total_steps": 17941, "loss": 1.67, "learning_rate": 2.6894032633059392e-05, "epoch": 0.6588261523883842, "percentage": 65.88, "elapsed_time": "1 day, 3:58:49", "remaining_time": "14:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11821, "total_steps": 17941, "loss": 1.4324, "learning_rate": 2.688613656475255e-05, "epoch": 0.6588818906415473, "percentage": 65.89, "elapsed_time": "1 day, 3:58:57", "remaining_time": "14:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11822, "total_steps": 17941, "loss": 1.5658, "learning_rate": 2.687824122948269e-05, "epoch": 0.6589376288947104, "percentage": 65.89, "elapsed_time": "1 day, 3:59:06", "remaining_time": "14:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11823, "total_steps": 17941, "loss": 1.7141, "learning_rate": 2.687034662750023e-05, "epoch": 0.6589933671478736, "percentage": 65.9, "elapsed_time": "1 day, 3:59:14", "remaining_time": "14:28:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11824, "total_steps": 17941, "loss": 1.51, "learning_rate": 2.6862452759055478e-05, "epoch": 0.6590491054010368, "percentage": 65.9, "elapsed_time": "1 day, 3:59:23", "remaining_time": "14:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11825, "total_steps": 17941, "loss": 1.7183, "learning_rate": 2.6854559624398868e-05, "epoch": 0.6591048436541999, "percentage": 65.91, "elapsed_time": "1 day, 3:59:32", "remaining_time": "14:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11826, "total_steps": 17941, "loss": 1.6043, "learning_rate": 2.6846667223780658e-05, "epoch": 0.659160581907363, "percentage": 65.92, "elapsed_time": "1 day, 3:59:40", "remaining_time": "14:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11827, "total_steps": 17941, "loss": 1.6279, "learning_rate": 2.683877555745117e-05, "epoch": 0.6592163201605261, "percentage": 65.92, "elapsed_time": "1 day, 3:59:49", "remaining_time": "14:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11828, "total_steps": 17941, "loss": 1.5773, "learning_rate": 2.683088462566068e-05, "epoch": 0.6592720584136893, "percentage": 65.93, "elapsed_time": "1 day, 3:59:57", "remaining_time": "14:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11829, "total_steps": 17941, "loss": 1.5818, "learning_rate": 2.682299442865945e-05, "epoch": 0.6593277966668525, "percentage": 65.93, "elapsed_time": "1 day, 4:00:06", "remaining_time": "14:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11830, "total_steps": 17941, "loss": 1.7962, "learning_rate": 2.6815104966697718e-05, "epoch": 0.6593835349200156, "percentage": 65.94, "elapsed_time": "1 day, 4:00:14", "remaining_time": "14:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11831, "total_steps": 17941, "loss": 1.6222, "learning_rate": 2.680721624002566e-05, "epoch": 0.6594392731731787, "percentage": 65.94, "elapsed_time": "1 day, 4:00:23", "remaining_time": "14:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11832, "total_steps": 17941, "loss": 1.781, "learning_rate": 2.6799328248893485e-05, "epoch": 0.6594950114263419, "percentage": 65.95, "elapsed_time": "1 day, 4:00:31", "remaining_time": "14:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11833, "total_steps": 17941, "loss": 1.5622, "learning_rate": 2.6791440993551343e-05, "epoch": 0.659550749679505, "percentage": 65.96, "elapsed_time": "1 day, 4:00:40", "remaining_time": "14:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11834, "total_steps": 17941, "loss": 1.6885, "learning_rate": 2.6783554474249407e-05, "epoch": 0.6596064879326682, "percentage": 65.96, "elapsed_time": "1 day, 4:00:48", "remaining_time": "14:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11835, "total_steps": 17941, "loss": 1.7058, "learning_rate": 2.677566869123771e-05, "epoch": 0.6596622261858314, "percentage": 65.97, "elapsed_time": "1 day, 4:00:57", "remaining_time": "14:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11836, "total_steps": 17941, "loss": 1.6399, "learning_rate": 2.676778364476642e-05, "epoch": 0.6597179644389944, "percentage": 65.97, "elapsed_time": "1 day, 4:01:05", "remaining_time": "14:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11837, "total_steps": 17941, "loss": 1.6838, "learning_rate": 2.6759899335085602e-05, "epoch": 0.6597737026921576, "percentage": 65.98, "elapsed_time": "1 day, 4:01:13", "remaining_time": "14:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11838, "total_steps": 17941, "loss": 1.7896, "learning_rate": 2.6752015762445254e-05, "epoch": 0.6598294409453208, "percentage": 65.98, "elapsed_time": "1 day, 4:01:22", "remaining_time": "14:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11839, "total_steps": 17941, "loss": 1.2567, "learning_rate": 2.674413292709542e-05, "epoch": 0.6598851791984839, "percentage": 65.99, "elapsed_time": "1 day, 4:01:30", "remaining_time": "14:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11840, "total_steps": 17941, "loss": 1.5649, "learning_rate": 2.6736250829286103e-05, "epoch": 0.6599409174516471, "percentage": 65.99, "elapsed_time": "1 day, 4:01:39", "remaining_time": "14:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11841, "total_steps": 17941, "loss": 1.5569, "learning_rate": 2.6728369469267266e-05, "epoch": 0.6599966557048103, "percentage": 66.0, "elapsed_time": "1 day, 4:01:47", "remaining_time": "14:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11842, "total_steps": 17941, "loss": 1.534, "learning_rate": 2.6720488847288873e-05, "epoch": 0.6600523939579733, "percentage": 66.01, "elapsed_time": "1 day, 4:01:56", "remaining_time": "14:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11843, "total_steps": 17941, "loss": 1.722, "learning_rate": 2.6712608963600843e-05, "epoch": 0.6601081322111365, "percentage": 66.01, "elapsed_time": "1 day, 4:02:04", "remaining_time": "14:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11844, "total_steps": 17941, "loss": 1.5489, "learning_rate": 2.67047298184531e-05, "epoch": 0.6601638704642997, "percentage": 66.02, "elapsed_time": "1 day, 4:02:13", "remaining_time": "14:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11845, "total_steps": 17941, "loss": 1.8072, "learning_rate": 2.6696851412095492e-05, "epoch": 0.6602196087174628, "percentage": 66.02, "elapsed_time": "1 day, 4:02:21", "remaining_time": "14:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11846, "total_steps": 17941, "loss": 1.454, "learning_rate": 2.6688973744777884e-05, "epoch": 0.660275346970626, "percentage": 66.03, "elapsed_time": "1 day, 4:02:30", "remaining_time": "14:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11847, "total_steps": 17941, "loss": 1.663, "learning_rate": 2.6681096816750117e-05, "epoch": 0.6603310852237891, "percentage": 66.03, "elapsed_time": "1 day, 4:02:38", "remaining_time": "14:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11848, "total_steps": 17941, "loss": 1.4612, "learning_rate": 2.6673220628262e-05, "epoch": 0.6603868234769522, "percentage": 66.04, "elapsed_time": "1 day, 4:02:47", "remaining_time": "14:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11849, "total_steps": 17941, "loss": 1.5046, "learning_rate": 2.6665345179563345e-05, "epoch": 0.6604425617301154, "percentage": 66.04, "elapsed_time": "1 day, 4:02:55", "remaining_time": "14:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11850, "total_steps": 17941, "loss": 1.7277, "learning_rate": 2.6657470470903845e-05, "epoch": 0.6604982999832785, "percentage": 66.05, "elapsed_time": "1 day, 4:03:04", "remaining_time": "14:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11851, "total_steps": 17941, "loss": 1.6117, "learning_rate": 2.6649596502533323e-05, "epoch": 0.6605540382364417, "percentage": 66.06, "elapsed_time": "1 day, 4:03:13", "remaining_time": "14:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11852, "total_steps": 17941, "loss": 1.7025, "learning_rate": 2.6641723274701447e-05, "epoch": 0.6606097764896048, "percentage": 66.06, "elapsed_time": "1 day, 4:03:21", "remaining_time": "14:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11853, "total_steps": 17941, "loss": 1.3906, "learning_rate": 2.6633850787657915e-05, "epoch": 0.6606655147427679, "percentage": 66.07, "elapsed_time": "1 day, 4:03:30", "remaining_time": "14:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11854, "total_steps": 17941, "loss": 1.721, "learning_rate": 2.6625979041652406e-05, "epoch": 0.6607212529959311, "percentage": 66.07, "elapsed_time": "1 day, 4:03:38", "remaining_time": "14:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11855, "total_steps": 17941, "loss": 1.4738, "learning_rate": 2.6618108036934554e-05, "epoch": 0.6607769912490943, "percentage": 66.08, "elapsed_time": "1 day, 4:03:47", "remaining_time": "14:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11856, "total_steps": 17941, "loss": 1.6252, "learning_rate": 2.6610237773754015e-05, "epoch": 0.6608327295022574, "percentage": 66.08, "elapsed_time": "1 day, 4:03:55", "remaining_time": "14:24:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11857, "total_steps": 17941, "loss": 1.6125, "learning_rate": 2.6602368252360345e-05, "epoch": 0.6608884677554205, "percentage": 66.09, "elapsed_time": "1 day, 4:04:03", "remaining_time": "14:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11858, "total_steps": 17941, "loss": 1.6452, "learning_rate": 2.6594499473003125e-05, "epoch": 0.6609442060085837, "percentage": 66.09, "elapsed_time": "1 day, 4:04:12", "remaining_time": "14:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11859, "total_steps": 17941, "loss": 1.5554, "learning_rate": 2.658663143593193e-05, "epoch": 0.6609999442617468, "percentage": 66.1, "elapsed_time": "1 day, 4:04:20", "remaining_time": "14:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11860, "total_steps": 17941, "loss": 1.6729, "learning_rate": 2.6578764141396282e-05, "epoch": 0.66105568251491, "percentage": 66.11, "elapsed_time": "1 day, 4:04:29", "remaining_time": "14:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11861, "total_steps": 17941, "loss": 1.6435, "learning_rate": 2.6570897589645654e-05, "epoch": 0.6611114207680732, "percentage": 66.11, "elapsed_time": "1 day, 4:04:37", "remaining_time": "14:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11862, "total_steps": 17941, "loss": 1.6829, "learning_rate": 2.656303178092957e-05, "epoch": 0.6611671590212362, "percentage": 66.12, "elapsed_time": "1 day, 4:04:46", "remaining_time": "14:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11863, "total_steps": 17941, "loss": 1.6514, "learning_rate": 2.6555166715497492e-05, "epoch": 0.6612228972743994, "percentage": 66.12, "elapsed_time": "1 day, 4:04:55", "remaining_time": "14:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11864, "total_steps": 17941, "loss": 1.6465, "learning_rate": 2.6547302393598804e-05, "epoch": 0.6612786355275626, "percentage": 66.13, "elapsed_time": "1 day, 4:05:03", "remaining_time": "14:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11865, "total_steps": 17941, "loss": 1.6402, "learning_rate": 2.6539438815482955e-05, "epoch": 0.6613343737807257, "percentage": 66.13, "elapsed_time": "1 day, 4:05:12", "remaining_time": "14:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11866, "total_steps": 17941, "loss": 1.6084, "learning_rate": 2.653157598139932e-05, "epoch": 0.6613901120338889, "percentage": 66.14, "elapsed_time": "1 day, 4:05:20", "remaining_time": "14:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11867, "total_steps": 17941, "loss": 1.846, "learning_rate": 2.652371389159727e-05, "epoch": 0.661445850287052, "percentage": 66.14, "elapsed_time": "1 day, 4:05:29", "remaining_time": "14:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11868, "total_steps": 17941, "loss": 1.8253, "learning_rate": 2.6515852546326124e-05, "epoch": 0.6615015885402151, "percentage": 66.15, "elapsed_time": "1 day, 4:05:37", "remaining_time": "14:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11869, "total_steps": 17941, "loss": 1.7235, "learning_rate": 2.6507991945835227e-05, "epoch": 0.6615573267933783, "percentage": 66.16, "elapsed_time": "1 day, 4:05:46", "remaining_time": "14:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11870, "total_steps": 17941, "loss": 1.6533, "learning_rate": 2.6500132090373873e-05, "epoch": 0.6616130650465415, "percentage": 66.16, "elapsed_time": "1 day, 4:05:54", "remaining_time": "14:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11871, "total_steps": 17941, "loss": 1.711, "learning_rate": 2.649227298019129e-05, "epoch": 0.6616688032997046, "percentage": 66.17, "elapsed_time": "1 day, 4:06:03", "remaining_time": "14:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11872, "total_steps": 17941, "loss": 1.6361, "learning_rate": 2.6484414615536757e-05, "epoch": 0.6617245415528678, "percentage": 66.17, "elapsed_time": "1 day, 4:06:11", "remaining_time": "14:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11873, "total_steps": 17941, "loss": 1.6981, "learning_rate": 2.6476556996659484e-05, "epoch": 0.6617802798060308, "percentage": 66.18, "elapsed_time": "1 day, 4:06:19", "remaining_time": "14:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11874, "total_steps": 17941, "loss": 1.5684, "learning_rate": 2.646870012380867e-05, "epoch": 0.661836018059194, "percentage": 66.18, "elapsed_time": "1 day, 4:06:28", "remaining_time": "14:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11875, "total_steps": 17941, "loss": 1.5542, "learning_rate": 2.646084399723351e-05, "epoch": 0.6618917563123572, "percentage": 66.19, "elapsed_time": "1 day, 4:06:36", "remaining_time": "14:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11876, "total_steps": 17941, "loss": 1.7904, "learning_rate": 2.6452988617183106e-05, "epoch": 0.6619474945655203, "percentage": 66.19, "elapsed_time": "1 day, 4:06:45", "remaining_time": "14:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11877, "total_steps": 17941, "loss": 1.607, "learning_rate": 2.6445133983906643e-05, "epoch": 0.6620032328186835, "percentage": 66.2, "elapsed_time": "1 day, 4:06:53", "remaining_time": "14:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11878, "total_steps": 17941, "loss": 1.6927, "learning_rate": 2.643728009765318e-05, "epoch": 0.6620589710718466, "percentage": 66.21, "elapsed_time": "1 day, 4:07:02", "remaining_time": "14:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11879, "total_steps": 17941, "loss": 1.7663, "learning_rate": 2.642942695867181e-05, "epoch": 0.6621147093250097, "percentage": 66.21, "elapsed_time": "1 day, 4:07:10", "remaining_time": "14:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11880, "total_steps": 17941, "loss": 1.7458, "learning_rate": 2.6421574567211595e-05, "epoch": 0.6621704475781729, "percentage": 66.22, "elapsed_time": "1 day, 4:07:19", "remaining_time": "14:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11881, "total_steps": 17941, "loss": 1.6295, "learning_rate": 2.6413722923521555e-05, "epoch": 0.6622261858313361, "percentage": 66.22, "elapsed_time": "1 day, 4:07:27", "remaining_time": "14:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11882, "total_steps": 17941, "loss": 1.5865, "learning_rate": 2.6405872027850732e-05, "epoch": 0.6622819240844992, "percentage": 66.23, "elapsed_time": "1 day, 4:07:36", "remaining_time": "14:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11883, "total_steps": 17941, "loss": 1.6666, "learning_rate": 2.6398021880448066e-05, "epoch": 0.6623376623376623, "percentage": 66.23, "elapsed_time": "1 day, 4:07:45", "remaining_time": "14:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11884, "total_steps": 17941, "loss": 1.7405, "learning_rate": 2.6390172481562537e-05, "epoch": 0.6623934005908255, "percentage": 66.24, "elapsed_time": "1 day, 4:07:53", "remaining_time": "14:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11885, "total_steps": 17941, "loss": 1.6778, "learning_rate": 2.6382323831443078e-05, "epoch": 0.6624491388439886, "percentage": 66.24, "elapsed_time": "1 day, 4:08:02", "remaining_time": "14:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11886, "total_steps": 17941, "loss": 1.6827, "learning_rate": 2.6374475930338625e-05, "epoch": 0.6625048770971518, "percentage": 66.25, "elapsed_time": "1 day, 4:08:10", "remaining_time": "14:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11887, "total_steps": 17941, "loss": 1.8122, "learning_rate": 2.6366628778498017e-05, "epoch": 0.662560615350315, "percentage": 66.26, "elapsed_time": "1 day, 4:08:19", "remaining_time": "14:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11888, "total_steps": 17941, "loss": 1.724, "learning_rate": 2.6358782376170164e-05, "epoch": 0.662616353603478, "percentage": 66.26, "elapsed_time": "1 day, 4:08:27", "remaining_time": "14:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11889, "total_steps": 17941, "loss": 1.5148, "learning_rate": 2.6350936723603923e-05, "epoch": 0.6626720918566412, "percentage": 66.27, "elapsed_time": "1 day, 4:08:36", "remaining_time": "14:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11890, "total_steps": 17941, "loss": 1.7194, "learning_rate": 2.634309182104806e-05, "epoch": 0.6627278301098044, "percentage": 66.27, "elapsed_time": "1 day, 4:08:44", "remaining_time": "14:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11891, "total_steps": 17941, "loss": 1.667, "learning_rate": 2.63352476687514e-05, "epoch": 0.6627835683629675, "percentage": 66.28, "elapsed_time": "1 day, 4:08:52", "remaining_time": "14:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11892, "total_steps": 17941, "loss": 1.6988, "learning_rate": 2.6327404266962707e-05, "epoch": 0.6628393066161307, "percentage": 66.28, "elapsed_time": "1 day, 4:09:01", "remaining_time": "14:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11893, "total_steps": 17941, "loss": 1.4099, "learning_rate": 2.6319561615930732e-05, "epoch": 0.6628950448692938, "percentage": 66.29, "elapsed_time": "1 day, 4:09:09", "remaining_time": "14:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11894, "total_steps": 17941, "loss": 1.7522, "learning_rate": 2.6311719715904193e-05, "epoch": 0.6629507831224569, "percentage": 66.3, "elapsed_time": "1 day, 4:09:18", "remaining_time": "14:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11895, "total_steps": 17941, "loss": 1.5786, "learning_rate": 2.630387856713179e-05, "epoch": 0.6630065213756201, "percentage": 66.3, "elapsed_time": "1 day, 4:09:27", "remaining_time": "14:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11896, "total_steps": 17941, "loss": 1.5653, "learning_rate": 2.6296038169862226e-05, "epoch": 0.6630622596287832, "percentage": 66.31, "elapsed_time": "1 day, 4:09:35", "remaining_time": "14:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11897, "total_steps": 17941, "loss": 1.6283, "learning_rate": 2.6288198524344106e-05, "epoch": 0.6631179978819464, "percentage": 66.31, "elapsed_time": "1 day, 4:09:44", "remaining_time": "14:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11898, "total_steps": 17941, "loss": 1.6296, "learning_rate": 2.6280359630826078e-05, "epoch": 0.6631737361351095, "percentage": 66.32, "elapsed_time": "1 day, 4:09:53", "remaining_time": "14:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11899, "total_steps": 17941, "loss": 1.5074, "learning_rate": 2.6272521489556746e-05, "epoch": 0.6632294743882726, "percentage": 66.32, "elapsed_time": "1 day, 4:10:01", "remaining_time": "14:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11900, "total_steps": 17941, "loss": 1.4944, "learning_rate": 2.62646841007847e-05, "epoch": 0.6632852126414358, "percentage": 66.33, "elapsed_time": "1 day, 4:10:10", "remaining_time": "14:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11901, "total_steps": 17941, "loss": 1.7095, "learning_rate": 2.6256847464758495e-05, "epoch": 0.663340950894599, "percentage": 66.33, "elapsed_time": "1 day, 4:10:18", "remaining_time": "14:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11902, "total_steps": 17941, "loss": 1.6111, "learning_rate": 2.6249011581726625e-05, "epoch": 0.6633966891477621, "percentage": 66.34, "elapsed_time": "1 day, 4:10:27", "remaining_time": "14:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11903, "total_steps": 17941, "loss": 1.7611, "learning_rate": 2.6241176451937664e-05, "epoch": 0.6634524274009252, "percentage": 66.35, "elapsed_time": "1 day, 4:10:35", "remaining_time": "14:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11904, "total_steps": 17941, "loss": 1.6979, "learning_rate": 2.623334207564005e-05, "epoch": 0.6635081656540884, "percentage": 66.35, "elapsed_time": "1 day, 4:10:44", "remaining_time": "14:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11905, "total_steps": 17941, "loss": 1.8504, "learning_rate": 2.6225508453082247e-05, "epoch": 0.6635639039072515, "percentage": 66.36, "elapsed_time": "1 day, 4:10:52", "remaining_time": "14:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11906, "total_steps": 17941, "loss": 1.4962, "learning_rate": 2.6217675584512713e-05, "epoch": 0.6636196421604147, "percentage": 66.36, "elapsed_time": "1 day, 4:11:00", "remaining_time": "14:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11907, "total_steps": 17941, "loss": 1.5897, "learning_rate": 2.620984347017984e-05, "epoch": 0.6636753804135779, "percentage": 66.37, "elapsed_time": "1 day, 4:11:09", "remaining_time": "14:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11908, "total_steps": 17941, "loss": 1.565, "learning_rate": 2.6202012110332046e-05, "epoch": 0.663731118666741, "percentage": 66.37, "elapsed_time": "1 day, 4:11:17", "remaining_time": "14:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11909, "total_steps": 17941, "loss": 1.8616, "learning_rate": 2.619418150521766e-05, "epoch": 0.6637868569199041, "percentage": 66.38, "elapsed_time": "1 day, 4:11:26", "remaining_time": "14:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11910, "total_steps": 17941, "loss": 1.7539, "learning_rate": 2.6186351655085036e-05, "epoch": 0.6638425951730673, "percentage": 66.38, "elapsed_time": "1 day, 4:11:34", "remaining_time": "14:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11911, "total_steps": 17941, "loss": 1.5453, "learning_rate": 2.6178522560182496e-05, "epoch": 0.6638983334262304, "percentage": 66.39, "elapsed_time": "1 day, 4:11:43", "remaining_time": "14:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11912, "total_steps": 17941, "loss": 1.6533, "learning_rate": 2.6170694220758352e-05, "epoch": 0.6639540716793936, "percentage": 66.4, "elapsed_time": "1 day, 4:11:51", "remaining_time": "14:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11913, "total_steps": 17941, "loss": 1.5123, "learning_rate": 2.6162866637060812e-05, "epoch": 0.6640098099325568, "percentage": 66.4, "elapsed_time": "1 day, 4:12:00", "remaining_time": "14:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11914, "total_steps": 17941, "loss": 1.7104, "learning_rate": 2.6155039809338178e-05, "epoch": 0.6640655481857198, "percentage": 66.41, "elapsed_time": "1 day, 4:12:09", "remaining_time": "14:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11915, "total_steps": 17941, "loss": 1.6117, "learning_rate": 2.6147213737838682e-05, "epoch": 0.664121286438883, "percentage": 66.41, "elapsed_time": "1 day, 4:12:18", "remaining_time": "14:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11916, "total_steps": 17941, "loss": 1.9683, "learning_rate": 2.6139388422810468e-05, "epoch": 0.6641770246920462, "percentage": 66.42, "elapsed_time": "1 day, 4:12:26", "remaining_time": "14:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11917, "total_steps": 17941, "loss": 1.5635, "learning_rate": 2.613156386450174e-05, "epoch": 0.6642327629452093, "percentage": 66.42, "elapsed_time": "1 day, 4:12:34", "remaining_time": "14:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11918, "total_steps": 17941, "loss": 1.6013, "learning_rate": 2.6123740063160646e-05, "epoch": 0.6642885011983725, "percentage": 66.43, "elapsed_time": "1 day, 4:12:43", "remaining_time": "14:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11919, "total_steps": 17941, "loss": 1.6931, "learning_rate": 2.6115917019035326e-05, "epoch": 0.6643442394515355, "percentage": 66.43, "elapsed_time": "1 day, 4:12:51", "remaining_time": "14:15:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11920, "total_steps": 17941, "loss": 1.397, "learning_rate": 2.6108094732373823e-05, "epoch": 0.6643999777046987, "percentage": 66.44, "elapsed_time": "1 day, 4:13:00", "remaining_time": "14:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11921, "total_steps": 17941, "loss": 1.5599, "learning_rate": 2.610027320342428e-05, "epoch": 0.6644557159578619, "percentage": 66.45, "elapsed_time": "1 day, 4:13:08", "remaining_time": "14:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11922, "total_steps": 17941, "loss": 1.5155, "learning_rate": 2.6092452432434745e-05, "epoch": 0.664511454211025, "percentage": 66.45, "elapsed_time": "1 day, 4:13:17", "remaining_time": "14:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11923, "total_steps": 17941, "loss": 1.6088, "learning_rate": 2.6084632419653206e-05, "epoch": 0.6645671924641882, "percentage": 66.46, "elapsed_time": "1 day, 4:13:25", "remaining_time": "14:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11924, "total_steps": 17941, "loss": 1.6295, "learning_rate": 2.6076813165327692e-05, "epoch": 0.6646229307173513, "percentage": 66.46, "elapsed_time": "1 day, 4:13:34", "remaining_time": "14:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11925, "total_steps": 17941, "loss": 1.7028, "learning_rate": 2.606899466970618e-05, "epoch": 0.6646786689705144, "percentage": 66.47, "elapsed_time": "1 day, 4:13:42", "remaining_time": "14:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11926, "total_steps": 17941, "loss": 1.7271, "learning_rate": 2.6061176933036636e-05, "epoch": 0.6647344072236776, "percentage": 66.47, "elapsed_time": "1 day, 4:13:50", "remaining_time": "14:14:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11927, "total_steps": 17941, "loss": 1.6711, "learning_rate": 2.6053359955566997e-05, "epoch": 0.6647901454768408, "percentage": 66.48, "elapsed_time": "1 day, 4:13:59", "remaining_time": "14:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11928, "total_steps": 17941, "loss": 1.6863, "learning_rate": 2.604554373754513e-05, "epoch": 0.6648458837300039, "percentage": 66.48, "elapsed_time": "1 day, 4:14:07", "remaining_time": "14:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11929, "total_steps": 17941, "loss": 1.6041, "learning_rate": 2.6037728279218986e-05, "epoch": 0.664901621983167, "percentage": 66.49, "elapsed_time": "1 day, 4:14:16", "remaining_time": "14:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11930, "total_steps": 17941, "loss": 1.5647, "learning_rate": 2.6029913580836372e-05, "epoch": 0.6649573602363302, "percentage": 66.5, "elapsed_time": "1 day, 4:14:25", "remaining_time": "14:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11931, "total_steps": 17941, "loss": 1.489, "learning_rate": 2.6022099642645147e-05, "epoch": 0.6650130984894933, "percentage": 66.5, "elapsed_time": "1 day, 4:14:33", "remaining_time": "14:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11932, "total_steps": 17941, "loss": 1.7557, "learning_rate": 2.6014286464893116e-05, "epoch": 0.6650688367426565, "percentage": 66.51, "elapsed_time": "1 day, 4:14:42", "remaining_time": "14:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11933, "total_steps": 17941, "loss": 1.5685, "learning_rate": 2.600647404782808e-05, "epoch": 0.6651245749958197, "percentage": 66.51, "elapsed_time": "1 day, 4:14:50", "remaining_time": "14:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11934, "total_steps": 17941, "loss": 1.8277, "learning_rate": 2.5998662391697805e-05, "epoch": 0.6651803132489827, "percentage": 66.52, "elapsed_time": "1 day, 4:14:59", "remaining_time": "14:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11935, "total_steps": 17941, "loss": 1.7789, "learning_rate": 2.599085149674999e-05, "epoch": 0.6652360515021459, "percentage": 66.52, "elapsed_time": "1 day, 4:15:07", "remaining_time": "14:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11936, "total_steps": 17941, "loss": 1.8216, "learning_rate": 2.5983041363232418e-05, "epoch": 0.6652917897553091, "percentage": 66.53, "elapsed_time": "1 day, 4:15:16", "remaining_time": "14:12:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11937, "total_steps": 17941, "loss": 1.7176, "learning_rate": 2.5975231991392725e-05, "epoch": 0.6653475280084722, "percentage": 66.53, "elapsed_time": "1 day, 4:15:24", "remaining_time": "14:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11938, "total_steps": 17941, "loss": 1.656, "learning_rate": 2.5967423381478616e-05, "epoch": 0.6654032662616354, "percentage": 66.54, "elapsed_time": "1 day, 4:15:32", "remaining_time": "14:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11939, "total_steps": 17941, "loss": 1.4709, "learning_rate": 2.5959615533737685e-05, "epoch": 0.6654590045147986, "percentage": 66.55, "elapsed_time": "1 day, 4:15:41", "remaining_time": "14:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11940, "total_steps": 17941, "loss": 1.6504, "learning_rate": 2.5951808448417602e-05, "epoch": 0.6655147427679616, "percentage": 66.55, "elapsed_time": "1 day, 4:15:49", "remaining_time": "14:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11941, "total_steps": 17941, "loss": 1.5995, "learning_rate": 2.5944002125765964e-05, "epoch": 0.6655704810211248, "percentage": 66.56, "elapsed_time": "1 day, 4:15:58", "remaining_time": "14:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11942, "total_steps": 17941, "loss": 1.8318, "learning_rate": 2.5936196566030302e-05, "epoch": 0.6656262192742879, "percentage": 66.56, "elapsed_time": "1 day, 4:16:06", "remaining_time": "14:12:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11943, "total_steps": 17941, "loss": 1.5158, "learning_rate": 2.5928391769458183e-05, "epoch": 0.6656819575274511, "percentage": 66.57, "elapsed_time": "1 day, 4:16:15", "remaining_time": "14:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11944, "total_steps": 17941, "loss": 1.5724, "learning_rate": 2.592058773629713e-05, "epoch": 0.6657376957806143, "percentage": 66.57, "elapsed_time": "1 day, 4:16:23", "remaining_time": "14:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11945, "total_steps": 17941, "loss": 1.6876, "learning_rate": 2.591278446679466e-05, "epoch": 0.6657934340337773, "percentage": 66.58, "elapsed_time": "1 day, 4:16:32", "remaining_time": "14:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11946, "total_steps": 17941, "loss": 1.6439, "learning_rate": 2.5904981961198187e-05, "epoch": 0.6658491722869405, "percentage": 66.58, "elapsed_time": "1 day, 4:16:40", "remaining_time": "14:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11947, "total_steps": 17941, "loss": 1.4966, "learning_rate": 2.5897180219755223e-05, "epoch": 0.6659049105401037, "percentage": 66.59, "elapsed_time": "1 day, 4:16:49", "remaining_time": "14:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11948, "total_steps": 17941, "loss": 1.6051, "learning_rate": 2.5889379242713197e-05, "epoch": 0.6659606487932668, "percentage": 66.6, "elapsed_time": "1 day, 4:16:57", "remaining_time": "14:11:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11949, "total_steps": 17941, "loss": 1.768, "learning_rate": 2.588157903031947e-05, "epoch": 0.66601638704643, "percentage": 66.6, "elapsed_time": "1 day, 4:17:05", "remaining_time": "14:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11950, "total_steps": 17941, "loss": 1.6705, "learning_rate": 2.5873779582821428e-05, "epoch": 0.6660721252995931, "percentage": 66.61, "elapsed_time": "1 day, 4:17:14", "remaining_time": "14:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11951, "total_steps": 17941, "loss": 1.7035, "learning_rate": 2.5865980900466436e-05, "epoch": 0.6661278635527562, "percentage": 66.61, "elapsed_time": "1 day, 4:17:22", "remaining_time": "14:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11952, "total_steps": 17941, "loss": 1.6159, "learning_rate": 2.5858182983501817e-05, "epoch": 0.6661836018059194, "percentage": 66.62, "elapsed_time": "1 day, 4:17:31", "remaining_time": "14:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11953, "total_steps": 17941, "loss": 1.5236, "learning_rate": 2.5850385832174896e-05, "epoch": 0.6662393400590826, "percentage": 66.62, "elapsed_time": "1 day, 4:17:39", "remaining_time": "14:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11954, "total_steps": 17941, "loss": 1.5456, "learning_rate": 2.58425894467329e-05, "epoch": 0.6662950783122457, "percentage": 66.63, "elapsed_time": "1 day, 4:17:48", "remaining_time": "14:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11955, "total_steps": 17941, "loss": 1.8465, "learning_rate": 2.5834793827423155e-05, "epoch": 0.6663508165654088, "percentage": 66.64, "elapsed_time": "1 day, 4:17:56", "remaining_time": "14:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11956, "total_steps": 17941, "loss": 1.7157, "learning_rate": 2.582699897449284e-05, "epoch": 0.666406554818572, "percentage": 66.64, "elapsed_time": "1 day, 4:18:05", "remaining_time": "14:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11957, "total_steps": 17941, "loss": 1.5398, "learning_rate": 2.5819204888189173e-05, "epoch": 0.6664622930717351, "percentage": 66.65, "elapsed_time": "1 day, 4:18:14", "remaining_time": "14:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11958, "total_steps": 17941, "loss": 1.4759, "learning_rate": 2.5811411568759346e-05, "epoch": 0.6665180313248983, "percentage": 66.65, "elapsed_time": "1 day, 4:18:22", "remaining_time": "14:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11959, "total_steps": 17941, "loss": 1.6772, "learning_rate": 2.5803619016450518e-05, "epoch": 0.6665737695780615, "percentage": 66.66, "elapsed_time": "1 day, 4:18:31", "remaining_time": "14:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11960, "total_steps": 17941, "loss": 1.6816, "learning_rate": 2.579582723150984e-05, "epoch": 0.6666295078312245, "percentage": 66.66, "elapsed_time": "1 day, 4:18:39", "remaining_time": "14:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11961, "total_steps": 17941, "loss": 1.7645, "learning_rate": 2.578803621418436e-05, "epoch": 0.6666852460843877, "percentage": 66.67, "elapsed_time": "1 day, 4:18:48", "remaining_time": "14:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11962, "total_steps": 17941, "loss": 1.6954, "learning_rate": 2.5780245964721244e-05, "epoch": 0.6667409843375509, "percentage": 66.67, "elapsed_time": "1 day, 4:18:56", "remaining_time": "14:09:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11963, "total_steps": 17941, "loss": 1.4321, "learning_rate": 2.5772456483367497e-05, "epoch": 0.666796722590714, "percentage": 66.68, "elapsed_time": "1 day, 4:19:04", "remaining_time": "14:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11964, "total_steps": 17941, "loss": 1.5843, "learning_rate": 2.5764667770370195e-05, "epoch": 0.6668524608438772, "percentage": 66.69, "elapsed_time": "1 day, 4:19:13", "remaining_time": "14:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11965, "total_steps": 17941, "loss": 1.6635, "learning_rate": 2.5756879825976287e-05, "epoch": 0.6669081990970402, "percentage": 66.69, "elapsed_time": "1 day, 4:19:21", "remaining_time": "14:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11966, "total_steps": 17941, "loss": 1.5231, "learning_rate": 2.5749092650432828e-05, "epoch": 0.6669639373502034, "percentage": 66.7, "elapsed_time": "1 day, 4:19:30", "remaining_time": "14:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11967, "total_steps": 17941, "loss": 1.5618, "learning_rate": 2.5741306243986773e-05, "epoch": 0.6670196756033666, "percentage": 66.7, "elapsed_time": "1 day, 4:19:38", "remaining_time": "14:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11968, "total_steps": 17941, "loss": 1.6768, "learning_rate": 2.5733520606885024e-05, "epoch": 0.6670754138565297, "percentage": 66.71, "elapsed_time": "1 day, 4:19:47", "remaining_time": "14:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11969, "total_steps": 17941, "loss": 1.9559, "learning_rate": 2.5725735739374523e-05, "epoch": 0.6671311521096929, "percentage": 66.71, "elapsed_time": "1 day, 4:19:55", "remaining_time": "14:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11970, "total_steps": 17941, "loss": 1.1981, "learning_rate": 2.5717951641702155e-05, "epoch": 0.667186890362856, "percentage": 66.72, "elapsed_time": "1 day, 4:20:04", "remaining_time": "14:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11971, "total_steps": 17941, "loss": 1.5034, "learning_rate": 2.5710168314114802e-05, "epoch": 0.6672426286160191, "percentage": 66.72, "elapsed_time": "1 day, 4:20:12", "remaining_time": "14:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11972, "total_steps": 17941, "loss": 1.5647, "learning_rate": 2.570238575685926e-05, "epoch": 0.6672983668691823, "percentage": 66.73, "elapsed_time": "1 day, 4:20:21", "remaining_time": "14:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11973, "total_steps": 17941, "loss": 1.9909, "learning_rate": 2.5694603970182384e-05, "epoch": 0.6673541051223455, "percentage": 66.74, "elapsed_time": "1 day, 4:20:29", "remaining_time": "14:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11974, "total_steps": 17941, "loss": 1.7471, "learning_rate": 2.568682295433099e-05, "epoch": 0.6674098433755086, "percentage": 66.74, "elapsed_time": "1 day, 4:20:38", "remaining_time": "14:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11975, "total_steps": 17941, "loss": 1.376, "learning_rate": 2.5679042709551793e-05, "epoch": 0.6674655816286718, "percentage": 66.75, "elapsed_time": "1 day, 4:20:46", "remaining_time": "14:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11976, "total_steps": 17941, "loss": 1.6064, "learning_rate": 2.5671263236091557e-05, "epoch": 0.6675213198818349, "percentage": 66.75, "elapsed_time": "1 day, 4:20:55", "remaining_time": "14:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11977, "total_steps": 17941, "loss": 1.6715, "learning_rate": 2.5663484534197014e-05, "epoch": 0.667577058134998, "percentage": 66.76, "elapsed_time": "1 day, 4:21:03", "remaining_time": "14:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11978, "total_steps": 17941, "loss": 1.5901, "learning_rate": 2.5655706604114844e-05, "epoch": 0.6676327963881612, "percentage": 66.76, "elapsed_time": "1 day, 4:21:12", "remaining_time": "14:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11979, "total_steps": 17941, "loss": 1.5659, "learning_rate": 2.5647929446091746e-05, "epoch": 0.6676885346413244, "percentage": 66.77, "elapsed_time": "1 day, 4:21:20", "remaining_time": "14:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11980, "total_steps": 17941, "loss": 1.7662, "learning_rate": 2.5640153060374293e-05, "epoch": 0.6677442728944875, "percentage": 66.77, "elapsed_time": "1 day, 4:21:29", "remaining_time": "14:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11981, "total_steps": 17941, "loss": 1.5056, "learning_rate": 2.563237744720921e-05, "epoch": 0.6678000111476506, "percentage": 66.78, "elapsed_time": "1 day, 4:21:38", "remaining_time": "14:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11982, "total_steps": 17941, "loss": 1.5221, "learning_rate": 2.5624602606843017e-05, "epoch": 0.6678557494008138, "percentage": 66.79, "elapsed_time": "1 day, 4:21:46", "remaining_time": "14:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11983, "total_steps": 17941, "loss": 1.6958, "learning_rate": 2.561682853952231e-05, "epoch": 0.6679114876539769, "percentage": 66.79, "elapsed_time": "1 day, 4:21:55", "remaining_time": "14:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11984, "total_steps": 17941, "loss": 1.7868, "learning_rate": 2.560905524549364e-05, "epoch": 0.6679672259071401, "percentage": 66.8, "elapsed_time": "1 day, 4:22:03", "remaining_time": "14:06:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11985, "total_steps": 17941, "loss": 1.3076, "learning_rate": 2.5601282725003522e-05, "epoch": 0.6680229641603033, "percentage": 66.8, "elapsed_time": "1 day, 4:22:12", "remaining_time": "14:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11986, "total_steps": 17941, "loss": 1.9535, "learning_rate": 2.5593510978298486e-05, "epoch": 0.6680787024134663, "percentage": 66.81, "elapsed_time": "1 day, 4:22:20", "remaining_time": "14:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11987, "total_steps": 17941, "loss": 1.5529, "learning_rate": 2.5585740005624947e-05, "epoch": 0.6681344406666295, "percentage": 66.81, "elapsed_time": "1 day, 4:22:28", "remaining_time": "14:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11988, "total_steps": 17941, "loss": 1.5102, "learning_rate": 2.5577969807229422e-05, "epoch": 0.6681901789197926, "percentage": 66.82, "elapsed_time": "1 day, 4:22:38", "remaining_time": "14:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11989, "total_steps": 17941, "loss": 1.5665, "learning_rate": 2.557020038335829e-05, "epoch": 0.6682459171729558, "percentage": 66.82, "elapsed_time": "1 day, 4:22:46", "remaining_time": "14:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11990, "total_steps": 17941, "loss": 1.5837, "learning_rate": 2.5562431734257987e-05, "epoch": 0.668301655426119, "percentage": 66.83, "elapsed_time": "1 day, 4:22:55", "remaining_time": "14:05:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11991, "total_steps": 17941, "loss": 1.673, "learning_rate": 2.5554663860174823e-05, "epoch": 0.668357393679282, "percentage": 66.84, "elapsed_time": "1 day, 4:23:03", "remaining_time": "14:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11992, "total_steps": 17941, "loss": 1.6438, "learning_rate": 2.5546896761355216e-05, "epoch": 0.6684131319324452, "percentage": 66.84, "elapsed_time": "1 day, 4:23:12", "remaining_time": "14:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11993, "total_steps": 17941, "loss": 1.6323, "learning_rate": 2.5539130438045494e-05, "epoch": 0.6684688701856084, "percentage": 66.85, "elapsed_time": "1 day, 4:23:21", "remaining_time": "14:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11994, "total_steps": 17941, "loss": 1.6362, "learning_rate": 2.5531364890491916e-05, "epoch": 0.6685246084387715, "percentage": 66.85, "elapsed_time": "1 day, 4:23:29", "remaining_time": "14:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11995, "total_steps": 17941, "loss": 1.7689, "learning_rate": 2.5523600118940784e-05, "epoch": 0.6685803466919347, "percentage": 66.86, "elapsed_time": "1 day, 4:23:38", "remaining_time": "14:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11996, "total_steps": 17941, "loss": 1.7699, "learning_rate": 2.551583612363835e-05, "epoch": 0.6686360849450979, "percentage": 66.86, "elapsed_time": "1 day, 4:23:46", "remaining_time": "14:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11997, "total_steps": 17941, "loss": 1.6291, "learning_rate": 2.550807290483086e-05, "epoch": 0.6686918231982609, "percentage": 66.87, "elapsed_time": "1 day, 4:23:55", "remaining_time": "14:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11998, "total_steps": 17941, "loss": 1.4974, "learning_rate": 2.5500310462764458e-05, "epoch": 0.6687475614514241, "percentage": 66.87, "elapsed_time": "1 day, 4:24:04", "remaining_time": "14:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11999, "total_steps": 17941, "loss": 1.742, "learning_rate": 2.549254879768539e-05, "epoch": 0.6688032997045873, "percentage": 66.88, "elapsed_time": "1 day, 4:24:12", "remaining_time": "14:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12000, "total_steps": 17941, "loss": 1.6044, "learning_rate": 2.54847879098398e-05, "epoch": 0.6688590379577504, "percentage": 66.89, "elapsed_time": "1 day, 4:24:21", "remaining_time": "14:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12001, "total_steps": 17941, "loss": 1.6588, "learning_rate": 2.5477027799473786e-05, "epoch": 0.6689147762109136, "percentage": 66.89, "elapsed_time": "1 day, 4:24:30", "remaining_time": "14:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12002, "total_steps": 17941, "loss": 1.5768, "learning_rate": 2.5469268466833474e-05, "epoch": 0.6689705144640767, "percentage": 66.9, "elapsed_time": "1 day, 4:24:39", "remaining_time": "14:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12003, "total_steps": 17941, "loss": 1.7623, "learning_rate": 2.5461509912164937e-05, "epoch": 0.6690262527172398, "percentage": 66.9, "elapsed_time": "1 day, 4:24:47", "remaining_time": "14:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12004, "total_steps": 17941, "loss": 1.6399, "learning_rate": 2.5453752135714237e-05, "epoch": 0.669081990970403, "percentage": 66.91, "elapsed_time": "1 day, 4:24:56", "remaining_time": "14:03:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12005, "total_steps": 17941, "loss": 1.6047, "learning_rate": 2.5445995137727428e-05, "epoch": 0.6691377292235662, "percentage": 66.91, "elapsed_time": "1 day, 4:25:05", "remaining_time": "14:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12006, "total_steps": 17941, "loss": 1.6891, "learning_rate": 2.5438238918450453e-05, "epoch": 0.6691934674767293, "percentage": 66.92, "elapsed_time": "1 day, 4:25:13", "remaining_time": "14:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12007, "total_steps": 17941, "loss": 1.6847, "learning_rate": 2.5430483478129374e-05, "epoch": 0.6692492057298924, "percentage": 66.92, "elapsed_time": "1 day, 4:25:22", "remaining_time": "14:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12008, "total_steps": 17941, "loss": 1.7936, "learning_rate": 2.5422728817010088e-05, "epoch": 0.6693049439830556, "percentage": 66.93, "elapsed_time": "1 day, 4:25:30", "remaining_time": "14:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12009, "total_steps": 17941, "loss": 1.5723, "learning_rate": 2.5414974935338553e-05, "epoch": 0.6693606822362187, "percentage": 66.94, "elapsed_time": "1 day, 4:25:39", "remaining_time": "14:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12010, "total_steps": 17941, "loss": 1.9559, "learning_rate": 2.540722183336066e-05, "epoch": 0.6694164204893819, "percentage": 66.94, "elapsed_time": "1 day, 4:25:47", "remaining_time": "14:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12011, "total_steps": 17941, "loss": 1.5012, "learning_rate": 2.5399469511322316e-05, "epoch": 0.669472158742545, "percentage": 66.95, "elapsed_time": "1 day, 4:25:55", "remaining_time": "14:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12012, "total_steps": 17941, "loss": 1.7371, "learning_rate": 2.5391717969469387e-05, "epoch": 0.6695278969957081, "percentage": 66.95, "elapsed_time": "1 day, 4:26:04", "remaining_time": "14:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12013, "total_steps": 17941, "loss": 1.5257, "learning_rate": 2.5383967208047642e-05, "epoch": 0.6695836352488713, "percentage": 66.96, "elapsed_time": "1 day, 4:26:12", "remaining_time": "14:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12014, "total_steps": 17941, "loss": 1.5169, "learning_rate": 2.5376217227302985e-05, "epoch": 0.6696393735020344, "percentage": 66.96, "elapsed_time": "1 day, 4:26:21", "remaining_time": "14:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12015, "total_steps": 17941, "loss": 1.763, "learning_rate": 2.5368468027481125e-05, "epoch": 0.6696951117551976, "percentage": 66.97, "elapsed_time": "1 day, 4:26:29", "remaining_time": "14:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12016, "total_steps": 17941, "loss": 1.5319, "learning_rate": 2.5360719608827843e-05, "epoch": 0.6697508500083608, "percentage": 66.98, "elapsed_time": "1 day, 4:26:39", "remaining_time": "14:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12017, "total_steps": 17941, "loss": 1.5549, "learning_rate": 2.535297197158889e-05, "epoch": 0.6698065882615238, "percentage": 66.98, "elapsed_time": "1 day, 4:26:48", "remaining_time": "14:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12018, "total_steps": 17941, "loss": 1.6838, "learning_rate": 2.5345225116009952e-05, "epoch": 0.669862326514687, "percentage": 66.99, "elapsed_time": "1 day, 4:26:56", "remaining_time": "14:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12019, "total_steps": 17941, "loss": 1.4308, "learning_rate": 2.5337479042336755e-05, "epoch": 0.6699180647678502, "percentage": 66.99, "elapsed_time": "1 day, 4:27:05", "remaining_time": "14:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12020, "total_steps": 17941, "loss": 1.7362, "learning_rate": 2.5329733750814903e-05, "epoch": 0.6699738030210133, "percentage": 67.0, "elapsed_time": "1 day, 4:27:13", "remaining_time": "14:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12021, "total_steps": 17941, "loss": 1.7953, "learning_rate": 2.532198924169006e-05, "epoch": 0.6700295412741765, "percentage": 67.0, "elapsed_time": "1 day, 4:27:22", "remaining_time": "14:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12022, "total_steps": 17941, "loss": 1.9502, "learning_rate": 2.531424551520784e-05, "epoch": 0.6700852795273397, "percentage": 67.01, "elapsed_time": "1 day, 4:27:30", "remaining_time": "14:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12023, "total_steps": 17941, "loss": 1.5504, "learning_rate": 2.5306502571613843e-05, "epoch": 0.6701410177805027, "percentage": 67.01, "elapsed_time": "1 day, 4:27:39", "remaining_time": "14:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12024, "total_steps": 17941, "loss": 1.5688, "learning_rate": 2.5298760411153567e-05, "epoch": 0.6701967560336659, "percentage": 67.02, "elapsed_time": "1 day, 4:27:47", "remaining_time": "14:00:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12025, "total_steps": 17941, "loss": 1.6796, "learning_rate": 2.5291019034072616e-05, "epoch": 0.6702524942868291, "percentage": 67.03, "elapsed_time": "1 day, 4:27:56", "remaining_time": "14:00:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12026, "total_steps": 17941, "loss": 1.8635, "learning_rate": 2.52832784406165e-05, "epoch": 0.6703082325399922, "percentage": 67.03, "elapsed_time": "1 day, 4:28:04", "remaining_time": "14:00:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12027, "total_steps": 17941, "loss": 1.5262, "learning_rate": 2.5275538631030658e-05, "epoch": 0.6703639707931554, "percentage": 67.04, "elapsed_time": "1 day, 4:28:12", "remaining_time": "13:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12028, "total_steps": 17941, "loss": 1.7629, "learning_rate": 2.5267799605560584e-05, "epoch": 0.6704197090463185, "percentage": 67.04, "elapsed_time": "1 day, 4:28:21", "remaining_time": "13:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12029, "total_steps": 17941, "loss": 1.7794, "learning_rate": 2.5260061364451703e-05, "epoch": 0.6704754472994816, "percentage": 67.05, "elapsed_time": "1 day, 4:28:29", "remaining_time": "13:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12030, "total_steps": 17941, "loss": 1.5772, "learning_rate": 2.5252323907949448e-05, "epoch": 0.6705311855526448, "percentage": 67.05, "elapsed_time": "1 day, 4:28:38", "remaining_time": "13:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12031, "total_steps": 17941, "loss": 1.7015, "learning_rate": 2.5244587236299177e-05, "epoch": 0.670586923805808, "percentage": 67.06, "elapsed_time": "1 day, 4:28:46", "remaining_time": "13:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12032, "total_steps": 17941, "loss": 1.5979, "learning_rate": 2.5236851349746245e-05, "epoch": 0.670642662058971, "percentage": 67.06, "elapsed_time": "1 day, 4:28:55", "remaining_time": "13:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12033, "total_steps": 17941, "loss": 1.6631, "learning_rate": 2.5229116248536044e-05, "epoch": 0.6706984003121342, "percentage": 67.07, "elapsed_time": "1 day, 4:29:03", "remaining_time": "13:59:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12034, "total_steps": 17941, "loss": 1.5784, "learning_rate": 2.5221381932913835e-05, "epoch": 0.6707541385652973, "percentage": 67.08, "elapsed_time": "1 day, 4:29:11", "remaining_time": "13:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12035, "total_steps": 17941, "loss": 1.5644, "learning_rate": 2.5213648403124918e-05, "epoch": 0.6708098768184605, "percentage": 67.08, "elapsed_time": "1 day, 4:29:20", "remaining_time": "13:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12036, "total_steps": 17941, "loss": 1.7091, "learning_rate": 2.520591565941456e-05, "epoch": 0.6708656150716237, "percentage": 67.09, "elapsed_time": "1 day, 4:29:28", "remaining_time": "13:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12037, "total_steps": 17941, "loss": 1.4581, "learning_rate": 2.5198183702028e-05, "epoch": 0.6709213533247868, "percentage": 67.09, "elapsed_time": "1 day, 4:29:38", "remaining_time": "13:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12038, "total_steps": 17941, "loss": 1.4818, "learning_rate": 2.5190452531210463e-05, "epoch": 0.6709770915779499, "percentage": 67.1, "elapsed_time": "1 day, 4:29:46", "remaining_time": "13:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12039, "total_steps": 17941, "loss": 1.5246, "learning_rate": 2.5182722147207088e-05, "epoch": 0.6710328298311131, "percentage": 67.1, "elapsed_time": "1 day, 4:29:55", "remaining_time": "13:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12040, "total_steps": 17941, "loss": 1.5696, "learning_rate": 2.517499255026311e-05, "epoch": 0.6710885680842762, "percentage": 67.11, "elapsed_time": "1 day, 4:30:03", "remaining_time": "13:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12041, "total_steps": 17941, "loss": 1.4597, "learning_rate": 2.5167263740623607e-05, "epoch": 0.6711443063374394, "percentage": 67.11, "elapsed_time": "1 day, 4:30:11", "remaining_time": "13:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12042, "total_steps": 17941, "loss": 1.6307, "learning_rate": 2.5159535718533717e-05, "epoch": 0.6712000445906026, "percentage": 67.12, "elapsed_time": "1 day, 4:30:20", "remaining_time": "13:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12043, "total_steps": 17941, "loss": 1.6608, "learning_rate": 2.5151808484238525e-05, "epoch": 0.6712557828437656, "percentage": 67.13, "elapsed_time": "1 day, 4:30:28", "remaining_time": "13:57:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12044, "total_steps": 17941, "loss": 1.6391, "learning_rate": 2.5144082037983085e-05, "epoch": 0.6713115210969288, "percentage": 67.13, "elapsed_time": "1 day, 4:30:37", "remaining_time": "13:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12045, "total_steps": 17941, "loss": 1.6466, "learning_rate": 2.513635638001247e-05, "epoch": 0.671367259350092, "percentage": 67.14, "elapsed_time": "1 day, 4:30:45", "remaining_time": "13:57:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12046, "total_steps": 17941, "loss": 1.6352, "learning_rate": 2.5128631510571643e-05, "epoch": 0.6714229976032551, "percentage": 67.14, "elapsed_time": "1 day, 4:30:54", "remaining_time": "13:57:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12047, "total_steps": 17941, "loss": 1.6743, "learning_rate": 2.5120907429905617e-05, "epoch": 0.6714787358564183, "percentage": 67.15, "elapsed_time": "1 day, 4:31:02", "remaining_time": "13:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12048, "total_steps": 17941, "loss": 1.7514, "learning_rate": 2.511318413825935e-05, "epoch": 0.6715344741095814, "percentage": 67.15, "elapsed_time": "1 day, 4:31:11", "remaining_time": "13:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12049, "total_steps": 17941, "loss": 1.2842, "learning_rate": 2.5105461635877797e-05, "epoch": 0.6715902123627445, "percentage": 67.16, "elapsed_time": "1 day, 4:31:19", "remaining_time": "13:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12050, "total_steps": 17941, "loss": 1.5662, "learning_rate": 2.509773992300582e-05, "epoch": 0.6716459506159077, "percentage": 67.16, "elapsed_time": "1 day, 4:31:28", "remaining_time": "13:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12051, "total_steps": 17941, "loss": 1.7842, "learning_rate": 2.5090018999888365e-05, "epoch": 0.6717016888690709, "percentage": 67.17, "elapsed_time": "1 day, 4:31:36", "remaining_time": "13:56:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12052, "total_steps": 17941, "loss": 1.5996, "learning_rate": 2.508229886677029e-05, "epoch": 0.671757427122234, "percentage": 67.18, "elapsed_time": "1 day, 4:31:44", "remaining_time": "13:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12053, "total_steps": 17941, "loss": 1.7818, "learning_rate": 2.507457952389639e-05, "epoch": 0.6718131653753971, "percentage": 67.18, "elapsed_time": "1 day, 4:31:53", "remaining_time": "13:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12054, "total_steps": 17941, "loss": 1.8029, "learning_rate": 2.506686097151151e-05, "epoch": 0.6718689036285603, "percentage": 67.19, "elapsed_time": "1 day, 4:32:01", "remaining_time": "13:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12055, "total_steps": 17941, "loss": 1.8815, "learning_rate": 2.5059143209860425e-05, "epoch": 0.6719246418817234, "percentage": 67.19, "elapsed_time": "1 day, 4:32:10", "remaining_time": "13:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12056, "total_steps": 17941, "loss": 1.6726, "learning_rate": 2.5051426239187918e-05, "epoch": 0.6719803801348866, "percentage": 67.2, "elapsed_time": "1 day, 4:32:18", "remaining_time": "13:55:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12057, "total_steps": 17941, "loss": 1.5366, "learning_rate": 2.5043710059738702e-05, "epoch": 0.6720361183880497, "percentage": 67.2, "elapsed_time": "1 day, 4:32:27", "remaining_time": "13:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12058, "total_steps": 17941, "loss": 1.8958, "learning_rate": 2.503599467175747e-05, "epoch": 0.6720918566412128, "percentage": 67.21, "elapsed_time": "1 day, 4:32:35", "remaining_time": "13:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12059, "total_steps": 17941, "loss": 1.7533, "learning_rate": 2.5028280075488973e-05, "epoch": 0.672147594894376, "percentage": 67.21, "elapsed_time": "1 day, 4:32:44", "remaining_time": "13:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12060, "total_steps": 17941, "loss": 1.608, "learning_rate": 2.5020566271177824e-05, "epoch": 0.6722033331475391, "percentage": 67.22, "elapsed_time": "1 day, 4:32:52", "remaining_time": "13:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12061, "total_steps": 17941, "loss": 1.5929, "learning_rate": 2.501285325906867e-05, "epoch": 0.6722590714007023, "percentage": 67.23, "elapsed_time": "1 day, 4:33:00", "remaining_time": "13:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12062, "total_steps": 17941, "loss": 1.7366, "learning_rate": 2.500514103940613e-05, "epoch": 0.6723148096538655, "percentage": 67.23, "elapsed_time": "1 day, 4:33:09", "remaining_time": "13:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12063, "total_steps": 17941, "loss": 1.9978, "learning_rate": 2.499742961243478e-05, "epoch": 0.6723705479070285, "percentage": 67.24, "elapsed_time": "1 day, 4:33:17", "remaining_time": "13:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12064, "total_steps": 17941, "loss": 1.6921, "learning_rate": 2.4989718978399207e-05, "epoch": 0.6724262861601917, "percentage": 67.24, "elapsed_time": "1 day, 4:33:26", "remaining_time": "13:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12065, "total_steps": 17941, "loss": 1.5997, "learning_rate": 2.4982009137543894e-05, "epoch": 0.6724820244133549, "percentage": 67.25, "elapsed_time": "1 day, 4:33:34", "remaining_time": "13:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12066, "total_steps": 17941, "loss": 1.7996, "learning_rate": 2.4974300090113422e-05, "epoch": 0.672537762666518, "percentage": 67.25, "elapsed_time": "1 day, 4:33:43", "remaining_time": "13:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12067, "total_steps": 17941, "loss": 1.5594, "learning_rate": 2.4966591836352222e-05, "epoch": 0.6725935009196812, "percentage": 67.26, "elapsed_time": "1 day, 4:33:51", "remaining_time": "13:54:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12068, "total_steps": 17941, "loss": 1.7468, "learning_rate": 2.495888437650477e-05, "epoch": 0.6726492391728444, "percentage": 67.26, "elapsed_time": "1 day, 4:34:00", "remaining_time": "13:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12069, "total_steps": 17941, "loss": 1.8914, "learning_rate": 2.495117771081551e-05, "epoch": 0.6727049774260074, "percentage": 67.27, "elapsed_time": "1 day, 4:34:08", "remaining_time": "13:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12070, "total_steps": 17941, "loss": 1.6262, "learning_rate": 2.494347183952885e-05, "epoch": 0.6727607156791706, "percentage": 67.28, "elapsed_time": "1 day, 4:34:17", "remaining_time": "13:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12071, "total_steps": 17941, "loss": 1.511, "learning_rate": 2.493576676288919e-05, "epoch": 0.6728164539323338, "percentage": 67.28, "elapsed_time": "1 day, 4:34:25", "remaining_time": "13:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12072, "total_steps": 17941, "loss": 1.4848, "learning_rate": 2.4928062481140856e-05, "epoch": 0.6728721921854969, "percentage": 67.29, "elapsed_time": "1 day, 4:34:33", "remaining_time": "13:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12073, "total_steps": 17941, "loss": 1.7329, "learning_rate": 2.4920358994528198e-05, "epoch": 0.6729279304386601, "percentage": 67.29, "elapsed_time": "1 day, 4:34:42", "remaining_time": "13:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12074, "total_steps": 17941, "loss": 1.7582, "learning_rate": 2.4912656303295535e-05, "epoch": 0.6729836686918232, "percentage": 67.3, "elapsed_time": "1 day, 4:34:50", "remaining_time": "13:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12075, "total_steps": 17941, "loss": 1.8324, "learning_rate": 2.4904954407687153e-05, "epoch": 0.6730394069449863, "percentage": 67.3, "elapsed_time": "1 day, 4:34:59", "remaining_time": "13:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12076, "total_steps": 17941, "loss": 1.5541, "learning_rate": 2.4897253307947272e-05, "epoch": 0.6730951451981495, "percentage": 67.31, "elapsed_time": "1 day, 4:35:07", "remaining_time": "13:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12077, "total_steps": 17941, "loss": 1.6382, "learning_rate": 2.4889553004320177e-05, "epoch": 0.6731508834513127, "percentage": 67.32, "elapsed_time": "1 day, 4:35:16", "remaining_time": "13:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12078, "total_steps": 17941, "loss": 1.6186, "learning_rate": 2.488185349705007e-05, "epoch": 0.6732066217044758, "percentage": 67.32, "elapsed_time": "1 day, 4:35:24", "remaining_time": "13:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12079, "total_steps": 17941, "loss": 1.6038, "learning_rate": 2.487415478638111e-05, "epoch": 0.673262359957639, "percentage": 67.33, "elapsed_time": "1 day, 4:35:33", "remaining_time": "13:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12080, "total_steps": 17941, "loss": 1.6577, "learning_rate": 2.4866456872557458e-05, "epoch": 0.673318098210802, "percentage": 67.33, "elapsed_time": "1 day, 4:35:42", "remaining_time": "13:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12081, "total_steps": 17941, "loss": 1.563, "learning_rate": 2.4858759755823258e-05, "epoch": 0.6733738364639652, "percentage": 67.34, "elapsed_time": "1 day, 4:35:50", "remaining_time": "13:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12082, "total_steps": 17941, "loss": 1.6662, "learning_rate": 2.485106343642264e-05, "epoch": 0.6734295747171284, "percentage": 67.34, "elapsed_time": "1 day, 4:35:59", "remaining_time": "13:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12083, "total_steps": 17941, "loss": 1.7301, "learning_rate": 2.4843367914599637e-05, "epoch": 0.6734853129702915, "percentage": 67.35, "elapsed_time": "1 day, 4:36:07", "remaining_time": "13:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12084, "total_steps": 17941, "loss": 1.4877, "learning_rate": 2.4835673190598306e-05, "epoch": 0.6735410512234546, "percentage": 67.35, "elapsed_time": "1 day, 4:36:16", "remaining_time": "13:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12085, "total_steps": 17941, "loss": 1.6383, "learning_rate": 2.482797926466275e-05, "epoch": 0.6735967894766178, "percentage": 67.36, "elapsed_time": "1 day, 4:36:25", "remaining_time": "13:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12086, "total_steps": 17941, "loss": 1.7706, "learning_rate": 2.482028613703691e-05, "epoch": 0.6736525277297809, "percentage": 67.37, "elapsed_time": "1 day, 4:36:33", "remaining_time": "13:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12087, "total_steps": 17941, "loss": 1.5105, "learning_rate": 2.481259380796478e-05, "epoch": 0.6737082659829441, "percentage": 67.37, "elapsed_time": "1 day, 4:36:42", "remaining_time": "13:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12088, "total_steps": 17941, "loss": 1.7255, "learning_rate": 2.480490227769032e-05, "epoch": 0.6737640042361073, "percentage": 67.38, "elapsed_time": "1 day, 4:36:50", "remaining_time": "13:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12089, "total_steps": 17941, "loss": 1.7097, "learning_rate": 2.4797211546457465e-05, "epoch": 0.6738197424892703, "percentage": 67.38, "elapsed_time": "1 day, 4:36:58", "remaining_time": "13:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12090, "total_steps": 17941, "loss": 1.8793, "learning_rate": 2.4789521614510143e-05, "epoch": 0.6738754807424335, "percentage": 67.39, "elapsed_time": "1 day, 4:37:07", "remaining_time": "13:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12091, "total_steps": 17941, "loss": 1.7683, "learning_rate": 2.478183248209216e-05, "epoch": 0.6739312189955967, "percentage": 67.39, "elapsed_time": "1 day, 4:37:15", "remaining_time": "13:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12092, "total_steps": 17941, "loss": 1.3473, "learning_rate": 2.4774144149447465e-05, "epoch": 0.6739869572487598, "percentage": 67.4, "elapsed_time": "1 day, 4:37:24", "remaining_time": "13:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12093, "total_steps": 17941, "loss": 1.9293, "learning_rate": 2.4766456616819818e-05, "epoch": 0.674042695501923, "percentage": 67.4, "elapsed_time": "1 day, 4:37:32", "remaining_time": "13:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12094, "total_steps": 17941, "loss": 1.5863, "learning_rate": 2.4758769884453043e-05, "epoch": 0.6740984337550862, "percentage": 67.41, "elapsed_time": "1 day, 4:37:41", "remaining_time": "13:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12095, "total_steps": 17941, "loss": 1.7642, "learning_rate": 2.4751083952590926e-05, "epoch": 0.6741541720082492, "percentage": 67.42, "elapsed_time": "1 day, 4:37:51", "remaining_time": "13:50:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12096, "total_steps": 17941, "loss": 1.4794, "learning_rate": 2.474339882147721e-05, "epoch": 0.6742099102614124, "percentage": 67.42, "elapsed_time": "1 day, 4:37:59", "remaining_time": "13:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12097, "total_steps": 17941, "loss": 1.584, "learning_rate": 2.4735714491355643e-05, "epoch": 0.6742656485145756, "percentage": 67.43, "elapsed_time": "1 day, 4:38:07", "remaining_time": "13:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12098, "total_steps": 17941, "loss": 1.828, "learning_rate": 2.47280309624699e-05, "epoch": 0.6743213867677387, "percentage": 67.43, "elapsed_time": "1 day, 4:38:16", "remaining_time": "13:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12099, "total_steps": 17941, "loss": 1.7087, "learning_rate": 2.4720348235063666e-05, "epoch": 0.6743771250209019, "percentage": 67.44, "elapsed_time": "1 day, 4:38:24", "remaining_time": "13:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12100, "total_steps": 17941, "loss": 1.7922, "learning_rate": 2.4712666309380595e-05, "epoch": 0.674432863274065, "percentage": 67.44, "elapsed_time": "1 day, 4:38:33", "remaining_time": "13:49:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12101, "total_steps": 17941, "loss": 1.3383, "learning_rate": 2.470498518566433e-05, "epoch": 0.6744886015272281, "percentage": 67.45, "elapsed_time": "1 day, 4:38:41", "remaining_time": "13:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12102, "total_steps": 17941, "loss": 1.4675, "learning_rate": 2.469730486415842e-05, "epoch": 0.6745443397803913, "percentage": 67.45, "elapsed_time": "1 day, 4:38:50", "remaining_time": "13:49:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12103, "total_steps": 17941, "loss": 1.7807, "learning_rate": 2.468962534510649e-05, "epoch": 0.6746000780335544, "percentage": 67.46, "elapsed_time": "1 day, 4:38:59", "remaining_time": "13:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12104, "total_steps": 17941, "loss": 1.5491, "learning_rate": 2.46819466287521e-05, "epoch": 0.6746558162867176, "percentage": 67.47, "elapsed_time": "1 day, 4:39:07", "remaining_time": "13:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12105, "total_steps": 17941, "loss": 1.7326, "learning_rate": 2.467426871533873e-05, "epoch": 0.6747115545398807, "percentage": 67.47, "elapsed_time": "1 day, 4:39:15", "remaining_time": "13:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12106, "total_steps": 17941, "loss": 1.7699, "learning_rate": 2.466659160510989e-05, "epoch": 0.6747672927930438, "percentage": 67.48, "elapsed_time": "1 day, 4:39:24", "remaining_time": "13:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12107, "total_steps": 17941, "loss": 1.7571, "learning_rate": 2.4658915298309066e-05, "epoch": 0.674823031046207, "percentage": 67.48, "elapsed_time": "1 day, 4:39:32", "remaining_time": "13:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12108, "total_steps": 17941, "loss": 1.636, "learning_rate": 2.4651239795179713e-05, "epoch": 0.6748787692993702, "percentage": 67.49, "elapsed_time": "1 day, 4:39:41", "remaining_time": "13:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12109, "total_steps": 17941, "loss": 1.4918, "learning_rate": 2.4643565095965204e-05, "epoch": 0.6749345075525333, "percentage": 67.49, "elapsed_time": "1 day, 4:39:49", "remaining_time": "13:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12110, "total_steps": 17941, "loss": 1.6423, "learning_rate": 2.4635891200908996e-05, "epoch": 0.6749902458056964, "percentage": 67.5, "elapsed_time": "1 day, 4:39:59", "remaining_time": "13:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12111, "total_steps": 17941, "loss": 1.644, "learning_rate": 2.4628218110254452e-05, "epoch": 0.6750459840588596, "percentage": 67.5, "elapsed_time": "1 day, 4:40:07", "remaining_time": "13:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12112, "total_steps": 17941, "loss": 1.5569, "learning_rate": 2.462054582424488e-05, "epoch": 0.6751017223120227, "percentage": 67.51, "elapsed_time": "1 day, 4:40:16", "remaining_time": "13:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12113, "total_steps": 17941, "loss": 1.5434, "learning_rate": 2.4612874343123626e-05, "epoch": 0.6751574605651859, "percentage": 67.52, "elapsed_time": "1 day, 4:40:24", "remaining_time": "13:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12114, "total_steps": 17941, "loss": 1.6833, "learning_rate": 2.460520366713398e-05, "epoch": 0.6752131988183491, "percentage": 67.52, "elapsed_time": "1 day, 4:40:33", "remaining_time": "13:47:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12115, "total_steps": 17941, "loss": 1.7659, "learning_rate": 2.4597533796519206e-05, "epoch": 0.6752689370715121, "percentage": 67.53, "elapsed_time": "1 day, 4:40:41", "remaining_time": "13:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12116, "total_steps": 17941, "loss": 1.6773, "learning_rate": 2.4589864731522578e-05, "epoch": 0.6753246753246753, "percentage": 67.53, "elapsed_time": "1 day, 4:40:50", "remaining_time": "13:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12117, "total_steps": 17941, "loss": 1.7786, "learning_rate": 2.4582196472387255e-05, "epoch": 0.6753804135778385, "percentage": 67.54, "elapsed_time": "1 day, 4:40:58", "remaining_time": "13:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12118, "total_steps": 17941, "loss": 1.7779, "learning_rate": 2.4574529019356494e-05, "epoch": 0.6754361518310016, "percentage": 67.54, "elapsed_time": "1 day, 4:41:06", "remaining_time": "13:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12119, "total_steps": 17941, "loss": 1.7638, "learning_rate": 2.4566862372673415e-05, "epoch": 0.6754918900841648, "percentage": 67.55, "elapsed_time": "1 day, 4:41:15", "remaining_time": "13:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12120, "total_steps": 17941, "loss": 1.6782, "learning_rate": 2.4559196532581174e-05, "epoch": 0.675547628337328, "percentage": 67.55, "elapsed_time": "1 day, 4:41:23", "remaining_time": "13:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12121, "total_steps": 17941, "loss": 1.5979, "learning_rate": 2.4551531499322895e-05, "epoch": 0.675603366590491, "percentage": 67.56, "elapsed_time": "1 day, 4:41:32", "remaining_time": "13:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12122, "total_steps": 17941, "loss": 1.5279, "learning_rate": 2.4543867273141658e-05, "epoch": 0.6756591048436542, "percentage": 67.57, "elapsed_time": "1 day, 4:41:41", "remaining_time": "13:46:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12123, "total_steps": 17941, "loss": 1.5487, "learning_rate": 2.4536203854280553e-05, "epoch": 0.6757148430968174, "percentage": 67.57, "elapsed_time": "1 day, 4:41:50", "remaining_time": "13:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12124, "total_steps": 17941, "loss": 1.6329, "learning_rate": 2.452854124298257e-05, "epoch": 0.6757705813499805, "percentage": 67.58, "elapsed_time": "1 day, 4:41:58", "remaining_time": "13:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12125, "total_steps": 17941, "loss": 1.8838, "learning_rate": 2.4520879439490763e-05, "epoch": 0.6758263196031437, "percentage": 67.58, "elapsed_time": "1 day, 4:42:07", "remaining_time": "13:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12126, "total_steps": 17941, "loss": 1.8276, "learning_rate": 2.45132184440481e-05, "epoch": 0.6758820578563067, "percentage": 67.59, "elapsed_time": "1 day, 4:42:15", "remaining_time": "13:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12127, "total_steps": 17941, "loss": 1.748, "learning_rate": 2.4505558256897564e-05, "epoch": 0.6759377961094699, "percentage": 67.59, "elapsed_time": "1 day, 4:42:24", "remaining_time": "13:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12128, "total_steps": 17941, "loss": 1.5513, "learning_rate": 2.449789887828205e-05, "epoch": 0.6759935343626331, "percentage": 67.6, "elapsed_time": "1 day, 4:42:32", "remaining_time": "13:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12129, "total_steps": 17941, "loss": 1.5345, "learning_rate": 2.4490240308444507e-05, "epoch": 0.6760492726157962, "percentage": 67.6, "elapsed_time": "1 day, 4:42:41", "remaining_time": "13:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12130, "total_steps": 17941, "loss": 1.754, "learning_rate": 2.448258254762783e-05, "epoch": 0.6761050108689594, "percentage": 67.61, "elapsed_time": "1 day, 4:42:49", "remaining_time": "13:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12131, "total_steps": 17941, "loss": 1.5279, "learning_rate": 2.447492559607484e-05, "epoch": 0.6761607491221225, "percentage": 67.62, "elapsed_time": "1 day, 4:42:58", "remaining_time": "13:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12132, "total_steps": 17941, "loss": 1.8167, "learning_rate": 2.4467269454028386e-05, "epoch": 0.6762164873752856, "percentage": 67.62, "elapsed_time": "1 day, 4:43:06", "remaining_time": "13:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12133, "total_steps": 17941, "loss": 1.6938, "learning_rate": 2.4459614121731283e-05, "epoch": 0.6762722256284488, "percentage": 67.63, "elapsed_time": "1 day, 4:43:15", "remaining_time": "13:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12134, "total_steps": 17941, "loss": 1.6087, "learning_rate": 2.445195959942632e-05, "epoch": 0.676327963881612, "percentage": 67.63, "elapsed_time": "1 day, 4:43:23", "remaining_time": "13:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12135, "total_steps": 17941, "loss": 1.8278, "learning_rate": 2.4444305887356218e-05, "epoch": 0.6763837021347751, "percentage": 67.64, "elapsed_time": "1 day, 4:43:32", "remaining_time": "13:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12136, "total_steps": 17941, "loss": 1.6288, "learning_rate": 2.4436652985763742e-05, "epoch": 0.6764394403879382, "percentage": 67.64, "elapsed_time": "1 day, 4:43:41", "remaining_time": "13:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12137, "total_steps": 17941, "loss": 1.4703, "learning_rate": 2.4429000894891606e-05, "epoch": 0.6764951786411014, "percentage": 67.65, "elapsed_time": "1 day, 4:43:49", "remaining_time": "13:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12138, "total_steps": 17941, "loss": 1.435, "learning_rate": 2.4421349614982464e-05, "epoch": 0.6765509168942645, "percentage": 67.66, "elapsed_time": "1 day, 4:43:58", "remaining_time": "13:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12139, "total_steps": 17941, "loss": 1.5009, "learning_rate": 2.441369914627897e-05, "epoch": 0.6766066551474277, "percentage": 67.66, "elapsed_time": "1 day, 4:44:06", "remaining_time": "13:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12140, "total_steps": 17941, "loss": 1.6002, "learning_rate": 2.4406049489023763e-05, "epoch": 0.6766623934005909, "percentage": 67.67, "elapsed_time": "1 day, 4:44:14", "remaining_time": "13:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12141, "total_steps": 17941, "loss": 2.0263, "learning_rate": 2.439840064345944e-05, "epoch": 0.6767181316537539, "percentage": 67.67, "elapsed_time": "1 day, 4:44:24", "remaining_time": "13:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12142, "total_steps": 17941, "loss": 1.5754, "learning_rate": 2.4390752609828603e-05, "epoch": 0.6767738699069171, "percentage": 67.68, "elapsed_time": "1 day, 4:44:32", "remaining_time": "13:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12143, "total_steps": 17941, "loss": 1.6967, "learning_rate": 2.4383105388373745e-05, "epoch": 0.6768296081600803, "percentage": 67.68, "elapsed_time": "1 day, 4:44:40", "remaining_time": "13:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12144, "total_steps": 17941, "loss": 1.4722, "learning_rate": 2.4375458979337463e-05, "epoch": 0.6768853464132434, "percentage": 67.69, "elapsed_time": "1 day, 4:44:49", "remaining_time": "13:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12145, "total_steps": 17941, "loss": 1.567, "learning_rate": 2.4367813382962203e-05, "epoch": 0.6769410846664066, "percentage": 67.69, "elapsed_time": "1 day, 4:44:57", "remaining_time": "13:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12146, "total_steps": 17941, "loss": 1.7543, "learning_rate": 2.436016859949046e-05, "epoch": 0.6769968229195698, "percentage": 67.7, "elapsed_time": "1 day, 4:45:06", "remaining_time": "13:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12147, "total_steps": 17941, "loss": 1.5287, "learning_rate": 2.435252462916467e-05, "epoch": 0.6770525611727328, "percentage": 67.71, "elapsed_time": "1 day, 4:45:14", "remaining_time": "13:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12148, "total_steps": 17941, "loss": 1.6324, "learning_rate": 2.4344881472227264e-05, "epoch": 0.677108299425896, "percentage": 67.71, "elapsed_time": "1 day, 4:45:23", "remaining_time": "13:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12149, "total_steps": 17941, "loss": 1.8157, "learning_rate": 2.4337239128920662e-05, "epoch": 0.6771640376790591, "percentage": 67.72, "elapsed_time": "1 day, 4:45:31", "remaining_time": "13:42:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12150, "total_steps": 17941, "loss": 1.7171, "learning_rate": 2.4329597599487192e-05, "epoch": 0.6772197759322223, "percentage": 67.72, "elapsed_time": "1 day, 4:45:40", "remaining_time": "13:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12151, "total_steps": 17941, "loss": 1.816, "learning_rate": 2.432195688416921e-05, "epoch": 0.6772755141853855, "percentage": 67.73, "elapsed_time": "1 day, 4:45:48", "remaining_time": "13:42:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12152, "total_steps": 17941, "loss": 1.594, "learning_rate": 2.431431698320905e-05, "epoch": 0.6773312524385485, "percentage": 67.73, "elapsed_time": "1 day, 4:45:57", "remaining_time": "13:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12153, "total_steps": 17941, "loss": 1.6131, "learning_rate": 2.4306677896849018e-05, "epoch": 0.6773869906917117, "percentage": 67.74, "elapsed_time": "1 day, 4:46:05", "remaining_time": "13:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12154, "total_steps": 17941, "loss": 1.5579, "learning_rate": 2.4299039625331315e-05, "epoch": 0.6774427289448749, "percentage": 67.74, "elapsed_time": "1 day, 4:46:14", "remaining_time": "13:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12155, "total_steps": 17941, "loss": 1.7149, "learning_rate": 2.4291402168898252e-05, "epoch": 0.677498467198038, "percentage": 67.75, "elapsed_time": "1 day, 4:46:22", "remaining_time": "13:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12156, "total_steps": 17941, "loss": 1.7342, "learning_rate": 2.4283765527792034e-05, "epoch": 0.6775542054512012, "percentage": 67.76, "elapsed_time": "1 day, 4:46:30", "remaining_time": "13:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12157, "total_steps": 17941, "loss": 1.5972, "learning_rate": 2.4276129702254826e-05, "epoch": 0.6776099437043643, "percentage": 67.76, "elapsed_time": "1 day, 4:46:39", "remaining_time": "13:41:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12158, "total_steps": 17941, "loss": 1.8824, "learning_rate": 2.4268494692528798e-05, "epoch": 0.6776656819575274, "percentage": 67.77, "elapsed_time": "1 day, 4:46:47", "remaining_time": "13:41:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12159, "total_steps": 17941, "loss": 1.6597, "learning_rate": 2.4260860498856098e-05, "epoch": 0.6777214202106906, "percentage": 67.77, "elapsed_time": "1 day, 4:46:56", "remaining_time": "13:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12160, "total_steps": 17941, "loss": 1.5585, "learning_rate": 2.425322712147885e-05, "epoch": 0.6777771584638538, "percentage": 67.78, "elapsed_time": "1 day, 4:47:04", "remaining_time": "13:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12161, "total_steps": 17941, "loss": 1.5505, "learning_rate": 2.4245594560639084e-05, "epoch": 0.6778328967170169, "percentage": 67.78, "elapsed_time": "1 day, 4:47:13", "remaining_time": "13:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12162, "total_steps": 17941, "loss": 1.5679, "learning_rate": 2.4237962816578918e-05, "epoch": 0.67788863497018, "percentage": 67.79, "elapsed_time": "1 day, 4:47:21", "remaining_time": "13:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12163, "total_steps": 17941, "loss": 1.7587, "learning_rate": 2.4230331889540393e-05, "epoch": 0.6779443732233432, "percentage": 67.79, "elapsed_time": "1 day, 4:47:30", "remaining_time": "13:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12164, "total_steps": 17941, "loss": 1.3722, "learning_rate": 2.4222701779765467e-05, "epoch": 0.6780001114765063, "percentage": 67.8, "elapsed_time": "1 day, 4:47:39", "remaining_time": "13:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12165, "total_steps": 17941, "loss": 1.6003, "learning_rate": 2.4215072487496153e-05, "epoch": 0.6780558497296695, "percentage": 67.81, "elapsed_time": "1 day, 4:47:47", "remaining_time": "13:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12166, "total_steps": 17941, "loss": 1.8517, "learning_rate": 2.4207444012974402e-05, "epoch": 0.6781115879828327, "percentage": 67.81, "elapsed_time": "1 day, 4:47:56", "remaining_time": "13:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12167, "total_steps": 17941, "loss": 1.5125, "learning_rate": 2.4199816356442166e-05, "epoch": 0.6781673262359957, "percentage": 67.82, "elapsed_time": "1 day, 4:48:04", "remaining_time": "13:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12168, "total_steps": 17941, "loss": 1.7082, "learning_rate": 2.419218951814131e-05, "epoch": 0.6782230644891589, "percentage": 67.82, "elapsed_time": "1 day, 4:48:13", "remaining_time": "13:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12169, "total_steps": 17941, "loss": 1.6407, "learning_rate": 2.4184563498313712e-05, "epoch": 0.6782788027423221, "percentage": 67.83, "elapsed_time": "1 day, 4:48:21", "remaining_time": "13:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12170, "total_steps": 17941, "loss": 1.6078, "learning_rate": 2.4176938297201286e-05, "epoch": 0.6783345409954852, "percentage": 67.83, "elapsed_time": "1 day, 4:48:30", "remaining_time": "13:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12171, "total_steps": 17941, "loss": 1.6395, "learning_rate": 2.4169313915045795e-05, "epoch": 0.6783902792486484, "percentage": 67.84, "elapsed_time": "1 day, 4:48:38", "remaining_time": "13:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12172, "total_steps": 17941, "loss": 1.6889, "learning_rate": 2.4161690352089067e-05, "epoch": 0.6784460175018114, "percentage": 67.84, "elapsed_time": "1 day, 4:48:46", "remaining_time": "13:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12173, "total_steps": 17941, "loss": 1.663, "learning_rate": 2.4154067608572874e-05, "epoch": 0.6785017557549746, "percentage": 67.85, "elapsed_time": "1 day, 4:48:55", "remaining_time": "13:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12174, "total_steps": 17941, "loss": 1.8053, "learning_rate": 2.414644568473896e-05, "epoch": 0.6785574940081378, "percentage": 67.86, "elapsed_time": "1 day, 4:49:04", "remaining_time": "13:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12175, "total_steps": 17941, "loss": 1.6296, "learning_rate": 2.413882458082907e-05, "epoch": 0.6786132322613009, "percentage": 67.86, "elapsed_time": "1 day, 4:49:12", "remaining_time": "13:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12176, "total_steps": 17941, "loss": 1.6391, "learning_rate": 2.4131204297084875e-05, "epoch": 0.6786689705144641, "percentage": 67.87, "elapsed_time": "1 day, 4:49:21", "remaining_time": "13:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12177, "total_steps": 17941, "loss": 1.702, "learning_rate": 2.4123584833748042e-05, "epoch": 0.6787247087676272, "percentage": 67.87, "elapsed_time": "1 day, 4:49:29", "remaining_time": "13:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12178, "total_steps": 17941, "loss": 1.7373, "learning_rate": 2.4115966191060236e-05, "epoch": 0.6787804470207903, "percentage": 67.88, "elapsed_time": "1 day, 4:49:38", "remaining_time": "13:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12179, "total_steps": 17941, "loss": 1.6233, "learning_rate": 2.4108348369263084e-05, "epoch": 0.6788361852739535, "percentage": 67.88, "elapsed_time": "1 day, 4:49:46", "remaining_time": "13:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12180, "total_steps": 17941, "loss": 1.6422, "learning_rate": 2.4100731368598123e-05, "epoch": 0.6788919235271167, "percentage": 67.89, "elapsed_time": "1 day, 4:49:54", "remaining_time": "13:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12181, "total_steps": 17941, "loss": 1.6933, "learning_rate": 2.409311518930698e-05, "epoch": 0.6789476617802798, "percentage": 67.89, "elapsed_time": "1 day, 4:50:03", "remaining_time": "13:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12182, "total_steps": 17941, "loss": 1.6532, "learning_rate": 2.4085499831631197e-05, "epoch": 0.679003400033443, "percentage": 67.9, "elapsed_time": "1 day, 4:50:11", "remaining_time": "13:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12183, "total_steps": 17941, "loss": 1.7707, "learning_rate": 2.4077885295812248e-05, "epoch": 0.6790591382866061, "percentage": 67.91, "elapsed_time": "1 day, 4:50:20", "remaining_time": "13:37:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12184, "total_steps": 17941, "loss": 1.6073, "learning_rate": 2.4070271582091642e-05, "epoch": 0.6791148765397692, "percentage": 67.91, "elapsed_time": "1 day, 4:50:28", "remaining_time": "13:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12185, "total_steps": 17941, "loss": 1.6806, "learning_rate": 2.406265869071084e-05, "epoch": 0.6791706147929324, "percentage": 67.92, "elapsed_time": "1 day, 4:50:37", "remaining_time": "13:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12186, "total_steps": 17941, "loss": 1.4209, "learning_rate": 2.4055046621911294e-05, "epoch": 0.6792263530460956, "percentage": 67.92, "elapsed_time": "1 day, 4:50:45", "remaining_time": "13:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12187, "total_steps": 17941, "loss": 1.7709, "learning_rate": 2.4047435375934363e-05, "epoch": 0.6792820912992587, "percentage": 67.93, "elapsed_time": "1 day, 4:50:53", "remaining_time": "13:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12188, "total_steps": 17941, "loss": 1.6503, "learning_rate": 2.4039824953021488e-05, "epoch": 0.6793378295524218, "percentage": 67.93, "elapsed_time": "1 day, 4:51:03", "remaining_time": "13:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12189, "total_steps": 17941, "loss": 1.6457, "learning_rate": 2.403221535341403e-05, "epoch": 0.679393567805585, "percentage": 67.94, "elapsed_time": "1 day, 4:51:11", "remaining_time": "13:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12190, "total_steps": 17941, "loss": 1.6228, "learning_rate": 2.402460657735327e-05, "epoch": 0.6794493060587481, "percentage": 67.94, "elapsed_time": "1 day, 4:51:20", "remaining_time": "13:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12191, "total_steps": 17941, "loss": 1.8148, "learning_rate": 2.401699862508055e-05, "epoch": 0.6795050443119113, "percentage": 67.95, "elapsed_time": "1 day, 4:51:29", "remaining_time": "13:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12192, "total_steps": 17941, "loss": 1.8663, "learning_rate": 2.4009391496837143e-05, "epoch": 0.6795607825650745, "percentage": 67.96, "elapsed_time": "1 day, 4:51:37", "remaining_time": "13:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12193, "total_steps": 17941, "loss": 1.9342, "learning_rate": 2.4001785192864313e-05, "epoch": 0.6796165208182375, "percentage": 67.96, "elapsed_time": "1 day, 4:51:46", "remaining_time": "13:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12194, "total_steps": 17941, "loss": 1.5368, "learning_rate": 2.3994179713403265e-05, "epoch": 0.6796722590714007, "percentage": 67.97, "elapsed_time": "1 day, 4:51:54", "remaining_time": "13:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12195, "total_steps": 17941, "loss": 1.4992, "learning_rate": 2.398657505869519e-05, "epoch": 0.6797279973245638, "percentage": 67.97, "elapsed_time": "1 day, 4:52:02", "remaining_time": "13:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12196, "total_steps": 17941, "loss": 1.5838, "learning_rate": 2.3978971228981323e-05, "epoch": 0.679783735577727, "percentage": 67.98, "elapsed_time": "1 day, 4:52:11", "remaining_time": "13:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12197, "total_steps": 17941, "loss": 1.8293, "learning_rate": 2.397136822450276e-05, "epoch": 0.6798394738308902, "percentage": 67.98, "elapsed_time": "1 day, 4:52:19", "remaining_time": "13:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12198, "total_steps": 17941, "loss": 1.6752, "learning_rate": 2.3963766045500634e-05, "epoch": 0.6798952120840532, "percentage": 67.99, "elapsed_time": "1 day, 4:52:28", "remaining_time": "13:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12199, "total_steps": 17941, "loss": 1.3596, "learning_rate": 2.3956164692216054e-05, "epoch": 0.6799509503372164, "percentage": 68.0, "elapsed_time": "1 day, 4:52:36", "remaining_time": "13:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12200, "total_steps": 17941, "loss": 1.7068, "learning_rate": 2.394856416489008e-05, "epoch": 0.6800066885903796, "percentage": 68.0, "elapsed_time": "1 day, 4:52:45", "remaining_time": "13:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12201, "total_steps": 17941, "loss": 1.7651, "learning_rate": 2.3940964463763778e-05, "epoch": 0.6800624268435427, "percentage": 68.01, "elapsed_time": "1 day, 4:52:53", "remaining_time": "13:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12202, "total_steps": 17941, "loss": 1.4577, "learning_rate": 2.393336558907811e-05, "epoch": 0.6801181650967059, "percentage": 68.01, "elapsed_time": "1 day, 4:53:02", "remaining_time": "13:35:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12203, "total_steps": 17941, "loss": 1.6466, "learning_rate": 2.3925767541074147e-05, "epoch": 0.680173903349869, "percentage": 68.02, "elapsed_time": "1 day, 4:53:10", "remaining_time": "13:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12204, "total_steps": 17941, "loss": 1.6213, "learning_rate": 2.3918170319992793e-05, "epoch": 0.6802296416030321, "percentage": 68.02, "elapsed_time": "1 day, 4:53:18", "remaining_time": "13:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12205, "total_steps": 17941, "loss": 1.8441, "learning_rate": 2.391057392607503e-05, "epoch": 0.6802853798561953, "percentage": 68.03, "elapsed_time": "1 day, 4:53:27", "remaining_time": "13:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12206, "total_steps": 17941, "loss": 1.5251, "learning_rate": 2.3902978359561713e-05, "epoch": 0.6803411181093585, "percentage": 68.03, "elapsed_time": "1 day, 4:53:35", "remaining_time": "13:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12207, "total_steps": 17941, "loss": 1.7265, "learning_rate": 2.3895383620693785e-05, "epoch": 0.6803968563625216, "percentage": 68.04, "elapsed_time": "1 day, 4:53:44", "remaining_time": "13:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12208, "total_steps": 17941, "loss": 1.7238, "learning_rate": 2.3887789709712107e-05, "epoch": 0.6804525946156847, "percentage": 68.05, "elapsed_time": "1 day, 4:53:52", "remaining_time": "13:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12209, "total_steps": 17941, "loss": 1.7441, "learning_rate": 2.388019662685747e-05, "epoch": 0.6805083328688479, "percentage": 68.05, "elapsed_time": "1 day, 4:54:01", "remaining_time": "13:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12210, "total_steps": 17941, "loss": 1.5733, "learning_rate": 2.3872604372370717e-05, "epoch": 0.680564071122011, "percentage": 68.06, "elapsed_time": "1 day, 4:54:09", "remaining_time": "13:33:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12211, "total_steps": 17941, "loss": 1.8439, "learning_rate": 2.386501294649261e-05, "epoch": 0.6806198093751742, "percentage": 68.06, "elapsed_time": "1 day, 4:54:18", "remaining_time": "13:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12212, "total_steps": 17941, "loss": 1.6925, "learning_rate": 2.3857422349463944e-05, "epoch": 0.6806755476283374, "percentage": 68.07, "elapsed_time": "1 day, 4:54:26", "remaining_time": "13:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12213, "total_steps": 17941, "loss": 1.7101, "learning_rate": 2.384983258152537e-05, "epoch": 0.6807312858815004, "percentage": 68.07, "elapsed_time": "1 day, 4:54:35", "remaining_time": "13:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12214, "total_steps": 17941, "loss": 1.6757, "learning_rate": 2.3842243642917666e-05, "epoch": 0.6807870241346636, "percentage": 68.08, "elapsed_time": "1 day, 4:54:43", "remaining_time": "13:33:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12215, "total_steps": 17941, "loss": 1.5788, "learning_rate": 2.38346555338815e-05, "epoch": 0.6808427623878268, "percentage": 68.08, "elapsed_time": "1 day, 4:54:51", "remaining_time": "13:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12216, "total_steps": 17941, "loss": 1.5688, "learning_rate": 2.382706825465749e-05, "epoch": 0.6808985006409899, "percentage": 68.09, "elapsed_time": "1 day, 4:55:00", "remaining_time": "13:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12217, "total_steps": 17941, "loss": 1.4546, "learning_rate": 2.3819481805486275e-05, "epoch": 0.6809542388941531, "percentage": 68.1, "elapsed_time": "1 day, 4:55:09", "remaining_time": "13:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12218, "total_steps": 17941, "loss": 1.6903, "learning_rate": 2.3811896186608457e-05, "epoch": 0.6810099771473161, "percentage": 68.1, "elapsed_time": "1 day, 4:55:18", "remaining_time": "13:32:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12219, "total_steps": 17941, "loss": 1.4833, "learning_rate": 2.3804311398264617e-05, "epoch": 0.6810657154004793, "percentage": 68.11, "elapsed_time": "1 day, 4:55:26", "remaining_time": "13:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12220, "total_steps": 17941, "loss": 1.6484, "learning_rate": 2.379672744069527e-05, "epoch": 0.6811214536536425, "percentage": 68.11, "elapsed_time": "1 day, 4:55:35", "remaining_time": "13:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12221, "total_steps": 17941, "loss": 1.7253, "learning_rate": 2.3789144314140938e-05, "epoch": 0.6811771919068056, "percentage": 68.12, "elapsed_time": "1 day, 4:55:43", "remaining_time": "13:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12222, "total_steps": 17941, "loss": 1.7107, "learning_rate": 2.378156201884217e-05, "epoch": 0.6812329301599688, "percentage": 68.12, "elapsed_time": "1 day, 4:55:51", "remaining_time": "13:32:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12223, "total_steps": 17941, "loss": 1.4336, "learning_rate": 2.377398055503936e-05, "epoch": 0.681288668413132, "percentage": 68.13, "elapsed_time": "1 day, 4:56:00", "remaining_time": "13:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12224, "total_steps": 17941, "loss": 1.4867, "learning_rate": 2.376639992297299e-05, "epoch": 0.681344406666295, "percentage": 68.13, "elapsed_time": "1 day, 4:56:08", "remaining_time": "13:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12225, "total_steps": 17941, "loss": 1.7883, "learning_rate": 2.3758820122883456e-05, "epoch": 0.6814001449194582, "percentage": 68.14, "elapsed_time": "1 day, 4:56:17", "remaining_time": "13:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12226, "total_steps": 17941, "loss": 1.7039, "learning_rate": 2.375124115501115e-05, "epoch": 0.6814558831726214, "percentage": 68.15, "elapsed_time": "1 day, 4:56:26", "remaining_time": "13:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12227, "total_steps": 17941, "loss": 1.592, "learning_rate": 2.3743663019596456e-05, "epoch": 0.6815116214257845, "percentage": 68.15, "elapsed_time": "1 day, 4:56:34", "remaining_time": "13:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12228, "total_steps": 17941, "loss": 1.7615, "learning_rate": 2.3736085716879647e-05, "epoch": 0.6815673596789477, "percentage": 68.16, "elapsed_time": "1 day, 4:56:42", "remaining_time": "13:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12229, "total_steps": 17941, "loss": 1.5715, "learning_rate": 2.3728509247101106e-05, "epoch": 0.6816230979321108, "percentage": 68.16, "elapsed_time": "1 day, 4:56:51", "remaining_time": "13:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12230, "total_steps": 17941, "loss": 1.6945, "learning_rate": 2.3720933610501062e-05, "epoch": 0.6816788361852739, "percentage": 68.17, "elapsed_time": "1 day, 4:56:59", "remaining_time": "13:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12231, "total_steps": 17941, "loss": 1.5869, "learning_rate": 2.37133588073198e-05, "epoch": 0.6817345744384371, "percentage": 68.17, "elapsed_time": "1 day, 4:57:08", "remaining_time": "13:30:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12232, "total_steps": 17941, "loss": 1.5898, "learning_rate": 2.3705784837797502e-05, "epoch": 0.6817903126916003, "percentage": 68.18, "elapsed_time": "1 day, 4:57:17", "remaining_time": "13:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12233, "total_steps": 17941, "loss": 1.6013, "learning_rate": 2.3698211702174423e-05, "epoch": 0.6818460509447634, "percentage": 68.18, "elapsed_time": "1 day, 4:57:25", "remaining_time": "13:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12234, "total_steps": 17941, "loss": 1.6214, "learning_rate": 2.3690639400690735e-05, "epoch": 0.6819017891979265, "percentage": 68.19, "elapsed_time": "1 day, 4:57:34", "remaining_time": "13:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12235, "total_steps": 17941, "loss": 1.6553, "learning_rate": 2.368306793358655e-05, "epoch": 0.6819575274510897, "percentage": 68.2, "elapsed_time": "1 day, 4:57:42", "remaining_time": "13:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12236, "total_steps": 17941, "loss": 1.8637, "learning_rate": 2.3675497301102017e-05, "epoch": 0.6820132657042528, "percentage": 68.2, "elapsed_time": "1 day, 4:57:51", "remaining_time": "13:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12237, "total_steps": 17941, "loss": 1.3013, "learning_rate": 2.3667927503477222e-05, "epoch": 0.682069003957416, "percentage": 68.21, "elapsed_time": "1 day, 4:57:59", "remaining_time": "13:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12238, "total_steps": 17941, "loss": 1.7682, "learning_rate": 2.3660358540952265e-05, "epoch": 0.6821247422105792, "percentage": 68.21, "elapsed_time": "1 day, 4:58:07", "remaining_time": "13:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12239, "total_steps": 17941, "loss": 1.7248, "learning_rate": 2.3652790413767122e-05, "epoch": 0.6821804804637422, "percentage": 68.22, "elapsed_time": "1 day, 4:58:16", "remaining_time": "13:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12240, "total_steps": 17941, "loss": 1.6372, "learning_rate": 2.3645223122161868e-05, "epoch": 0.6822362187169054, "percentage": 68.22, "elapsed_time": "1 day, 4:58:25", "remaining_time": "13:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12241, "total_steps": 17941, "loss": 1.5107, "learning_rate": 2.3637656666376505e-05, "epoch": 0.6822919569700685, "percentage": 68.23, "elapsed_time": "1 day, 4:58:33", "remaining_time": "13:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12242, "total_steps": 17941, "loss": 1.9183, "learning_rate": 2.3630091046650944e-05, "epoch": 0.6823476952232317, "percentage": 68.23, "elapsed_time": "1 day, 4:58:42", "remaining_time": "13:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12243, "total_steps": 17941, "loss": 1.7131, "learning_rate": 2.3622526263225152e-05, "epoch": 0.6824034334763949, "percentage": 68.24, "elapsed_time": "1 day, 4:58:50", "remaining_time": "13:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12244, "total_steps": 17941, "loss": 1.8323, "learning_rate": 2.3614962316339033e-05, "epoch": 0.682459171729558, "percentage": 68.25, "elapsed_time": "1 day, 4:58:59", "remaining_time": "13:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12245, "total_steps": 17941, "loss": 1.46, "learning_rate": 2.3607399206232493e-05, "epoch": 0.6825149099827211, "percentage": 68.25, "elapsed_time": "1 day, 4:59:07", "remaining_time": "13:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12246, "total_steps": 17941, "loss": 1.6821, "learning_rate": 2.359983693314535e-05, "epoch": 0.6825706482358843, "percentage": 68.26, "elapsed_time": "1 day, 4:59:15", "remaining_time": "13:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12247, "total_steps": 17941, "loss": 1.5697, "learning_rate": 2.359227549731744e-05, "epoch": 0.6826263864890474, "percentage": 68.26, "elapsed_time": "1 day, 4:59:24", "remaining_time": "13:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12248, "total_steps": 17941, "loss": 1.5941, "learning_rate": 2.358471489898862e-05, "epoch": 0.6826821247422106, "percentage": 68.27, "elapsed_time": "1 day, 4:59:32", "remaining_time": "13:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12249, "total_steps": 17941, "loss": 1.6352, "learning_rate": 2.3577155138398616e-05, "epoch": 0.6827378629953738, "percentage": 68.27, "elapsed_time": "1 day, 4:59:41", "remaining_time": "13:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12250, "total_steps": 17941, "loss": 1.4396, "learning_rate": 2.3569596215787187e-05, "epoch": 0.6827936012485368, "percentage": 68.28, "elapsed_time": "1 day, 4:59:49", "remaining_time": "13:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12251, "total_steps": 17941, "loss": 1.645, "learning_rate": 2.356203813139407e-05, "epoch": 0.6828493395017, "percentage": 68.28, "elapsed_time": "1 day, 4:59:58", "remaining_time": "13:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12252, "total_steps": 17941, "loss": 1.4556, "learning_rate": 2.3554480885458964e-05, "epoch": 0.6829050777548632, "percentage": 68.29, "elapsed_time": "1 day, 5:00:06", "remaining_time": "13:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12253, "total_steps": 17941, "loss": 1.4566, "learning_rate": 2.354692447822155e-05, "epoch": 0.6829608160080263, "percentage": 68.3, "elapsed_time": "1 day, 5:00:15", "remaining_time": "13:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12254, "total_steps": 17941, "loss": 1.6032, "learning_rate": 2.3539368909921423e-05, "epoch": 0.6830165542611895, "percentage": 68.3, "elapsed_time": "1 day, 5:00:23", "remaining_time": "13:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12255, "total_steps": 17941, "loss": 1.5002, "learning_rate": 2.3531814180798277e-05, "epoch": 0.6830722925143526, "percentage": 68.31, "elapsed_time": "1 day, 5:00:31", "remaining_time": "13:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12256, "total_steps": 17941, "loss": 1.8472, "learning_rate": 2.3524260291091642e-05, "epoch": 0.6831280307675157, "percentage": 68.31, "elapsed_time": "1 day, 5:00:40", "remaining_time": "13:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12257, "total_steps": 17941, "loss": 1.7751, "learning_rate": 2.3516707241041132e-05, "epoch": 0.6831837690206789, "percentage": 68.32, "elapsed_time": "1 day, 5:00:49", "remaining_time": "13:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12258, "total_steps": 17941, "loss": 1.6577, "learning_rate": 2.350915503088622e-05, "epoch": 0.6832395072738421, "percentage": 68.32, "elapsed_time": "1 day, 5:00:58", "remaining_time": "13:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12259, "total_steps": 17941, "loss": 1.8244, "learning_rate": 2.3501603660866473e-05, "epoch": 0.6832952455270052, "percentage": 68.33, "elapsed_time": "1 day, 5:01:06", "remaining_time": "13:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12260, "total_steps": 17941, "loss": 1.7442, "learning_rate": 2.3494053131221383e-05, "epoch": 0.6833509837801683, "percentage": 68.34, "elapsed_time": "1 day, 5:01:15", "remaining_time": "13:26:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12261, "total_steps": 17941, "loss": 1.5471, "learning_rate": 2.3486503442190373e-05, "epoch": 0.6834067220333315, "percentage": 68.34, "elapsed_time": "1 day, 5:01:23", "remaining_time": "13:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12262, "total_steps": 17941, "loss": 1.5732, "learning_rate": 2.347895459401288e-05, "epoch": 0.6834624602864946, "percentage": 68.35, "elapsed_time": "1 day, 5:01:31", "remaining_time": "13:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12263, "total_steps": 17941, "loss": 1.642, "learning_rate": 2.3471406586928323e-05, "epoch": 0.6835181985396578, "percentage": 68.35, "elapsed_time": "1 day, 5:01:40", "remaining_time": "13:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12264, "total_steps": 17941, "loss": 1.603, "learning_rate": 2.34638594211761e-05, "epoch": 0.6835739367928209, "percentage": 68.36, "elapsed_time": "1 day, 5:01:48", "remaining_time": "13:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12265, "total_steps": 17941, "loss": 1.7664, "learning_rate": 2.3456313096995498e-05, "epoch": 0.683629675045984, "percentage": 68.36, "elapsed_time": "1 day, 5:01:57", "remaining_time": "13:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12266, "total_steps": 17941, "loss": 1.4581, "learning_rate": 2.34487676146259e-05, "epoch": 0.6836854132991472, "percentage": 68.37, "elapsed_time": "1 day, 5:02:05", "remaining_time": "13:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12267, "total_steps": 17941, "loss": 1.6216, "learning_rate": 2.344122297430661e-05, "epoch": 0.6837411515523103, "percentage": 68.37, "elapsed_time": "1 day, 5:02:14", "remaining_time": "13:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12268, "total_steps": 17941, "loss": 1.641, "learning_rate": 2.343367917627686e-05, "epoch": 0.6837968898054735, "percentage": 68.38, "elapsed_time": "1 day, 5:02:22", "remaining_time": "13:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12269, "total_steps": 17941, "loss": 1.5376, "learning_rate": 2.3426136220775917e-05, "epoch": 0.6838526280586367, "percentage": 68.39, "elapsed_time": "1 day, 5:02:31", "remaining_time": "13:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12270, "total_steps": 17941, "loss": 1.4804, "learning_rate": 2.3418594108042996e-05, "epoch": 0.6839083663117997, "percentage": 68.39, "elapsed_time": "1 day, 5:02:39", "remaining_time": "13:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12271, "total_steps": 17941, "loss": 1.6446, "learning_rate": 2.3411052838317306e-05, "epoch": 0.6839641045649629, "percentage": 68.4, "elapsed_time": "1 day, 5:02:48", "remaining_time": "13:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12272, "total_steps": 17941, "loss": 1.6575, "learning_rate": 2.340351241183798e-05, "epoch": 0.6840198428181261, "percentage": 68.4, "elapsed_time": "1 day, 5:02:56", "remaining_time": "13:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12273, "total_steps": 17941, "loss": 1.4676, "learning_rate": 2.339597282884415e-05, "epoch": 0.6840755810712892, "percentage": 68.41, "elapsed_time": "1 day, 5:03:05", "remaining_time": "13:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12274, "total_steps": 17941, "loss": 1.6655, "learning_rate": 2.3388434089574985e-05, "epoch": 0.6841313193244524, "percentage": 68.41, "elapsed_time": "1 day, 5:03:13", "remaining_time": "13:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12275, "total_steps": 17941, "loss": 1.5272, "learning_rate": 2.3380896194269518e-05, "epoch": 0.6841870575776156, "percentage": 68.42, "elapsed_time": "1 day, 5:03:22", "remaining_time": "13:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12276, "total_steps": 17941, "loss": 1.8014, "learning_rate": 2.337335914316683e-05, "epoch": 0.6842427958307786, "percentage": 68.42, "elapsed_time": "1 day, 5:03:30", "remaining_time": "13:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12277, "total_steps": 17941, "loss": 1.7232, "learning_rate": 2.3365822936505938e-05, "epoch": 0.6842985340839418, "percentage": 68.43, "elapsed_time": "1 day, 5:03:39", "remaining_time": "13:24:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12278, "total_steps": 17941, "loss": 1.4039, "learning_rate": 2.3358287574525878e-05, "epoch": 0.684354272337105, "percentage": 68.44, "elapsed_time": "1 day, 5:03:47", "remaining_time": "13:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12279, "total_steps": 17941, "loss": 1.6005, "learning_rate": 2.335075305746558e-05, "epoch": 0.6844100105902681, "percentage": 68.44, "elapsed_time": "1 day, 5:03:56", "remaining_time": "13:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12280, "total_steps": 17941, "loss": 1.5314, "learning_rate": 2.3343219385564003e-05, "epoch": 0.6844657488434313, "percentage": 68.45, "elapsed_time": "1 day, 5:04:06", "remaining_time": "13:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12281, "total_steps": 17941, "loss": 1.5298, "learning_rate": 2.333568655906013e-05, "epoch": 0.6845214870965944, "percentage": 68.45, "elapsed_time": "1 day, 5:04:14", "remaining_time": "13:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12282, "total_steps": 17941, "loss": 1.6174, "learning_rate": 2.332815457819279e-05, "epoch": 0.6845772253497575, "percentage": 68.46, "elapsed_time": "1 day, 5:04:22", "remaining_time": "13:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12283, "total_steps": 17941, "loss": 1.4918, "learning_rate": 2.332062344320088e-05, "epoch": 0.6846329636029207, "percentage": 68.46, "elapsed_time": "1 day, 5:04:31", "remaining_time": "13:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12284, "total_steps": 17941, "loss": 1.8133, "learning_rate": 2.3313093154323246e-05, "epoch": 0.6846887018560839, "percentage": 68.47, "elapsed_time": "1 day, 5:04:39", "remaining_time": "13:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12285, "total_steps": 17941, "loss": 1.7663, "learning_rate": 2.3305563711798694e-05, "epoch": 0.684744440109247, "percentage": 68.47, "elapsed_time": "1 day, 5:04:48", "remaining_time": "13:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12286, "total_steps": 17941, "loss": 1.6054, "learning_rate": 2.3298035115866052e-05, "epoch": 0.6848001783624101, "percentage": 68.48, "elapsed_time": "1 day, 5:04:57", "remaining_time": "13:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12287, "total_steps": 17941, "loss": 1.7638, "learning_rate": 2.3290507366764025e-05, "epoch": 0.6848559166155732, "percentage": 68.49, "elapsed_time": "1 day, 5:05:05", "remaining_time": "13:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12288, "total_steps": 17941, "loss": 1.8447, "learning_rate": 2.3282980464731378e-05, "epoch": 0.6849116548687364, "percentage": 68.49, "elapsed_time": "1 day, 5:05:14", "remaining_time": "13:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12289, "total_steps": 17941, "loss": 1.5922, "learning_rate": 2.3275454410006825e-05, "epoch": 0.6849673931218996, "percentage": 68.5, "elapsed_time": "1 day, 5:05:22", "remaining_time": "13:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12290, "total_steps": 17941, "loss": 1.5335, "learning_rate": 2.326792920282906e-05, "epoch": 0.6850231313750627, "percentage": 68.5, "elapsed_time": "1 day, 5:05:31", "remaining_time": "13:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12291, "total_steps": 17941, "loss": 1.7828, "learning_rate": 2.3260404843436685e-05, "epoch": 0.6850788696282258, "percentage": 68.51, "elapsed_time": "1 day, 5:05:39", "remaining_time": "13:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12292, "total_steps": 17941, "loss": 1.7622, "learning_rate": 2.325288133206838e-05, "epoch": 0.685134607881389, "percentage": 68.51, "elapsed_time": "1 day, 5:05:48", "remaining_time": "13:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12293, "total_steps": 17941, "loss": 1.6446, "learning_rate": 2.3245358668962754e-05, "epoch": 0.6851903461345521, "percentage": 68.52, "elapsed_time": "1 day, 5:05:57", "remaining_time": "13:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12294, "total_steps": 17941, "loss": 1.1563, "learning_rate": 2.323783685435834e-05, "epoch": 0.6852460843877153, "percentage": 68.52, "elapsed_time": "1 day, 5:06:05", "remaining_time": "13:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12295, "total_steps": 17941, "loss": 1.4075, "learning_rate": 2.323031588849371e-05, "epoch": 0.6853018226408785, "percentage": 68.53, "elapsed_time": "1 day, 5:06:14", "remaining_time": "13:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12296, "total_steps": 17941, "loss": 1.5879, "learning_rate": 2.322279577160738e-05, "epoch": 0.6853575608940415, "percentage": 68.54, "elapsed_time": "1 day, 5:06:23", "remaining_time": "13:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12297, "total_steps": 17941, "loss": 1.8357, "learning_rate": 2.3215276503937867e-05, "epoch": 0.6854132991472047, "percentage": 68.54, "elapsed_time": "1 day, 5:06:31", "remaining_time": "13:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12298, "total_steps": 17941, "loss": 1.4444, "learning_rate": 2.3207758085723597e-05, "epoch": 0.6854690374003679, "percentage": 68.55, "elapsed_time": "1 day, 5:06:40", "remaining_time": "13:21:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12299, "total_steps": 17941, "loss": 1.6139, "learning_rate": 2.3200240517203015e-05, "epoch": 0.685524775653531, "percentage": 68.55, "elapsed_time": "1 day, 5:06:48", "remaining_time": "13:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12300, "total_steps": 17941, "loss": 1.7099, "learning_rate": 2.3192723798614584e-05, "epoch": 0.6855805139066942, "percentage": 68.56, "elapsed_time": "1 day, 5:06:57", "remaining_time": "13:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12301, "total_steps": 17941, "loss": 1.602, "learning_rate": 2.318520793019664e-05, "epoch": 0.6856362521598574, "percentage": 68.56, "elapsed_time": "1 day, 5:07:06", "remaining_time": "13:21:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12302, "total_steps": 17941, "loss": 1.6749, "learning_rate": 2.317769291218756e-05, "epoch": 0.6856919904130204, "percentage": 68.57, "elapsed_time": "1 day, 5:07:15", "remaining_time": "13:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12303, "total_steps": 17941, "loss": 1.7086, "learning_rate": 2.3170178744825676e-05, "epoch": 0.6857477286661836, "percentage": 68.57, "elapsed_time": "1 day, 5:07:23", "remaining_time": "13:20:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12304, "total_steps": 17941, "loss": 1.4932, "learning_rate": 2.316266542834931e-05, "epoch": 0.6858034669193468, "percentage": 68.58, "elapsed_time": "1 day, 5:07:32", "remaining_time": "13:20:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12305, "total_steps": 17941, "loss": 1.6363, "learning_rate": 2.3155152962996708e-05, "epoch": 0.6858592051725099, "percentage": 68.59, "elapsed_time": "1 day, 5:07:40", "remaining_time": "13:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12306, "total_steps": 17941, "loss": 1.7378, "learning_rate": 2.3147641349006116e-05, "epoch": 0.685914943425673, "percentage": 68.59, "elapsed_time": "1 day, 5:07:48", "remaining_time": "13:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12307, "total_steps": 17941, "loss": 1.3766, "learning_rate": 2.3140130586615823e-05, "epoch": 0.6859706816788362, "percentage": 68.6, "elapsed_time": "1 day, 5:07:57", "remaining_time": "13:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12308, "total_steps": 17941, "loss": 1.9187, "learning_rate": 2.313262067606396e-05, "epoch": 0.6860264199319993, "percentage": 68.6, "elapsed_time": "1 day, 5:08:06", "remaining_time": "13:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12309, "total_steps": 17941, "loss": 1.7144, "learning_rate": 2.3125111617588717e-05, "epoch": 0.6860821581851625, "percentage": 68.61, "elapsed_time": "1 day, 5:08:14", "remaining_time": "13:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12310, "total_steps": 17941, "loss": 1.7483, "learning_rate": 2.311760341142825e-05, "epoch": 0.6861378964383256, "percentage": 68.61, "elapsed_time": "1 day, 5:08:23", "remaining_time": "13:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12311, "total_steps": 17941, "loss": 1.6752, "learning_rate": 2.3110096057820668e-05, "epoch": 0.6861936346914888, "percentage": 68.62, "elapsed_time": "1 day, 5:08:31", "remaining_time": "13:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12312, "total_steps": 17941, "loss": 1.5869, "learning_rate": 2.310258955700408e-05, "epoch": 0.6862493729446519, "percentage": 68.62, "elapsed_time": "1 day, 5:08:40", "remaining_time": "13:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12313, "total_steps": 17941, "loss": 1.6082, "learning_rate": 2.3095083909216504e-05, "epoch": 0.686305111197815, "percentage": 68.63, "elapsed_time": "1 day, 5:08:49", "remaining_time": "13:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12314, "total_steps": 17941, "loss": 1.6087, "learning_rate": 2.3087579114696e-05, "epoch": 0.6863608494509782, "percentage": 68.64, "elapsed_time": "1 day, 5:08:57", "remaining_time": "13:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12315, "total_steps": 17941, "loss": 1.178, "learning_rate": 2.3080075173680577e-05, "epoch": 0.6864165877041414, "percentage": 68.64, "elapsed_time": "1 day, 5:09:05", "remaining_time": "13:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12316, "total_steps": 17941, "loss": 1.6732, "learning_rate": 2.3072572086408233e-05, "epoch": 0.6864723259573045, "percentage": 68.65, "elapsed_time": "1 day, 5:09:15", "remaining_time": "13:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12317, "total_steps": 17941, "loss": 1.6694, "learning_rate": 2.3065069853116872e-05, "epoch": 0.6865280642104676, "percentage": 68.65, "elapsed_time": "1 day, 5:09:23", "remaining_time": "13:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12318, "total_steps": 17941, "loss": 1.6295, "learning_rate": 2.3057568474044473e-05, "epoch": 0.6865838024636308, "percentage": 68.66, "elapsed_time": "1 day, 5:09:32", "remaining_time": "13:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12319, "total_steps": 17941, "loss": 1.7854, "learning_rate": 2.305006794942893e-05, "epoch": 0.6866395407167939, "percentage": 68.66, "elapsed_time": "1 day, 5:09:40", "remaining_time": "13:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12320, "total_steps": 17941, "loss": 1.5614, "learning_rate": 2.3042568279508087e-05, "epoch": 0.6866952789699571, "percentage": 68.67, "elapsed_time": "1 day, 5:09:49", "remaining_time": "13:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12321, "total_steps": 17941, "loss": 1.8107, "learning_rate": 2.3035069464519805e-05, "epoch": 0.6867510172231203, "percentage": 68.68, "elapsed_time": "1 day, 5:09:57", "remaining_time": "13:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12322, "total_steps": 17941, "loss": 1.4073, "learning_rate": 2.3027571504701902e-05, "epoch": 0.6868067554762833, "percentage": 68.68, "elapsed_time": "1 day, 5:10:06", "remaining_time": "13:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12323, "total_steps": 17941, "loss": 1.4108, "learning_rate": 2.302007440029219e-05, "epoch": 0.6868624937294465, "percentage": 68.69, "elapsed_time": "1 day, 5:10:14", "remaining_time": "13:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12324, "total_steps": 17941, "loss": 1.7426, "learning_rate": 2.3012578151528398e-05, "epoch": 0.6869182319826097, "percentage": 68.69, "elapsed_time": "1 day, 5:10:22", "remaining_time": "13:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12325, "total_steps": 17941, "loss": 1.6956, "learning_rate": 2.3005082758648256e-05, "epoch": 0.6869739702357728, "percentage": 68.7, "elapsed_time": "1 day, 5:10:31", "remaining_time": "13:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12326, "total_steps": 17941, "loss": 1.4693, "learning_rate": 2.299758822188954e-05, "epoch": 0.687029708488936, "percentage": 68.7, "elapsed_time": "1 day, 5:10:40", "remaining_time": "13:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12327, "total_steps": 17941, "loss": 1.9276, "learning_rate": 2.2990094541489866e-05, "epoch": 0.6870854467420991, "percentage": 68.71, "elapsed_time": "1 day, 5:10:49", "remaining_time": "13:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12328, "total_steps": 17941, "loss": 1.4048, "learning_rate": 2.298260171768692e-05, "epoch": 0.6871411849952622, "percentage": 68.71, "elapsed_time": "1 day, 5:10:57", "remaining_time": "13:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12329, "total_steps": 17941, "loss": 1.8137, "learning_rate": 2.2975109750718323e-05, "epoch": 0.6871969232484254, "percentage": 68.72, "elapsed_time": "1 day, 5:11:06", "remaining_time": "13:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12330, "total_steps": 17941, "loss": 1.5533, "learning_rate": 2.2967618640821698e-05, "epoch": 0.6872526615015886, "percentage": 68.73, "elapsed_time": "1 day, 5:11:14", "remaining_time": "13:16:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12331, "total_steps": 17941, "loss": 1.8408, "learning_rate": 2.296012838823458e-05, "epoch": 0.6873083997547517, "percentage": 68.73, "elapsed_time": "1 day, 5:11:23", "remaining_time": "13:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12332, "total_steps": 17941, "loss": 1.6803, "learning_rate": 2.2952638993194515e-05, "epoch": 0.6873641380079148, "percentage": 68.74, "elapsed_time": "1 day, 5:11:31", "remaining_time": "13:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12333, "total_steps": 17941, "loss": 1.5447, "learning_rate": 2.2945150455939084e-05, "epoch": 0.6874198762610779, "percentage": 68.74, "elapsed_time": "1 day, 5:11:40", "remaining_time": "13:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12334, "total_steps": 17941, "loss": 1.7161, "learning_rate": 2.2937662776705728e-05, "epoch": 0.6874756145142411, "percentage": 68.75, "elapsed_time": "1 day, 5:11:48", "remaining_time": "13:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12335, "total_steps": 17941, "loss": 1.5177, "learning_rate": 2.2930175955731914e-05, "epoch": 0.6875313527674043, "percentage": 68.75, "elapsed_time": "1 day, 5:11:57", "remaining_time": "13:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12336, "total_steps": 17941, "loss": 1.9024, "learning_rate": 2.2922689993255093e-05, "epoch": 0.6875870910205674, "percentage": 68.76, "elapsed_time": "1 day, 5:12:05", "remaining_time": "13:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12337, "total_steps": 17941, "loss": 1.7149, "learning_rate": 2.2915204889512678e-05, "epoch": 0.6876428292737305, "percentage": 68.76, "elapsed_time": "1 day, 5:12:14", "remaining_time": "13:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12338, "total_steps": 17941, "loss": 1.8041, "learning_rate": 2.2907720644742064e-05, "epoch": 0.6876985675268937, "percentage": 68.77, "elapsed_time": "1 day, 5:12:23", "remaining_time": "13:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12339, "total_steps": 17941, "loss": 1.5429, "learning_rate": 2.2900237259180575e-05, "epoch": 0.6877543057800568, "percentage": 68.78, "elapsed_time": "1 day, 5:12:31", "remaining_time": "13:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12340, "total_steps": 17941, "loss": 1.6162, "learning_rate": 2.2892754733065558e-05, "epoch": 0.68781004403322, "percentage": 68.78, "elapsed_time": "1 day, 5:12:40", "remaining_time": "13:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12341, "total_steps": 17941, "loss": 1.5418, "learning_rate": 2.2885273066634312e-05, "epoch": 0.6878657822863832, "percentage": 68.79, "elapsed_time": "1 day, 5:12:48", "remaining_time": "13:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12342, "total_steps": 17941, "loss": 1.5795, "learning_rate": 2.287779226012413e-05, "epoch": 0.6879215205395462, "percentage": 68.79, "elapsed_time": "1 day, 5:12:57", "remaining_time": "13:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12343, "total_steps": 17941, "loss": 1.5287, "learning_rate": 2.287031231377221e-05, "epoch": 0.6879772587927094, "percentage": 68.8, "elapsed_time": "1 day, 5:13:05", "remaining_time": "13:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12344, "total_steps": 17941, "loss": 1.8508, "learning_rate": 2.2862833227815834e-05, "epoch": 0.6880329970458726, "percentage": 68.8, "elapsed_time": "1 day, 5:13:14", "remaining_time": "13:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12345, "total_steps": 17941, "loss": 1.8116, "learning_rate": 2.2855355002492173e-05, "epoch": 0.6880887352990357, "percentage": 68.81, "elapsed_time": "1 day, 5:13:23", "remaining_time": "13:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12346, "total_steps": 17941, "loss": 1.911, "learning_rate": 2.2847877638038378e-05, "epoch": 0.6881444735521989, "percentage": 68.81, "elapsed_time": "1 day, 5:13:31", "remaining_time": "13:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12347, "total_steps": 17941, "loss": 1.9441, "learning_rate": 2.2840401134691593e-05, "epoch": 0.6882002118053621, "percentage": 68.82, "elapsed_time": "1 day, 5:13:40", "remaining_time": "13:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12348, "total_steps": 17941, "loss": 1.6979, "learning_rate": 2.283292549268893e-05, "epoch": 0.6882559500585251, "percentage": 68.83, "elapsed_time": "1 day, 5:13:48", "remaining_time": "13:14:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12349, "total_steps": 17941, "loss": 1.4911, "learning_rate": 2.2825450712267495e-05, "epoch": 0.6883116883116883, "percentage": 68.83, "elapsed_time": "1 day, 5:13:57", "remaining_time": "13:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12350, "total_steps": 17941, "loss": 1.7359, "learning_rate": 2.2817976793664286e-05, "epoch": 0.6883674265648515, "percentage": 68.84, "elapsed_time": "1 day, 5:14:05", "remaining_time": "13:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12351, "total_steps": 17941, "loss": 1.5864, "learning_rate": 2.2810503737116395e-05, "epoch": 0.6884231648180146, "percentage": 68.84, "elapsed_time": "1 day, 5:14:14", "remaining_time": "13:13:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12352, "total_steps": 17941, "loss": 1.6317, "learning_rate": 2.2803031542860814e-05, "epoch": 0.6884789030711778, "percentage": 68.85, "elapsed_time": "1 day, 5:14:22", "remaining_time": "13:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12353, "total_steps": 17941, "loss": 1.7449, "learning_rate": 2.2795560211134488e-05, "epoch": 0.688534641324341, "percentage": 68.85, "elapsed_time": "1 day, 5:14:30", "remaining_time": "13:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12354, "total_steps": 17941, "loss": 1.8073, "learning_rate": 2.2788089742174374e-05, "epoch": 0.688590379577504, "percentage": 68.86, "elapsed_time": "1 day, 5:14:39", "remaining_time": "13:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12355, "total_steps": 17941, "loss": 1.4452, "learning_rate": 2.27806201362174e-05, "epoch": 0.6886461178306672, "percentage": 68.86, "elapsed_time": "1 day, 5:14:47", "remaining_time": "13:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12356, "total_steps": 17941, "loss": 1.5739, "learning_rate": 2.2773151393500475e-05, "epoch": 0.6887018560838304, "percentage": 68.87, "elapsed_time": "1 day, 5:14:56", "remaining_time": "13:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12357, "total_steps": 17941, "loss": 1.6514, "learning_rate": 2.2765683514260426e-05, "epoch": 0.6887575943369935, "percentage": 68.88, "elapsed_time": "1 day, 5:15:04", "remaining_time": "13:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12358, "total_steps": 17941, "loss": 1.7062, "learning_rate": 2.2758216498734086e-05, "epoch": 0.6888133325901566, "percentage": 68.88, "elapsed_time": "1 day, 5:15:13", "remaining_time": "13:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12359, "total_steps": 17941, "loss": 1.731, "learning_rate": 2.275075034715833e-05, "epoch": 0.6888690708433197, "percentage": 68.89, "elapsed_time": "1 day, 5:15:21", "remaining_time": "13:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12360, "total_steps": 17941, "loss": 1.445, "learning_rate": 2.2743285059769876e-05, "epoch": 0.6889248090964829, "percentage": 68.89, "elapsed_time": "1 day, 5:15:30", "remaining_time": "13:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12361, "total_steps": 17941, "loss": 1.6502, "learning_rate": 2.2735820636805504e-05, "epoch": 0.6889805473496461, "percentage": 68.9, "elapsed_time": "1 day, 5:15:38", "remaining_time": "13:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12362, "total_steps": 17941, "loss": 1.728, "learning_rate": 2.2728357078501943e-05, "epoch": 0.6890362856028092, "percentage": 68.9, "elapsed_time": "1 day, 5:15:47", "remaining_time": "13:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12363, "total_steps": 17941, "loss": 1.7767, "learning_rate": 2.2720894385095887e-05, "epoch": 0.6890920238559723, "percentage": 68.91, "elapsed_time": "1 day, 5:15:55", "remaining_time": "13:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12364, "total_steps": 17941, "loss": 1.4704, "learning_rate": 2.2713432556824033e-05, "epoch": 0.6891477621091355, "percentage": 68.91, "elapsed_time": "1 day, 5:16:04", "remaining_time": "13:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12365, "total_steps": 17941, "loss": 1.5619, "learning_rate": 2.2705971593922985e-05, "epoch": 0.6892035003622986, "percentage": 68.92, "elapsed_time": "1 day, 5:16:12", "remaining_time": "13:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12366, "total_steps": 17941, "loss": 1.6688, "learning_rate": 2.269851149662939e-05, "epoch": 0.6892592386154618, "percentage": 68.93, "elapsed_time": "1 day, 5:16:21", "remaining_time": "13:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12367, "total_steps": 17941, "loss": 1.73, "learning_rate": 2.269105226517983e-05, "epoch": 0.689314976868625, "percentage": 68.93, "elapsed_time": "1 day, 5:16:29", "remaining_time": "13:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12368, "total_steps": 17941, "loss": 1.713, "learning_rate": 2.2683593899810884e-05, "epoch": 0.689370715121788, "percentage": 68.94, "elapsed_time": "1 day, 5:16:38", "remaining_time": "13:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12369, "total_steps": 17941, "loss": 1.746, "learning_rate": 2.2676136400759036e-05, "epoch": 0.6894264533749512, "percentage": 68.94, "elapsed_time": "1 day, 5:16:46", "remaining_time": "13:11:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12370, "total_steps": 17941, "loss": 1.4742, "learning_rate": 2.2668679768260853e-05, "epoch": 0.6894821916281144, "percentage": 68.95, "elapsed_time": "1 day, 5:16:55", "remaining_time": "13:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12371, "total_steps": 17941, "loss": 1.5458, "learning_rate": 2.2661224002552816e-05, "epoch": 0.6895379298812775, "percentage": 68.95, "elapsed_time": "1 day, 5:17:03", "remaining_time": "13:11:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12372, "total_steps": 17941, "loss": 1.723, "learning_rate": 2.2653769103871337e-05, "epoch": 0.6895936681344407, "percentage": 68.96, "elapsed_time": "1 day, 5:17:12", "remaining_time": "13:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12373, "total_steps": 17941, "loss": 1.5082, "learning_rate": 2.2646315072452862e-05, "epoch": 0.6896494063876039, "percentage": 68.96, "elapsed_time": "1 day, 5:17:20", "remaining_time": "13:10:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12374, "total_steps": 17941, "loss": 1.8428, "learning_rate": 2.2638861908533788e-05, "epoch": 0.6897051446407669, "percentage": 68.97, "elapsed_time": "1 day, 5:17:29", "remaining_time": "13:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12375, "total_steps": 17941, "loss": 1.6155, "learning_rate": 2.2631409612350512e-05, "epoch": 0.6897608828939301, "percentage": 68.98, "elapsed_time": "1 day, 5:17:37", "remaining_time": "13:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12376, "total_steps": 17941, "loss": 1.5198, "learning_rate": 2.262395818413931e-05, "epoch": 0.6898166211470933, "percentage": 68.98, "elapsed_time": "1 day, 5:17:46", "remaining_time": "13:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12377, "total_steps": 17941, "loss": 1.7388, "learning_rate": 2.261650762413656e-05, "epoch": 0.6898723594002564, "percentage": 68.99, "elapsed_time": "1 day, 5:17:54", "remaining_time": "13:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12378, "total_steps": 17941, "loss": 1.4587, "learning_rate": 2.2609057932578554e-05, "epoch": 0.6899280976534196, "percentage": 68.99, "elapsed_time": "1 day, 5:18:02", "remaining_time": "13:10:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12379, "total_steps": 17941, "loss": 1.4442, "learning_rate": 2.260160910970151e-05, "epoch": 0.6899838359065827, "percentage": 69.0, "elapsed_time": "1 day, 5:18:12", "remaining_time": "13:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12380, "total_steps": 17941, "loss": 1.613, "learning_rate": 2.2594161155741683e-05, "epoch": 0.6900395741597458, "percentage": 69.0, "elapsed_time": "1 day, 5:18:20", "remaining_time": "13:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12381, "total_steps": 17941, "loss": 1.6245, "learning_rate": 2.2586714070935272e-05, "epoch": 0.690095312412909, "percentage": 69.01, "elapsed_time": "1 day, 5:18:28", "remaining_time": "13:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12382, "total_steps": 17941, "loss": 1.5427, "learning_rate": 2.257926785551848e-05, "epoch": 0.6901510506660721, "percentage": 69.02, "elapsed_time": "1 day, 5:18:37", "remaining_time": "13:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12383, "total_steps": 17941, "loss": 1.6541, "learning_rate": 2.2571822509727426e-05, "epoch": 0.6902067889192353, "percentage": 69.02, "elapsed_time": "1 day, 5:18:45", "remaining_time": "13:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12384, "total_steps": 17941, "loss": 1.6218, "learning_rate": 2.2564378033798217e-05, "epoch": 0.6902625271723984, "percentage": 69.03, "elapsed_time": "1 day, 5:18:55", "remaining_time": "13:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12385, "total_steps": 17941, "loss": 1.7158, "learning_rate": 2.255693442796702e-05, "epoch": 0.6903182654255615, "percentage": 69.03, "elapsed_time": "1 day, 5:19:03", "remaining_time": "13:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12386, "total_steps": 17941, "loss": 1.5469, "learning_rate": 2.254949169246983e-05, "epoch": 0.6903740036787247, "percentage": 69.04, "elapsed_time": "1 day, 5:19:12", "remaining_time": "13:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12387, "total_steps": 17941, "loss": 1.6359, "learning_rate": 2.254204982754273e-05, "epoch": 0.6904297419318879, "percentage": 69.04, "elapsed_time": "1 day, 5:19:20", "remaining_time": "13:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12388, "total_steps": 17941, "loss": 1.5418, "learning_rate": 2.2534608833421712e-05, "epoch": 0.690485480185051, "percentage": 69.05, "elapsed_time": "1 day, 5:19:29", "remaining_time": "13:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12389, "total_steps": 17941, "loss": 1.7552, "learning_rate": 2.252716871034276e-05, "epoch": 0.6905412184382141, "percentage": 69.05, "elapsed_time": "1 day, 5:19:37", "remaining_time": "13:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12390, "total_steps": 17941, "loss": 1.4821, "learning_rate": 2.2519729458541865e-05, "epoch": 0.6905969566913773, "percentage": 69.06, "elapsed_time": "1 day, 5:19:45", "remaining_time": "13:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12391, "total_steps": 17941, "loss": 1.497, "learning_rate": 2.2512291078254914e-05, "epoch": 0.6906526949445404, "percentage": 69.07, "elapsed_time": "1 day, 5:19:54", "remaining_time": "13:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12392, "total_steps": 17941, "loss": 1.7174, "learning_rate": 2.250485356971782e-05, "epoch": 0.6907084331977036, "percentage": 69.07, "elapsed_time": "1 day, 5:20:02", "remaining_time": "13:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12393, "total_steps": 17941, "loss": 1.8879, "learning_rate": 2.249741693316647e-05, "epoch": 0.6907641714508668, "percentage": 69.08, "elapsed_time": "1 day, 5:20:11", "remaining_time": "13:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12394, "total_steps": 17941, "loss": 1.7202, "learning_rate": 2.2489981168836717e-05, "epoch": 0.6908199097040298, "percentage": 69.08, "elapsed_time": "1 day, 5:20:19", "remaining_time": "13:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12395, "total_steps": 17941, "loss": 1.6372, "learning_rate": 2.2482546276964327e-05, "epoch": 0.690875647957193, "percentage": 69.09, "elapsed_time": "1 day, 5:20:28", "remaining_time": "13:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12396, "total_steps": 17941, "loss": 1.6641, "learning_rate": 2.2475112257785157e-05, "epoch": 0.6909313862103562, "percentage": 69.09, "elapsed_time": "1 day, 5:20:36", "remaining_time": "13:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12397, "total_steps": 17941, "loss": 1.6881, "learning_rate": 2.246767911153496e-05, "epoch": 0.6909871244635193, "percentage": 69.1, "elapsed_time": "1 day, 5:20:45", "remaining_time": "13:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12398, "total_steps": 17941, "loss": 1.5398, "learning_rate": 2.246024683844944e-05, "epoch": 0.6910428627166825, "percentage": 69.1, "elapsed_time": "1 day, 5:20:54", "remaining_time": "13:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12399, "total_steps": 17941, "loss": 1.814, "learning_rate": 2.2452815438764318e-05, "epoch": 0.6910986009698457, "percentage": 69.11, "elapsed_time": "1 day, 5:21:02", "remaining_time": "13:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12400, "total_steps": 17941, "loss": 1.8071, "learning_rate": 2.2445384912715284e-05, "epoch": 0.6911543392230087, "percentage": 69.12, "elapsed_time": "1 day, 5:21:11", "remaining_time": "13:06:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12401, "total_steps": 17941, "loss": 1.6608, "learning_rate": 2.2437955260538e-05, "epoch": 0.6912100774761719, "percentage": 69.12, "elapsed_time": "1 day, 5:21:19", "remaining_time": "13:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12402, "total_steps": 17941, "loss": 1.862, "learning_rate": 2.2430526482468045e-05, "epoch": 0.6912658157293351, "percentage": 69.13, "elapsed_time": "1 day, 5:21:28", "remaining_time": "13:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12403, "total_steps": 17941, "loss": 1.4627, "learning_rate": 2.2423098578741065e-05, "epoch": 0.6913215539824982, "percentage": 69.13, "elapsed_time": "1 day, 5:21:37", "remaining_time": "13:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12404, "total_steps": 17941, "loss": 1.7114, "learning_rate": 2.2415671549592632e-05, "epoch": 0.6913772922356614, "percentage": 69.14, "elapsed_time": "1 day, 5:21:45", "remaining_time": "13:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12405, "total_steps": 17941, "loss": 1.6241, "learning_rate": 2.2408245395258248e-05, "epoch": 0.6914330304888244, "percentage": 69.14, "elapsed_time": "1 day, 5:21:54", "remaining_time": "13:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12406, "total_steps": 17941, "loss": 1.6638, "learning_rate": 2.2400820115973453e-05, "epoch": 0.6914887687419876, "percentage": 69.15, "elapsed_time": "1 day, 5:22:02", "remaining_time": "13:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12407, "total_steps": 17941, "loss": 1.4791, "learning_rate": 2.239339571197373e-05, "epoch": 0.6915445069951508, "percentage": 69.15, "elapsed_time": "1 day, 5:22:10", "remaining_time": "13:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12408, "total_steps": 17941, "loss": 1.7044, "learning_rate": 2.2385972183494552e-05, "epoch": 0.6916002452483139, "percentage": 69.16, "elapsed_time": "1 day, 5:22:19", "remaining_time": "13:05:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12409, "total_steps": 17941, "loss": 1.5771, "learning_rate": 2.237854953077132e-05, "epoch": 0.6916559835014771, "percentage": 69.17, "elapsed_time": "1 day, 5:22:28", "remaining_time": "13:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12410, "total_steps": 17941, "loss": 1.523, "learning_rate": 2.2371127754039433e-05, "epoch": 0.6917117217546402, "percentage": 69.17, "elapsed_time": "1 day, 5:22:36", "remaining_time": "13:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12411, "total_steps": 17941, "loss": 1.7749, "learning_rate": 2.236370685353433e-05, "epoch": 0.6917674600078033, "percentage": 69.18, "elapsed_time": "1 day, 5:22:44", "remaining_time": "13:05:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12412, "total_steps": 17941, "loss": 1.7331, "learning_rate": 2.2356286829491284e-05, "epoch": 0.6918231982609665, "percentage": 69.18, "elapsed_time": "1 day, 5:22:53", "remaining_time": "13:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12413, "total_steps": 17941, "loss": 1.299, "learning_rate": 2.2348867682145653e-05, "epoch": 0.6918789365141297, "percentage": 69.19, "elapsed_time": "1 day, 5:23:02", "remaining_time": "13:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12414, "total_steps": 17941, "loss": 1.7712, "learning_rate": 2.2341449411732724e-05, "epoch": 0.6919346747672928, "percentage": 69.19, "elapsed_time": "1 day, 5:23:10", "remaining_time": "13:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12415, "total_steps": 17941, "loss": 1.8, "learning_rate": 2.2334032018487772e-05, "epoch": 0.6919904130204559, "percentage": 69.2, "elapsed_time": "1 day, 5:23:19", "remaining_time": "13:04:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12416, "total_steps": 17941, "loss": 1.7482, "learning_rate": 2.2326615502646002e-05, "epoch": 0.6920461512736191, "percentage": 69.2, "elapsed_time": "1 day, 5:23:28", "remaining_time": "13:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12417, "total_steps": 17941, "loss": 1.867, "learning_rate": 2.2319199864442648e-05, "epoch": 0.6921018895267822, "percentage": 69.21, "elapsed_time": "1 day, 5:23:36", "remaining_time": "13:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12418, "total_steps": 17941, "loss": 1.627, "learning_rate": 2.2311785104112876e-05, "epoch": 0.6921576277799454, "percentage": 69.22, "elapsed_time": "1 day, 5:23:45", "remaining_time": "13:04:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12419, "total_steps": 17941, "loss": 1.5884, "learning_rate": 2.230437122189185e-05, "epoch": 0.6922133660331086, "percentage": 69.22, "elapsed_time": "1 day, 5:23:53", "remaining_time": "13:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12420, "total_steps": 17941, "loss": 1.5532, "learning_rate": 2.2296958218014712e-05, "epoch": 0.6922691042862716, "percentage": 69.23, "elapsed_time": "1 day, 5:24:01", "remaining_time": "13:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12421, "total_steps": 17941, "loss": 1.5991, "learning_rate": 2.22895460927165e-05, "epoch": 0.6923248425394348, "percentage": 69.23, "elapsed_time": "1 day, 5:24:10", "remaining_time": "13:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12422, "total_steps": 17941, "loss": 1.6068, "learning_rate": 2.2282134846232343e-05, "epoch": 0.692380580792598, "percentage": 69.24, "elapsed_time": "1 day, 5:24:18", "remaining_time": "13:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12423, "total_steps": 17941, "loss": 1.4699, "learning_rate": 2.227472447879728e-05, "epoch": 0.6924363190457611, "percentage": 69.24, "elapsed_time": "1 day, 5:24:28", "remaining_time": "13:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12424, "total_steps": 17941, "loss": 1.7881, "learning_rate": 2.2267314990646294e-05, "epoch": 0.6924920572989243, "percentage": 69.25, "elapsed_time": "1 day, 5:24:36", "remaining_time": "13:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12425, "total_steps": 17941, "loss": 1.4128, "learning_rate": 2.225990638201438e-05, "epoch": 0.6925477955520875, "percentage": 69.25, "elapsed_time": "1 day, 5:24:45", "remaining_time": "13:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12426, "total_steps": 17941, "loss": 1.6069, "learning_rate": 2.2252498653136493e-05, "epoch": 0.6926035338052505, "percentage": 69.26, "elapsed_time": "1 day, 5:24:53", "remaining_time": "13:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12427, "total_steps": 17941, "loss": 1.6399, "learning_rate": 2.22450918042476e-05, "epoch": 0.6926592720584137, "percentage": 69.27, "elapsed_time": "1 day, 5:25:01", "remaining_time": "13:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12428, "total_steps": 17941, "loss": 1.5405, "learning_rate": 2.2237685835582527e-05, "epoch": 0.6927150103115768, "percentage": 69.27, "elapsed_time": "1 day, 5:25:10", "remaining_time": "13:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12429, "total_steps": 17941, "loss": 1.7644, "learning_rate": 2.2230280747376216e-05, "epoch": 0.69277074856474, "percentage": 69.28, "elapsed_time": "1 day, 5:25:18", "remaining_time": "13:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12430, "total_steps": 17941, "loss": 1.5258, "learning_rate": 2.2222876539863508e-05, "epoch": 0.6928264868179032, "percentage": 69.28, "elapsed_time": "1 day, 5:25:27", "remaining_time": "13:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12431, "total_steps": 17941, "loss": 1.8579, "learning_rate": 2.221547321327918e-05, "epoch": 0.6928822250710662, "percentage": 69.29, "elapsed_time": "1 day, 5:25:35", "remaining_time": "13:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12432, "total_steps": 17941, "loss": 1.5001, "learning_rate": 2.2208070767858057e-05, "epoch": 0.6929379633242294, "percentage": 69.29, "elapsed_time": "1 day, 5:25:44", "remaining_time": "13:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12433, "total_steps": 17941, "loss": 1.6712, "learning_rate": 2.2200669203834885e-05, "epoch": 0.6929937015773926, "percentage": 69.3, "elapsed_time": "1 day, 5:25:53", "remaining_time": "13:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12434, "total_steps": 17941, "loss": 1.631, "learning_rate": 2.2193268521444428e-05, "epoch": 0.6930494398305557, "percentage": 69.3, "elapsed_time": "1 day, 5:26:01", "remaining_time": "13:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12435, "total_steps": 17941, "loss": 1.7087, "learning_rate": 2.2185868720921342e-05, "epoch": 0.6931051780837189, "percentage": 69.31, "elapsed_time": "1 day, 5:26:09", "remaining_time": "13:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12436, "total_steps": 17941, "loss": 1.7335, "learning_rate": 2.217846980250032e-05, "epoch": 0.693160916336882, "percentage": 69.32, "elapsed_time": "1 day, 5:26:18", "remaining_time": "13:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12437, "total_steps": 17941, "loss": 1.8468, "learning_rate": 2.2171071766416064e-05, "epoch": 0.6932166545900451, "percentage": 69.32, "elapsed_time": "1 day, 5:26:26", "remaining_time": "13:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12438, "total_steps": 17941, "loss": 1.5575, "learning_rate": 2.2163674612903135e-05, "epoch": 0.6932723928432083, "percentage": 69.33, "elapsed_time": "1 day, 5:26:35", "remaining_time": "13:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12439, "total_steps": 17941, "loss": 1.7773, "learning_rate": 2.215627834219615e-05, "epoch": 0.6933281310963715, "percentage": 69.33, "elapsed_time": "1 day, 5:26:44", "remaining_time": "13:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12440, "total_steps": 17941, "loss": 1.7082, "learning_rate": 2.2148882954529676e-05, "epoch": 0.6933838693495346, "percentage": 69.34, "elapsed_time": "1 day, 5:26:52", "remaining_time": "13:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12441, "total_steps": 17941, "loss": 1.7633, "learning_rate": 2.2141488450138277e-05, "epoch": 0.6934396076026977, "percentage": 69.34, "elapsed_time": "1 day, 5:27:00", "remaining_time": "13:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12442, "total_steps": 17941, "loss": 1.4418, "learning_rate": 2.2134094829256408e-05, "epoch": 0.6934953458558609, "percentage": 69.35, "elapsed_time": "1 day, 5:27:09", "remaining_time": "13:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12443, "total_steps": 17941, "loss": 1.6666, "learning_rate": 2.2126702092118572e-05, "epoch": 0.693551084109024, "percentage": 69.36, "elapsed_time": "1 day, 5:27:18", "remaining_time": "13:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12444, "total_steps": 17941, "loss": 1.8063, "learning_rate": 2.2119310238959268e-05, "epoch": 0.6936068223621872, "percentage": 69.36, "elapsed_time": "1 day, 5:27:26", "remaining_time": "13:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12445, "total_steps": 17941, "loss": 1.8061, "learning_rate": 2.2111919270012866e-05, "epoch": 0.6936625606153504, "percentage": 69.37, "elapsed_time": "1 day, 5:27:35", "remaining_time": "13:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12446, "total_steps": 17941, "loss": 1.7359, "learning_rate": 2.2104529185513806e-05, "epoch": 0.6937182988685134, "percentage": 69.37, "elapsed_time": "1 day, 5:27:43", "remaining_time": "13:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12447, "total_steps": 17941, "loss": 1.7572, "learning_rate": 2.2097139985696404e-05, "epoch": 0.6937740371216766, "percentage": 69.38, "elapsed_time": "1 day, 5:27:52", "remaining_time": "13:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12448, "total_steps": 17941, "loss": 1.8654, "learning_rate": 2.208975167079505e-05, "epoch": 0.6938297753748398, "percentage": 69.38, "elapsed_time": "1 day, 5:28:00", "remaining_time": "13:00:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12449, "total_steps": 17941, "loss": 1.625, "learning_rate": 2.2082364241044068e-05, "epoch": 0.6938855136280029, "percentage": 69.39, "elapsed_time": "1 day, 5:28:09", "remaining_time": "13:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12450, "total_steps": 17941, "loss": 1.685, "learning_rate": 2.2074977696677703e-05, "epoch": 0.6939412518811661, "percentage": 69.39, "elapsed_time": "1 day, 5:28:17", "remaining_time": "12:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12451, "total_steps": 17941, "loss": 1.6458, "learning_rate": 2.2067592037930224e-05, "epoch": 0.6939969901343291, "percentage": 69.4, "elapsed_time": "1 day, 5:28:26", "remaining_time": "12:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12452, "total_steps": 17941, "loss": 1.6008, "learning_rate": 2.2060207265035876e-05, "epoch": 0.6940527283874923, "percentage": 69.41, "elapsed_time": "1 day, 5:28:34", "remaining_time": "12:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12453, "total_steps": 17941, "loss": 1.4996, "learning_rate": 2.205282337822887e-05, "epoch": 0.6941084666406555, "percentage": 69.41, "elapsed_time": "1 day, 5:28:42", "remaining_time": "12:59:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12454, "total_steps": 17941, "loss": 1.8717, "learning_rate": 2.2045440377743325e-05, "epoch": 0.6941642048938186, "percentage": 69.42, "elapsed_time": "1 day, 5:28:51", "remaining_time": "12:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12455, "total_steps": 17941, "loss": 1.7107, "learning_rate": 2.2038058263813443e-05, "epoch": 0.6942199431469818, "percentage": 69.42, "elapsed_time": "1 day, 5:28:59", "remaining_time": "12:59:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12456, "total_steps": 17941, "loss": 1.4656, "learning_rate": 2.203067703667334e-05, "epoch": 0.694275681400145, "percentage": 69.43, "elapsed_time": "1 day, 5:29:08", "remaining_time": "12:59:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12457, "total_steps": 17941, "loss": 1.8354, "learning_rate": 2.202329669655708e-05, "epoch": 0.694331419653308, "percentage": 69.43, "elapsed_time": "1 day, 5:29:17", "remaining_time": "12:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12458, "total_steps": 17941, "loss": 1.6724, "learning_rate": 2.2015917243698725e-05, "epoch": 0.6943871579064712, "percentage": 69.44, "elapsed_time": "1 day, 5:29:25", "remaining_time": "12:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12459, "total_steps": 17941, "loss": 1.7463, "learning_rate": 2.2008538678332314e-05, "epoch": 0.6944428961596344, "percentage": 69.44, "elapsed_time": "1 day, 5:29:33", "remaining_time": "12:58:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12460, "total_steps": 17941, "loss": 1.743, "learning_rate": 2.200116100069188e-05, "epoch": 0.6944986344127975, "percentage": 69.45, "elapsed_time": "1 day, 5:29:42", "remaining_time": "12:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12461, "total_steps": 17941, "loss": 1.6518, "learning_rate": 2.1993784211011353e-05, "epoch": 0.6945543726659607, "percentage": 69.46, "elapsed_time": "1 day, 5:29:50", "remaining_time": "12:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12462, "total_steps": 17941, "loss": 1.4703, "learning_rate": 2.1986408309524682e-05, "epoch": 0.6946101109191238, "percentage": 69.46, "elapsed_time": "1 day, 5:29:59", "remaining_time": "12:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12463, "total_steps": 17941, "loss": 1.6126, "learning_rate": 2.197903329646585e-05, "epoch": 0.6946658491722869, "percentage": 69.47, "elapsed_time": "1 day, 5:30:07", "remaining_time": "12:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12464, "total_steps": 17941, "loss": 1.8363, "learning_rate": 2.1971659172068688e-05, "epoch": 0.6947215874254501, "percentage": 69.47, "elapsed_time": "1 day, 5:30:16", "remaining_time": "12:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12465, "total_steps": 17941, "loss": 1.3474, "learning_rate": 2.196428593656708e-05, "epoch": 0.6947773256786133, "percentage": 69.48, "elapsed_time": "1 day, 5:30:24", "remaining_time": "12:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12466, "total_steps": 17941, "loss": 1.7261, "learning_rate": 2.1956913590194867e-05, "epoch": 0.6948330639317764, "percentage": 69.48, "elapsed_time": "1 day, 5:30:33", "remaining_time": "12:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12467, "total_steps": 17941, "loss": 1.6184, "learning_rate": 2.1949542133185864e-05, "epoch": 0.6948888021849395, "percentage": 69.49, "elapsed_time": "1 day, 5:30:41", "remaining_time": "12:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12468, "total_steps": 17941, "loss": 1.6595, "learning_rate": 2.194217156577383e-05, "epoch": 0.6949445404381027, "percentage": 69.49, "elapsed_time": "1 day, 5:30:50", "remaining_time": "12:57:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12469, "total_steps": 17941, "loss": 1.4192, "learning_rate": 2.1934801888192496e-05, "epoch": 0.6950002786912658, "percentage": 69.5, "elapsed_time": "1 day, 5:30:59", "remaining_time": "12:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12470, "total_steps": 17941, "loss": 1.9271, "learning_rate": 2.1927433100675652e-05, "epoch": 0.695056016944429, "percentage": 69.51, "elapsed_time": "1 day, 5:31:07", "remaining_time": "12:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12471, "total_steps": 17941, "loss": 1.8332, "learning_rate": 2.1920065203456946e-05, "epoch": 0.6951117551975922, "percentage": 69.51, "elapsed_time": "1 day, 5:31:16", "remaining_time": "12:56:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12472, "total_steps": 17941, "loss": 1.8357, "learning_rate": 2.191269819677007e-05, "epoch": 0.6951674934507552, "percentage": 69.52, "elapsed_time": "1 day, 5:31:25", "remaining_time": "12:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12473, "total_steps": 17941, "loss": 1.9264, "learning_rate": 2.1905332080848606e-05, "epoch": 0.6952232317039184, "percentage": 69.52, "elapsed_time": "1 day, 5:31:33", "remaining_time": "12:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12474, "total_steps": 17941, "loss": 1.7122, "learning_rate": 2.1897966855926227e-05, "epoch": 0.6952789699570815, "percentage": 69.53, "elapsed_time": "1 day, 5:31:42", "remaining_time": "12:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12475, "total_steps": 17941, "loss": 1.5732, "learning_rate": 2.189060252223651e-05, "epoch": 0.6953347082102447, "percentage": 69.53, "elapsed_time": "1 day, 5:31:50", "remaining_time": "12:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12476, "total_steps": 17941, "loss": 1.6042, "learning_rate": 2.1883239080012973e-05, "epoch": 0.6953904464634079, "percentage": 69.54, "elapsed_time": "1 day, 5:31:59", "remaining_time": "12:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12477, "total_steps": 17941, "loss": 1.5583, "learning_rate": 2.1875876529489165e-05, "epoch": 0.6954461847165709, "percentage": 69.54, "elapsed_time": "1 day, 5:32:07", "remaining_time": "12:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12478, "total_steps": 17941, "loss": 1.6155, "learning_rate": 2.1868514870898572e-05, "epoch": 0.6955019229697341, "percentage": 69.55, "elapsed_time": "1 day, 5:32:16", "remaining_time": "12:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12479, "total_steps": 17941, "loss": 1.506, "learning_rate": 2.186115410447469e-05, "epoch": 0.6955576612228973, "percentage": 69.56, "elapsed_time": "1 day, 5:32:24", "remaining_time": "12:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12480, "total_steps": 17941, "loss": 1.5715, "learning_rate": 2.1853794230450903e-05, "epoch": 0.6956133994760604, "percentage": 69.56, "elapsed_time": "1 day, 5:32:32", "remaining_time": "12:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12481, "total_steps": 17941, "loss": 1.6175, "learning_rate": 2.1846435249060677e-05, "epoch": 0.6956691377292236, "percentage": 69.57, "elapsed_time": "1 day, 5:32:41", "remaining_time": "12:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12482, "total_steps": 17941, "loss": 1.4722, "learning_rate": 2.18390771605374e-05, "epoch": 0.6957248759823867, "percentage": 69.57, "elapsed_time": "1 day, 5:32:49", "remaining_time": "12:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12483, "total_steps": 17941, "loss": 1.6391, "learning_rate": 2.1831719965114383e-05, "epoch": 0.6957806142355498, "percentage": 69.58, "elapsed_time": "1 day, 5:32:58", "remaining_time": "12:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12484, "total_steps": 17941, "loss": 1.6116, "learning_rate": 2.1824363663024976e-05, "epoch": 0.695836352488713, "percentage": 69.58, "elapsed_time": "1 day, 5:33:06", "remaining_time": "12:55:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12485, "total_steps": 17941, "loss": 1.7712, "learning_rate": 2.181700825450248e-05, "epoch": 0.6958920907418762, "percentage": 69.59, "elapsed_time": "1 day, 5:33:15", "remaining_time": "12:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12486, "total_steps": 17941, "loss": 1.5029, "learning_rate": 2.1809653739780182e-05, "epoch": 0.6959478289950393, "percentage": 69.59, "elapsed_time": "1 day, 5:33:23", "remaining_time": "12:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12487, "total_steps": 17941, "loss": 1.5279, "learning_rate": 2.180230011909129e-05, "epoch": 0.6960035672482024, "percentage": 69.6, "elapsed_time": "1 day, 5:33:32", "remaining_time": "12:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12488, "total_steps": 17941, "loss": 1.4994, "learning_rate": 2.1794947392669013e-05, "epoch": 0.6960593055013656, "percentage": 69.61, "elapsed_time": "1 day, 5:33:40", "remaining_time": "12:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12489, "total_steps": 17941, "loss": 1.7903, "learning_rate": 2.1787595560746593e-05, "epoch": 0.6961150437545287, "percentage": 69.61, "elapsed_time": "1 day, 5:33:48", "remaining_time": "12:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12490, "total_steps": 17941, "loss": 1.5443, "learning_rate": 2.178024462355714e-05, "epoch": 0.6961707820076919, "percentage": 69.62, "elapsed_time": "1 day, 5:33:57", "remaining_time": "12:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12491, "total_steps": 17941, "loss": 1.5959, "learning_rate": 2.1772894581333792e-05, "epoch": 0.6962265202608551, "percentage": 69.62, "elapsed_time": "1 day, 5:34:06", "remaining_time": "12:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12492, "total_steps": 17941, "loss": 1.4327, "learning_rate": 2.176554543430965e-05, "epoch": 0.6962822585140181, "percentage": 69.63, "elapsed_time": "1 day, 5:34:14", "remaining_time": "12:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12493, "total_steps": 17941, "loss": 1.7718, "learning_rate": 2.175819718271781e-05, "epoch": 0.6963379967671813, "percentage": 69.63, "elapsed_time": "1 day, 5:34:23", "remaining_time": "12:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12494, "total_steps": 17941, "loss": 1.5627, "learning_rate": 2.1750849826791275e-05, "epoch": 0.6963937350203445, "percentage": 69.64, "elapsed_time": "1 day, 5:34:31", "remaining_time": "12:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12495, "total_steps": 17941, "loss": 1.6201, "learning_rate": 2.1743503366763058e-05, "epoch": 0.6964494732735076, "percentage": 69.64, "elapsed_time": "1 day, 5:34:39", "remaining_time": "12:53:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12496, "total_steps": 17941, "loss": 1.6484, "learning_rate": 2.173615780286621e-05, "epoch": 0.6965052115266708, "percentage": 69.65, "elapsed_time": "1 day, 5:34:48", "remaining_time": "12:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12497, "total_steps": 17941, "loss": 1.5867, "learning_rate": 2.172881313533362e-05, "epoch": 0.6965609497798338, "percentage": 69.66, "elapsed_time": "1 day, 5:34:56", "remaining_time": "12:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12498, "total_steps": 17941, "loss": 1.6964, "learning_rate": 2.1721469364398274e-05, "epoch": 0.696616688032997, "percentage": 69.66, "elapsed_time": "1 day, 5:35:05", "remaining_time": "12:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12499, "total_steps": 17941, "loss": 1.4694, "learning_rate": 2.1714126490292998e-05, "epoch": 0.6966724262861602, "percentage": 69.67, "elapsed_time": "1 day, 5:35:14", "remaining_time": "12:52:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12500, "total_steps": 17941, "loss": 1.679, "learning_rate": 2.1706784513250734e-05, "epoch": 0.6967281645393233, "percentage": 69.67, "elapsed_time": "1 day, 5:35:23", "remaining_time": "12:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12501, "total_steps": 17941, "loss": 1.8925, "learning_rate": 2.1699443433504326e-05, "epoch": 0.6967839027924865, "percentage": 69.68, "elapsed_time": "1 day, 5:35:31", "remaining_time": "12:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12502, "total_steps": 17941, "loss": 1.5665, "learning_rate": 2.1692103251286544e-05, "epoch": 0.6968396410456497, "percentage": 69.68, "elapsed_time": "1 day, 5:35:40", "remaining_time": "12:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12503, "total_steps": 17941, "loss": 1.5741, "learning_rate": 2.1684763966830208e-05, "epoch": 0.6968953792988127, "percentage": 69.69, "elapsed_time": "1 day, 5:35:48", "remaining_time": "12:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12504, "total_steps": 17941, "loss": 1.6109, "learning_rate": 2.167742558036806e-05, "epoch": 0.6969511175519759, "percentage": 69.7, "elapsed_time": "1 day, 5:35:57", "remaining_time": "12:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12505, "total_steps": 17941, "loss": 1.5966, "learning_rate": 2.1670088092132866e-05, "epoch": 0.6970068558051391, "percentage": 69.7, "elapsed_time": "1 day, 5:36:05", "remaining_time": "12:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12506, "total_steps": 17941, "loss": 1.7803, "learning_rate": 2.1662751502357265e-05, "epoch": 0.6970625940583022, "percentage": 69.71, "elapsed_time": "1 day, 5:36:14", "remaining_time": "12:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12507, "total_steps": 17941, "loss": 1.366, "learning_rate": 2.1655415811273988e-05, "epoch": 0.6971183323114654, "percentage": 69.71, "elapsed_time": "1 day, 5:36:22", "remaining_time": "12:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12508, "total_steps": 17941, "loss": 1.7152, "learning_rate": 2.1648081019115675e-05, "epoch": 0.6971740705646285, "percentage": 69.72, "elapsed_time": "1 day, 5:36:31", "remaining_time": "12:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12509, "total_steps": 17941, "loss": 1.6061, "learning_rate": 2.1640747126114915e-05, "epoch": 0.6972298088177916, "percentage": 69.72, "elapsed_time": "1 day, 5:36:39", "remaining_time": "12:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12510, "total_steps": 17941, "loss": 1.455, "learning_rate": 2.163341413250431e-05, "epoch": 0.6972855470709548, "percentage": 69.73, "elapsed_time": "1 day, 5:36:47", "remaining_time": "12:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12511, "total_steps": 17941, "loss": 1.554, "learning_rate": 2.1626082038516415e-05, "epoch": 0.697341285324118, "percentage": 69.73, "elapsed_time": "1 day, 5:36:56", "remaining_time": "12:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12512, "total_steps": 17941, "loss": 1.4238, "learning_rate": 2.161875084438379e-05, "epoch": 0.6973970235772811, "percentage": 69.74, "elapsed_time": "1 day, 5:37:04", "remaining_time": "12:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12513, "total_steps": 17941, "loss": 1.6579, "learning_rate": 2.1611420550338894e-05, "epoch": 0.6974527618304442, "percentage": 69.75, "elapsed_time": "1 day, 5:37:13", "remaining_time": "12:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12514, "total_steps": 17941, "loss": 1.7723, "learning_rate": 2.1604091156614204e-05, "epoch": 0.6975085000836074, "percentage": 69.75, "elapsed_time": "1 day, 5:37:21", "remaining_time": "12:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12515, "total_steps": 17941, "loss": 1.5309, "learning_rate": 2.1596762663442218e-05, "epoch": 0.6975642383367705, "percentage": 69.76, "elapsed_time": "1 day, 5:37:30", "remaining_time": "12:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12516, "total_steps": 17941, "loss": 1.6055, "learning_rate": 2.1589435071055296e-05, "epoch": 0.6976199765899337, "percentage": 69.76, "elapsed_time": "1 day, 5:37:38", "remaining_time": "12:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12517, "total_steps": 17941, "loss": 1.8028, "learning_rate": 2.1582108379685856e-05, "epoch": 0.6976757148430969, "percentage": 69.77, "elapsed_time": "1 day, 5:37:47", "remaining_time": "12:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12518, "total_steps": 17941, "loss": 1.6126, "learning_rate": 2.1574782589566244e-05, "epoch": 0.69773145309626, "percentage": 69.77, "elapsed_time": "1 day, 5:37:55", "remaining_time": "12:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12519, "total_steps": 17941, "loss": 1.6897, "learning_rate": 2.1567457700928822e-05, "epoch": 0.6977871913494231, "percentage": 69.78, "elapsed_time": "1 day, 5:38:03", "remaining_time": "12:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12520, "total_steps": 17941, "loss": 1.5911, "learning_rate": 2.1560133714005848e-05, "epoch": 0.6978429296025862, "percentage": 69.78, "elapsed_time": "1 day, 5:38:12", "remaining_time": "12:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12521, "total_steps": 17941, "loss": 1.7061, "learning_rate": 2.1552810629029596e-05, "epoch": 0.6978986678557494, "percentage": 69.79, "elapsed_time": "1 day, 5:38:20", "remaining_time": "12:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12522, "total_steps": 17941, "loss": 1.5237, "learning_rate": 2.154548844623237e-05, "epoch": 0.6979544061089126, "percentage": 69.8, "elapsed_time": "1 day, 5:38:29", "remaining_time": "12:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12523, "total_steps": 17941, "loss": 1.7261, "learning_rate": 2.1538167165846333e-05, "epoch": 0.6980101443620756, "percentage": 69.8, "elapsed_time": "1 day, 5:38:37", "remaining_time": "12:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12524, "total_steps": 17941, "loss": 1.7511, "learning_rate": 2.1530846788103686e-05, "epoch": 0.6980658826152388, "percentage": 69.81, "elapsed_time": "1 day, 5:38:46", "remaining_time": "12:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12525, "total_steps": 17941, "loss": 1.6178, "learning_rate": 2.1523527313236598e-05, "epoch": 0.698121620868402, "percentage": 69.81, "elapsed_time": "1 day, 5:38:54", "remaining_time": "12:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12526, "total_steps": 17941, "loss": 1.436, "learning_rate": 2.1516208741477207e-05, "epoch": 0.6981773591215651, "percentage": 69.82, "elapsed_time": "1 day, 5:39:03", "remaining_time": "12:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12527, "total_steps": 17941, "loss": 1.4729, "learning_rate": 2.1508891073057587e-05, "epoch": 0.6982330973747283, "percentage": 69.82, "elapsed_time": "1 day, 5:39:11", "remaining_time": "12:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12528, "total_steps": 17941, "loss": 1.9092, "learning_rate": 2.1501574308209828e-05, "epoch": 0.6982888356278915, "percentage": 69.83, "elapsed_time": "1 day, 5:39:20", "remaining_time": "12:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12529, "total_steps": 17941, "loss": 1.6061, "learning_rate": 2.1494258447165973e-05, "epoch": 0.6983445738810545, "percentage": 69.83, "elapsed_time": "1 day, 5:39:28", "remaining_time": "12:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12530, "total_steps": 17941, "loss": 1.828, "learning_rate": 2.1486943490158034e-05, "epoch": 0.6984003121342177, "percentage": 69.84, "elapsed_time": "1 day, 5:39:36", "remaining_time": "12:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12531, "total_steps": 17941, "loss": 1.8147, "learning_rate": 2.1479629437418032e-05, "epoch": 0.6984560503873809, "percentage": 69.85, "elapsed_time": "1 day, 5:39:45", "remaining_time": "12:48:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12532, "total_steps": 17941, "loss": 1.6662, "learning_rate": 2.1472316289177856e-05, "epoch": 0.698511788640544, "percentage": 69.85, "elapsed_time": "1 day, 5:39:53", "remaining_time": "12:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12533, "total_steps": 17941, "loss": 1.5294, "learning_rate": 2.1465004045669505e-05, "epoch": 0.6985675268937072, "percentage": 69.86, "elapsed_time": "1 day, 5:40:02", "remaining_time": "12:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12534, "total_steps": 17941, "loss": 1.7331, "learning_rate": 2.145769270712487e-05, "epoch": 0.6986232651468703, "percentage": 69.86, "elapsed_time": "1 day, 5:40:11", "remaining_time": "12:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12535, "total_steps": 17941, "loss": 1.5622, "learning_rate": 2.1450382273775788e-05, "epoch": 0.6986790034000334, "percentage": 69.87, "elapsed_time": "1 day, 5:40:19", "remaining_time": "12:47:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12536, "total_steps": 17941, "loss": 1.418, "learning_rate": 2.144307274585413e-05, "epoch": 0.6987347416531966, "percentage": 69.87, "elapsed_time": "1 day, 5:40:28", "remaining_time": "12:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12537, "total_steps": 17941, "loss": 1.5661, "learning_rate": 2.14357641235917e-05, "epoch": 0.6987904799063598, "percentage": 69.88, "elapsed_time": "1 day, 5:40:36", "remaining_time": "12:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12538, "total_steps": 17941, "loss": 1.8971, "learning_rate": 2.1428456407220315e-05, "epoch": 0.6988462181595229, "percentage": 69.88, "elapsed_time": "1 day, 5:40:45", "remaining_time": "12:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12539, "total_steps": 17941, "loss": 1.5624, "learning_rate": 2.142114959697169e-05, "epoch": 0.698901956412686, "percentage": 69.89, "elapsed_time": "1 day, 5:40:53", "remaining_time": "12:47:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12540, "total_steps": 17941, "loss": 1.7243, "learning_rate": 2.1413843693077552e-05, "epoch": 0.6989576946658492, "percentage": 69.9, "elapsed_time": "1 day, 5:41:02", "remaining_time": "12:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12541, "total_steps": 17941, "loss": 1.5812, "learning_rate": 2.140653869576966e-05, "epoch": 0.6990134329190123, "percentage": 69.9, "elapsed_time": "1 day, 5:41:10", "remaining_time": "12:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12542, "total_steps": 17941, "loss": 1.6288, "learning_rate": 2.1399234605279634e-05, "epoch": 0.6990691711721755, "percentage": 69.91, "elapsed_time": "1 day, 5:41:19", "remaining_time": "12:46:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12543, "total_steps": 17941, "loss": 1.6193, "learning_rate": 2.1391931421839127e-05, "epoch": 0.6991249094253386, "percentage": 69.91, "elapsed_time": "1 day, 5:41:27", "remaining_time": "12:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12544, "total_steps": 17941, "loss": 1.8533, "learning_rate": 2.1384629145679765e-05, "epoch": 0.6991806476785017, "percentage": 69.92, "elapsed_time": "1 day, 5:41:35", "remaining_time": "12:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12545, "total_steps": 17941, "loss": 1.8032, "learning_rate": 2.137732777703314e-05, "epoch": 0.6992363859316649, "percentage": 69.92, "elapsed_time": "1 day, 5:41:44", "remaining_time": "12:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12546, "total_steps": 17941, "loss": 1.8345, "learning_rate": 2.137002731613078e-05, "epoch": 0.699292124184828, "percentage": 69.93, "elapsed_time": "1 day, 5:41:52", "remaining_time": "12:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12547, "total_steps": 17941, "loss": 1.6405, "learning_rate": 2.1362727763204216e-05, "epoch": 0.6993478624379912, "percentage": 69.93, "elapsed_time": "1 day, 5:42:01", "remaining_time": "12:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12548, "total_steps": 17941, "loss": 1.4639, "learning_rate": 2.1355429118484986e-05, "epoch": 0.6994036006911544, "percentage": 69.94, "elapsed_time": "1 day, 5:42:10", "remaining_time": "12:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12549, "total_steps": 17941, "loss": 1.6657, "learning_rate": 2.1348131382204527e-05, "epoch": 0.6994593389443174, "percentage": 69.95, "elapsed_time": "1 day, 5:42:18", "remaining_time": "12:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12550, "total_steps": 17941, "loss": 1.7891, "learning_rate": 2.1340834554594287e-05, "epoch": 0.6995150771974806, "percentage": 69.95, "elapsed_time": "1 day, 5:42:27", "remaining_time": "12:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12551, "total_steps": 17941, "loss": 1.9755, "learning_rate": 2.1333538635885674e-05, "epoch": 0.6995708154506438, "percentage": 69.96, "elapsed_time": "1 day, 5:42:35", "remaining_time": "12:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12552, "total_steps": 17941, "loss": 1.4889, "learning_rate": 2.13262436263101e-05, "epoch": 0.6996265537038069, "percentage": 69.96, "elapsed_time": "1 day, 5:42:44", "remaining_time": "12:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12553, "total_steps": 17941, "loss": 1.3855, "learning_rate": 2.131894952609888e-05, "epoch": 0.6996822919569701, "percentage": 69.97, "elapsed_time": "1 day, 5:42:52", "remaining_time": "12:45:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12554, "total_steps": 17941, "loss": 1.8536, "learning_rate": 2.131165633548336e-05, "epoch": 0.6997380302101333, "percentage": 69.97, "elapsed_time": "1 day, 5:43:01", "remaining_time": "12:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12555, "total_steps": 17941, "loss": 1.6022, "learning_rate": 2.1304364054694835e-05, "epoch": 0.6997937684632963, "percentage": 69.98, "elapsed_time": "1 day, 5:43:09", "remaining_time": "12:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12556, "total_steps": 17941, "loss": 1.812, "learning_rate": 2.129707268396458e-05, "epoch": 0.6998495067164595, "percentage": 69.98, "elapsed_time": "1 day, 5:43:18", "remaining_time": "12:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12557, "total_steps": 17941, "loss": 1.7548, "learning_rate": 2.1289782223523848e-05, "epoch": 0.6999052449696227, "percentage": 69.99, "elapsed_time": "1 day, 5:43:27", "remaining_time": "12:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12558, "total_steps": 17941, "loss": 1.5542, "learning_rate": 2.1282492673603788e-05, "epoch": 0.6999609832227858, "percentage": 70.0, "elapsed_time": "1 day, 5:43:36", "remaining_time": "12:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12559, "total_steps": 17941, "loss": 1.7433, "learning_rate": 2.1275204034435647e-05, "epoch": 0.700016721475949, "percentage": 70.0, "elapsed_time": "1 day, 5:43:44", "remaining_time": "12:44:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12560, "total_steps": 17941, "loss": 1.7956, "learning_rate": 2.1267916306250573e-05, "epoch": 0.7000724597291121, "percentage": 70.01, "elapsed_time": "1 day, 5:43:52", "remaining_time": "12:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12561, "total_steps": 17941, "loss": 1.1928, "learning_rate": 2.126062948927966e-05, "epoch": 0.7001281979822752, "percentage": 70.01, "elapsed_time": "1 day, 5:44:01", "remaining_time": "12:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12562, "total_steps": 17941, "loss": 1.6835, "learning_rate": 2.1253343583754016e-05, "epoch": 0.7001839362354384, "percentage": 70.02, "elapsed_time": "1 day, 5:44:09", "remaining_time": "12:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12563, "total_steps": 17941, "loss": 1.7763, "learning_rate": 2.124605858990471e-05, "epoch": 0.7002396744886016, "percentage": 70.02, "elapsed_time": "1 day, 5:44:18", "remaining_time": "12:43:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12564, "total_steps": 17941, "loss": 1.5703, "learning_rate": 2.1238774507962795e-05, "epoch": 0.7002954127417647, "percentage": 70.03, "elapsed_time": "1 day, 5:44:26", "remaining_time": "12:43:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12565, "total_steps": 17941, "loss": 1.7078, "learning_rate": 2.123149133815925e-05, "epoch": 0.7003511509949278, "percentage": 70.04, "elapsed_time": "1 day, 5:44:35", "remaining_time": "12:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12566, "total_steps": 17941, "loss": 1.6979, "learning_rate": 2.1224209080725042e-05, "epoch": 0.7004068892480909, "percentage": 70.04, "elapsed_time": "1 day, 5:44:44", "remaining_time": "12:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12567, "total_steps": 17941, "loss": 1.3949, "learning_rate": 2.1216927735891183e-05, "epoch": 0.7004626275012541, "percentage": 70.05, "elapsed_time": "1 day, 5:44:52", "remaining_time": "12:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12568, "total_steps": 17941, "loss": 1.6486, "learning_rate": 2.1209647303888546e-05, "epoch": 0.7005183657544173, "percentage": 70.05, "elapsed_time": "1 day, 5:45:01", "remaining_time": "12:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12569, "total_steps": 17941, "loss": 1.7111, "learning_rate": 2.1202367784948036e-05, "epoch": 0.7005741040075804, "percentage": 70.06, "elapsed_time": "1 day, 5:45:09", "remaining_time": "12:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12570, "total_steps": 17941, "loss": 1.5828, "learning_rate": 2.119508917930052e-05, "epoch": 0.7006298422607435, "percentage": 70.06, "elapsed_time": "1 day, 5:45:18", "remaining_time": "12:42:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12571, "total_steps": 17941, "loss": 1.499, "learning_rate": 2.1187811487176845e-05, "epoch": 0.7006855805139067, "percentage": 70.07, "elapsed_time": "1 day, 5:45:26", "remaining_time": "12:42:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12572, "total_steps": 17941, "loss": 1.6988, "learning_rate": 2.1180534708807787e-05, "epoch": 0.7007413187670698, "percentage": 70.07, "elapsed_time": "1 day, 5:45:35", "remaining_time": "12:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12573, "total_steps": 17941, "loss": 1.3717, "learning_rate": 2.117325884442412e-05, "epoch": 0.700797057020233, "percentage": 70.08, "elapsed_time": "1 day, 5:45:43", "remaining_time": "12:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12574, "total_steps": 17941, "loss": 1.5043, "learning_rate": 2.1165983894256647e-05, "epoch": 0.7008527952733962, "percentage": 70.09, "elapsed_time": "1 day, 5:45:52", "remaining_time": "12:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12575, "total_steps": 17941, "loss": 1.602, "learning_rate": 2.1158709858536037e-05, "epoch": 0.7009085335265592, "percentage": 70.09, "elapsed_time": "1 day, 5:46:00", "remaining_time": "12:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12576, "total_steps": 17941, "loss": 1.6733, "learning_rate": 2.115143673749299e-05, "epoch": 0.7009642717797224, "percentage": 70.1, "elapsed_time": "1 day, 5:46:09", "remaining_time": "12:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12577, "total_steps": 17941, "loss": 1.8525, "learning_rate": 2.114416453135817e-05, "epoch": 0.7010200100328856, "percentage": 70.1, "elapsed_time": "1 day, 5:46:17", "remaining_time": "12:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12578, "total_steps": 17941, "loss": 1.7004, "learning_rate": 2.1136893240362226e-05, "epoch": 0.7010757482860487, "percentage": 70.11, "elapsed_time": "1 day, 5:46:26", "remaining_time": "12:41:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12579, "total_steps": 17941, "loss": 1.5932, "learning_rate": 2.112962286473573e-05, "epoch": 0.7011314865392119, "percentage": 70.11, "elapsed_time": "1 day, 5:46:34", "remaining_time": "12:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12580, "total_steps": 17941, "loss": 1.5578, "learning_rate": 2.1122353404709274e-05, "epoch": 0.701187224792375, "percentage": 70.12, "elapsed_time": "1 day, 5:46:43", "remaining_time": "12:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12581, "total_steps": 17941, "loss": 1.8148, "learning_rate": 2.1115084860513395e-05, "epoch": 0.7012429630455381, "percentage": 70.12, "elapsed_time": "1 day, 5:46:51", "remaining_time": "12:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12582, "total_steps": 17941, "loss": 1.7272, "learning_rate": 2.1107817232378618e-05, "epoch": 0.7012987012987013, "percentage": 70.13, "elapsed_time": "1 day, 5:47:00", "remaining_time": "12:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12583, "total_steps": 17941, "loss": 1.6468, "learning_rate": 2.110055052053544e-05, "epoch": 0.7013544395518645, "percentage": 70.14, "elapsed_time": "1 day, 5:47:08", "remaining_time": "12:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12584, "total_steps": 17941, "loss": 1.5593, "learning_rate": 2.1093284725214268e-05, "epoch": 0.7014101778050276, "percentage": 70.14, "elapsed_time": "1 day, 5:47:16", "remaining_time": "12:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12585, "total_steps": 17941, "loss": 1.6528, "learning_rate": 2.1086019846645582e-05, "epoch": 0.7014659160581908, "percentage": 70.15, "elapsed_time": "1 day, 5:47:25", "remaining_time": "12:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12586, "total_steps": 17941, "loss": 1.9402, "learning_rate": 2.1078755885059786e-05, "epoch": 0.7015216543113539, "percentage": 70.15, "elapsed_time": "1 day, 5:47:33", "remaining_time": "12:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12587, "total_steps": 17941, "loss": 1.6465, "learning_rate": 2.1071492840687218e-05, "epoch": 0.701577392564517, "percentage": 70.16, "elapsed_time": "1 day, 5:47:42", "remaining_time": "12:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12588, "total_steps": 17941, "loss": 1.5343, "learning_rate": 2.1064230713758225e-05, "epoch": 0.7016331308176802, "percentage": 70.16, "elapsed_time": "1 day, 5:47:50", "remaining_time": "12:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12589, "total_steps": 17941, "loss": 1.7163, "learning_rate": 2.1056969504503134e-05, "epoch": 0.7016888690708433, "percentage": 70.17, "elapsed_time": "1 day, 5:47:59", "remaining_time": "12:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12590, "total_steps": 17941, "loss": 1.6034, "learning_rate": 2.104970921315223e-05, "epoch": 0.7017446073240065, "percentage": 70.17, "elapsed_time": "1 day, 5:48:07", "remaining_time": "12:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12591, "total_steps": 17941, "loss": 1.7492, "learning_rate": 2.1042449839935747e-05, "epoch": 0.7018003455771696, "percentage": 70.18, "elapsed_time": "1 day, 5:48:16", "remaining_time": "12:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12592, "total_steps": 17941, "loss": 1.8769, "learning_rate": 2.1035191385083895e-05, "epoch": 0.7018560838303327, "percentage": 70.19, "elapsed_time": "1 day, 5:48:24", "remaining_time": "12:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12593, "total_steps": 17941, "loss": 1.7465, "learning_rate": 2.1027933848826942e-05, "epoch": 0.7019118220834959, "percentage": 70.19, "elapsed_time": "1 day, 5:48:33", "remaining_time": "12:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12594, "total_steps": 17941, "loss": 1.7793, "learning_rate": 2.1020677231394982e-05, "epoch": 0.7019675603366591, "percentage": 70.2, "elapsed_time": "1 day, 5:48:41", "remaining_time": "12:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12595, "total_steps": 17941, "loss": 1.5743, "learning_rate": 2.1013421533018184e-05, "epoch": 0.7020232985898222, "percentage": 70.2, "elapsed_time": "1 day, 5:48:50", "remaining_time": "12:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12596, "total_steps": 17941, "loss": 1.6089, "learning_rate": 2.1006166753926648e-05, "epoch": 0.7020790368429853, "percentage": 70.21, "elapsed_time": "1 day, 5:48:58", "remaining_time": "12:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12597, "total_steps": 17941, "loss": 1.6831, "learning_rate": 2.0998912894350477e-05, "epoch": 0.7021347750961485, "percentage": 70.21, "elapsed_time": "1 day, 5:49:07", "remaining_time": "12:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12598, "total_steps": 17941, "loss": 1.787, "learning_rate": 2.0991659954519682e-05, "epoch": 0.7021905133493116, "percentage": 70.22, "elapsed_time": "1 day, 5:49:16", "remaining_time": "12:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12599, "total_steps": 17941, "loss": 1.5232, "learning_rate": 2.0984407934664287e-05, "epoch": 0.7022462516024748, "percentage": 70.22, "elapsed_time": "1 day, 5:49:24", "remaining_time": "12:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12600, "total_steps": 17941, "loss": 1.7159, "learning_rate": 2.097715683501433e-05, "epoch": 0.702301989855638, "percentage": 70.23, "elapsed_time": "1 day, 5:49:33", "remaining_time": "12:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12601, "total_steps": 17941, "loss": 1.6153, "learning_rate": 2.0969906655799732e-05, "epoch": 0.702357728108801, "percentage": 70.24, "elapsed_time": "1 day, 5:49:41", "remaining_time": "12:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12602, "total_steps": 17941, "loss": 1.5843, "learning_rate": 2.0962657397250433e-05, "epoch": 0.7024134663619642, "percentage": 70.24, "elapsed_time": "1 day, 5:49:50", "remaining_time": "12:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12603, "total_steps": 17941, "loss": 1.6255, "learning_rate": 2.0955409059596348e-05, "epoch": 0.7024692046151274, "percentage": 70.25, "elapsed_time": "1 day, 5:49:58", "remaining_time": "12:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12604, "total_steps": 17941, "loss": 1.5451, "learning_rate": 2.094816164306736e-05, "epoch": 0.7025249428682905, "percentage": 70.25, "elapsed_time": "1 day, 5:50:07", "remaining_time": "12:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12605, "total_steps": 17941, "loss": 1.4511, "learning_rate": 2.094091514789328e-05, "epoch": 0.7025806811214537, "percentage": 70.26, "elapsed_time": "1 day, 5:50:15", "remaining_time": "12:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12606, "total_steps": 17941, "loss": 1.5672, "learning_rate": 2.093366957430395e-05, "epoch": 0.7026364193746168, "percentage": 70.26, "elapsed_time": "1 day, 5:50:24", "remaining_time": "12:37:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12607, "total_steps": 17941, "loss": 1.636, "learning_rate": 2.092642492252915e-05, "epoch": 0.7026921576277799, "percentage": 70.27, "elapsed_time": "1 day, 5:50:32", "remaining_time": "12:37:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12608, "total_steps": 17941, "loss": 1.7725, "learning_rate": 2.0919181192798644e-05, "epoch": 0.7027478958809431, "percentage": 70.27, "elapsed_time": "1 day, 5:50:40", "remaining_time": "12:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12609, "total_steps": 17941, "loss": 1.467, "learning_rate": 2.091193838534217e-05, "epoch": 0.7028036341341063, "percentage": 70.28, "elapsed_time": "1 day, 5:50:49", "remaining_time": "12:37:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12610, "total_steps": 17941, "loss": 1.5876, "learning_rate": 2.090469650038938e-05, "epoch": 0.7028593723872694, "percentage": 70.29, "elapsed_time": "1 day, 5:50:57", "remaining_time": "12:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12611, "total_steps": 17941, "loss": 1.698, "learning_rate": 2.089745553817e-05, "epoch": 0.7029151106404325, "percentage": 70.29, "elapsed_time": "1 day, 5:51:06", "remaining_time": "12:37:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12612, "total_steps": 17941, "loss": 1.5782, "learning_rate": 2.0890215498913668e-05, "epoch": 0.7029708488935956, "percentage": 70.3, "elapsed_time": "1 day, 5:51:14", "remaining_time": "12:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12613, "total_steps": 17941, "loss": 1.7965, "learning_rate": 2.0882976382849962e-05, "epoch": 0.7030265871467588, "percentage": 70.3, "elapsed_time": "1 day, 5:51:23", "remaining_time": "12:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12614, "total_steps": 17941, "loss": 1.6878, "learning_rate": 2.0875738190208483e-05, "epoch": 0.703082325399922, "percentage": 70.31, "elapsed_time": "1 day, 5:51:32", "remaining_time": "12:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12615, "total_steps": 17941, "loss": 1.5877, "learning_rate": 2.0868500921218775e-05, "epoch": 0.7031380636530851, "percentage": 70.31, "elapsed_time": "1 day, 5:51:40", "remaining_time": "12:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12616, "total_steps": 17941, "loss": 1.54, "learning_rate": 2.0861264576110395e-05, "epoch": 0.7031938019062483, "percentage": 70.32, "elapsed_time": "1 day, 5:51:49", "remaining_time": "12:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12617, "total_steps": 17941, "loss": 1.9004, "learning_rate": 2.085402915511277e-05, "epoch": 0.7032495401594114, "percentage": 70.32, "elapsed_time": "1 day, 5:51:57", "remaining_time": "12:36:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12618, "total_steps": 17941, "loss": 1.7008, "learning_rate": 2.0846794658455433e-05, "epoch": 0.7033052784125745, "percentage": 70.33, "elapsed_time": "1 day, 5:52:06", "remaining_time": "12:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12619, "total_steps": 17941, "loss": 1.6724, "learning_rate": 2.0839561086367802e-05, "epoch": 0.7033610166657377, "percentage": 70.34, "elapsed_time": "1 day, 5:52:14", "remaining_time": "12:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12620, "total_steps": 17941, "loss": 1.4036, "learning_rate": 2.0832328439079268e-05, "epoch": 0.7034167549189009, "percentage": 70.34, "elapsed_time": "1 day, 5:52:23", "remaining_time": "12:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12621, "total_steps": 17941, "loss": 1.6769, "learning_rate": 2.082509671681921e-05, "epoch": 0.703472493172064, "percentage": 70.35, "elapsed_time": "1 day, 5:52:31", "remaining_time": "12:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12622, "total_steps": 17941, "loss": 1.7971, "learning_rate": 2.0817865919816988e-05, "epoch": 0.7035282314252271, "percentage": 70.35, "elapsed_time": "1 day, 5:52:40", "remaining_time": "12:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12623, "total_steps": 17941, "loss": 1.7429, "learning_rate": 2.081063604830193e-05, "epoch": 0.7035839696783903, "percentage": 70.36, "elapsed_time": "1 day, 5:52:48", "remaining_time": "12:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12624, "total_steps": 17941, "loss": 1.6767, "learning_rate": 2.0803407102503293e-05, "epoch": 0.7036397079315534, "percentage": 70.36, "elapsed_time": "1 day, 5:52:56", "remaining_time": "12:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12625, "total_steps": 17941, "loss": 1.8749, "learning_rate": 2.0796179082650336e-05, "epoch": 0.7036954461847166, "percentage": 70.37, "elapsed_time": "1 day, 5:53:06", "remaining_time": "12:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12626, "total_steps": 17941, "loss": 1.6783, "learning_rate": 2.0788951988972345e-05, "epoch": 0.7037511844378798, "percentage": 70.38, "elapsed_time": "1 day, 5:53:14", "remaining_time": "12:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12627, "total_steps": 17941, "loss": 1.3523, "learning_rate": 2.0781725821698466e-05, "epoch": 0.7038069226910428, "percentage": 70.38, "elapsed_time": "1 day, 5:53:23", "remaining_time": "12:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12628, "total_steps": 17941, "loss": 1.5957, "learning_rate": 2.0774500581057892e-05, "epoch": 0.703862660944206, "percentage": 70.39, "elapsed_time": "1 day, 5:53:31", "remaining_time": "12:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12629, "total_steps": 17941, "loss": 1.7849, "learning_rate": 2.076727626727976e-05, "epoch": 0.7039183991973692, "percentage": 70.39, "elapsed_time": "1 day, 5:53:40", "remaining_time": "12:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12630, "total_steps": 17941, "loss": 1.7172, "learning_rate": 2.0760052880593213e-05, "epoch": 0.7039741374505323, "percentage": 70.4, "elapsed_time": "1 day, 5:53:48", "remaining_time": "12:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12631, "total_steps": 17941, "loss": 1.72, "learning_rate": 2.0752830421227277e-05, "epoch": 0.7040298757036955, "percentage": 70.4, "elapsed_time": "1 day, 5:53:57", "remaining_time": "12:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12632, "total_steps": 17941, "loss": 1.5975, "learning_rate": 2.0745608889411044e-05, "epoch": 0.7040856139568586, "percentage": 70.41, "elapsed_time": "1 day, 5:54:05", "remaining_time": "12:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12633, "total_steps": 17941, "loss": 1.6038, "learning_rate": 2.0738388285373533e-05, "epoch": 0.7041413522100217, "percentage": 70.41, "elapsed_time": "1 day, 5:54:13", "remaining_time": "12:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12634, "total_steps": 17941, "loss": 1.5777, "learning_rate": 2.0731168609343737e-05, "epoch": 0.7041970904631849, "percentage": 70.42, "elapsed_time": "1 day, 5:54:22", "remaining_time": "12:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12635, "total_steps": 17941, "loss": 1.7384, "learning_rate": 2.072394986155064e-05, "epoch": 0.704252828716348, "percentage": 70.43, "elapsed_time": "1 day, 5:54:30", "remaining_time": "12:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12636, "total_steps": 17941, "loss": 1.5779, "learning_rate": 2.071673204222313e-05, "epoch": 0.7043085669695112, "percentage": 70.43, "elapsed_time": "1 day, 5:54:39", "remaining_time": "12:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12637, "total_steps": 17941, "loss": 1.6983, "learning_rate": 2.070951515159016e-05, "epoch": 0.7043643052226743, "percentage": 70.44, "elapsed_time": "1 day, 5:54:48", "remaining_time": "12:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12638, "total_steps": 17941, "loss": 1.8005, "learning_rate": 2.0702299189880613e-05, "epoch": 0.7044200434758374, "percentage": 70.44, "elapsed_time": "1 day, 5:54:56", "remaining_time": "12:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12639, "total_steps": 17941, "loss": 1.5594, "learning_rate": 2.0695084157323303e-05, "epoch": 0.7044757817290006, "percentage": 70.45, "elapsed_time": "1 day, 5:55:05", "remaining_time": "12:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12640, "total_steps": 17941, "loss": 1.7295, "learning_rate": 2.0687870054147062e-05, "epoch": 0.7045315199821638, "percentage": 70.45, "elapsed_time": "1 day, 5:55:13", "remaining_time": "12:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12641, "total_steps": 17941, "loss": 1.7237, "learning_rate": 2.068065688058068e-05, "epoch": 0.7045872582353269, "percentage": 70.46, "elapsed_time": "1 day, 5:55:22", "remaining_time": "12:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12642, "total_steps": 17941, "loss": 1.3802, "learning_rate": 2.067344463685294e-05, "epoch": 0.70464299648849, "percentage": 70.46, "elapsed_time": "1 day, 5:55:30", "remaining_time": "12:32:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12643, "total_steps": 17941, "loss": 1.6697, "learning_rate": 2.0666233323192515e-05, "epoch": 0.7046987347416532, "percentage": 70.47, "elapsed_time": "1 day, 5:55:39", "remaining_time": "12:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12644, "total_steps": 17941, "loss": 1.604, "learning_rate": 2.0659022939828154e-05, "epoch": 0.7047544729948163, "percentage": 70.48, "elapsed_time": "1 day, 5:55:47", "remaining_time": "12:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12645, "total_steps": 17941, "loss": 1.7428, "learning_rate": 2.0651813486988535e-05, "epoch": 0.7048102112479795, "percentage": 70.48, "elapsed_time": "1 day, 5:55:56", "remaining_time": "12:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12646, "total_steps": 17941, "loss": 1.7455, "learning_rate": 2.0644604964902264e-05, "epoch": 0.7048659495011427, "percentage": 70.49, "elapsed_time": "1 day, 5:56:04", "remaining_time": "12:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12647, "total_steps": 17941, "loss": 1.5011, "learning_rate": 2.063739737379797e-05, "epoch": 0.7049216877543057, "percentage": 70.49, "elapsed_time": "1 day, 5:56:13", "remaining_time": "12:31:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12648, "total_steps": 17941, "loss": 1.7493, "learning_rate": 2.063019071390423e-05, "epoch": 0.7049774260074689, "percentage": 70.5, "elapsed_time": "1 day, 5:56:21", "remaining_time": "12:31:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12649, "total_steps": 17941, "loss": 1.741, "learning_rate": 2.062298498544963e-05, "epoch": 0.7050331642606321, "percentage": 70.5, "elapsed_time": "1 day, 5:56:30", "remaining_time": "12:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12650, "total_steps": 17941, "loss": 1.6665, "learning_rate": 2.0615780188662642e-05, "epoch": 0.7050889025137952, "percentage": 70.51, "elapsed_time": "1 day, 5:56:38", "remaining_time": "12:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12651, "total_steps": 17941, "loss": 1.4688, "learning_rate": 2.0608576323771767e-05, "epoch": 0.7051446407669584, "percentage": 70.51, "elapsed_time": "1 day, 5:56:46", "remaining_time": "12:31:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12652, "total_steps": 17941, "loss": 1.584, "learning_rate": 2.0601373391005525e-05, "epoch": 0.7052003790201216, "percentage": 70.52, "elapsed_time": "1 day, 5:56:55", "remaining_time": "12:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12653, "total_steps": 17941, "loss": 1.729, "learning_rate": 2.0594171390592294e-05, "epoch": 0.7052561172732846, "percentage": 70.53, "elapsed_time": "1 day, 5:57:03", "remaining_time": "12:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12654, "total_steps": 17941, "loss": 1.7496, "learning_rate": 2.0586970322760498e-05, "epoch": 0.7053118555264478, "percentage": 70.53, "elapsed_time": "1 day, 5:57:12", "remaining_time": "12:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12655, "total_steps": 17941, "loss": 1.5804, "learning_rate": 2.057977018773851e-05, "epoch": 0.705367593779611, "percentage": 70.54, "elapsed_time": "1 day, 5:57:20", "remaining_time": "12:30:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12656, "total_steps": 17941, "loss": 1.5512, "learning_rate": 2.057257098575471e-05, "epoch": 0.7054233320327741, "percentage": 70.54, "elapsed_time": "1 day, 5:57:29", "remaining_time": "12:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12657, "total_steps": 17941, "loss": 1.7573, "learning_rate": 2.0565372717037356e-05, "epoch": 0.7054790702859373, "percentage": 70.55, "elapsed_time": "1 day, 5:57:37", "remaining_time": "12:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12658, "total_steps": 17941, "loss": 1.9962, "learning_rate": 2.0558175381814766e-05, "epoch": 0.7055348085391003, "percentage": 70.55, "elapsed_time": "1 day, 5:57:45", "remaining_time": "12:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12659, "total_steps": 17941, "loss": 1.6104, "learning_rate": 2.0550978980315194e-05, "epoch": 0.7055905467922635, "percentage": 70.56, "elapsed_time": "1 day, 5:57:54", "remaining_time": "12:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12660, "total_steps": 17941, "loss": 1.6372, "learning_rate": 2.0543783512766873e-05, "epoch": 0.7056462850454267, "percentage": 70.56, "elapsed_time": "1 day, 5:58:03", "remaining_time": "12:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12661, "total_steps": 17941, "loss": 1.5143, "learning_rate": 2.0536588979398013e-05, "epoch": 0.7057020232985898, "percentage": 70.57, "elapsed_time": "1 day, 5:58:11", "remaining_time": "12:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12662, "total_steps": 17941, "loss": 1.7892, "learning_rate": 2.0529395380436727e-05, "epoch": 0.705757761551753, "percentage": 70.58, "elapsed_time": "1 day, 5:58:20", "remaining_time": "12:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12663, "total_steps": 17941, "loss": 1.6492, "learning_rate": 2.052220271611124e-05, "epoch": 0.7058134998049161, "percentage": 70.58, "elapsed_time": "1 day, 5:58:28", "remaining_time": "12:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12664, "total_steps": 17941, "loss": 1.6053, "learning_rate": 2.051501098664959e-05, "epoch": 0.7058692380580792, "percentage": 70.59, "elapsed_time": "1 day, 5:58:37", "remaining_time": "12:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12665, "total_steps": 17941, "loss": 1.475, "learning_rate": 2.050782019227988e-05, "epoch": 0.7059249763112424, "percentage": 70.59, "elapsed_time": "1 day, 5:58:45", "remaining_time": "12:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12666, "total_steps": 17941, "loss": 1.7296, "learning_rate": 2.0500630333230168e-05, "epoch": 0.7059807145644056, "percentage": 70.6, "elapsed_time": "1 day, 5:58:54", "remaining_time": "12:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12667, "total_steps": 17941, "loss": 1.7089, "learning_rate": 2.0493441409728466e-05, "epoch": 0.7060364528175687, "percentage": 70.6, "elapsed_time": "1 day, 5:59:02", "remaining_time": "12:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12668, "total_steps": 17941, "loss": 1.5953, "learning_rate": 2.0486253422002784e-05, "epoch": 0.7060921910707318, "percentage": 70.61, "elapsed_time": "1 day, 5:59:11", "remaining_time": "12:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12669, "total_steps": 17941, "loss": 1.7162, "learning_rate": 2.047906637028103e-05, "epoch": 0.706147929323895, "percentage": 70.61, "elapsed_time": "1 day, 5:59:19", "remaining_time": "12:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12670, "total_steps": 17941, "loss": 1.5502, "learning_rate": 2.047188025479119e-05, "epoch": 0.7062036675770581, "percentage": 70.62, "elapsed_time": "1 day, 5:59:28", "remaining_time": "12:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12671, "total_steps": 17941, "loss": 1.9175, "learning_rate": 2.046469507576117e-05, "epoch": 0.7062594058302213, "percentage": 70.63, "elapsed_time": "1 day, 5:59:36", "remaining_time": "12:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12672, "total_steps": 17941, "loss": 1.6203, "learning_rate": 2.0457510833418796e-05, "epoch": 0.7063151440833845, "percentage": 70.63, "elapsed_time": "1 day, 5:59:45", "remaining_time": "12:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12673, "total_steps": 17941, "loss": 1.7017, "learning_rate": 2.045032752799194e-05, "epoch": 0.7063708823365475, "percentage": 70.64, "elapsed_time": "1 day, 5:59:53", "remaining_time": "12:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12674, "total_steps": 17941, "loss": 1.7859, "learning_rate": 2.0443145159708405e-05, "epoch": 0.7064266205897107, "percentage": 70.64, "elapsed_time": "1 day, 6:00:02", "remaining_time": "12:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12675, "total_steps": 17941, "loss": 1.7632, "learning_rate": 2.0435963728795992e-05, "epoch": 0.7064823588428739, "percentage": 70.65, "elapsed_time": "1 day, 6:00:10", "remaining_time": "12:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12676, "total_steps": 17941, "loss": 1.5312, "learning_rate": 2.0428783235482424e-05, "epoch": 0.706538097096037, "percentage": 70.65, "elapsed_time": "1 day, 6:00:19", "remaining_time": "12:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12677, "total_steps": 17941, "loss": 1.5461, "learning_rate": 2.042160367999542e-05, "epoch": 0.7065938353492002, "percentage": 70.66, "elapsed_time": "1 day, 6:00:27", "remaining_time": "12:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12678, "total_steps": 17941, "loss": 1.7262, "learning_rate": 2.041442506256273e-05, "epoch": 0.7066495736023634, "percentage": 70.66, "elapsed_time": "1 day, 6:00:36", "remaining_time": "12:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12679, "total_steps": 17941, "loss": 1.7994, "learning_rate": 2.0407247383411966e-05, "epoch": 0.7067053118555264, "percentage": 70.67, "elapsed_time": "1 day, 6:00:44", "remaining_time": "12:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12680, "total_steps": 17941, "loss": 1.7502, "learning_rate": 2.0400070642770775e-05, "epoch": 0.7067610501086896, "percentage": 70.68, "elapsed_time": "1 day, 6:00:52", "remaining_time": "12:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12681, "total_steps": 17941, "loss": 1.8929, "learning_rate": 2.0392894840866767e-05, "epoch": 0.7068167883618527, "percentage": 70.68, "elapsed_time": "1 day, 6:01:01", "remaining_time": "12:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12682, "total_steps": 17941, "loss": 1.8354, "learning_rate": 2.0385719977927526e-05, "epoch": 0.7068725266150159, "percentage": 70.69, "elapsed_time": "1 day, 6:01:09", "remaining_time": "12:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12683, "total_steps": 17941, "loss": 1.7345, "learning_rate": 2.0378546054180568e-05, "epoch": 0.7069282648681791, "percentage": 70.69, "elapsed_time": "1 day, 6:01:18", "remaining_time": "12:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12684, "total_steps": 17941, "loss": 1.9439, "learning_rate": 2.0371373069853424e-05, "epoch": 0.7069840031213421, "percentage": 70.7, "elapsed_time": "1 day, 6:01:27", "remaining_time": "12:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12685, "total_steps": 17941, "loss": 1.5638, "learning_rate": 2.036420102517358e-05, "epoch": 0.7070397413745053, "percentage": 70.7, "elapsed_time": "1 day, 6:01:35", "remaining_time": "12:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12686, "total_steps": 17941, "loss": 1.5163, "learning_rate": 2.035702992036849e-05, "epoch": 0.7070954796276685, "percentage": 70.71, "elapsed_time": "1 day, 6:01:44", "remaining_time": "12:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12687, "total_steps": 17941, "loss": 1.6277, "learning_rate": 2.0349859755665595e-05, "epoch": 0.7071512178808316, "percentage": 70.72, "elapsed_time": "1 day, 6:01:52", "remaining_time": "12:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12688, "total_steps": 17941, "loss": 1.4882, "learning_rate": 2.0342690531292248e-05, "epoch": 0.7072069561339948, "percentage": 70.72, "elapsed_time": "1 day, 6:02:01", "remaining_time": "12:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12689, "total_steps": 17941, "loss": 1.611, "learning_rate": 2.0335522247475874e-05, "epoch": 0.7072626943871579, "percentage": 70.73, "elapsed_time": "1 day, 6:02:09", "remaining_time": "12:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12690, "total_steps": 17941, "loss": 1.8073, "learning_rate": 2.0328354904443764e-05, "epoch": 0.707318432640321, "percentage": 70.73, "elapsed_time": "1 day, 6:02:17", "remaining_time": "12:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12691, "total_steps": 17941, "loss": 1.6561, "learning_rate": 2.0321188502423232e-05, "epoch": 0.7073741708934842, "percentage": 70.74, "elapsed_time": "1 day, 6:02:27", "remaining_time": "12:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12692, "total_steps": 17941, "loss": 1.7064, "learning_rate": 2.0314023041641568e-05, "epoch": 0.7074299091466474, "percentage": 70.74, "elapsed_time": "1 day, 6:02:35", "remaining_time": "12:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12693, "total_steps": 17941, "loss": 1.511, "learning_rate": 2.030685852232601e-05, "epoch": 0.7074856473998105, "percentage": 70.75, "elapsed_time": "1 day, 6:02:43", "remaining_time": "12:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12694, "total_steps": 17941, "loss": 1.4849, "learning_rate": 2.0299694944703796e-05, "epoch": 0.7075413856529736, "percentage": 70.75, "elapsed_time": "1 day, 6:02:53", "remaining_time": "12:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12695, "total_steps": 17941, "loss": 1.5751, "learning_rate": 2.0292532309002054e-05, "epoch": 0.7075971239061368, "percentage": 70.76, "elapsed_time": "1 day, 6:03:01", "remaining_time": "12:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12696, "total_steps": 17941, "loss": 1.5558, "learning_rate": 2.0285370615448002e-05, "epoch": 0.7076528621592999, "percentage": 70.77, "elapsed_time": "1 day, 6:03:10", "remaining_time": "12:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12697, "total_steps": 17941, "loss": 1.3527, "learning_rate": 2.027820986426876e-05, "epoch": 0.7077086004124631, "percentage": 70.77, "elapsed_time": "1 day, 6:03:18", "remaining_time": "12:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12698, "total_steps": 17941, "loss": 1.4686, "learning_rate": 2.0271050055691393e-05, "epoch": 0.7077643386656263, "percentage": 70.78, "elapsed_time": "1 day, 6:03:27", "remaining_time": "12:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12699, "total_steps": 17941, "loss": 1.6368, "learning_rate": 2.026389118994299e-05, "epoch": 0.7078200769187893, "percentage": 70.78, "elapsed_time": "1 day, 6:03:35", "remaining_time": "12:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12700, "total_steps": 17941, "loss": 1.6877, "learning_rate": 2.0256733267250583e-05, "epoch": 0.7078758151719525, "percentage": 70.79, "elapsed_time": "1 day, 6:03:44", "remaining_time": "12:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12701, "total_steps": 17941, "loss": 1.5749, "learning_rate": 2.02495762878412e-05, "epoch": 0.7079315534251157, "percentage": 70.79, "elapsed_time": "1 day, 6:03:52", "remaining_time": "12:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12702, "total_steps": 17941, "loss": 1.5247, "learning_rate": 2.024242025194178e-05, "epoch": 0.7079872916782788, "percentage": 70.8, "elapsed_time": "1 day, 6:04:00", "remaining_time": "12:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12703, "total_steps": 17941, "loss": 1.7531, "learning_rate": 2.0235265159779277e-05, "epoch": 0.708043029931442, "percentage": 70.8, "elapsed_time": "1 day, 6:04:09", "remaining_time": "12:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12704, "total_steps": 17941, "loss": 1.7212, "learning_rate": 2.022811101158066e-05, "epoch": 0.708098768184605, "percentage": 70.81, "elapsed_time": "1 day, 6:04:18", "remaining_time": "12:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12705, "total_steps": 17941, "loss": 1.6991, "learning_rate": 2.0220957807572756e-05, "epoch": 0.7081545064377682, "percentage": 70.82, "elapsed_time": "1 day, 6:04:26", "remaining_time": "12:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12706, "total_steps": 17941, "loss": 1.6026, "learning_rate": 2.0213805547982446e-05, "epoch": 0.7082102446909314, "percentage": 70.82, "elapsed_time": "1 day, 6:04:36", "remaining_time": "12:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12707, "total_steps": 17941, "loss": 1.8268, "learning_rate": 2.020665423303656e-05, "epoch": 0.7082659829440945, "percentage": 70.83, "elapsed_time": "1 day, 6:04:44", "remaining_time": "12:23:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12708, "total_steps": 17941, "loss": 1.6651, "learning_rate": 2.0199503862961917e-05, "epoch": 0.7083217211972577, "percentage": 70.83, "elapsed_time": "1 day, 6:04:52", "remaining_time": "12:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12709, "total_steps": 17941, "loss": 1.6086, "learning_rate": 2.019235443798524e-05, "epoch": 0.7083774594504209, "percentage": 70.84, "elapsed_time": "1 day, 6:05:01", "remaining_time": "12:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12710, "total_steps": 17941, "loss": 1.6118, "learning_rate": 2.0185205958333275e-05, "epoch": 0.7084331977035839, "percentage": 70.84, "elapsed_time": "1 day, 6:05:09", "remaining_time": "12:22:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12711, "total_steps": 17941, "loss": 1.6655, "learning_rate": 2.0178058424232776e-05, "epoch": 0.7084889359567471, "percentage": 70.85, "elapsed_time": "1 day, 6:05:18", "remaining_time": "12:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12712, "total_steps": 17941, "loss": 1.4887, "learning_rate": 2.017091183591037e-05, "epoch": 0.7085446742099103, "percentage": 70.85, "elapsed_time": "1 day, 6:05:26", "remaining_time": "12:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12713, "total_steps": 17941, "loss": 1.7438, "learning_rate": 2.0163766193592753e-05, "epoch": 0.7086004124630734, "percentage": 70.86, "elapsed_time": "1 day, 6:05:35", "remaining_time": "12:22:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12714, "total_steps": 17941, "loss": 1.4655, "learning_rate": 2.0156621497506472e-05, "epoch": 0.7086561507162366, "percentage": 70.87, "elapsed_time": "1 day, 6:05:43", "remaining_time": "12:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12715, "total_steps": 17941, "loss": 1.6594, "learning_rate": 2.0149477747878194e-05, "epoch": 0.7087118889693997, "percentage": 70.87, "elapsed_time": "1 day, 6:05:52", "remaining_time": "12:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12716, "total_steps": 17941, "loss": 1.583, "learning_rate": 2.0142334944934426e-05, "epoch": 0.7087676272225628, "percentage": 70.88, "elapsed_time": "1 day, 6:06:00", "remaining_time": "12:22:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12717, "total_steps": 17941, "loss": 1.5247, "learning_rate": 2.013519308890171e-05, "epoch": 0.708823365475726, "percentage": 70.88, "elapsed_time": "1 day, 6:06:09", "remaining_time": "12:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12718, "total_steps": 17941, "loss": 1.6722, "learning_rate": 2.0128052180006546e-05, "epoch": 0.7088791037288892, "percentage": 70.89, "elapsed_time": "1 day, 6:06:17", "remaining_time": "12:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12719, "total_steps": 17941, "loss": 1.6948, "learning_rate": 2.0120912218475396e-05, "epoch": 0.7089348419820523, "percentage": 70.89, "elapsed_time": "1 day, 6:06:26", "remaining_time": "12:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12720, "total_steps": 17941, "loss": 1.6412, "learning_rate": 2.011377320453473e-05, "epoch": 0.7089905802352154, "percentage": 70.9, "elapsed_time": "1 day, 6:06:34", "remaining_time": "12:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12721, "total_steps": 17941, "loss": 1.6345, "learning_rate": 2.0106635138410883e-05, "epoch": 0.7090463184883786, "percentage": 70.9, "elapsed_time": "1 day, 6:06:42", "remaining_time": "12:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12722, "total_steps": 17941, "loss": 1.6459, "learning_rate": 2.0099498020330303e-05, "epoch": 0.7091020567415417, "percentage": 70.91, "elapsed_time": "1 day, 6:06:52", "remaining_time": "12:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12723, "total_steps": 17941, "loss": 1.5565, "learning_rate": 2.0092361850519336e-05, "epoch": 0.7091577949947049, "percentage": 70.92, "elapsed_time": "1 day, 6:07:00", "remaining_time": "12:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12724, "total_steps": 17941, "loss": 1.6026, "learning_rate": 2.0085226629204256e-05, "epoch": 0.7092135332478681, "percentage": 70.92, "elapsed_time": "1 day, 6:07:09", "remaining_time": "12:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12725, "total_steps": 17941, "loss": 1.6818, "learning_rate": 2.0078092356611372e-05, "epoch": 0.7092692715010311, "percentage": 70.93, "elapsed_time": "1 day, 6:07:17", "remaining_time": "12:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12726, "total_steps": 17941, "loss": 1.6622, "learning_rate": 2.0070959032966942e-05, "epoch": 0.7093250097541943, "percentage": 70.93, "elapsed_time": "1 day, 6:07:26", "remaining_time": "12:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12727, "total_steps": 17941, "loss": 1.8945, "learning_rate": 2.0063826658497203e-05, "epoch": 0.7093807480073574, "percentage": 70.94, "elapsed_time": "1 day, 6:07:35", "remaining_time": "12:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12728, "total_steps": 17941, "loss": 1.4223, "learning_rate": 2.0056695233428335e-05, "epoch": 0.7094364862605206, "percentage": 70.94, "elapsed_time": "1 day, 6:07:43", "remaining_time": "12:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12729, "total_steps": 17941, "loss": 1.5615, "learning_rate": 2.0049564757986488e-05, "epoch": 0.7094922245136838, "percentage": 70.95, "elapsed_time": "1 day, 6:07:52", "remaining_time": "12:20:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12730, "total_steps": 17941, "loss": 1.9871, "learning_rate": 2.0042435232397867e-05, "epoch": 0.7095479627668468, "percentage": 70.95, "elapsed_time": "1 day, 6:08:00", "remaining_time": "12:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12731, "total_steps": 17941, "loss": 1.4064, "learning_rate": 2.0035306656888515e-05, "epoch": 0.70960370102001, "percentage": 70.96, "elapsed_time": "1 day, 6:08:09", "remaining_time": "12:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12732, "total_steps": 17941, "loss": 1.6376, "learning_rate": 2.0028179031684523e-05, "epoch": 0.7096594392731732, "percentage": 70.97, "elapsed_time": "1 day, 6:08:17", "remaining_time": "12:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12733, "total_steps": 17941, "loss": 1.7685, "learning_rate": 2.002105235701195e-05, "epoch": 0.7097151775263363, "percentage": 70.97, "elapsed_time": "1 day, 6:08:25", "remaining_time": "12:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12734, "total_steps": 17941, "loss": 1.6685, "learning_rate": 2.0013926633096825e-05, "epoch": 0.7097709157794995, "percentage": 70.98, "elapsed_time": "1 day, 6:08:34", "remaining_time": "12:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12735, "total_steps": 17941, "loss": 1.5448, "learning_rate": 2.0006801860165098e-05, "epoch": 0.7098266540326627, "percentage": 70.98, "elapsed_time": "1 day, 6:08:43", "remaining_time": "12:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12736, "total_steps": 17941, "loss": 1.8328, "learning_rate": 1.9999678038442727e-05, "epoch": 0.7098823922858257, "percentage": 70.99, "elapsed_time": "1 day, 6:08:51", "remaining_time": "12:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12737, "total_steps": 17941, "loss": 1.3826, "learning_rate": 1.9992555168155687e-05, "epoch": 0.7099381305389889, "percentage": 70.99, "elapsed_time": "1 day, 6:09:00", "remaining_time": "12:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12738, "total_steps": 17941, "loss": 1.4891, "learning_rate": 1.998543324952982e-05, "epoch": 0.7099938687921521, "percentage": 71.0, "elapsed_time": "1 day, 6:09:08", "remaining_time": "12:18:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12739, "total_steps": 17941, "loss": 1.6531, "learning_rate": 1.997831228279104e-05, "epoch": 0.7100496070453152, "percentage": 71.0, "elapsed_time": "1 day, 6:09:17", "remaining_time": "12:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12740, "total_steps": 17941, "loss": 1.7154, "learning_rate": 1.9971192268165116e-05, "epoch": 0.7101053452984784, "percentage": 71.01, "elapsed_time": "1 day, 6:09:25", "remaining_time": "12:18:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12741, "total_steps": 17941, "loss": 1.5835, "learning_rate": 1.9964073205877924e-05, "epoch": 0.7101610835516415, "percentage": 71.02, "elapsed_time": "1 day, 6:09:33", "remaining_time": "12:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12742, "total_steps": 17941, "loss": 1.8135, "learning_rate": 1.99569550961552e-05, "epoch": 0.7102168218048046, "percentage": 71.02, "elapsed_time": "1 day, 6:09:42", "remaining_time": "12:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12743, "total_steps": 17941, "loss": 1.6409, "learning_rate": 1.9949837939222693e-05, "epoch": 0.7102725600579678, "percentage": 71.03, "elapsed_time": "1 day, 6:09:50", "remaining_time": "12:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12744, "total_steps": 17941, "loss": 1.0639, "learning_rate": 1.994272173530612e-05, "epoch": 0.710328298311131, "percentage": 71.03, "elapsed_time": "1 day, 6:09:59", "remaining_time": "12:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12745, "total_steps": 17941, "loss": 1.7668, "learning_rate": 1.993560648463117e-05, "epoch": 0.710384036564294, "percentage": 71.04, "elapsed_time": "1 day, 6:10:07", "remaining_time": "12:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12746, "total_steps": 17941, "loss": 1.4886, "learning_rate": 1.9928492187423514e-05, "epoch": 0.7104397748174572, "percentage": 71.04, "elapsed_time": "1 day, 6:10:16", "remaining_time": "12:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12747, "total_steps": 17941, "loss": 1.9898, "learning_rate": 1.9921378843908716e-05, "epoch": 0.7104955130706204, "percentage": 71.05, "elapsed_time": "1 day, 6:10:24", "remaining_time": "12:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12748, "total_steps": 17941, "loss": 1.6636, "learning_rate": 1.991426645431243e-05, "epoch": 0.7105512513237835, "percentage": 71.06, "elapsed_time": "1 day, 6:10:33", "remaining_time": "12:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12749, "total_steps": 17941, "loss": 1.6165, "learning_rate": 1.9907155018860217e-05, "epoch": 0.7106069895769467, "percentage": 71.06, "elapsed_time": "1 day, 6:10:41", "remaining_time": "12:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12750, "total_steps": 17941, "loss": 1.6894, "learning_rate": 1.9900044537777586e-05, "epoch": 0.7106627278301098, "percentage": 71.07, "elapsed_time": "1 day, 6:10:49", "remaining_time": "12:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12751, "total_steps": 17941, "loss": 1.4837, "learning_rate": 1.9892935011290037e-05, "epoch": 0.7107184660832729, "percentage": 71.07, "elapsed_time": "1 day, 6:10:58", "remaining_time": "12:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12752, "total_steps": 17941, "loss": 1.6393, "learning_rate": 1.9885826439623052e-05, "epoch": 0.7107742043364361, "percentage": 71.08, "elapsed_time": "1 day, 6:11:06", "remaining_time": "12:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12753, "total_steps": 17941, "loss": 1.6043, "learning_rate": 1.9878718823002097e-05, "epoch": 0.7108299425895992, "percentage": 71.08, "elapsed_time": "1 day, 6:11:15", "remaining_time": "12:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12754, "total_steps": 17941, "loss": 1.6273, "learning_rate": 1.9871612161652542e-05, "epoch": 0.7108856808427624, "percentage": 71.09, "elapsed_time": "1 day, 6:11:23", "remaining_time": "12:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12755, "total_steps": 17941, "loss": 1.6094, "learning_rate": 1.9864506455799768e-05, "epoch": 0.7109414190959256, "percentage": 71.09, "elapsed_time": "1 day, 6:11:32", "remaining_time": "12:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12756, "total_steps": 17941, "loss": 1.7298, "learning_rate": 1.9857401705669186e-05, "epoch": 0.7109971573490886, "percentage": 71.1, "elapsed_time": "1 day, 6:11:41", "remaining_time": "12:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12757, "total_steps": 17941, "loss": 1.649, "learning_rate": 1.9850297911486067e-05, "epoch": 0.7110528956022518, "percentage": 71.11, "elapsed_time": "1 day, 6:11:49", "remaining_time": "12:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12758, "total_steps": 17941, "loss": 1.4049, "learning_rate": 1.98431950734757e-05, "epoch": 0.711108633855415, "percentage": 71.11, "elapsed_time": "1 day, 6:11:58", "remaining_time": "12:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12759, "total_steps": 17941, "loss": 1.5951, "learning_rate": 1.983609319186337e-05, "epoch": 0.7111643721085781, "percentage": 71.12, "elapsed_time": "1 day, 6:12:06", "remaining_time": "12:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12760, "total_steps": 17941, "loss": 1.7238, "learning_rate": 1.982899226687431e-05, "epoch": 0.7112201103617413, "percentage": 71.12, "elapsed_time": "1 day, 6:12:15", "remaining_time": "12:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12761, "total_steps": 17941, "loss": 1.7273, "learning_rate": 1.9821892298733686e-05, "epoch": 0.7112758486149044, "percentage": 71.13, "elapsed_time": "1 day, 6:12:23", "remaining_time": "12:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12762, "total_steps": 17941, "loss": 1.7202, "learning_rate": 1.9814793287666673e-05, "epoch": 0.7113315868680675, "percentage": 71.13, "elapsed_time": "1 day, 6:12:32", "remaining_time": "12:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12763, "total_steps": 17941, "loss": 1.6107, "learning_rate": 1.9807695233898455e-05, "epoch": 0.7113873251212307, "percentage": 71.14, "elapsed_time": "1 day, 6:12:40", "remaining_time": "12:15:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12764, "total_steps": 17941, "loss": 1.5467, "learning_rate": 1.98005981376541e-05, "epoch": 0.7114430633743939, "percentage": 71.14, "elapsed_time": "1 day, 6:12:48", "remaining_time": "12:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12765, "total_steps": 17941, "loss": 1.7664, "learning_rate": 1.9793501999158708e-05, "epoch": 0.711498801627557, "percentage": 71.15, "elapsed_time": "1 day, 6:12:57", "remaining_time": "12:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12766, "total_steps": 17941, "loss": 1.6013, "learning_rate": 1.9786406818637286e-05, "epoch": 0.7115545398807201, "percentage": 71.16, "elapsed_time": "1 day, 6:13:05", "remaining_time": "12:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12767, "total_steps": 17941, "loss": 1.4807, "learning_rate": 1.977931259631492e-05, "epoch": 0.7116102781338833, "percentage": 71.16, "elapsed_time": "1 day, 6:13:14", "remaining_time": "12:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12768, "total_steps": 17941, "loss": 1.9146, "learning_rate": 1.977221933241654e-05, "epoch": 0.7116660163870464, "percentage": 71.17, "elapsed_time": "1 day, 6:13:22", "remaining_time": "12:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12769, "total_steps": 17941, "loss": 1.4818, "learning_rate": 1.9765127027167117e-05, "epoch": 0.7117217546402096, "percentage": 71.17, "elapsed_time": "1 day, 6:13:31", "remaining_time": "12:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12770, "total_steps": 17941, "loss": 1.6821, "learning_rate": 1.9758035680791593e-05, "epoch": 0.7117774928933728, "percentage": 71.18, "elapsed_time": "1 day, 6:13:39", "remaining_time": "12:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12771, "total_steps": 17941, "loss": 1.5839, "learning_rate": 1.975094529351485e-05, "epoch": 0.7118332311465358, "percentage": 71.18, "elapsed_time": "1 day, 6:13:48", "remaining_time": "12:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12772, "total_steps": 17941, "loss": 1.7335, "learning_rate": 1.9743855865561772e-05, "epoch": 0.711888969399699, "percentage": 71.19, "elapsed_time": "1 day, 6:13:56", "remaining_time": "12:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12773, "total_steps": 17941, "loss": 1.4159, "learning_rate": 1.9736767397157147e-05, "epoch": 0.7119447076528621, "percentage": 71.19, "elapsed_time": "1 day, 6:14:05", "remaining_time": "12:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12774, "total_steps": 17941, "loss": 1.6998, "learning_rate": 1.9729679888525847e-05, "epoch": 0.7120004459060253, "percentage": 71.2, "elapsed_time": "1 day, 6:14:14", "remaining_time": "12:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12775, "total_steps": 17941, "loss": 1.6072, "learning_rate": 1.9722593339892605e-05, "epoch": 0.7120561841591885, "percentage": 71.21, "elapsed_time": "1 day, 6:14:22", "remaining_time": "12:13:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12776, "total_steps": 17941, "loss": 1.4811, "learning_rate": 1.971550775148216e-05, "epoch": 0.7121119224123516, "percentage": 71.21, "elapsed_time": "1 day, 6:14:30", "remaining_time": "12:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12777, "total_steps": 17941, "loss": 1.7223, "learning_rate": 1.9708423123519242e-05, "epoch": 0.7121676606655147, "percentage": 71.22, "elapsed_time": "1 day, 6:14:39", "remaining_time": "12:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12778, "total_steps": 17941, "loss": 1.7612, "learning_rate": 1.9701339456228534e-05, "epoch": 0.7122233989186779, "percentage": 71.22, "elapsed_time": "1 day, 6:14:47", "remaining_time": "12:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12779, "total_steps": 17941, "loss": 1.7783, "learning_rate": 1.96942567498347e-05, "epoch": 0.712279137171841, "percentage": 71.23, "elapsed_time": "1 day, 6:14:57", "remaining_time": "12:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12780, "total_steps": 17941, "loss": 1.5199, "learning_rate": 1.968717500456233e-05, "epoch": 0.7123348754250042, "percentage": 71.23, "elapsed_time": "1 day, 6:15:05", "remaining_time": "12:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12781, "total_steps": 17941, "loss": 1.6642, "learning_rate": 1.9680094220636018e-05, "epoch": 0.7123906136781674, "percentage": 71.24, "elapsed_time": "1 day, 6:15:14", "remaining_time": "12:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12782, "total_steps": 17941, "loss": 1.5273, "learning_rate": 1.967301439828037e-05, "epoch": 0.7124463519313304, "percentage": 71.24, "elapsed_time": "1 day, 6:15:22", "remaining_time": "12:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12783, "total_steps": 17941, "loss": 1.484, "learning_rate": 1.966593553771987e-05, "epoch": 0.7125020901844936, "percentage": 71.25, "elapsed_time": "1 day, 6:15:30", "remaining_time": "12:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12784, "total_steps": 17941, "loss": 1.798, "learning_rate": 1.965885763917904e-05, "epoch": 0.7125578284376568, "percentage": 71.26, "elapsed_time": "1 day, 6:15:39", "remaining_time": "12:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12785, "total_steps": 17941, "loss": 1.4035, "learning_rate": 1.9651780702882338e-05, "epoch": 0.7126135666908199, "percentage": 71.26, "elapsed_time": "1 day, 6:15:47", "remaining_time": "12:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12786, "total_steps": 17941, "loss": 1.5595, "learning_rate": 1.964470472905423e-05, "epoch": 0.7126693049439831, "percentage": 71.27, "elapsed_time": "1 day, 6:15:56", "remaining_time": "12:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12787, "total_steps": 17941, "loss": 1.6134, "learning_rate": 1.9637629717919094e-05, "epoch": 0.7127250431971462, "percentage": 71.27, "elapsed_time": "1 day, 6:16:04", "remaining_time": "12:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12788, "total_steps": 17941, "loss": 1.9148, "learning_rate": 1.963055566970129e-05, "epoch": 0.7127807814503093, "percentage": 71.28, "elapsed_time": "1 day, 6:16:13", "remaining_time": "12:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12789, "total_steps": 17941, "loss": 1.3516, "learning_rate": 1.9623482584625237e-05, "epoch": 0.7128365197034725, "percentage": 71.28, "elapsed_time": "1 day, 6:16:21", "remaining_time": "12:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12790, "total_steps": 17941, "loss": 1.6736, "learning_rate": 1.9616410462915186e-05, "epoch": 0.7128922579566357, "percentage": 71.29, "elapsed_time": "1 day, 6:16:30", "remaining_time": "12:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12791, "total_steps": 17941, "loss": 1.6827, "learning_rate": 1.960933930479545e-05, "epoch": 0.7129479962097988, "percentage": 71.29, "elapsed_time": "1 day, 6:16:38", "remaining_time": "12:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12792, "total_steps": 17941, "loss": 1.7693, "learning_rate": 1.9602269110490273e-05, "epoch": 0.713003734462962, "percentage": 71.3, "elapsed_time": "1 day, 6:16:46", "remaining_time": "12:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12793, "total_steps": 17941, "loss": 1.7255, "learning_rate": 1.9595199880223912e-05, "epoch": 0.7130594727161251, "percentage": 71.31, "elapsed_time": "1 day, 6:16:55", "remaining_time": "12:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12794, "total_steps": 17941, "loss": 1.5599, "learning_rate": 1.9588131614220522e-05, "epoch": 0.7131152109692882, "percentage": 71.31, "elapsed_time": "1 day, 6:17:03", "remaining_time": "12:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12795, "total_steps": 17941, "loss": 1.7379, "learning_rate": 1.958106431270429e-05, "epoch": 0.7131709492224514, "percentage": 71.32, "elapsed_time": "1 day, 6:17:12", "remaining_time": "12:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12796, "total_steps": 17941, "loss": 1.6852, "learning_rate": 1.957399797589933e-05, "epoch": 0.7132266874756145, "percentage": 71.32, "elapsed_time": "1 day, 6:17:20", "remaining_time": "12:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12797, "total_steps": 17941, "loss": 1.8283, "learning_rate": 1.956693260402977e-05, "epoch": 0.7132824257287776, "percentage": 71.33, "elapsed_time": "1 day, 6:17:28", "remaining_time": "12:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12798, "total_steps": 17941, "loss": 1.8184, "learning_rate": 1.955986819731968e-05, "epoch": 0.7133381639819408, "percentage": 71.33, "elapsed_time": "1 day, 6:17:37", "remaining_time": "12:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12799, "total_steps": 17941, "loss": 1.8002, "learning_rate": 1.9552804755993065e-05, "epoch": 0.7133939022351039, "percentage": 71.34, "elapsed_time": "1 day, 6:17:45", "remaining_time": "12:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12800, "total_steps": 17941, "loss": 1.4038, "learning_rate": 1.9545742280273993e-05, "epoch": 0.7134496404882671, "percentage": 71.34, "elapsed_time": "1 day, 6:17:54", "remaining_time": "12:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12801, "total_steps": 17941, "loss": 1.6931, "learning_rate": 1.9538680770386398e-05, "epoch": 0.7135053787414303, "percentage": 71.35, "elapsed_time": "1 day, 6:18:02", "remaining_time": "12:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12802, "total_steps": 17941, "loss": 1.7565, "learning_rate": 1.9531620226554248e-05, "epoch": 0.7135611169945933, "percentage": 71.36, "elapsed_time": "1 day, 6:18:11", "remaining_time": "12:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12803, "total_steps": 17941, "loss": 1.7543, "learning_rate": 1.9524560649001462e-05, "epoch": 0.7136168552477565, "percentage": 71.36, "elapsed_time": "1 day, 6:18:19", "remaining_time": "12:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12804, "total_steps": 17941, "loss": 1.7114, "learning_rate": 1.951750203795193e-05, "epoch": 0.7136725935009197, "percentage": 71.37, "elapsed_time": "1 day, 6:18:28", "remaining_time": "12:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12805, "total_steps": 17941, "loss": 1.4792, "learning_rate": 1.9510444393629525e-05, "epoch": 0.7137283317540828, "percentage": 71.37, "elapsed_time": "1 day, 6:18:36", "remaining_time": "12:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12806, "total_steps": 17941, "loss": 1.6419, "learning_rate": 1.9503387716258038e-05, "epoch": 0.713784070007246, "percentage": 71.38, "elapsed_time": "1 day, 6:18:44", "remaining_time": "12:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12807, "total_steps": 17941, "loss": 1.5288, "learning_rate": 1.9496332006061262e-05, "epoch": 0.7138398082604092, "percentage": 71.38, "elapsed_time": "1 day, 6:18:53", "remaining_time": "12:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12808, "total_steps": 17941, "loss": 1.7274, "learning_rate": 1.9489277263263028e-05, "epoch": 0.7138955465135722, "percentage": 71.39, "elapsed_time": "1 day, 6:19:02", "remaining_time": "12:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12809, "total_steps": 17941, "loss": 2.0038, "learning_rate": 1.9482223488087016e-05, "epoch": 0.7139512847667354, "percentage": 71.4, "elapsed_time": "1 day, 6:19:10", "remaining_time": "12:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12810, "total_steps": 17941, "loss": 1.6409, "learning_rate": 1.9475170680756938e-05, "epoch": 0.7140070230198986, "percentage": 71.4, "elapsed_time": "1 day, 6:19:19", "remaining_time": "12:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12811, "total_steps": 17941, "loss": 1.8189, "learning_rate": 1.9468118841496476e-05, "epoch": 0.7140627612730617, "percentage": 71.41, "elapsed_time": "1 day, 6:19:27", "remaining_time": "12:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12812, "total_steps": 17941, "loss": 1.5253, "learning_rate": 1.9461067970529286e-05, "epoch": 0.7141184995262249, "percentage": 71.41, "elapsed_time": "1 day, 6:19:35", "remaining_time": "12:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12813, "total_steps": 17941, "loss": 1.5391, "learning_rate": 1.9454018068078948e-05, "epoch": 0.714174237779388, "percentage": 71.42, "elapsed_time": "1 day, 6:19:44", "remaining_time": "12:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12814, "total_steps": 17941, "loss": 1.7251, "learning_rate": 1.944696913436905e-05, "epoch": 0.7142299760325511, "percentage": 71.42, "elapsed_time": "1 day, 6:19:52", "remaining_time": "12:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12815, "total_steps": 17941, "loss": 1.6815, "learning_rate": 1.9439921169623183e-05, "epoch": 0.7142857142857143, "percentage": 71.43, "elapsed_time": "1 day, 6:20:01", "remaining_time": "12:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12816, "total_steps": 17941, "loss": 1.5858, "learning_rate": 1.943287417406482e-05, "epoch": 0.7143414525388775, "percentage": 71.43, "elapsed_time": "1 day, 6:20:09", "remaining_time": "12:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12817, "total_steps": 17941, "loss": 1.6417, "learning_rate": 1.9425828147917475e-05, "epoch": 0.7143971907920406, "percentage": 71.44, "elapsed_time": "1 day, 6:20:18", "remaining_time": "12:07:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12818, "total_steps": 17941, "loss": 1.7085, "learning_rate": 1.9418783091404597e-05, "epoch": 0.7144529290452037, "percentage": 71.45, "elapsed_time": "1 day, 6:20:26", "remaining_time": "12:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12819, "total_steps": 17941, "loss": 1.7192, "learning_rate": 1.941173900474964e-05, "epoch": 0.7145086672983668, "percentage": 71.45, "elapsed_time": "1 day, 6:20:35", "remaining_time": "12:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12820, "total_steps": 17941, "loss": 1.7091, "learning_rate": 1.940469588817596e-05, "epoch": 0.71456440555153, "percentage": 71.46, "elapsed_time": "1 day, 6:20:43", "remaining_time": "12:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12821, "total_steps": 17941, "loss": 1.7204, "learning_rate": 1.9397653741906947e-05, "epoch": 0.7146201438046932, "percentage": 71.46, "elapsed_time": "1 day, 6:20:51", "remaining_time": "12:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12822, "total_steps": 17941, "loss": 1.8386, "learning_rate": 1.939061256616593e-05, "epoch": 0.7146758820578563, "percentage": 71.47, "elapsed_time": "1 day, 6:21:00", "remaining_time": "12:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12823, "total_steps": 17941, "loss": 1.4818, "learning_rate": 1.9383572361176216e-05, "epoch": 0.7147316203110194, "percentage": 71.47, "elapsed_time": "1 day, 6:21:08", "remaining_time": "12:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12824, "total_steps": 17941, "loss": 1.6351, "learning_rate": 1.93765331271611e-05, "epoch": 0.7147873585641826, "percentage": 71.48, "elapsed_time": "1 day, 6:21:17", "remaining_time": "12:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12825, "total_steps": 17941, "loss": 1.7558, "learning_rate": 1.9369494864343768e-05, "epoch": 0.7148430968173457, "percentage": 71.48, "elapsed_time": "1 day, 6:21:25", "remaining_time": "12:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12826, "total_steps": 17941, "loss": 1.4818, "learning_rate": 1.9362457572947508e-05, "epoch": 0.7148988350705089, "percentage": 71.49, "elapsed_time": "1 day, 6:21:34", "remaining_time": "12:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12827, "total_steps": 17941, "loss": 1.5985, "learning_rate": 1.935542125319545e-05, "epoch": 0.7149545733236721, "percentage": 71.5, "elapsed_time": "1 day, 6:21:42", "remaining_time": "12:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12828, "total_steps": 17941, "loss": 1.6352, "learning_rate": 1.9348385905310757e-05, "epoch": 0.7150103115768351, "percentage": 71.5, "elapsed_time": "1 day, 6:21:51", "remaining_time": "12:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12829, "total_steps": 17941, "loss": 1.6083, "learning_rate": 1.934135152951655e-05, "epoch": 0.7150660498299983, "percentage": 71.51, "elapsed_time": "1 day, 6:21:59", "remaining_time": "12:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12830, "total_steps": 17941, "loss": 1.6754, "learning_rate": 1.9334318126035922e-05, "epoch": 0.7151217880831615, "percentage": 71.51, "elapsed_time": "1 day, 6:22:08", "remaining_time": "12:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12831, "total_steps": 17941, "loss": 1.695, "learning_rate": 1.9327285695091946e-05, "epoch": 0.7151775263363246, "percentage": 71.52, "elapsed_time": "1 day, 6:22:16", "remaining_time": "12:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12832, "total_steps": 17941, "loss": 1.9642, "learning_rate": 1.932025423690762e-05, "epoch": 0.7152332645894878, "percentage": 71.52, "elapsed_time": "1 day, 6:22:25", "remaining_time": "12:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12833, "total_steps": 17941, "loss": 1.3916, "learning_rate": 1.9313223751705935e-05, "epoch": 0.715289002842651, "percentage": 71.53, "elapsed_time": "1 day, 6:22:34", "remaining_time": "12:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12834, "total_steps": 17941, "loss": 1.4148, "learning_rate": 1.9306194239709906e-05, "epoch": 0.715344741095814, "percentage": 71.53, "elapsed_time": "1 day, 6:22:42", "remaining_time": "12:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12835, "total_steps": 17941, "loss": 1.3771, "learning_rate": 1.9299165701142426e-05, "epoch": 0.7154004793489772, "percentage": 71.54, "elapsed_time": "1 day, 6:22:51", "remaining_time": "12:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12836, "total_steps": 17941, "loss": 1.6937, "learning_rate": 1.9292138136226413e-05, "epoch": 0.7154562176021404, "percentage": 71.55, "elapsed_time": "1 day, 6:23:00", "remaining_time": "12:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12837, "total_steps": 17941, "loss": 1.6335, "learning_rate": 1.928511154518473e-05, "epoch": 0.7155119558553035, "percentage": 71.55, "elapsed_time": "1 day, 6:23:08", "remaining_time": "12:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12838, "total_steps": 17941, "loss": 1.7754, "learning_rate": 1.927808592824026e-05, "epoch": 0.7155676941084667, "percentage": 71.56, "elapsed_time": "1 day, 6:23:16", "remaining_time": "12:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12839, "total_steps": 17941, "loss": 1.607, "learning_rate": 1.9271061285615755e-05, "epoch": 0.7156234323616298, "percentage": 71.56, "elapsed_time": "1 day, 6:23:25", "remaining_time": "12:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12840, "total_steps": 17941, "loss": 1.6942, "learning_rate": 1.926403761753401e-05, "epoch": 0.7156791706147929, "percentage": 71.57, "elapsed_time": "1 day, 6:23:33", "remaining_time": "12:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12841, "total_steps": 17941, "loss": 1.7635, "learning_rate": 1.925701492421782e-05, "epoch": 0.7157349088679561, "percentage": 71.57, "elapsed_time": "1 day, 6:23:42", "remaining_time": "12:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12842, "total_steps": 17941, "loss": 1.5762, "learning_rate": 1.924999320588986e-05, "epoch": 0.7157906471211192, "percentage": 71.58, "elapsed_time": "1 day, 6:23:50", "remaining_time": "12:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12843, "total_steps": 17941, "loss": 1.8578, "learning_rate": 1.924297246277283e-05, "epoch": 0.7158463853742824, "percentage": 71.58, "elapsed_time": "1 day, 6:23:59", "remaining_time": "12:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12844, "total_steps": 17941, "loss": 1.5414, "learning_rate": 1.9235952695089388e-05, "epoch": 0.7159021236274455, "percentage": 71.59, "elapsed_time": "1 day, 6:24:07", "remaining_time": "12:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12845, "total_steps": 17941, "loss": 1.4997, "learning_rate": 1.9228933903062173e-05, "epoch": 0.7159578618806086, "percentage": 71.6, "elapsed_time": "1 day, 6:24:16", "remaining_time": "12:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12846, "total_steps": 17941, "loss": 1.6019, "learning_rate": 1.9221916086913756e-05, "epoch": 0.7160136001337718, "percentage": 71.6, "elapsed_time": "1 day, 6:24:24", "remaining_time": "12:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12847, "total_steps": 17941, "loss": 1.4985, "learning_rate": 1.9214899246866707e-05, "epoch": 0.716069338386935, "percentage": 71.61, "elapsed_time": "1 day, 6:24:32", "remaining_time": "12:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12848, "total_steps": 17941, "loss": 1.9859, "learning_rate": 1.9207883383143566e-05, "epoch": 0.7161250766400981, "percentage": 71.61, "elapsed_time": "1 day, 6:24:41", "remaining_time": "12:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12849, "total_steps": 17941, "loss": 1.8885, "learning_rate": 1.9200868495966827e-05, "epoch": 0.7161808148932612, "percentage": 71.62, "elapsed_time": "1 day, 6:24:49", "remaining_time": "12:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12850, "total_steps": 17941, "loss": 1.8515, "learning_rate": 1.9193854585558996e-05, "epoch": 0.7162365531464244, "percentage": 71.62, "elapsed_time": "1 day, 6:24:58", "remaining_time": "12:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12851, "total_steps": 17941, "loss": 1.6183, "learning_rate": 1.9186841652142446e-05, "epoch": 0.7162922913995875, "percentage": 71.63, "elapsed_time": "1 day, 6:25:07", "remaining_time": "12:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12852, "total_steps": 17941, "loss": 1.5724, "learning_rate": 1.917982969593966e-05, "epoch": 0.7163480296527507, "percentage": 71.63, "elapsed_time": "1 day, 6:25:15", "remaining_time": "12:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12853, "total_steps": 17941, "loss": 1.7062, "learning_rate": 1.9172818717172964e-05, "epoch": 0.7164037679059139, "percentage": 71.64, "elapsed_time": "1 day, 6:25:23", "remaining_time": "12:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12854, "total_steps": 17941, "loss": 1.6388, "learning_rate": 1.9165808716064727e-05, "epoch": 0.7164595061590769, "percentage": 71.65, "elapsed_time": "1 day, 6:25:32", "remaining_time": "12:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12855, "total_steps": 17941, "loss": 1.5902, "learning_rate": 1.9158799692837258e-05, "epoch": 0.7165152444122401, "percentage": 71.65, "elapsed_time": "1 day, 6:25:40", "remaining_time": "12:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12856, "total_steps": 17941, "loss": 1.5341, "learning_rate": 1.9151791647712848e-05, "epoch": 0.7165709826654033, "percentage": 71.66, "elapsed_time": "1 day, 6:25:49", "remaining_time": "12:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12857, "total_steps": 17941, "loss": 1.5641, "learning_rate": 1.9144784580913765e-05, "epoch": 0.7166267209185664, "percentage": 71.66, "elapsed_time": "1 day, 6:25:57", "remaining_time": "12:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12858, "total_steps": 17941, "loss": 1.4185, "learning_rate": 1.91377784926622e-05, "epoch": 0.7166824591717296, "percentage": 71.67, "elapsed_time": "1 day, 6:26:06", "remaining_time": "12:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12859, "total_steps": 17941, "loss": 1.6281, "learning_rate": 1.9130773383180344e-05, "epoch": 0.7167381974248928, "percentage": 71.67, "elapsed_time": "1 day, 6:26:14", "remaining_time": "12:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12860, "total_steps": 17941, "loss": 1.4896, "learning_rate": 1.912376925269041e-05, "epoch": 0.7167939356780558, "percentage": 71.68, "elapsed_time": "1 day, 6:26:23", "remaining_time": "12:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12861, "total_steps": 17941, "loss": 1.6033, "learning_rate": 1.911676610141448e-05, "epoch": 0.716849673931219, "percentage": 71.68, "elapsed_time": "1 day, 6:26:31", "remaining_time": "12:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12862, "total_steps": 17941, "loss": 1.5138, "learning_rate": 1.9109763929574665e-05, "epoch": 0.7169054121843822, "percentage": 71.69, "elapsed_time": "1 day, 6:26:39", "remaining_time": "12:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12863, "total_steps": 17941, "loss": 1.728, "learning_rate": 1.910276273739304e-05, "epoch": 0.7169611504375453, "percentage": 71.7, "elapsed_time": "1 day, 6:26:48", "remaining_time": "12:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12864, "total_steps": 17941, "loss": 1.8363, "learning_rate": 1.909576252509165e-05, "epoch": 0.7170168886907085, "percentage": 71.7, "elapsed_time": "1 day, 6:26:56", "remaining_time": "12:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12865, "total_steps": 17941, "loss": 1.6138, "learning_rate": 1.9088763292892468e-05, "epoch": 0.7170726269438715, "percentage": 71.71, "elapsed_time": "1 day, 6:27:05", "remaining_time": "12:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12866, "total_steps": 17941, "loss": 1.6805, "learning_rate": 1.908176504101748e-05, "epoch": 0.7171283651970347, "percentage": 71.71, "elapsed_time": "1 day, 6:27:13", "remaining_time": "12:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12867, "total_steps": 17941, "loss": 1.5874, "learning_rate": 1.9074767769688674e-05, "epoch": 0.7171841034501979, "percentage": 71.72, "elapsed_time": "1 day, 6:27:22", "remaining_time": "12:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12868, "total_steps": 17941, "loss": 1.7405, "learning_rate": 1.9067771479127905e-05, "epoch": 0.717239841703361, "percentage": 71.72, "elapsed_time": "1 day, 6:27:30", "remaining_time": "12:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12869, "total_steps": 17941, "loss": 1.9751, "learning_rate": 1.9060776169557083e-05, "epoch": 0.7172955799565242, "percentage": 71.73, "elapsed_time": "1 day, 6:27:39", "remaining_time": "12:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12870, "total_steps": 17941, "loss": 1.701, "learning_rate": 1.9053781841198044e-05, "epoch": 0.7173513182096873, "percentage": 71.74, "elapsed_time": "1 day, 6:27:47", "remaining_time": "12:00:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12871, "total_steps": 17941, "loss": 1.5356, "learning_rate": 1.9046788494272638e-05, "epoch": 0.7174070564628504, "percentage": 71.74, "elapsed_time": "1 day, 6:27:56", "remaining_time": "12:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12872, "total_steps": 17941, "loss": 1.6373, "learning_rate": 1.903979612900262e-05, "epoch": 0.7174627947160136, "percentage": 71.75, "elapsed_time": "1 day, 6:28:04", "remaining_time": "11:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12873, "total_steps": 17941, "loss": 1.919, "learning_rate": 1.903280474560975e-05, "epoch": 0.7175185329691768, "percentage": 71.75, "elapsed_time": "1 day, 6:28:13", "remaining_time": "11:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12874, "total_steps": 17941, "loss": 1.6801, "learning_rate": 1.902581434431576e-05, "epoch": 0.7175742712223399, "percentage": 71.76, "elapsed_time": "1 day, 6:28:21", "remaining_time": "11:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12875, "total_steps": 17941, "loss": 1.7047, "learning_rate": 1.9018824925342353e-05, "epoch": 0.717630009475503, "percentage": 71.76, "elapsed_time": "1 day, 6:28:30", "remaining_time": "11:59:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12876, "total_steps": 17941, "loss": 1.5699, "learning_rate": 1.9011836488911207e-05, "epoch": 0.7176857477286662, "percentage": 71.77, "elapsed_time": "1 day, 6:28:39", "remaining_time": "11:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12877, "total_steps": 17941, "loss": 1.8281, "learning_rate": 1.9004849035243894e-05, "epoch": 0.7177414859818293, "percentage": 71.77, "elapsed_time": "1 day, 6:28:47", "remaining_time": "11:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12878, "total_steps": 17941, "loss": 1.6098, "learning_rate": 1.8997862564562092e-05, "epoch": 0.7177972242349925, "percentage": 71.78, "elapsed_time": "1 day, 6:28:55", "remaining_time": "11:59:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12879, "total_steps": 17941, "loss": 1.6627, "learning_rate": 1.8990877077087315e-05, "epoch": 0.7178529624881557, "percentage": 71.79, "elapsed_time": "1 day, 6:29:04", "remaining_time": "11:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12880, "total_steps": 17941, "loss": 1.5231, "learning_rate": 1.8983892573041124e-05, "epoch": 0.7179087007413187, "percentage": 71.79, "elapsed_time": "1 day, 6:29:12", "remaining_time": "11:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12881, "total_steps": 17941, "loss": 1.5775, "learning_rate": 1.897690905264502e-05, "epoch": 0.7179644389944819, "percentage": 71.8, "elapsed_time": "1 day, 6:29:21", "remaining_time": "11:58:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12882, "total_steps": 17941, "loss": 1.5025, "learning_rate": 1.8969926516120486e-05, "epoch": 0.7180201772476451, "percentage": 71.8, "elapsed_time": "1 day, 6:29:29", "remaining_time": "11:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12883, "total_steps": 17941, "loss": 1.6357, "learning_rate": 1.8962944963688982e-05, "epoch": 0.7180759155008082, "percentage": 71.81, "elapsed_time": "1 day, 6:29:38", "remaining_time": "11:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12884, "total_steps": 17941, "loss": 1.617, "learning_rate": 1.8955964395571875e-05, "epoch": 0.7181316537539714, "percentage": 71.81, "elapsed_time": "1 day, 6:29:46", "remaining_time": "11:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12885, "total_steps": 17941, "loss": 1.7125, "learning_rate": 1.894898481199059e-05, "epoch": 0.7181873920071346, "percentage": 71.82, "elapsed_time": "1 day, 6:29:55", "remaining_time": "11:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12886, "total_steps": 17941, "loss": 1.5926, "learning_rate": 1.8942006213166486e-05, "epoch": 0.7182431302602976, "percentage": 71.82, "elapsed_time": "1 day, 6:30:03", "remaining_time": "11:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12887, "total_steps": 17941, "loss": 1.5145, "learning_rate": 1.8935028599320846e-05, "epoch": 0.7182988685134608, "percentage": 71.83, "elapsed_time": "1 day, 6:30:12", "remaining_time": "11:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12888, "total_steps": 17941, "loss": 1.7493, "learning_rate": 1.8928051970674975e-05, "epoch": 0.7183546067666239, "percentage": 71.84, "elapsed_time": "1 day, 6:30:20", "remaining_time": "11:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12889, "total_steps": 17941, "loss": 1.5814, "learning_rate": 1.892107632745014e-05, "epoch": 0.7184103450197871, "percentage": 71.84, "elapsed_time": "1 day, 6:30:28", "remaining_time": "11:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12890, "total_steps": 17941, "loss": 1.5899, "learning_rate": 1.8914101669867572e-05, "epoch": 0.7184660832729503, "percentage": 71.85, "elapsed_time": "1 day, 6:30:37", "remaining_time": "11:57:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12891, "total_steps": 17941, "loss": 1.6587, "learning_rate": 1.8907127998148444e-05, "epoch": 0.7185218215261133, "percentage": 71.85, "elapsed_time": "1 day, 6:30:46", "remaining_time": "11:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12892, "total_steps": 17941, "loss": 1.4609, "learning_rate": 1.8900155312513913e-05, "epoch": 0.7185775597792765, "percentage": 71.86, "elapsed_time": "1 day, 6:30:54", "remaining_time": "11:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12893, "total_steps": 17941, "loss": 1.715, "learning_rate": 1.8893183613185163e-05, "epoch": 0.7186332980324397, "percentage": 71.86, "elapsed_time": "1 day, 6:31:02", "remaining_time": "11:56:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12894, "total_steps": 17941, "loss": 1.5037, "learning_rate": 1.8886212900383248e-05, "epoch": 0.7186890362856028, "percentage": 71.87, "elapsed_time": "1 day, 6:31:11", "remaining_time": "11:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12895, "total_steps": 17941, "loss": 1.3882, "learning_rate": 1.887924317432925e-05, "epoch": 0.718744774538766, "percentage": 71.87, "elapsed_time": "1 day, 6:31:20", "remaining_time": "11:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12896, "total_steps": 17941, "loss": 1.6411, "learning_rate": 1.887227443524422e-05, "epoch": 0.7188005127919291, "percentage": 71.88, "elapsed_time": "1 day, 6:31:29", "remaining_time": "11:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12897, "total_steps": 17941, "loss": 1.7263, "learning_rate": 1.886530668334917e-05, "epoch": 0.7188562510450922, "percentage": 71.89, "elapsed_time": "1 day, 6:31:37", "remaining_time": "11:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12898, "total_steps": 17941, "loss": 1.5848, "learning_rate": 1.8858339918865046e-05, "epoch": 0.7189119892982554, "percentage": 71.89, "elapsed_time": "1 day, 6:31:45", "remaining_time": "11:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12899, "total_steps": 17941, "loss": 1.8026, "learning_rate": 1.885137414201281e-05, "epoch": 0.7189677275514186, "percentage": 71.9, "elapsed_time": "1 day, 6:31:54", "remaining_time": "11:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12900, "total_steps": 17941, "loss": 1.6852, "learning_rate": 1.884440935301338e-05, "epoch": 0.7190234658045817, "percentage": 71.9, "elapsed_time": "1 day, 6:32:03", "remaining_time": "11:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12901, "total_steps": 17941, "loss": 1.5815, "learning_rate": 1.883744555208764e-05, "epoch": 0.7190792040577448, "percentage": 71.91, "elapsed_time": "1 day, 6:32:12", "remaining_time": "11:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12902, "total_steps": 17941, "loss": 1.6217, "learning_rate": 1.8830482739456452e-05, "epoch": 0.719134942310908, "percentage": 71.91, "elapsed_time": "1 day, 6:32:20", "remaining_time": "11:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12903, "total_steps": 17941, "loss": 1.7787, "learning_rate": 1.8823520915340583e-05, "epoch": 0.7191906805640711, "percentage": 71.92, "elapsed_time": "1 day, 6:32:28", "remaining_time": "11:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12904, "total_steps": 17941, "loss": 1.2857, "learning_rate": 1.8816560079960892e-05, "epoch": 0.7192464188172343, "percentage": 71.92, "elapsed_time": "1 day, 6:32:37", "remaining_time": "11:55:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12905, "total_steps": 17941, "loss": 1.6263, "learning_rate": 1.8809600233538087e-05, "epoch": 0.7193021570703975, "percentage": 71.93, "elapsed_time": "1 day, 6:32:45", "remaining_time": "11:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12906, "total_steps": 17941, "loss": 1.3656, "learning_rate": 1.8802641376292914e-05, "epoch": 0.7193578953235605, "percentage": 71.94, "elapsed_time": "1 day, 6:32:54", "remaining_time": "11:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12907, "total_steps": 17941, "loss": 1.7087, "learning_rate": 1.8795683508446055e-05, "epoch": 0.7194136335767237, "percentage": 71.94, "elapsed_time": "1 day, 6:33:02", "remaining_time": "11:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12908, "total_steps": 17941, "loss": 1.7132, "learning_rate": 1.878872663021819e-05, "epoch": 0.7194693718298869, "percentage": 71.95, "elapsed_time": "1 day, 6:33:11", "remaining_time": "11:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12909, "total_steps": 17941, "loss": 1.6527, "learning_rate": 1.8781770741829956e-05, "epoch": 0.71952511008305, "percentage": 71.95, "elapsed_time": "1 day, 6:33:19", "remaining_time": "11:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12910, "total_steps": 17941, "loss": 1.7389, "learning_rate": 1.8774815843501904e-05, "epoch": 0.7195808483362132, "percentage": 71.96, "elapsed_time": "1 day, 6:33:28", "remaining_time": "11:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12911, "total_steps": 17941, "loss": 1.5739, "learning_rate": 1.8767861935454673e-05, "epoch": 0.7196365865893762, "percentage": 71.96, "elapsed_time": "1 day, 6:33:36", "remaining_time": "11:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12912, "total_steps": 17941, "loss": 1.3315, "learning_rate": 1.8760909017908746e-05, "epoch": 0.7196923248425394, "percentage": 71.97, "elapsed_time": "1 day, 6:33:45", "remaining_time": "11:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12913, "total_steps": 17941, "loss": 1.634, "learning_rate": 1.875395709108465e-05, "epoch": 0.7197480630957026, "percentage": 71.97, "elapsed_time": "1 day, 6:33:53", "remaining_time": "11:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12914, "total_steps": 17941, "loss": 1.6764, "learning_rate": 1.874700615520286e-05, "epoch": 0.7198038013488657, "percentage": 71.98, "elapsed_time": "1 day, 6:34:02", "remaining_time": "11:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12915, "total_steps": 17941, "loss": 1.7273, "learning_rate": 1.8740056210483815e-05, "epoch": 0.7198595396020289, "percentage": 71.99, "elapsed_time": "1 day, 6:34:10", "remaining_time": "11:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12916, "total_steps": 17941, "loss": 1.6144, "learning_rate": 1.873310725714795e-05, "epoch": 0.719915277855192, "percentage": 71.99, "elapsed_time": "1 day, 6:34:18", "remaining_time": "11:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12917, "total_steps": 17941, "loss": 1.6216, "learning_rate": 1.8726159295415603e-05, "epoch": 0.7199710161083551, "percentage": 72.0, "elapsed_time": "1 day, 6:34:27", "remaining_time": "11:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12918, "total_steps": 17941, "loss": 1.44, "learning_rate": 1.8719212325507123e-05, "epoch": 0.7200267543615183, "percentage": 72.0, "elapsed_time": "1 day, 6:34:35", "remaining_time": "11:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12919, "total_steps": 17941, "loss": 1.7272, "learning_rate": 1.871226634764289e-05, "epoch": 0.7200824926146815, "percentage": 72.01, "elapsed_time": "1 day, 6:34:44", "remaining_time": "11:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12920, "total_steps": 17941, "loss": 1.4406, "learning_rate": 1.870532136204313e-05, "epoch": 0.7201382308678446, "percentage": 72.01, "elapsed_time": "1 day, 6:34:52", "remaining_time": "11:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12921, "total_steps": 17941, "loss": 1.6393, "learning_rate": 1.8698377368928115e-05, "epoch": 0.7201939691210077, "percentage": 72.02, "elapsed_time": "1 day, 6:35:01", "remaining_time": "11:52:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12922, "total_steps": 17941, "loss": 1.7118, "learning_rate": 1.8691434368518067e-05, "epoch": 0.7202497073741709, "percentage": 72.02, "elapsed_time": "1 day, 6:35:10", "remaining_time": "11:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12923, "total_steps": 17941, "loss": 1.7196, "learning_rate": 1.8684492361033196e-05, "epoch": 0.720305445627334, "percentage": 72.03, "elapsed_time": "1 day, 6:35:18", "remaining_time": "11:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12924, "total_steps": 17941, "loss": 1.5354, "learning_rate": 1.8677551346693633e-05, "epoch": 0.7203611838804972, "percentage": 72.04, "elapsed_time": "1 day, 6:35:27", "remaining_time": "11:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12925, "total_steps": 17941, "loss": 1.7636, "learning_rate": 1.867061132571951e-05, "epoch": 0.7204169221336604, "percentage": 72.04, "elapsed_time": "1 day, 6:35:35", "remaining_time": "11:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12926, "total_steps": 17941, "loss": 1.6949, "learning_rate": 1.8663672298330942e-05, "epoch": 0.7204726603868234, "percentage": 72.05, "elapsed_time": "1 day, 6:35:44", "remaining_time": "11:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12927, "total_steps": 17941, "loss": 1.684, "learning_rate": 1.865673426474798e-05, "epoch": 0.7205283986399866, "percentage": 72.05, "elapsed_time": "1 day, 6:35:52", "remaining_time": "11:52:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12928, "total_steps": 17941, "loss": 1.6678, "learning_rate": 1.864979722519068e-05, "epoch": 0.7205841368931498, "percentage": 72.06, "elapsed_time": "1 day, 6:36:01", "remaining_time": "11:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12929, "total_steps": 17941, "loss": 1.7897, "learning_rate": 1.8642861179878994e-05, "epoch": 0.7206398751463129, "percentage": 72.06, "elapsed_time": "1 day, 6:36:09", "remaining_time": "11:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12930, "total_steps": 17941, "loss": 1.7266, "learning_rate": 1.8635926129032964e-05, "epoch": 0.7206956133994761, "percentage": 72.07, "elapsed_time": "1 day, 6:36:18", "remaining_time": "11:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12931, "total_steps": 17941, "loss": 1.606, "learning_rate": 1.8628992072872476e-05, "epoch": 0.7207513516526393, "percentage": 72.08, "elapsed_time": "1 day, 6:36:26", "remaining_time": "11:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12932, "total_steps": 17941, "loss": 1.7615, "learning_rate": 1.862205901161745e-05, "epoch": 0.7208070899058023, "percentage": 72.08, "elapsed_time": "1 day, 6:36:35", "remaining_time": "11:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12933, "total_steps": 17941, "loss": 1.8626, "learning_rate": 1.8615126945487766e-05, "epoch": 0.7208628281589655, "percentage": 72.09, "elapsed_time": "1 day, 6:36:43", "remaining_time": "11:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12934, "total_steps": 17941, "loss": 1.871, "learning_rate": 1.8608195874703266e-05, "epoch": 0.7209185664121286, "percentage": 72.09, "elapsed_time": "1 day, 6:36:52", "remaining_time": "11:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12935, "total_steps": 17941, "loss": 1.4462, "learning_rate": 1.8601265799483786e-05, "epoch": 0.7209743046652918, "percentage": 72.1, "elapsed_time": "1 day, 6:37:00", "remaining_time": "11:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12936, "total_steps": 17941, "loss": 1.4693, "learning_rate": 1.8594336720049055e-05, "epoch": 0.721030042918455, "percentage": 72.1, "elapsed_time": "1 day, 6:37:08", "remaining_time": "11:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12937, "total_steps": 17941, "loss": 1.3201, "learning_rate": 1.8587408636618887e-05, "epoch": 0.721085781171618, "percentage": 72.11, "elapsed_time": "1 day, 6:37:17", "remaining_time": "11:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12938, "total_steps": 17941, "loss": 1.5373, "learning_rate": 1.8580481549412953e-05, "epoch": 0.7211415194247812, "percentage": 72.11, "elapsed_time": "1 day, 6:37:26", "remaining_time": "11:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12939, "total_steps": 17941, "loss": 1.5566, "learning_rate": 1.857355545865096e-05, "epoch": 0.7211972576779444, "percentage": 72.12, "elapsed_time": "1 day, 6:37:34", "remaining_time": "11:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12940, "total_steps": 17941, "loss": 1.9095, "learning_rate": 1.856663036455255e-05, "epoch": 0.7212529959311075, "percentage": 72.13, "elapsed_time": "1 day, 6:37:42", "remaining_time": "11:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12941, "total_steps": 17941, "loss": 1.7033, "learning_rate": 1.8559706267337362e-05, "epoch": 0.7213087341842707, "percentage": 72.13, "elapsed_time": "1 day, 6:37:51", "remaining_time": "11:50:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12942, "total_steps": 17941, "loss": 1.7649, "learning_rate": 1.8552783167224995e-05, "epoch": 0.7213644724374338, "percentage": 72.14, "elapsed_time": "1 day, 6:37:59", "remaining_time": "11:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12943, "total_steps": 17941, "loss": 1.6757, "learning_rate": 1.8545861064434984e-05, "epoch": 0.7214202106905969, "percentage": 72.14, "elapsed_time": "1 day, 6:38:08", "remaining_time": "11:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12944, "total_steps": 17941, "loss": 1.5795, "learning_rate": 1.853893995918685e-05, "epoch": 0.7214759489437601, "percentage": 72.15, "elapsed_time": "1 day, 6:38:16", "remaining_time": "11:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12945, "total_steps": 17941, "loss": 1.3856, "learning_rate": 1.8532019851700143e-05, "epoch": 0.7215316871969233, "percentage": 72.15, "elapsed_time": "1 day, 6:38:25", "remaining_time": "11:49:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12946, "total_steps": 17941, "loss": 1.83, "learning_rate": 1.852510074219428e-05, "epoch": 0.7215874254500864, "percentage": 72.16, "elapsed_time": "1 day, 6:38:33", "remaining_time": "11:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12947, "total_steps": 17941, "loss": 1.3333, "learning_rate": 1.851818263088871e-05, "epoch": 0.7216431637032495, "percentage": 72.16, "elapsed_time": "1 day, 6:38:42", "remaining_time": "11:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12948, "total_steps": 17941, "loss": 1.2956, "learning_rate": 1.851126551800283e-05, "epoch": 0.7216989019564127, "percentage": 72.17, "elapsed_time": "1 day, 6:38:50", "remaining_time": "11:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12949, "total_steps": 17941, "loss": 1.5162, "learning_rate": 1.8504349403756038e-05, "epoch": 0.7217546402095758, "percentage": 72.18, "elapsed_time": "1 day, 6:38:59", "remaining_time": "11:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12950, "total_steps": 17941, "loss": 1.5998, "learning_rate": 1.8497434288367633e-05, "epoch": 0.721810378462739, "percentage": 72.18, "elapsed_time": "1 day, 6:39:07", "remaining_time": "11:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12951, "total_steps": 17941, "loss": 1.6553, "learning_rate": 1.8490520172056942e-05, "epoch": 0.7218661167159022, "percentage": 72.19, "elapsed_time": "1 day, 6:39:16", "remaining_time": "11:48:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12952, "total_steps": 17941, "loss": 1.5902, "learning_rate": 1.8483607055043233e-05, "epoch": 0.7219218549690652, "percentage": 72.19, "elapsed_time": "1 day, 6:39:24", "remaining_time": "11:48:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12953, "total_steps": 17941, "loss": 1.6285, "learning_rate": 1.847669493754576e-05, "epoch": 0.7219775932222284, "percentage": 72.2, "elapsed_time": "1 day, 6:39:32", "remaining_time": "11:48:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12954, "total_steps": 17941, "loss": 1.625, "learning_rate": 1.8469783819783735e-05, "epoch": 0.7220333314753916, "percentage": 72.2, "elapsed_time": "1 day, 6:39:41", "remaining_time": "11:48:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12955, "total_steps": 17941, "loss": 1.7366, "learning_rate": 1.8462873701976314e-05, "epoch": 0.7220890697285547, "percentage": 72.21, "elapsed_time": "1 day, 6:39:49", "remaining_time": "11:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12956, "total_steps": 17941, "loss": 1.608, "learning_rate": 1.8455964584342693e-05, "epoch": 0.7221448079817179, "percentage": 72.21, "elapsed_time": "1 day, 6:39:58", "remaining_time": "11:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12957, "total_steps": 17941, "loss": 1.7061, "learning_rate": 1.8449056467101945e-05, "epoch": 0.722200546234881, "percentage": 72.22, "elapsed_time": "1 day, 6:40:07", "remaining_time": "11:47:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12958, "total_steps": 17941, "loss": 1.5652, "learning_rate": 1.8442149350473172e-05, "epoch": 0.7222562844880441, "percentage": 72.23, "elapsed_time": "1 day, 6:40:15", "remaining_time": "11:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12959, "total_steps": 17941, "loss": 1.6385, "learning_rate": 1.843524323467542e-05, "epoch": 0.7223120227412073, "percentage": 72.23, "elapsed_time": "1 day, 6:40:24", "remaining_time": "11:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12960, "total_steps": 17941, "loss": 1.7745, "learning_rate": 1.8428338119927724e-05, "epoch": 0.7223677609943704, "percentage": 72.24, "elapsed_time": "1 day, 6:40:33", "remaining_time": "11:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12961, "total_steps": 17941, "loss": 1.6446, "learning_rate": 1.8421434006449084e-05, "epoch": 0.7224234992475336, "percentage": 72.24, "elapsed_time": "1 day, 6:40:42", "remaining_time": "11:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12962, "total_steps": 17941, "loss": 1.6425, "learning_rate": 1.8414530894458403e-05, "epoch": 0.7224792375006968, "percentage": 72.25, "elapsed_time": "1 day, 6:40:50", "remaining_time": "11:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12963, "total_steps": 17941, "loss": 1.6815, "learning_rate": 1.8407628784174686e-05, "epoch": 0.7225349757538598, "percentage": 72.25, "elapsed_time": "1 day, 6:40:58", "remaining_time": "11:46:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12964, "total_steps": 17941, "loss": 1.6791, "learning_rate": 1.8400727675816765e-05, "epoch": 0.722590714007023, "percentage": 72.26, "elapsed_time": "1 day, 6:41:07", "remaining_time": "11:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12965, "total_steps": 17941, "loss": 1.8262, "learning_rate": 1.8393827569603528e-05, "epoch": 0.7226464522601862, "percentage": 72.26, "elapsed_time": "1 day, 6:41:15", "remaining_time": "11:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12966, "total_steps": 17941, "loss": 1.7666, "learning_rate": 1.8386928465753807e-05, "epoch": 0.7227021905133493, "percentage": 72.27, "elapsed_time": "1 day, 6:41:24", "remaining_time": "11:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12967, "total_steps": 17941, "loss": 1.5913, "learning_rate": 1.838003036448639e-05, "epoch": 0.7227579287665125, "percentage": 72.28, "elapsed_time": "1 day, 6:41:32", "remaining_time": "11:46:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12968, "total_steps": 17941, "loss": 1.6933, "learning_rate": 1.8373133266020078e-05, "epoch": 0.7228136670196756, "percentage": 72.28, "elapsed_time": "1 day, 6:41:41", "remaining_time": "11:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12969, "total_steps": 17941, "loss": 1.6757, "learning_rate": 1.836623717057356e-05, "epoch": 0.7228694052728387, "percentage": 72.29, "elapsed_time": "1 day, 6:41:50", "remaining_time": "11:46:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12970, "total_steps": 17941, "loss": 1.605, "learning_rate": 1.8359342078365544e-05, "epoch": 0.7229251435260019, "percentage": 72.29, "elapsed_time": "1 day, 6:41:58", "remaining_time": "11:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12971, "total_steps": 17941, "loss": 1.6577, "learning_rate": 1.8352447989614758e-05, "epoch": 0.7229808817791651, "percentage": 72.3, "elapsed_time": "1 day, 6:42:06", "remaining_time": "11:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12972, "total_steps": 17941, "loss": 1.5251, "learning_rate": 1.834555490453978e-05, "epoch": 0.7230366200323282, "percentage": 72.3, "elapsed_time": "1 day, 6:42:15", "remaining_time": "11:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12973, "total_steps": 17941, "loss": 1.6013, "learning_rate": 1.8338662823359248e-05, "epoch": 0.7230923582854913, "percentage": 72.31, "elapsed_time": "1 day, 6:42:23", "remaining_time": "11:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12974, "total_steps": 17941, "loss": 1.5824, "learning_rate": 1.8331771746291728e-05, "epoch": 0.7231480965386545, "percentage": 72.31, "elapsed_time": "1 day, 6:42:32", "remaining_time": "11:45:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12975, "total_steps": 17941, "loss": 1.7972, "learning_rate": 1.8324881673555788e-05, "epoch": 0.7232038347918176, "percentage": 72.32, "elapsed_time": "1 day, 6:42:41", "remaining_time": "11:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12976, "total_steps": 17941, "loss": 1.6554, "learning_rate": 1.831799260536991e-05, "epoch": 0.7232595730449808, "percentage": 72.33, "elapsed_time": "1 day, 6:42:49", "remaining_time": "11:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12977, "total_steps": 17941, "loss": 1.3969, "learning_rate": 1.8311104541952567e-05, "epoch": 0.723315311298144, "percentage": 72.33, "elapsed_time": "1 day, 6:42:58", "remaining_time": "11:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12978, "total_steps": 17941, "loss": 1.5403, "learning_rate": 1.8304217483522263e-05, "epoch": 0.723371049551307, "percentage": 72.34, "elapsed_time": "1 day, 6:43:06", "remaining_time": "11:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12979, "total_steps": 17941, "loss": 1.7002, "learning_rate": 1.8297331430297365e-05, "epoch": 0.7234267878044702, "percentage": 72.34, "elapsed_time": "1 day, 6:43:15", "remaining_time": "11:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12980, "total_steps": 17941, "loss": 1.4977, "learning_rate": 1.829044638249629e-05, "epoch": 0.7234825260576333, "percentage": 72.35, "elapsed_time": "1 day, 6:43:24", "remaining_time": "11:44:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12981, "total_steps": 17941, "loss": 1.5423, "learning_rate": 1.8283562340337342e-05, "epoch": 0.7235382643107965, "percentage": 72.35, "elapsed_time": "1 day, 6:43:33", "remaining_time": "11:44:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12982, "total_steps": 17941, "loss": 1.7416, "learning_rate": 1.8276679304038912e-05, "epoch": 0.7235940025639597, "percentage": 72.36, "elapsed_time": "1 day, 6:43:41", "remaining_time": "11:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12983, "total_steps": 17941, "loss": 1.6216, "learning_rate": 1.826979727381924e-05, "epoch": 0.7236497408171227, "percentage": 72.36, "elapsed_time": "1 day, 6:43:50", "remaining_time": "11:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12984, "total_steps": 17941, "loss": 1.4643, "learning_rate": 1.8262916249896595e-05, "epoch": 0.7237054790702859, "percentage": 72.37, "elapsed_time": "1 day, 6:43:59", "remaining_time": "11:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12985, "total_steps": 17941, "loss": 1.7197, "learning_rate": 1.825603623248921e-05, "epoch": 0.7237612173234491, "percentage": 72.38, "elapsed_time": "1 day, 6:44:07", "remaining_time": "11:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12986, "total_steps": 17941, "loss": 1.5418, "learning_rate": 1.8249157221815273e-05, "epoch": 0.7238169555766122, "percentage": 72.38, "elapsed_time": "1 day, 6:44:16", "remaining_time": "11:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12987, "total_steps": 17941, "loss": 1.2166, "learning_rate": 1.8242279218092968e-05, "epoch": 0.7238726938297754, "percentage": 72.39, "elapsed_time": "1 day, 6:44:24", "remaining_time": "11:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12988, "total_steps": 17941, "loss": 1.6258, "learning_rate": 1.8235402221540367e-05, "epoch": 0.7239284320829386, "percentage": 72.39, "elapsed_time": "1 day, 6:44:32", "remaining_time": "11:43:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12989, "total_steps": 17941, "loss": 1.6773, "learning_rate": 1.8228526232375643e-05, "epoch": 0.7239841703361016, "percentage": 72.4, "elapsed_time": "1 day, 6:44:41", "remaining_time": "11:43:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12990, "total_steps": 17941, "loss": 1.6878, "learning_rate": 1.822165125081681e-05, "epoch": 0.7240399085892648, "percentage": 72.4, "elapsed_time": "1 day, 6:44:49", "remaining_time": "11:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12991, "total_steps": 17941, "loss": 1.732, "learning_rate": 1.8214777277081917e-05, "epoch": 0.724095646842428, "percentage": 72.41, "elapsed_time": "1 day, 6:44:58", "remaining_time": "11:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12992, "total_steps": 17941, "loss": 1.6358, "learning_rate": 1.8207904311388973e-05, "epoch": 0.7241513850955911, "percentage": 72.42, "elapsed_time": "1 day, 6:45:06", "remaining_time": "11:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12993, "total_steps": 17941, "loss": 1.7553, "learning_rate": 1.8201032353955937e-05, "epoch": 0.7242071233487543, "percentage": 72.42, "elapsed_time": "1 day, 6:45:15", "remaining_time": "11:42:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12994, "total_steps": 17941, "loss": 1.7667, "learning_rate": 1.8194161405000777e-05, "epoch": 0.7242628616019174, "percentage": 72.43, "elapsed_time": "1 day, 6:45:23", "remaining_time": "11:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12995, "total_steps": 17941, "loss": 1.5637, "learning_rate": 1.8187291464741357e-05, "epoch": 0.7243185998550805, "percentage": 72.43, "elapsed_time": "1 day, 6:45:32", "remaining_time": "11:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12996, "total_steps": 17941, "loss": 1.7027, "learning_rate": 1.8180422533395552e-05, "epoch": 0.7243743381082437, "percentage": 72.44, "elapsed_time": "1 day, 6:45:40", "remaining_time": "11:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12997, "total_steps": 17941, "loss": 1.4391, "learning_rate": 1.817355461118126e-05, "epoch": 0.7244300763614069, "percentage": 72.44, "elapsed_time": "1 day, 6:45:48", "remaining_time": "11:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12998, "total_steps": 17941, "loss": 1.5179, "learning_rate": 1.8166687698316236e-05, "epoch": 0.72448581461457, "percentage": 72.45, "elapsed_time": "1 day, 6:45:57", "remaining_time": "11:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12999, "total_steps": 17941, "loss": 1.9367, "learning_rate": 1.815982179501828e-05, "epoch": 0.7245415528677331, "percentage": 72.45, "elapsed_time": "1 day, 6:46:05", "remaining_time": "11:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13000, "total_steps": 17941, "loss": 1.4403, "learning_rate": 1.815295690150513e-05, "epoch": 0.7245972911208963, "percentage": 72.46, "elapsed_time": "1 day, 6:46:14", "remaining_time": "11:41:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13001, "total_steps": 17941, "loss": 1.611, "learning_rate": 1.814609301799453e-05, "epoch": 0.7246530293740594, "percentage": 72.47, "elapsed_time": "1 day, 6:46:22", "remaining_time": "11:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13002, "total_steps": 17941, "loss": 1.5506, "learning_rate": 1.8139230144704116e-05, "epoch": 0.7247087676272226, "percentage": 72.47, "elapsed_time": "1 day, 6:46:31", "remaining_time": "11:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13003, "total_steps": 17941, "loss": 1.7454, "learning_rate": 1.8132368281851547e-05, "epoch": 0.7247645058803857, "percentage": 72.48, "elapsed_time": "1 day, 6:46:39", "remaining_time": "11:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13004, "total_steps": 17941, "loss": 1.7844, "learning_rate": 1.8125507429654488e-05, "epoch": 0.7248202441335488, "percentage": 72.48, "elapsed_time": "1 day, 6:46:48", "remaining_time": "11:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13005, "total_steps": 17941, "loss": 1.4738, "learning_rate": 1.8118647588330472e-05, "epoch": 0.724875982386712, "percentage": 72.49, "elapsed_time": "1 day, 6:46:56", "remaining_time": "11:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13006, "total_steps": 17941, "loss": 1.7141, "learning_rate": 1.8111788758097092e-05, "epoch": 0.7249317206398751, "percentage": 72.49, "elapsed_time": "1 day, 6:47:05", "remaining_time": "11:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13007, "total_steps": 17941, "loss": 1.4829, "learning_rate": 1.8104930939171814e-05, "epoch": 0.7249874588930383, "percentage": 72.5, "elapsed_time": "1 day, 6:47:13", "remaining_time": "11:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13008, "total_steps": 17941, "loss": 1.5404, "learning_rate": 1.809807413177221e-05, "epoch": 0.7250431971462015, "percentage": 72.5, "elapsed_time": "1 day, 6:47:22", "remaining_time": "11:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13009, "total_steps": 17941, "loss": 1.6544, "learning_rate": 1.8091218336115667e-05, "epoch": 0.7250989353993645, "percentage": 72.51, "elapsed_time": "1 day, 6:47:31", "remaining_time": "11:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13010, "total_steps": 17941, "loss": 1.6339, "learning_rate": 1.8084363552419643e-05, "epoch": 0.7251546736525277, "percentage": 72.52, "elapsed_time": "1 day, 6:47:40", "remaining_time": "11:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13011, "total_steps": 17941, "loss": 1.5828, "learning_rate": 1.807750978090152e-05, "epoch": 0.7252104119056909, "percentage": 72.52, "elapsed_time": "1 day, 6:47:48", "remaining_time": "11:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13012, "total_steps": 17941, "loss": 1.5901, "learning_rate": 1.807065702177867e-05, "epoch": 0.725266150158854, "percentage": 72.53, "elapsed_time": "1 day, 6:47:57", "remaining_time": "11:40:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13013, "total_steps": 17941, "loss": 1.7264, "learning_rate": 1.8063805275268437e-05, "epoch": 0.7253218884120172, "percentage": 72.53, "elapsed_time": "1 day, 6:48:05", "remaining_time": "11:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13014, "total_steps": 17941, "loss": 1.559, "learning_rate": 1.8056954541588063e-05, "epoch": 0.7253776266651804, "percentage": 72.54, "elapsed_time": "1 day, 6:48:14", "remaining_time": "11:39:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13015, "total_steps": 17941, "loss": 1.857, "learning_rate": 1.8050104820954883e-05, "epoch": 0.7254333649183434, "percentage": 72.54, "elapsed_time": "1 day, 6:48:23", "remaining_time": "11:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13016, "total_steps": 17941, "loss": 1.9097, "learning_rate": 1.8043256113586078e-05, "epoch": 0.7254891031715066, "percentage": 72.55, "elapsed_time": "1 day, 6:48:31", "remaining_time": "11:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13017, "total_steps": 17941, "loss": 1.6233, "learning_rate": 1.8036408419698873e-05, "epoch": 0.7255448414246698, "percentage": 72.55, "elapsed_time": "1 day, 6:48:39", "remaining_time": "11:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13018, "total_steps": 17941, "loss": 1.7397, "learning_rate": 1.802956173951043e-05, "epoch": 0.7256005796778329, "percentage": 72.56, "elapsed_time": "1 day, 6:48:48", "remaining_time": "11:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13019, "total_steps": 17941, "loss": 1.5947, "learning_rate": 1.8022716073237887e-05, "epoch": 0.725656317930996, "percentage": 72.57, "elapsed_time": "1 day, 6:48:56", "remaining_time": "11:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13020, "total_steps": 17941, "loss": 1.4622, "learning_rate": 1.8015871421098373e-05, "epoch": 0.7257120561841592, "percentage": 72.57, "elapsed_time": "1 day, 6:49:05", "remaining_time": "11:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13021, "total_steps": 17941, "loss": 1.7291, "learning_rate": 1.8009027783308914e-05, "epoch": 0.7257677944373223, "percentage": 72.58, "elapsed_time": "1 day, 6:49:13", "remaining_time": "11:38:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13022, "total_steps": 17941, "loss": 1.5213, "learning_rate": 1.8002185160086575e-05, "epoch": 0.7258235326904855, "percentage": 72.58, "elapsed_time": "1 day, 6:49:22", "remaining_time": "11:38:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13023, "total_steps": 17941, "loss": 1.7677, "learning_rate": 1.7995343551648365e-05, "epoch": 0.7258792709436487, "percentage": 72.59, "elapsed_time": "1 day, 6:49:31", "remaining_time": "11:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13024, "total_steps": 17941, "loss": 1.4572, "learning_rate": 1.798850295821125e-05, "epoch": 0.7259350091968118, "percentage": 72.59, "elapsed_time": "1 day, 6:49:39", "remaining_time": "11:38:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13025, "total_steps": 17941, "loss": 1.6194, "learning_rate": 1.7981663379992187e-05, "epoch": 0.7259907474499749, "percentage": 72.6, "elapsed_time": "1 day, 6:49:48", "remaining_time": "11:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13026, "total_steps": 17941, "loss": 1.5044, "learning_rate": 1.797482481720808e-05, "epoch": 0.726046485703138, "percentage": 72.6, "elapsed_time": "1 day, 6:49:57", "remaining_time": "11:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13027, "total_steps": 17941, "loss": 1.5585, "learning_rate": 1.796798727007583e-05, "epoch": 0.7261022239563012, "percentage": 72.61, "elapsed_time": "1 day, 6:50:06", "remaining_time": "11:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13028, "total_steps": 17941, "loss": 1.6835, "learning_rate": 1.7961150738812244e-05, "epoch": 0.7261579622094644, "percentage": 72.62, "elapsed_time": "1 day, 6:50:14", "remaining_time": "11:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13029, "total_steps": 17941, "loss": 1.7269, "learning_rate": 1.7954315223634143e-05, "epoch": 0.7262137004626275, "percentage": 72.62, "elapsed_time": "1 day, 6:50:23", "remaining_time": "11:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13030, "total_steps": 17941, "loss": 1.6663, "learning_rate": 1.794748072475836e-05, "epoch": 0.7262694387157906, "percentage": 72.63, "elapsed_time": "1 day, 6:50:31", "remaining_time": "11:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13031, "total_steps": 17941, "loss": 1.7742, "learning_rate": 1.7940647242401586e-05, "epoch": 0.7263251769689538, "percentage": 72.63, "elapsed_time": "1 day, 6:50:40", "remaining_time": "11:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13032, "total_steps": 17941, "loss": 1.7405, "learning_rate": 1.7933814776780583e-05, "epoch": 0.7263809152221169, "percentage": 72.64, "elapsed_time": "1 day, 6:50:48", "remaining_time": "11:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13033, "total_steps": 17941, "loss": 1.6648, "learning_rate": 1.7926983328111978e-05, "epoch": 0.7264366534752801, "percentage": 72.64, "elapsed_time": "1 day, 6:50:57", "remaining_time": "11:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13034, "total_steps": 17941, "loss": 1.6446, "learning_rate": 1.7920152896612503e-05, "epoch": 0.7264923917284433, "percentage": 72.65, "elapsed_time": "1 day, 6:51:05", "remaining_time": "11:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13035, "total_steps": 17941, "loss": 1.7264, "learning_rate": 1.7913323482498718e-05, "epoch": 0.7265481299816063, "percentage": 72.65, "elapsed_time": "1 day, 6:51:14", "remaining_time": "11:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13036, "total_steps": 17941, "loss": 1.5724, "learning_rate": 1.7906495085987236e-05, "epoch": 0.7266038682347695, "percentage": 72.66, "elapsed_time": "1 day, 6:51:22", "remaining_time": "11:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13037, "total_steps": 17941, "loss": 1.6304, "learning_rate": 1.789966770729461e-05, "epoch": 0.7266596064879327, "percentage": 72.67, "elapsed_time": "1 day, 6:51:30", "remaining_time": "11:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13038, "total_steps": 17941, "loss": 1.6261, "learning_rate": 1.789284134663737e-05, "epoch": 0.7267153447410958, "percentage": 72.67, "elapsed_time": "1 day, 6:51:39", "remaining_time": "11:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13039, "total_steps": 17941, "loss": 1.6302, "learning_rate": 1.788601600423202e-05, "epoch": 0.726771082994259, "percentage": 72.68, "elapsed_time": "1 day, 6:51:47", "remaining_time": "11:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13040, "total_steps": 17941, "loss": 1.5139, "learning_rate": 1.787919168029497e-05, "epoch": 0.7268268212474222, "percentage": 72.68, "elapsed_time": "1 day, 6:51:56", "remaining_time": "11:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13041, "total_steps": 17941, "loss": 1.5585, "learning_rate": 1.787236837504272e-05, "epoch": 0.7268825595005852, "percentage": 72.69, "elapsed_time": "1 day, 6:52:04", "remaining_time": "11:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13042, "total_steps": 17941, "loss": 1.5051, "learning_rate": 1.786554608869161e-05, "epoch": 0.7269382977537484, "percentage": 72.69, "elapsed_time": "1 day, 6:52:13", "remaining_time": "11:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13043, "total_steps": 17941, "loss": 1.8636, "learning_rate": 1.785872482145802e-05, "epoch": 0.7269940360069116, "percentage": 72.7, "elapsed_time": "1 day, 6:52:21", "remaining_time": "11:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13044, "total_steps": 17941, "loss": 1.5822, "learning_rate": 1.7851904573558276e-05, "epoch": 0.7270497742600747, "percentage": 72.7, "elapsed_time": "1 day, 6:52:30", "remaining_time": "11:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13045, "total_steps": 17941, "loss": 1.5041, "learning_rate": 1.784508534520869e-05, "epoch": 0.7271055125132379, "percentage": 72.71, "elapsed_time": "1 day, 6:52:38", "remaining_time": "11:35:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13046, "total_steps": 17941, "loss": 1.7019, "learning_rate": 1.7838267136625535e-05, "epoch": 0.727161250766401, "percentage": 72.72, "elapsed_time": "1 day, 6:52:46", "remaining_time": "11:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13047, "total_steps": 17941, "loss": 1.7343, "learning_rate": 1.7831449948025015e-05, "epoch": 0.7272169890195641, "percentage": 72.72, "elapsed_time": "1 day, 6:52:56", "remaining_time": "11:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13048, "total_steps": 17941, "loss": 1.9108, "learning_rate": 1.7824633779623347e-05, "epoch": 0.7272727272727273, "percentage": 72.73, "elapsed_time": "1 day, 6:53:05", "remaining_time": "11:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13049, "total_steps": 17941, "loss": 1.559, "learning_rate": 1.78178186316367e-05, "epoch": 0.7273284655258904, "percentage": 72.73, "elapsed_time": "1 day, 6:53:13", "remaining_time": "11:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13050, "total_steps": 17941, "loss": 1.8311, "learning_rate": 1.7811004504281208e-05, "epoch": 0.7273842037790536, "percentage": 72.74, "elapsed_time": "1 day, 6:53:22", "remaining_time": "11:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13051, "total_steps": 17941, "loss": 1.585, "learning_rate": 1.7804191397772984e-05, "epoch": 0.7274399420322167, "percentage": 72.74, "elapsed_time": "1 day, 6:53:30", "remaining_time": "11:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13052, "total_steps": 17941, "loss": 1.4848, "learning_rate": 1.7797379312328088e-05, "epoch": 0.7274956802853798, "percentage": 72.75, "elapsed_time": "1 day, 6:53:39", "remaining_time": "11:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13053, "total_steps": 17941, "loss": 1.5032, "learning_rate": 1.7790568248162586e-05, "epoch": 0.727551418538543, "percentage": 72.76, "elapsed_time": "1 day, 6:53:47", "remaining_time": "11:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13054, "total_steps": 17941, "loss": 1.728, "learning_rate": 1.7783758205492452e-05, "epoch": 0.7276071567917062, "percentage": 72.76, "elapsed_time": "1 day, 6:53:56", "remaining_time": "11:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13055, "total_steps": 17941, "loss": 1.4794, "learning_rate": 1.777694918453365e-05, "epoch": 0.7276628950448693, "percentage": 72.77, "elapsed_time": "1 day, 6:54:05", "remaining_time": "11:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13056, "total_steps": 17941, "loss": 1.5339, "learning_rate": 1.777014118550218e-05, "epoch": 0.7277186332980324, "percentage": 72.77, "elapsed_time": "1 day, 6:54:13", "remaining_time": "11:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13057, "total_steps": 17941, "loss": 1.8527, "learning_rate": 1.7763334208613908e-05, "epoch": 0.7277743715511956, "percentage": 72.78, "elapsed_time": "1 day, 6:54:23", "remaining_time": "11:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13058, "total_steps": 17941, "loss": 1.4837, "learning_rate": 1.775652825408472e-05, "epoch": 0.7278301098043587, "percentage": 72.78, "elapsed_time": "1 day, 6:54:32", "remaining_time": "11:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13059, "total_steps": 17941, "loss": 1.4804, "learning_rate": 1.7749723322130462e-05, "epoch": 0.7278858480575219, "percentage": 72.79, "elapsed_time": "1 day, 6:54:40", "remaining_time": "11:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13060, "total_steps": 17941, "loss": 1.8064, "learning_rate": 1.7742919412966964e-05, "epoch": 0.7279415863106851, "percentage": 72.79, "elapsed_time": "1 day, 6:54:49", "remaining_time": "11:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13061, "total_steps": 17941, "loss": 1.6725, "learning_rate": 1.7736116526809975e-05, "epoch": 0.7279973245638481, "percentage": 72.8, "elapsed_time": "1 day, 6:54:57", "remaining_time": "11:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13062, "total_steps": 17941, "loss": 1.4949, "learning_rate": 1.7729314663875257e-05, "epoch": 0.7280530628170113, "percentage": 72.81, "elapsed_time": "1 day, 6:55:06", "remaining_time": "11:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13063, "total_steps": 17941, "loss": 1.4885, "learning_rate": 1.7722513824378527e-05, "epoch": 0.7281088010701745, "percentage": 72.81, "elapsed_time": "1 day, 6:55:14", "remaining_time": "11:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13064, "total_steps": 17941, "loss": 1.653, "learning_rate": 1.7715714008535472e-05, "epoch": 0.7281645393233376, "percentage": 72.82, "elapsed_time": "1 day, 6:55:23", "remaining_time": "11:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13065, "total_steps": 17941, "loss": 1.6643, "learning_rate": 1.770891521656175e-05, "epoch": 0.7282202775765008, "percentage": 72.82, "elapsed_time": "1 day, 6:55:31", "remaining_time": "11:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13066, "total_steps": 17941, "loss": 1.8701, "learning_rate": 1.7702117448672933e-05, "epoch": 0.728276015829664, "percentage": 72.83, "elapsed_time": "1 day, 6:55:39", "remaining_time": "11:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13067, "total_steps": 17941, "loss": 1.8521, "learning_rate": 1.7695320705084677e-05, "epoch": 0.728331754082827, "percentage": 72.83, "elapsed_time": "1 day, 6:55:48", "remaining_time": "11:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13068, "total_steps": 17941, "loss": 1.67, "learning_rate": 1.7688524986012484e-05, "epoch": 0.7283874923359902, "percentage": 72.84, "elapsed_time": "1 day, 6:55:56", "remaining_time": "11:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13069, "total_steps": 17941, "loss": 1.6678, "learning_rate": 1.7681730291671888e-05, "epoch": 0.7284432305891534, "percentage": 72.84, "elapsed_time": "1 day, 6:56:05", "remaining_time": "11:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13070, "total_steps": 17941, "loss": 1.6773, "learning_rate": 1.7674936622278377e-05, "epoch": 0.7284989688423165, "percentage": 72.85, "elapsed_time": "1 day, 6:56:14", "remaining_time": "11:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13071, "total_steps": 17941, "loss": 1.6948, "learning_rate": 1.7668143978047408e-05, "epoch": 0.7285547070954796, "percentage": 72.86, "elapsed_time": "1 day, 6:56:22", "remaining_time": "11:31:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13072, "total_steps": 17941, "loss": 1.9477, "learning_rate": 1.7661352359194423e-05, "epoch": 0.7286104453486427, "percentage": 72.86, "elapsed_time": "1 day, 6:56:31", "remaining_time": "11:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13073, "total_steps": 17941, "loss": 1.1618, "learning_rate": 1.7654561765934772e-05, "epoch": 0.7286661836018059, "percentage": 72.87, "elapsed_time": "1 day, 6:56:39", "remaining_time": "11:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13074, "total_steps": 17941, "loss": 1.5494, "learning_rate": 1.7647772198483842e-05, "epoch": 0.7287219218549691, "percentage": 72.87, "elapsed_time": "1 day, 6:56:48", "remaining_time": "11:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13075, "total_steps": 17941, "loss": 1.6923, "learning_rate": 1.7640983657056948e-05, "epoch": 0.7287776601081322, "percentage": 72.88, "elapsed_time": "1 day, 6:56:56", "remaining_time": "11:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13076, "total_steps": 17941, "loss": 1.6827, "learning_rate": 1.7634196141869386e-05, "epoch": 0.7288333983612953, "percentage": 72.88, "elapsed_time": "1 day, 6:57:05", "remaining_time": "11:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13077, "total_steps": 17941, "loss": 1.7496, "learning_rate": 1.7627409653136417e-05, "epoch": 0.7288891366144585, "percentage": 72.89, "elapsed_time": "1 day, 6:57:13", "remaining_time": "11:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13078, "total_steps": 17941, "loss": 1.5867, "learning_rate": 1.7620624191073266e-05, "epoch": 0.7289448748676216, "percentage": 72.89, "elapsed_time": "1 day, 6:57:21", "remaining_time": "11:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13079, "total_steps": 17941, "loss": 1.8191, "learning_rate": 1.761383975589515e-05, "epoch": 0.7290006131207848, "percentage": 72.9, "elapsed_time": "1 day, 6:57:30", "remaining_time": "11:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13080, "total_steps": 17941, "loss": 1.8822, "learning_rate": 1.7607056347817196e-05, "epoch": 0.729056351373948, "percentage": 72.91, "elapsed_time": "1 day, 6:57:38", "remaining_time": "11:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13081, "total_steps": 17941, "loss": 1.7475, "learning_rate": 1.7600273967054535e-05, "epoch": 0.729112089627111, "percentage": 72.91, "elapsed_time": "1 day, 6:57:47", "remaining_time": "11:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13082, "total_steps": 17941, "loss": 1.6764, "learning_rate": 1.759349261382231e-05, "epoch": 0.7291678278802742, "percentage": 72.92, "elapsed_time": "1 day, 6:57:55", "remaining_time": "11:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13083, "total_steps": 17941, "loss": 1.6163, "learning_rate": 1.7586712288335543e-05, "epoch": 0.7292235661334374, "percentage": 72.92, "elapsed_time": "1 day, 6:58:04", "remaining_time": "11:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13084, "total_steps": 17941, "loss": 1.5605, "learning_rate": 1.7579932990809277e-05, "epoch": 0.7292793043866005, "percentage": 72.93, "elapsed_time": "1 day, 6:58:12", "remaining_time": "11:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13085, "total_steps": 17941, "loss": 1.458, "learning_rate": 1.7573154721458518e-05, "epoch": 0.7293350426397637, "percentage": 72.93, "elapsed_time": "1 day, 6:58:21", "remaining_time": "11:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13086, "total_steps": 17941, "loss": 1.5316, "learning_rate": 1.7566377480498246e-05, "epoch": 0.7293907808929269, "percentage": 72.94, "elapsed_time": "1 day, 6:58:29", "remaining_time": "11:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13087, "total_steps": 17941, "loss": 1.3185, "learning_rate": 1.755960126814336e-05, "epoch": 0.7294465191460899, "percentage": 72.94, "elapsed_time": "1 day, 6:58:38", "remaining_time": "11:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13088, "total_steps": 17941, "loss": 1.59, "learning_rate": 1.755282608460878e-05, "epoch": 0.7295022573992531, "percentage": 72.95, "elapsed_time": "1 day, 6:58:46", "remaining_time": "11:29:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13089, "total_steps": 17941, "loss": 1.7575, "learning_rate": 1.754605193010938e-05, "epoch": 0.7295579956524163, "percentage": 72.96, "elapsed_time": "1 day, 6:58:54", "remaining_time": "11:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13090, "total_steps": 17941, "loss": 1.988, "learning_rate": 1.7539278804859993e-05, "epoch": 0.7296137339055794, "percentage": 72.96, "elapsed_time": "1 day, 6:59:03", "remaining_time": "11:28:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13091, "total_steps": 17941, "loss": 1.6315, "learning_rate": 1.7532506709075436e-05, "epoch": 0.7296694721587426, "percentage": 72.97, "elapsed_time": "1 day, 6:59:11", "remaining_time": "11:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13092, "total_steps": 17941, "loss": 1.8533, "learning_rate": 1.7525735642970438e-05, "epoch": 0.7297252104119057, "percentage": 72.97, "elapsed_time": "1 day, 6:59:20", "remaining_time": "11:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13093, "total_steps": 17941, "loss": 1.7435, "learning_rate": 1.7518965606759797e-05, "epoch": 0.7297809486650688, "percentage": 72.98, "elapsed_time": "1 day, 6:59:29", "remaining_time": "11:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13094, "total_steps": 17941, "loss": 1.6991, "learning_rate": 1.7512196600658175e-05, "epoch": 0.729836686918232, "percentage": 72.98, "elapsed_time": "1 day, 6:59:37", "remaining_time": "11:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13095, "total_steps": 17941, "loss": 1.6129, "learning_rate": 1.750542862488026e-05, "epoch": 0.7298924251713951, "percentage": 72.99, "elapsed_time": "1 day, 6:59:46", "remaining_time": "11:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13096, "total_steps": 17941, "loss": 1.555, "learning_rate": 1.7498661679640693e-05, "epoch": 0.7299481634245583, "percentage": 72.99, "elapsed_time": "1 day, 6:59:55", "remaining_time": "11:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13097, "total_steps": 17941, "loss": 1.5851, "learning_rate": 1.749189576515408e-05, "epoch": 0.7300039016777214, "percentage": 73.0, "elapsed_time": "1 day, 7:00:03", "remaining_time": "11:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13098, "total_steps": 17941, "loss": 1.6828, "learning_rate": 1.7485130881635014e-05, "epoch": 0.7300596399308845, "percentage": 73.01, "elapsed_time": "1 day, 7:00:12", "remaining_time": "11:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13099, "total_steps": 17941, "loss": 1.5023, "learning_rate": 1.747836702929801e-05, "epoch": 0.7301153781840477, "percentage": 73.01, "elapsed_time": "1 day, 7:00:20", "remaining_time": "11:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13100, "total_steps": 17941, "loss": 1.7822, "learning_rate": 1.7471604208357584e-05, "epoch": 0.7301711164372109, "percentage": 73.02, "elapsed_time": "1 day, 7:00:29", "remaining_time": "11:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13101, "total_steps": 17941, "loss": 1.5506, "learning_rate": 1.746484241902822e-05, "epoch": 0.730226854690374, "percentage": 73.02, "elapsed_time": "1 day, 7:00:37", "remaining_time": "11:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13102, "total_steps": 17941, "loss": 1.7494, "learning_rate": 1.7458081661524363e-05, "epoch": 0.7302825929435371, "percentage": 73.03, "elapsed_time": "1 day, 7:00:46", "remaining_time": "11:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13103, "total_steps": 17941, "loss": 1.6126, "learning_rate": 1.745132193606042e-05, "epoch": 0.7303383311967003, "percentage": 73.03, "elapsed_time": "1 day, 7:00:54", "remaining_time": "11:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13104, "total_steps": 17941, "loss": 1.6587, "learning_rate": 1.7444563242850774e-05, "epoch": 0.7303940694498634, "percentage": 73.04, "elapsed_time": "1 day, 7:01:03", "remaining_time": "11:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13105, "total_steps": 17941, "loss": 1.7012, "learning_rate": 1.743780558210979e-05, "epoch": 0.7304498077030266, "percentage": 73.04, "elapsed_time": "1 day, 7:01:11", "remaining_time": "11:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13106, "total_steps": 17941, "loss": 1.6279, "learning_rate": 1.743104895405175e-05, "epoch": 0.7305055459561898, "percentage": 73.05, "elapsed_time": "1 day, 7:01:20", "remaining_time": "11:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13107, "total_steps": 17941, "loss": 1.6917, "learning_rate": 1.742429335889092e-05, "epoch": 0.7305612842093528, "percentage": 73.06, "elapsed_time": "1 day, 7:01:29", "remaining_time": "11:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13108, "total_steps": 17941, "loss": 1.5668, "learning_rate": 1.7417538796841615e-05, "epoch": 0.730617022462516, "percentage": 73.06, "elapsed_time": "1 day, 7:01:37", "remaining_time": "11:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13109, "total_steps": 17941, "loss": 1.3751, "learning_rate": 1.741078526811799e-05, "epoch": 0.7306727607156792, "percentage": 73.07, "elapsed_time": "1 day, 7:01:46", "remaining_time": "11:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13110, "total_steps": 17941, "loss": 1.5854, "learning_rate": 1.7404032772934246e-05, "epoch": 0.7307284989688423, "percentage": 73.07, "elapsed_time": "1 day, 7:01:54", "remaining_time": "11:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13111, "total_steps": 17941, "loss": 1.646, "learning_rate": 1.7397281311504544e-05, "epoch": 0.7307842372220055, "percentage": 73.08, "elapsed_time": "1 day, 7:02:02", "remaining_time": "11:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13112, "total_steps": 17941, "loss": 1.796, "learning_rate": 1.7390530884043e-05, "epoch": 0.7308399754751687, "percentage": 73.08, "elapsed_time": "1 day, 7:02:12", "remaining_time": "11:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13113, "total_steps": 17941, "loss": 1.5496, "learning_rate": 1.738378149076368e-05, "epoch": 0.7308957137283317, "percentage": 73.09, "elapsed_time": "1 day, 7:02:20", "remaining_time": "11:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13114, "total_steps": 17941, "loss": 1.5582, "learning_rate": 1.7377033131880638e-05, "epoch": 0.7309514519814949, "percentage": 73.1, "elapsed_time": "1 day, 7:02:29", "remaining_time": "11:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13115, "total_steps": 17941, "loss": 1.5616, "learning_rate": 1.7370285807607905e-05, "epoch": 0.7310071902346581, "percentage": 73.1, "elapsed_time": "1 day, 7:02:37", "remaining_time": "11:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13116, "total_steps": 17941, "loss": 1.6777, "learning_rate": 1.736353951815946e-05, "epoch": 0.7310629284878212, "percentage": 73.11, "elapsed_time": "1 day, 7:02:46", "remaining_time": "11:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13117, "total_steps": 17941, "loss": 1.5789, "learning_rate": 1.7356794263749275e-05, "epoch": 0.7311186667409844, "percentage": 73.11, "elapsed_time": "1 day, 7:02:54", "remaining_time": "11:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13118, "total_steps": 17941, "loss": 1.4678, "learning_rate": 1.735005004459122e-05, "epoch": 0.7311744049941474, "percentage": 73.12, "elapsed_time": "1 day, 7:03:02", "remaining_time": "11:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13119, "total_steps": 17941, "loss": 1.6012, "learning_rate": 1.7343306860899243e-05, "epoch": 0.7312301432473106, "percentage": 73.12, "elapsed_time": "1 day, 7:03:11", "remaining_time": "11:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13120, "total_steps": 17941, "loss": 1.3831, "learning_rate": 1.733656471288716e-05, "epoch": 0.7312858815004738, "percentage": 73.13, "elapsed_time": "1 day, 7:03:19", "remaining_time": "11:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13121, "total_steps": 17941, "loss": 1.5432, "learning_rate": 1.73298236007688e-05, "epoch": 0.7313416197536369, "percentage": 73.13, "elapsed_time": "1 day, 7:03:28", "remaining_time": "11:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13122, "total_steps": 17941, "loss": 1.6044, "learning_rate": 1.732308352475796e-05, "epoch": 0.7313973580068001, "percentage": 73.14, "elapsed_time": "1 day, 7:03:36", "remaining_time": "11:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13123, "total_steps": 17941, "loss": 1.4039, "learning_rate": 1.7316344485068392e-05, "epoch": 0.7314530962599632, "percentage": 73.15, "elapsed_time": "1 day, 7:03:45", "remaining_time": "11:24:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13124, "total_steps": 17941, "loss": 1.6396, "learning_rate": 1.7309606481913826e-05, "epoch": 0.7315088345131263, "percentage": 73.15, "elapsed_time": "1 day, 7:03:53", "remaining_time": "11:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13125, "total_steps": 17941, "loss": 1.7854, "learning_rate": 1.730286951550792e-05, "epoch": 0.7315645727662895, "percentage": 73.16, "elapsed_time": "1 day, 7:04:02", "remaining_time": "11:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13126, "total_steps": 17941, "loss": 1.8116, "learning_rate": 1.7296133586064382e-05, "epoch": 0.7316203110194527, "percentage": 73.16, "elapsed_time": "1 day, 7:04:10", "remaining_time": "11:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13127, "total_steps": 17941, "loss": 1.8243, "learning_rate": 1.7289398693796795e-05, "epoch": 0.7316760492726158, "percentage": 73.17, "elapsed_time": "1 day, 7:04:19", "remaining_time": "11:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13128, "total_steps": 17941, "loss": 1.4941, "learning_rate": 1.7282664838918766e-05, "epoch": 0.7317317875257789, "percentage": 73.17, "elapsed_time": "1 day, 7:04:27", "remaining_time": "11:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13129, "total_steps": 17941, "loss": 1.4587, "learning_rate": 1.7275932021643853e-05, "epoch": 0.7317875257789421, "percentage": 73.18, "elapsed_time": "1 day, 7:04:35", "remaining_time": "11:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13130, "total_steps": 17941, "loss": 1.7593, "learning_rate": 1.726920024218558e-05, "epoch": 0.7318432640321052, "percentage": 73.18, "elapsed_time": "1 day, 7:04:44", "remaining_time": "11:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13131, "total_steps": 17941, "loss": 1.7246, "learning_rate": 1.726246950075746e-05, "epoch": 0.7318990022852684, "percentage": 73.19, "elapsed_time": "1 day, 7:04:52", "remaining_time": "11:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13132, "total_steps": 17941, "loss": 1.4019, "learning_rate": 1.7255739797572916e-05, "epoch": 0.7319547405384316, "percentage": 73.2, "elapsed_time": "1 day, 7:05:01", "remaining_time": "11:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13133, "total_steps": 17941, "loss": 1.4506, "learning_rate": 1.72490111328454e-05, "epoch": 0.7320104787915946, "percentage": 73.2, "elapsed_time": "1 day, 7:05:09", "remaining_time": "11:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13134, "total_steps": 17941, "loss": 1.4996, "learning_rate": 1.7242283506788292e-05, "epoch": 0.7320662170447578, "percentage": 73.21, "elapsed_time": "1 day, 7:05:18", "remaining_time": "11:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13135, "total_steps": 17941, "loss": 1.8975, "learning_rate": 1.7235556919614964e-05, "epoch": 0.732121955297921, "percentage": 73.21, "elapsed_time": "1 day, 7:05:26", "remaining_time": "11:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13136, "total_steps": 17941, "loss": 1.7209, "learning_rate": 1.722883137153874e-05, "epoch": 0.7321776935510841, "percentage": 73.22, "elapsed_time": "1 day, 7:05:35", "remaining_time": "11:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13137, "total_steps": 17941, "loss": 1.3764, "learning_rate": 1.7222106862772912e-05, "epoch": 0.7322334318042473, "percentage": 73.22, "elapsed_time": "1 day, 7:05:43", "remaining_time": "11:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13138, "total_steps": 17941, "loss": 1.4915, "learning_rate": 1.7215383393530767e-05, "epoch": 0.7322891700574105, "percentage": 73.23, "elapsed_time": "1 day, 7:05:52", "remaining_time": "11:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13139, "total_steps": 17941, "loss": 1.6684, "learning_rate": 1.7208660964025498e-05, "epoch": 0.7323449083105735, "percentage": 73.23, "elapsed_time": "1 day, 7:06:00", "remaining_time": "11:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13140, "total_steps": 17941, "loss": 1.6384, "learning_rate": 1.720193957447031e-05, "epoch": 0.7324006465637367, "percentage": 73.24, "elapsed_time": "1 day, 7:06:09", "remaining_time": "11:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13141, "total_steps": 17941, "loss": 1.7146, "learning_rate": 1.719521922507838e-05, "epoch": 0.7324563848168998, "percentage": 73.25, "elapsed_time": "1 day, 7:06:17", "remaining_time": "11:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13142, "total_steps": 17941, "loss": 1.6765, "learning_rate": 1.7188499916062823e-05, "epoch": 0.732512123070063, "percentage": 73.25, "elapsed_time": "1 day, 7:06:26", "remaining_time": "11:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13143, "total_steps": 17941, "loss": 1.7715, "learning_rate": 1.718178164763677e-05, "epoch": 0.7325678613232262, "percentage": 73.26, "elapsed_time": "1 day, 7:06:34", "remaining_time": "11:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13144, "total_steps": 17941, "loss": 1.8965, "learning_rate": 1.717506442001322e-05, "epoch": 0.7326235995763892, "percentage": 73.26, "elapsed_time": "1 day, 7:06:43", "remaining_time": "11:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13145, "total_steps": 17941, "loss": 1.6592, "learning_rate": 1.716834823340528e-05, "epoch": 0.7326793378295524, "percentage": 73.27, "elapsed_time": "1 day, 7:06:51", "remaining_time": "11:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13146, "total_steps": 17941, "loss": 1.6016, "learning_rate": 1.7161633088025892e-05, "epoch": 0.7327350760827156, "percentage": 73.27, "elapsed_time": "1 day, 7:07:00", "remaining_time": "11:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13147, "total_steps": 17941, "loss": 1.5946, "learning_rate": 1.715491898408804e-05, "epoch": 0.7327908143358787, "percentage": 73.28, "elapsed_time": "1 day, 7:07:08", "remaining_time": "11:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13148, "total_steps": 17941, "loss": 1.5196, "learning_rate": 1.7148205921804665e-05, "epoch": 0.7328465525890419, "percentage": 73.28, "elapsed_time": "1 day, 7:07:17", "remaining_time": "11:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13149, "total_steps": 17941, "loss": 1.5667, "learning_rate": 1.7141493901388657e-05, "epoch": 0.732902290842205, "percentage": 73.29, "elapsed_time": "1 day, 7:07:25", "remaining_time": "11:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13150, "total_steps": 17941, "loss": 1.3212, "learning_rate": 1.71347829230529e-05, "epoch": 0.7329580290953681, "percentage": 73.3, "elapsed_time": "1 day, 7:07:34", "remaining_time": "11:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13151, "total_steps": 17941, "loss": 1.8084, "learning_rate": 1.7128072987010173e-05, "epoch": 0.7330137673485313, "percentage": 73.3, "elapsed_time": "1 day, 7:07:43", "remaining_time": "11:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13152, "total_steps": 17941, "loss": 1.9594, "learning_rate": 1.7121364093473352e-05, "epoch": 0.7330695056016945, "percentage": 73.31, "elapsed_time": "1 day, 7:07:51", "remaining_time": "11:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13153, "total_steps": 17941, "loss": 1.6426, "learning_rate": 1.7114656242655153e-05, "epoch": 0.7331252438548576, "percentage": 73.31, "elapsed_time": "1 day, 7:07:59", "remaining_time": "11:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13154, "total_steps": 17941, "loss": 1.4455, "learning_rate": 1.7107949434768317e-05, "epoch": 0.7331809821080207, "percentage": 73.32, "elapsed_time": "1 day, 7:08:08", "remaining_time": "11:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13155, "total_steps": 17941, "loss": 1.5018, "learning_rate": 1.710124367002555e-05, "epoch": 0.7332367203611839, "percentage": 73.32, "elapsed_time": "1 day, 7:08:16", "remaining_time": "11:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13156, "total_steps": 17941, "loss": 1.6713, "learning_rate": 1.7094538948639527e-05, "epoch": 0.733292458614347, "percentage": 73.33, "elapsed_time": "1 day, 7:08:25", "remaining_time": "11:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13157, "total_steps": 17941, "loss": 1.6141, "learning_rate": 1.7087835270822893e-05, "epoch": 0.7333481968675102, "percentage": 73.33, "elapsed_time": "1 day, 7:08:33", "remaining_time": "11:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13158, "total_steps": 17941, "loss": 1.7676, "learning_rate": 1.708113263678821e-05, "epoch": 0.7334039351206734, "percentage": 73.34, "elapsed_time": "1 day, 7:08:42", "remaining_time": "11:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13159, "total_steps": 17941, "loss": 1.5305, "learning_rate": 1.7074431046748075e-05, "epoch": 0.7334596733738364, "percentage": 73.35, "elapsed_time": "1 day, 7:08:50", "remaining_time": "11:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13160, "total_steps": 17941, "loss": 1.5329, "learning_rate": 1.7067730500915015e-05, "epoch": 0.7335154116269996, "percentage": 73.35, "elapsed_time": "1 day, 7:08:58", "remaining_time": "11:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13161, "total_steps": 17941, "loss": 1.8066, "learning_rate": 1.7061030999501538e-05, "epoch": 0.7335711498801628, "percentage": 73.36, "elapsed_time": "1 day, 7:09:07", "remaining_time": "11:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13162, "total_steps": 17941, "loss": 1.6414, "learning_rate": 1.705433254272011e-05, "epoch": 0.7336268881333259, "percentage": 73.36, "elapsed_time": "1 day, 7:09:15", "remaining_time": "11:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13163, "total_steps": 17941, "loss": 1.6874, "learning_rate": 1.7047635130783163e-05, "epoch": 0.7336826263864891, "percentage": 73.37, "elapsed_time": "1 day, 7:09:24", "remaining_time": "11:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13164, "total_steps": 17941, "loss": 1.8305, "learning_rate": 1.704093876390312e-05, "epoch": 0.7337383646396521, "percentage": 73.37, "elapsed_time": "1 day, 7:09:32", "remaining_time": "11:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13165, "total_steps": 17941, "loss": 1.5281, "learning_rate": 1.7034243442292326e-05, "epoch": 0.7337941028928153, "percentage": 73.38, "elapsed_time": "1 day, 7:09:41", "remaining_time": "11:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13166, "total_steps": 17941, "loss": 1.4261, "learning_rate": 1.702754916616312e-05, "epoch": 0.7338498411459785, "percentage": 73.38, "elapsed_time": "1 day, 7:09:49", "remaining_time": "11:18:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13167, "total_steps": 17941, "loss": 1.4768, "learning_rate": 1.702085593572781e-05, "epoch": 0.7339055793991416, "percentage": 73.39, "elapsed_time": "1 day, 7:09:58", "remaining_time": "11:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13168, "total_steps": 17941, "loss": 1.8325, "learning_rate": 1.701416375119867e-05, "epoch": 0.7339613176523048, "percentage": 73.4, "elapsed_time": "1 day, 7:10:06", "remaining_time": "11:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13169, "total_steps": 17941, "loss": 1.8015, "learning_rate": 1.7007472612787957e-05, "epoch": 0.734017055905468, "percentage": 73.4, "elapsed_time": "1 day, 7:10:15", "remaining_time": "11:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13170, "total_steps": 17941, "loss": 1.5654, "learning_rate": 1.7000782520707815e-05, "epoch": 0.734072794158631, "percentage": 73.41, "elapsed_time": "1 day, 7:10:23", "remaining_time": "11:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13171, "total_steps": 17941, "loss": 1.5492, "learning_rate": 1.6994093475170485e-05, "epoch": 0.7341285324117942, "percentage": 73.41, "elapsed_time": "1 day, 7:10:31", "remaining_time": "11:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13172, "total_steps": 17941, "loss": 1.753, "learning_rate": 1.6987405476388056e-05, "epoch": 0.7341842706649574, "percentage": 73.42, "elapsed_time": "1 day, 7:10:40", "remaining_time": "11:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13173, "total_steps": 17941, "loss": 1.68, "learning_rate": 1.6980718524572648e-05, "epoch": 0.7342400089181205, "percentage": 73.42, "elapsed_time": "1 day, 7:10:48", "remaining_time": "11:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13174, "total_steps": 17941, "loss": 1.6085, "learning_rate": 1.6974032619936338e-05, "epoch": 0.7342957471712837, "percentage": 73.43, "elapsed_time": "1 day, 7:10:57", "remaining_time": "11:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13175, "total_steps": 17941, "loss": 1.6717, "learning_rate": 1.6967347762691154e-05, "epoch": 0.7343514854244468, "percentage": 73.44, "elapsed_time": "1 day, 7:11:05", "remaining_time": "11:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13176, "total_steps": 17941, "loss": 1.5811, "learning_rate": 1.6960663953049123e-05, "epoch": 0.7344072236776099, "percentage": 73.44, "elapsed_time": "1 day, 7:11:15", "remaining_time": "11:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13177, "total_steps": 17941, "loss": 1.6795, "learning_rate": 1.6953981191222162e-05, "epoch": 0.7344629619307731, "percentage": 73.45, "elapsed_time": "1 day, 7:11:23", "remaining_time": "11:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13178, "total_steps": 17941, "loss": 1.7929, "learning_rate": 1.6947299477422284e-05, "epoch": 0.7345187001839363, "percentage": 73.45, "elapsed_time": "1 day, 7:11:31", "remaining_time": "11:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13179, "total_steps": 17941, "loss": 1.6411, "learning_rate": 1.6940618811861335e-05, "epoch": 0.7345744384370994, "percentage": 73.46, "elapsed_time": "1 day, 7:11:40", "remaining_time": "11:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13180, "total_steps": 17941, "loss": 1.5319, "learning_rate": 1.6933939194751215e-05, "epoch": 0.7346301766902625, "percentage": 73.46, "elapsed_time": "1 day, 7:11:49", "remaining_time": "11:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13181, "total_steps": 17941, "loss": 1.5279, "learning_rate": 1.6927260626303748e-05, "epoch": 0.7346859149434257, "percentage": 73.47, "elapsed_time": "1 day, 7:11:57", "remaining_time": "11:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13182, "total_steps": 17941, "loss": 1.8239, "learning_rate": 1.6920583106730748e-05, "epoch": 0.7347416531965888, "percentage": 73.47, "elapsed_time": "1 day, 7:12:06", "remaining_time": "11:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13183, "total_steps": 17941, "loss": 1.7993, "learning_rate": 1.6913906636244005e-05, "epoch": 0.734797391449752, "percentage": 73.48, "elapsed_time": "1 day, 7:12:14", "remaining_time": "11:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13184, "total_steps": 17941, "loss": 1.5527, "learning_rate": 1.690723121505522e-05, "epoch": 0.7348531297029152, "percentage": 73.49, "elapsed_time": "1 day, 7:12:23", "remaining_time": "11:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13185, "total_steps": 17941, "loss": 1.6684, "learning_rate": 1.6900556843376115e-05, "epoch": 0.7349088679560782, "percentage": 73.49, "elapsed_time": "1 day, 7:12:31", "remaining_time": "11:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13186, "total_steps": 17941, "loss": 1.5172, "learning_rate": 1.6893883521418362e-05, "epoch": 0.7349646062092414, "percentage": 73.5, "elapsed_time": "1 day, 7:12:40", "remaining_time": "11:15:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13187, "total_steps": 17941, "loss": 1.6473, "learning_rate": 1.6887211249393608e-05, "epoch": 0.7350203444624045, "percentage": 73.5, "elapsed_time": "1 day, 7:12:48", "remaining_time": "11:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13188, "total_steps": 17941, "loss": 1.8738, "learning_rate": 1.6880540027513448e-05, "epoch": 0.7350760827155677, "percentage": 73.51, "elapsed_time": "1 day, 7:12:57", "remaining_time": "11:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13189, "total_steps": 17941, "loss": 1.8411, "learning_rate": 1.687386985598946e-05, "epoch": 0.7351318209687309, "percentage": 73.51, "elapsed_time": "1 day, 7:13:05", "remaining_time": "11:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13190, "total_steps": 17941, "loss": 1.5319, "learning_rate": 1.6867200735033196e-05, "epoch": 0.7351875592218939, "percentage": 73.52, "elapsed_time": "1 day, 7:13:14", "remaining_time": "11:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13191, "total_steps": 17941, "loss": 1.5069, "learning_rate": 1.6860532664856133e-05, "epoch": 0.7352432974750571, "percentage": 73.52, "elapsed_time": "1 day, 7:13:22", "remaining_time": "11:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13192, "total_steps": 17941, "loss": 1.6411, "learning_rate": 1.6853865645669752e-05, "epoch": 0.7352990357282203, "percentage": 73.53, "elapsed_time": "1 day, 7:13:31", "remaining_time": "11:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13193, "total_steps": 17941, "loss": 1.6466, "learning_rate": 1.6847199677685505e-05, "epoch": 0.7353547739813834, "percentage": 73.54, "elapsed_time": "1 day, 7:13:40", "remaining_time": "11:14:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13194, "total_steps": 17941, "loss": 1.4866, "learning_rate": 1.6840534761114786e-05, "epoch": 0.7354105122345466, "percentage": 73.54, "elapsed_time": "1 day, 7:13:48", "remaining_time": "11:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13195, "total_steps": 17941, "loss": 1.903, "learning_rate": 1.683387089616899e-05, "epoch": 0.7354662504877097, "percentage": 73.55, "elapsed_time": "1 day, 7:13:57", "remaining_time": "11:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13196, "total_steps": 17941, "loss": 1.8349, "learning_rate": 1.68272080830594e-05, "epoch": 0.7355219887408728, "percentage": 73.55, "elapsed_time": "1 day, 7:14:05", "remaining_time": "11:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13197, "total_steps": 17941, "loss": 1.7329, "learning_rate": 1.6820546321997395e-05, "epoch": 0.735577726994036, "percentage": 73.56, "elapsed_time": "1 day, 7:14:14", "remaining_time": "11:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13198, "total_steps": 17941, "loss": 1.6086, "learning_rate": 1.6813885613194195e-05, "epoch": 0.7356334652471992, "percentage": 73.56, "elapsed_time": "1 day, 7:14:22", "remaining_time": "11:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13199, "total_steps": 17941, "loss": 1.5956, "learning_rate": 1.6807225956861054e-05, "epoch": 0.7356892035003623, "percentage": 73.57, "elapsed_time": "1 day, 7:14:31", "remaining_time": "11:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13200, "total_steps": 17941, "loss": 1.5, "learning_rate": 1.6800567353209178e-05, "epoch": 0.7357449417535254, "percentage": 73.57, "elapsed_time": "1 day, 7:14:39", "remaining_time": "11:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13201, "total_steps": 17941, "loss": 1.764, "learning_rate": 1.6793909802449737e-05, "epoch": 0.7358006800066886, "percentage": 73.58, "elapsed_time": "1 day, 7:14:48", "remaining_time": "11:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13202, "total_steps": 17941, "loss": 1.5798, "learning_rate": 1.6787253304793892e-05, "epoch": 0.7358564182598517, "percentage": 73.59, "elapsed_time": "1 day, 7:14:56", "remaining_time": "11:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13203, "total_steps": 17941, "loss": 1.7875, "learning_rate": 1.6780597860452695e-05, "epoch": 0.7359121565130149, "percentage": 73.59, "elapsed_time": "1 day, 7:15:05", "remaining_time": "11:12:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13204, "total_steps": 17941, "loss": 1.7364, "learning_rate": 1.6773943469637282e-05, "epoch": 0.7359678947661781, "percentage": 73.6, "elapsed_time": "1 day, 7:15:13", "remaining_time": "11:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13205, "total_steps": 17941, "loss": 1.5179, "learning_rate": 1.676729013255865e-05, "epoch": 0.7360236330193412, "percentage": 73.6, "elapsed_time": "1 day, 7:15:22", "remaining_time": "11:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13206, "total_steps": 17941, "loss": 1.6597, "learning_rate": 1.6760637849427812e-05, "epoch": 0.7360793712725043, "percentage": 73.61, "elapsed_time": "1 day, 7:15:30", "remaining_time": "11:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13207, "total_steps": 17941, "loss": 1.7935, "learning_rate": 1.675398662045574e-05, "epoch": 0.7361351095256675, "percentage": 73.61, "elapsed_time": "1 day, 7:15:38", "remaining_time": "11:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13208, "total_steps": 17941, "loss": 1.5229, "learning_rate": 1.6747336445853373e-05, "epoch": 0.7361908477788306, "percentage": 73.62, "elapsed_time": "1 day, 7:15:47", "remaining_time": "11:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13209, "total_steps": 17941, "loss": 1.4077, "learning_rate": 1.6740687325831638e-05, "epoch": 0.7362465860319938, "percentage": 73.62, "elapsed_time": "1 day, 7:15:55", "remaining_time": "11:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13210, "total_steps": 17941, "loss": 1.641, "learning_rate": 1.673403926060137e-05, "epoch": 0.7363023242851569, "percentage": 73.63, "elapsed_time": "1 day, 7:16:04", "remaining_time": "11:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13211, "total_steps": 17941, "loss": 1.3975, "learning_rate": 1.672739225037342e-05, "epoch": 0.73635806253832, "percentage": 73.64, "elapsed_time": "1 day, 7:16:13", "remaining_time": "11:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13212, "total_steps": 17941, "loss": 1.8485, "learning_rate": 1.6720746295358596e-05, "epoch": 0.7364138007914832, "percentage": 73.64, "elapsed_time": "1 day, 7:16:21", "remaining_time": "11:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13213, "total_steps": 17941, "loss": 1.7343, "learning_rate": 1.6714101395767673e-05, "epoch": 0.7364695390446463, "percentage": 73.65, "elapsed_time": "1 day, 7:16:30", "remaining_time": "11:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13214, "total_steps": 17941, "loss": 1.5785, "learning_rate": 1.670745755181138e-05, "epoch": 0.7365252772978095, "percentage": 73.65, "elapsed_time": "1 day, 7:16:38", "remaining_time": "11:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13215, "total_steps": 17941, "loss": 1.7871, "learning_rate": 1.670081476370042e-05, "epoch": 0.7365810155509727, "percentage": 73.66, "elapsed_time": "1 day, 7:16:47", "remaining_time": "11:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13216, "total_steps": 17941, "loss": 1.707, "learning_rate": 1.669417303164549e-05, "epoch": 0.7366367538041357, "percentage": 73.66, "elapsed_time": "1 day, 7:16:55", "remaining_time": "11:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13217, "total_steps": 17941, "loss": 1.5654, "learning_rate": 1.6687532355857183e-05, "epoch": 0.7366924920572989, "percentage": 73.67, "elapsed_time": "1 day, 7:17:04", "remaining_time": "11:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13218, "total_steps": 17941, "loss": 1.7403, "learning_rate": 1.668089273654611e-05, "epoch": 0.7367482303104621, "percentage": 73.67, "elapsed_time": "1 day, 7:17:12", "remaining_time": "11:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13219, "total_steps": 17941, "loss": 1.8995, "learning_rate": 1.6674254173922893e-05, "epoch": 0.7368039685636252, "percentage": 73.68, "elapsed_time": "1 day, 7:17:21", "remaining_time": "11:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13220, "total_steps": 17941, "loss": 1.4678, "learning_rate": 1.666761666819801e-05, "epoch": 0.7368597068167884, "percentage": 73.69, "elapsed_time": "1 day, 7:17:29", "remaining_time": "11:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13221, "total_steps": 17941, "loss": 1.5932, "learning_rate": 1.6660980219582e-05, "epoch": 0.7369154450699515, "percentage": 73.69, "elapsed_time": "1 day, 7:17:37", "remaining_time": "11:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13222, "total_steps": 17941, "loss": 1.8013, "learning_rate": 1.665434482828529e-05, "epoch": 0.7369711833231146, "percentage": 73.7, "elapsed_time": "1 day, 7:17:46", "remaining_time": "11:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13223, "total_steps": 17941, "loss": 1.4329, "learning_rate": 1.664771049451837e-05, "epoch": 0.7370269215762778, "percentage": 73.7, "elapsed_time": "1 day, 7:17:54", "remaining_time": "11:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13224, "total_steps": 17941, "loss": 1.4933, "learning_rate": 1.6641077218491606e-05, "epoch": 0.737082659829441, "percentage": 73.71, "elapsed_time": "1 day, 7:18:03", "remaining_time": "11:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13225, "total_steps": 17941, "loss": 1.7321, "learning_rate": 1.6634445000415372e-05, "epoch": 0.7371383980826041, "percentage": 73.71, "elapsed_time": "1 day, 7:18:11", "remaining_time": "11:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13226, "total_steps": 17941, "loss": 1.5427, "learning_rate": 1.662781384050001e-05, "epoch": 0.7371941363357672, "percentage": 73.72, "elapsed_time": "1 day, 7:18:20", "remaining_time": "11:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13227, "total_steps": 17941, "loss": 1.6237, "learning_rate": 1.662118373895582e-05, "epoch": 0.7372498745889304, "percentage": 73.72, "elapsed_time": "1 day, 7:18:28", "remaining_time": "11:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13228, "total_steps": 17941, "loss": 1.7387, "learning_rate": 1.6614554695993084e-05, "epoch": 0.7373056128420935, "percentage": 73.73, "elapsed_time": "1 day, 7:18:37", "remaining_time": "11:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13229, "total_steps": 17941, "loss": 1.6295, "learning_rate": 1.660792671182199e-05, "epoch": 0.7373613510952567, "percentage": 73.74, "elapsed_time": "1 day, 7:18:45", "remaining_time": "11:09:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13230, "total_steps": 17941, "loss": 1.6571, "learning_rate": 1.6601299786652807e-05, "epoch": 0.7374170893484199, "percentage": 73.74, "elapsed_time": "1 day, 7:18:54", "remaining_time": "11:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13231, "total_steps": 17941, "loss": 1.7502, "learning_rate": 1.6594673920695647e-05, "epoch": 0.737472827601583, "percentage": 73.75, "elapsed_time": "1 day, 7:19:02", "remaining_time": "11:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13232, "total_steps": 17941, "loss": 1.7857, "learning_rate": 1.658804911416067e-05, "epoch": 0.7375285658547461, "percentage": 73.75, "elapsed_time": "1 day, 7:19:10", "remaining_time": "11:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13233, "total_steps": 17941, "loss": 1.5482, "learning_rate": 1.6581425367257963e-05, "epoch": 0.7375843041079092, "percentage": 73.76, "elapsed_time": "1 day, 7:19:19", "remaining_time": "11:08:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13234, "total_steps": 17941, "loss": 1.6569, "learning_rate": 1.65748026801976e-05, "epoch": 0.7376400423610724, "percentage": 73.76, "elapsed_time": "1 day, 7:19:27", "remaining_time": "11:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13235, "total_steps": 17941, "loss": 1.8769, "learning_rate": 1.656818105318963e-05, "epoch": 0.7376957806142356, "percentage": 73.77, "elapsed_time": "1 day, 7:19:36", "remaining_time": "11:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13236, "total_steps": 17941, "loss": 1.5192, "learning_rate": 1.6561560486444023e-05, "epoch": 0.7377515188673986, "percentage": 73.78, "elapsed_time": "1 day, 7:19:44", "remaining_time": "11:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13237, "total_steps": 17941, "loss": 1.5064, "learning_rate": 1.6554940980170757e-05, "epoch": 0.7378072571205618, "percentage": 73.78, "elapsed_time": "1 day, 7:19:53", "remaining_time": "11:08:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13238, "total_steps": 17941, "loss": 1.5538, "learning_rate": 1.6548322534579765e-05, "epoch": 0.737862995373725, "percentage": 73.79, "elapsed_time": "1 day, 7:20:01", "remaining_time": "11:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13239, "total_steps": 17941, "loss": 1.5847, "learning_rate": 1.6541705149880943e-05, "epoch": 0.7379187336268881, "percentage": 73.79, "elapsed_time": "1 day, 7:20:10", "remaining_time": "11:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13240, "total_steps": 17941, "loss": 1.6449, "learning_rate": 1.6535088826284158e-05, "epoch": 0.7379744718800513, "percentage": 73.8, "elapsed_time": "1 day, 7:20:18", "remaining_time": "11:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13241, "total_steps": 17941, "loss": 1.608, "learning_rate": 1.652847356399924e-05, "epoch": 0.7380302101332145, "percentage": 73.8, "elapsed_time": "1 day, 7:20:27", "remaining_time": "11:07:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13242, "total_steps": 17941, "loss": 1.5354, "learning_rate": 1.6521859363236008e-05, "epoch": 0.7380859483863775, "percentage": 73.81, "elapsed_time": "1 day, 7:20:36", "remaining_time": "11:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13243, "total_steps": 17941, "loss": 1.658, "learning_rate": 1.651524622420419e-05, "epoch": 0.7381416866395407, "percentage": 73.81, "elapsed_time": "1 day, 7:20:44", "remaining_time": "11:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13244, "total_steps": 17941, "loss": 1.6284, "learning_rate": 1.6508634147113515e-05, "epoch": 0.7381974248927039, "percentage": 73.82, "elapsed_time": "1 day, 7:20:53", "remaining_time": "11:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13245, "total_steps": 17941, "loss": 1.7111, "learning_rate": 1.6502023132173733e-05, "epoch": 0.738253163145867, "percentage": 73.83, "elapsed_time": "1 day, 7:21:02", "remaining_time": "11:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13246, "total_steps": 17941, "loss": 1.6066, "learning_rate": 1.6495413179594448e-05, "epoch": 0.7383089013990302, "percentage": 73.83, "elapsed_time": "1 day, 7:21:10", "remaining_time": "11:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13247, "total_steps": 17941, "loss": 1.409, "learning_rate": 1.648880428958533e-05, "epoch": 0.7383646396521933, "percentage": 73.84, "elapsed_time": "1 day, 7:21:19", "remaining_time": "11:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13248, "total_steps": 17941, "loss": 1.6826, "learning_rate": 1.6482196462355925e-05, "epoch": 0.7384203779053564, "percentage": 73.84, "elapsed_time": "1 day, 7:21:28", "remaining_time": "11:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13249, "total_steps": 17941, "loss": 1.2258, "learning_rate": 1.6475589698115856e-05, "epoch": 0.7384761161585196, "percentage": 73.85, "elapsed_time": "1 day, 7:21:36", "remaining_time": "11:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13250, "total_steps": 17941, "loss": 1.6302, "learning_rate": 1.6468983997074606e-05, "epoch": 0.7385318544116828, "percentage": 73.85, "elapsed_time": "1 day, 7:21:44", "remaining_time": "11:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13251, "total_steps": 17941, "loss": 1.4842, "learning_rate": 1.6462379359441683e-05, "epoch": 0.7385875926648459, "percentage": 73.86, "elapsed_time": "1 day, 7:21:53", "remaining_time": "11:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13252, "total_steps": 17941, "loss": 1.771, "learning_rate": 1.6455775785426548e-05, "epoch": 0.738643330918009, "percentage": 73.86, "elapsed_time": "1 day, 7:22:01", "remaining_time": "11:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13253, "total_steps": 17941, "loss": 1.7011, "learning_rate": 1.6449173275238634e-05, "epoch": 0.7386990691711722, "percentage": 73.87, "elapsed_time": "1 day, 7:22:10", "remaining_time": "11:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13254, "total_steps": 17941, "loss": 1.7596, "learning_rate": 1.644257182908734e-05, "epoch": 0.7387548074243353, "percentage": 73.88, "elapsed_time": "1 day, 7:22:18", "remaining_time": "11:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13255, "total_steps": 17941, "loss": 1.626, "learning_rate": 1.6435971447181982e-05, "epoch": 0.7388105456774985, "percentage": 73.88, "elapsed_time": "1 day, 7:22:27", "remaining_time": "11:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13256, "total_steps": 17941, "loss": 1.5525, "learning_rate": 1.642937212973195e-05, "epoch": 0.7388662839306616, "percentage": 73.89, "elapsed_time": "1 day, 7:22:35", "remaining_time": "11:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13257, "total_steps": 17941, "loss": 1.5693, "learning_rate": 1.642277387694649e-05, "epoch": 0.7389220221838247, "percentage": 73.89, "elapsed_time": "1 day, 7:22:44", "remaining_time": "11:05:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13258, "total_steps": 17941, "loss": 1.6173, "learning_rate": 1.6416176689034873e-05, "epoch": 0.7389777604369879, "percentage": 73.9, "elapsed_time": "1 day, 7:22:52", "remaining_time": "11:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13259, "total_steps": 17941, "loss": 1.6737, "learning_rate": 1.6409580566206324e-05, "epoch": 0.739033498690151, "percentage": 73.9, "elapsed_time": "1 day, 7:23:01", "remaining_time": "11:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13260, "total_steps": 17941, "loss": 1.8666, "learning_rate": 1.6402985508670032e-05, "epoch": 0.7390892369433142, "percentage": 73.91, "elapsed_time": "1 day, 7:23:09", "remaining_time": "11:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13261, "total_steps": 17941, "loss": 1.8081, "learning_rate": 1.639639151663518e-05, "epoch": 0.7391449751964774, "percentage": 73.91, "elapsed_time": "1 day, 7:23:17", "remaining_time": "11:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13262, "total_steps": 17941, "loss": 1.7515, "learning_rate": 1.638979859031084e-05, "epoch": 0.7392007134496404, "percentage": 73.92, "elapsed_time": "1 day, 7:23:26", "remaining_time": "11:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13263, "total_steps": 17941, "loss": 1.8197, "learning_rate": 1.638320672990613e-05, "epoch": 0.7392564517028036, "percentage": 73.93, "elapsed_time": "1 day, 7:23:34", "remaining_time": "11:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13264, "total_steps": 17941, "loss": 1.4308, "learning_rate": 1.6376615935630106e-05, "epoch": 0.7393121899559668, "percentage": 73.93, "elapsed_time": "1 day, 7:23:43", "remaining_time": "11:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13265, "total_steps": 17941, "loss": 1.4348, "learning_rate": 1.6370026207691786e-05, "epoch": 0.7393679282091299, "percentage": 73.94, "elapsed_time": "1 day, 7:23:51", "remaining_time": "11:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13266, "total_steps": 17941, "loss": 1.7006, "learning_rate": 1.636343754630015e-05, "epoch": 0.7394236664622931, "percentage": 73.94, "elapsed_time": "1 day, 7:24:00", "remaining_time": "11:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13267, "total_steps": 17941, "loss": 1.5063, "learning_rate": 1.6356849951664172e-05, "epoch": 0.7394794047154563, "percentage": 73.95, "elapsed_time": "1 day, 7:24:08", "remaining_time": "11:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13268, "total_steps": 17941, "loss": 1.6295, "learning_rate": 1.6350263423992774e-05, "epoch": 0.7395351429686193, "percentage": 73.95, "elapsed_time": "1 day, 7:24:17", "remaining_time": "11:03:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13269, "total_steps": 17941, "loss": 1.7564, "learning_rate": 1.634367796349481e-05, "epoch": 0.7395908812217825, "percentage": 73.96, "elapsed_time": "1 day, 7:24:25", "remaining_time": "11:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13270, "total_steps": 17941, "loss": 1.6458, "learning_rate": 1.6337093570379153e-05, "epoch": 0.7396466194749457, "percentage": 73.96, "elapsed_time": "1 day, 7:24:34", "remaining_time": "11:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13271, "total_steps": 17941, "loss": 1.5231, "learning_rate": 1.6330510244854612e-05, "epoch": 0.7397023577281088, "percentage": 73.97, "elapsed_time": "1 day, 7:24:42", "remaining_time": "11:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13272, "total_steps": 17941, "loss": 1.9289, "learning_rate": 1.632392798712999e-05, "epoch": 0.739758095981272, "percentage": 73.98, "elapsed_time": "1 day, 7:24:50", "remaining_time": "11:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13273, "total_steps": 17941, "loss": 1.515, "learning_rate": 1.631734679741404e-05, "epoch": 0.7398138342344351, "percentage": 73.98, "elapsed_time": "1 day, 7:24:59", "remaining_time": "11:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13274, "total_steps": 17941, "loss": 1.5093, "learning_rate": 1.631076667591543e-05, "epoch": 0.7398695724875982, "percentage": 73.99, "elapsed_time": "1 day, 7:25:07", "remaining_time": "11:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13275, "total_steps": 17941, "loss": 1.7421, "learning_rate": 1.6304187622842916e-05, "epoch": 0.7399253107407614, "percentage": 73.99, "elapsed_time": "1 day, 7:25:16", "remaining_time": "11:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13276, "total_steps": 17941, "loss": 1.4374, "learning_rate": 1.6297609638405093e-05, "epoch": 0.7399810489939246, "percentage": 74.0, "elapsed_time": "1 day, 7:25:24", "remaining_time": "11:02:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13277, "total_steps": 17941, "loss": 1.591, "learning_rate": 1.629103272281059e-05, "epoch": 0.7400367872470877, "percentage": 74.0, "elapsed_time": "1 day, 7:25:33", "remaining_time": "11:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13278, "total_steps": 17941, "loss": 1.8288, "learning_rate": 1.6284456876267994e-05, "epoch": 0.7400925255002508, "percentage": 74.01, "elapsed_time": "1 day, 7:25:42", "remaining_time": "11:02:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13279, "total_steps": 17941, "loss": 1.4758, "learning_rate": 1.6277882098985852e-05, "epoch": 0.7401482637534139, "percentage": 74.01, "elapsed_time": "1 day, 7:25:50", "remaining_time": "11:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13280, "total_steps": 17941, "loss": 1.7342, "learning_rate": 1.6271308391172696e-05, "epoch": 0.7402040020065771, "percentage": 74.02, "elapsed_time": "1 day, 7:25:59", "remaining_time": "11:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13281, "total_steps": 17941, "loss": 1.7038, "learning_rate": 1.626473575303695e-05, "epoch": 0.7402597402597403, "percentage": 74.03, "elapsed_time": "1 day, 7:26:08", "remaining_time": "11:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13282, "total_steps": 17941, "loss": 1.5131, "learning_rate": 1.6258164184787123e-05, "epoch": 0.7403154785129034, "percentage": 74.03, "elapsed_time": "1 day, 7:26:16", "remaining_time": "11:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13283, "total_steps": 17941, "loss": 1.6506, "learning_rate": 1.6251593686631588e-05, "epoch": 0.7403712167660665, "percentage": 74.04, "elapsed_time": "1 day, 7:26:24", "remaining_time": "11:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13284, "total_steps": 17941, "loss": 1.7275, "learning_rate": 1.6245024258778733e-05, "epoch": 0.7404269550192297, "percentage": 74.04, "elapsed_time": "1 day, 7:26:33", "remaining_time": "11:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13285, "total_steps": 17941, "loss": 1.4691, "learning_rate": 1.6238455901436905e-05, "epoch": 0.7404826932723928, "percentage": 74.05, "elapsed_time": "1 day, 7:26:41", "remaining_time": "11:01:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13286, "total_steps": 17941, "loss": 1.6232, "learning_rate": 1.6231888614814416e-05, "epoch": 0.740538431525556, "percentage": 74.05, "elapsed_time": "1 day, 7:26:50", "remaining_time": "11:01:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13287, "total_steps": 17941, "loss": 1.6881, "learning_rate": 1.622532239911955e-05, "epoch": 0.7405941697787192, "percentage": 74.06, "elapsed_time": "1 day, 7:26:58", "remaining_time": "11:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13288, "total_steps": 17941, "loss": 1.496, "learning_rate": 1.6218757254560523e-05, "epoch": 0.7406499080318822, "percentage": 74.06, "elapsed_time": "1 day, 7:27:07", "remaining_time": "11:00:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13289, "total_steps": 17941, "loss": 1.7215, "learning_rate": 1.6212193181345554e-05, "epoch": 0.7407056462850454, "percentage": 74.07, "elapsed_time": "1 day, 7:27:15", "remaining_time": "11:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13290, "total_steps": 17941, "loss": 1.6221, "learning_rate": 1.6205630179682825e-05, "epoch": 0.7407613845382086, "percentage": 74.08, "elapsed_time": "1 day, 7:27:24", "remaining_time": "11:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13291, "total_steps": 17941, "loss": 1.6172, "learning_rate": 1.619906824978047e-05, "epoch": 0.7408171227913717, "percentage": 74.08, "elapsed_time": "1 day, 7:27:32", "remaining_time": "11:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13292, "total_steps": 17941, "loss": 1.5224, "learning_rate": 1.6192507391846597e-05, "epoch": 0.7408728610445349, "percentage": 74.09, "elapsed_time": "1 day, 7:27:41", "remaining_time": "11:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13293, "total_steps": 17941, "loss": 2.1171, "learning_rate": 1.618594760608928e-05, "epoch": 0.740928599297698, "percentage": 74.09, "elapsed_time": "1 day, 7:27:49", "remaining_time": "11:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13294, "total_steps": 17941, "loss": 1.4332, "learning_rate": 1.6179388892716568e-05, "epoch": 0.7409843375508611, "percentage": 74.1, "elapsed_time": "1 day, 7:27:57", "remaining_time": "10:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13295, "total_steps": 17941, "loss": 1.7089, "learning_rate": 1.617283125193644e-05, "epoch": 0.7410400758040243, "percentage": 74.1, "elapsed_time": "1 day, 7:28:06", "remaining_time": "10:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13296, "total_steps": 17941, "loss": 1.425, "learning_rate": 1.6166274683956872e-05, "epoch": 0.7410958140571875, "percentage": 74.11, "elapsed_time": "1 day, 7:28:14", "remaining_time": "10:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13297, "total_steps": 17941, "loss": 1.599, "learning_rate": 1.6159719188985813e-05, "epoch": 0.7411515523103506, "percentage": 74.12, "elapsed_time": "1 day, 7:28:23", "remaining_time": "10:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13298, "total_steps": 17941, "loss": 1.713, "learning_rate": 1.615316476723116e-05, "epoch": 0.7412072905635138, "percentage": 74.12, "elapsed_time": "1 day, 7:28:31", "remaining_time": "10:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13299, "total_steps": 17941, "loss": 1.5347, "learning_rate": 1.6146611418900777e-05, "epoch": 0.7412630288166769, "percentage": 74.13, "elapsed_time": "1 day, 7:28:40", "remaining_time": "10:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13300, "total_steps": 17941, "loss": 1.7316, "learning_rate": 1.6140059144202497e-05, "epoch": 0.74131876706984, "percentage": 74.13, "elapsed_time": "1 day, 7:28:48", "remaining_time": "10:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13301, "total_steps": 17941, "loss": 1.8572, "learning_rate": 1.6133507943344144e-05, "epoch": 0.7413745053230032, "percentage": 74.14, "elapsed_time": "1 day, 7:28:57", "remaining_time": "10:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13302, "total_steps": 17941, "loss": 1.6987, "learning_rate": 1.612695781653345e-05, "epoch": 0.7414302435761663, "percentage": 74.14, "elapsed_time": "1 day, 7:29:06", "remaining_time": "10:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13303, "total_steps": 17941, "loss": 1.6614, "learning_rate": 1.6120408763978156e-05, "epoch": 0.7414859818293295, "percentage": 74.15, "elapsed_time": "1 day, 7:29:14", "remaining_time": "10:58:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13304, "total_steps": 17941, "loss": 1.4362, "learning_rate": 1.6113860785885966e-05, "epoch": 0.7415417200824926, "percentage": 74.15, "elapsed_time": "1 day, 7:29:22", "remaining_time": "10:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13305, "total_steps": 17941, "loss": 1.5918, "learning_rate": 1.6107313882464542e-05, "epoch": 0.7415974583356557, "percentage": 74.16, "elapsed_time": "1 day, 7:29:31", "remaining_time": "10:58:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13306, "total_steps": 17941, "loss": 1.6136, "learning_rate": 1.6100768053921534e-05, "epoch": 0.7416531965888189, "percentage": 74.17, "elapsed_time": "1 day, 7:29:39", "remaining_time": "10:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13307, "total_steps": 17941, "loss": 1.3586, "learning_rate": 1.609422330046448e-05, "epoch": 0.7417089348419821, "percentage": 74.17, "elapsed_time": "1 day, 7:29:48", "remaining_time": "10:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13308, "total_steps": 17941, "loss": 1.6597, "learning_rate": 1.608767962230101e-05, "epoch": 0.7417646730951452, "percentage": 74.18, "elapsed_time": "1 day, 7:29:56", "remaining_time": "10:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13309, "total_steps": 17941, "loss": 1.3816, "learning_rate": 1.6081137019638603e-05, "epoch": 0.7418204113483083, "percentage": 74.18, "elapsed_time": "1 day, 7:30:05", "remaining_time": "10:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13310, "total_steps": 17941, "loss": 1.9714, "learning_rate": 1.6074595492684774e-05, "epoch": 0.7418761496014715, "percentage": 74.19, "elapsed_time": "1 day, 7:30:13", "remaining_time": "10:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13311, "total_steps": 17941, "loss": 1.647, "learning_rate": 1.6068055041646973e-05, "epoch": 0.7419318878546346, "percentage": 74.19, "elapsed_time": "1 day, 7:30:22", "remaining_time": "10:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13312, "total_steps": 17941, "loss": 1.5836, "learning_rate": 1.606151566673263e-05, "epoch": 0.7419876261077978, "percentage": 74.2, "elapsed_time": "1 day, 7:30:31", "remaining_time": "10:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13313, "total_steps": 17941, "loss": 1.6138, "learning_rate": 1.6054977368149154e-05, "epoch": 0.742043364360961, "percentage": 74.2, "elapsed_time": "1 day, 7:30:39", "remaining_time": "10:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13314, "total_steps": 17941, "loss": 1.9437, "learning_rate": 1.6048440146103866e-05, "epoch": 0.742099102614124, "percentage": 74.21, "elapsed_time": "1 day, 7:30:48", "remaining_time": "10:57:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13315, "total_steps": 17941, "loss": 1.6194, "learning_rate": 1.6041904000804103e-05, "epoch": 0.7421548408672872, "percentage": 74.22, "elapsed_time": "1 day, 7:30:56", "remaining_time": "10:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13316, "total_steps": 17941, "loss": 1.7029, "learning_rate": 1.603536893245715e-05, "epoch": 0.7422105791204504, "percentage": 74.22, "elapsed_time": "1 day, 7:31:05", "remaining_time": "10:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13317, "total_steps": 17941, "loss": 1.6231, "learning_rate": 1.6028834941270277e-05, "epoch": 0.7422663173736135, "percentage": 74.23, "elapsed_time": "1 day, 7:31:14", "remaining_time": "10:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13318, "total_steps": 17941, "loss": 1.4641, "learning_rate": 1.602230202745069e-05, "epoch": 0.7423220556267767, "percentage": 74.23, "elapsed_time": "1 day, 7:31:22", "remaining_time": "10:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13319, "total_steps": 17941, "loss": 1.5502, "learning_rate": 1.601577019120558e-05, "epoch": 0.7423777938799399, "percentage": 74.24, "elapsed_time": "1 day, 7:31:31", "remaining_time": "10:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13320, "total_steps": 17941, "loss": 1.437, "learning_rate": 1.600923943274211e-05, "epoch": 0.7424335321331029, "percentage": 74.24, "elapsed_time": "1 day, 7:31:39", "remaining_time": "10:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13321, "total_steps": 17941, "loss": 1.4918, "learning_rate": 1.6002709752267375e-05, "epoch": 0.7424892703862661, "percentage": 74.25, "elapsed_time": "1 day, 7:31:47", "remaining_time": "10:56:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13322, "total_steps": 17941, "loss": 1.7844, "learning_rate": 1.5996181149988467e-05, "epoch": 0.7425450086394293, "percentage": 74.25, "elapsed_time": "1 day, 7:31:56", "remaining_time": "10:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13323, "total_steps": 17941, "loss": 1.5067, "learning_rate": 1.598965362611243e-05, "epoch": 0.7426007468925924, "percentage": 74.26, "elapsed_time": "1 day, 7:32:04", "remaining_time": "10:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13324, "total_steps": 17941, "loss": 1.454, "learning_rate": 1.5983127180846298e-05, "epoch": 0.7426564851457556, "percentage": 74.27, "elapsed_time": "1 day, 7:32:13", "remaining_time": "10:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13325, "total_steps": 17941, "loss": 1.7211, "learning_rate": 1.597660181439703e-05, "epoch": 0.7427122233989186, "percentage": 74.27, "elapsed_time": "1 day, 7:32:21", "remaining_time": "10:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13326, "total_steps": 17941, "loss": 1.4562, "learning_rate": 1.5970077526971582e-05, "epoch": 0.7427679616520818, "percentage": 74.28, "elapsed_time": "1 day, 7:32:30", "remaining_time": "10:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13327, "total_steps": 17941, "loss": 1.8089, "learning_rate": 1.596355431877689e-05, "epoch": 0.742823699905245, "percentage": 74.28, "elapsed_time": "1 day, 7:32:38", "remaining_time": "10:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13328, "total_steps": 17941, "loss": 1.6357, "learning_rate": 1.5957032190019787e-05, "epoch": 0.7428794381584081, "percentage": 74.29, "elapsed_time": "1 day, 7:32:47", "remaining_time": "10:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13329, "total_steps": 17941, "loss": 1.5216, "learning_rate": 1.5950511140907142e-05, "epoch": 0.7429351764115713, "percentage": 74.29, "elapsed_time": "1 day, 7:32:55", "remaining_time": "10:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13330, "total_steps": 17941, "loss": 1.6905, "learning_rate": 1.5943991171645762e-05, "epoch": 0.7429909146647344, "percentage": 74.3, "elapsed_time": "1 day, 7:33:04", "remaining_time": "10:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13331, "total_steps": 17941, "loss": 1.6697, "learning_rate": 1.5937472282442416e-05, "epoch": 0.7430466529178975, "percentage": 74.3, "elapsed_time": "1 day, 7:33:12", "remaining_time": "10:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13332, "total_steps": 17941, "loss": 1.7427, "learning_rate": 1.5930954473503874e-05, "epoch": 0.7431023911710607, "percentage": 74.31, "elapsed_time": "1 day, 7:33:21", "remaining_time": "10:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13333, "total_steps": 17941, "loss": 1.6212, "learning_rate": 1.5924437745036784e-05, "epoch": 0.7431581294242239, "percentage": 74.32, "elapsed_time": "1 day, 7:33:29", "remaining_time": "10:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13334, "total_steps": 17941, "loss": 1.4751, "learning_rate": 1.5917922097247882e-05, "epoch": 0.743213867677387, "percentage": 74.32, "elapsed_time": "1 day, 7:33:38", "remaining_time": "10:54:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13335, "total_steps": 17941, "loss": 1.9724, "learning_rate": 1.5911407530343768e-05, "epoch": 0.7432696059305501, "percentage": 74.33, "elapsed_time": "1 day, 7:33:47", "remaining_time": "10:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13336, "total_steps": 17941, "loss": 1.3127, "learning_rate": 1.590489404453106e-05, "epoch": 0.7433253441837133, "percentage": 74.33, "elapsed_time": "1 day, 7:33:55", "remaining_time": "10:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13337, "total_steps": 17941, "loss": 1.6791, "learning_rate": 1.5898381640016318e-05, "epoch": 0.7433810824368764, "percentage": 74.34, "elapsed_time": "1 day, 7:34:04", "remaining_time": "10:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13338, "total_steps": 17941, "loss": 1.6209, "learning_rate": 1.5891870317006093e-05, "epoch": 0.7434368206900396, "percentage": 74.34, "elapsed_time": "1 day, 7:34:12", "remaining_time": "10:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13339, "total_steps": 17941, "loss": 1.6723, "learning_rate": 1.5885360075706886e-05, "epoch": 0.7434925589432028, "percentage": 74.35, "elapsed_time": "1 day, 7:34:21", "remaining_time": "10:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13340, "total_steps": 17941, "loss": 1.8016, "learning_rate": 1.587885091632514e-05, "epoch": 0.7435482971963658, "percentage": 74.35, "elapsed_time": "1 day, 7:34:29", "remaining_time": "10:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13341, "total_steps": 17941, "loss": 1.6212, "learning_rate": 1.5872342839067306e-05, "epoch": 0.743604035449529, "percentage": 74.36, "elapsed_time": "1 day, 7:34:38", "remaining_time": "10:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13342, "total_steps": 17941, "loss": 1.735, "learning_rate": 1.5865835844139776e-05, "epoch": 0.7436597737026922, "percentage": 74.37, "elapsed_time": "1 day, 7:34:47", "remaining_time": "10:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13343, "total_steps": 17941, "loss": 1.6558, "learning_rate": 1.585932993174892e-05, "epoch": 0.7437155119558553, "percentage": 74.37, "elapsed_time": "1 day, 7:34:55", "remaining_time": "10:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13344, "total_steps": 17941, "loss": 1.4825, "learning_rate": 1.585282510210106e-05, "epoch": 0.7437712502090185, "percentage": 74.38, "elapsed_time": "1 day, 7:35:04", "remaining_time": "10:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13345, "total_steps": 17941, "loss": 1.7989, "learning_rate": 1.58463213554025e-05, "epoch": 0.7438269884621816, "percentage": 74.38, "elapsed_time": "1 day, 7:35:12", "remaining_time": "10:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13346, "total_steps": 17941, "loss": 1.6123, "learning_rate": 1.583981869185951e-05, "epoch": 0.7438827267153447, "percentage": 74.39, "elapsed_time": "1 day, 7:35:21", "remaining_time": "10:52:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13347, "total_steps": 17941, "loss": 1.7726, "learning_rate": 1.5833317111678285e-05, "epoch": 0.7439384649685079, "percentage": 74.39, "elapsed_time": "1 day, 7:35:29", "remaining_time": "10:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13348, "total_steps": 17941, "loss": 1.6517, "learning_rate": 1.5826816615065042e-05, "epoch": 0.743994203221671, "percentage": 74.4, "elapsed_time": "1 day, 7:35:38", "remaining_time": "10:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13349, "total_steps": 17941, "loss": 1.6328, "learning_rate": 1.5820317202225926e-05, "epoch": 0.7440499414748342, "percentage": 74.4, "elapsed_time": "1 day, 7:35:46", "remaining_time": "10:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13350, "total_steps": 17941, "loss": 1.632, "learning_rate": 1.5813818873367076e-05, "epoch": 0.7441056797279973, "percentage": 74.41, "elapsed_time": "1 day, 7:35:55", "remaining_time": "10:51:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13351, "total_steps": 17941, "loss": 1.5918, "learning_rate": 1.5807321628694567e-05, "epoch": 0.7441614179811604, "percentage": 74.42, "elapsed_time": "1 day, 7:36:04", "remaining_time": "10:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13352, "total_steps": 17941, "loss": 1.8415, "learning_rate": 1.5800825468414452e-05, "epoch": 0.7442171562343236, "percentage": 74.42, "elapsed_time": "1 day, 7:36:13", "remaining_time": "10:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13353, "total_steps": 17941, "loss": 1.6525, "learning_rate": 1.5794330392732787e-05, "epoch": 0.7442728944874868, "percentage": 74.43, "elapsed_time": "1 day, 7:36:21", "remaining_time": "10:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13354, "total_steps": 17941, "loss": 1.7335, "learning_rate": 1.5787836401855503e-05, "epoch": 0.7443286327406499, "percentage": 74.43, "elapsed_time": "1 day, 7:36:29", "remaining_time": "10:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13355, "total_steps": 17941, "loss": 1.6273, "learning_rate": 1.578134349598858e-05, "epoch": 0.744384370993813, "percentage": 74.44, "elapsed_time": "1 day, 7:36:38", "remaining_time": "10:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13356, "total_steps": 17941, "loss": 1.7174, "learning_rate": 1.577485167533794e-05, "epoch": 0.7444401092469762, "percentage": 74.44, "elapsed_time": "1 day, 7:36:46", "remaining_time": "10:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13357, "total_steps": 17941, "loss": 1.621, "learning_rate": 1.576836094010945e-05, "epoch": 0.7444958475001393, "percentage": 74.45, "elapsed_time": "1 day, 7:36:55", "remaining_time": "10:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13358, "total_steps": 17941, "loss": 1.4205, "learning_rate": 1.5761871290508983e-05, "epoch": 0.7445515857533025, "percentage": 74.46, "elapsed_time": "1 day, 7:37:03", "remaining_time": "10:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13359, "total_steps": 17941, "loss": 1.6063, "learning_rate": 1.5755382726742308e-05, "epoch": 0.7446073240064657, "percentage": 74.46, "elapsed_time": "1 day, 7:37:12", "remaining_time": "10:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13360, "total_steps": 17941, "loss": 1.6184, "learning_rate": 1.5748895249015266e-05, "epoch": 0.7446630622596287, "percentage": 74.47, "elapsed_time": "1 day, 7:37:20", "remaining_time": "10:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13361, "total_steps": 17941, "loss": 1.6787, "learning_rate": 1.5742408857533546e-05, "epoch": 0.7447188005127919, "percentage": 74.47, "elapsed_time": "1 day, 7:37:29", "remaining_time": "10:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13362, "total_steps": 17941, "loss": 1.5111, "learning_rate": 1.573592355250289e-05, "epoch": 0.7447745387659551, "percentage": 74.48, "elapsed_time": "1 day, 7:37:37", "remaining_time": "10:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13363, "total_steps": 17941, "loss": 1.7729, "learning_rate": 1.572943933412896e-05, "epoch": 0.7448302770191182, "percentage": 74.48, "elapsed_time": "1 day, 7:37:46", "remaining_time": "10:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13364, "total_steps": 17941, "loss": 1.5573, "learning_rate": 1.5722956202617408e-05, "epoch": 0.7448860152722814, "percentage": 74.49, "elapsed_time": "1 day, 7:37:54", "remaining_time": "10:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13365, "total_steps": 17941, "loss": 1.5506, "learning_rate": 1.5716474158173845e-05, "epoch": 0.7449417535254446, "percentage": 74.49, "elapsed_time": "1 day, 7:38:03", "remaining_time": "10:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13366, "total_steps": 17941, "loss": 1.4187, "learning_rate": 1.5709993201003827e-05, "epoch": 0.7449974917786076, "percentage": 74.5, "elapsed_time": "1 day, 7:38:11", "remaining_time": "10:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13367, "total_steps": 17941, "loss": 1.6344, "learning_rate": 1.570351333131289e-05, "epoch": 0.7450532300317708, "percentage": 74.51, "elapsed_time": "1 day, 7:38:19", "remaining_time": "10:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13368, "total_steps": 17941, "loss": 1.6753, "learning_rate": 1.5697034549306554e-05, "epoch": 0.745108968284934, "percentage": 74.51, "elapsed_time": "1 day, 7:38:28", "remaining_time": "10:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13369, "total_steps": 17941, "loss": 1.8055, "learning_rate": 1.569055685519028e-05, "epoch": 0.7451647065380971, "percentage": 74.52, "elapsed_time": "1 day, 7:38:36", "remaining_time": "10:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13370, "total_steps": 17941, "loss": 1.426, "learning_rate": 1.5684080249169507e-05, "epoch": 0.7452204447912603, "percentage": 74.52, "elapsed_time": "1 day, 7:38:45", "remaining_time": "10:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13371, "total_steps": 17941, "loss": 1.832, "learning_rate": 1.5677604731449635e-05, "epoch": 0.7452761830444233, "percentage": 74.53, "elapsed_time": "1 day, 7:38:53", "remaining_time": "10:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13372, "total_steps": 17941, "loss": 1.511, "learning_rate": 1.5671130302236038e-05, "epoch": 0.7453319212975865, "percentage": 74.53, "elapsed_time": "1 day, 7:39:02", "remaining_time": "10:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13373, "total_steps": 17941, "loss": 1.8098, "learning_rate": 1.5664656961734025e-05, "epoch": 0.7453876595507497, "percentage": 74.54, "elapsed_time": "1 day, 7:39:10", "remaining_time": "10:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13374, "total_steps": 17941, "loss": 1.6672, "learning_rate": 1.5658184710148897e-05, "epoch": 0.7454433978039128, "percentage": 74.54, "elapsed_time": "1 day, 7:39:19", "remaining_time": "10:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13375, "total_steps": 17941, "loss": 1.9259, "learning_rate": 1.565171354768593e-05, "epoch": 0.745499136057076, "percentage": 74.55, "elapsed_time": "1 day, 7:39:27", "remaining_time": "10:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13376, "total_steps": 17941, "loss": 1.6948, "learning_rate": 1.5645243474550346e-05, "epoch": 0.7455548743102391, "percentage": 74.56, "elapsed_time": "1 day, 7:39:37", "remaining_time": "10:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13377, "total_steps": 17941, "loss": 1.6303, "learning_rate": 1.5638774490947332e-05, "epoch": 0.7456106125634022, "percentage": 74.56, "elapsed_time": "1 day, 7:39:45", "remaining_time": "10:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13378, "total_steps": 17941, "loss": 1.56, "learning_rate": 1.563230659708206e-05, "epoch": 0.7456663508165654, "percentage": 74.57, "elapsed_time": "1 day, 7:39:54", "remaining_time": "10:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13379, "total_steps": 17941, "loss": 1.79, "learning_rate": 1.562583979315965e-05, "epoch": 0.7457220890697286, "percentage": 74.57, "elapsed_time": "1 day, 7:40:02", "remaining_time": "10:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13380, "total_steps": 17941, "loss": 1.6725, "learning_rate": 1.5619374079385175e-05, "epoch": 0.7457778273228917, "percentage": 74.58, "elapsed_time": "1 day, 7:40:11", "remaining_time": "10:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13381, "total_steps": 17941, "loss": 1.8324, "learning_rate": 1.5612909455963703e-05, "epoch": 0.7458335655760548, "percentage": 74.58, "elapsed_time": "1 day, 7:40:19", "remaining_time": "10:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13382, "total_steps": 17941, "loss": 1.5773, "learning_rate": 1.560644592310025e-05, "epoch": 0.745889303829218, "percentage": 74.59, "elapsed_time": "1 day, 7:40:28", "remaining_time": "10:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13383, "total_steps": 17941, "loss": 1.4419, "learning_rate": 1.5599983480999802e-05, "epoch": 0.7459450420823811, "percentage": 74.59, "elapsed_time": "1 day, 7:40:36", "remaining_time": "10:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13384, "total_steps": 17941, "loss": 1.6136, "learning_rate": 1.559352212986733e-05, "epoch": 0.7460007803355443, "percentage": 74.6, "elapsed_time": "1 day, 7:40:45", "remaining_time": "10:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13385, "total_steps": 17941, "loss": 1.5806, "learning_rate": 1.5587061869907704e-05, "epoch": 0.7460565185887075, "percentage": 74.61, "elapsed_time": "1 day, 7:40:53", "remaining_time": "10:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13386, "total_steps": 17941, "loss": 1.6182, "learning_rate": 1.5580602701325865e-05, "epoch": 0.7461122568418705, "percentage": 74.61, "elapsed_time": "1 day, 7:41:02", "remaining_time": "10:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13387, "total_steps": 17941, "loss": 1.4877, "learning_rate": 1.5574144624326607e-05, "epoch": 0.7461679950950337, "percentage": 74.62, "elapsed_time": "1 day, 7:41:10", "remaining_time": "10:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13388, "total_steps": 17941, "loss": 1.4704, "learning_rate": 1.5567687639114776e-05, "epoch": 0.7462237333481969, "percentage": 74.62, "elapsed_time": "1 day, 7:41:19", "remaining_time": "10:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13389, "total_steps": 17941, "loss": 1.6477, "learning_rate": 1.5561231745895127e-05, "epoch": 0.74627947160136, "percentage": 74.63, "elapsed_time": "1 day, 7:41:27", "remaining_time": "10:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13390, "total_steps": 17941, "loss": 1.8731, "learning_rate": 1.5554776944872422e-05, "epoch": 0.7463352098545232, "percentage": 74.63, "elapsed_time": "1 day, 7:41:36", "remaining_time": "10:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13391, "total_steps": 17941, "loss": 1.4527, "learning_rate": 1.5548323236251378e-05, "epoch": 0.7463909481076864, "percentage": 74.64, "elapsed_time": "1 day, 7:41:44", "remaining_time": "10:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13392, "total_steps": 17941, "loss": 1.7002, "learning_rate": 1.5541870620236622e-05, "epoch": 0.7464466863608494, "percentage": 74.64, "elapsed_time": "1 day, 7:41:53", "remaining_time": "10:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13393, "total_steps": 17941, "loss": 1.7703, "learning_rate": 1.5535419097032854e-05, "epoch": 0.7465024246140126, "percentage": 74.65, "elapsed_time": "1 day, 7:42:01", "remaining_time": "10:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13394, "total_steps": 17941, "loss": 1.7067, "learning_rate": 1.5528968666844634e-05, "epoch": 0.7465581628671757, "percentage": 74.66, "elapsed_time": "1 day, 7:42:10", "remaining_time": "10:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13395, "total_steps": 17941, "loss": 1.5557, "learning_rate": 1.552251932987655e-05, "epoch": 0.7466139011203389, "percentage": 74.66, "elapsed_time": "1 day, 7:42:18", "remaining_time": "10:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13396, "total_steps": 17941, "loss": 1.6904, "learning_rate": 1.5516071086333138e-05, "epoch": 0.7466696393735021, "percentage": 74.67, "elapsed_time": "1 day, 7:42:27", "remaining_time": "10:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13397, "total_steps": 17941, "loss": 1.6019, "learning_rate": 1.5509623936418892e-05, "epoch": 0.7467253776266651, "percentage": 74.67, "elapsed_time": "1 day, 7:42:35", "remaining_time": "10:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13398, "total_steps": 17941, "loss": 1.8989, "learning_rate": 1.5503177880338298e-05, "epoch": 0.7467811158798283, "percentage": 74.68, "elapsed_time": "1 day, 7:42:44", "remaining_time": "10:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13399, "total_steps": 17941, "loss": 1.7319, "learning_rate": 1.5496732918295755e-05, "epoch": 0.7468368541329915, "percentage": 74.68, "elapsed_time": "1 day, 7:42:53", "remaining_time": "10:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13400, "total_steps": 17941, "loss": 1.8259, "learning_rate": 1.5490289050495676e-05, "epoch": 0.7468925923861546, "percentage": 74.69, "elapsed_time": "1 day, 7:43:02", "remaining_time": "10:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13401, "total_steps": 17941, "loss": 1.658, "learning_rate": 1.5483846277142423e-05, "epoch": 0.7469483306393178, "percentage": 74.69, "elapsed_time": "1 day, 7:43:10", "remaining_time": "10:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13402, "total_steps": 17941, "loss": 1.3426, "learning_rate": 1.5477404598440327e-05, "epoch": 0.7470040688924809, "percentage": 74.7, "elapsed_time": "1 day, 7:43:19", "remaining_time": "10:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13403, "total_steps": 17941, "loss": 1.5072, "learning_rate": 1.547096401459367e-05, "epoch": 0.747059807145644, "percentage": 74.71, "elapsed_time": "1 day, 7:43:27", "remaining_time": "10:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13404, "total_steps": 17941, "loss": 1.7707, "learning_rate": 1.5464524525806717e-05, "epoch": 0.7471155453988072, "percentage": 74.71, "elapsed_time": "1 day, 7:43:36", "remaining_time": "10:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13405, "total_steps": 17941, "loss": 1.5782, "learning_rate": 1.5458086132283712e-05, "epoch": 0.7471712836519704, "percentage": 74.72, "elapsed_time": "1 day, 7:43:44", "remaining_time": "10:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13406, "total_steps": 17941, "loss": 1.5931, "learning_rate": 1.54516488342288e-05, "epoch": 0.7472270219051335, "percentage": 74.72, "elapsed_time": "1 day, 7:43:52", "remaining_time": "10:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13407, "total_steps": 17941, "loss": 1.7915, "learning_rate": 1.5445212631846157e-05, "epoch": 0.7472827601582966, "percentage": 74.73, "elapsed_time": "1 day, 7:44:01", "remaining_time": "10:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13408, "total_steps": 17941, "loss": 1.6272, "learning_rate": 1.5438777525339902e-05, "epoch": 0.7473384984114598, "percentage": 74.73, "elapsed_time": "1 day, 7:44:10", "remaining_time": "10:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13409, "total_steps": 17941, "loss": 1.4453, "learning_rate": 1.5432343514914123e-05, "epoch": 0.7473942366646229, "percentage": 74.74, "elapsed_time": "1 day, 7:44:18", "remaining_time": "10:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13410, "total_steps": 17941, "loss": 1.4543, "learning_rate": 1.5425910600772868e-05, "epoch": 0.7474499749177861, "percentage": 74.74, "elapsed_time": "1 day, 7:44:27", "remaining_time": "10:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13411, "total_steps": 17941, "loss": 1.5641, "learning_rate": 1.5419478783120127e-05, "epoch": 0.7475057131709493, "percentage": 74.75, "elapsed_time": "1 day, 7:44:35", "remaining_time": "10:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13412, "total_steps": 17941, "loss": 1.5104, "learning_rate": 1.541304806215993e-05, "epoch": 0.7475614514241123, "percentage": 74.76, "elapsed_time": "1 day, 7:44:44", "remaining_time": "10:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13413, "total_steps": 17941, "loss": 1.8031, "learning_rate": 1.5406618438096172e-05, "epoch": 0.7476171896772755, "percentage": 74.76, "elapsed_time": "1 day, 7:44:52", "remaining_time": "10:43:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13414, "total_steps": 17941, "loss": 1.8608, "learning_rate": 1.540018991113279e-05, "epoch": 0.7476729279304387, "percentage": 74.77, "elapsed_time": "1 day, 7:45:00", "remaining_time": "10:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13415, "total_steps": 17941, "loss": 1.6909, "learning_rate": 1.5393762481473644e-05, "epoch": 0.7477286661836018, "percentage": 74.77, "elapsed_time": "1 day, 7:45:09", "remaining_time": "10:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13416, "total_steps": 17941, "loss": 1.7286, "learning_rate": 1.5387336149322594e-05, "epoch": 0.747784404436765, "percentage": 74.78, "elapsed_time": "1 day, 7:45:18", "remaining_time": "10:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13417, "total_steps": 17941, "loss": 1.6818, "learning_rate": 1.5380910914883445e-05, "epoch": 0.747840142689928, "percentage": 74.78, "elapsed_time": "1 day, 7:45:26", "remaining_time": "10:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13418, "total_steps": 17941, "loss": 1.6994, "learning_rate": 1.5374486778359932e-05, "epoch": 0.7478958809430912, "percentage": 74.79, "elapsed_time": "1 day, 7:45:35", "remaining_time": "10:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13419, "total_steps": 17941, "loss": 1.8279, "learning_rate": 1.5368063739955845e-05, "epoch": 0.7479516191962544, "percentage": 74.8, "elapsed_time": "1 day, 7:45:43", "remaining_time": "10:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13420, "total_steps": 17941, "loss": 1.5076, "learning_rate": 1.5361641799874843e-05, "epoch": 0.7480073574494175, "percentage": 74.8, "elapsed_time": "1 day, 7:45:52", "remaining_time": "10:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13421, "total_steps": 17941, "loss": 1.604, "learning_rate": 1.5355220958320604e-05, "epoch": 0.7480630957025807, "percentage": 74.81, "elapsed_time": "1 day, 7:46:00", "remaining_time": "10:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13422, "total_steps": 17941, "loss": 1.8152, "learning_rate": 1.5348801215496773e-05, "epoch": 0.7481188339557439, "percentage": 74.81, "elapsed_time": "1 day, 7:46:09", "remaining_time": "10:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13423, "total_steps": 17941, "loss": 1.6422, "learning_rate": 1.5342382571606928e-05, "epoch": 0.7481745722089069, "percentage": 74.82, "elapsed_time": "1 day, 7:46:18", "remaining_time": "10:41:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13424, "total_steps": 17941, "loss": 1.5407, "learning_rate": 1.533596502685466e-05, "epoch": 0.7482303104620701, "percentage": 74.82, "elapsed_time": "1 day, 7:46:26", "remaining_time": "10:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13425, "total_steps": 17941, "loss": 1.4653, "learning_rate": 1.532954858144346e-05, "epoch": 0.7482860487152333, "percentage": 74.83, "elapsed_time": "1 day, 7:46:35", "remaining_time": "10:41:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13426, "total_steps": 17941, "loss": 1.5693, "learning_rate": 1.532313323557683e-05, "epoch": 0.7483417869683964, "percentage": 74.83, "elapsed_time": "1 day, 7:46:44", "remaining_time": "10:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13427, "total_steps": 17941, "loss": 1.5493, "learning_rate": 1.531671898945824e-05, "epoch": 0.7483975252215596, "percentage": 74.84, "elapsed_time": "1 day, 7:46:52", "remaining_time": "10:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13428, "total_steps": 17941, "loss": 1.3341, "learning_rate": 1.5310305843291106e-05, "epoch": 0.7484532634747227, "percentage": 74.85, "elapsed_time": "1 day, 7:47:01", "remaining_time": "10:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13429, "total_steps": 17941, "loss": 1.6766, "learning_rate": 1.5303893797278813e-05, "epoch": 0.7485090017278858, "percentage": 74.85, "elapsed_time": "1 day, 7:47:09", "remaining_time": "10:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13430, "total_steps": 17941, "loss": 1.7853, "learning_rate": 1.5297482851624718e-05, "epoch": 0.748564739981049, "percentage": 74.86, "elapsed_time": "1 day, 7:47:18", "remaining_time": "10:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13431, "total_steps": 17941, "loss": 1.6365, "learning_rate": 1.529107300653215e-05, "epoch": 0.7486204782342122, "percentage": 74.86, "elapsed_time": "1 day, 7:47:26", "remaining_time": "10:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13432, "total_steps": 17941, "loss": 1.6628, "learning_rate": 1.528466426220437e-05, "epoch": 0.7486762164873753, "percentage": 74.87, "elapsed_time": "1 day, 7:47:35", "remaining_time": "10:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13433, "total_steps": 17941, "loss": 1.5994, "learning_rate": 1.527825661884463e-05, "epoch": 0.7487319547405384, "percentage": 74.87, "elapsed_time": "1 day, 7:47:43", "remaining_time": "10:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13434, "total_steps": 17941, "loss": 1.4491, "learning_rate": 1.527185007665615e-05, "epoch": 0.7487876929937016, "percentage": 74.88, "elapsed_time": "1 day, 7:47:51", "remaining_time": "10:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13435, "total_steps": 17941, "loss": 1.7824, "learning_rate": 1.526544463584211e-05, "epoch": 0.7488434312468647, "percentage": 74.88, "elapsed_time": "1 day, 7:48:00", "remaining_time": "10:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13436, "total_steps": 17941, "loss": 1.5596, "learning_rate": 1.525904029660566e-05, "epoch": 0.7488991695000279, "percentage": 74.89, "elapsed_time": "1 day, 7:48:08", "remaining_time": "10:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13437, "total_steps": 17941, "loss": 1.7777, "learning_rate": 1.5252637059149866e-05, "epoch": 0.7489549077531911, "percentage": 74.9, "elapsed_time": "1 day, 7:48:17", "remaining_time": "10:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13438, "total_steps": 17941, "loss": 1.6985, "learning_rate": 1.5246234923677866e-05, "epoch": 0.7490106460063541, "percentage": 74.9, "elapsed_time": "1 day, 7:48:25", "remaining_time": "10:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13439, "total_steps": 17941, "loss": 1.9387, "learning_rate": 1.5239833890392652e-05, "epoch": 0.7490663842595173, "percentage": 74.91, "elapsed_time": "1 day, 7:48:34", "remaining_time": "10:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13440, "total_steps": 17941, "loss": 1.5936, "learning_rate": 1.523343395949724e-05, "epoch": 0.7491221225126804, "percentage": 74.91, "elapsed_time": "1 day, 7:48:43", "remaining_time": "10:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13441, "total_steps": 17941, "loss": 1.6402, "learning_rate": 1.52270351311946e-05, "epoch": 0.7491778607658436, "percentage": 74.92, "elapsed_time": "1 day, 7:48:51", "remaining_time": "10:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13442, "total_steps": 17941, "loss": 1.599, "learning_rate": 1.5220637405687659e-05, "epoch": 0.7492335990190068, "percentage": 74.92, "elapsed_time": "1 day, 7:48:59", "remaining_time": "10:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13443, "total_steps": 17941, "loss": 1.5019, "learning_rate": 1.5214240783179345e-05, "epoch": 0.7492893372721698, "percentage": 74.93, "elapsed_time": "1 day, 7:49:08", "remaining_time": "10:38:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13444, "total_steps": 17941, "loss": 1.6836, "learning_rate": 1.5207845263872466e-05, "epoch": 0.749345075525333, "percentage": 74.93, "elapsed_time": "1 day, 7:49:16", "remaining_time": "10:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13445, "total_steps": 17941, "loss": 1.6637, "learning_rate": 1.5201450847969911e-05, "epoch": 0.7494008137784962, "percentage": 74.94, "elapsed_time": "1 day, 7:49:25", "remaining_time": "10:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13446, "total_steps": 17941, "loss": 1.7797, "learning_rate": 1.5195057535674434e-05, "epoch": 0.7494565520316593, "percentage": 74.95, "elapsed_time": "1 day, 7:49:33", "remaining_time": "10:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13447, "total_steps": 17941, "loss": 1.7168, "learning_rate": 1.5188665327188805e-05, "epoch": 0.7495122902848225, "percentage": 74.95, "elapsed_time": "1 day, 7:49:42", "remaining_time": "10:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13448, "total_steps": 17941, "loss": 1.4862, "learning_rate": 1.5182274222715747e-05, "epoch": 0.7495680285379857, "percentage": 74.96, "elapsed_time": "1 day, 7:49:51", "remaining_time": "10:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13449, "total_steps": 17941, "loss": 1.6067, "learning_rate": 1.5175884222457948e-05, "epoch": 0.7496237667911487, "percentage": 74.96, "elapsed_time": "1 day, 7:49:59", "remaining_time": "10:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13450, "total_steps": 17941, "loss": 1.5944, "learning_rate": 1.5169495326618077e-05, "epoch": 0.7496795050443119, "percentage": 74.97, "elapsed_time": "1 day, 7:50:08", "remaining_time": "10:37:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13451, "total_steps": 17941, "loss": 1.7657, "learning_rate": 1.5163107535398724e-05, "epoch": 0.7497352432974751, "percentage": 74.97, "elapsed_time": "1 day, 7:50:16", "remaining_time": "10:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13452, "total_steps": 17941, "loss": 1.4466, "learning_rate": 1.5156720849002487e-05, "epoch": 0.7497909815506382, "percentage": 74.98, "elapsed_time": "1 day, 7:50:25", "remaining_time": "10:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13453, "total_steps": 17941, "loss": 1.6204, "learning_rate": 1.5150335267631915e-05, "epoch": 0.7498467198038014, "percentage": 74.98, "elapsed_time": "1 day, 7:50:33", "remaining_time": "10:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13454, "total_steps": 17941, "loss": 1.8471, "learning_rate": 1.514395079148952e-05, "epoch": 0.7499024580569645, "percentage": 74.99, "elapsed_time": "1 day, 7:50:42", "remaining_time": "10:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13455, "total_steps": 17941, "loss": 1.567, "learning_rate": 1.5137567420777783e-05, "epoch": 0.7499581963101276, "percentage": 75.0, "elapsed_time": "1 day, 7:50:50", "remaining_time": "10:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13456, "total_steps": 17941, "loss": 1.6508, "learning_rate": 1.513118515569914e-05, "epoch": 0.7500139345632908, "percentage": 75.0, "elapsed_time": "1 day, 7:50:59", "remaining_time": "10:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13457, "total_steps": 17941, "loss": 1.6505, "learning_rate": 1.5124803996456021e-05, "epoch": 0.750069672816454, "percentage": 75.01, "elapsed_time": "1 day, 7:51:07", "remaining_time": "10:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13458, "total_steps": 17941, "loss": 1.7703, "learning_rate": 1.5118423943250771e-05, "epoch": 0.750125411069617, "percentage": 75.01, "elapsed_time": "1 day, 7:51:16", "remaining_time": "10:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13459, "total_steps": 17941, "loss": 1.8, "learning_rate": 1.511204499628574e-05, "epoch": 0.7501811493227802, "percentage": 75.02, "elapsed_time": "1 day, 7:51:24", "remaining_time": "10:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13460, "total_steps": 17941, "loss": 1.597, "learning_rate": 1.5105667155763231e-05, "epoch": 0.7502368875759434, "percentage": 75.02, "elapsed_time": "1 day, 7:51:33", "remaining_time": "10:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13461, "total_steps": 17941, "loss": 1.56, "learning_rate": 1.5099290421885509e-05, "epoch": 0.7502926258291065, "percentage": 75.03, "elapsed_time": "1 day, 7:51:41", "remaining_time": "10:36:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13462, "total_steps": 17941, "loss": 1.7026, "learning_rate": 1.5092914794854824e-05, "epoch": 0.7503483640822697, "percentage": 75.03, "elapsed_time": "1 day, 7:51:49", "remaining_time": "10:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13463, "total_steps": 17941, "loss": 1.7195, "learning_rate": 1.5086540274873328e-05, "epoch": 0.7504041023354328, "percentage": 75.04, "elapsed_time": "1 day, 7:51:58", "remaining_time": "10:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13464, "total_steps": 17941, "loss": 1.5934, "learning_rate": 1.5080166862143253e-05, "epoch": 0.7504598405885959, "percentage": 75.05, "elapsed_time": "1 day, 7:52:06", "remaining_time": "10:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13465, "total_steps": 17941, "loss": 1.4999, "learning_rate": 1.5073794556866666e-05, "epoch": 0.7505155788417591, "percentage": 75.05, "elapsed_time": "1 day, 7:52:15", "remaining_time": "10:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13466, "total_steps": 17941, "loss": 1.836, "learning_rate": 1.5067423359245686e-05, "epoch": 0.7505713170949222, "percentage": 75.06, "elapsed_time": "1 day, 7:52:23", "remaining_time": "10:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13467, "total_steps": 17941, "loss": 1.7677, "learning_rate": 1.5061053269482362e-05, "epoch": 0.7506270553480854, "percentage": 75.06, "elapsed_time": "1 day, 7:52:32", "remaining_time": "10:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13468, "total_steps": 17941, "loss": 1.5995, "learning_rate": 1.505468428777872e-05, "epoch": 0.7506827936012486, "percentage": 75.07, "elapsed_time": "1 day, 7:52:40", "remaining_time": "10:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13469, "total_steps": 17941, "loss": 1.7743, "learning_rate": 1.5048316414336766e-05, "epoch": 0.7507385318544116, "percentage": 75.07, "elapsed_time": "1 day, 7:52:49", "remaining_time": "10:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13470, "total_steps": 17941, "loss": 1.4866, "learning_rate": 1.50419496493584e-05, "epoch": 0.7507942701075748, "percentage": 75.08, "elapsed_time": "1 day, 7:52:57", "remaining_time": "10:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13471, "total_steps": 17941, "loss": 1.601, "learning_rate": 1.5035583993045604e-05, "epoch": 0.750850008360738, "percentage": 75.09, "elapsed_time": "1 day, 7:53:05", "remaining_time": "10:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13472, "total_steps": 17941, "loss": 1.8084, "learning_rate": 1.5029219445600212e-05, "epoch": 0.7509057466139011, "percentage": 75.09, "elapsed_time": "1 day, 7:53:14", "remaining_time": "10:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13473, "total_steps": 17941, "loss": 1.498, "learning_rate": 1.5022856007224084e-05, "epoch": 0.7509614848670643, "percentage": 75.1, "elapsed_time": "1 day, 7:53:22", "remaining_time": "10:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13474, "total_steps": 17941, "loss": 1.4284, "learning_rate": 1.5016493678119031e-05, "epoch": 0.7510172231202275, "percentage": 75.1, "elapsed_time": "1 day, 7:53:31", "remaining_time": "10:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13475, "total_steps": 17941, "loss": 1.8732, "learning_rate": 1.5010132458486832e-05, "epoch": 0.7510729613733905, "percentage": 75.11, "elapsed_time": "1 day, 7:53:39", "remaining_time": "10:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13476, "total_steps": 17941, "loss": 1.4964, "learning_rate": 1.5003772348529243e-05, "epoch": 0.7511286996265537, "percentage": 75.11, "elapsed_time": "1 day, 7:53:48", "remaining_time": "10:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13477, "total_steps": 17941, "loss": 1.5421, "learning_rate": 1.4997413348447937e-05, "epoch": 0.7511844378797169, "percentage": 75.12, "elapsed_time": "1 day, 7:53:56", "remaining_time": "10:33:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13478, "total_steps": 17941, "loss": 1.664, "learning_rate": 1.4991055458444597e-05, "epoch": 0.75124017613288, "percentage": 75.12, "elapsed_time": "1 day, 7:54:05", "remaining_time": "10:33:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13479, "total_steps": 17941, "loss": 1.4636, "learning_rate": 1.4984698678720865e-05, "epoch": 0.7512959143860432, "percentage": 75.13, "elapsed_time": "1 day, 7:54:14", "remaining_time": "10:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13480, "total_steps": 17941, "loss": 1.5685, "learning_rate": 1.4978343009478335e-05, "epoch": 0.7513516526392063, "percentage": 75.14, "elapsed_time": "1 day, 7:54:22", "remaining_time": "10:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13481, "total_steps": 17941, "loss": 1.4127, "learning_rate": 1.4971988450918578e-05, "epoch": 0.7514073908923694, "percentage": 75.14, "elapsed_time": "1 day, 7:54:31", "remaining_time": "10:33:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13482, "total_steps": 17941, "loss": 1.6098, "learning_rate": 1.4965635003243117e-05, "epoch": 0.7514631291455326, "percentage": 75.15, "elapsed_time": "1 day, 7:54:39", "remaining_time": "10:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13483, "total_steps": 17941, "loss": 1.6879, "learning_rate": 1.4959282666653468e-05, "epoch": 0.7515188673986958, "percentage": 75.15, "elapsed_time": "1 day, 7:54:47", "remaining_time": "10:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13484, "total_steps": 17941, "loss": 1.5991, "learning_rate": 1.4952931441351054e-05, "epoch": 0.7515746056518589, "percentage": 75.16, "elapsed_time": "1 day, 7:54:57", "remaining_time": "10:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13485, "total_steps": 17941, "loss": 1.5979, "learning_rate": 1.4946581327537312e-05, "epoch": 0.751630343905022, "percentage": 75.16, "elapsed_time": "1 day, 7:55:05", "remaining_time": "10:32:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13486, "total_steps": 17941, "loss": 1.672, "learning_rate": 1.4940232325413638e-05, "epoch": 0.7516860821581851, "percentage": 75.17, "elapsed_time": "1 day, 7:55:14", "remaining_time": "10:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13487, "total_steps": 17941, "loss": 1.7764, "learning_rate": 1.4933884435181383e-05, "epoch": 0.7517418204113483, "percentage": 75.17, "elapsed_time": "1 day, 7:55:22", "remaining_time": "10:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13488, "total_steps": 17941, "loss": 1.6431, "learning_rate": 1.4927537657041879e-05, "epoch": 0.7517975586645115, "percentage": 75.18, "elapsed_time": "1 day, 7:55:31", "remaining_time": "10:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13489, "total_steps": 17941, "loss": 1.5381, "learning_rate": 1.4921191991196365e-05, "epoch": 0.7518532969176746, "percentage": 75.19, "elapsed_time": "1 day, 7:55:39", "remaining_time": "10:32:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13490, "total_steps": 17941, "loss": 1.7817, "learning_rate": 1.4914847437846147e-05, "epoch": 0.7519090351708377, "percentage": 75.19, "elapsed_time": "1 day, 7:55:47", "remaining_time": "10:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13491, "total_steps": 17941, "loss": 1.6046, "learning_rate": 1.4908503997192391e-05, "epoch": 0.7519647734240009, "percentage": 75.2, "elapsed_time": "1 day, 7:55:56", "remaining_time": "10:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13492, "total_steps": 17941, "loss": 1.8871, "learning_rate": 1.4902161669436287e-05, "epoch": 0.752020511677164, "percentage": 75.2, "elapsed_time": "1 day, 7:56:04", "remaining_time": "10:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13493, "total_steps": 17941, "loss": 1.6076, "learning_rate": 1.4895820454778986e-05, "epoch": 0.7520762499303272, "percentage": 75.21, "elapsed_time": "1 day, 7:56:13", "remaining_time": "10:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13494, "total_steps": 17941, "loss": 1.5878, "learning_rate": 1.4889480353421586e-05, "epoch": 0.7521319881834904, "percentage": 75.21, "elapsed_time": "1 day, 7:56:22", "remaining_time": "10:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13495, "total_steps": 17941, "loss": 1.5914, "learning_rate": 1.4883141365565178e-05, "epoch": 0.7521877264366534, "percentage": 75.22, "elapsed_time": "1 day, 7:56:30", "remaining_time": "10:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13496, "total_steps": 17941, "loss": 1.5741, "learning_rate": 1.4876803491410746e-05, "epoch": 0.7522434646898166, "percentage": 75.22, "elapsed_time": "1 day, 7:56:39", "remaining_time": "10:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13497, "total_steps": 17941, "loss": 1.6547, "learning_rate": 1.487046673115936e-05, "epoch": 0.7522992029429798, "percentage": 75.23, "elapsed_time": "1 day, 7:56:47", "remaining_time": "10:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13498, "total_steps": 17941, "loss": 1.6673, "learning_rate": 1.4864131085011934e-05, "epoch": 0.7523549411961429, "percentage": 75.24, "elapsed_time": "1 day, 7:56:56", "remaining_time": "10:30:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13499, "total_steps": 17941, "loss": 1.4904, "learning_rate": 1.4857796553169412e-05, "epoch": 0.7524106794493061, "percentage": 75.24, "elapsed_time": "1 day, 7:57:04", "remaining_time": "10:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13500, "total_steps": 17941, "loss": 1.6627, "learning_rate": 1.4851463135832689e-05, "epoch": 0.7524664177024692, "percentage": 75.25, "elapsed_time": "1 day, 7:57:12", "remaining_time": "10:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13501, "total_steps": 17941, "loss": 1.4796, "learning_rate": 1.4845130833202625e-05, "epoch": 0.7525221559556323, "percentage": 75.25, "elapsed_time": "1 day, 7:57:21", "remaining_time": "10:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13502, "total_steps": 17941, "loss": 1.4919, "learning_rate": 1.4838799645480061e-05, "epoch": 0.7525778942087955, "percentage": 75.26, "elapsed_time": "1 day, 7:57:30", "remaining_time": "10:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13503, "total_steps": 17941, "loss": 1.7236, "learning_rate": 1.4832469572865754e-05, "epoch": 0.7526336324619587, "percentage": 75.26, "elapsed_time": "1 day, 7:57:38", "remaining_time": "10:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13504, "total_steps": 17941, "loss": 1.56, "learning_rate": 1.4826140615560469e-05, "epoch": 0.7526893707151218, "percentage": 75.27, "elapsed_time": "1 day, 7:57:46", "remaining_time": "10:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13505, "total_steps": 17941, "loss": 1.7928, "learning_rate": 1.4819812773764924e-05, "epoch": 0.752745108968285, "percentage": 75.27, "elapsed_time": "1 day, 7:57:55", "remaining_time": "10:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13506, "total_steps": 17941, "loss": 1.7989, "learning_rate": 1.4813486047679808e-05, "epoch": 0.7528008472214481, "percentage": 75.28, "elapsed_time": "1 day, 7:58:03", "remaining_time": "10:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13507, "total_steps": 17941, "loss": 1.8563, "learning_rate": 1.4807160437505756e-05, "epoch": 0.7528565854746112, "percentage": 75.29, "elapsed_time": "1 day, 7:58:12", "remaining_time": "10:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13508, "total_steps": 17941, "loss": 1.6341, "learning_rate": 1.4800835943443392e-05, "epoch": 0.7529123237277744, "percentage": 75.29, "elapsed_time": "1 day, 7:58:20", "remaining_time": "10:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13509, "total_steps": 17941, "loss": 1.5606, "learning_rate": 1.4794512565693303e-05, "epoch": 0.7529680619809375, "percentage": 75.3, "elapsed_time": "1 day, 7:58:29", "remaining_time": "10:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13510, "total_steps": 17941, "loss": 1.6136, "learning_rate": 1.4788190304455996e-05, "epoch": 0.7530238002341006, "percentage": 75.3, "elapsed_time": "1 day, 7:58:37", "remaining_time": "10:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13511, "total_steps": 17941, "loss": 1.6516, "learning_rate": 1.4781869159931994e-05, "epoch": 0.7530795384872638, "percentage": 75.31, "elapsed_time": "1 day, 7:58:46", "remaining_time": "10:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13512, "total_steps": 17941, "loss": 1.6058, "learning_rate": 1.4775549132321764e-05, "epoch": 0.7531352767404269, "percentage": 75.31, "elapsed_time": "1 day, 7:58:54", "remaining_time": "10:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13513, "total_steps": 17941, "loss": 1.6085, "learning_rate": 1.4769230221825741e-05, "epoch": 0.7531910149935901, "percentage": 75.32, "elapsed_time": "1 day, 7:59:02", "remaining_time": "10:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13514, "total_steps": 17941, "loss": 1.5802, "learning_rate": 1.4762912428644348e-05, "epoch": 0.7532467532467533, "percentage": 75.32, "elapsed_time": "1 day, 7:59:11", "remaining_time": "10:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13515, "total_steps": 17941, "loss": 1.5401, "learning_rate": 1.4756595752977892e-05, "epoch": 0.7533024914999163, "percentage": 75.33, "elapsed_time": "1 day, 7:59:20", "remaining_time": "10:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13516, "total_steps": 17941, "loss": 1.6784, "learning_rate": 1.4756595752977892e-05, "epoch": 0.7533582297530795, "percentage": 75.34, "elapsed_time": "1 day, 7:59:28", "remaining_time": "10:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13517, "total_steps": 17941, "loss": 1.782, "learning_rate": 1.4750280195026767e-05, "epoch": 0.7534139680062427, "percentage": 75.34, "elapsed_time": "1 day, 7:59:38", "remaining_time": "10:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13518, "total_steps": 17941, "loss": 1.4861, "learning_rate": 1.4743965754991217e-05, "epoch": 0.7534697062594058, "percentage": 75.35, "elapsed_time": "1 day, 7:59:46", "remaining_time": "10:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13519, "total_steps": 17941, "loss": 1.8707, "learning_rate": 1.4737652433071513e-05, "epoch": 0.753525444512569, "percentage": 75.35, "elapsed_time": "1 day, 7:59:54", "remaining_time": "10:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13520, "total_steps": 17941, "loss": 1.606, "learning_rate": 1.4731340229467888e-05, "epoch": 0.7535811827657322, "percentage": 75.36, "elapsed_time": "1 day, 8:00:03", "remaining_time": "10:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13521, "total_steps": 17941, "loss": 1.7317, "learning_rate": 1.4725029144380515e-05, "epoch": 0.7536369210188952, "percentage": 75.36, "elapsed_time": "1 day, 8:00:11", "remaining_time": "10:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13522, "total_steps": 17941, "loss": 1.5096, "learning_rate": 1.4718719178009567e-05, "epoch": 0.7536926592720584, "percentage": 75.37, "elapsed_time": "1 day, 8:00:20", "remaining_time": "10:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13523, "total_steps": 17941, "loss": 1.5065, "learning_rate": 1.471241033055511e-05, "epoch": 0.7537483975252216, "percentage": 75.37, "elapsed_time": "1 day, 8:00:28", "remaining_time": "10:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13524, "total_steps": 17941, "loss": 1.5696, "learning_rate": 1.4706102602217291e-05, "epoch": 0.7538041357783847, "percentage": 75.38, "elapsed_time": "1 day, 8:00:37", "remaining_time": "10:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13525, "total_steps": 17941, "loss": 1.7403, "learning_rate": 1.4699795993196103e-05, "epoch": 0.7538598740315479, "percentage": 75.39, "elapsed_time": "1 day, 8:00:45", "remaining_time": "10:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13526, "total_steps": 17941, "loss": 1.6232, "learning_rate": 1.4693490503691571e-05, "epoch": 0.753915612284711, "percentage": 75.39, "elapsed_time": "1 day, 8:00:54", "remaining_time": "10:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13527, "total_steps": 17941, "loss": 1.732, "learning_rate": 1.4687186133903668e-05, "epoch": 0.7539713505378741, "percentage": 75.4, "elapsed_time": "1 day, 8:01:02", "remaining_time": "10:26:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13528, "total_steps": 17941, "loss": 1.4731, "learning_rate": 1.4680882884032332e-05, "epoch": 0.7540270887910373, "percentage": 75.4, "elapsed_time": "1 day, 8:01:11", "remaining_time": "10:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13529, "total_steps": 17941, "loss": 1.6842, "learning_rate": 1.4674580754277483e-05, "epoch": 0.7540828270442005, "percentage": 75.41, "elapsed_time": "1 day, 8:01:19", "remaining_time": "10:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13530, "total_steps": 17941, "loss": 1.6571, "learning_rate": 1.4668279744838958e-05, "epoch": 0.7541385652973636, "percentage": 75.41, "elapsed_time": "1 day, 8:01:28", "remaining_time": "10:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13531, "total_steps": 17941, "loss": 1.5902, "learning_rate": 1.4661979855916602e-05, "epoch": 0.7541943035505267, "percentage": 75.42, "elapsed_time": "1 day, 8:01:36", "remaining_time": "10:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13532, "total_steps": 17941, "loss": 1.799, "learning_rate": 1.4655681087710205e-05, "epoch": 0.7542500418036898, "percentage": 75.43, "elapsed_time": "1 day, 8:01:44", "remaining_time": "10:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13533, "total_steps": 17941, "loss": 1.477, "learning_rate": 1.4649383440419534e-05, "epoch": 0.754305780056853, "percentage": 75.43, "elapsed_time": "1 day, 8:01:53", "remaining_time": "10:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13534, "total_steps": 17941, "loss": 1.6655, "learning_rate": 1.4643086914244314e-05, "epoch": 0.7543615183100162, "percentage": 75.44, "elapsed_time": "1 day, 8:02:01", "remaining_time": "10:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13535, "total_steps": 17941, "loss": 1.7415, "learning_rate": 1.463679150938423e-05, "epoch": 0.7544172565631793, "percentage": 75.44, "elapsed_time": "1 day, 8:02:10", "remaining_time": "10:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13536, "total_steps": 17941, "loss": 1.5266, "learning_rate": 1.4630497226038953e-05, "epoch": 0.7544729948163424, "percentage": 75.45, "elapsed_time": "1 day, 8:02:18", "remaining_time": "10:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13537, "total_steps": 17941, "loss": 1.5921, "learning_rate": 1.462420406440807e-05, "epoch": 0.7545287330695056, "percentage": 75.45, "elapsed_time": "1 day, 8:02:27", "remaining_time": "10:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13538, "total_steps": 17941, "loss": 1.5367, "learning_rate": 1.4617912024691177e-05, "epoch": 0.7545844713226687, "percentage": 75.46, "elapsed_time": "1 day, 8:02:35", "remaining_time": "10:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13539, "total_steps": 17941, "loss": 1.3466, "learning_rate": 1.4611621107087826e-05, "epoch": 0.7546402095758319, "percentage": 75.46, "elapsed_time": "1 day, 8:02:44", "remaining_time": "10:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13540, "total_steps": 17941, "loss": 1.5763, "learning_rate": 1.4605331311797526e-05, "epoch": 0.7546959478289951, "percentage": 75.47, "elapsed_time": "1 day, 8:02:53", "remaining_time": "10:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13541, "total_steps": 17941, "loss": 2.1011, "learning_rate": 1.4599042639019767e-05, "epoch": 0.7547516860821581, "percentage": 75.48, "elapsed_time": "1 day, 8:03:02", "remaining_time": "10:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13542, "total_steps": 17941, "loss": 1.7852, "learning_rate": 1.4592755088953935e-05, "epoch": 0.7548074243353213, "percentage": 75.48, "elapsed_time": "1 day, 8:03:10", "remaining_time": "10:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13543, "total_steps": 17941, "loss": 1.7704, "learning_rate": 1.4586468661799512e-05, "epoch": 0.7548631625884845, "percentage": 75.49, "elapsed_time": "1 day, 8:03:20", "remaining_time": "10:24:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13544, "total_steps": 17941, "loss": 1.6328, "learning_rate": 1.458018335775581e-05, "epoch": 0.7549189008416476, "percentage": 75.49, "elapsed_time": "1 day, 8:03:28", "remaining_time": "10:24:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13545, "total_steps": 17941, "loss": 1.4073, "learning_rate": 1.4573899177022176e-05, "epoch": 0.7549746390948108, "percentage": 75.5, "elapsed_time": "1 day, 8:03:36", "remaining_time": "10:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13546, "total_steps": 17941, "loss": 1.4983, "learning_rate": 1.4567616119797916e-05, "epoch": 0.755030377347974, "percentage": 75.5, "elapsed_time": "1 day, 8:03:45", "remaining_time": "10:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13547, "total_steps": 17941, "loss": 1.7044, "learning_rate": 1.4561334186282288e-05, "epoch": 0.755086115601137, "percentage": 75.51, "elapsed_time": "1 day, 8:03:53", "remaining_time": "10:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13548, "total_steps": 17941, "loss": 1.5564, "learning_rate": 1.4555053376674532e-05, "epoch": 0.7551418538543002, "percentage": 75.51, "elapsed_time": "1 day, 8:04:02", "remaining_time": "10:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13549, "total_steps": 17941, "loss": 1.5752, "learning_rate": 1.4548773691173794e-05, "epoch": 0.7551975921074634, "percentage": 75.52, "elapsed_time": "1 day, 8:04:10", "remaining_time": "10:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13550, "total_steps": 17941, "loss": 1.5379, "learning_rate": 1.4542495129979294e-05, "epoch": 0.7552533303606265, "percentage": 75.53, "elapsed_time": "1 day, 8:04:19", "remaining_time": "10:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13551, "total_steps": 17941, "loss": 1.6103, "learning_rate": 1.4536217693290094e-05, "epoch": 0.7553090686137897, "percentage": 75.53, "elapsed_time": "1 day, 8:04:27", "remaining_time": "10:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13552, "total_steps": 17941, "loss": 1.2465, "learning_rate": 1.4529941381305307e-05, "epoch": 0.7553648068669528, "percentage": 75.54, "elapsed_time": "1 day, 8:04:36", "remaining_time": "10:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13553, "total_steps": 17941, "loss": 1.8333, "learning_rate": 1.4523666194223972e-05, "epoch": 0.7554205451201159, "percentage": 75.54, "elapsed_time": "1 day, 8:04:44", "remaining_time": "10:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13554, "total_steps": 17941, "loss": 1.6442, "learning_rate": 1.4517392132245105e-05, "epoch": 0.7554762833732791, "percentage": 75.55, "elapsed_time": "1 day, 8:04:53", "remaining_time": "10:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13555, "total_steps": 17941, "loss": 1.5921, "learning_rate": 1.4511119195567696e-05, "epoch": 0.7555320216264422, "percentage": 75.55, "elapsed_time": "1 day, 8:05:01", "remaining_time": "10:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13556, "total_steps": 17941, "loss": 1.833, "learning_rate": 1.4504847384390657e-05, "epoch": 0.7555877598796054, "percentage": 75.56, "elapsed_time": "1 day, 8:05:10", "remaining_time": "10:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13557, "total_steps": 17941, "loss": 1.8395, "learning_rate": 1.4498576698912902e-05, "epoch": 0.7556434981327685, "percentage": 75.56, "elapsed_time": "1 day, 8:05:18", "remaining_time": "10:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13558, "total_steps": 17941, "loss": 1.4357, "learning_rate": 1.4492307139333316e-05, "epoch": 0.7556992363859316, "percentage": 75.57, "elapsed_time": "1 day, 8:05:27", "remaining_time": "10:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13559, "total_steps": 17941, "loss": 1.511, "learning_rate": 1.448603870585072e-05, "epoch": 0.7557549746390948, "percentage": 75.58, "elapsed_time": "1 day, 8:05:35", "remaining_time": "10:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13560, "total_steps": 17941, "loss": 1.5333, "learning_rate": 1.447977139866391e-05, "epoch": 0.755810712892258, "percentage": 75.58, "elapsed_time": "1 day, 8:05:43", "remaining_time": "10:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13561, "total_steps": 17941, "loss": 1.3624, "learning_rate": 1.447350521797166e-05, "epoch": 0.7558664511454211, "percentage": 75.59, "elapsed_time": "1 day, 8:05:52", "remaining_time": "10:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13562, "total_steps": 17941, "loss": 1.3457, "learning_rate": 1.4467240163972706e-05, "epoch": 0.7559221893985842, "percentage": 75.59, "elapsed_time": "1 day, 8:06:00", "remaining_time": "10:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13563, "total_steps": 17941, "loss": 1.1391, "learning_rate": 1.4460976236865703e-05, "epoch": 0.7559779276517474, "percentage": 75.6, "elapsed_time": "1 day, 8:06:09", "remaining_time": "10:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13564, "total_steps": 17941, "loss": 1.7568, "learning_rate": 1.4454713436849333e-05, "epoch": 0.7560336659049105, "percentage": 75.6, "elapsed_time": "1 day, 8:06:17", "remaining_time": "10:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13565, "total_steps": 17941, "loss": 1.6173, "learning_rate": 1.4448451764122206e-05, "epoch": 0.7560894041580737, "percentage": 75.61, "elapsed_time": "1 day, 8:06:26", "remaining_time": "10:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13566, "total_steps": 17941, "loss": 1.7494, "learning_rate": 1.4442191218882911e-05, "epoch": 0.7561451424112369, "percentage": 75.61, "elapsed_time": "1 day, 8:06:34", "remaining_time": "10:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13567, "total_steps": 17941, "loss": 1.6753, "learning_rate": 1.4435931801329994e-05, "epoch": 0.7562008806643999, "percentage": 75.62, "elapsed_time": "1 day, 8:06:43", "remaining_time": "10:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13568, "total_steps": 17941, "loss": 1.7557, "learning_rate": 1.4429673511661962e-05, "epoch": 0.7562566189175631, "percentage": 75.63, "elapsed_time": "1 day, 8:06:51", "remaining_time": "10:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13569, "total_steps": 17941, "loss": 1.6739, "learning_rate": 1.4423416350077318e-05, "epoch": 0.7563123571707263, "percentage": 75.63, "elapsed_time": "1 day, 8:06:59", "remaining_time": "10:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13570, "total_steps": 17941, "loss": 1.824, "learning_rate": 1.4417160316774465e-05, "epoch": 0.7563680954238894, "percentage": 75.64, "elapsed_time": "1 day, 8:07:09", "remaining_time": "10:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13571, "total_steps": 17941, "loss": 1.5959, "learning_rate": 1.4410905411951824e-05, "epoch": 0.7564238336770526, "percentage": 75.64, "elapsed_time": "1 day, 8:07:17", "remaining_time": "10:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13572, "total_steps": 17941, "loss": 1.6415, "learning_rate": 1.4404651635807764e-05, "epoch": 0.7564795719302158, "percentage": 75.65, "elapsed_time": "1 day, 8:07:25", "remaining_time": "10:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13573, "total_steps": 17941, "loss": 1.3973, "learning_rate": 1.4398398988540623e-05, "epoch": 0.7565353101833788, "percentage": 75.65, "elapsed_time": "1 day, 8:07:34", "remaining_time": "10:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13574, "total_steps": 17941, "loss": 1.5665, "learning_rate": 1.4392147470348704e-05, "epoch": 0.756591048436542, "percentage": 75.66, "elapsed_time": "1 day, 8:07:42", "remaining_time": "10:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13575, "total_steps": 17941, "loss": 1.4084, "learning_rate": 1.4385897081430233e-05, "epoch": 0.7566467866897052, "percentage": 75.66, "elapsed_time": "1 day, 8:07:51", "remaining_time": "10:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13576, "total_steps": 17941, "loss": 1.6453, "learning_rate": 1.4379647821983488e-05, "epoch": 0.7567025249428683, "percentage": 75.67, "elapsed_time": "1 day, 8:07:59", "remaining_time": "10:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13577, "total_steps": 17941, "loss": 1.7396, "learning_rate": 1.4373399692206618e-05, "epoch": 0.7567582631960315, "percentage": 75.68, "elapsed_time": "1 day, 8:08:08", "remaining_time": "10:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13578, "total_steps": 17941, "loss": 1.8246, "learning_rate": 1.4367152692297797e-05, "epoch": 0.7568140014491945, "percentage": 75.68, "elapsed_time": "1 day, 8:08:16", "remaining_time": "10:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13579, "total_steps": 17941, "loss": 1.5035, "learning_rate": 1.4360906822455134e-05, "epoch": 0.7568697397023577, "percentage": 75.69, "elapsed_time": "1 day, 8:08:25", "remaining_time": "10:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13580, "total_steps": 17941, "loss": 1.6054, "learning_rate": 1.4354662082876718e-05, "epoch": 0.7569254779555209, "percentage": 75.69, "elapsed_time": "1 day, 8:08:33", "remaining_time": "10:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13581, "total_steps": 17941, "loss": 1.5249, "learning_rate": 1.434841847376061e-05, "epoch": 0.756981216208684, "percentage": 75.7, "elapsed_time": "1 day, 8:08:42", "remaining_time": "10:19:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13582, "total_steps": 17941, "loss": 1.6811, "learning_rate": 1.434217599530479e-05, "epoch": 0.7570369544618472, "percentage": 75.7, "elapsed_time": "1 day, 8:08:51", "remaining_time": "10:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13583, "total_steps": 17941, "loss": 1.5311, "learning_rate": 1.4335934647707244e-05, "epoch": 0.7570926927150103, "percentage": 75.71, "elapsed_time": "1 day, 8:08:59", "remaining_time": "10:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13584, "total_steps": 17941, "loss": 1.2596, "learning_rate": 1.432969443116592e-05, "epoch": 0.7571484309681734, "percentage": 75.71, "elapsed_time": "1 day, 8:09:08", "remaining_time": "10:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13585, "total_steps": 17941, "loss": 1.737, "learning_rate": 1.4323455345878717e-05, "epoch": 0.7572041692213366, "percentage": 75.72, "elapsed_time": "1 day, 8:09:16", "remaining_time": "10:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13586, "total_steps": 17941, "loss": 1.6467, "learning_rate": 1.4317217392043496e-05, "epoch": 0.7572599074744998, "percentage": 75.73, "elapsed_time": "1 day, 8:09:25", "remaining_time": "10:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13587, "total_steps": 17941, "loss": 1.6087, "learning_rate": 1.4310980569858096e-05, "epoch": 0.7573156457276629, "percentage": 75.73, "elapsed_time": "1 day, 8:09:33", "remaining_time": "10:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13588, "total_steps": 17941, "loss": 1.495, "learning_rate": 1.4304744879520333e-05, "epoch": 0.757371383980826, "percentage": 75.74, "elapsed_time": "1 day, 8:09:41", "remaining_time": "10:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13589, "total_steps": 17941, "loss": 1.5276, "learning_rate": 1.429851032122792e-05, "epoch": 0.7574271222339892, "percentage": 75.74, "elapsed_time": "1 day, 8:09:50", "remaining_time": "10:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13590, "total_steps": 17941, "loss": 1.3332, "learning_rate": 1.4292276895178608e-05, "epoch": 0.7574828604871523, "percentage": 75.75, "elapsed_time": "1 day, 8:09:58", "remaining_time": "10:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13591, "total_steps": 17941, "loss": 1.6538, "learning_rate": 1.4286044601570086e-05, "epoch": 0.7575385987403155, "percentage": 75.75, "elapsed_time": "1 day, 8:10:07", "remaining_time": "10:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13592, "total_steps": 17941, "loss": 1.6558, "learning_rate": 1.4279813440599999e-05, "epoch": 0.7575943369934787, "percentage": 75.76, "elapsed_time": "1 day, 8:10:15", "remaining_time": "10:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13593, "total_steps": 17941, "loss": 1.9873, "learning_rate": 1.4273583412465968e-05, "epoch": 0.7576500752466417, "percentage": 75.77, "elapsed_time": "1 day, 8:10:24", "remaining_time": "10:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13594, "total_steps": 17941, "loss": 1.5415, "learning_rate": 1.4267354517365572e-05, "epoch": 0.7577058134998049, "percentage": 75.77, "elapsed_time": "1 day, 8:10:32", "remaining_time": "10:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13595, "total_steps": 17941, "loss": 1.7035, "learning_rate": 1.4261126755496368e-05, "epoch": 0.7577615517529681, "percentage": 75.78, "elapsed_time": "1 day, 8:10:41", "remaining_time": "10:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13596, "total_steps": 17941, "loss": 1.5896, "learning_rate": 1.4254900127055843e-05, "epoch": 0.7578172900061312, "percentage": 75.78, "elapsed_time": "1 day, 8:10:49", "remaining_time": "10:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13597, "total_steps": 17941, "loss": 1.5107, "learning_rate": 1.424867463224147e-05, "epoch": 0.7578730282592944, "percentage": 75.79, "elapsed_time": "1 day, 8:10:57", "remaining_time": "10:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13598, "total_steps": 17941, "loss": 1.7632, "learning_rate": 1.4242450271250696e-05, "epoch": 0.7579287665124576, "percentage": 75.79, "elapsed_time": "1 day, 8:11:06", "remaining_time": "10:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13599, "total_steps": 17941, "loss": 1.4528, "learning_rate": 1.4236227044280914e-05, "epoch": 0.7579845047656206, "percentage": 75.8, "elapsed_time": "1 day, 8:11:14", "remaining_time": "10:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13600, "total_steps": 17941, "loss": 1.5148, "learning_rate": 1.4230004951529513e-05, "epoch": 0.7580402430187838, "percentage": 75.8, "elapsed_time": "1 day, 8:11:23", "remaining_time": "10:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13601, "total_steps": 17941, "loss": 1.6172, "learning_rate": 1.4223783993193767e-05, "epoch": 0.7580959812719469, "percentage": 75.81, "elapsed_time": "1 day, 8:11:31", "remaining_time": "10:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13602, "total_steps": 17941, "loss": 1.9368, "learning_rate": 1.4217564169471038e-05, "epoch": 0.7581517195251101, "percentage": 75.82, "elapsed_time": "1 day, 8:11:40", "remaining_time": "10:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13603, "total_steps": 17941, "loss": 1.6861, "learning_rate": 1.421134548055853e-05, "epoch": 0.7582074577782733, "percentage": 75.82, "elapsed_time": "1 day, 8:11:48", "remaining_time": "10:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13604, "total_steps": 17941, "loss": 1.5603, "learning_rate": 1.4205127926653483e-05, "epoch": 0.7582631960314363, "percentage": 75.83, "elapsed_time": "1 day, 8:11:57", "remaining_time": "10:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13605, "total_steps": 17941, "loss": 1.7819, "learning_rate": 1.4198911507953077e-05, "epoch": 0.7583189342845995, "percentage": 75.83, "elapsed_time": "1 day, 8:12:05", "remaining_time": "10:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13606, "total_steps": 17941, "loss": 1.7878, "learning_rate": 1.4192696224654467e-05, "epoch": 0.7583746725377627, "percentage": 75.84, "elapsed_time": "1 day, 8:12:13", "remaining_time": "10:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13607, "total_steps": 17941, "loss": 1.7785, "learning_rate": 1.418648207695477e-05, "epoch": 0.7584304107909258, "percentage": 75.84, "elapsed_time": "1 day, 8:12:22", "remaining_time": "10:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13608, "total_steps": 17941, "loss": 1.6062, "learning_rate": 1.4180269065051043e-05, "epoch": 0.758486149044089, "percentage": 75.85, "elapsed_time": "1 day, 8:12:30", "remaining_time": "10:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13609, "total_steps": 17941, "loss": 1.663, "learning_rate": 1.4174057189140339e-05, "epoch": 0.7585418872972521, "percentage": 75.85, "elapsed_time": "1 day, 8:12:39", "remaining_time": "10:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13610, "total_steps": 17941, "loss": 1.5436, "learning_rate": 1.4167846449419659e-05, "epoch": 0.7585976255504152, "percentage": 75.86, "elapsed_time": "1 day, 8:12:47", "remaining_time": "10:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13611, "total_steps": 17941, "loss": 2.0576, "learning_rate": 1.4161636846085973e-05, "epoch": 0.7586533638035784, "percentage": 75.87, "elapsed_time": "1 day, 8:12:56", "remaining_time": "10:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13612, "total_steps": 17941, "loss": 1.5829, "learning_rate": 1.4155428379336216e-05, "epoch": 0.7587091020567416, "percentage": 75.87, "elapsed_time": "1 day, 8:13:04", "remaining_time": "10:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13613, "total_steps": 17941, "loss": 1.7045, "learning_rate": 1.4149221049367283e-05, "epoch": 0.7587648403099047, "percentage": 75.88, "elapsed_time": "1 day, 8:13:13", "remaining_time": "10:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13614, "total_steps": 17941, "loss": 1.7569, "learning_rate": 1.4143014856376053e-05, "epoch": 0.7588205785630678, "percentage": 75.88, "elapsed_time": "1 day, 8:13:22", "remaining_time": "10:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13615, "total_steps": 17941, "loss": 1.592, "learning_rate": 1.4136809800559308e-05, "epoch": 0.758876316816231, "percentage": 75.89, "elapsed_time": "1 day, 8:13:30", "remaining_time": "10:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13616, "total_steps": 17941, "loss": 1.7016, "learning_rate": 1.4130605882113862e-05, "epoch": 0.7589320550693941, "percentage": 75.89, "elapsed_time": "1 day, 8:13:39", "remaining_time": "10:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13617, "total_steps": 17941, "loss": 1.8053, "learning_rate": 1.4124403101236466e-05, "epoch": 0.7589877933225573, "percentage": 75.9, "elapsed_time": "1 day, 8:13:47", "remaining_time": "10:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13618, "total_steps": 17941, "loss": 1.3909, "learning_rate": 1.411820145812383e-05, "epoch": 0.7590435315757205, "percentage": 75.9, "elapsed_time": "1 day, 8:13:55", "remaining_time": "10:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13619, "total_steps": 17941, "loss": 1.6921, "learning_rate": 1.4112000952972643e-05, "epoch": 0.7590992698288835, "percentage": 75.91, "elapsed_time": "1 day, 8:14:04", "remaining_time": "10:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13620, "total_steps": 17941, "loss": 1.7093, "learning_rate": 1.4105801585979545e-05, "epoch": 0.7591550080820467, "percentage": 75.92, "elapsed_time": "1 day, 8:14:12", "remaining_time": "10:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13621, "total_steps": 17941, "loss": 1.7623, "learning_rate": 1.4099603357341152e-05, "epoch": 0.7592107463352099, "percentage": 75.92, "elapsed_time": "1 day, 8:14:21", "remaining_time": "10:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13622, "total_steps": 17941, "loss": 1.5728, "learning_rate": 1.4093406267254017e-05, "epoch": 0.759266484588373, "percentage": 75.93, "elapsed_time": "1 day, 8:14:29", "remaining_time": "10:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13623, "total_steps": 17941, "loss": 1.653, "learning_rate": 1.4087210315914684e-05, "epoch": 0.7593222228415362, "percentage": 75.93, "elapsed_time": "1 day, 8:14:38", "remaining_time": "10:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13624, "total_steps": 17941, "loss": 1.6385, "learning_rate": 1.4081015503519651e-05, "epoch": 0.7593779610946992, "percentage": 75.94, "elapsed_time": "1 day, 8:14:47", "remaining_time": "10:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13625, "total_steps": 17941, "loss": 1.5487, "learning_rate": 1.4074821830265388e-05, "epoch": 0.7594336993478624, "percentage": 75.94, "elapsed_time": "1 day, 8:14:56", "remaining_time": "10:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13626, "total_steps": 17941, "loss": 1.4538, "learning_rate": 1.406862929634833e-05, "epoch": 0.7594894376010256, "percentage": 75.95, "elapsed_time": "1 day, 8:15:04", "remaining_time": "10:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13627, "total_steps": 17941, "loss": 1.5614, "learning_rate": 1.4062437901964825e-05, "epoch": 0.7595451758541887, "percentage": 75.95, "elapsed_time": "1 day, 8:15:13", "remaining_time": "10:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13628, "total_steps": 17941, "loss": 1.382, "learning_rate": 1.4056247647311294e-05, "epoch": 0.7596009141073519, "percentage": 75.96, "elapsed_time": "1 day, 8:15:21", "remaining_time": "10:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13629, "total_steps": 17941, "loss": 1.5966, "learning_rate": 1.4050058532584003e-05, "epoch": 0.759656652360515, "percentage": 75.97, "elapsed_time": "1 day, 8:15:30", "remaining_time": "10:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13630, "total_steps": 17941, "loss": 1.5784, "learning_rate": 1.4043870557979255e-05, "epoch": 0.7597123906136781, "percentage": 75.97, "elapsed_time": "1 day, 8:15:39", "remaining_time": "10:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13631, "total_steps": 17941, "loss": 1.409, "learning_rate": 1.4037683723693296e-05, "epoch": 0.7597681288668413, "percentage": 75.98, "elapsed_time": "1 day, 8:15:48", "remaining_time": "10:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13632, "total_steps": 17941, "loss": 1.5705, "learning_rate": 1.403149802992233e-05, "epoch": 0.7598238671200045, "percentage": 75.98, "elapsed_time": "1 day, 8:15:56", "remaining_time": "10:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13633, "total_steps": 17941, "loss": 1.8538, "learning_rate": 1.4025313476862551e-05, "epoch": 0.7598796053731676, "percentage": 75.99, "elapsed_time": "1 day, 8:16:04", "remaining_time": "10:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13634, "total_steps": 17941, "loss": 1.3479, "learning_rate": 1.4019130064710068e-05, "epoch": 0.7599353436263308, "percentage": 75.99, "elapsed_time": "1 day, 8:16:13", "remaining_time": "10:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13635, "total_steps": 17941, "loss": 1.6895, "learning_rate": 1.4012947793660996e-05, "epoch": 0.7599910818794939, "percentage": 76.0, "elapsed_time": "1 day, 8:16:21", "remaining_time": "10:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13636, "total_steps": 17941, "loss": 1.5507, "learning_rate": 1.4006766663911397e-05, "epoch": 0.760046820132657, "percentage": 76.0, "elapsed_time": "1 day, 8:16:30", "remaining_time": "10:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13637, "total_steps": 17941, "loss": 1.4995, "learning_rate": 1.4000586675657312e-05, "epoch": 0.7601025583858202, "percentage": 76.01, "elapsed_time": "1 day, 8:16:38", "remaining_time": "10:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13638, "total_steps": 17941, "loss": 1.6442, "learning_rate": 1.399440782909472e-05, "epoch": 0.7601582966389834, "percentage": 76.02, "elapsed_time": "1 day, 8:16:47", "remaining_time": "10:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13639, "total_steps": 17941, "loss": 1.6857, "learning_rate": 1.3988230124419589e-05, "epoch": 0.7602140348921465, "percentage": 76.02, "elapsed_time": "1 day, 8:16:55", "remaining_time": "10:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13640, "total_steps": 17941, "loss": 1.6515, "learning_rate": 1.3982053561827846e-05, "epoch": 0.7602697731453096, "percentage": 76.03, "elapsed_time": "1 day, 8:17:04", "remaining_time": "10:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13641, "total_steps": 17941, "loss": 1.7898, "learning_rate": 1.3975878141515352e-05, "epoch": 0.7603255113984728, "percentage": 76.03, "elapsed_time": "1 day, 8:17:12", "remaining_time": "10:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13642, "total_steps": 17941, "loss": 1.5781, "learning_rate": 1.3969703863677969e-05, "epoch": 0.7603812496516359, "percentage": 76.04, "elapsed_time": "1 day, 8:17:21", "remaining_time": "10:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13643, "total_steps": 17941, "loss": 1.7786, "learning_rate": 1.396353072851151e-05, "epoch": 0.7604369879047991, "percentage": 76.04, "elapsed_time": "1 day, 8:17:29", "remaining_time": "10:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13644, "total_steps": 17941, "loss": 1.6052, "learning_rate": 1.3957358736211745e-05, "epoch": 0.7604927261579623, "percentage": 76.05, "elapsed_time": "1 day, 8:17:37", "remaining_time": "10:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13645, "total_steps": 17941, "loss": 1.7038, "learning_rate": 1.3951187886974416e-05, "epoch": 0.7605484644111253, "percentage": 76.05, "elapsed_time": "1 day, 8:17:46", "remaining_time": "10:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13646, "total_steps": 17941, "loss": 1.6561, "learning_rate": 1.3945018180995234e-05, "epoch": 0.7606042026642885, "percentage": 76.06, "elapsed_time": "1 day, 8:17:54", "remaining_time": "10:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13647, "total_steps": 17941, "loss": 1.6025, "learning_rate": 1.3938849618469868e-05, "epoch": 0.7606599409174516, "percentage": 76.07, "elapsed_time": "1 day, 8:18:03", "remaining_time": "10:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13648, "total_steps": 17941, "loss": 1.7453, "learning_rate": 1.3932682199593933e-05, "epoch": 0.7607156791706148, "percentage": 76.07, "elapsed_time": "1 day, 8:18:11", "remaining_time": "10:09:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13649, "total_steps": 17941, "loss": 1.6144, "learning_rate": 1.3926515924563027e-05, "epoch": 0.760771417423778, "percentage": 76.08, "elapsed_time": "1 day, 8:18:20", "remaining_time": "10:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13650, "total_steps": 17941, "loss": 1.6279, "learning_rate": 1.3920350793572717e-05, "epoch": 0.760827155676941, "percentage": 76.08, "elapsed_time": "1 day, 8:18:29", "remaining_time": "10:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13651, "total_steps": 17941, "loss": 1.6013, "learning_rate": 1.391418680681852e-05, "epoch": 0.7608828939301042, "percentage": 76.09, "elapsed_time": "1 day, 8:18:37", "remaining_time": "10:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13652, "total_steps": 17941, "loss": 1.7508, "learning_rate": 1.3908023964495937e-05, "epoch": 0.7609386321832674, "percentage": 76.09, "elapsed_time": "1 day, 8:18:46", "remaining_time": "10:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13653, "total_steps": 17941, "loss": 1.7573, "learning_rate": 1.390186226680037e-05, "epoch": 0.7609943704364305, "percentage": 76.1, "elapsed_time": "1 day, 8:18:54", "remaining_time": "10:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13654, "total_steps": 17941, "loss": 1.8013, "learning_rate": 1.38957017139273e-05, "epoch": 0.7610501086895937, "percentage": 76.11, "elapsed_time": "1 day, 8:19:03", "remaining_time": "10:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13655, "total_steps": 17941, "loss": 1.5425, "learning_rate": 1.3889542306072052e-05, "epoch": 0.7611058469427568, "percentage": 76.11, "elapsed_time": "1 day, 8:19:11", "remaining_time": "10:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13656, "total_steps": 17941, "loss": 1.694, "learning_rate": 1.388338404342998e-05, "epoch": 0.7611615851959199, "percentage": 76.12, "elapsed_time": "1 day, 8:19:20", "remaining_time": "10:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13657, "total_steps": 17941, "loss": 1.6321, "learning_rate": 1.3877226926196397e-05, "epoch": 0.7612173234490831, "percentage": 76.12, "elapsed_time": "1 day, 8:19:28", "remaining_time": "10:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13658, "total_steps": 17941, "loss": 1.7296, "learning_rate": 1.3871070954566561e-05, "epoch": 0.7612730617022463, "percentage": 76.13, "elapsed_time": "1 day, 8:19:37", "remaining_time": "10:08:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13659, "total_steps": 17941, "loss": 1.5889, "learning_rate": 1.3864916128735727e-05, "epoch": 0.7613287999554094, "percentage": 76.13, "elapsed_time": "1 day, 8:19:46", "remaining_time": "10:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13660, "total_steps": 17941, "loss": 1.6957, "learning_rate": 1.3858762448899037e-05, "epoch": 0.7613845382085725, "percentage": 76.14, "elapsed_time": "1 day, 8:19:55", "remaining_time": "10:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13661, "total_steps": 17941, "loss": 1.504, "learning_rate": 1.3852609915251719e-05, "epoch": 0.7614402764617357, "percentage": 76.14, "elapsed_time": "1 day, 8:20:03", "remaining_time": "10:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13662, "total_steps": 17941, "loss": 1.5899, "learning_rate": 1.3846458527988842e-05, "epoch": 0.7614960147148988, "percentage": 76.15, "elapsed_time": "1 day, 8:20:12", "remaining_time": "10:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13663, "total_steps": 17941, "loss": 1.8645, "learning_rate": 1.3840308287305509e-05, "epoch": 0.761551752968062, "percentage": 76.16, "elapsed_time": "1 day, 8:20:21", "remaining_time": "10:07:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13664, "total_steps": 17941, "loss": 1.7324, "learning_rate": 1.3834159193396778e-05, "epoch": 0.7616074912212252, "percentage": 76.16, "elapsed_time": "1 day, 8:20:29", "remaining_time": "10:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13665, "total_steps": 17941, "loss": 1.8378, "learning_rate": 1.382801124645765e-05, "epoch": 0.7616632294743882, "percentage": 76.17, "elapsed_time": "1 day, 8:20:38", "remaining_time": "10:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13666, "total_steps": 17941, "loss": 1.7662, "learning_rate": 1.3821864446683125e-05, "epoch": 0.7617189677275514, "percentage": 76.17, "elapsed_time": "1 day, 8:20:46", "remaining_time": "10:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13667, "total_steps": 17941, "loss": 1.5952, "learning_rate": 1.3815718794268112e-05, "epoch": 0.7617747059807146, "percentage": 76.18, "elapsed_time": "1 day, 8:20:55", "remaining_time": "10:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13668, "total_steps": 17941, "loss": 1.5949, "learning_rate": 1.3809574289407529e-05, "epoch": 0.7618304442338777, "percentage": 76.18, "elapsed_time": "1 day, 8:21:03", "remaining_time": "10:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13669, "total_steps": 17941, "loss": 1.7301, "learning_rate": 1.3803430932296247e-05, "epoch": 0.7618861824870409, "percentage": 76.19, "elapsed_time": "1 day, 8:21:11", "remaining_time": "10:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13670, "total_steps": 17941, "loss": 1.6325, "learning_rate": 1.3797288723129093e-05, "epoch": 0.761941920740204, "percentage": 76.19, "elapsed_time": "1 day, 8:21:20", "remaining_time": "10:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13671, "total_steps": 17941, "loss": 1.7894, "learning_rate": 1.3791147662100867e-05, "epoch": 0.7619976589933671, "percentage": 76.2, "elapsed_time": "1 day, 8:21:28", "remaining_time": "10:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13672, "total_steps": 17941, "loss": 1.6614, "learning_rate": 1.378500774940632e-05, "epoch": 0.7620533972465303, "percentage": 76.21, "elapsed_time": "1 day, 8:21:37", "remaining_time": "10:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13673, "total_steps": 17941, "loss": 1.2925, "learning_rate": 1.3778868985240195e-05, "epoch": 0.7621091354996934, "percentage": 76.21, "elapsed_time": "1 day, 8:21:45", "remaining_time": "10:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13674, "total_steps": 17941, "loss": 1.4987, "learning_rate": 1.3772731369797154e-05, "epoch": 0.7621648737528566, "percentage": 76.22, "elapsed_time": "1 day, 8:21:54", "remaining_time": "10:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13675, "total_steps": 17941, "loss": 1.6826, "learning_rate": 1.3766594903271845e-05, "epoch": 0.7622206120060198, "percentage": 76.22, "elapsed_time": "1 day, 8:22:02", "remaining_time": "10:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13676, "total_steps": 17941, "loss": 1.7222, "learning_rate": 1.3760459585858897e-05, "epoch": 0.7622763502591828, "percentage": 76.23, "elapsed_time": "1 day, 8:22:10", "remaining_time": "10:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13677, "total_steps": 17941, "loss": 1.6004, "learning_rate": 1.3754325417752878e-05, "epoch": 0.762332088512346, "percentage": 76.23, "elapsed_time": "1 day, 8:22:19", "remaining_time": "10:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13678, "total_steps": 17941, "loss": 1.3402, "learning_rate": 1.374819239914834e-05, "epoch": 0.7623878267655092, "percentage": 76.24, "elapsed_time": "1 day, 8:22:27", "remaining_time": "10:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13679, "total_steps": 17941, "loss": 1.7393, "learning_rate": 1.3742060530239753e-05, "epoch": 0.7624435650186723, "percentage": 76.24, "elapsed_time": "1 day, 8:22:36", "remaining_time": "10:05:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13680, "total_steps": 17941, "loss": 1.7233, "learning_rate": 1.3735929811221637e-05, "epoch": 0.7624993032718355, "percentage": 76.25, "elapsed_time": "1 day, 8:22:44", "remaining_time": "10:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13681, "total_steps": 17941, "loss": 1.3896, "learning_rate": 1.372980024228837e-05, "epoch": 0.7625550415249986, "percentage": 76.26, "elapsed_time": "1 day, 8:22:53", "remaining_time": "10:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13682, "total_steps": 17941, "loss": 1.8186, "learning_rate": 1.3723671823634376e-05, "epoch": 0.7626107797781617, "percentage": 76.26, "elapsed_time": "1 day, 8:23:01", "remaining_time": "10:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13683, "total_steps": 17941, "loss": 1.721, "learning_rate": 1.3717544555454009e-05, "epoch": 0.7626665180313249, "percentage": 76.27, "elapsed_time": "1 day, 8:23:10", "remaining_time": "10:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13684, "total_steps": 17941, "loss": 1.462, "learning_rate": 1.3711418437941582e-05, "epoch": 0.7627222562844881, "percentage": 76.27, "elapsed_time": "1 day, 8:23:18", "remaining_time": "10:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13685, "total_steps": 17941, "loss": 1.5209, "learning_rate": 1.3705293471291403e-05, "epoch": 0.7627779945376512, "percentage": 76.28, "elapsed_time": "1 day, 8:23:27", "remaining_time": "10:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13686, "total_steps": 17941, "loss": 1.5621, "learning_rate": 1.3699169655697669e-05, "epoch": 0.7628337327908143, "percentage": 76.28, "elapsed_time": "1 day, 8:23:36", "remaining_time": "10:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13687, "total_steps": 17941, "loss": 1.7407, "learning_rate": 1.3693046991354658e-05, "epoch": 0.7628894710439775, "percentage": 76.29, "elapsed_time": "1 day, 8:23:44", "remaining_time": "10:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13688, "total_steps": 17941, "loss": 1.6656, "learning_rate": 1.3686925478456497e-05, "epoch": 0.7629452092971406, "percentage": 76.29, "elapsed_time": "1 day, 8:23:53", "remaining_time": "10:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13689, "total_steps": 17941, "loss": 1.4874, "learning_rate": 1.3680805117197344e-05, "epoch": 0.7630009475503038, "percentage": 76.3, "elapsed_time": "1 day, 8:24:01", "remaining_time": "10:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13690, "total_steps": 17941, "loss": 1.6193, "learning_rate": 1.367468590777129e-05, "epoch": 0.763056685803467, "percentage": 76.31, "elapsed_time": "1 day, 8:24:10", "remaining_time": "10:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13691, "total_steps": 17941, "loss": 1.5072, "learning_rate": 1.366856785037241e-05, "epoch": 0.76311242405663, "percentage": 76.31, "elapsed_time": "1 day, 8:24:18", "remaining_time": "10:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13692, "total_steps": 17941, "loss": 1.5143, "learning_rate": 1.3662450945194743e-05, "epoch": 0.7631681623097932, "percentage": 76.32, "elapsed_time": "1 day, 8:24:27", "remaining_time": "10:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13693, "total_steps": 17941, "loss": 1.6937, "learning_rate": 1.3656335192432258e-05, "epoch": 0.7632239005629563, "percentage": 76.32, "elapsed_time": "1 day, 8:24:35", "remaining_time": "10:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13694, "total_steps": 17941, "loss": 1.6081, "learning_rate": 1.3650220592278923e-05, "epoch": 0.7632796388161195, "percentage": 76.33, "elapsed_time": "1 day, 8:24:44", "remaining_time": "10:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13695, "total_steps": 17941, "loss": 1.5314, "learning_rate": 1.3644107144928658e-05, "epoch": 0.7633353770692827, "percentage": 76.33, "elapsed_time": "1 day, 8:24:52", "remaining_time": "10:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13696, "total_steps": 17941, "loss": 1.6142, "learning_rate": 1.3637994850575341e-05, "epoch": 0.7633911153224457, "percentage": 76.34, "elapsed_time": "1 day, 8:25:01", "remaining_time": "10:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13697, "total_steps": 17941, "loss": 1.683, "learning_rate": 1.3631883709412823e-05, "epoch": 0.7634468535756089, "percentage": 76.34, "elapsed_time": "1 day, 8:25:09", "remaining_time": "10:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13698, "total_steps": 17941, "loss": 1.6197, "learning_rate": 1.3625773721634915e-05, "epoch": 0.7635025918287721, "percentage": 76.35, "elapsed_time": "1 day, 8:25:18", "remaining_time": "10:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13699, "total_steps": 17941, "loss": 1.6233, "learning_rate": 1.3619664887435402e-05, "epoch": 0.7635583300819352, "percentage": 76.36, "elapsed_time": "1 day, 8:25:26", "remaining_time": "10:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13700, "total_steps": 17941, "loss": 1.5264, "learning_rate": 1.3613557207007988e-05, "epoch": 0.7636140683350984, "percentage": 76.36, "elapsed_time": "1 day, 8:25:34", "remaining_time": "10:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13701, "total_steps": 17941, "loss": 1.5529, "learning_rate": 1.3607450680546397e-05, "epoch": 0.7636698065882616, "percentage": 76.37, "elapsed_time": "1 day, 8:25:43", "remaining_time": "10:02:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13702, "total_steps": 17941, "loss": 1.8334, "learning_rate": 1.3601345308244284e-05, "epoch": 0.7637255448414246, "percentage": 76.37, "elapsed_time": "1 day, 8:25:51", "remaining_time": "10:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13703, "total_steps": 17941, "loss": 1.3872, "learning_rate": 1.359524109029528e-05, "epoch": 0.7637812830945878, "percentage": 76.38, "elapsed_time": "1 day, 8:26:00", "remaining_time": "10:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13704, "total_steps": 17941, "loss": 1.7196, "learning_rate": 1.3589138026892988e-05, "epoch": 0.763837021347751, "percentage": 76.38, "elapsed_time": "1 day, 8:26:08", "remaining_time": "10:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13705, "total_steps": 17941, "loss": 1.7068, "learning_rate": 1.3583036118230924e-05, "epoch": 0.7638927596009141, "percentage": 76.39, "elapsed_time": "1 day, 8:26:17", "remaining_time": "10:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13706, "total_steps": 17941, "loss": 1.6201, "learning_rate": 1.3576935364502653e-05, "epoch": 0.7639484978540773, "percentage": 76.39, "elapsed_time": "1 day, 8:26:25", "remaining_time": "10:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13707, "total_steps": 17941, "loss": 1.697, "learning_rate": 1.3570835765901612e-05, "epoch": 0.7640042361072404, "percentage": 76.4, "elapsed_time": "1 day, 8:26:34", "remaining_time": "10:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13708, "total_steps": 17941, "loss": 1.6438, "learning_rate": 1.3564737322621274e-05, "epoch": 0.7640599743604035, "percentage": 76.41, "elapsed_time": "1 day, 8:26:42", "remaining_time": "10:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13709, "total_steps": 17941, "loss": 1.7532, "learning_rate": 1.355864003485503e-05, "epoch": 0.7641157126135667, "percentage": 76.41, "elapsed_time": "1 day, 8:26:51", "remaining_time": "10:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13710, "total_steps": 17941, "loss": 1.3265, "learning_rate": 1.3552543902796256e-05, "epoch": 0.7641714508667299, "percentage": 76.42, "elapsed_time": "1 day, 8:27:00", "remaining_time": "10:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13711, "total_steps": 17941, "loss": 1.509, "learning_rate": 1.35464489266383e-05, "epoch": 0.764227189119893, "percentage": 76.42, "elapsed_time": "1 day, 8:27:08", "remaining_time": "10:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13712, "total_steps": 17941, "loss": 1.663, "learning_rate": 1.3540355106574416e-05, "epoch": 0.7642829273730561, "percentage": 76.43, "elapsed_time": "1 day, 8:27:17", "remaining_time": "10:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13713, "total_steps": 17941, "loss": 1.6732, "learning_rate": 1.3534262442797923e-05, "epoch": 0.7643386656262193, "percentage": 76.43, "elapsed_time": "1 day, 8:27:25", "remaining_time": "10:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13714, "total_steps": 17941, "loss": 1.5886, "learning_rate": 1.3528170935502005e-05, "epoch": 0.7643944038793824, "percentage": 76.44, "elapsed_time": "1 day, 8:27:33", "remaining_time": "10:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13715, "total_steps": 17941, "loss": 1.5023, "learning_rate": 1.3522080584879854e-05, "epoch": 0.7644501421325456, "percentage": 76.45, "elapsed_time": "1 day, 8:27:42", "remaining_time": "10:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13716, "total_steps": 17941, "loss": 1.5308, "learning_rate": 1.3515991391124627e-05, "epoch": 0.7645058803857087, "percentage": 76.45, "elapsed_time": "1 day, 8:27:50", "remaining_time": "10:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13717, "total_steps": 17941, "loss": 1.7049, "learning_rate": 1.3509903354429437e-05, "epoch": 0.7645616186388718, "percentage": 76.46, "elapsed_time": "1 day, 8:27:59", "remaining_time": "9:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13718, "total_steps": 17941, "loss": 1.6599, "learning_rate": 1.3503816474987379e-05, "epoch": 0.764617356892035, "percentage": 76.46, "elapsed_time": "1 day, 8:28:07", "remaining_time": "9:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13719, "total_steps": 17941, "loss": 1.8447, "learning_rate": 1.3497730752991455e-05, "epoch": 0.7646730951451981, "percentage": 76.47, "elapsed_time": "1 day, 8:28:16", "remaining_time": "9:59:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13720, "total_steps": 17941, "loss": 1.6414, "learning_rate": 1.3491646188634689e-05, "epoch": 0.7647288333983613, "percentage": 76.47, "elapsed_time": "1 day, 8:28:24", "remaining_time": "9:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13721, "total_steps": 17941, "loss": 1.5857, "learning_rate": 1.348556278211005e-05, "epoch": 0.7647845716515245, "percentage": 76.48, "elapsed_time": "1 day, 8:28:33", "remaining_time": "9:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13722, "total_steps": 17941, "loss": 1.7178, "learning_rate": 1.3479480533610468e-05, "epoch": 0.7648403099046875, "percentage": 76.48, "elapsed_time": "1 day, 8:28:41", "remaining_time": "9:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13723, "total_steps": 17941, "loss": 1.864, "learning_rate": 1.3473399443328826e-05, "epoch": 0.7648960481578507, "percentage": 76.49, "elapsed_time": "1 day, 8:28:50", "remaining_time": "9:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13724, "total_steps": 17941, "loss": 1.6681, "learning_rate": 1.3467319511457993e-05, "epoch": 0.7649517864110139, "percentage": 76.5, "elapsed_time": "1 day, 8:28:58", "remaining_time": "9:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13725, "total_steps": 17941, "loss": 1.5217, "learning_rate": 1.34612407381908e-05, "epoch": 0.765007524664177, "percentage": 76.5, "elapsed_time": "1 day, 8:29:06", "remaining_time": "9:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13726, "total_steps": 17941, "loss": 1.3252, "learning_rate": 1.3455163123719999e-05, "epoch": 0.7650632629173402, "percentage": 76.51, "elapsed_time": "1 day, 8:29:15", "remaining_time": "9:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13727, "total_steps": 17941, "loss": 1.5403, "learning_rate": 1.344908666823836e-05, "epoch": 0.7651190011705034, "percentage": 76.51, "elapsed_time": "1 day, 8:29:23", "remaining_time": "9:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13728, "total_steps": 17941, "loss": 1.7533, "learning_rate": 1.3443011371938574e-05, "epoch": 0.7651747394236664, "percentage": 76.52, "elapsed_time": "1 day, 8:29:32", "remaining_time": "9:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13729, "total_steps": 17941, "loss": 1.7345, "learning_rate": 1.3436937235013331e-05, "epoch": 0.7652304776768296, "percentage": 76.52, "elapsed_time": "1 day, 8:29:41", "remaining_time": "9:58:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13730, "total_steps": 17941, "loss": 1.5839, "learning_rate": 1.3430864257655273e-05, "epoch": 0.7652862159299928, "percentage": 76.53, "elapsed_time": "1 day, 8:29:49", "remaining_time": "9:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13731, "total_steps": 17941, "loss": 1.4791, "learning_rate": 1.3424792440056966e-05, "epoch": 0.7653419541831559, "percentage": 76.53, "elapsed_time": "1 day, 8:29:58", "remaining_time": "9:57:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13732, "total_steps": 17941, "loss": 1.5329, "learning_rate": 1.3418721782411015e-05, "epoch": 0.765397692436319, "percentage": 76.54, "elapsed_time": "1 day, 8:30:07", "remaining_time": "9:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13733, "total_steps": 17941, "loss": 1.7906, "learning_rate": 1.3412652284909916e-05, "epoch": 0.7654534306894822, "percentage": 76.55, "elapsed_time": "1 day, 8:30:15", "remaining_time": "9:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13734, "total_steps": 17941, "loss": 1.952, "learning_rate": 1.3406583947746166e-05, "epoch": 0.7655091689426453, "percentage": 76.55, "elapsed_time": "1 day, 8:30:23", "remaining_time": "9:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13735, "total_steps": 17941, "loss": 1.6007, "learning_rate": 1.340051677111222e-05, "epoch": 0.7655649071958085, "percentage": 76.56, "elapsed_time": "1 day, 8:30:32", "remaining_time": "9:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13736, "total_steps": 17941, "loss": 1.6623, "learning_rate": 1.3394450755200488e-05, "epoch": 0.7656206454489717, "percentage": 76.56, "elapsed_time": "1 day, 8:30:40", "remaining_time": "9:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13737, "total_steps": 17941, "loss": 1.7574, "learning_rate": 1.3388385900203371e-05, "epoch": 0.7656763837021348, "percentage": 76.57, "elapsed_time": "1 day, 8:30:49", "remaining_time": "9:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13738, "total_steps": 17941, "loss": 1.5834, "learning_rate": 1.3382322206313164e-05, "epoch": 0.7657321219552979, "percentage": 76.57, "elapsed_time": "1 day, 8:30:58", "remaining_time": "9:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13739, "total_steps": 17941, "loss": 1.7372, "learning_rate": 1.337625967372223e-05, "epoch": 0.765787860208461, "percentage": 76.58, "elapsed_time": "1 day, 8:31:07", "remaining_time": "9:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13740, "total_steps": 17941, "loss": 1.8107, "learning_rate": 1.3370198302622794e-05, "epoch": 0.7658435984616242, "percentage": 76.58, "elapsed_time": "1 day, 8:31:15", "remaining_time": "9:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13741, "total_steps": 17941, "loss": 1.4694, "learning_rate": 1.3364138093207096e-05, "epoch": 0.7658993367147874, "percentage": 76.59, "elapsed_time": "1 day, 8:31:24", "remaining_time": "9:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13742, "total_steps": 17941, "loss": 1.6048, "learning_rate": 1.3358079045667338e-05, "epoch": 0.7659550749679505, "percentage": 76.6, "elapsed_time": "1 day, 8:31:32", "remaining_time": "9:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13743, "total_steps": 17941, "loss": 1.5999, "learning_rate": 1.3352021160195676e-05, "epoch": 0.7660108132211136, "percentage": 76.6, "elapsed_time": "1 day, 8:31:40", "remaining_time": "9:56:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13744, "total_steps": 17941, "loss": 1.5563, "learning_rate": 1.3345964436984249e-05, "epoch": 0.7660665514742768, "percentage": 76.61, "elapsed_time": "1 day, 8:31:49", "remaining_time": "9:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13745, "total_steps": 17941, "loss": 1.4062, "learning_rate": 1.3339908876225105e-05, "epoch": 0.7661222897274399, "percentage": 76.61, "elapsed_time": "1 day, 8:31:57", "remaining_time": "9:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13746, "total_steps": 17941, "loss": 1.5772, "learning_rate": 1.3333854478110309e-05, "epoch": 0.7661780279806031, "percentage": 76.62, "elapsed_time": "1 day, 8:32:06", "remaining_time": "9:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13747, "total_steps": 17941, "loss": 1.7012, "learning_rate": 1.3327801242831867e-05, "epoch": 0.7662337662337663, "percentage": 76.62, "elapsed_time": "1 day, 8:32:14", "remaining_time": "9:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13748, "total_steps": 17941, "loss": 1.5764, "learning_rate": 1.332174917058176e-05, "epoch": 0.7662895044869293, "percentage": 76.63, "elapsed_time": "1 day, 8:32:23", "remaining_time": "9:55:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13749, "total_steps": 17941, "loss": 1.4723, "learning_rate": 1.3315698261551917e-05, "epoch": 0.7663452427400925, "percentage": 76.63, "elapsed_time": "1 day, 8:32:32", "remaining_time": "9:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13750, "total_steps": 17941, "loss": 1.6053, "learning_rate": 1.3309648515934241e-05, "epoch": 0.7664009809932557, "percentage": 76.64, "elapsed_time": "1 day, 8:32:40", "remaining_time": "9:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13751, "total_steps": 17941, "loss": 1.5209, "learning_rate": 1.3303599933920613e-05, "epoch": 0.7664567192464188, "percentage": 76.65, "elapsed_time": "1 day, 8:32:49", "remaining_time": "9:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13752, "total_steps": 17941, "loss": 1.8081, "learning_rate": 1.3297552515702822e-05, "epoch": 0.766512457499582, "percentage": 76.65, "elapsed_time": "1 day, 8:32:57", "remaining_time": "9:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13753, "total_steps": 17941, "loss": 1.754, "learning_rate": 1.3291506261472675e-05, "epoch": 0.7665681957527452, "percentage": 76.66, "elapsed_time": "1 day, 8:33:06", "remaining_time": "9:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13754, "total_steps": 17941, "loss": 1.622, "learning_rate": 1.3285461171421925e-05, "epoch": 0.7666239340059082, "percentage": 76.66, "elapsed_time": "1 day, 8:33:14", "remaining_time": "9:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13755, "total_steps": 17941, "loss": 1.6621, "learning_rate": 1.3279417245742286e-05, "epoch": 0.7666796722590714, "percentage": 76.67, "elapsed_time": "1 day, 8:33:23", "remaining_time": "9:54:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13756, "total_steps": 17941, "loss": 1.6559, "learning_rate": 1.327337448462545e-05, "epoch": 0.7667354105122346, "percentage": 76.67, "elapsed_time": "1 day, 8:33:31", "remaining_time": "9:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13757, "total_steps": 17941, "loss": 1.631, "learning_rate": 1.3267332888263013e-05, "epoch": 0.7667911487653977, "percentage": 76.68, "elapsed_time": "1 day, 8:33:39", "remaining_time": "9:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13758, "total_steps": 17941, "loss": 1.6011, "learning_rate": 1.3261292456846647e-05, "epoch": 0.7668468870185609, "percentage": 76.68, "elapsed_time": "1 day, 8:33:48", "remaining_time": "9:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13759, "total_steps": 17941, "loss": 1.7915, "learning_rate": 1.3255253190567863e-05, "epoch": 0.766902625271724, "percentage": 76.69, "elapsed_time": "1 day, 8:33:56", "remaining_time": "9:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13760, "total_steps": 17941, "loss": 1.6165, "learning_rate": 1.3249215089618211e-05, "epoch": 0.7669583635248871, "percentage": 76.7, "elapsed_time": "1 day, 8:34:05", "remaining_time": "9:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13761, "total_steps": 17941, "loss": 1.5416, "learning_rate": 1.3243178154189184e-05, "epoch": 0.7670141017780503, "percentage": 76.7, "elapsed_time": "1 day, 8:34:13", "remaining_time": "9:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13762, "total_steps": 17941, "loss": 1.678, "learning_rate": 1.323714238447224e-05, "epoch": 0.7670698400312134, "percentage": 76.71, "elapsed_time": "1 day, 8:34:22", "remaining_time": "9:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13763, "total_steps": 17941, "loss": 1.6428, "learning_rate": 1.3231107780658814e-05, "epoch": 0.7671255782843766, "percentage": 76.71, "elapsed_time": "1 day, 8:34:30", "remaining_time": "9:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13764, "total_steps": 17941, "loss": 1.6772, "learning_rate": 1.3225074342940235e-05, "epoch": 0.7671813165375397, "percentage": 76.72, "elapsed_time": "1 day, 8:34:39", "remaining_time": "9:53:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13765, "total_steps": 17941, "loss": 1.4968, "learning_rate": 1.321904207150792e-05, "epoch": 0.7672370547907028, "percentage": 76.72, "elapsed_time": "1 day, 8:34:47", "remaining_time": "9:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13766, "total_steps": 17941, "loss": 1.67, "learning_rate": 1.321301096655313e-05, "epoch": 0.767292793043866, "percentage": 76.73, "elapsed_time": "1 day, 8:34:56", "remaining_time": "9:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13767, "total_steps": 17941, "loss": 1.6711, "learning_rate": 1.3206981028267145e-05, "epoch": 0.7673485312970292, "percentage": 76.73, "elapsed_time": "1 day, 8:35:04", "remaining_time": "9:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13768, "total_steps": 17941, "loss": 1.7168, "learning_rate": 1.3200952256841204e-05, "epoch": 0.7674042695501923, "percentage": 76.74, "elapsed_time": "1 day, 8:35:13", "remaining_time": "9:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13769, "total_steps": 17941, "loss": 1.5528, "learning_rate": 1.3194924652466507e-05, "epoch": 0.7674600078033554, "percentage": 76.75, "elapsed_time": "1 day, 8:35:21", "remaining_time": "9:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13770, "total_steps": 17941, "loss": 1.668, "learning_rate": 1.3188898215334228e-05, "epoch": 0.7675157460565186, "percentage": 76.75, "elapsed_time": "1 day, 8:35:30", "remaining_time": "9:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13771, "total_steps": 17941, "loss": 1.5727, "learning_rate": 1.3182872945635455e-05, "epoch": 0.7675714843096817, "percentage": 76.76, "elapsed_time": "1 day, 8:35:38", "remaining_time": "9:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13772, "total_steps": 17941, "loss": 1.6687, "learning_rate": 1.317684884356129e-05, "epoch": 0.7676272225628449, "percentage": 76.76, "elapsed_time": "1 day, 8:35:47", "remaining_time": "9:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13773, "total_steps": 17941, "loss": 1.7627, "learning_rate": 1.3170825909302792e-05, "epoch": 0.7676829608160081, "percentage": 76.77, "elapsed_time": "1 day, 8:35:56", "remaining_time": "9:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13774, "total_steps": 17941, "loss": 1.4726, "learning_rate": 1.3164804143050963e-05, "epoch": 0.7677386990691711, "percentage": 76.77, "elapsed_time": "1 day, 8:36:04", "remaining_time": "9:51:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13775, "total_steps": 17941, "loss": 1.4011, "learning_rate": 1.3158783544996789e-05, "epoch": 0.7677944373223343, "percentage": 76.78, "elapsed_time": "1 day, 8:36:13", "remaining_time": "9:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13776, "total_steps": 17941, "loss": 1.5873, "learning_rate": 1.3152764115331195e-05, "epoch": 0.7678501755754975, "percentage": 76.79, "elapsed_time": "1 day, 8:36:21", "remaining_time": "9:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13777, "total_steps": 17941, "loss": 1.5637, "learning_rate": 1.3146745854245108e-05, "epoch": 0.7679059138286606, "percentage": 76.79, "elapsed_time": "1 day, 8:36:30", "remaining_time": "9:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13778, "total_steps": 17941, "loss": 1.6605, "learning_rate": 1.3140728761929356e-05, "epoch": 0.7679616520818238, "percentage": 76.8, "elapsed_time": "1 day, 8:36:38", "remaining_time": "9:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13779, "total_steps": 17941, "loss": 1.7208, "learning_rate": 1.313471283857478e-05, "epoch": 0.768017390334987, "percentage": 76.8, "elapsed_time": "1 day, 8:36:46", "remaining_time": "9:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13780, "total_steps": 17941, "loss": 1.8526, "learning_rate": 1.3128698084372182e-05, "epoch": 0.76807312858815, "percentage": 76.81, "elapsed_time": "1 day, 8:36:55", "remaining_time": "9:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13781, "total_steps": 17941, "loss": 1.4398, "learning_rate": 1.31226844995123e-05, "epoch": 0.7681288668413132, "percentage": 76.81, "elapsed_time": "1 day, 8:37:04", "remaining_time": "9:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13782, "total_steps": 17941, "loss": 1.6531, "learning_rate": 1.3116672084185872e-05, "epoch": 0.7681846050944764, "percentage": 76.82, "elapsed_time": "1 day, 8:37:12", "remaining_time": "9:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13783, "total_steps": 17941, "loss": 1.6007, "learning_rate": 1.3110660838583533e-05, "epoch": 0.7682403433476395, "percentage": 76.82, "elapsed_time": "1 day, 8:37:21", "remaining_time": "9:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13784, "total_steps": 17941, "loss": 1.4798, "learning_rate": 1.3104650762895975e-05, "epoch": 0.7682960816008026, "percentage": 76.83, "elapsed_time": "1 day, 8:37:29", "remaining_time": "9:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13785, "total_steps": 17941, "loss": 1.5713, "learning_rate": 1.3098641857313777e-05, "epoch": 0.7683518198539657, "percentage": 76.84, "elapsed_time": "1 day, 8:37:37", "remaining_time": "9:50:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13786, "total_steps": 17941, "loss": 1.7747, "learning_rate": 1.3092634122027497e-05, "epoch": 0.7684075581071289, "percentage": 76.84, "elapsed_time": "1 day, 8:37:46", "remaining_time": "9:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13787, "total_steps": 17941, "loss": 1.6071, "learning_rate": 1.3086627557227687e-05, "epoch": 0.7684632963602921, "percentage": 76.85, "elapsed_time": "1 day, 8:37:54", "remaining_time": "9:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13788, "total_steps": 17941, "loss": 1.823, "learning_rate": 1.3080622163104827e-05, "epoch": 0.7685190346134552, "percentage": 76.85, "elapsed_time": "1 day, 8:38:03", "remaining_time": "9:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13789, "total_steps": 17941, "loss": 1.5356, "learning_rate": 1.3074617939849393e-05, "epoch": 0.7685747728666183, "percentage": 76.86, "elapsed_time": "1 day, 8:38:11", "remaining_time": "9:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13790, "total_steps": 17941, "loss": 1.6255, "learning_rate": 1.3068614887651759e-05, "epoch": 0.7686305111197815, "percentage": 76.86, "elapsed_time": "1 day, 8:38:20", "remaining_time": "9:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13791, "total_steps": 17941, "loss": 1.7089, "learning_rate": 1.3062613006702361e-05, "epoch": 0.7686862493729446, "percentage": 76.87, "elapsed_time": "1 day, 8:38:28", "remaining_time": "9:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13792, "total_steps": 17941, "loss": 1.9307, "learning_rate": 1.3056612297191505e-05, "epoch": 0.7687419876261078, "percentage": 76.87, "elapsed_time": "1 day, 8:38:37", "remaining_time": "9:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13793, "total_steps": 17941, "loss": 1.5325, "learning_rate": 1.3050612759309515e-05, "epoch": 0.768797725879271, "percentage": 76.88, "elapsed_time": "1 day, 8:38:45", "remaining_time": "9:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13794, "total_steps": 17941, "loss": 1.5726, "learning_rate": 1.3044614393246662e-05, "epoch": 0.768853464132434, "percentage": 76.89, "elapsed_time": "1 day, 8:38:53", "remaining_time": "9:48:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13795, "total_steps": 17941, "loss": 1.5083, "learning_rate": 1.3038617199193171e-05, "epoch": 0.7689092023855972, "percentage": 76.89, "elapsed_time": "1 day, 8:39:02", "remaining_time": "9:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13796, "total_steps": 17941, "loss": 1.6135, "learning_rate": 1.3032621177339255e-05, "epoch": 0.7689649406387604, "percentage": 76.9, "elapsed_time": "1 day, 8:39:10", "remaining_time": "9:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13797, "total_steps": 17941, "loss": 1.5547, "learning_rate": 1.3026626327875052e-05, "epoch": 0.7690206788919235, "percentage": 76.9, "elapsed_time": "1 day, 8:39:19", "remaining_time": "9:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13798, "total_steps": 17941, "loss": 1.5781, "learning_rate": 1.3020632650990688e-05, "epoch": 0.7690764171450867, "percentage": 76.91, "elapsed_time": "1 day, 8:39:28", "remaining_time": "9:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13799, "total_steps": 17941, "loss": 1.7391, "learning_rate": 1.301464014687625e-05, "epoch": 0.7691321553982499, "percentage": 76.91, "elapsed_time": "1 day, 8:39:36", "remaining_time": "9:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13800, "total_steps": 17941, "loss": 1.6353, "learning_rate": 1.300864881572179e-05, "epoch": 0.7691878936514129, "percentage": 76.92, "elapsed_time": "1 day, 8:39:44", "remaining_time": "9:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13801, "total_steps": 17941, "loss": 1.7033, "learning_rate": 1.3002658657717314e-05, "epoch": 0.7692436319045761, "percentage": 76.92, "elapsed_time": "1 day, 8:39:53", "remaining_time": "9:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13802, "total_steps": 17941, "loss": 1.7809, "learning_rate": 1.2996669673052797e-05, "epoch": 0.7692993701577393, "percentage": 76.93, "elapsed_time": "1 day, 8:40:01", "remaining_time": "9:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13803, "total_steps": 17941, "loss": 1.3578, "learning_rate": 1.2990681861918186e-05, "epoch": 0.7693551084109024, "percentage": 76.94, "elapsed_time": "1 day, 8:40:10", "remaining_time": "9:47:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13804, "total_steps": 17941, "loss": 1.607, "learning_rate": 1.2984695224503351e-05, "epoch": 0.7694108466640656, "percentage": 76.94, "elapsed_time": "1 day, 8:40:18", "remaining_time": "9:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13805, "total_steps": 17941, "loss": 1.5583, "learning_rate": 1.2978709760998176e-05, "epoch": 0.7694665849172287, "percentage": 76.95, "elapsed_time": "1 day, 8:40:28", "remaining_time": "9:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13806, "total_steps": 17941, "loss": 1.6499, "learning_rate": 1.2972725471592473e-05, "epoch": 0.7695223231703918, "percentage": 76.95, "elapsed_time": "1 day, 8:40:36", "remaining_time": "9:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13807, "total_steps": 17941, "loss": 1.8379, "learning_rate": 1.2966742356476036e-05, "epoch": 0.769578061423555, "percentage": 76.96, "elapsed_time": "1 day, 8:40:44", "remaining_time": "9:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13808, "total_steps": 17941, "loss": 1.4554, "learning_rate": 1.2960760415838625e-05, "epoch": 0.7696337996767181, "percentage": 76.96, "elapsed_time": "1 day, 8:40:53", "remaining_time": "9:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13809, "total_steps": 17941, "loss": 1.6364, "learning_rate": 1.2954779649869914e-05, "epoch": 0.7696895379298813, "percentage": 76.97, "elapsed_time": "1 day, 8:41:01", "remaining_time": "9:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13810, "total_steps": 17941, "loss": 1.8723, "learning_rate": 1.294880005875963e-05, "epoch": 0.7697452761830444, "percentage": 76.97, "elapsed_time": "1 day, 8:41:10", "remaining_time": "9:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13811, "total_steps": 17941, "loss": 1.7793, "learning_rate": 1.2942821642697372e-05, "epoch": 0.7698010144362075, "percentage": 76.98, "elapsed_time": "1 day, 8:41:18", "remaining_time": "9:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13812, "total_steps": 17941, "loss": 1.3296, "learning_rate": 1.293684440187275e-05, "epoch": 0.7698567526893707, "percentage": 76.99, "elapsed_time": "1 day, 8:41:27", "remaining_time": "9:46:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13813, "total_steps": 17941, "loss": 1.8778, "learning_rate": 1.2930868336475332e-05, "epoch": 0.7699124909425339, "percentage": 76.99, "elapsed_time": "1 day, 8:41:35", "remaining_time": "9:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13814, "total_steps": 17941, "loss": 1.8938, "learning_rate": 1.2924893446694647e-05, "epoch": 0.769968229195697, "percentage": 77.0, "elapsed_time": "1 day, 8:41:44", "remaining_time": "9:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13815, "total_steps": 17941, "loss": 2.1305, "learning_rate": 1.2918919732720186e-05, "epoch": 0.7700239674488601, "percentage": 77.0, "elapsed_time": "1 day, 8:41:52", "remaining_time": "9:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13816, "total_steps": 17941, "loss": 1.7058, "learning_rate": 1.291294719474137e-05, "epoch": 0.7700797057020233, "percentage": 77.01, "elapsed_time": "1 day, 8:42:01", "remaining_time": "9:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13817, "total_steps": 17941, "loss": 1.7782, "learning_rate": 1.2906975832947665e-05, "epoch": 0.7701354439551864, "percentage": 77.01, "elapsed_time": "1 day, 8:42:09", "remaining_time": "9:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13818, "total_steps": 17941, "loss": 1.4945, "learning_rate": 1.2901005647528402e-05, "epoch": 0.7701911822083496, "percentage": 77.02, "elapsed_time": "1 day, 8:42:17", "remaining_time": "9:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13819, "total_steps": 17941, "loss": 1.7357, "learning_rate": 1.2895036638672937e-05, "epoch": 0.7702469204615128, "percentage": 77.02, "elapsed_time": "1 day, 8:42:26", "remaining_time": "9:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13820, "total_steps": 17941, "loss": 1.5099, "learning_rate": 1.2889068806570575e-05, "epoch": 0.7703026587146758, "percentage": 77.03, "elapsed_time": "1 day, 8:42:34", "remaining_time": "9:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13821, "total_steps": 17941, "loss": 1.6854, "learning_rate": 1.288310215141058e-05, "epoch": 0.770358396967839, "percentage": 77.04, "elapsed_time": "1 day, 8:42:44", "remaining_time": "9:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13822, "total_steps": 17941, "loss": 1.9443, "learning_rate": 1.287713667338219e-05, "epoch": 0.7704141352210022, "percentage": 77.04, "elapsed_time": "1 day, 8:42:53", "remaining_time": "9:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13823, "total_steps": 17941, "loss": 1.3639, "learning_rate": 1.2871172372674573e-05, "epoch": 0.7704698734741653, "percentage": 77.05, "elapsed_time": "1 day, 8:43:01", "remaining_time": "9:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13824, "total_steps": 17941, "loss": 1.3894, "learning_rate": 1.286520924947689e-05, "epoch": 0.7705256117273285, "percentage": 77.05, "elapsed_time": "1 day, 8:43:10", "remaining_time": "9:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13825, "total_steps": 17941, "loss": 1.6414, "learning_rate": 1.2859247303978255e-05, "epoch": 0.7705813499804917, "percentage": 77.06, "elapsed_time": "1 day, 8:43:19", "remaining_time": "9:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13826, "total_steps": 17941, "loss": 1.5018, "learning_rate": 1.2853286536367753e-05, "epoch": 0.7706370882336547, "percentage": 77.06, "elapsed_time": "1 day, 8:43:27", "remaining_time": "9:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13827, "total_steps": 17941, "loss": 1.8156, "learning_rate": 1.2847326946834426e-05, "epoch": 0.7706928264868179, "percentage": 77.07, "elapsed_time": "1 day, 8:43:36", "remaining_time": "9:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13828, "total_steps": 17941, "loss": 1.5758, "learning_rate": 1.2841368535567267e-05, "epoch": 0.7707485647399811, "percentage": 77.07, "elapsed_time": "1 day, 8:43:44", "remaining_time": "9:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13829, "total_steps": 17941, "loss": 1.4204, "learning_rate": 1.2835411302755262e-05, "epoch": 0.7708043029931442, "percentage": 77.08, "elapsed_time": "1 day, 8:43:53", "remaining_time": "9:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13830, "total_steps": 17941, "loss": 1.7024, "learning_rate": 1.2829455248587319e-05, "epoch": 0.7708600412463074, "percentage": 77.09, "elapsed_time": "1 day, 8:44:01", "remaining_time": "9:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13831, "total_steps": 17941, "loss": 1.534, "learning_rate": 1.2823500373252329e-05, "epoch": 0.7709157794994704, "percentage": 77.09, "elapsed_time": "1 day, 8:44:10", "remaining_time": "9:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13832, "total_steps": 17941, "loss": 1.7682, "learning_rate": 1.2817546676939158e-05, "epoch": 0.7709715177526336, "percentage": 77.1, "elapsed_time": "1 day, 8:44:19", "remaining_time": "9:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13833, "total_steps": 17941, "loss": 1.4134, "learning_rate": 1.281159415983661e-05, "epoch": 0.7710272560057968, "percentage": 77.1, "elapsed_time": "1 day, 8:44:27", "remaining_time": "9:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13834, "total_steps": 17941, "loss": 1.5439, "learning_rate": 1.2805642822133478e-05, "epoch": 0.7710829942589599, "percentage": 77.11, "elapsed_time": "1 day, 8:44:36", "remaining_time": "9:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13835, "total_steps": 17941, "loss": 1.7694, "learning_rate": 1.2799692664018498e-05, "epoch": 0.7711387325121231, "percentage": 77.11, "elapsed_time": "1 day, 8:44:44", "remaining_time": "9:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13836, "total_steps": 17941, "loss": 1.7029, "learning_rate": 1.2793743685680388e-05, "epoch": 0.7711944707652862, "percentage": 77.12, "elapsed_time": "1 day, 8:44:53", "remaining_time": "9:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13837, "total_steps": 17941, "loss": 1.8878, "learning_rate": 1.2787795887307784e-05, "epoch": 0.7712502090184493, "percentage": 77.13, "elapsed_time": "1 day, 8:45:01", "remaining_time": "9:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13838, "total_steps": 17941, "loss": 1.7172, "learning_rate": 1.278184926908933e-05, "epoch": 0.7713059472716125, "percentage": 77.13, "elapsed_time": "1 day, 8:45:10", "remaining_time": "9:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13839, "total_steps": 17941, "loss": 1.6341, "learning_rate": 1.2775903831213625e-05, "epoch": 0.7713616855247757, "percentage": 77.14, "elapsed_time": "1 day, 8:45:18", "remaining_time": "9:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13840, "total_steps": 17941, "loss": 1.7551, "learning_rate": 1.2769959573869217e-05, "epoch": 0.7714174237779388, "percentage": 77.14, "elapsed_time": "1 day, 8:45:26", "remaining_time": "9:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13841, "total_steps": 17941, "loss": 1.6185, "learning_rate": 1.2764016497244641e-05, "epoch": 0.7714731620311019, "percentage": 77.15, "elapsed_time": "1 day, 8:45:35", "remaining_time": "9:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13842, "total_steps": 17941, "loss": 1.7512, "learning_rate": 1.275807460152833e-05, "epoch": 0.7715289002842651, "percentage": 77.15, "elapsed_time": "1 day, 8:45:43", "remaining_time": "9:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13843, "total_steps": 17941, "loss": 1.6764, "learning_rate": 1.275213388690879e-05, "epoch": 0.7715846385374282, "percentage": 77.16, "elapsed_time": "1 day, 8:45:52", "remaining_time": "9:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13844, "total_steps": 17941, "loss": 1.5101, "learning_rate": 1.2746194353574375e-05, "epoch": 0.7716403767905914, "percentage": 77.16, "elapsed_time": "1 day, 8:46:00", "remaining_time": "9:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13845, "total_steps": 17941, "loss": 1.3814, "learning_rate": 1.2740256001713468e-05, "epoch": 0.7716961150437546, "percentage": 77.17, "elapsed_time": "1 day, 8:46:09", "remaining_time": "9:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13846, "total_steps": 17941, "loss": 1.1882, "learning_rate": 1.2734318831514408e-05, "epoch": 0.7717518532969176, "percentage": 77.18, "elapsed_time": "1 day, 8:46:17", "remaining_time": "9:41:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13847, "total_steps": 17941, "loss": 1.615, "learning_rate": 1.2728382843165477e-05, "epoch": 0.7718075915500808, "percentage": 77.18, "elapsed_time": "1 day, 8:46:26", "remaining_time": "9:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13848, "total_steps": 17941, "loss": 1.6113, "learning_rate": 1.272244803685495e-05, "epoch": 0.771863329803244, "percentage": 77.19, "elapsed_time": "1 day, 8:46:34", "remaining_time": "9:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13849, "total_steps": 17941, "loss": 1.5951, "learning_rate": 1.2716514412771008e-05, "epoch": 0.7719190680564071, "percentage": 77.19, "elapsed_time": "1 day, 8:46:43", "remaining_time": "9:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13850, "total_steps": 17941, "loss": 1.5873, "learning_rate": 1.2710581971101854e-05, "epoch": 0.7719748063095703, "percentage": 77.2, "elapsed_time": "1 day, 8:46:51", "remaining_time": "9:40:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13851, "total_steps": 17941, "loss": 1.7727, "learning_rate": 1.2704650712035632e-05, "epoch": 0.7720305445627335, "percentage": 77.2, "elapsed_time": "1 day, 8:46:59", "remaining_time": "9:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13852, "total_steps": 17941, "loss": 1.7201, "learning_rate": 1.2698720635760435e-05, "epoch": 0.7720862828158965, "percentage": 77.21, "elapsed_time": "1 day, 8:47:08", "remaining_time": "9:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13853, "total_steps": 17941, "loss": 1.5452, "learning_rate": 1.2692791742464343e-05, "epoch": 0.7721420210690597, "percentage": 77.21, "elapsed_time": "1 day, 8:47:16", "remaining_time": "9:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13854, "total_steps": 17941, "loss": 1.7422, "learning_rate": 1.2686864032335376e-05, "epoch": 0.7721977593222228, "percentage": 77.22, "elapsed_time": "1 day, 8:47:25", "remaining_time": "9:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13855, "total_steps": 17941, "loss": 1.5116, "learning_rate": 1.2680937505561552e-05, "epoch": 0.772253497575386, "percentage": 77.23, "elapsed_time": "1 day, 8:47:33", "remaining_time": "9:40:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13856, "total_steps": 17941, "loss": 1.7639, "learning_rate": 1.267501216233079e-05, "epoch": 0.7723092358285492, "percentage": 77.23, "elapsed_time": "1 day, 8:47:42", "remaining_time": "9:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13857, "total_steps": 17941, "loss": 1.7836, "learning_rate": 1.266908800283102e-05, "epoch": 0.7723649740817122, "percentage": 77.24, "elapsed_time": "1 day, 8:47:50", "remaining_time": "9:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13858, "total_steps": 17941, "loss": 1.5314, "learning_rate": 1.2663165027250124e-05, "epoch": 0.7724207123348754, "percentage": 77.24, "elapsed_time": "1 day, 8:47:58", "remaining_time": "9:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13859, "total_steps": 17941, "loss": 1.738, "learning_rate": 1.2657243235775945e-05, "epoch": 0.7724764505880386, "percentage": 77.25, "elapsed_time": "1 day, 8:48:07", "remaining_time": "9:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13860, "total_steps": 17941, "loss": 1.8642, "learning_rate": 1.2651322628596285e-05, "epoch": 0.7725321888412017, "percentage": 77.25, "elapsed_time": "1 day, 8:48:15", "remaining_time": "9:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13861, "total_steps": 17941, "loss": 1.7399, "learning_rate": 1.2645403205898914e-05, "epoch": 0.7725879270943649, "percentage": 77.26, "elapsed_time": "1 day, 8:48:24", "remaining_time": "9:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13862, "total_steps": 17941, "loss": 1.5345, "learning_rate": 1.2639484967871578e-05, "epoch": 0.772643665347528, "percentage": 77.26, "elapsed_time": "1 day, 8:48:32", "remaining_time": "9:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13863, "total_steps": 17941, "loss": 1.5579, "learning_rate": 1.2633567914701939e-05, "epoch": 0.7726994036006911, "percentage": 77.27, "elapsed_time": "1 day, 8:48:40", "remaining_time": "9:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13864, "total_steps": 17941, "loss": 1.686, "learning_rate": 1.2627652046577659e-05, "epoch": 0.7727551418538543, "percentage": 77.28, "elapsed_time": "1 day, 8:48:49", "remaining_time": "9:38:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13865, "total_steps": 17941, "loss": 1.5364, "learning_rate": 1.2621737363686365e-05, "epoch": 0.7728108801070175, "percentage": 77.28, "elapsed_time": "1 day, 8:48:57", "remaining_time": "9:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13866, "total_steps": 17941, "loss": 1.8273, "learning_rate": 1.2615823866215626e-05, "epoch": 0.7728666183601806, "percentage": 77.29, "elapsed_time": "1 day, 8:49:07", "remaining_time": "9:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13867, "total_steps": 17941, "loss": 1.6975, "learning_rate": 1.260991155435301e-05, "epoch": 0.7729223566133437, "percentage": 77.29, "elapsed_time": "1 day, 8:49:15", "remaining_time": "9:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13868, "total_steps": 17941, "loss": 1.6625, "learning_rate": 1.2604000428285967e-05, "epoch": 0.7729780948665069, "percentage": 77.3, "elapsed_time": "1 day, 8:49:23", "remaining_time": "9:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13869, "total_steps": 17941, "loss": 1.6419, "learning_rate": 1.2598090488202025e-05, "epoch": 0.77303383311967, "percentage": 77.3, "elapsed_time": "1 day, 8:49:33", "remaining_time": "9:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13870, "total_steps": 17941, "loss": 1.8036, "learning_rate": 1.2592181734288572e-05, "epoch": 0.7730895713728332, "percentage": 77.31, "elapsed_time": "1 day, 8:49:41", "remaining_time": "9:38:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13871, "total_steps": 17941, "loss": 1.6237, "learning_rate": 1.2586274166733009e-05, "epoch": 0.7731453096259964, "percentage": 77.31, "elapsed_time": "1 day, 8:49:49", "remaining_time": "9:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13872, "total_steps": 17941, "loss": 1.6326, "learning_rate": 1.2580367785722697e-05, "epoch": 0.7732010478791594, "percentage": 77.32, "elapsed_time": "1 day, 8:49:59", "remaining_time": "9:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13873, "total_steps": 17941, "loss": 1.5155, "learning_rate": 1.257446259144494e-05, "epoch": 0.7732567861323226, "percentage": 77.33, "elapsed_time": "1 day, 8:50:08", "remaining_time": "9:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13874, "total_steps": 17941, "loss": 1.4979, "learning_rate": 1.2568558584087048e-05, "epoch": 0.7733125243854858, "percentage": 77.33, "elapsed_time": "1 day, 8:50:16", "remaining_time": "9:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13875, "total_steps": 17941, "loss": 1.4564, "learning_rate": 1.2562655763836217e-05, "epoch": 0.7733682626386489, "percentage": 77.34, "elapsed_time": "1 day, 8:50:25", "remaining_time": "9:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13876, "total_steps": 17941, "loss": 1.5123, "learning_rate": 1.2556754130879666e-05, "epoch": 0.7734240008918121, "percentage": 77.34, "elapsed_time": "1 day, 8:50:33", "remaining_time": "9:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13877, "total_steps": 17941, "loss": 1.7825, "learning_rate": 1.2550853685404573e-05, "epoch": 0.7734797391449751, "percentage": 77.35, "elapsed_time": "1 day, 8:50:42", "remaining_time": "9:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13878, "total_steps": 17941, "loss": 1.5749, "learning_rate": 1.2544954427598066e-05, "epoch": 0.7735354773981383, "percentage": 77.35, "elapsed_time": "1 day, 8:50:50", "remaining_time": "9:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13879, "total_steps": 17941, "loss": 1.6941, "learning_rate": 1.25390563576472e-05, "epoch": 0.7735912156513015, "percentage": 77.36, "elapsed_time": "1 day, 8:50:58", "remaining_time": "9:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13880, "total_steps": 17941, "loss": 1.6413, "learning_rate": 1.253315947573907e-05, "epoch": 0.7736469539044646, "percentage": 77.36, "elapsed_time": "1 day, 8:51:07", "remaining_time": "9:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13881, "total_steps": 17941, "loss": 1.6178, "learning_rate": 1.2527263782060689e-05, "epoch": 0.7737026921576278, "percentage": 77.37, "elapsed_time": "1 day, 8:51:15", "remaining_time": "9:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13882, "total_steps": 17941, "loss": 1.7388, "learning_rate": 1.2521369276799e-05, "epoch": 0.773758430410791, "percentage": 77.38, "elapsed_time": "1 day, 8:51:24", "remaining_time": "9:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13883, "total_steps": 17941, "loss": 1.8371, "learning_rate": 1.2515475960140966e-05, "epoch": 0.773814168663954, "percentage": 77.38, "elapsed_time": "1 day, 8:51:33", "remaining_time": "9:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13884, "total_steps": 17941, "loss": 1.4842, "learning_rate": 1.2509583832273486e-05, "epoch": 0.7738699069171172, "percentage": 77.39, "elapsed_time": "1 day, 8:51:41", "remaining_time": "9:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13885, "total_steps": 17941, "loss": 1.836, "learning_rate": 1.2503692893383424e-05, "epoch": 0.7739256451702804, "percentage": 77.39, "elapsed_time": "1 day, 8:51:49", "remaining_time": "9:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13886, "total_steps": 17941, "loss": 1.5868, "learning_rate": 1.24978031436576e-05, "epoch": 0.7739813834234435, "percentage": 77.4, "elapsed_time": "1 day, 8:51:58", "remaining_time": "9:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13887, "total_steps": 17941, "loss": 1.5224, "learning_rate": 1.2491914583282805e-05, "epoch": 0.7740371216766067, "percentage": 77.4, "elapsed_time": "1 day, 8:52:06", "remaining_time": "9:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13888, "total_steps": 17941, "loss": 1.6178, "learning_rate": 1.2486027212445812e-05, "epoch": 0.7740928599297698, "percentage": 77.41, "elapsed_time": "1 day, 8:52:15", "remaining_time": "9:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13889, "total_steps": 17941, "loss": 1.5006, "learning_rate": 1.2480141031333299e-05, "epoch": 0.7741485981829329, "percentage": 77.41, "elapsed_time": "1 day, 8:52:23", "remaining_time": "9:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13890, "total_steps": 17941, "loss": 1.6473, "learning_rate": 1.2474256040131955e-05, "epoch": 0.7742043364360961, "percentage": 77.42, "elapsed_time": "1 day, 8:52:33", "remaining_time": "9:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13891, "total_steps": 17941, "loss": 1.7462, "learning_rate": 1.246837223902842e-05, "epoch": 0.7742600746892593, "percentage": 77.43, "elapsed_time": "1 day, 8:52:41", "remaining_time": "9:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13892, "total_steps": 17941, "loss": 1.5555, "learning_rate": 1.246248962820929e-05, "epoch": 0.7743158129424224, "percentage": 77.43, "elapsed_time": "1 day, 8:52:50", "remaining_time": "9:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13893, "total_steps": 17941, "loss": 1.4746, "learning_rate": 1.2456608207861147e-05, "epoch": 0.7743715511955855, "percentage": 77.44, "elapsed_time": "1 day, 8:52:58", "remaining_time": "9:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13894, "total_steps": 17941, "loss": 1.6586, "learning_rate": 1.2450727978170473e-05, "epoch": 0.7744272894487487, "percentage": 77.44, "elapsed_time": "1 day, 8:53:07", "remaining_time": "9:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13895, "total_steps": 17941, "loss": 1.7492, "learning_rate": 1.2444848939323805e-05, "epoch": 0.7744830277019118, "percentage": 77.45, "elapsed_time": "1 day, 8:53:15", "remaining_time": "9:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13896, "total_steps": 17941, "loss": 1.5381, "learning_rate": 1.243897109150755e-05, "epoch": 0.774538765955075, "percentage": 77.45, "elapsed_time": "1 day, 8:53:24", "remaining_time": "9:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13897, "total_steps": 17941, "loss": 1.4131, "learning_rate": 1.2433094434908143e-05, "epoch": 0.7745945042082382, "percentage": 77.46, "elapsed_time": "1 day, 8:53:32", "remaining_time": "9:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13898, "total_steps": 17941, "loss": 1.3415, "learning_rate": 1.2427218969711945e-05, "epoch": 0.7746502424614012, "percentage": 77.47, "elapsed_time": "1 day, 8:53:41", "remaining_time": "9:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13899, "total_steps": 17941, "loss": 1.6424, "learning_rate": 1.2421344696105298e-05, "epoch": 0.7747059807145644, "percentage": 77.47, "elapsed_time": "1 day, 8:53:50", "remaining_time": "9:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13900, "total_steps": 17941, "loss": 1.8077, "learning_rate": 1.2415471614274515e-05, "epoch": 0.7747617189677275, "percentage": 77.48, "elapsed_time": "1 day, 8:53:58", "remaining_time": "9:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13901, "total_steps": 17941, "loss": 1.6892, "learning_rate": 1.2409599724405807e-05, "epoch": 0.7748174572208907, "percentage": 77.48, "elapsed_time": "1 day, 8:54:07", "remaining_time": "9:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13902, "total_steps": 17941, "loss": 1.722, "learning_rate": 1.2403729026685462e-05, "epoch": 0.7748731954740539, "percentage": 77.49, "elapsed_time": "1 day, 8:54:15", "remaining_time": "9:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13903, "total_steps": 17941, "loss": 1.5116, "learning_rate": 1.2397859521299615e-05, "epoch": 0.7749289337272169, "percentage": 77.49, "elapsed_time": "1 day, 8:54:24", "remaining_time": "9:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13904, "total_steps": 17941, "loss": 1.6784, "learning_rate": 1.2391991208434439e-05, "epoch": 0.7749846719803801, "percentage": 77.5, "elapsed_time": "1 day, 8:54:32", "remaining_time": "9:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13905, "total_steps": 17941, "loss": 1.7135, "learning_rate": 1.2386124088276007e-05, "epoch": 0.7750404102335433, "percentage": 77.5, "elapsed_time": "1 day, 8:54:40", "remaining_time": "9:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13906, "total_steps": 17941, "loss": 1.6567, "learning_rate": 1.2380258161010427e-05, "epoch": 0.7750961484867064, "percentage": 77.51, "elapsed_time": "1 day, 8:54:49", "remaining_time": "9:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13907, "total_steps": 17941, "loss": 1.5234, "learning_rate": 1.2374393426823733e-05, "epoch": 0.7751518867398696, "percentage": 77.52, "elapsed_time": "1 day, 8:54:57", "remaining_time": "9:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13908, "total_steps": 17941, "loss": 1.4218, "learning_rate": 1.2368529885901898e-05, "epoch": 0.7752076249930328, "percentage": 77.52, "elapsed_time": "1 day, 8:55:06", "remaining_time": "9:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13909, "total_steps": 17941, "loss": 1.6467, "learning_rate": 1.2362667538430883e-05, "epoch": 0.7752633632461958, "percentage": 77.53, "elapsed_time": "1 day, 8:55:14", "remaining_time": "9:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13910, "total_steps": 17941, "loss": 1.5709, "learning_rate": 1.2356806384596614e-05, "epoch": 0.775319101499359, "percentage": 77.53, "elapsed_time": "1 day, 8:55:23", "remaining_time": "9:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13911, "total_steps": 17941, "loss": 1.7064, "learning_rate": 1.235094642458497e-05, "epoch": 0.7753748397525222, "percentage": 77.54, "elapsed_time": "1 day, 8:55:31", "remaining_time": "9:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13912, "total_steps": 17941, "loss": 1.7045, "learning_rate": 1.23450876585818e-05, "epoch": 0.7754305780056853, "percentage": 77.54, "elapsed_time": "1 day, 8:55:39", "remaining_time": "9:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13913, "total_steps": 17941, "loss": 1.5096, "learning_rate": 1.2339230086772907e-05, "epoch": 0.7754863162588485, "percentage": 77.55, "elapsed_time": "1 day, 8:55:48", "remaining_time": "9:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13914, "total_steps": 17941, "loss": 1.8464, "learning_rate": 1.2333373709344065e-05, "epoch": 0.7755420545120116, "percentage": 77.55, "elapsed_time": "1 day, 8:55:56", "remaining_time": "9:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13915, "total_steps": 17941, "loss": 1.4544, "learning_rate": 1.2327518526480992e-05, "epoch": 0.7755977927651747, "percentage": 77.56, "elapsed_time": "1 day, 8:56:05", "remaining_time": "9:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13916, "total_steps": 17941, "loss": 1.851, "learning_rate": 1.2321664538369382e-05, "epoch": 0.7756535310183379, "percentage": 77.57, "elapsed_time": "1 day, 8:56:13", "remaining_time": "9:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13917, "total_steps": 17941, "loss": 1.732, "learning_rate": 1.231581174519489e-05, "epoch": 0.7757092692715011, "percentage": 77.57, "elapsed_time": "1 day, 8:56:22", "remaining_time": "9:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13918, "total_steps": 17941, "loss": 1.6381, "learning_rate": 1.2309960147143134e-05, "epoch": 0.7757650075246642, "percentage": 77.58, "elapsed_time": "1 day, 8:56:30", "remaining_time": "9:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13919, "total_steps": 17941, "loss": 1.5694, "learning_rate": 1.2304109744399716e-05, "epoch": 0.7758207457778273, "percentage": 77.58, "elapsed_time": "1 day, 8:56:38", "remaining_time": "9:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13920, "total_steps": 17941, "loss": 1.7807, "learning_rate": 1.2298260537150119e-05, "epoch": 0.7758764840309905, "percentage": 77.59, "elapsed_time": "1 day, 8:56:47", "remaining_time": "9:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13921, "total_steps": 17941, "loss": 1.7266, "learning_rate": 1.2292412525579916e-05, "epoch": 0.7759322222841536, "percentage": 77.59, "elapsed_time": "1 day, 8:56:55", "remaining_time": "9:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13922, "total_steps": 17941, "loss": 1.4124, "learning_rate": 1.228656570987452e-05, "epoch": 0.7759879605373168, "percentage": 77.6, "elapsed_time": "1 day, 8:57:04", "remaining_time": "9:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13923, "total_steps": 17941, "loss": 1.5466, "learning_rate": 1.2280720090219372e-05, "epoch": 0.7760436987904799, "percentage": 77.6, "elapsed_time": "1 day, 8:57:12", "remaining_time": "9:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13924, "total_steps": 17941, "loss": 1.8677, "learning_rate": 1.2274875666799867e-05, "epoch": 0.776099437043643, "percentage": 77.61, "elapsed_time": "1 day, 8:57:21", "remaining_time": "9:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13925, "total_steps": 17941, "loss": 1.862, "learning_rate": 1.2269032439801353e-05, "epoch": 0.7761551752968062, "percentage": 77.62, "elapsed_time": "1 day, 8:57:29", "remaining_time": "9:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13926, "total_steps": 17941, "loss": 1.9658, "learning_rate": 1.226319040940916e-05, "epoch": 0.7762109135499693, "percentage": 77.62, "elapsed_time": "1 day, 8:57:38", "remaining_time": "9:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13927, "total_steps": 17941, "loss": 1.488, "learning_rate": 1.2257349575808513e-05, "epoch": 0.7762666518031325, "percentage": 77.63, "elapsed_time": "1 day, 8:57:46", "remaining_time": "9:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13928, "total_steps": 17941, "loss": 1.8711, "learning_rate": 1.2251509939184713e-05, "epoch": 0.7763223900562957, "percentage": 77.63, "elapsed_time": "1 day, 8:57:55", "remaining_time": "9:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13929, "total_steps": 17941, "loss": 1.6375, "learning_rate": 1.2245671499722916e-05, "epoch": 0.7763781283094587, "percentage": 77.64, "elapsed_time": "1 day, 8:58:03", "remaining_time": "9:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13930, "total_steps": 17941, "loss": 1.9096, "learning_rate": 1.2239834257608312e-05, "epoch": 0.7764338665626219, "percentage": 77.64, "elapsed_time": "1 day, 8:58:12", "remaining_time": "9:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13931, "total_steps": 17941, "loss": 1.7417, "learning_rate": 1.2233998213025977e-05, "epoch": 0.7764896048157851, "percentage": 77.65, "elapsed_time": "1 day, 8:58:20", "remaining_time": "9:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13932, "total_steps": 17941, "loss": 1.6114, "learning_rate": 1.2228163366161038e-05, "epoch": 0.7765453430689482, "percentage": 77.65, "elapsed_time": "1 day, 8:58:29", "remaining_time": "9:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13933, "total_steps": 17941, "loss": 1.6181, "learning_rate": 1.2222329717198556e-05, "epoch": 0.7766010813221114, "percentage": 77.66, "elapsed_time": "1 day, 8:58:37", "remaining_time": "9:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13934, "total_steps": 17941, "loss": 1.6174, "learning_rate": 1.2216497266323495e-05, "epoch": 0.7766568195752745, "percentage": 77.67, "elapsed_time": "1 day, 8:58:46", "remaining_time": "9:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13935, "total_steps": 17941, "loss": 1.5781, "learning_rate": 1.2210666013720845e-05, "epoch": 0.7767125578284376, "percentage": 77.67, "elapsed_time": "1 day, 8:58:54", "remaining_time": "9:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13936, "total_steps": 17941, "loss": 1.6628, "learning_rate": 1.2204835959575545e-05, "epoch": 0.7767682960816008, "percentage": 77.68, "elapsed_time": "1 day, 8:59:03", "remaining_time": "9:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13937, "total_steps": 17941, "loss": 1.506, "learning_rate": 1.219900710407249e-05, "epoch": 0.776824034334764, "percentage": 77.68, "elapsed_time": "1 day, 8:59:11", "remaining_time": "9:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13938, "total_steps": 17941, "loss": 1.8301, "learning_rate": 1.219317944739653e-05, "epoch": 0.7768797725879271, "percentage": 77.69, "elapsed_time": "1 day, 8:59:20", "remaining_time": "9:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13939, "total_steps": 17941, "loss": 1.6372, "learning_rate": 1.2187352989732493e-05, "epoch": 0.7769355108410902, "percentage": 77.69, "elapsed_time": "1 day, 8:59:28", "remaining_time": "9:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13940, "total_steps": 17941, "loss": 1.5859, "learning_rate": 1.2181527731265169e-05, "epoch": 0.7769912490942534, "percentage": 77.7, "elapsed_time": "1 day, 8:59:36", "remaining_time": "9:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13941, "total_steps": 17941, "loss": 1.756, "learning_rate": 1.2175703672179273e-05, "epoch": 0.7770469873474165, "percentage": 77.7, "elapsed_time": "1 day, 8:59:45", "remaining_time": "9:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13942, "total_steps": 17941, "loss": 1.682, "learning_rate": 1.2169880812659529e-05, "epoch": 0.7771027256005797, "percentage": 77.71, "elapsed_time": "1 day, 8:59:53", "remaining_time": "9:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13943, "total_steps": 17941, "loss": 1.5255, "learning_rate": 1.21640591528906e-05, "epoch": 0.7771584638537429, "percentage": 77.72, "elapsed_time": "1 day, 9:00:02", "remaining_time": "9:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13944, "total_steps": 17941, "loss": 1.724, "learning_rate": 1.2158238693057112e-05, "epoch": 0.777214202106906, "percentage": 77.72, "elapsed_time": "1 day, 9:00:10", "remaining_time": "9:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13945, "total_steps": 17941, "loss": 1.6637, "learning_rate": 1.2152419433343676e-05, "epoch": 0.7772699403600691, "percentage": 77.73, "elapsed_time": "1 day, 9:00:19", "remaining_time": "9:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13946, "total_steps": 17941, "loss": 1.732, "learning_rate": 1.2146601373934801e-05, "epoch": 0.7773256786132322, "percentage": 77.73, "elapsed_time": "1 day, 9:00:28", "remaining_time": "9:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13947, "total_steps": 17941, "loss": 1.6216, "learning_rate": 1.2140784515015058e-05, "epoch": 0.7773814168663954, "percentage": 77.74, "elapsed_time": "1 day, 9:00:36", "remaining_time": "9:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13948, "total_steps": 17941, "loss": 1.9204, "learning_rate": 1.213496885676888e-05, "epoch": 0.7774371551195586, "percentage": 77.74, "elapsed_time": "1 day, 9:00:45", "remaining_time": "9:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13949, "total_steps": 17941, "loss": 1.4757, "learning_rate": 1.212915439938072e-05, "epoch": 0.7774928933727216, "percentage": 77.75, "elapsed_time": "1 day, 9:00:53", "remaining_time": "9:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13950, "total_steps": 17941, "loss": 1.7228, "learning_rate": 1.2123341143034988e-05, "epoch": 0.7775486316258848, "percentage": 77.75, "elapsed_time": "1 day, 9:01:02", "remaining_time": "9:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13951, "total_steps": 17941, "loss": 1.6262, "learning_rate": 1.211752908791603e-05, "epoch": 0.777604369879048, "percentage": 77.76, "elapsed_time": "1 day, 9:01:10", "remaining_time": "9:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13952, "total_steps": 17941, "loss": 1.7301, "learning_rate": 1.2111718234208197e-05, "epoch": 0.7776601081322111, "percentage": 77.77, "elapsed_time": "1 day, 9:01:19", "remaining_time": "9:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13953, "total_steps": 17941, "loss": 1.6193, "learning_rate": 1.2105908582095731e-05, "epoch": 0.7777158463853743, "percentage": 77.77, "elapsed_time": "1 day, 9:01:28", "remaining_time": "9:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13954, "total_steps": 17941, "loss": 1.8068, "learning_rate": 1.2100100131762932e-05, "epoch": 0.7777715846385375, "percentage": 77.78, "elapsed_time": "1 day, 9:01:36", "remaining_time": "9:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13955, "total_steps": 17941, "loss": 1.5966, "learning_rate": 1.2094292883393976e-05, "epoch": 0.7778273228917005, "percentage": 77.78, "elapsed_time": "1 day, 9:01:44", "remaining_time": "9:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13956, "total_steps": 17941, "loss": 1.8582, "learning_rate": 1.2088486837173051e-05, "epoch": 0.7778830611448637, "percentage": 77.79, "elapsed_time": "1 day, 9:01:53", "remaining_time": "9:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13957, "total_steps": 17941, "loss": 1.7307, "learning_rate": 1.2082681993284261e-05, "epoch": 0.7779387993980269, "percentage": 77.79, "elapsed_time": "1 day, 9:02:01", "remaining_time": "9:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13958, "total_steps": 17941, "loss": 1.7103, "learning_rate": 1.2076878351911736e-05, "epoch": 0.77799453765119, "percentage": 77.8, "elapsed_time": "1 day, 9:02:10", "remaining_time": "9:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13959, "total_steps": 17941, "loss": 1.7988, "learning_rate": 1.2071075913239538e-05, "epoch": 0.7780502759043532, "percentage": 77.81, "elapsed_time": "1 day, 9:02:18", "remaining_time": "9:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13960, "total_steps": 17941, "loss": 1.7373, "learning_rate": 1.206527467745166e-05, "epoch": 0.7781060141575163, "percentage": 77.81, "elapsed_time": "1 day, 9:02:27", "remaining_time": "9:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13961, "total_steps": 17941, "loss": 1.7231, "learning_rate": 1.2059474644732088e-05, "epoch": 0.7781617524106794, "percentage": 77.82, "elapsed_time": "1 day, 9:02:35", "remaining_time": "9:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13962, "total_steps": 17941, "loss": 1.6934, "learning_rate": 1.2053675815264776e-05, "epoch": 0.7782174906638426, "percentage": 77.82, "elapsed_time": "1 day, 9:02:44", "remaining_time": "9:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13963, "total_steps": 17941, "loss": 1.7624, "learning_rate": 1.2047878189233625e-05, "epoch": 0.7782732289170058, "percentage": 77.83, "elapsed_time": "1 day, 9:02:52", "remaining_time": "9:24:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13964, "total_steps": 17941, "loss": 1.6195, "learning_rate": 1.2042081766822499e-05, "epoch": 0.7783289671701689, "percentage": 77.83, "elapsed_time": "1 day, 9:03:00", "remaining_time": "9:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13965, "total_steps": 17941, "loss": 1.8619, "learning_rate": 1.2036286548215231e-05, "epoch": 0.778384705423332, "percentage": 77.84, "elapsed_time": "1 day, 9:03:09", "remaining_time": "9:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13966, "total_steps": 17941, "loss": 1.7022, "learning_rate": 1.2030492533595623e-05, "epoch": 0.7784404436764952, "percentage": 77.84, "elapsed_time": "1 day, 9:03:17", "remaining_time": "9:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13967, "total_steps": 17941, "loss": 1.6003, "learning_rate": 1.2024699723147403e-05, "epoch": 0.7784961819296583, "percentage": 77.85, "elapsed_time": "1 day, 9:03:26", "remaining_time": "9:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13968, "total_steps": 17941, "loss": 1.488, "learning_rate": 1.2018908117054295e-05, "epoch": 0.7785519201828215, "percentage": 77.86, "elapsed_time": "1 day, 9:03:34", "remaining_time": "9:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13969, "total_steps": 17941, "loss": 1.7595, "learning_rate": 1.2013117715499972e-05, "epoch": 0.7786076584359846, "percentage": 77.86, "elapsed_time": "1 day, 9:03:43", "remaining_time": "9:24:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13970, "total_steps": 17941, "loss": 1.6972, "learning_rate": 1.2007328518668082e-05, "epoch": 0.7786633966891477, "percentage": 77.87, "elapsed_time": "1 day, 9:03:51", "remaining_time": "9:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13971, "total_steps": 17941, "loss": 1.6437, "learning_rate": 1.2001540526742234e-05, "epoch": 0.7787191349423109, "percentage": 77.87, "elapsed_time": "1 day, 9:03:59", "remaining_time": "9:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13972, "total_steps": 17941, "loss": 1.455, "learning_rate": 1.199575373990594e-05, "epoch": 0.778774873195474, "percentage": 77.88, "elapsed_time": "1 day, 9:04:08", "remaining_time": "9:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13973, "total_steps": 17941, "loss": 1.6241, "learning_rate": 1.198996815834279e-05, "epoch": 0.7788306114486372, "percentage": 77.88, "elapsed_time": "1 day, 9:04:17", "remaining_time": "9:23:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13974, "total_steps": 17941, "loss": 1.7752, "learning_rate": 1.1984183782236219e-05, "epoch": 0.7788863497018004, "percentage": 77.89, "elapsed_time": "1 day, 9:04:26", "remaining_time": "9:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13975, "total_steps": 17941, "loss": 1.5402, "learning_rate": 1.197840061176969e-05, "epoch": 0.7789420879549634, "percentage": 77.89, "elapsed_time": "1 day, 9:04:34", "remaining_time": "9:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13976, "total_steps": 17941, "loss": 1.6849, "learning_rate": 1.1972618647126616e-05, "epoch": 0.7789978262081266, "percentage": 77.9, "elapsed_time": "1 day, 9:04:43", "remaining_time": "9:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13977, "total_steps": 17941, "loss": 1.6473, "learning_rate": 1.1966837888490361e-05, "epoch": 0.7790535644612898, "percentage": 77.91, "elapsed_time": "1 day, 9:04:52", "remaining_time": "9:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13978, "total_steps": 17941, "loss": 1.5457, "learning_rate": 1.1961058336044274e-05, "epoch": 0.7791093027144529, "percentage": 77.91, "elapsed_time": "1 day, 9:05:00", "remaining_time": "9:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13979, "total_steps": 17941, "loss": 1.5844, "learning_rate": 1.1955279989971607e-05, "epoch": 0.7791650409676161, "percentage": 77.92, "elapsed_time": "1 day, 9:05:08", "remaining_time": "9:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13980, "total_steps": 17941, "loss": 1.6657, "learning_rate": 1.1949502850455669e-05, "epoch": 0.7792207792207793, "percentage": 77.92, "elapsed_time": "1 day, 9:05:17", "remaining_time": "9:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13981, "total_steps": 17941, "loss": 1.5395, "learning_rate": 1.1943726917679637e-05, "epoch": 0.7792765174739423, "percentage": 77.93, "elapsed_time": "1 day, 9:05:25", "remaining_time": "9:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13982, "total_steps": 17941, "loss": 1.4989, "learning_rate": 1.1937952191826723e-05, "epoch": 0.7793322557271055, "percentage": 77.93, "elapsed_time": "1 day, 9:05:35", "remaining_time": "9:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13983, "total_steps": 17941, "loss": 1.692, "learning_rate": 1.1932178673080014e-05, "epoch": 0.7793879939802687, "percentage": 77.94, "elapsed_time": "1 day, 9:05:43", "remaining_time": "9:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13984, "total_steps": 17941, "loss": 1.7339, "learning_rate": 1.1926406361622661e-05, "epoch": 0.7794437322334318, "percentage": 77.94, "elapsed_time": "1 day, 9:05:51", "remaining_time": "9:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13985, "total_steps": 17941, "loss": 1.7289, "learning_rate": 1.192063525763773e-05, "epoch": 0.779499470486595, "percentage": 77.95, "elapsed_time": "1 day, 9:06:00", "remaining_time": "9:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13986, "total_steps": 17941, "loss": 1.6664, "learning_rate": 1.1914865361308213e-05, "epoch": 0.7795552087397581, "percentage": 77.96, "elapsed_time": "1 day, 9:06:08", "remaining_time": "9:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13987, "total_steps": 17941, "loss": 1.8228, "learning_rate": 1.1909096672817121e-05, "epoch": 0.7796109469929212, "percentage": 77.96, "elapsed_time": "1 day, 9:06:17", "remaining_time": "9:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13988, "total_steps": 17941, "loss": 1.7243, "learning_rate": 1.1903329192347395e-05, "epoch": 0.7796666852460844, "percentage": 77.97, "elapsed_time": "1 day, 9:06:25", "remaining_time": "9:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13989, "total_steps": 17941, "loss": 1.4968, "learning_rate": 1.1897562920081945e-05, "epoch": 0.7797224234992476, "percentage": 77.97, "elapsed_time": "1 day, 9:06:35", "remaining_time": "9:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13990, "total_steps": 17941, "loss": 1.6693, "learning_rate": 1.1891797856203651e-05, "epoch": 0.7797781617524107, "percentage": 77.98, "elapsed_time": "1 day, 9:06:43", "remaining_time": "9:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13991, "total_steps": 17941, "loss": 1.6512, "learning_rate": 1.188603400089534e-05, "epoch": 0.7798339000055738, "percentage": 77.98, "elapsed_time": "1 day, 9:06:51", "remaining_time": "9:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13992, "total_steps": 17941, "loss": 1.6319, "learning_rate": 1.1880271354339822e-05, "epoch": 0.7798896382587369, "percentage": 77.99, "elapsed_time": "1 day, 9:07:00", "remaining_time": "9:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13993, "total_steps": 17941, "loss": 1.6541, "learning_rate": 1.1874509916719834e-05, "epoch": 0.7799453765119001, "percentage": 77.99, "elapsed_time": "1 day, 9:07:08", "remaining_time": "9:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13994, "total_steps": 17941, "loss": 1.6669, "learning_rate": 1.1868749688218106e-05, "epoch": 0.7800011147650633, "percentage": 78.0, "elapsed_time": "1 day, 9:07:17", "remaining_time": "9:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13995, "total_steps": 17941, "loss": 2.0342, "learning_rate": 1.186299066901731e-05, "epoch": 0.7800568530182264, "percentage": 78.01, "elapsed_time": "1 day, 9:07:25", "remaining_time": "9:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13996, "total_steps": 17941, "loss": 1.7769, "learning_rate": 1.18572328593001e-05, "epoch": 0.7801125912713895, "percentage": 78.01, "elapsed_time": "1 day, 9:07:34", "remaining_time": "9:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13997, "total_steps": 17941, "loss": 1.5211, "learning_rate": 1.185147625924909e-05, "epoch": 0.7801683295245527, "percentage": 78.02, "elapsed_time": "1 day, 9:07:43", "remaining_time": "9:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13998, "total_steps": 17941, "loss": 1.4663, "learning_rate": 1.1845720869046805e-05, "epoch": 0.7802240677777158, "percentage": 78.02, "elapsed_time": "1 day, 9:07:51", "remaining_time": "9:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13999, "total_steps": 17941, "loss": 1.6968, "learning_rate": 1.1839966688875825e-05, "epoch": 0.780279806030879, "percentage": 78.03, "elapsed_time": "1 day, 9:08:00", "remaining_time": "9:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14000, "total_steps": 17941, "loss": 1.6897, "learning_rate": 1.1834213718918602e-05, "epoch": 0.7803355442840422, "percentage": 78.03, "elapsed_time": "1 day, 9:08:09", "remaining_time": "9:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14001, "total_steps": 17941, "loss": 1.7622, "learning_rate": 1.1828461959357595e-05, "epoch": 0.7803912825372052, "percentage": 78.04, "elapsed_time": "1 day, 9:08:17", "remaining_time": "9:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14002, "total_steps": 17941, "loss": 1.5367, "learning_rate": 1.182271141037522e-05, "epoch": 0.7804470207903684, "percentage": 78.04, "elapsed_time": "1 day, 9:08:26", "remaining_time": "9:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14003, "total_steps": 17941, "loss": 1.8351, "learning_rate": 1.1816962072153848e-05, "epoch": 0.7805027590435316, "percentage": 78.05, "elapsed_time": "1 day, 9:08:34", "remaining_time": "9:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14004, "total_steps": 17941, "loss": 1.5502, "learning_rate": 1.1811213944875832e-05, "epoch": 0.7805584972966947, "percentage": 78.06, "elapsed_time": "1 day, 9:08:43", "remaining_time": "9:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14005, "total_steps": 17941, "loss": 1.5114, "learning_rate": 1.1805467028723426e-05, "epoch": 0.7806142355498579, "percentage": 78.06, "elapsed_time": "1 day, 9:08:51", "remaining_time": "9:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14006, "total_steps": 17941, "loss": 1.5488, "learning_rate": 1.1799721323878943e-05, "epoch": 0.7806699738030211, "percentage": 78.07, "elapsed_time": "1 day, 9:08:59", "remaining_time": "9:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14007, "total_steps": 17941, "loss": 1.5781, "learning_rate": 1.1793976830524567e-05, "epoch": 0.7807257120561841, "percentage": 78.07, "elapsed_time": "1 day, 9:09:08", "remaining_time": "9:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14008, "total_steps": 17941, "loss": 1.6267, "learning_rate": 1.1788233548842486e-05, "epoch": 0.7807814503093473, "percentage": 78.08, "elapsed_time": "1 day, 9:09:16", "remaining_time": "9:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14009, "total_steps": 17941, "loss": 1.7858, "learning_rate": 1.1782491479014846e-05, "epoch": 0.7808371885625105, "percentage": 78.08, "elapsed_time": "1 day, 9:09:25", "remaining_time": "9:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14010, "total_steps": 17941, "loss": 1.394, "learning_rate": 1.1776750621223754e-05, "epoch": 0.7808929268156736, "percentage": 78.09, "elapsed_time": "1 day, 9:09:33", "remaining_time": "9:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14011, "total_steps": 17941, "loss": 1.8826, "learning_rate": 1.1771010975651287e-05, "epoch": 0.7809486650688368, "percentage": 78.09, "elapsed_time": "1 day, 9:09:42", "remaining_time": "9:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14012, "total_steps": 17941, "loss": 1.6163, "learning_rate": 1.176527254247945e-05, "epoch": 0.7810044033219999, "percentage": 78.1, "elapsed_time": "1 day, 9:09:50", "remaining_time": "9:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14013, "total_steps": 17941, "loss": 1.6258, "learning_rate": 1.1759535321890247e-05, "epoch": 0.781060141575163, "percentage": 78.11, "elapsed_time": "1 day, 9:09:59", "remaining_time": "9:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14014, "total_steps": 17941, "loss": 1.7727, "learning_rate": 1.1753799314065622e-05, "epoch": 0.7811158798283262, "percentage": 78.11, "elapsed_time": "1 day, 9:10:07", "remaining_time": "9:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14015, "total_steps": 17941, "loss": 1.5458, "learning_rate": 1.1748064519187507e-05, "epoch": 0.7811716180814893, "percentage": 78.12, "elapsed_time": "1 day, 9:10:15", "remaining_time": "9:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14016, "total_steps": 17941, "loss": 1.5589, "learning_rate": 1.1742330937437729e-05, "epoch": 0.7812273563346525, "percentage": 78.12, "elapsed_time": "1 day, 9:10:24", "remaining_time": "9:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14017, "total_steps": 17941, "loss": 1.752, "learning_rate": 1.1736598568998175e-05, "epoch": 0.7812830945878156, "percentage": 78.13, "elapsed_time": "1 day, 9:10:32", "remaining_time": "9:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14018, "total_steps": 17941, "loss": 1.8233, "learning_rate": 1.1730867414050634e-05, "epoch": 0.7813388328409787, "percentage": 78.13, "elapsed_time": "1 day, 9:10:41", "remaining_time": "9:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14019, "total_steps": 17941, "loss": 1.3202, "learning_rate": 1.1725137472776842e-05, "epoch": 0.7813945710941419, "percentage": 78.14, "elapsed_time": "1 day, 9:10:49", "remaining_time": "9:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14020, "total_steps": 17941, "loss": 1.7173, "learning_rate": 1.1719408745358534e-05, "epoch": 0.7814503093473051, "percentage": 78.15, "elapsed_time": "1 day, 9:10:58", "remaining_time": "9:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14021, "total_steps": 17941, "loss": 1.6645, "learning_rate": 1.1713681231977387e-05, "epoch": 0.7815060476004682, "percentage": 78.15, "elapsed_time": "1 day, 9:11:06", "remaining_time": "9:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14022, "total_steps": 17941, "loss": 1.6041, "learning_rate": 1.1707954932815046e-05, "epoch": 0.7815617858536313, "percentage": 78.16, "elapsed_time": "1 day, 9:11:16", "remaining_time": "9:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14023, "total_steps": 17941, "loss": 1.6196, "learning_rate": 1.1702229848053131e-05, "epoch": 0.7816175241067945, "percentage": 78.16, "elapsed_time": "1 day, 9:11:24", "remaining_time": "9:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14024, "total_steps": 17941, "loss": 1.9201, "learning_rate": 1.1696505977873167e-05, "epoch": 0.7816732623599576, "percentage": 78.17, "elapsed_time": "1 day, 9:11:32", "remaining_time": "9:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14025, "total_steps": 17941, "loss": 1.596, "learning_rate": 1.1690783322456734e-05, "epoch": 0.7817290006131208, "percentage": 78.17, "elapsed_time": "1 day, 9:11:41", "remaining_time": "9:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14026, "total_steps": 17941, "loss": 1.6196, "learning_rate": 1.1685061881985282e-05, "epoch": 0.781784738866284, "percentage": 78.18, "elapsed_time": "1 day, 9:11:49", "remaining_time": "9:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14027, "total_steps": 17941, "loss": 1.7333, "learning_rate": 1.1679341656640275e-05, "epoch": 0.781840477119447, "percentage": 78.18, "elapsed_time": "1 day, 9:11:58", "remaining_time": "9:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14028, "total_steps": 17941, "loss": 1.6193, "learning_rate": 1.1673622646603127e-05, "epoch": 0.7818962153726102, "percentage": 78.19, "elapsed_time": "1 day, 9:12:06", "remaining_time": "9:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14029, "total_steps": 17941, "loss": 1.6827, "learning_rate": 1.1667904852055212e-05, "epoch": 0.7819519536257734, "percentage": 78.2, "elapsed_time": "1 day, 9:12:15", "remaining_time": "9:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14030, "total_steps": 17941, "loss": 1.5779, "learning_rate": 1.1662188273177877e-05, "epoch": 0.7820076918789365, "percentage": 78.2, "elapsed_time": "1 day, 9:12:23", "remaining_time": "9:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14031, "total_steps": 17941, "loss": 1.5118, "learning_rate": 1.1656472910152376e-05, "epoch": 0.7820634301320997, "percentage": 78.21, "elapsed_time": "1 day, 9:12:32", "remaining_time": "9:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14032, "total_steps": 17941, "loss": 1.7555, "learning_rate": 1.1650758763160025e-05, "epoch": 0.7821191683852629, "percentage": 78.21, "elapsed_time": "1 day, 9:12:40", "remaining_time": "9:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14033, "total_steps": 17941, "loss": 1.8431, "learning_rate": 1.1645045832381995e-05, "epoch": 0.7821749066384259, "percentage": 78.22, "elapsed_time": "1 day, 9:12:49", "remaining_time": "9:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14034, "total_steps": 17941, "loss": 1.523, "learning_rate": 1.1639334117999496e-05, "epoch": 0.7822306448915891, "percentage": 78.22, "elapsed_time": "1 day, 9:12:57", "remaining_time": "9:14:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14035, "total_steps": 17941, "loss": 1.6873, "learning_rate": 1.163362362019365e-05, "epoch": 0.7822863831447523, "percentage": 78.23, "elapsed_time": "1 day, 9:13:06", "remaining_time": "9:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14036, "total_steps": 17941, "loss": 1.7052, "learning_rate": 1.162791433914558e-05, "epoch": 0.7823421213979154, "percentage": 78.23, "elapsed_time": "1 day, 9:13:14", "remaining_time": "9:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14037, "total_steps": 17941, "loss": 1.8216, "learning_rate": 1.1622206275036352e-05, "epoch": 0.7823978596510786, "percentage": 78.24, "elapsed_time": "1 day, 9:13:23", "remaining_time": "9:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14038, "total_steps": 17941, "loss": 1.5163, "learning_rate": 1.1616499428046974e-05, "epoch": 0.7824535979042416, "percentage": 78.25, "elapsed_time": "1 day, 9:13:31", "remaining_time": "9:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14039, "total_steps": 17941, "loss": 1.5863, "learning_rate": 1.1610793798358433e-05, "epoch": 0.7825093361574048, "percentage": 78.25, "elapsed_time": "1 day, 9:13:40", "remaining_time": "9:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14040, "total_steps": 17941, "loss": 1.5654, "learning_rate": 1.1605089386151695e-05, "epoch": 0.782565074410568, "percentage": 78.26, "elapsed_time": "1 day, 9:13:49", "remaining_time": "9:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14041, "total_steps": 17941, "loss": 1.6553, "learning_rate": 1.1599386191607675e-05, "epoch": 0.7826208126637311, "percentage": 78.26, "elapsed_time": "1 day, 9:13:57", "remaining_time": "9:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14042, "total_steps": 17941, "loss": 1.5521, "learning_rate": 1.1593684214907207e-05, "epoch": 0.7826765509168943, "percentage": 78.27, "elapsed_time": "1 day, 9:14:06", "remaining_time": "9:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14043, "total_steps": 17941, "loss": 1.6284, "learning_rate": 1.1587983456231166e-05, "epoch": 0.7827322891700574, "percentage": 78.27, "elapsed_time": "1 day, 9:14:14", "remaining_time": "9:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14044, "total_steps": 17941, "loss": 1.29, "learning_rate": 1.158228391576035e-05, "epoch": 0.7827880274232205, "percentage": 78.28, "elapsed_time": "1 day, 9:14:23", "remaining_time": "9:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14045, "total_steps": 17941, "loss": 1.5505, "learning_rate": 1.1576585593675477e-05, "epoch": 0.7828437656763837, "percentage": 78.28, "elapsed_time": "1 day, 9:14:31", "remaining_time": "9:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14046, "total_steps": 17941, "loss": 1.369, "learning_rate": 1.1570888490157289e-05, "epoch": 0.7828995039295469, "percentage": 78.29, "elapsed_time": "1 day, 9:14:39", "remaining_time": "9:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14047, "total_steps": 17941, "loss": 1.7068, "learning_rate": 1.156519260538646e-05, "epoch": 0.78295524218271, "percentage": 78.3, "elapsed_time": "1 day, 9:14:48", "remaining_time": "9:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14048, "total_steps": 17941, "loss": 1.5027, "learning_rate": 1.155949793954363e-05, "epoch": 0.7830109804358731, "percentage": 78.3, "elapsed_time": "1 day, 9:14:57", "remaining_time": "9:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14049, "total_steps": 17941, "loss": 1.9128, "learning_rate": 1.1553804492809417e-05, "epoch": 0.7830667186890363, "percentage": 78.31, "elapsed_time": "1 day, 9:15:05", "remaining_time": "9:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14050, "total_steps": 17941, "loss": 1.7097, "learning_rate": 1.1548112265364336e-05, "epoch": 0.7831224569421994, "percentage": 78.31, "elapsed_time": "1 day, 9:15:14", "remaining_time": "9:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14051, "total_steps": 17941, "loss": 1.78, "learning_rate": 1.154242125738898e-05, "epoch": 0.7831781951953626, "percentage": 78.32, "elapsed_time": "1 day, 9:15:22", "remaining_time": "9:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14052, "total_steps": 17941, "loss": 2.0257, "learning_rate": 1.1536731469063777e-05, "epoch": 0.7832339334485258, "percentage": 78.32, "elapsed_time": "1 day, 9:15:31", "remaining_time": "9:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14053, "total_steps": 17941, "loss": 1.5198, "learning_rate": 1.15310429005692e-05, "epoch": 0.7832896717016888, "percentage": 78.33, "elapsed_time": "1 day, 9:15:39", "remaining_time": "9:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14054, "total_steps": 17941, "loss": 1.2568, "learning_rate": 1.1525355552085648e-05, "epoch": 0.783345409954852, "percentage": 78.33, "elapsed_time": "1 day, 9:15:47", "remaining_time": "9:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14055, "total_steps": 17941, "loss": 1.6483, "learning_rate": 1.15196694237935e-05, "epoch": 0.7834011482080152, "percentage": 78.34, "elapsed_time": "1 day, 9:15:56", "remaining_time": "9:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14056, "total_steps": 17941, "loss": 1.5516, "learning_rate": 1.1513984515873094e-05, "epoch": 0.7834568864611783, "percentage": 78.35, "elapsed_time": "1 day, 9:16:04", "remaining_time": "9:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14057, "total_steps": 17941, "loss": 1.8275, "learning_rate": 1.150830082850468e-05, "epoch": 0.7835126247143415, "percentage": 78.35, "elapsed_time": "1 day, 9:16:13", "remaining_time": "9:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14058, "total_steps": 17941, "loss": 1.5679, "learning_rate": 1.1502618361868572e-05, "epoch": 0.7835683629675047, "percentage": 78.36, "elapsed_time": "1 day, 9:16:21", "remaining_time": "9:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14059, "total_steps": 17941, "loss": 1.6907, "learning_rate": 1.149693711614494e-05, "epoch": 0.7836241012206677, "percentage": 78.36, "elapsed_time": "1 day, 9:16:30", "remaining_time": "9:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14060, "total_steps": 17941, "loss": 1.4673, "learning_rate": 1.1491257091513974e-05, "epoch": 0.7836798394738309, "percentage": 78.37, "elapsed_time": "1 day, 9:16:38", "remaining_time": "9:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14061, "total_steps": 17941, "loss": 1.4492, "learning_rate": 1.1485578288155813e-05, "epoch": 0.783735577726994, "percentage": 78.37, "elapsed_time": "1 day, 9:16:47", "remaining_time": "9:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14062, "total_steps": 17941, "loss": 1.6429, "learning_rate": 1.1479900706250552e-05, "epoch": 0.7837913159801572, "percentage": 78.38, "elapsed_time": "1 day, 9:16:55", "remaining_time": "9:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14063, "total_steps": 17941, "loss": 1.6883, "learning_rate": 1.1474224345978268e-05, "epoch": 0.7838470542333204, "percentage": 78.38, "elapsed_time": "1 day, 9:17:04", "remaining_time": "9:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14064, "total_steps": 17941, "loss": 1.6511, "learning_rate": 1.1468549207518953e-05, "epoch": 0.7839027924864834, "percentage": 78.39, "elapsed_time": "1 day, 9:17:12", "remaining_time": "9:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14065, "total_steps": 17941, "loss": 1.7315, "learning_rate": 1.1462875291052604e-05, "epoch": 0.7839585307396466, "percentage": 78.4, "elapsed_time": "1 day, 9:17:21", "remaining_time": "9:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14066, "total_steps": 17941, "loss": 1.2648, "learning_rate": 1.1457202596759165e-05, "epoch": 0.7840142689928098, "percentage": 78.4, "elapsed_time": "1 day, 9:17:29", "remaining_time": "9:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14067, "total_steps": 17941, "loss": 1.5514, "learning_rate": 1.1451531124818548e-05, "epoch": 0.7840700072459729, "percentage": 78.41, "elapsed_time": "1 day, 9:17:38", "remaining_time": "9:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14068, "total_steps": 17941, "loss": 1.5198, "learning_rate": 1.1445860875410586e-05, "epoch": 0.784125745499136, "percentage": 78.41, "elapsed_time": "1 day, 9:17:47", "remaining_time": "9:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14069, "total_steps": 17941, "loss": 1.6896, "learning_rate": 1.1440191848715143e-05, "epoch": 0.7841814837522992, "percentage": 78.42, "elapsed_time": "1 day, 9:17:56", "remaining_time": "9:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14070, "total_steps": 17941, "loss": 1.4559, "learning_rate": 1.1434524044912009e-05, "epoch": 0.7842372220054623, "percentage": 78.42, "elapsed_time": "1 day, 9:18:04", "remaining_time": "9:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14071, "total_steps": 17941, "loss": 1.6122, "learning_rate": 1.1428857464180908e-05, "epoch": 0.7842929602586255, "percentage": 78.43, "elapsed_time": "1 day, 9:18:13", "remaining_time": "9:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14072, "total_steps": 17941, "loss": 1.7864, "learning_rate": 1.1423192106701563e-05, "epoch": 0.7843486985117887, "percentage": 78.43, "elapsed_time": "1 day, 9:18:21", "remaining_time": "9:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14073, "total_steps": 17941, "loss": 1.6808, "learning_rate": 1.1417527972653647e-05, "epoch": 0.7844044367649518, "percentage": 78.44, "elapsed_time": "1 day, 9:18:30", "remaining_time": "9:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14074, "total_steps": 17941, "loss": 1.7022, "learning_rate": 1.1411865062216792e-05, "epoch": 0.7844601750181149, "percentage": 78.45, "elapsed_time": "1 day, 9:18:38", "remaining_time": "9:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14075, "total_steps": 17941, "loss": 1.5988, "learning_rate": 1.140620337557059e-05, "epoch": 0.7845159132712781, "percentage": 78.45, "elapsed_time": "1 day, 9:18:47", "remaining_time": "9:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14076, "total_steps": 17941, "loss": 1.5858, "learning_rate": 1.1400542912894602e-05, "epoch": 0.7845716515244412, "percentage": 78.46, "elapsed_time": "1 day, 9:18:56", "remaining_time": "9:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14077, "total_steps": 17941, "loss": 1.795, "learning_rate": 1.1394883674368356e-05, "epoch": 0.7846273897776044, "percentage": 78.46, "elapsed_time": "1 day, 9:19:04", "remaining_time": "9:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14078, "total_steps": 17941, "loss": 1.7813, "learning_rate": 1.1389225660171299e-05, "epoch": 0.7846831280307676, "percentage": 78.47, "elapsed_time": "1 day, 9:19:13", "remaining_time": "9:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14079, "total_steps": 17941, "loss": 1.6134, "learning_rate": 1.1383568870482891e-05, "epoch": 0.7847388662839306, "percentage": 78.47, "elapsed_time": "1 day, 9:19:21", "remaining_time": "9:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14080, "total_steps": 17941, "loss": 1.6329, "learning_rate": 1.137791330548253e-05, "epoch": 0.7847946045370938, "percentage": 78.48, "elapsed_time": "1 day, 9:19:29", "remaining_time": "9:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14081, "total_steps": 17941, "loss": 1.6439, "learning_rate": 1.1372258965349575e-05, "epoch": 0.784850342790257, "percentage": 78.49, "elapsed_time": "1 day, 9:19:38", "remaining_time": "9:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14082, "total_steps": 17941, "loss": 1.5401, "learning_rate": 1.1366605850263368e-05, "epoch": 0.7849060810434201, "percentage": 78.49, "elapsed_time": "1 day, 9:19:47", "remaining_time": "9:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14083, "total_steps": 17941, "loss": 1.7608, "learning_rate": 1.1360953960403142e-05, "epoch": 0.7849618192965833, "percentage": 78.5, "elapsed_time": "1 day, 9:19:55", "remaining_time": "9:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14084, "total_steps": 17941, "loss": 1.7358, "learning_rate": 1.1355303295948205e-05, "epoch": 0.7850175575497463, "percentage": 78.5, "elapsed_time": "1 day, 9:20:03", "remaining_time": "9:07:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14085, "total_steps": 17941, "loss": 1.7373, "learning_rate": 1.1349653857077718e-05, "epoch": 0.7850732958029095, "percentage": 78.51, "elapsed_time": "1 day, 9:20:12", "remaining_time": "9:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14086, "total_steps": 17941, "loss": 1.6794, "learning_rate": 1.1344005643970863e-05, "epoch": 0.7851290340560727, "percentage": 78.51, "elapsed_time": "1 day, 9:20:20", "remaining_time": "9:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14087, "total_steps": 17941, "loss": 1.7308, "learning_rate": 1.1338358656806769e-05, "epoch": 0.7851847723092358, "percentage": 78.52, "elapsed_time": "1 day, 9:20:29", "remaining_time": "9:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14088, "total_steps": 17941, "loss": 1.602, "learning_rate": 1.133271289576453e-05, "epoch": 0.785240510562399, "percentage": 78.52, "elapsed_time": "1 day, 9:20:38", "remaining_time": "9:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14089, "total_steps": 17941, "loss": 1.803, "learning_rate": 1.1327068361023202e-05, "epoch": 0.7852962488155621, "percentage": 78.53, "elapsed_time": "1 day, 9:20:46", "remaining_time": "9:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14090, "total_steps": 17941, "loss": 1.4317, "learning_rate": 1.132142505276177e-05, "epoch": 0.7853519870687252, "percentage": 78.54, "elapsed_time": "1 day, 9:20:55", "remaining_time": "9:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14091, "total_steps": 17941, "loss": 1.6327, "learning_rate": 1.1315782971159227e-05, "epoch": 0.7854077253218884, "percentage": 78.54, "elapsed_time": "1 day, 9:21:03", "remaining_time": "9:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14092, "total_steps": 17941, "loss": 1.7124, "learning_rate": 1.1310142116394506e-05, "epoch": 0.7854634635750516, "percentage": 78.55, "elapsed_time": "1 day, 9:21:12", "remaining_time": "9:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14093, "total_steps": 17941, "loss": 1.7282, "learning_rate": 1.1304502488646513e-05, "epoch": 0.7855192018282147, "percentage": 78.55, "elapsed_time": "1 day, 9:21:20", "remaining_time": "9:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14094, "total_steps": 17941, "loss": 1.3171, "learning_rate": 1.1298864088094058e-05, "epoch": 0.7855749400813778, "percentage": 78.56, "elapsed_time": "1 day, 9:21:29", "remaining_time": "9:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14095, "total_steps": 17941, "loss": 1.52, "learning_rate": 1.1293226914916006e-05, "epoch": 0.785630678334541, "percentage": 78.56, "elapsed_time": "1 day, 9:21:38", "remaining_time": "9:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14096, "total_steps": 17941, "loss": 1.6558, "learning_rate": 1.128759096929114e-05, "epoch": 0.7856864165877041, "percentage": 78.57, "elapsed_time": "1 day, 9:21:46", "remaining_time": "9:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14097, "total_steps": 17941, "loss": 1.6298, "learning_rate": 1.1281956251398157e-05, "epoch": 0.7857421548408673, "percentage": 78.57, "elapsed_time": "1 day, 9:21:55", "remaining_time": "9:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14098, "total_steps": 17941, "loss": 1.4396, "learning_rate": 1.1276322761415786e-05, "epoch": 0.7857978930940305, "percentage": 78.58, "elapsed_time": "1 day, 9:22:03", "remaining_time": "9:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14099, "total_steps": 17941, "loss": 2.072, "learning_rate": 1.127069049952268e-05, "epoch": 0.7858536313471935, "percentage": 78.59, "elapsed_time": "1 day, 9:22:12", "remaining_time": "9:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14100, "total_steps": 17941, "loss": 1.6547, "learning_rate": 1.1265059465897465e-05, "epoch": 0.7859093696003567, "percentage": 78.59, "elapsed_time": "1 day, 9:22:20", "remaining_time": "9:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14101, "total_steps": 17941, "loss": 1.6223, "learning_rate": 1.1259429660718723e-05, "epoch": 0.7859651078535199, "percentage": 78.6, "elapsed_time": "1 day, 9:22:28", "remaining_time": "9:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14102, "total_steps": 17941, "loss": 1.632, "learning_rate": 1.1253801084164995e-05, "epoch": 0.786020846106683, "percentage": 78.6, "elapsed_time": "1 day, 9:22:37", "remaining_time": "9:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14103, "total_steps": 17941, "loss": 1.7907, "learning_rate": 1.1248173736414808e-05, "epoch": 0.7860765843598462, "percentage": 78.61, "elapsed_time": "1 day, 9:22:46", "remaining_time": "9:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14104, "total_steps": 17941, "loss": 1.7747, "learning_rate": 1.1242547617646598e-05, "epoch": 0.7861323226130094, "percentage": 78.61, "elapsed_time": "1 day, 9:22:54", "remaining_time": "9:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14105, "total_steps": 17941, "loss": 1.5891, "learning_rate": 1.1236922728038807e-05, "epoch": 0.7861880608661724, "percentage": 78.62, "elapsed_time": "1 day, 9:23:03", "remaining_time": "9:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14106, "total_steps": 17941, "loss": 1.5138, "learning_rate": 1.1231299067769818e-05, "epoch": 0.7862437991193356, "percentage": 78.62, "elapsed_time": "1 day, 9:23:11", "remaining_time": "9:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14107, "total_steps": 17941, "loss": 1.5725, "learning_rate": 1.122567663701799e-05, "epoch": 0.7862995373724987, "percentage": 78.63, "elapsed_time": "1 day, 9:23:20", "remaining_time": "9:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14108, "total_steps": 17941, "loss": 1.8054, "learning_rate": 1.122005543596164e-05, "epoch": 0.7863552756256619, "percentage": 78.64, "elapsed_time": "1 day, 9:23:28", "remaining_time": "9:04:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14109, "total_steps": 17941, "loss": 1.6492, "learning_rate": 1.1214435464779006e-05, "epoch": 0.7864110138788251, "percentage": 78.64, "elapsed_time": "1 day, 9:23:37", "remaining_time": "9:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14110, "total_steps": 17941, "loss": 1.5806, "learning_rate": 1.1208816723648364e-05, "epoch": 0.7864667521319881, "percentage": 78.65, "elapsed_time": "1 day, 9:23:45", "remaining_time": "9:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14111, "total_steps": 17941, "loss": 1.691, "learning_rate": 1.1203199212747878e-05, "epoch": 0.7865224903851513, "percentage": 78.65, "elapsed_time": "1 day, 9:23:53", "remaining_time": "9:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14112, "total_steps": 17941, "loss": 1.7296, "learning_rate": 1.1197582932255712e-05, "epoch": 0.7865782286383145, "percentage": 78.66, "elapsed_time": "1 day, 9:24:02", "remaining_time": "9:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14113, "total_steps": 17941, "loss": 1.5213, "learning_rate": 1.119196788234998e-05, "epoch": 0.7866339668914776, "percentage": 78.66, "elapsed_time": "1 day, 9:24:11", "remaining_time": "9:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14114, "total_steps": 17941, "loss": 1.6295, "learning_rate": 1.1186354063208759e-05, "epoch": 0.7866897051446408, "percentage": 78.67, "elapsed_time": "1 day, 9:24:19", "remaining_time": "9:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14115, "total_steps": 17941, "loss": 1.5283, "learning_rate": 1.1180741475010104e-05, "epoch": 0.786745443397804, "percentage": 78.67, "elapsed_time": "1 day, 9:24:27", "remaining_time": "9:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14116, "total_steps": 17941, "loss": 1.3781, "learning_rate": 1.1175130117931987e-05, "epoch": 0.786801181650967, "percentage": 78.68, "elapsed_time": "1 day, 9:24:36", "remaining_time": "9:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14117, "total_steps": 17941, "loss": 1.554, "learning_rate": 1.1169519992152372e-05, "epoch": 0.7868569199041302, "percentage": 78.69, "elapsed_time": "1 day, 9:24:45", "remaining_time": "9:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14118, "total_steps": 17941, "loss": 1.5795, "learning_rate": 1.1163911097849189e-05, "epoch": 0.7869126581572934, "percentage": 78.69, "elapsed_time": "1 day, 9:24:54", "remaining_time": "9:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14119, "total_steps": 17941, "loss": 1.7236, "learning_rate": 1.1158303435200324e-05, "epoch": 0.7869683964104565, "percentage": 78.7, "elapsed_time": "1 day, 9:25:02", "remaining_time": "9:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14120, "total_steps": 17941, "loss": 1.7392, "learning_rate": 1.115269700438359e-05, "epoch": 0.7870241346636196, "percentage": 78.7, "elapsed_time": "1 day, 9:25:11", "remaining_time": "9:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14121, "total_steps": 17941, "loss": 1.6407, "learning_rate": 1.114709180557682e-05, "epoch": 0.7870798729167828, "percentage": 78.71, "elapsed_time": "1 day, 9:25:19", "remaining_time": "9:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14122, "total_steps": 17941, "loss": 1.6539, "learning_rate": 1.1141487838957787e-05, "epoch": 0.7871356111699459, "percentage": 78.71, "elapsed_time": "1 day, 9:25:27", "remaining_time": "9:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14123, "total_steps": 17941, "loss": 1.3411, "learning_rate": 1.1135885104704186e-05, "epoch": 0.7871913494231091, "percentage": 78.72, "elapsed_time": "1 day, 9:25:36", "remaining_time": "9:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14124, "total_steps": 17941, "loss": 1.6036, "learning_rate": 1.1130283602993718e-05, "epoch": 0.7872470876762723, "percentage": 78.72, "elapsed_time": "1 day, 9:25:45", "remaining_time": "9:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14125, "total_steps": 17941, "loss": 1.8074, "learning_rate": 1.1124683334004021e-05, "epoch": 0.7873028259294353, "percentage": 78.73, "elapsed_time": "1 day, 9:25:53", "remaining_time": "9:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14126, "total_steps": 17941, "loss": 1.893, "learning_rate": 1.1119084297912729e-05, "epoch": 0.7873585641825985, "percentage": 78.74, "elapsed_time": "1 day, 9:26:02", "remaining_time": "9:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14127, "total_steps": 17941, "loss": 1.5241, "learning_rate": 1.1113486494897363e-05, "epoch": 0.7874143024357617, "percentage": 78.74, "elapsed_time": "1 day, 9:26:10", "remaining_time": "9:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14128, "total_steps": 17941, "loss": 1.4693, "learning_rate": 1.1107889925135495e-05, "epoch": 0.7874700406889248, "percentage": 78.75, "elapsed_time": "1 day, 9:26:18", "remaining_time": "9:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14129, "total_steps": 17941, "loss": 1.8778, "learning_rate": 1.1102294588804613e-05, "epoch": 0.787525778942088, "percentage": 78.75, "elapsed_time": "1 day, 9:26:27", "remaining_time": "9:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14130, "total_steps": 17941, "loss": 1.5998, "learning_rate": 1.1096700486082146e-05, "epoch": 0.787581517195251, "percentage": 78.76, "elapsed_time": "1 day, 9:26:36", "remaining_time": "9:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14131, "total_steps": 17941, "loss": 1.473, "learning_rate": 1.1091107617145519e-05, "epoch": 0.7876372554484142, "percentage": 78.76, "elapsed_time": "1 day, 9:26:45", "remaining_time": "9:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14132, "total_steps": 17941, "loss": 1.4516, "learning_rate": 1.10855159821721e-05, "epoch": 0.7876929937015774, "percentage": 78.77, "elapsed_time": "1 day, 9:26:53", "remaining_time": "9:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14133, "total_steps": 17941, "loss": 1.8915, "learning_rate": 1.1079925581339229e-05, "epoch": 0.7877487319547405, "percentage": 78.77, "elapsed_time": "1 day, 9:27:01", "remaining_time": "9:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14134, "total_steps": 17941, "loss": 1.5509, "learning_rate": 1.1074336414824215e-05, "epoch": 0.7878044702079037, "percentage": 78.78, "elapsed_time": "1 day, 9:27:10", "remaining_time": "9:00:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14135, "total_steps": 17941, "loss": 1.4576, "learning_rate": 1.1068748482804264e-05, "epoch": 0.7878602084610669, "percentage": 78.79, "elapsed_time": "1 day, 9:27:18", "remaining_time": "9:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14136, "total_steps": 17941, "loss": 1.8418, "learning_rate": 1.106316178545666e-05, "epoch": 0.7879159467142299, "percentage": 78.79, "elapsed_time": "1 day, 9:27:27", "remaining_time": "9:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14137, "total_steps": 17941, "loss": 1.6923, "learning_rate": 1.105757632295853e-05, "epoch": 0.7879716849673931, "percentage": 78.8, "elapsed_time": "1 day, 9:27:35", "remaining_time": "9:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14138, "total_steps": 17941, "loss": 1.6677, "learning_rate": 1.1051992095487029e-05, "epoch": 0.7880274232205563, "percentage": 78.8, "elapsed_time": "1 day, 9:27:44", "remaining_time": "9:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14139, "total_steps": 17941, "loss": 2.0795, "learning_rate": 1.1046409103219251e-05, "epoch": 0.7880831614737194, "percentage": 78.81, "elapsed_time": "1 day, 9:27:52", "remaining_time": "8:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14140, "total_steps": 17941, "loss": 1.572, "learning_rate": 1.1040827346332272e-05, "epoch": 0.7881388997268826, "percentage": 78.81, "elapsed_time": "1 day, 9:28:01", "remaining_time": "8:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14141, "total_steps": 17941, "loss": 1.7121, "learning_rate": 1.103524682500311e-05, "epoch": 0.7881946379800457, "percentage": 78.82, "elapsed_time": "1 day, 9:28:09", "remaining_time": "8:59:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14142, "total_steps": 17941, "loss": 1.8675, "learning_rate": 1.1029667539408723e-05, "epoch": 0.7882503762332088, "percentage": 78.83, "elapsed_time": "1 day, 9:28:18", "remaining_time": "8:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14143, "total_steps": 17941, "loss": 1.7795, "learning_rate": 1.102408948972607e-05, "epoch": 0.788306114486372, "percentage": 78.83, "elapsed_time": "1 day, 9:28:26", "remaining_time": "8:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14144, "total_steps": 17941, "loss": 1.3756, "learning_rate": 1.1018512676132054e-05, "epoch": 0.7883618527395352, "percentage": 78.84, "elapsed_time": "1 day, 9:28:35", "remaining_time": "8:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14145, "total_steps": 17941, "loss": 1.5751, "learning_rate": 1.101293709880355e-05, "epoch": 0.7884175909926983, "percentage": 78.84, "elapsed_time": "1 day, 9:28:43", "remaining_time": "8:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14146, "total_steps": 17941, "loss": 1.5829, "learning_rate": 1.1007362757917344e-05, "epoch": 0.7884733292458614, "percentage": 78.85, "elapsed_time": "1 day, 9:28:51", "remaining_time": "8:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14147, "total_steps": 17941, "loss": 1.6555, "learning_rate": 1.1001789653650264e-05, "epoch": 0.7885290674990246, "percentage": 78.85, "elapsed_time": "1 day, 9:29:00", "remaining_time": "8:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14148, "total_steps": 17941, "loss": 1.8102, "learning_rate": 1.0996217786179052e-05, "epoch": 0.7885848057521877, "percentage": 78.86, "elapsed_time": "1 day, 9:29:08", "remaining_time": "8:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14149, "total_steps": 17941, "loss": 1.6791, "learning_rate": 1.099064715568039e-05, "epoch": 0.7886405440053509, "percentage": 78.86, "elapsed_time": "1 day, 9:29:17", "remaining_time": "8:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14150, "total_steps": 17941, "loss": 1.6076, "learning_rate": 1.0985077762330963e-05, "epoch": 0.7886962822585141, "percentage": 78.87, "elapsed_time": "1 day, 9:29:25", "remaining_time": "8:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14151, "total_steps": 17941, "loss": 1.6604, "learning_rate": 1.0979509606307398e-05, "epoch": 0.7887520205116771, "percentage": 78.88, "elapsed_time": "1 day, 9:29:34", "remaining_time": "8:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14152, "total_steps": 17941, "loss": 1.588, "learning_rate": 1.0973942687786293e-05, "epoch": 0.7888077587648403, "percentage": 78.88, "elapsed_time": "1 day, 9:29:42", "remaining_time": "8:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14153, "total_steps": 17941, "loss": 1.4434, "learning_rate": 1.0968377006944158e-05, "epoch": 0.7888634970180034, "percentage": 78.89, "elapsed_time": "1 day, 9:29:51", "remaining_time": "8:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14154, "total_steps": 17941, "loss": 1.5954, "learning_rate": 1.0962812563957552e-05, "epoch": 0.7889192352711666, "percentage": 78.89, "elapsed_time": "1 day, 9:29:59", "remaining_time": "8:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14155, "total_steps": 17941, "loss": 1.359, "learning_rate": 1.095724935900294e-05, "epoch": 0.7889749735243298, "percentage": 78.9, "elapsed_time": "1 day, 9:30:08", "remaining_time": "8:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14156, "total_steps": 17941, "loss": 1.5071, "learning_rate": 1.0951687392256738e-05, "epoch": 0.7890307117774928, "percentage": 78.9, "elapsed_time": "1 day, 9:30:16", "remaining_time": "8:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14157, "total_steps": 17941, "loss": 1.7058, "learning_rate": 1.0946126663895335e-05, "epoch": 0.789086450030656, "percentage": 78.91, "elapsed_time": "1 day, 9:30:25", "remaining_time": "8:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14158, "total_steps": 17941, "loss": 1.6391, "learning_rate": 1.0940567174095101e-05, "epoch": 0.7891421882838192, "percentage": 78.91, "elapsed_time": "1 day, 9:30:33", "remaining_time": "8:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14159, "total_steps": 17941, "loss": 1.3799, "learning_rate": 1.0935008923032336e-05, "epoch": 0.7891979265369823, "percentage": 78.92, "elapsed_time": "1 day, 9:30:41", "remaining_time": "8:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14160, "total_steps": 17941, "loss": 1.5895, "learning_rate": 1.0929451910883343e-05, "epoch": 0.7892536647901455, "percentage": 78.93, "elapsed_time": "1 day, 9:30:50", "remaining_time": "8:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14161, "total_steps": 17941, "loss": 1.3587, "learning_rate": 1.0923896137824308e-05, "epoch": 0.7893094030433087, "percentage": 78.93, "elapsed_time": "1 day, 9:30:58", "remaining_time": "8:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14162, "total_steps": 17941, "loss": 1.6722, "learning_rate": 1.0918341604031491e-05, "epoch": 0.7893651412964717, "percentage": 78.94, "elapsed_time": "1 day, 9:31:07", "remaining_time": "8:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14163, "total_steps": 17941, "loss": 1.3863, "learning_rate": 1.0912788309680999e-05, "epoch": 0.7894208795496349, "percentage": 78.94, "elapsed_time": "1 day, 9:31:15", "remaining_time": "8:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14164, "total_steps": 17941, "loss": 1.6009, "learning_rate": 1.0907236254948967e-05, "epoch": 0.7894766178027981, "percentage": 78.95, "elapsed_time": "1 day, 9:31:24", "remaining_time": "8:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14165, "total_steps": 17941, "loss": 1.5707, "learning_rate": 1.0901685440011471e-05, "epoch": 0.7895323560559612, "percentage": 78.95, "elapsed_time": "1 day, 9:31:33", "remaining_time": "8:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14166, "total_steps": 17941, "loss": 1.4619, "learning_rate": 1.089613586504456e-05, "epoch": 0.7895880943091244, "percentage": 78.96, "elapsed_time": "1 day, 9:31:41", "remaining_time": "8:56:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14167, "total_steps": 17941, "loss": 1.5639, "learning_rate": 1.0890587530224239e-05, "epoch": 0.7896438325622875, "percentage": 78.96, "elapsed_time": "1 day, 9:31:50", "remaining_time": "8:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14168, "total_steps": 17941, "loss": 1.7238, "learning_rate": 1.088504043572643e-05, "epoch": 0.7896995708154506, "percentage": 78.97, "elapsed_time": "1 day, 9:31:59", "remaining_time": "8:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14169, "total_steps": 17941, "loss": 1.5679, "learning_rate": 1.0879494581727112e-05, "epoch": 0.7897553090686138, "percentage": 78.98, "elapsed_time": "1 day, 9:32:07", "remaining_time": "8:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14170, "total_steps": 17941, "loss": 1.6117, "learning_rate": 1.087394996840212e-05, "epoch": 0.789811047321777, "percentage": 78.98, "elapsed_time": "1 day, 9:32:16", "remaining_time": "8:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14171, "total_steps": 17941, "loss": 1.5702, "learning_rate": 1.0868406595927327e-05, "epoch": 0.7898667855749401, "percentage": 78.99, "elapsed_time": "1 day, 9:32:24", "remaining_time": "8:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14172, "total_steps": 17941, "loss": 1.8501, "learning_rate": 1.0862864464478501e-05, "epoch": 0.7899225238281032, "percentage": 78.99, "elapsed_time": "1 day, 9:32:33", "remaining_time": "8:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14173, "total_steps": 17941, "loss": 1.7125, "learning_rate": 1.0857323574231443e-05, "epoch": 0.7899782620812664, "percentage": 79.0, "elapsed_time": "1 day, 9:32:41", "remaining_time": "8:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14174, "total_steps": 17941, "loss": 1.8166, "learning_rate": 1.0851783925361875e-05, "epoch": 0.7900340003344295, "percentage": 79.0, "elapsed_time": "1 day, 9:32:50", "remaining_time": "8:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14175, "total_steps": 17941, "loss": 1.5777, "learning_rate": 1.0846245518045457e-05, "epoch": 0.7900897385875927, "percentage": 79.01, "elapsed_time": "1 day, 9:32:58", "remaining_time": "8:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14176, "total_steps": 17941, "loss": 1.8449, "learning_rate": 1.0840708352457851e-05, "epoch": 0.7901454768407558, "percentage": 79.01, "elapsed_time": "1 day, 9:33:07", "remaining_time": "8:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14177, "total_steps": 17941, "loss": 1.8072, "learning_rate": 1.0835172428774659e-05, "epoch": 0.7902012150939189, "percentage": 79.02, "elapsed_time": "1 day, 9:33:15", "remaining_time": "8:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14178, "total_steps": 17941, "loss": 1.4591, "learning_rate": 1.0829637747171468e-05, "epoch": 0.7902569533470821, "percentage": 79.03, "elapsed_time": "1 day, 9:33:24", "remaining_time": "8:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14179, "total_steps": 17941, "loss": 1.5205, "learning_rate": 1.0824104307823756e-05, "epoch": 0.7903126916002452, "percentage": 79.03, "elapsed_time": "1 day, 9:33:32", "remaining_time": "8:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14180, "total_steps": 17941, "loss": 1.5751, "learning_rate": 1.081857211090706e-05, "epoch": 0.7903684298534084, "percentage": 79.04, "elapsed_time": "1 day, 9:33:41", "remaining_time": "8:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14181, "total_steps": 17941, "loss": 1.445, "learning_rate": 1.0813041156596826e-05, "epoch": 0.7904241681065716, "percentage": 79.04, "elapsed_time": "1 day, 9:33:49", "remaining_time": "8:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14182, "total_steps": 17941, "loss": 1.3204, "learning_rate": 1.080751144506844e-05, "epoch": 0.7904799063597346, "percentage": 79.05, "elapsed_time": "1 day, 9:33:58", "remaining_time": "8:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14183, "total_steps": 17941, "loss": 1.6754, "learning_rate": 1.0801982976497283e-05, "epoch": 0.7905356446128978, "percentage": 79.05, "elapsed_time": "1 day, 9:34:06", "remaining_time": "8:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14184, "total_steps": 17941, "loss": 1.685, "learning_rate": 1.0796455751058682e-05, "epoch": 0.790591382866061, "percentage": 79.06, "elapsed_time": "1 day, 9:34:15", "remaining_time": "8:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14185, "total_steps": 17941, "loss": 1.6895, "learning_rate": 1.0790929768927932e-05, "epoch": 0.7906471211192241, "percentage": 79.06, "elapsed_time": "1 day, 9:34:23", "remaining_time": "8:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14186, "total_steps": 17941, "loss": 1.512, "learning_rate": 1.0785405030280305e-05, "epoch": 0.7907028593723873, "percentage": 79.07, "elapsed_time": "1 day, 9:34:32", "remaining_time": "8:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14187, "total_steps": 17941, "loss": 1.6243, "learning_rate": 1.077988153529096e-05, "epoch": 0.7907585976255505, "percentage": 79.08, "elapsed_time": "1 day, 9:34:40", "remaining_time": "8:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14188, "total_steps": 17941, "loss": 1.5732, "learning_rate": 1.0774359284135133e-05, "epoch": 0.7908143358787135, "percentage": 79.08, "elapsed_time": "1 day, 9:34:49", "remaining_time": "8:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14189, "total_steps": 17941, "loss": 1.7611, "learning_rate": 1.0768838276987914e-05, "epoch": 0.7908700741318767, "percentage": 79.09, "elapsed_time": "1 day, 9:34:57", "remaining_time": "8:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14190, "total_steps": 17941, "loss": 1.5442, "learning_rate": 1.0763318514024412e-05, "epoch": 0.7909258123850399, "percentage": 79.09, "elapsed_time": "1 day, 9:35:06", "remaining_time": "8:52:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14191, "total_steps": 17941, "loss": 1.7336, "learning_rate": 1.0757799995419677e-05, "epoch": 0.790981550638203, "percentage": 79.1, "elapsed_time": "1 day, 9:35:15", "remaining_time": "8:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14192, "total_steps": 17941, "loss": 1.794, "learning_rate": 1.0752282721348733e-05, "epoch": 0.7910372888913662, "percentage": 79.1, "elapsed_time": "1 day, 9:35:23", "remaining_time": "8:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14193, "total_steps": 17941, "loss": 1.7035, "learning_rate": 1.0746766691986565e-05, "epoch": 0.7910930271445293, "percentage": 79.11, "elapsed_time": "1 day, 9:35:32", "remaining_time": "8:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14194, "total_steps": 17941, "loss": 1.5022, "learning_rate": 1.0741251907508065e-05, "epoch": 0.7911487653976924, "percentage": 79.11, "elapsed_time": "1 day, 9:35:40", "remaining_time": "8:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14195, "total_steps": 17941, "loss": 1.6407, "learning_rate": 1.0735738368088188e-05, "epoch": 0.7912045036508556, "percentage": 79.12, "elapsed_time": "1 day, 9:35:49", "remaining_time": "8:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14196, "total_steps": 17941, "loss": 1.5304, "learning_rate": 1.073022607390175e-05, "epoch": 0.7912602419040188, "percentage": 79.13, "elapsed_time": "1 day, 9:35:57", "remaining_time": "8:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14197, "total_steps": 17941, "loss": 1.6339, "learning_rate": 1.0724715025123599e-05, "epoch": 0.7913159801571819, "percentage": 79.13, "elapsed_time": "1 day, 9:36:06", "remaining_time": "8:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14198, "total_steps": 17941, "loss": 1.7463, "learning_rate": 1.0719205221928464e-05, "epoch": 0.791371718410345, "percentage": 79.14, "elapsed_time": "1 day, 9:36:14", "remaining_time": "8:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14199, "total_steps": 17941, "loss": 1.5111, "learning_rate": 1.0713696664491134e-05, "epoch": 0.7914274566635081, "percentage": 79.14, "elapsed_time": "1 day, 9:36:23", "remaining_time": "8:51:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14200, "total_steps": 17941, "loss": 1.5489, "learning_rate": 1.0708189352986304e-05, "epoch": 0.7914831949166713, "percentage": 79.15, "elapsed_time": "1 day, 9:36:31", "remaining_time": "8:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14201, "total_steps": 17941, "loss": 1.7422, "learning_rate": 1.0702683287588606e-05, "epoch": 0.7915389331698345, "percentage": 79.15, "elapsed_time": "1 day, 9:36:40", "remaining_time": "8:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14202, "total_steps": 17941, "loss": 1.6753, "learning_rate": 1.0697178468472674e-05, "epoch": 0.7915946714229976, "percentage": 79.16, "elapsed_time": "1 day, 9:36:48", "remaining_time": "8:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14203, "total_steps": 17941, "loss": 1.5724, "learning_rate": 1.0691674895813092e-05, "epoch": 0.7916504096761607, "percentage": 79.17, "elapsed_time": "1 day, 9:36:57", "remaining_time": "8:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14204, "total_steps": 17941, "loss": 1.6701, "learning_rate": 1.0686172569784415e-05, "epoch": 0.7917061479293239, "percentage": 79.17, "elapsed_time": "1 day, 9:37:06", "remaining_time": "8:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14205, "total_steps": 17941, "loss": 1.6701, "learning_rate": 1.0680671490561095e-05, "epoch": 0.791761886182487, "percentage": 79.18, "elapsed_time": "1 day, 9:37:14", "remaining_time": "8:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14206, "total_steps": 17941, "loss": 1.6881, "learning_rate": 1.0675171658317645e-05, "epoch": 0.7918176244356502, "percentage": 79.18, "elapsed_time": "1 day, 9:37:23", "remaining_time": "8:50:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14207, "total_steps": 17941, "loss": 1.7261, "learning_rate": 1.0669673073228482e-05, "epoch": 0.7918733626888134, "percentage": 79.19, "elapsed_time": "1 day, 9:37:32", "remaining_time": "8:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14208, "total_steps": 17941, "loss": 1.8894, "learning_rate": 1.0664175735467963e-05, "epoch": 0.7919291009419764, "percentage": 79.19, "elapsed_time": "1 day, 9:37:41", "remaining_time": "8:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14209, "total_steps": 17941, "loss": 1.4879, "learning_rate": 1.0658679645210445e-05, "epoch": 0.7919848391951396, "percentage": 79.2, "elapsed_time": "1 day, 9:37:49", "remaining_time": "8:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14210, "total_steps": 17941, "loss": 1.7824, "learning_rate": 1.065318480263024e-05, "epoch": 0.7920405774483028, "percentage": 79.2, "elapsed_time": "1 day, 9:37:58", "remaining_time": "8:49:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14211, "total_steps": 17941, "loss": 1.4463, "learning_rate": 1.06476912079016e-05, "epoch": 0.7920963157014659, "percentage": 79.21, "elapsed_time": "1 day, 9:38:06", "remaining_time": "8:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14212, "total_steps": 17941, "loss": 1.6579, "learning_rate": 1.0642198861198771e-05, "epoch": 0.7921520539546291, "percentage": 79.22, "elapsed_time": "1 day, 9:38:14", "remaining_time": "8:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14213, "total_steps": 17941, "loss": 1.6839, "learning_rate": 1.0636707762695891e-05, "epoch": 0.7922077922077922, "percentage": 79.22, "elapsed_time": "1 day, 9:38:23", "remaining_time": "8:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14214, "total_steps": 17941, "loss": 1.7319, "learning_rate": 1.0631217912567165e-05, "epoch": 0.7922635304609553, "percentage": 79.23, "elapsed_time": "1 day, 9:38:31", "remaining_time": "8:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14215, "total_steps": 17941, "loss": 1.7223, "learning_rate": 1.0625729310986659e-05, "epoch": 0.7923192687141185, "percentage": 79.23, "elapsed_time": "1 day, 9:38:40", "remaining_time": "8:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14216, "total_steps": 17941, "loss": 1.6946, "learning_rate": 1.0620241958128451e-05, "epoch": 0.7923750069672817, "percentage": 79.24, "elapsed_time": "1 day, 9:38:49", "remaining_time": "8:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14217, "total_steps": 17941, "loss": 1.7499, "learning_rate": 1.061475585416657e-05, "epoch": 0.7924307452204448, "percentage": 79.24, "elapsed_time": "1 day, 9:38:57", "remaining_time": "8:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14218, "total_steps": 17941, "loss": 1.6454, "learning_rate": 1.0609270999275e-05, "epoch": 0.792486483473608, "percentage": 79.25, "elapsed_time": "1 day, 9:39:06", "remaining_time": "8:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14219, "total_steps": 17941, "loss": 1.7257, "learning_rate": 1.0603787393627701e-05, "epoch": 0.7925422217267711, "percentage": 79.25, "elapsed_time": "1 day, 9:39:15", "remaining_time": "8:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14220, "total_steps": 17941, "loss": 1.5123, "learning_rate": 1.0598305037398543e-05, "epoch": 0.7925979599799342, "percentage": 79.26, "elapsed_time": "1 day, 9:39:24", "remaining_time": "8:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14221, "total_steps": 17941, "loss": 1.5896, "learning_rate": 1.0592823930761454e-05, "epoch": 0.7926536982330974, "percentage": 79.27, "elapsed_time": "1 day, 9:39:32", "remaining_time": "8:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14222, "total_steps": 17941, "loss": 1.6032, "learning_rate": 1.0587344073890209e-05, "epoch": 0.7927094364862605, "percentage": 79.27, "elapsed_time": "1 day, 9:39:41", "remaining_time": "8:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14223, "total_steps": 17941, "loss": 1.685, "learning_rate": 1.058186546695864e-05, "epoch": 0.7927651747394237, "percentage": 79.28, "elapsed_time": "1 day, 9:39:49", "remaining_time": "8:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14224, "total_steps": 17941, "loss": 1.4667, "learning_rate": 1.0576388110140444e-05, "epoch": 0.7928209129925868, "percentage": 79.28, "elapsed_time": "1 day, 9:39:58", "remaining_time": "8:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14225, "total_steps": 17941, "loss": 1.7501, "learning_rate": 1.0570912003609374e-05, "epoch": 0.7928766512457499, "percentage": 79.29, "elapsed_time": "1 day, 9:40:06", "remaining_time": "8:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14226, "total_steps": 17941, "loss": 1.6845, "learning_rate": 1.0565437147539104e-05, "epoch": 0.7929323894989131, "percentage": 79.29, "elapsed_time": "1 day, 9:40:15", "remaining_time": "8:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14227, "total_steps": 17941, "loss": 1.6876, "learning_rate": 1.055996354210323e-05, "epoch": 0.7929881277520763, "percentage": 79.3, "elapsed_time": "1 day, 9:40:23", "remaining_time": "8:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14228, "total_steps": 17941, "loss": 1.6564, "learning_rate": 1.0554491187475363e-05, "epoch": 0.7930438660052394, "percentage": 79.3, "elapsed_time": "1 day, 9:40:32", "remaining_time": "8:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14229, "total_steps": 17941, "loss": 1.5664, "learning_rate": 1.0549020083829053e-05, "epoch": 0.7930996042584025, "percentage": 79.31, "elapsed_time": "1 day, 9:40:40", "remaining_time": "8:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14230, "total_steps": 17941, "loss": 1.6195, "learning_rate": 1.0543550231337824e-05, "epoch": 0.7931553425115657, "percentage": 79.32, "elapsed_time": "1 day, 9:40:49", "remaining_time": "8:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14231, "total_steps": 17941, "loss": 1.8589, "learning_rate": 1.0538081630175106e-05, "epoch": 0.7932110807647288, "percentage": 79.32, "elapsed_time": "1 day, 9:40:57", "remaining_time": "8:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14232, "total_steps": 17941, "loss": 1.5969, "learning_rate": 1.0532614280514374e-05, "epoch": 0.793266819017892, "percentage": 79.33, "elapsed_time": "1 day, 9:41:06", "remaining_time": "8:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14233, "total_steps": 17941, "loss": 1.914, "learning_rate": 1.0527148182529023e-05, "epoch": 0.7933225572710552, "percentage": 79.33, "elapsed_time": "1 day, 9:41:14", "remaining_time": "8:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14234, "total_steps": 17941, "loss": 1.5224, "learning_rate": 1.0521683336392374e-05, "epoch": 0.7933782955242182, "percentage": 79.34, "elapsed_time": "1 day, 9:41:23", "remaining_time": "8:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14235, "total_steps": 17941, "loss": 1.7211, "learning_rate": 1.0516219742277755e-05, "epoch": 0.7934340337773814, "percentage": 79.34, "elapsed_time": "1 day, 9:41:31", "remaining_time": "8:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14236, "total_steps": 17941, "loss": 1.193, "learning_rate": 1.051075740035844e-05, "epoch": 0.7934897720305446, "percentage": 79.35, "elapsed_time": "1 day, 9:41:40", "remaining_time": "8:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14237, "total_steps": 17941, "loss": 1.7133, "learning_rate": 1.050529631080766e-05, "epoch": 0.7935455102837077, "percentage": 79.35, "elapsed_time": "1 day, 9:41:48", "remaining_time": "8:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14238, "total_steps": 17941, "loss": 1.4363, "learning_rate": 1.0499836473798624e-05, "epoch": 0.7936012485368709, "percentage": 79.36, "elapsed_time": "1 day, 9:41:56", "remaining_time": "8:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14239, "total_steps": 17941, "loss": 1.4707, "learning_rate": 1.0494377889504448e-05, "epoch": 0.793656986790034, "percentage": 79.37, "elapsed_time": "1 day, 9:42:05", "remaining_time": "8:45:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14240, "total_steps": 17941, "loss": 1.5554, "learning_rate": 1.0488920558098298e-05, "epoch": 0.7937127250431971, "percentage": 79.37, "elapsed_time": "1 day, 9:42:13", "remaining_time": "8:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14241, "total_steps": 17941, "loss": 1.7977, "learning_rate": 1.0483464479753207e-05, "epoch": 0.7937684632963603, "percentage": 79.38, "elapsed_time": "1 day, 9:42:22", "remaining_time": "8:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14242, "total_steps": 17941, "loss": 1.5221, "learning_rate": 1.0478009654642229e-05, "epoch": 0.7938242015495235, "percentage": 79.38, "elapsed_time": "1 day, 9:42:31", "remaining_time": "8:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14243, "total_steps": 17941, "loss": 1.4287, "learning_rate": 1.047255608293835e-05, "epoch": 0.7938799398026866, "percentage": 79.39, "elapsed_time": "1 day, 9:42:40", "remaining_time": "8:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14244, "total_steps": 17941, "loss": 1.5659, "learning_rate": 1.0467103764814534e-05, "epoch": 0.7939356780558497, "percentage": 79.39, "elapsed_time": "1 day, 9:42:48", "remaining_time": "8:45:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14245, "total_steps": 17941, "loss": 1.8926, "learning_rate": 1.0461652700443708e-05, "epoch": 0.7939914163090128, "percentage": 79.4, "elapsed_time": "1 day, 9:42:57", "remaining_time": "8:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14246, "total_steps": 17941, "loss": 1.5393, "learning_rate": 1.0456202889998706e-05, "epoch": 0.794047154562176, "percentage": 79.4, "elapsed_time": "1 day, 9:43:05", "remaining_time": "8:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14247, "total_steps": 17941, "loss": 1.7159, "learning_rate": 1.0450754333652423e-05, "epoch": 0.7941028928153392, "percentage": 79.41, "elapsed_time": "1 day, 9:43:14", "remaining_time": "8:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14248, "total_steps": 17941, "loss": 1.7552, "learning_rate": 1.0445307031577606e-05, "epoch": 0.7941586310685023, "percentage": 79.42, "elapsed_time": "1 day, 9:43:22", "remaining_time": "8:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14249, "total_steps": 17941, "loss": 1.7994, "learning_rate": 1.0439860983947031e-05, "epoch": 0.7942143693216654, "percentage": 79.42, "elapsed_time": "1 day, 9:43:31", "remaining_time": "8:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14250, "total_steps": 17941, "loss": 1.6273, "learning_rate": 1.0434416190933415e-05, "epoch": 0.7942701075748286, "percentage": 79.43, "elapsed_time": "1 day, 9:43:39", "remaining_time": "8:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14251, "total_steps": 17941, "loss": 1.7099, "learning_rate": 1.0428972652709435e-05, "epoch": 0.7943258458279917, "percentage": 79.43, "elapsed_time": "1 day, 9:43:48", "remaining_time": "8:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14252, "total_steps": 17941, "loss": 1.4654, "learning_rate": 1.0423530369447736e-05, "epoch": 0.7943815840811549, "percentage": 79.44, "elapsed_time": "1 day, 9:43:56", "remaining_time": "8:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14253, "total_steps": 17941, "loss": 1.4411, "learning_rate": 1.0418089341320902e-05, "epoch": 0.7944373223343181, "percentage": 79.44, "elapsed_time": "1 day, 9:44:05", "remaining_time": "8:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14254, "total_steps": 17941, "loss": 1.6224, "learning_rate": 1.0412649568501487e-05, "epoch": 0.7944930605874811, "percentage": 79.45, "elapsed_time": "1 day, 9:44:13", "remaining_time": "8:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14255, "total_steps": 17941, "loss": 1.5888, "learning_rate": 1.0407211051162024e-05, "epoch": 0.7945487988406443, "percentage": 79.45, "elapsed_time": "1 day, 9:44:21", "remaining_time": "8:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14256, "total_steps": 17941, "loss": 1.6535, "learning_rate": 1.0401773789474994e-05, "epoch": 0.7946045370938075, "percentage": 79.46, "elapsed_time": "1 day, 9:44:30", "remaining_time": "8:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14257, "total_steps": 17941, "loss": 1.4711, "learning_rate": 1.0396337783612797e-05, "epoch": 0.7946602753469706, "percentage": 79.47, "elapsed_time": "1 day, 9:44:39", "remaining_time": "8:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14258, "total_steps": 17941, "loss": 1.838, "learning_rate": 1.0390903033747879e-05, "epoch": 0.7947160136001338, "percentage": 79.47, "elapsed_time": "1 day, 9:44:47", "remaining_time": "8:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14259, "total_steps": 17941, "loss": 1.7793, "learning_rate": 1.0385469540052589e-05, "epoch": 0.794771751853297, "percentage": 79.48, "elapsed_time": "1 day, 9:44:55", "remaining_time": "8:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14260, "total_steps": 17941, "loss": 1.6085, "learning_rate": 1.0380037302699225e-05, "epoch": 0.79482749010646, "percentage": 79.48, "elapsed_time": "1 day, 9:45:04", "remaining_time": "8:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14261, "total_steps": 17941, "loss": 1.8404, "learning_rate": 1.0374606321860076e-05, "epoch": 0.7948832283596232, "percentage": 79.49, "elapsed_time": "1 day, 9:45:12", "remaining_time": "8:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14262, "total_steps": 17941, "loss": 1.4937, "learning_rate": 1.0369176597707386e-05, "epoch": 0.7949389666127864, "percentage": 79.49, "elapsed_time": "1 day, 9:45:21", "remaining_time": "8:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14263, "total_steps": 17941, "loss": 1.7009, "learning_rate": 1.0363748130413358e-05, "epoch": 0.7949947048659495, "percentage": 79.5, "elapsed_time": "1 day, 9:45:29", "remaining_time": "8:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14264, "total_steps": 17941, "loss": 1.5766, "learning_rate": 1.0358320920150132e-05, "epoch": 0.7950504431191127, "percentage": 79.51, "elapsed_time": "1 day, 9:45:39", "remaining_time": "8:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14265, "total_steps": 17941, "loss": 1.6995, "learning_rate": 1.0352894967089833e-05, "epoch": 0.7951061813722758, "percentage": 79.51, "elapsed_time": "1 day, 9:45:47", "remaining_time": "8:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14266, "total_steps": 17941, "loss": 1.7647, "learning_rate": 1.0347470271404569e-05, "epoch": 0.7951619196254389, "percentage": 79.52, "elapsed_time": "1 day, 9:45:56", "remaining_time": "8:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14267, "total_steps": 17941, "loss": 1.3858, "learning_rate": 1.0342046833266339e-05, "epoch": 0.7952176578786021, "percentage": 79.52, "elapsed_time": "1 day, 9:46:04", "remaining_time": "8:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14268, "total_steps": 17941, "loss": 1.7127, "learning_rate": 1.033662465284717e-05, "epoch": 0.7952733961317652, "percentage": 79.53, "elapsed_time": "1 day, 9:46:13", "remaining_time": "8:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14269, "total_steps": 17941, "loss": 1.5011, "learning_rate": 1.033120373031901e-05, "epoch": 0.7953291343849284, "percentage": 79.53, "elapsed_time": "1 day, 9:46:21", "remaining_time": "8:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14270, "total_steps": 17941, "loss": 1.5378, "learning_rate": 1.0325784065853783e-05, "epoch": 0.7953848726380915, "percentage": 79.54, "elapsed_time": "1 day, 9:46:30", "remaining_time": "8:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14271, "total_steps": 17941, "loss": 1.7753, "learning_rate": 1.0320365659623377e-05, "epoch": 0.7954406108912546, "percentage": 79.54, "elapsed_time": "1 day, 9:46:38", "remaining_time": "8:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14272, "total_steps": 17941, "loss": 1.7533, "learning_rate": 1.0314948511799605e-05, "epoch": 0.7954963491444178, "percentage": 79.55, "elapsed_time": "1 day, 9:46:47", "remaining_time": "8:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14273, "total_steps": 17941, "loss": 1.7726, "learning_rate": 1.0309532622554308e-05, "epoch": 0.795552087397581, "percentage": 79.56, "elapsed_time": "1 day, 9:46:55", "remaining_time": "8:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14274, "total_steps": 17941, "loss": 1.7032, "learning_rate": 1.0304117992059215e-05, "epoch": 0.7956078256507441, "percentage": 79.56, "elapsed_time": "1 day, 9:47:04", "remaining_time": "8:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14275, "total_steps": 17941, "loss": 1.648, "learning_rate": 1.0298704620486055e-05, "epoch": 0.7956635639039072, "percentage": 79.57, "elapsed_time": "1 day, 9:47:13", "remaining_time": "8:40:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14276, "total_steps": 17941, "loss": 1.8069, "learning_rate": 1.0293292508006507e-05, "epoch": 0.7957193021570704, "percentage": 79.57, "elapsed_time": "1 day, 9:47:22", "remaining_time": "8:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14277, "total_steps": 17941, "loss": 1.643, "learning_rate": 1.028788165479222e-05, "epoch": 0.7957750404102335, "percentage": 79.58, "elapsed_time": "1 day, 9:47:30", "remaining_time": "8:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14278, "total_steps": 17941, "loss": 1.4351, "learning_rate": 1.0282472061014797e-05, "epoch": 0.7958307786633967, "percentage": 79.58, "elapsed_time": "1 day, 9:47:39", "remaining_time": "8:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14279, "total_steps": 17941, "loss": 1.6967, "learning_rate": 1.0277063726845781e-05, "epoch": 0.7958865169165599, "percentage": 79.59, "elapsed_time": "1 day, 9:47:47", "remaining_time": "8:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14280, "total_steps": 17941, "loss": 1.7828, "learning_rate": 1.02716566524567e-05, "epoch": 0.795942255169723, "percentage": 79.59, "elapsed_time": "1 day, 9:47:56", "remaining_time": "8:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14281, "total_steps": 17941, "loss": 1.5625, "learning_rate": 1.0266250838019036e-05, "epoch": 0.7959979934228861, "percentage": 79.6, "elapsed_time": "1 day, 9:48:04", "remaining_time": "8:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14282, "total_steps": 17941, "loss": 1.607, "learning_rate": 1.026084628370425e-05, "epoch": 0.7960537316760493, "percentage": 79.61, "elapsed_time": "1 day, 9:48:13", "remaining_time": "8:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14283, "total_steps": 17941, "loss": 1.8911, "learning_rate": 1.0255442989683694e-05, "epoch": 0.7961094699292124, "percentage": 79.61, "elapsed_time": "1 day, 9:48:21", "remaining_time": "8:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14284, "total_steps": 17941, "loss": 1.6691, "learning_rate": 1.0250040956128776e-05, "epoch": 0.7961652081823756, "percentage": 79.62, "elapsed_time": "1 day, 9:48:30", "remaining_time": "8:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14285, "total_steps": 17941, "loss": 1.6303, "learning_rate": 1.0244640183210814e-05, "epoch": 0.7962209464355388, "percentage": 79.62, "elapsed_time": "1 day, 9:48:38", "remaining_time": "8:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14286, "total_steps": 17941, "loss": 1.7553, "learning_rate": 1.0239240671101063e-05, "epoch": 0.7962766846887018, "percentage": 79.63, "elapsed_time": "1 day, 9:48:47", "remaining_time": "8:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14287, "total_steps": 17941, "loss": 1.58, "learning_rate": 1.0233842419970773e-05, "epoch": 0.796332422941865, "percentage": 79.63, "elapsed_time": "1 day, 9:48:55", "remaining_time": "8:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14288, "total_steps": 17941, "loss": 1.5677, "learning_rate": 1.0228445429991151e-05, "epoch": 0.7963881611950282, "percentage": 79.64, "elapsed_time": "1 day, 9:49:05", "remaining_time": "8:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14289, "total_steps": 17941, "loss": 1.8649, "learning_rate": 1.0223049701333371e-05, "epoch": 0.7964438994481913, "percentage": 79.64, "elapsed_time": "1 day, 9:49:13", "remaining_time": "8:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14290, "total_steps": 17941, "loss": 1.7821, "learning_rate": 1.0217655234168522e-05, "epoch": 0.7964996377013545, "percentage": 79.65, "elapsed_time": "1 day, 9:49:22", "remaining_time": "8:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14291, "total_steps": 17941, "loss": 1.7406, "learning_rate": 1.0212262028667686e-05, "epoch": 0.7965553759545175, "percentage": 79.66, "elapsed_time": "1 day, 9:49:31", "remaining_time": "8:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14292, "total_steps": 17941, "loss": 1.6126, "learning_rate": 1.0206870085001952e-05, "epoch": 0.7966111142076807, "percentage": 79.66, "elapsed_time": "1 day, 9:49:39", "remaining_time": "8:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14293, "total_steps": 17941, "loss": 1.5392, "learning_rate": 1.0201479403342273e-05, "epoch": 0.7966668524608439, "percentage": 79.67, "elapsed_time": "1 day, 9:49:48", "remaining_time": "8:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14294, "total_steps": 17941, "loss": 1.4339, "learning_rate": 1.0196089983859624e-05, "epoch": 0.796722590714007, "percentage": 79.67, "elapsed_time": "1 day, 9:49:56", "remaining_time": "8:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14295, "total_steps": 17941, "loss": 1.6336, "learning_rate": 1.0190701826724929e-05, "epoch": 0.7967783289671702, "percentage": 79.68, "elapsed_time": "1 day, 9:50:05", "remaining_time": "8:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14296, "total_steps": 17941, "loss": 1.5615, "learning_rate": 1.0185314932109069e-05, "epoch": 0.7968340672203333, "percentage": 79.68, "elapsed_time": "1 day, 9:50:13", "remaining_time": "8:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14297, "total_steps": 17941, "loss": 1.4878, "learning_rate": 1.01799293001829e-05, "epoch": 0.7968898054734964, "percentage": 79.69, "elapsed_time": "1 day, 9:50:22", "remaining_time": "8:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14298, "total_steps": 17941, "loss": 1.6865, "learning_rate": 1.0174544931117175e-05, "epoch": 0.7969455437266596, "percentage": 79.69, "elapsed_time": "1 day, 9:50:31", "remaining_time": "8:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14299, "total_steps": 17941, "loss": 1.6865, "learning_rate": 1.0169161825082718e-05, "epoch": 0.7970012819798228, "percentage": 79.7, "elapsed_time": "1 day, 9:50:39", "remaining_time": "8:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14300, "total_steps": 17941, "loss": 1.6237, "learning_rate": 1.0163779982250199e-05, "epoch": 0.7970570202329859, "percentage": 79.71, "elapsed_time": "1 day, 9:50:48", "remaining_time": "8:37:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14301, "total_steps": 17941, "loss": 1.7827, "learning_rate": 1.015839940279032e-05, "epoch": 0.797112758486149, "percentage": 79.71, "elapsed_time": "1 day, 9:50:56", "remaining_time": "8:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14302, "total_steps": 17941, "loss": 1.4354, "learning_rate": 1.015302008687372e-05, "epoch": 0.7971684967393122, "percentage": 79.72, "elapsed_time": "1 day, 9:51:05", "remaining_time": "8:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14303, "total_steps": 17941, "loss": 1.6831, "learning_rate": 1.0147642034670996e-05, "epoch": 0.7972242349924753, "percentage": 79.72, "elapsed_time": "1 day, 9:51:13", "remaining_time": "8:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14304, "total_steps": 17941, "loss": 1.7572, "learning_rate": 1.0142265246352728e-05, "epoch": 0.7972799732456385, "percentage": 79.73, "elapsed_time": "1 day, 9:51:22", "remaining_time": "8:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14305, "total_steps": 17941, "loss": 1.6094, "learning_rate": 1.0136889722089404e-05, "epoch": 0.7973357114988017, "percentage": 79.73, "elapsed_time": "1 day, 9:51:30", "remaining_time": "8:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14306, "total_steps": 17941, "loss": 1.9664, "learning_rate": 1.0131515462051521e-05, "epoch": 0.7973914497519647, "percentage": 79.74, "elapsed_time": "1 day, 9:51:38", "remaining_time": "8:36:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14307, "total_steps": 17941, "loss": 1.7449, "learning_rate": 1.0126142466409517e-05, "epoch": 0.7974471880051279, "percentage": 79.74, "elapsed_time": "1 day, 9:51:47", "remaining_time": "8:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14308, "total_steps": 17941, "loss": 1.4495, "learning_rate": 1.0120770735333807e-05, "epoch": 0.7975029262582911, "percentage": 79.75, "elapsed_time": "1 day, 9:51:56", "remaining_time": "8:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14309, "total_steps": 17941, "loss": 1.5221, "learning_rate": 1.0115400268994713e-05, "epoch": 0.7975586645114542, "percentage": 79.76, "elapsed_time": "1 day, 9:52:04", "remaining_time": "8:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14310, "total_steps": 17941, "loss": 1.4912, "learning_rate": 1.0110031067562592e-05, "epoch": 0.7976144027646174, "percentage": 79.76, "elapsed_time": "1 day, 9:52:12", "remaining_time": "8:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14311, "total_steps": 17941, "loss": 1.7532, "learning_rate": 1.010466313120772e-05, "epoch": 0.7976701410177806, "percentage": 79.77, "elapsed_time": "1 day, 9:52:21", "remaining_time": "8:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14312, "total_steps": 17941, "loss": 1.7185, "learning_rate": 1.0099296460100322e-05, "epoch": 0.7977258792709436, "percentage": 79.77, "elapsed_time": "1 day, 9:52:30", "remaining_time": "8:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14313, "total_steps": 17941, "loss": 1.5657, "learning_rate": 1.0093931054410594e-05, "epoch": 0.7977816175241068, "percentage": 79.78, "elapsed_time": "1 day, 9:52:38", "remaining_time": "8:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14314, "total_steps": 17941, "loss": 1.6364, "learning_rate": 1.008856691430871e-05, "epoch": 0.7978373557772699, "percentage": 79.78, "elapsed_time": "1 day, 9:52:47", "remaining_time": "8:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14315, "total_steps": 17941, "loss": 1.5217, "learning_rate": 1.0083204039964794e-05, "epoch": 0.7978930940304331, "percentage": 79.79, "elapsed_time": "1 day, 9:52:55", "remaining_time": "8:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14316, "total_steps": 17941, "loss": 1.7008, "learning_rate": 1.0077842431548906e-05, "epoch": 0.7979488322835963, "percentage": 79.79, "elapsed_time": "1 day, 9:53:03", "remaining_time": "8:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14317, "total_steps": 17941, "loss": 1.5748, "learning_rate": 1.0072482089231078e-05, "epoch": 0.7980045705367593, "percentage": 79.8, "elapsed_time": "1 day, 9:53:12", "remaining_time": "8:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14318, "total_steps": 17941, "loss": 1.6165, "learning_rate": 1.006712301318135e-05, "epoch": 0.7980603087899225, "percentage": 79.81, "elapsed_time": "1 day, 9:53:20", "remaining_time": "8:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14319, "total_steps": 17941, "loss": 1.1837, "learning_rate": 1.0061765203569639e-05, "epoch": 0.7981160470430857, "percentage": 79.81, "elapsed_time": "1 day, 9:53:29", "remaining_time": "8:34:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14320, "total_steps": 17941, "loss": 1.7098, "learning_rate": 1.0056408660565885e-05, "epoch": 0.7981717852962488, "percentage": 79.82, "elapsed_time": "1 day, 9:53:37", "remaining_time": "8:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14321, "total_steps": 17941, "loss": 1.8916, "learning_rate": 1.0051053384339959e-05, "epoch": 0.798227523549412, "percentage": 79.82, "elapsed_time": "1 day, 9:53:46", "remaining_time": "8:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14322, "total_steps": 17941, "loss": 1.6068, "learning_rate": 1.0045699375061701e-05, "epoch": 0.7982832618025751, "percentage": 79.83, "elapsed_time": "1 day, 9:53:54", "remaining_time": "8:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14323, "total_steps": 17941, "loss": 1.5894, "learning_rate": 1.0040346632900921e-05, "epoch": 0.7983390000557382, "percentage": 79.83, "elapsed_time": "1 day, 9:54:03", "remaining_time": "8:33:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14324, "total_steps": 17941, "loss": 1.634, "learning_rate": 1.0034995158027343e-05, "epoch": 0.7983947383089014, "percentage": 79.84, "elapsed_time": "1 day, 9:54:11", "remaining_time": "8:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14325, "total_steps": 17941, "loss": 1.6313, "learning_rate": 1.0029644950610728e-05, "epoch": 0.7984504765620646, "percentage": 79.85, "elapsed_time": "1 day, 9:54:20", "remaining_time": "8:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14326, "total_steps": 17941, "loss": 1.5917, "learning_rate": 1.0024296010820721e-05, "epoch": 0.7985062148152277, "percentage": 79.85, "elapsed_time": "1 day, 9:54:28", "remaining_time": "8:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14327, "total_steps": 17941, "loss": 1.6068, "learning_rate": 1.0018948338826972e-05, "epoch": 0.7985619530683908, "percentage": 79.86, "elapsed_time": "1 day, 9:54:37", "remaining_time": "8:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14328, "total_steps": 17941, "loss": 1.7385, "learning_rate": 1.0013601934799072e-05, "epoch": 0.798617691321554, "percentage": 79.86, "elapsed_time": "1 day, 9:54:45", "remaining_time": "8:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14329, "total_steps": 17941, "loss": 1.6175, "learning_rate": 1.0008256798906585e-05, "epoch": 0.7986734295747171, "percentage": 79.87, "elapsed_time": "1 day, 9:54:54", "remaining_time": "8:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14330, "total_steps": 17941, "loss": 1.623, "learning_rate": 1.0002912931319036e-05, "epoch": 0.7987291678278803, "percentage": 79.87, "elapsed_time": "1 day, 9:55:02", "remaining_time": "8:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14331, "total_steps": 17941, "loss": 1.4983, "learning_rate": 9.997570332205875e-06, "epoch": 0.7987849060810435, "percentage": 79.88, "elapsed_time": "1 day, 9:55:10", "remaining_time": "8:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14332, "total_steps": 17941, "loss": 1.435, "learning_rate": 9.992229001736553e-06, "epoch": 0.7988406443342065, "percentage": 79.88, "elapsed_time": "1 day, 9:55:19", "remaining_time": "8:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14333, "total_steps": 17941, "loss": 1.4607, "learning_rate": 9.986888940080468e-06, "epoch": 0.7988963825873697, "percentage": 79.89, "elapsed_time": "1 day, 9:55:27", "remaining_time": "8:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14334, "total_steps": 17941, "loss": 1.556, "learning_rate": 9.981550147406987e-06, "epoch": 0.7989521208405329, "percentage": 79.9, "elapsed_time": "1 day, 9:55:37", "remaining_time": "8:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14335, "total_steps": 17941, "loss": 1.668, "learning_rate": 9.976212623885384e-06, "epoch": 0.799007859093696, "percentage": 79.9, "elapsed_time": "1 day, 9:55:46", "remaining_time": "8:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14336, "total_steps": 17941, "loss": 1.6566, "learning_rate": 9.970876369684973e-06, "epoch": 0.7990635973468592, "percentage": 79.91, "elapsed_time": "1 day, 9:55:54", "remaining_time": "8:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14337, "total_steps": 17941, "loss": 1.2366, "learning_rate": 9.96554138497499e-06, "epoch": 0.7991193356000222, "percentage": 79.91, "elapsed_time": "1 day, 9:56:02", "remaining_time": "8:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14338, "total_steps": 17941, "loss": 1.916, "learning_rate": 9.960207669924603e-06, "epoch": 0.7991750738531854, "percentage": 79.92, "elapsed_time": "1 day, 9:56:11", "remaining_time": "8:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14339, "total_steps": 17941, "loss": 1.5393, "learning_rate": 9.960207669924603e-06, "epoch": 0.7992308121063486, "percentage": 79.92, "elapsed_time": "1 day, 9:56:19", "remaining_time": "8:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14340, "total_steps": 17941, "loss": 1.5587, "learning_rate": 9.954875224702986e-06, "epoch": 0.7992865503595117, "percentage": 79.93, "elapsed_time": "1 day, 9:56:28", "remaining_time": "8:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14341, "total_steps": 17941, "loss": 1.4697, "learning_rate": 9.949544049479247e-06, "epoch": 0.7993422886126749, "percentage": 79.93, "elapsed_time": "1 day, 9:56:36", "remaining_time": "8:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14342, "total_steps": 17941, "loss": 1.3914, "learning_rate": 9.94421414442247e-06, "epoch": 0.799398026865838, "percentage": 79.94, "elapsed_time": "1 day, 9:56:45", "remaining_time": "8:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14343, "total_steps": 17941, "loss": 1.4728, "learning_rate": 9.938885509701657e-06, "epoch": 0.7994537651190011, "percentage": 79.95, "elapsed_time": "1 day, 9:56:53", "remaining_time": "8:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14344, "total_steps": 17941, "loss": 1.3721, "learning_rate": 9.933558145485833e-06, "epoch": 0.7995095033721643, "percentage": 79.95, "elapsed_time": "1 day, 9:57:02", "remaining_time": "8:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14345, "total_steps": 17941, "loss": 1.7802, "learning_rate": 9.928232051943953e-06, "epoch": 0.7995652416253275, "percentage": 79.96, "elapsed_time": "1 day, 9:57:10", "remaining_time": "8:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14346, "total_steps": 17941, "loss": 1.4227, "learning_rate": 9.922907229244904e-06, "epoch": 0.7996209798784906, "percentage": 79.96, "elapsed_time": "1 day, 9:57:19", "remaining_time": "8:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14347, "total_steps": 17941, "loss": 1.6922, "learning_rate": 9.917583677557574e-06, "epoch": 0.7996767181316538, "percentage": 79.97, "elapsed_time": "1 day, 9:57:28", "remaining_time": "8:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14348, "total_steps": 17941, "loss": 1.5325, "learning_rate": 9.912261397050792e-06, "epoch": 0.7997324563848169, "percentage": 79.97, "elapsed_time": "1 day, 9:57:36", "remaining_time": "8:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14349, "total_steps": 17941, "loss": 1.7558, "learning_rate": 9.906940387893354e-06, "epoch": 0.79978819463798, "percentage": 79.98, "elapsed_time": "1 day, 9:57:45", "remaining_time": "8:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14350, "total_steps": 17941, "loss": 1.3819, "learning_rate": 9.901620650254017e-06, "epoch": 0.7998439328911432, "percentage": 79.98, "elapsed_time": "1 day, 9:57:53", "remaining_time": "8:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14351, "total_steps": 17941, "loss": 1.7104, "learning_rate": 9.896302184301465e-06, "epoch": 0.7998996711443064, "percentage": 79.99, "elapsed_time": "1 day, 9:58:02", "remaining_time": "8:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14352, "total_steps": 17941, "loss": 1.7376, "learning_rate": 9.890984990204404e-06, "epoch": 0.7999554093974695, "percentage": 80.0, "elapsed_time": "1 day, 9:58:10", "remaining_time": "8:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14353, "total_steps": 17941, "loss": 2.0308, "learning_rate": 9.885669068131437e-06, "epoch": 0.8000111476506326, "percentage": 80.0, "elapsed_time": "1 day, 9:58:18", "remaining_time": "8:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14354, "total_steps": 17941, "loss": 1.4996, "learning_rate": 9.880354418251165e-06, "epoch": 0.8000668859037958, "percentage": 80.01, "elapsed_time": "1 day, 9:58:27", "remaining_time": "8:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14355, "total_steps": 17941, "loss": 1.6186, "learning_rate": 9.875041040732136e-06, "epoch": 0.8001226241569589, "percentage": 80.01, "elapsed_time": "1 day, 9:58:35", "remaining_time": "8:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14356, "total_steps": 17941, "loss": 1.4683, "learning_rate": 9.869728935742862e-06, "epoch": 0.8001783624101221, "percentage": 80.02, "elapsed_time": "1 day, 9:58:44", "remaining_time": "8:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14357, "total_steps": 17941, "loss": 1.8107, "learning_rate": 9.864418103451828e-06, "epoch": 0.8002341006632853, "percentage": 80.02, "elapsed_time": "1 day, 9:58:53", "remaining_time": "8:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14358, "total_steps": 17941, "loss": 1.6458, "learning_rate": 9.859108544027423e-06, "epoch": 0.8002898389164483, "percentage": 80.03, "elapsed_time": "1 day, 9:59:01", "remaining_time": "8:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14359, "total_steps": 17941, "loss": 1.6334, "learning_rate": 9.853800257638063e-06, "epoch": 0.8003455771696115, "percentage": 80.03, "elapsed_time": "1 day, 9:59:10", "remaining_time": "8:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14360, "total_steps": 17941, "loss": 1.6904, "learning_rate": 9.848493244452089e-06, "epoch": 0.8004013154227746, "percentage": 80.04, "elapsed_time": "1 day, 9:59:19", "remaining_time": "8:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14361, "total_steps": 17941, "loss": 1.6743, "learning_rate": 9.843187504637824e-06, "epoch": 0.8004570536759378, "percentage": 80.05, "elapsed_time": "1 day, 9:59:27", "remaining_time": "8:28:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14362, "total_steps": 17941, "loss": 1.6923, "learning_rate": 9.837883038363494e-06, "epoch": 0.800512791929101, "percentage": 80.05, "elapsed_time": "1 day, 9:59:36", "remaining_time": "8:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14363, "total_steps": 17941, "loss": 1.858, "learning_rate": 9.832579845797362e-06, "epoch": 0.800568530182264, "percentage": 80.06, "elapsed_time": "1 day, 9:59:44", "remaining_time": "8:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14364, "total_steps": 17941, "loss": 1.6314, "learning_rate": 9.82727792710762e-06, "epoch": 0.8006242684354272, "percentage": 80.06, "elapsed_time": "1 day, 9:59:53", "remaining_time": "8:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14365, "total_steps": 17941, "loss": 1.5115, "learning_rate": 9.821977282462387e-06, "epoch": 0.8006800066885904, "percentage": 80.07, "elapsed_time": "1 day, 10:00:01", "remaining_time": "8:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14366, "total_steps": 17941, "loss": 1.5325, "learning_rate": 9.81667791202978e-06, "epoch": 0.8007357449417535, "percentage": 80.07, "elapsed_time": "1 day, 10:00:10", "remaining_time": "8:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14367, "total_steps": 17941, "loss": 1.4287, "learning_rate": 9.811379815977866e-06, "epoch": 0.8007914831949167, "percentage": 80.08, "elapsed_time": "1 day, 10:00:18", "remaining_time": "8:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14368, "total_steps": 17941, "loss": 1.7301, "learning_rate": 9.80608299447468e-06, "epoch": 0.8008472214480798, "percentage": 80.08, "elapsed_time": "1 day, 10:00:27", "remaining_time": "8:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14369, "total_steps": 17941, "loss": 1.4684, "learning_rate": 9.80078744768817e-06, "epoch": 0.8009029597012429, "percentage": 80.09, "elapsed_time": "1 day, 10:00:36", "remaining_time": "8:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14370, "total_steps": 17941, "loss": 1.6985, "learning_rate": 9.795493175786318e-06, "epoch": 0.8009586979544061, "percentage": 80.1, "elapsed_time": "1 day, 10:00:44", "remaining_time": "8:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14371, "total_steps": 17941, "loss": 1.5258, "learning_rate": 9.790200178937026e-06, "epoch": 0.8010144362075693, "percentage": 80.1, "elapsed_time": "1 day, 10:00:52", "remaining_time": "8:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14372, "total_steps": 17941, "loss": 1.6424, "learning_rate": 9.784908457308128e-06, "epoch": 0.8010701744607324, "percentage": 80.11, "elapsed_time": "1 day, 10:01:01", "remaining_time": "8:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14373, "total_steps": 17941, "loss": 1.5519, "learning_rate": 9.779618011067471e-06, "epoch": 0.8011259127138955, "percentage": 80.11, "elapsed_time": "1 day, 10:01:10", "remaining_time": "8:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14374, "total_steps": 17941, "loss": 1.5504, "learning_rate": 9.774328840382824e-06, "epoch": 0.8011816509670587, "percentage": 80.12, "elapsed_time": "1 day, 10:01:18", "remaining_time": "8:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14375, "total_steps": 17941, "loss": 1.5899, "learning_rate": 9.769040945421948e-06, "epoch": 0.8012373892202218, "percentage": 80.12, "elapsed_time": "1 day, 10:01:26", "remaining_time": "8:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14376, "total_steps": 17941, "loss": 1.6959, "learning_rate": 9.76375432635252e-06, "epoch": 0.801293127473385, "percentage": 80.13, "elapsed_time": "1 day, 10:01:35", "remaining_time": "8:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14377, "total_steps": 17941, "loss": 1.6766, "learning_rate": 9.758468983342194e-06, "epoch": 0.8013488657265482, "percentage": 80.13, "elapsed_time": "1 day, 10:01:44", "remaining_time": "8:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14378, "total_steps": 17941, "loss": 1.4319, "learning_rate": 9.753184916558633e-06, "epoch": 0.8014046039797112, "percentage": 80.14, "elapsed_time": "1 day, 10:01:52", "remaining_time": "8:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14379, "total_steps": 17941, "loss": 1.8583, "learning_rate": 9.747902126169383e-06, "epoch": 0.8014603422328744, "percentage": 80.15, "elapsed_time": "1 day, 10:02:01", "remaining_time": "8:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14380, "total_steps": 17941, "loss": 1.4291, "learning_rate": 9.74262061234199e-06, "epoch": 0.8015160804860376, "percentage": 80.15, "elapsed_time": "1 day, 10:02:09", "remaining_time": "8:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14381, "total_steps": 17941, "loss": 1.6524, "learning_rate": 9.737340375243953e-06, "epoch": 0.8015718187392007, "percentage": 80.16, "elapsed_time": "1 day, 10:02:18", "remaining_time": "8:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14382, "total_steps": 17941, "loss": 1.7465, "learning_rate": 9.732061415042732e-06, "epoch": 0.8016275569923639, "percentage": 80.16, "elapsed_time": "1 day, 10:02:26", "remaining_time": "8:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14383, "total_steps": 17941, "loss": 1.6151, "learning_rate": 9.726783731905759e-06, "epoch": 0.801683295245527, "percentage": 80.17, "elapsed_time": "1 day, 10:02:35", "remaining_time": "8:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14384, "total_steps": 17941, "loss": 1.5089, "learning_rate": 9.721507326000383e-06, "epoch": 0.8017390334986901, "percentage": 80.17, "elapsed_time": "1 day, 10:02:43", "remaining_time": "8:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14385, "total_steps": 17941, "loss": 1.3962, "learning_rate": 9.716232197493957e-06, "epoch": 0.8017947717518533, "percentage": 80.18, "elapsed_time": "1 day, 10:02:51", "remaining_time": "8:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14386, "total_steps": 17941, "loss": 1.6131, "learning_rate": 9.710958346553772e-06, "epoch": 0.8018505100050164, "percentage": 80.19, "elapsed_time": "1 day, 10:03:00", "remaining_time": "8:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14387, "total_steps": 17941, "loss": 1.5955, "learning_rate": 9.705685773347101e-06, "epoch": 0.8019062482581796, "percentage": 80.19, "elapsed_time": "1 day, 10:03:09", "remaining_time": "8:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14388, "total_steps": 17941, "loss": 1.4416, "learning_rate": 9.70041447804112e-06, "epoch": 0.8019619865113428, "percentage": 80.2, "elapsed_time": "1 day, 10:03:17", "remaining_time": "8:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14389, "total_steps": 17941, "loss": 1.4565, "learning_rate": 9.69514446080304e-06, "epoch": 0.8020177247645058, "percentage": 80.2, "elapsed_time": "1 day, 10:03:26", "remaining_time": "8:24:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14390, "total_steps": 17941, "loss": 1.6088, "learning_rate": 9.689875721799995e-06, "epoch": 0.802073463017669, "percentage": 80.21, "elapsed_time": "1 day, 10:03:34", "remaining_time": "8:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14391, "total_steps": 17941, "loss": 1.6619, "learning_rate": 9.684608261199058e-06, "epoch": 0.8021292012708322, "percentage": 80.21, "elapsed_time": "1 day, 10:03:43", "remaining_time": "8:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14392, "total_steps": 17941, "loss": 1.884, "learning_rate": 9.679342079167291e-06, "epoch": 0.8021849395239953, "percentage": 80.22, "elapsed_time": "1 day, 10:03:51", "remaining_time": "8:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14393, "total_steps": 17941, "loss": 1.6299, "learning_rate": 9.674077175871709e-06, "epoch": 0.8022406777771585, "percentage": 80.22, "elapsed_time": "1 day, 10:04:00", "remaining_time": "8:23:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14394, "total_steps": 17941, "loss": 1.5954, "learning_rate": 9.668813551479295e-06, "epoch": 0.8022964160303216, "percentage": 80.23, "elapsed_time": "1 day, 10:04:08", "remaining_time": "8:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14395, "total_steps": 17941, "loss": 1.6079, "learning_rate": 9.66355120615694e-06, "epoch": 0.8023521542834847, "percentage": 80.24, "elapsed_time": "1 day, 10:04:17", "remaining_time": "8:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14396, "total_steps": 17941, "loss": 1.5324, "learning_rate": 9.65829014007158e-06, "epoch": 0.8024078925366479, "percentage": 80.24, "elapsed_time": "1 day, 10:04:26", "remaining_time": "8:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14397, "total_steps": 17941, "loss": 1.919, "learning_rate": 9.653030353390058e-06, "epoch": 0.8024636307898111, "percentage": 80.25, "elapsed_time": "1 day, 10:04:34", "remaining_time": "8:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14398, "total_steps": 17941, "loss": 1.5565, "learning_rate": 9.647771846279162e-06, "epoch": 0.8025193690429742, "percentage": 80.25, "elapsed_time": "1 day, 10:04:44", "remaining_time": "8:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14399, "total_steps": 17941, "loss": 1.429, "learning_rate": 9.642514618905673e-06, "epoch": 0.8025751072961373, "percentage": 80.26, "elapsed_time": "1 day, 10:04:52", "remaining_time": "8:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14400, "total_steps": 17941, "loss": 1.6777, "learning_rate": 9.637258671436317e-06, "epoch": 0.8026308455493005, "percentage": 80.26, "elapsed_time": "1 day, 10:05:01", "remaining_time": "8:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14401, "total_steps": 17941, "loss": 1.4368, "learning_rate": 9.632004004037804e-06, "epoch": 0.8026865838024636, "percentage": 80.27, "elapsed_time": "1 day, 10:05:09", "remaining_time": "8:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14402, "total_steps": 17941, "loss": 1.4163, "learning_rate": 9.626750616876745e-06, "epoch": 0.8027423220556268, "percentage": 80.27, "elapsed_time": "1 day, 10:05:18", "remaining_time": "8:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14403, "total_steps": 17941, "loss": 1.5634, "learning_rate": 9.621498510119754e-06, "epoch": 0.80279806030879, "percentage": 80.28, "elapsed_time": "1 day, 10:05:26", "remaining_time": "8:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14404, "total_steps": 17941, "loss": 1.4767, "learning_rate": 9.616247683933428e-06, "epoch": 0.802853798561953, "percentage": 80.29, "elapsed_time": "1 day, 10:05:35", "remaining_time": "8:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14405, "total_steps": 17941, "loss": 1.753, "learning_rate": 9.610998138484262e-06, "epoch": 0.8029095368151162, "percentage": 80.29, "elapsed_time": "1 day, 10:05:43", "remaining_time": "8:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14406, "total_steps": 17941, "loss": 1.6291, "learning_rate": 9.605749873938752e-06, "epoch": 0.8029652750682793, "percentage": 80.3, "elapsed_time": "1 day, 10:05:52", "remaining_time": "8:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14407, "total_steps": 17941, "loss": 1.658, "learning_rate": 9.600502890463341e-06, "epoch": 0.8030210133214425, "percentage": 80.3, "elapsed_time": "1 day, 10:06:00", "remaining_time": "8:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14408, "total_steps": 17941, "loss": 1.8136, "learning_rate": 9.595257188224433e-06, "epoch": 0.8030767515746057, "percentage": 80.31, "elapsed_time": "1 day, 10:06:09", "remaining_time": "8:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14409, "total_steps": 17941, "loss": 1.3871, "learning_rate": 9.590012767388402e-06, "epoch": 0.8031324898277687, "percentage": 80.31, "elapsed_time": "1 day, 10:06:17", "remaining_time": "8:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14410, "total_steps": 17941, "loss": 1.4633, "learning_rate": 9.584769628121548e-06, "epoch": 0.8031882280809319, "percentage": 80.32, "elapsed_time": "1 day, 10:06:26", "remaining_time": "8:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14411, "total_steps": 17941, "loss": 1.7256, "learning_rate": 9.579527770590163e-06, "epoch": 0.8032439663340951, "percentage": 80.32, "elapsed_time": "1 day, 10:06:34", "remaining_time": "8:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14412, "total_steps": 17941, "loss": 1.5641, "learning_rate": 9.574287194960491e-06, "epoch": 0.8032997045872582, "percentage": 80.33, "elapsed_time": "1 day, 10:06:43", "remaining_time": "8:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14413, "total_steps": 17941, "loss": 1.5298, "learning_rate": 9.569047901398742e-06, "epoch": 0.8033554428404214, "percentage": 80.34, "elapsed_time": "1 day, 10:06:51", "remaining_time": "8:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14414, "total_steps": 17941, "loss": 1.5445, "learning_rate": 9.56380989007104e-06, "epoch": 0.8034111810935846, "percentage": 80.34, "elapsed_time": "1 day, 10:06:59", "remaining_time": "8:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14415, "total_steps": 17941, "loss": 1.7519, "learning_rate": 9.558573161143542e-06, "epoch": 0.8034669193467476, "percentage": 80.35, "elapsed_time": "1 day, 10:07:08", "remaining_time": "8:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14416, "total_steps": 17941, "loss": 1.7039, "learning_rate": 9.553337714782324e-06, "epoch": 0.8035226575999108, "percentage": 80.35, "elapsed_time": "1 day, 10:07:16", "remaining_time": "8:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14417, "total_steps": 17941, "loss": 1.6528, "learning_rate": 9.548103551153403e-06, "epoch": 0.803578395853074, "percentage": 80.36, "elapsed_time": "1 day, 10:07:25", "remaining_time": "8:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14418, "total_steps": 17941, "loss": 1.6934, "learning_rate": 9.542870670422787e-06, "epoch": 0.8036341341062371, "percentage": 80.36, "elapsed_time": "1 day, 10:07:33", "remaining_time": "8:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14419, "total_steps": 17941, "loss": 1.5557, "learning_rate": 9.537639072756432e-06, "epoch": 0.8036898723594003, "percentage": 80.37, "elapsed_time": "1 day, 10:07:42", "remaining_time": "8:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14420, "total_steps": 17941, "loss": 1.5267, "learning_rate": 9.532408758320267e-06, "epoch": 0.8037456106125634, "percentage": 80.37, "elapsed_time": "1 day, 10:07:51", "remaining_time": "8:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14421, "total_steps": 17941, "loss": 1.8426, "learning_rate": 9.527179727280122e-06, "epoch": 0.8038013488657265, "percentage": 80.38, "elapsed_time": "1 day, 10:07:59", "remaining_time": "8:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14422, "total_steps": 17941, "loss": 1.8076, "learning_rate": 9.52195197980188e-06, "epoch": 0.8038570871188897, "percentage": 80.39, "elapsed_time": "1 day, 10:08:08", "remaining_time": "8:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14423, "total_steps": 17941, "loss": 1.6287, "learning_rate": 9.516725516051333e-06, "epoch": 0.8039128253720529, "percentage": 80.39, "elapsed_time": "1 day, 10:08:16", "remaining_time": "8:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14424, "total_steps": 17941, "loss": 1.6721, "learning_rate": 9.5115003361942e-06, "epoch": 0.803968563625216, "percentage": 80.4, "elapsed_time": "1 day, 10:08:25", "remaining_time": "8:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14425, "total_steps": 17941, "loss": 1.6215, "learning_rate": 9.506276440396223e-06, "epoch": 0.8040243018783791, "percentage": 80.4, "elapsed_time": "1 day, 10:08:33", "remaining_time": "8:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14426, "total_steps": 17941, "loss": 1.7268, "learning_rate": 9.501053828823053e-06, "epoch": 0.8040800401315423, "percentage": 80.41, "elapsed_time": "1 day, 10:08:42", "remaining_time": "8:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14427, "total_steps": 17941, "loss": 1.7804, "learning_rate": 9.495832501640344e-06, "epoch": 0.8041357783847054, "percentage": 80.41, "elapsed_time": "1 day, 10:08:50", "remaining_time": "8:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14428, "total_steps": 17941, "loss": 1.6868, "learning_rate": 9.490612459013664e-06, "epoch": 0.8041915166378686, "percentage": 80.42, "elapsed_time": "1 day, 10:08:59", "remaining_time": "8:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14429, "total_steps": 17941, "loss": 1.4381, "learning_rate": 9.485393701108552e-06, "epoch": 0.8042472548910317, "percentage": 80.42, "elapsed_time": "1 day, 10:09:07", "remaining_time": "8:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14430, "total_steps": 17941, "loss": 1.6462, "learning_rate": 9.480176228090566e-06, "epoch": 0.8043029931441948, "percentage": 80.43, "elapsed_time": "1 day, 10:09:16", "remaining_time": "8:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14431, "total_steps": 17941, "loss": 1.6948, "learning_rate": 9.47496004012513e-06, "epoch": 0.804358731397358, "percentage": 80.44, "elapsed_time": "1 day, 10:09:24", "remaining_time": "8:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14432, "total_steps": 17941, "loss": 1.5765, "learning_rate": 9.469745137377678e-06, "epoch": 0.8044144696505211, "percentage": 80.44, "elapsed_time": "1 day, 10:09:33", "remaining_time": "8:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14433, "total_steps": 17941, "loss": 1.463, "learning_rate": 9.464531520013608e-06, "epoch": 0.8044702079036843, "percentage": 80.45, "elapsed_time": "1 day, 10:09:42", "remaining_time": "8:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14434, "total_steps": 17941, "loss": 1.4668, "learning_rate": 9.459319188198262e-06, "epoch": 0.8045259461568475, "percentage": 80.45, "elapsed_time": "1 day, 10:09:50", "remaining_time": "8:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14435, "total_steps": 17941, "loss": 1.7968, "learning_rate": 9.454108142096951e-06, "epoch": 0.8045816844100105, "percentage": 80.46, "elapsed_time": "1 day, 10:09:59", "remaining_time": "8:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14436, "total_steps": 17941, "loss": 1.5935, "learning_rate": 9.448898381874904e-06, "epoch": 0.8046374226631737, "percentage": 80.46, "elapsed_time": "1 day, 10:10:07", "remaining_time": "8:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14437, "total_steps": 17941, "loss": 1.8367, "learning_rate": 9.4436899076974e-06, "epoch": 0.8046931609163369, "percentage": 80.47, "elapsed_time": "1 day, 10:10:16", "remaining_time": "8:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14438, "total_steps": 17941, "loss": 1.726, "learning_rate": 9.438482719729579e-06, "epoch": 0.8047488991695, "percentage": 80.47, "elapsed_time": "1 day, 10:10:25", "remaining_time": "8:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14439, "total_steps": 17941, "loss": 1.7836, "learning_rate": 9.43327681813661e-06, "epoch": 0.8048046374226632, "percentage": 80.48, "elapsed_time": "1 day, 10:10:33", "remaining_time": "8:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14440, "total_steps": 17941, "loss": 1.7362, "learning_rate": 9.428072203083554e-06, "epoch": 0.8048603756758264, "percentage": 80.49, "elapsed_time": "1 day, 10:10:42", "remaining_time": "8:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14441, "total_steps": 17941, "loss": 1.8533, "learning_rate": 9.422868874735507e-06, "epoch": 0.8049161139289894, "percentage": 80.49, "elapsed_time": "1 day, 10:10:50", "remaining_time": "8:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14442, "total_steps": 17941, "loss": 1.5445, "learning_rate": 9.417666833257493e-06, "epoch": 0.8049718521821526, "percentage": 80.5, "elapsed_time": "1 day, 10:10:59", "remaining_time": "8:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14443, "total_steps": 17941, "loss": 1.7809, "learning_rate": 9.412466078814463e-06, "epoch": 0.8050275904353158, "percentage": 80.5, "elapsed_time": "1 day, 10:11:07", "remaining_time": "8:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14444, "total_steps": 17941, "loss": 1.547, "learning_rate": 9.407266611571368e-06, "epoch": 0.8050833286884789, "percentage": 80.51, "elapsed_time": "1 day, 10:11:16", "remaining_time": "8:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14445, "total_steps": 17941, "loss": 1.5924, "learning_rate": 9.402068431693101e-06, "epoch": 0.8051390669416421, "percentage": 80.51, "elapsed_time": "1 day, 10:11:24", "remaining_time": "8:16:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14446, "total_steps": 17941, "loss": 1.5457, "learning_rate": 9.396871539344537e-06, "epoch": 0.8051948051948052, "percentage": 80.52, "elapsed_time": "1 day, 10:11:33", "remaining_time": "8:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14447, "total_steps": 17941, "loss": 1.3105, "learning_rate": 9.391675934690447e-06, "epoch": 0.8052505434479683, "percentage": 80.53, "elapsed_time": "1 day, 10:11:41", "remaining_time": "8:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14448, "total_steps": 17941, "loss": 1.9536, "learning_rate": 9.386481617895648e-06, "epoch": 0.8053062817011315, "percentage": 80.53, "elapsed_time": "1 day, 10:11:50", "remaining_time": "8:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14449, "total_steps": 17941, "loss": 1.5554, "learning_rate": 9.381288589124876e-06, "epoch": 0.8053620199542947, "percentage": 80.54, "elapsed_time": "1 day, 10:11:58", "remaining_time": "8:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14450, "total_steps": 17941, "loss": 1.3512, "learning_rate": 9.376096848542788e-06, "epoch": 0.8054177582074578, "percentage": 80.54, "elapsed_time": "1 day, 10:12:07", "remaining_time": "8:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14451, "total_steps": 17941, "loss": 1.5164, "learning_rate": 9.370906396314055e-06, "epoch": 0.8054734964606209, "percentage": 80.55, "elapsed_time": "1 day, 10:12:15", "remaining_time": "8:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14452, "total_steps": 17941, "loss": 1.4119, "learning_rate": 9.365717232603283e-06, "epoch": 0.805529234713784, "percentage": 80.55, "elapsed_time": "1 day, 10:12:24", "remaining_time": "8:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14453, "total_steps": 17941, "loss": 1.5208, "learning_rate": 9.360529357575066e-06, "epoch": 0.8055849729669472, "percentage": 80.56, "elapsed_time": "1 day, 10:12:32", "remaining_time": "8:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14454, "total_steps": 17941, "loss": 1.5729, "learning_rate": 9.3553427713939e-06, "epoch": 0.8056407112201104, "percentage": 80.56, "elapsed_time": "1 day, 10:12:41", "remaining_time": "8:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14455, "total_steps": 17941, "loss": 1.615, "learning_rate": 9.350157474224268e-06, "epoch": 0.8056964494732735, "percentage": 80.57, "elapsed_time": "1 day, 10:12:49", "remaining_time": "8:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14456, "total_steps": 17941, "loss": 1.5061, "learning_rate": 9.344973466230667e-06, "epoch": 0.8057521877264366, "percentage": 80.58, "elapsed_time": "1 day, 10:12:58", "remaining_time": "8:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14457, "total_steps": 17941, "loss": 1.2955, "learning_rate": 9.339790747577453e-06, "epoch": 0.8058079259795998, "percentage": 80.58, "elapsed_time": "1 day, 10:13:06", "remaining_time": "8:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14458, "total_steps": 17941, "loss": 1.6353, "learning_rate": 9.334609318429016e-06, "epoch": 0.8058636642327629, "percentage": 80.59, "elapsed_time": "1 day, 10:13:15", "remaining_time": "8:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14459, "total_steps": 17941, "loss": 1.7109, "learning_rate": 9.329429178949678e-06, "epoch": 0.8059194024859261, "percentage": 80.59, "elapsed_time": "1 day, 10:13:24", "remaining_time": "8:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14460, "total_steps": 17941, "loss": 1.4907, "learning_rate": 9.324250329303713e-06, "epoch": 0.8059751407390893, "percentage": 80.6, "elapsed_time": "1 day, 10:13:33", "remaining_time": "8:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14461, "total_steps": 17941, "loss": 1.6438, "learning_rate": 9.31907276965539e-06, "epoch": 0.8060308789922523, "percentage": 80.6, "elapsed_time": "1 day, 10:13:41", "remaining_time": "8:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14462, "total_steps": 17941, "loss": 1.6177, "learning_rate": 9.313896500168867e-06, "epoch": 0.8060866172454155, "percentage": 80.61, "elapsed_time": "1 day, 10:13:50", "remaining_time": "8:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14463, "total_steps": 17941, "loss": 1.7162, "learning_rate": 9.308721521008357e-06, "epoch": 0.8061423554985787, "percentage": 80.61, "elapsed_time": "1 day, 10:13:58", "remaining_time": "8:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14464, "total_steps": 17941, "loss": 1.8492, "learning_rate": 9.303547832337934e-06, "epoch": 0.8061980937517418, "percentage": 80.62, "elapsed_time": "1 day, 10:14:06", "remaining_time": "8:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14465, "total_steps": 17941, "loss": 1.7473, "learning_rate": 9.298375434321716e-06, "epoch": 0.806253832004905, "percentage": 80.63, "elapsed_time": "1 day, 10:14:15", "remaining_time": "8:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14466, "total_steps": 17941, "loss": 1.5024, "learning_rate": 9.293204327123694e-06, "epoch": 0.8063095702580682, "percentage": 80.63, "elapsed_time": "1 day, 10:14:24", "remaining_time": "8:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14467, "total_steps": 17941, "loss": 1.6197, "learning_rate": 9.288034510907912e-06, "epoch": 0.8063653085112312, "percentage": 80.64, "elapsed_time": "1 day, 10:14:32", "remaining_time": "8:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14468, "total_steps": 17941, "loss": 1.7008, "learning_rate": 9.282865985838313e-06, "epoch": 0.8064210467643944, "percentage": 80.64, "elapsed_time": "1 day, 10:14:40", "remaining_time": "8:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14469, "total_steps": 17941, "loss": 1.8471, "learning_rate": 9.277698752078801e-06, "epoch": 0.8064767850175576, "percentage": 80.65, "elapsed_time": "1 day, 10:14:49", "remaining_time": "8:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14470, "total_steps": 17941, "loss": 1.5663, "learning_rate": 9.272532809793254e-06, "epoch": 0.8065325232707207, "percentage": 80.65, "elapsed_time": "1 day, 10:14:57", "remaining_time": "8:12:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14471, "total_steps": 17941, "loss": 1.4549, "learning_rate": 9.267368159145506e-06, "epoch": 0.8065882615238839, "percentage": 80.66, "elapsed_time": "1 day, 10:15:06", "remaining_time": "8:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14472, "total_steps": 17941, "loss": 1.4818, "learning_rate": 9.262204800299373e-06, "epoch": 0.806643999777047, "percentage": 80.66, "elapsed_time": "1 day, 10:15:14", "remaining_time": "8:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14473, "total_steps": 17941, "loss": 1.5863, "learning_rate": 9.257042733418552e-06, "epoch": 0.8066997380302101, "percentage": 80.67, "elapsed_time": "1 day, 10:15:23", "remaining_time": "8:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14474, "total_steps": 17941, "loss": 1.461, "learning_rate": 9.251881958666802e-06, "epoch": 0.8067554762833733, "percentage": 80.68, "elapsed_time": "1 day, 10:15:31", "remaining_time": "8:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14475, "total_steps": 17941, "loss": 1.4981, "learning_rate": 9.246722476207797e-06, "epoch": 0.8068112145365364, "percentage": 80.68, "elapsed_time": "1 day, 10:15:40", "remaining_time": "8:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14476, "total_steps": 17941, "loss": 1.6121, "learning_rate": 9.24156428620513e-06, "epoch": 0.8068669527896996, "percentage": 80.69, "elapsed_time": "1 day, 10:15:48", "remaining_time": "8:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14477, "total_steps": 17941, "loss": 1.5065, "learning_rate": 9.236407388822405e-06, "epoch": 0.8069226910428627, "percentage": 80.69, "elapsed_time": "1 day, 10:15:57", "remaining_time": "8:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14478, "total_steps": 17941, "loss": 1.47, "learning_rate": 9.23125178422317e-06, "epoch": 0.8069784292960258, "percentage": 80.7, "elapsed_time": "1 day, 10:16:06", "remaining_time": "8:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14479, "total_steps": 17941, "loss": 1.4377, "learning_rate": 9.226097472570943e-06, "epoch": 0.807034167549189, "percentage": 80.7, "elapsed_time": "1 day, 10:16:14", "remaining_time": "8:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14480, "total_steps": 17941, "loss": 1.6211, "learning_rate": 9.220944454029162e-06, "epoch": 0.8070899058023522, "percentage": 80.71, "elapsed_time": "1 day, 10:16:23", "remaining_time": "8:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14481, "total_steps": 17941, "loss": 1.5581, "learning_rate": 9.215792728761253e-06, "epoch": 0.8071456440555153, "percentage": 80.71, "elapsed_time": "1 day, 10:16:32", "remaining_time": "8:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14482, "total_steps": 17941, "loss": 1.5311, "learning_rate": 9.210642296930638e-06, "epoch": 0.8072013823086784, "percentage": 80.72, "elapsed_time": "1 day, 10:16:40", "remaining_time": "8:11:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14483, "total_steps": 17941, "loss": 1.6832, "learning_rate": 9.205493158700618e-06, "epoch": 0.8072571205618416, "percentage": 80.73, "elapsed_time": "1 day, 10:16:49", "remaining_time": "8:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14484, "total_steps": 17941, "loss": 1.5659, "learning_rate": 9.200345314234504e-06, "epoch": 0.8073128588150047, "percentage": 80.73, "elapsed_time": "1 day, 10:16:57", "remaining_time": "8:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14485, "total_steps": 17941, "loss": 1.5639, "learning_rate": 9.195198763695557e-06, "epoch": 0.8073685970681679, "percentage": 80.74, "elapsed_time": "1 day, 10:17:06", "remaining_time": "8:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14486, "total_steps": 17941, "loss": 1.7787, "learning_rate": 9.190053507246999e-06, "epoch": 0.8074243353213311, "percentage": 80.74, "elapsed_time": "1 day, 10:17:14", "remaining_time": "8:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14487, "total_steps": 17941, "loss": 1.5598, "learning_rate": 9.184909545052017e-06, "epoch": 0.8074800735744941, "percentage": 80.75, "elapsed_time": "1 day, 10:17:23", "remaining_time": "8:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14488, "total_steps": 17941, "loss": 1.5103, "learning_rate": 9.17976687727371e-06, "epoch": 0.8075358118276573, "percentage": 80.75, "elapsed_time": "1 day, 10:17:31", "remaining_time": "8:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14489, "total_steps": 17941, "loss": 1.7456, "learning_rate": 9.174625504075225e-06, "epoch": 0.8075915500808205, "percentage": 80.76, "elapsed_time": "1 day, 10:17:40", "remaining_time": "8:10:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14490, "total_steps": 17941, "loss": 1.7104, "learning_rate": 9.169485425619578e-06, "epoch": 0.8076472883339836, "percentage": 80.76, "elapsed_time": "1 day, 10:17:49", "remaining_time": "8:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14491, "total_steps": 17941, "loss": 1.814, "learning_rate": 9.164346642069804e-06, "epoch": 0.8077030265871468, "percentage": 80.77, "elapsed_time": "1 day, 10:17:57", "remaining_time": "8:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14492, "total_steps": 17941, "loss": 1.6125, "learning_rate": 9.159209153588849e-06, "epoch": 0.80775876484031, "percentage": 80.78, "elapsed_time": "1 day, 10:18:05", "remaining_time": "8:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14493, "total_steps": 17941, "loss": 1.627, "learning_rate": 9.154072960339666e-06, "epoch": 0.807814503093473, "percentage": 80.78, "elapsed_time": "1 day, 10:18:14", "remaining_time": "8:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14494, "total_steps": 17941, "loss": 1.5063, "learning_rate": 9.148938062485157e-06, "epoch": 0.8078702413466362, "percentage": 80.79, "elapsed_time": "1 day, 10:18:22", "remaining_time": "8:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14495, "total_steps": 17941, "loss": 1.6385, "learning_rate": 9.143804460188143e-06, "epoch": 0.8079259795997994, "percentage": 80.79, "elapsed_time": "1 day, 10:18:31", "remaining_time": "8:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14496, "total_steps": 17941, "loss": 1.6554, "learning_rate": 9.138672153611439e-06, "epoch": 0.8079817178529625, "percentage": 80.8, "elapsed_time": "1 day, 10:18:39", "remaining_time": "8:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14497, "total_steps": 17941, "loss": 1.7165, "learning_rate": 9.133541142917823e-06, "epoch": 0.8080374561061257, "percentage": 80.8, "elapsed_time": "1 day, 10:18:48", "remaining_time": "8:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14498, "total_steps": 17941, "loss": 2.0642, "learning_rate": 9.128411428270018e-06, "epoch": 0.8080931943592887, "percentage": 80.81, "elapsed_time": "1 day, 10:18:56", "remaining_time": "8:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14499, "total_steps": 17941, "loss": 1.6783, "learning_rate": 9.123283009830686e-06, "epoch": 0.8081489326124519, "percentage": 80.81, "elapsed_time": "1 day, 10:19:05", "remaining_time": "8:08:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14500, "total_steps": 17941, "loss": 1.6466, "learning_rate": 9.118155887762496e-06, "epoch": 0.8082046708656151, "percentage": 80.82, "elapsed_time": "1 day, 10:19:13", "remaining_time": "8:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14501, "total_steps": 17941, "loss": 1.4418, "learning_rate": 9.113030062228063e-06, "epoch": 0.8082604091187782, "percentage": 80.83, "elapsed_time": "1 day, 10:19:22", "remaining_time": "8:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14502, "total_steps": 17941, "loss": 1.4944, "learning_rate": 9.107905533389915e-06, "epoch": 0.8083161473719414, "percentage": 80.83, "elapsed_time": "1 day, 10:19:31", "remaining_time": "8:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14503, "total_steps": 17941, "loss": 1.6503, "learning_rate": 9.102782301410584e-06, "epoch": 0.8083718856251045, "percentage": 80.84, "elapsed_time": "1 day, 10:19:39", "remaining_time": "8:08:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14504, "total_steps": 17941, "loss": 1.7528, "learning_rate": 9.097660366452548e-06, "epoch": 0.8084276238782676, "percentage": 80.84, "elapsed_time": "1 day, 10:19:48", "remaining_time": "8:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14505, "total_steps": 17941, "loss": 1.7108, "learning_rate": 9.092539728678262e-06, "epoch": 0.8084833621314308, "percentage": 80.85, "elapsed_time": "1 day, 10:19:57", "remaining_time": "8:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14506, "total_steps": 17941, "loss": 1.5113, "learning_rate": 9.087420388250101e-06, "epoch": 0.808539100384594, "percentage": 80.85, "elapsed_time": "1 day, 10:20:05", "remaining_time": "8:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14507, "total_steps": 17941, "loss": 1.9957, "learning_rate": 9.082302345330413e-06, "epoch": 0.808594838637757, "percentage": 80.86, "elapsed_time": "1 day, 10:20:14", "remaining_time": "8:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14508, "total_steps": 17941, "loss": 1.4357, "learning_rate": 9.077185600081551e-06, "epoch": 0.8086505768909202, "percentage": 80.87, "elapsed_time": "1 day, 10:20:23", "remaining_time": "8:07:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14509, "total_steps": 17941, "loss": 1.7057, "learning_rate": 9.072070152665758e-06, "epoch": 0.8087063151440834, "percentage": 80.87, "elapsed_time": "1 day, 10:20:31", "remaining_time": "8:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14510, "total_steps": 17941, "loss": 1.737, "learning_rate": 9.066956003245264e-06, "epoch": 0.8087620533972465, "percentage": 80.88, "elapsed_time": "1 day, 10:20:39", "remaining_time": "8:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14511, "total_steps": 17941, "loss": 1.5738, "learning_rate": 9.06184315198228e-06, "epoch": 0.8088177916504097, "percentage": 80.88, "elapsed_time": "1 day, 10:20:48", "remaining_time": "8:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14512, "total_steps": 17941, "loss": 1.4052, "learning_rate": 9.056731599038948e-06, "epoch": 0.8088735299035729, "percentage": 80.89, "elapsed_time": "1 day, 10:20:56", "remaining_time": "8:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14513, "total_steps": 17941, "loss": 1.9542, "learning_rate": 9.051621344577371e-06, "epoch": 0.8089292681567359, "percentage": 80.89, "elapsed_time": "1 day, 10:21:05", "remaining_time": "8:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14514, "total_steps": 17941, "loss": 1.6902, "learning_rate": 9.046512388759598e-06, "epoch": 0.8089850064098991, "percentage": 80.9, "elapsed_time": "1 day, 10:21:13", "remaining_time": "8:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14515, "total_steps": 17941, "loss": 1.7517, "learning_rate": 9.041404731747705e-06, "epoch": 0.8090407446630623, "percentage": 80.9, "elapsed_time": "1 day, 10:21:22", "remaining_time": "8:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14516, "total_steps": 17941, "loss": 1.7549, "learning_rate": 9.036298373703638e-06, "epoch": 0.8090964829162254, "percentage": 80.91, "elapsed_time": "1 day, 10:21:30", "remaining_time": "8:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14517, "total_steps": 17941, "loss": 1.596, "learning_rate": 9.03119331478935e-06, "epoch": 0.8091522211693886, "percentage": 80.92, "elapsed_time": "1 day, 10:21:38", "remaining_time": "8:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14518, "total_steps": 17941, "loss": 1.5824, "learning_rate": 9.026089555166745e-06, "epoch": 0.8092079594225517, "percentage": 80.92, "elapsed_time": "1 day, 10:21:47", "remaining_time": "8:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14519, "total_steps": 17941, "loss": 1.5729, "learning_rate": 9.020987094997691e-06, "epoch": 0.8092636976757148, "percentage": 80.93, "elapsed_time": "1 day, 10:21:55", "remaining_time": "8:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14520, "total_steps": 17941, "loss": 1.7344, "learning_rate": 9.015885934444007e-06, "epoch": 0.809319435928878, "percentage": 80.93, "elapsed_time": "1 day, 10:22:04", "remaining_time": "8:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14521, "total_steps": 17941, "loss": 1.6726, "learning_rate": 9.010786073667455e-06, "epoch": 0.8093751741820411, "percentage": 80.94, "elapsed_time": "1 day, 10:22:12", "remaining_time": "8:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14522, "total_steps": 17941, "loss": 1.7196, "learning_rate": 9.005687512829786e-06, "epoch": 0.8094309124352043, "percentage": 80.94, "elapsed_time": "1 day, 10:22:21", "remaining_time": "8:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14523, "total_steps": 17941, "loss": 1.6435, "learning_rate": 9.0005902520927e-06, "epoch": 0.8094866506883674, "percentage": 80.95, "elapsed_time": "1 day, 10:22:29", "remaining_time": "8:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14524, "total_steps": 17941, "loss": 1.7616, "learning_rate": 8.995494291617856e-06, "epoch": 0.8095423889415305, "percentage": 80.95, "elapsed_time": "1 day, 10:22:38", "remaining_time": "8:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14525, "total_steps": 17941, "loss": 1.6495, "learning_rate": 8.990399631566837e-06, "epoch": 0.8095981271946937, "percentage": 80.96, "elapsed_time": "1 day, 10:22:46", "remaining_time": "8:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14526, "total_steps": 17941, "loss": 1.6081, "learning_rate": 8.985306272101252e-06, "epoch": 0.8096538654478569, "percentage": 80.97, "elapsed_time": "1 day, 10:22:54", "remaining_time": "8:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14527, "total_steps": 17941, "loss": 1.4755, "learning_rate": 8.980214213382632e-06, "epoch": 0.80970960370102, "percentage": 80.97, "elapsed_time": "1 day, 10:23:03", "remaining_time": "8:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14528, "total_steps": 17941, "loss": 1.5668, "learning_rate": 8.975123455572443e-06, "epoch": 0.8097653419541831, "percentage": 80.98, "elapsed_time": "1 day, 10:23:11", "remaining_time": "8:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14529, "total_steps": 17941, "loss": 1.2416, "learning_rate": 8.970033998832145e-06, "epoch": 0.8098210802073463, "percentage": 80.98, "elapsed_time": "1 day, 10:23:20", "remaining_time": "8:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14530, "total_steps": 17941, "loss": 1.8587, "learning_rate": 8.964945843323147e-06, "epoch": 0.8098768184605094, "percentage": 80.99, "elapsed_time": "1 day, 10:23:28", "remaining_time": "8:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14531, "total_steps": 17941, "loss": 1.6583, "learning_rate": 8.959858989206827e-06, "epoch": 0.8099325567136726, "percentage": 80.99, "elapsed_time": "1 day, 10:23:37", "remaining_time": "8:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14532, "total_steps": 17941, "loss": 1.6193, "learning_rate": 8.954773436644492e-06, "epoch": 0.8099882949668358, "percentage": 81.0, "elapsed_time": "1 day, 10:23:45", "remaining_time": "8:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14533, "total_steps": 17941, "loss": 1.7473, "learning_rate": 8.949689185797416e-06, "epoch": 0.8100440332199988, "percentage": 81.0, "elapsed_time": "1 day, 10:23:54", "remaining_time": "8:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14534, "total_steps": 17941, "loss": 1.6444, "learning_rate": 8.944606236826885e-06, "epoch": 0.810099771473162, "percentage": 81.01, "elapsed_time": "1 day, 10:24:02", "remaining_time": "8:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14535, "total_steps": 17941, "loss": 1.7083, "learning_rate": 8.939524589894067e-06, "epoch": 0.8101555097263252, "percentage": 81.02, "elapsed_time": "1 day, 10:24:11", "remaining_time": "8:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14536, "total_steps": 17941, "loss": 1.6985, "learning_rate": 8.934444245160123e-06, "epoch": 0.8102112479794883, "percentage": 81.02, "elapsed_time": "1 day, 10:24:20", "remaining_time": "8:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14537, "total_steps": 17941, "loss": 1.487, "learning_rate": 8.929365202786183e-06, "epoch": 0.8102669862326515, "percentage": 81.03, "elapsed_time": "1 day, 10:24:28", "remaining_time": "8:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14538, "total_steps": 17941, "loss": 1.4259, "learning_rate": 8.924287462933328e-06, "epoch": 0.8103227244858147, "percentage": 81.03, "elapsed_time": "1 day, 10:24:37", "remaining_time": "8:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14539, "total_steps": 17941, "loss": 1.4425, "learning_rate": 8.919211025762581e-06, "epoch": 0.8103784627389777, "percentage": 81.04, "elapsed_time": "1 day, 10:24:45", "remaining_time": "8:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14540, "total_steps": 17941, "loss": 1.467, "learning_rate": 8.914135891434927e-06, "epoch": 0.8104342009921409, "percentage": 81.04, "elapsed_time": "1 day, 10:24:54", "remaining_time": "8:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14541, "total_steps": 17941, "loss": 1.6551, "learning_rate": 8.909062060111357e-06, "epoch": 0.8104899392453041, "percentage": 81.05, "elapsed_time": "1 day, 10:25:02", "remaining_time": "8:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14542, "total_steps": 17941, "loss": 1.6874, "learning_rate": 8.903989531952755e-06, "epoch": 0.8105456774984672, "percentage": 81.05, "elapsed_time": "1 day, 10:25:10", "remaining_time": "8:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14543, "total_steps": 17941, "loss": 1.5656, "learning_rate": 8.89891830711999e-06, "epoch": 0.8106014157516304, "percentage": 81.06, "elapsed_time": "1 day, 10:25:19", "remaining_time": "8:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14544, "total_steps": 17941, "loss": 1.6318, "learning_rate": 8.893848385773911e-06, "epoch": 0.8106571540047934, "percentage": 81.07, "elapsed_time": "1 day, 10:25:28", "remaining_time": "8:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14545, "total_steps": 17941, "loss": 1.7456, "learning_rate": 8.88877976807529e-06, "epoch": 0.8107128922579566, "percentage": 81.07, "elapsed_time": "1 day, 10:25:36", "remaining_time": "8:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14546, "total_steps": 17941, "loss": 1.7037, "learning_rate": 8.883712454184894e-06, "epoch": 0.8107686305111198, "percentage": 81.08, "elapsed_time": "1 day, 10:25:45", "remaining_time": "8:02:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14547, "total_steps": 17941, "loss": 1.6516, "learning_rate": 8.8786464442634e-06, "epoch": 0.8108243687642829, "percentage": 81.08, "elapsed_time": "1 day, 10:25:54", "remaining_time": "8:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14548, "total_steps": 17941, "loss": 1.8242, "learning_rate": 8.873581738471486e-06, "epoch": 0.8108801070174461, "percentage": 81.09, "elapsed_time": "1 day, 10:26:03", "remaining_time": "8:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14549, "total_steps": 17941, "loss": 1.6742, "learning_rate": 8.868518336969779e-06, "epoch": 0.8109358452706092, "percentage": 81.09, "elapsed_time": "1 day, 10:26:11", "remaining_time": "8:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14550, "total_steps": 17941, "loss": 1.7067, "learning_rate": 8.863456239918866e-06, "epoch": 0.8109915835237723, "percentage": 81.1, "elapsed_time": "1 day, 10:26:19", "remaining_time": "8:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14551, "total_steps": 17941, "loss": 1.5587, "learning_rate": 8.858395447479257e-06, "epoch": 0.8110473217769355, "percentage": 81.1, "elapsed_time": "1 day, 10:26:28", "remaining_time": "8:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14552, "total_steps": 17941, "loss": 1.8265, "learning_rate": 8.853335959811482e-06, "epoch": 0.8111030600300987, "percentage": 81.11, "elapsed_time": "1 day, 10:26:36", "remaining_time": "8:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14553, "total_steps": 17941, "loss": 1.6465, "learning_rate": 8.848277777076003e-06, "epoch": 0.8111587982832618, "percentage": 81.12, "elapsed_time": "1 day, 10:26:45", "remaining_time": "8:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14554, "total_steps": 17941, "loss": 1.6282, "learning_rate": 8.843220899433207e-06, "epoch": 0.811214536536425, "percentage": 81.12, "elapsed_time": "1 day, 10:26:53", "remaining_time": "8:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14555, "total_steps": 17941, "loss": 1.6087, "learning_rate": 8.838165327043485e-06, "epoch": 0.8112702747895881, "percentage": 81.13, "elapsed_time": "1 day, 10:27:02", "remaining_time": "8:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14556, "total_steps": 17941, "loss": 1.5522, "learning_rate": 8.833111060067172e-06, "epoch": 0.8113260130427512, "percentage": 81.13, "elapsed_time": "1 day, 10:27:11", "remaining_time": "8:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14557, "total_steps": 17941, "loss": 1.5523, "learning_rate": 8.828058098664566e-06, "epoch": 0.8113817512959144, "percentage": 81.14, "elapsed_time": "1 day, 10:27:19", "remaining_time": "8:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14558, "total_steps": 17941, "loss": 1.6946, "learning_rate": 8.823006442995895e-06, "epoch": 0.8114374895490776, "percentage": 81.14, "elapsed_time": "1 day, 10:27:28", "remaining_time": "8:00:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14559, "total_steps": 17941, "loss": 1.7758, "learning_rate": 8.817956093221369e-06, "epoch": 0.8114932278022406, "percentage": 81.15, "elapsed_time": "1 day, 10:27:36", "remaining_time": "8:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14560, "total_steps": 17941, "loss": 1.8656, "learning_rate": 8.81290704950119e-06, "epoch": 0.8115489660554038, "percentage": 81.15, "elapsed_time": "1 day, 10:27:44", "remaining_time": "8:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14561, "total_steps": 17941, "loss": 1.4917, "learning_rate": 8.807859311995454e-06, "epoch": 0.811604704308567, "percentage": 81.16, "elapsed_time": "1 day, 10:27:53", "remaining_time": "8:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14562, "total_steps": 17941, "loss": 1.808, "learning_rate": 8.802812880864252e-06, "epoch": 0.8116604425617301, "percentage": 81.17, "elapsed_time": "1 day, 10:28:02", "remaining_time": "7:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14563, "total_steps": 17941, "loss": 1.4685, "learning_rate": 8.797767756267628e-06, "epoch": 0.8117161808148933, "percentage": 81.17, "elapsed_time": "1 day, 10:28:10", "remaining_time": "7:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14564, "total_steps": 17941, "loss": 1.6824, "learning_rate": 8.792723938365599e-06, "epoch": 0.8117719190680565, "percentage": 81.18, "elapsed_time": "1 day, 10:28:18", "remaining_time": "7:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14565, "total_steps": 17941, "loss": 1.5778, "learning_rate": 8.787681427318095e-06, "epoch": 0.8118276573212195, "percentage": 81.18, "elapsed_time": "1 day, 10:28:28", "remaining_time": "7:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14566, "total_steps": 17941, "loss": 1.7507, "learning_rate": 8.782640223285043e-06, "epoch": 0.8118833955743827, "percentage": 81.19, "elapsed_time": "1 day, 10:28:36", "remaining_time": "7:59:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14567, "total_steps": 17941, "loss": 1.647, "learning_rate": 8.777600326426356e-06, "epoch": 0.8119391338275458, "percentage": 81.19, "elapsed_time": "1 day, 10:28:45", "remaining_time": "7:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14568, "total_steps": 17941, "loss": 1.6628, "learning_rate": 8.77256173690183e-06, "epoch": 0.811994872080709, "percentage": 81.2, "elapsed_time": "1 day, 10:28:53", "remaining_time": "7:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14569, "total_steps": 17941, "loss": 1.4677, "learning_rate": 8.767524454871273e-06, "epoch": 0.8120506103338722, "percentage": 81.21, "elapsed_time": "1 day, 10:29:02", "remaining_time": "7:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14570, "total_steps": 17941, "loss": 1.6471, "learning_rate": 8.762488480494435e-06, "epoch": 0.8121063485870352, "percentage": 81.21, "elapsed_time": "1 day, 10:29:10", "remaining_time": "7:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14571, "total_steps": 17941, "loss": 1.5768, "learning_rate": 8.757453813931032e-06, "epoch": 0.8121620868401984, "percentage": 81.22, "elapsed_time": "1 day, 10:29:19", "remaining_time": "7:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14572, "total_steps": 17941, "loss": 1.6616, "learning_rate": 8.752420455340749e-06, "epoch": 0.8122178250933616, "percentage": 81.22, "elapsed_time": "1 day, 10:29:27", "remaining_time": "7:58:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14573, "total_steps": 17941, "loss": 1.659, "learning_rate": 8.747388404883183e-06, "epoch": 0.8122735633465247, "percentage": 81.23, "elapsed_time": "1 day, 10:29:35", "remaining_time": "7:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14574, "total_steps": 17941, "loss": 1.5695, "learning_rate": 8.742357662717943e-06, "epoch": 0.8123293015996879, "percentage": 81.23, "elapsed_time": "1 day, 10:29:44", "remaining_time": "7:58:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14575, "total_steps": 17941, "loss": 1.6397, "learning_rate": 8.737328229004565e-06, "epoch": 0.812385039852851, "percentage": 81.24, "elapsed_time": "1 day, 10:29:52", "remaining_time": "7:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14576, "total_steps": 17941, "loss": 1.639, "learning_rate": 8.732300103902568e-06, "epoch": 0.8124407781060141, "percentage": 81.24, "elapsed_time": "1 day, 10:30:01", "remaining_time": "7:57:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14577, "total_steps": 17941, "loss": 1.6974, "learning_rate": 8.72727328757138e-06, "epoch": 0.8124965163591773, "percentage": 81.25, "elapsed_time": "1 day, 10:30:09", "remaining_time": "7:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14578, "total_steps": 17941, "loss": 1.5893, "learning_rate": 8.722247780170461e-06, "epoch": 0.8125522546123405, "percentage": 81.26, "elapsed_time": "1 day, 10:30:18", "remaining_time": "7:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14579, "total_steps": 17941, "loss": 1.7204, "learning_rate": 8.717223581859191e-06, "epoch": 0.8126079928655036, "percentage": 81.26, "elapsed_time": "1 day, 10:30:26", "remaining_time": "7:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14580, "total_steps": 17941, "loss": 1.6458, "learning_rate": 8.71220069279688e-06, "epoch": 0.8126637311186667, "percentage": 81.27, "elapsed_time": "1 day, 10:30:35", "remaining_time": "7:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14581, "total_steps": 17941, "loss": 1.3501, "learning_rate": 8.707179113142839e-06, "epoch": 0.8127194693718299, "percentage": 81.27, "elapsed_time": "1 day, 10:30:43", "remaining_time": "7:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14582, "total_steps": 17941, "loss": 1.694, "learning_rate": 8.702158843056319e-06, "epoch": 0.812775207624993, "percentage": 81.28, "elapsed_time": "1 day, 10:30:52", "remaining_time": "7:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14583, "total_steps": 17941, "loss": 1.5596, "learning_rate": 8.697139882696548e-06, "epoch": 0.8128309458781562, "percentage": 81.28, "elapsed_time": "1 day, 10:31:00", "remaining_time": "7:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14584, "total_steps": 17941, "loss": 1.7084, "learning_rate": 8.692122232222683e-06, "epoch": 0.8128866841313194, "percentage": 81.29, "elapsed_time": "1 day, 10:31:09", "remaining_time": "7:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14585, "total_steps": 17941, "loss": 1.4451, "learning_rate": 8.68710589179384e-06, "epoch": 0.8129424223844824, "percentage": 81.29, "elapsed_time": "1 day, 10:31:17", "remaining_time": "7:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14586, "total_steps": 17941, "loss": 1.4804, "learning_rate": 8.682090861569153e-06, "epoch": 0.8129981606376456, "percentage": 81.3, "elapsed_time": "1 day, 10:31:26", "remaining_time": "7:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14587, "total_steps": 17941, "loss": 1.6313, "learning_rate": 8.677077141707635e-06, "epoch": 0.8130538988908088, "percentage": 81.31, "elapsed_time": "1 day, 10:31:34", "remaining_time": "7:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14588, "total_steps": 17941, "loss": 1.4384, "learning_rate": 8.672064732368301e-06, "epoch": 0.8131096371439719, "percentage": 81.31, "elapsed_time": "1 day, 10:31:43", "remaining_time": "7:56:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14589, "total_steps": 17941, "loss": 1.7108, "learning_rate": 8.667053633710109e-06, "epoch": 0.8131653753971351, "percentage": 81.32, "elapsed_time": "1 day, 10:31:51", "remaining_time": "7:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14590, "total_steps": 17941, "loss": 1.4508, "learning_rate": 8.662043845892004e-06, "epoch": 0.8132211136502983, "percentage": 81.32, "elapsed_time": "1 day, 10:32:00", "remaining_time": "7:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14591, "total_steps": 17941, "loss": 1.7348, "learning_rate": 8.65703536907284e-06, "epoch": 0.8132768519034613, "percentage": 81.33, "elapsed_time": "1 day, 10:32:09", "remaining_time": "7:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14592, "total_steps": 17941, "loss": 1.6383, "learning_rate": 8.652028203411455e-06, "epoch": 0.8133325901566245, "percentage": 81.33, "elapsed_time": "1 day, 10:32:18", "remaining_time": "7:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14593, "total_steps": 17941, "loss": 1.8188, "learning_rate": 8.647022349066686e-06, "epoch": 0.8133883284097876, "percentage": 81.34, "elapsed_time": "1 day, 10:32:26", "remaining_time": "7:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14594, "total_steps": 17941, "loss": 1.5536, "learning_rate": 8.64201780619725e-06, "epoch": 0.8134440666629508, "percentage": 81.34, "elapsed_time": "1 day, 10:32:35", "remaining_time": "7:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14595, "total_steps": 17941, "loss": 1.68, "learning_rate": 8.637014574961872e-06, "epoch": 0.813499804916114, "percentage": 81.35, "elapsed_time": "1 day, 10:32:43", "remaining_time": "7:55:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14596, "total_steps": 17941, "loss": 1.4752, "learning_rate": 8.632012655519234e-06, "epoch": 0.813555543169277, "percentage": 81.36, "elapsed_time": "1 day, 10:32:51", "remaining_time": "7:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14597, "total_steps": 17941, "loss": 1.6428, "learning_rate": 8.62701204802796e-06, "epoch": 0.8136112814224402, "percentage": 81.36, "elapsed_time": "1 day, 10:33:00", "remaining_time": "7:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14598, "total_steps": 17941, "loss": 1.6523, "learning_rate": 8.622012752646652e-06, "epoch": 0.8136670196756034, "percentage": 81.37, "elapsed_time": "1 day, 10:33:08", "remaining_time": "7:54:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14599, "total_steps": 17941, "loss": 1.8712, "learning_rate": 8.617014769533843e-06, "epoch": 0.8137227579287665, "percentage": 81.37, "elapsed_time": "1 day, 10:33:17", "remaining_time": "7:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14600, "total_steps": 17941, "loss": 1.6655, "learning_rate": 8.612018098848041e-06, "epoch": 0.8137784961819297, "percentage": 81.38, "elapsed_time": "1 day, 10:33:25", "remaining_time": "7:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14601, "total_steps": 17941, "loss": 1.7306, "learning_rate": 8.607022740747716e-06, "epoch": 0.8138342344350928, "percentage": 81.38, "elapsed_time": "1 day, 10:33:34", "remaining_time": "7:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14602, "total_steps": 17941, "loss": 1.5182, "learning_rate": 8.602028695391307e-06, "epoch": 0.8138899726882559, "percentage": 81.39, "elapsed_time": "1 day, 10:33:42", "remaining_time": "7:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14603, "total_steps": 17941, "loss": 1.5408, "learning_rate": 8.597035962937156e-06, "epoch": 0.8139457109414191, "percentage": 81.39, "elapsed_time": "1 day, 10:33:51", "remaining_time": "7:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14604, "total_steps": 17941, "loss": 1.5651, "learning_rate": 8.592044543543643e-06, "epoch": 0.8140014491945823, "percentage": 81.4, "elapsed_time": "1 day, 10:33:59", "remaining_time": "7:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14605, "total_steps": 17941, "loss": 1.7391, "learning_rate": 8.587054437369057e-06, "epoch": 0.8140571874477454, "percentage": 81.41, "elapsed_time": "1 day, 10:34:07", "remaining_time": "7:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14606, "total_steps": 17941, "loss": 1.5022, "learning_rate": 8.582065644571647e-06, "epoch": 0.8141129257009085, "percentage": 81.41, "elapsed_time": "1 day, 10:34:17", "remaining_time": "7:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14607, "total_steps": 17941, "loss": 1.6308, "learning_rate": 8.577078165309621e-06, "epoch": 0.8141686639540717, "percentage": 81.42, "elapsed_time": "1 day, 10:34:25", "remaining_time": "7:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14608, "total_steps": 17941, "loss": 1.825, "learning_rate": 8.572091999741172e-06, "epoch": 0.8142244022072348, "percentage": 81.42, "elapsed_time": "1 day, 10:34:34", "remaining_time": "7:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14609, "total_steps": 17941, "loss": 1.5367, "learning_rate": 8.567107148024434e-06, "epoch": 0.814280140460398, "percentage": 81.43, "elapsed_time": "1 day, 10:34:42", "remaining_time": "7:53:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14610, "total_steps": 17941, "loss": 1.7769, "learning_rate": 8.562123610317457e-06, "epoch": 0.8143358787135612, "percentage": 81.43, "elapsed_time": "1 day, 10:34:50", "remaining_time": "7:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14611, "total_steps": 17941, "loss": 1.4503, "learning_rate": 8.557141386778334e-06, "epoch": 0.8143916169667242, "percentage": 81.44, "elapsed_time": "1 day, 10:34:59", "remaining_time": "7:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14612, "total_steps": 17941, "loss": 1.3287, "learning_rate": 8.552160477565075e-06, "epoch": 0.8144473552198874, "percentage": 81.44, "elapsed_time": "1 day, 10:35:07", "remaining_time": "7:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14613, "total_steps": 17941, "loss": 1.8482, "learning_rate": 8.547180882835609e-06, "epoch": 0.8145030934730506, "percentage": 81.45, "elapsed_time": "1 day, 10:35:16", "remaining_time": "7:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14614, "total_steps": 17941, "loss": 1.4672, "learning_rate": 8.542202602747884e-06, "epoch": 0.8145588317262137, "percentage": 81.46, "elapsed_time": "1 day, 10:35:24", "remaining_time": "7:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14615, "total_steps": 17941, "loss": 1.7671, "learning_rate": 8.537225637459773e-06, "epoch": 0.8146145699793769, "percentage": 81.46, "elapsed_time": "1 day, 10:35:33", "remaining_time": "7:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14616, "total_steps": 17941, "loss": 1.6654, "learning_rate": 8.532249987129132e-06, "epoch": 0.8146703082325399, "percentage": 81.47, "elapsed_time": "1 day, 10:35:41", "remaining_time": "7:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14617, "total_steps": 17941, "loss": 1.7017, "learning_rate": 8.527275651913735e-06, "epoch": 0.8147260464857031, "percentage": 81.47, "elapsed_time": "1 day, 10:35:49", "remaining_time": "7:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14618, "total_steps": 17941, "loss": 1.6954, "learning_rate": 8.522302631971341e-06, "epoch": 0.8147817847388663, "percentage": 81.48, "elapsed_time": "1 day, 10:35:58", "remaining_time": "7:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14619, "total_steps": 17941, "loss": 1.6882, "learning_rate": 8.517330927459704e-06, "epoch": 0.8148375229920294, "percentage": 81.48, "elapsed_time": "1 day, 10:36:06", "remaining_time": "7:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14620, "total_steps": 17941, "loss": 1.6532, "learning_rate": 8.512360538536452e-06, "epoch": 0.8148932612451926, "percentage": 81.49, "elapsed_time": "1 day, 10:36:15", "remaining_time": "7:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14621, "total_steps": 17941, "loss": 1.6373, "learning_rate": 8.507391465359238e-06, "epoch": 0.8149489994983558, "percentage": 81.49, "elapsed_time": "1 day, 10:36:23", "remaining_time": "7:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14622, "total_steps": 17941, "loss": 1.5834, "learning_rate": 8.502423708085644e-06, "epoch": 0.8150047377515188, "percentage": 81.5, "elapsed_time": "1 day, 10:36:32", "remaining_time": "7:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14623, "total_steps": 17941, "loss": 1.5779, "learning_rate": 8.497457266873233e-06, "epoch": 0.815060476004682, "percentage": 81.51, "elapsed_time": "1 day, 10:36:40", "remaining_time": "7:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14624, "total_steps": 17941, "loss": 1.7272, "learning_rate": 8.492492141879493e-06, "epoch": 0.8151162142578452, "percentage": 81.51, "elapsed_time": "1 day, 10:36:49", "remaining_time": "7:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14625, "total_steps": 17941, "loss": 1.597, "learning_rate": 8.487528333261896e-06, "epoch": 0.8151719525110083, "percentage": 81.52, "elapsed_time": "1 day, 10:36:57", "remaining_time": "7:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14626, "total_steps": 17941, "loss": 1.7181, "learning_rate": 8.482565841177864e-06, "epoch": 0.8152276907641715, "percentage": 81.52, "elapsed_time": "1 day, 10:37:05", "remaining_time": "7:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14627, "total_steps": 17941, "loss": 1.4208, "learning_rate": 8.477604665784782e-06, "epoch": 0.8152834290173346, "percentage": 81.53, "elapsed_time": "1 day, 10:37:14", "remaining_time": "7:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14628, "total_steps": 17941, "loss": 1.6251, "learning_rate": 8.47264480724e-06, "epoch": 0.8153391672704977, "percentage": 81.53, "elapsed_time": "1 day, 10:37:22", "remaining_time": "7:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14629, "total_steps": 17941, "loss": 1.5518, "learning_rate": 8.467686265700775e-06, "epoch": 0.8153949055236609, "percentage": 81.54, "elapsed_time": "1 day, 10:37:31", "remaining_time": "7:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14630, "total_steps": 17941, "loss": 1.751, "learning_rate": 8.462729041324407e-06, "epoch": 0.8154506437768241, "percentage": 81.55, "elapsed_time": "1 day, 10:37:39", "remaining_time": "7:50:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14631, "total_steps": 17941, "loss": 1.4874, "learning_rate": 8.45777313426811e-06, "epoch": 0.8155063820299872, "percentage": 81.55, "elapsed_time": "1 day, 10:37:48", "remaining_time": "7:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14632, "total_steps": 17941, "loss": 1.5309, "learning_rate": 8.452818544689023e-06, "epoch": 0.8155621202831503, "percentage": 81.56, "elapsed_time": "1 day, 10:37:56", "remaining_time": "7:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14633, "total_steps": 17941, "loss": 1.598, "learning_rate": 8.447865272744299e-06, "epoch": 0.8156178585363135, "percentage": 81.56, "elapsed_time": "1 day, 10:38:04", "remaining_time": "7:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14634, "total_steps": 17941, "loss": 1.6158, "learning_rate": 8.442913318591022e-06, "epoch": 0.8156735967894766, "percentage": 81.57, "elapsed_time": "1 day, 10:38:13", "remaining_time": "7:49:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14635, "total_steps": 17941, "loss": 1.6812, "learning_rate": 8.437962682386252e-06, "epoch": 0.8157293350426398, "percentage": 81.57, "elapsed_time": "1 day, 10:38:22", "remaining_time": "7:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14636, "total_steps": 17941, "loss": 1.5881, "learning_rate": 8.433013364286957e-06, "epoch": 0.815785073295803, "percentage": 81.58, "elapsed_time": "1 day, 10:38:30", "remaining_time": "7:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14637, "total_steps": 17941, "loss": 1.7401, "learning_rate": 8.428065364450138e-06, "epoch": 0.815840811548966, "percentage": 81.58, "elapsed_time": "1 day, 10:38:38", "remaining_time": "7:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14638, "total_steps": 17941, "loss": 1.6026, "learning_rate": 8.423118683032715e-06, "epoch": 0.8158965498021292, "percentage": 81.59, "elapsed_time": "1 day, 10:38:48", "remaining_time": "7:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14639, "total_steps": 17941, "loss": 1.764, "learning_rate": 8.418173320191547e-06, "epoch": 0.8159522880552923, "percentage": 81.6, "elapsed_time": "1 day, 10:38:56", "remaining_time": "7:48:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14640, "total_steps": 17941, "loss": 1.813, "learning_rate": 8.413229276083484e-06, "epoch": 0.8160080263084555, "percentage": 81.6, "elapsed_time": "1 day, 10:39:05", "remaining_time": "7:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14641, "total_steps": 17941, "loss": 1.7731, "learning_rate": 8.408286550865318e-06, "epoch": 0.8160637645616187, "percentage": 81.61, "elapsed_time": "1 day, 10:39:13", "remaining_time": "7:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14642, "total_steps": 17941, "loss": 1.606, "learning_rate": 8.40334514469382e-06, "epoch": 0.8161195028147817, "percentage": 81.61, "elapsed_time": "1 day, 10:39:22", "remaining_time": "7:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14643, "total_steps": 17941, "loss": 1.6438, "learning_rate": 8.398405057725678e-06, "epoch": 0.8161752410679449, "percentage": 81.62, "elapsed_time": "1 day, 10:39:30", "remaining_time": "7:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14644, "total_steps": 17941, "loss": 1.5923, "learning_rate": 8.393466290117557e-06, "epoch": 0.8162309793211081, "percentage": 81.62, "elapsed_time": "1 day, 10:39:38", "remaining_time": "7:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14645, "total_steps": 17941, "loss": 1.5047, "learning_rate": 8.388528842026128e-06, "epoch": 0.8162867175742712, "percentage": 81.63, "elapsed_time": "1 day, 10:39:47", "remaining_time": "7:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14646, "total_steps": 17941, "loss": 1.669, "learning_rate": 8.38359271360794e-06, "epoch": 0.8163424558274344, "percentage": 81.63, "elapsed_time": "1 day, 10:39:56", "remaining_time": "7:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14647, "total_steps": 17941, "loss": 1.6667, "learning_rate": 8.378657905019555e-06, "epoch": 0.8163981940805976, "percentage": 81.64, "elapsed_time": "1 day, 10:40:05", "remaining_time": "7:47:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14648, "total_steps": 17941, "loss": 1.8452, "learning_rate": 8.373724416417467e-06, "epoch": 0.8164539323337606, "percentage": 81.65, "elapsed_time": "1 day, 10:40:13", "remaining_time": "7:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14649, "total_steps": 17941, "loss": 1.755, "learning_rate": 8.368792247958157e-06, "epoch": 0.8165096705869238, "percentage": 81.65, "elapsed_time": "1 day, 10:40:22", "remaining_time": "7:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14650, "total_steps": 17941, "loss": 1.6841, "learning_rate": 8.363861399798018e-06, "epoch": 0.816565408840087, "percentage": 81.66, "elapsed_time": "1 day, 10:40:30", "remaining_time": "7:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14651, "total_steps": 17941, "loss": 1.6548, "learning_rate": 8.358931872093439e-06, "epoch": 0.8166211470932501, "percentage": 81.66, "elapsed_time": "1 day, 10:40:39", "remaining_time": "7:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14652, "total_steps": 17941, "loss": 1.6098, "learning_rate": 8.354003665000754e-06, "epoch": 0.8166768853464133, "percentage": 81.67, "elapsed_time": "1 day, 10:40:47", "remaining_time": "7:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14653, "total_steps": 17941, "loss": 1.4819, "learning_rate": 8.349076778676262e-06, "epoch": 0.8167326235995764, "percentage": 81.67, "elapsed_time": "1 day, 10:40:55", "remaining_time": "7:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14654, "total_steps": 17941, "loss": 2.0069, "learning_rate": 8.34415121327623e-06, "epoch": 0.8167883618527395, "percentage": 81.68, "elapsed_time": "1 day, 10:41:04", "remaining_time": "7:46:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14655, "total_steps": 17941, "loss": 1.6903, "learning_rate": 8.33922696895682e-06, "epoch": 0.8168441001059027, "percentage": 81.68, "elapsed_time": "1 day, 10:41:12", "remaining_time": "7:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14656, "total_steps": 17941, "loss": 1.5395, "learning_rate": 8.334304045874247e-06, "epoch": 0.8168998383590659, "percentage": 81.69, "elapsed_time": "1 day, 10:41:21", "remaining_time": "7:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14657, "total_steps": 17941, "loss": 1.6031, "learning_rate": 8.329382444184636e-06, "epoch": 0.816955576612229, "percentage": 81.7, "elapsed_time": "1 day, 10:41:29", "remaining_time": "7:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14658, "total_steps": 17941, "loss": 1.6411, "learning_rate": 8.32446216404404e-06, "epoch": 0.8170113148653921, "percentage": 81.7, "elapsed_time": "1 day, 10:41:38", "remaining_time": "7:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14659, "total_steps": 17941, "loss": 1.5835, "learning_rate": 8.319543205608522e-06, "epoch": 0.8170670531185553, "percentage": 81.71, "elapsed_time": "1 day, 10:41:46", "remaining_time": "7:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14660, "total_steps": 17941, "loss": 1.6486, "learning_rate": 8.31462556903408e-06, "epoch": 0.8171227913717184, "percentage": 81.71, "elapsed_time": "1 day, 10:41:55", "remaining_time": "7:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14661, "total_steps": 17941, "loss": 1.6764, "learning_rate": 8.309709254476682e-06, "epoch": 0.8171785296248816, "percentage": 81.72, "elapsed_time": "1 day, 10:42:03", "remaining_time": "7:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14662, "total_steps": 17941, "loss": 1.6329, "learning_rate": 8.304794262092208e-06, "epoch": 0.8172342678780447, "percentage": 81.72, "elapsed_time": "1 day, 10:42:11", "remaining_time": "7:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14663, "total_steps": 17941, "loss": 2.0122, "learning_rate": 8.299880592036579e-06, "epoch": 0.8172900061312078, "percentage": 81.73, "elapsed_time": "1 day, 10:42:20", "remaining_time": "7:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14664, "total_steps": 17941, "loss": 1.7526, "learning_rate": 8.294968244465618e-06, "epoch": 0.817345744384371, "percentage": 81.73, "elapsed_time": "1 day, 10:42:28", "remaining_time": "7:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14665, "total_steps": 17941, "loss": 1.7203, "learning_rate": 8.290057219535097e-06, "epoch": 0.8174014826375341, "percentage": 81.74, "elapsed_time": "1 day, 10:42:37", "remaining_time": "7:45:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14666, "total_steps": 17941, "loss": 1.5719, "learning_rate": 8.28514751740077e-06, "epoch": 0.8174572208906973, "percentage": 81.75, "elapsed_time": "1 day, 10:42:45", "remaining_time": "7:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14667, "total_steps": 17941, "loss": 1.6364, "learning_rate": 8.280239138218354e-06, "epoch": 0.8175129591438605, "percentage": 81.75, "elapsed_time": "1 day, 10:42:54", "remaining_time": "7:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14668, "total_steps": 17941, "loss": 1.4977, "learning_rate": 8.275332082143522e-06, "epoch": 0.8175686973970235, "percentage": 81.76, "elapsed_time": "1 day, 10:43:02", "remaining_time": "7:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14669, "total_steps": 17941, "loss": 1.5391, "learning_rate": 8.270426349331872e-06, "epoch": 0.8176244356501867, "percentage": 81.76, "elapsed_time": "1 day, 10:43:11", "remaining_time": "7:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14670, "total_steps": 17941, "loss": 1.8799, "learning_rate": 8.265521939938987e-06, "epoch": 0.8176801739033499, "percentage": 81.77, "elapsed_time": "1 day, 10:43:19", "remaining_time": "7:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14671, "total_steps": 17941, "loss": 1.637, "learning_rate": 8.260618854120439e-06, "epoch": 0.817735912156513, "percentage": 81.77, "elapsed_time": "1 day, 10:43:27", "remaining_time": "7:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14672, "total_steps": 17941, "loss": 1.5, "learning_rate": 8.25571709203169e-06, "epoch": 0.8177916504096762, "percentage": 81.78, "elapsed_time": "1 day, 10:43:36", "remaining_time": "7:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14673, "total_steps": 17941, "loss": 1.5887, "learning_rate": 8.250816653828208e-06, "epoch": 0.8178473886628393, "percentage": 81.78, "elapsed_time": "1 day, 10:43:44", "remaining_time": "7:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14674, "total_steps": 17941, "loss": 1.7618, "learning_rate": 8.245917539665409e-06, "epoch": 0.8179031269160024, "percentage": 81.79, "elapsed_time": "1 day, 10:43:53", "remaining_time": "7:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14675, "total_steps": 17941, "loss": 1.9131, "learning_rate": 8.241019749698675e-06, "epoch": 0.8179588651691656, "percentage": 81.8, "elapsed_time": "1 day, 10:44:02", "remaining_time": "7:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14676, "total_steps": 17941, "loss": 1.4943, "learning_rate": 8.236123284083314e-06, "epoch": 0.8180146034223288, "percentage": 81.8, "elapsed_time": "1 day, 10:44:10", "remaining_time": "7:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14677, "total_steps": 17941, "loss": 1.9758, "learning_rate": 8.231228142974606e-06, "epoch": 0.8180703416754919, "percentage": 81.81, "elapsed_time": "1 day, 10:44:19", "remaining_time": "7:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14678, "total_steps": 17941, "loss": 1.6154, "learning_rate": 8.226334326527834e-06, "epoch": 0.818126079928655, "percentage": 81.81, "elapsed_time": "1 day, 10:44:27", "remaining_time": "7:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14679, "total_steps": 17941, "loss": 1.6926, "learning_rate": 8.221441834898175e-06, "epoch": 0.8181818181818182, "percentage": 81.82, "elapsed_time": "1 day, 10:44:35", "remaining_time": "7:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14680, "total_steps": 17941, "loss": 1.7325, "learning_rate": 8.216550668240803e-06, "epoch": 0.8182375564349813, "percentage": 81.82, "elapsed_time": "1 day, 10:44:44", "remaining_time": "7:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14681, "total_steps": 17941, "loss": 1.6233, "learning_rate": 8.211660826710804e-06, "epoch": 0.8182932946881445, "percentage": 81.83, "elapsed_time": "1 day, 10:44:53", "remaining_time": "7:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14682, "total_steps": 17941, "loss": 1.5409, "learning_rate": 8.206772310463295e-06, "epoch": 0.8183490329413077, "percentage": 81.83, "elapsed_time": "1 day, 10:45:01", "remaining_time": "7:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14683, "total_steps": 17941, "loss": 1.9611, "learning_rate": 8.201885119653308e-06, "epoch": 0.8184047711944707, "percentage": 81.84, "elapsed_time": "1 day, 10:45:10", "remaining_time": "7:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14684, "total_steps": 17941, "loss": 1.7156, "learning_rate": 8.196999254435816e-06, "epoch": 0.8184605094476339, "percentage": 81.85, "elapsed_time": "1 day, 10:45:18", "remaining_time": "7:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14685, "total_steps": 17941, "loss": 1.7105, "learning_rate": 8.192114714965776e-06, "epoch": 0.818516247700797, "percentage": 81.85, "elapsed_time": "1 day, 10:45:27", "remaining_time": "7:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14686, "total_steps": 17941, "loss": 1.7029, "learning_rate": 8.187231501398102e-06, "epoch": 0.8185719859539602, "percentage": 81.86, "elapsed_time": "1 day, 10:45:35", "remaining_time": "7:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14687, "total_steps": 17941, "loss": 1.3432, "learning_rate": 8.18234961388767e-06, "epoch": 0.8186277242071234, "percentage": 81.86, "elapsed_time": "1 day, 10:45:44", "remaining_time": "7:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14688, "total_steps": 17941, "loss": 1.6022, "learning_rate": 8.17746905258927e-06, "epoch": 0.8186834624602864, "percentage": 81.87, "elapsed_time": "1 day, 10:45:52", "remaining_time": "7:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14689, "total_steps": 17941, "loss": 1.4637, "learning_rate": 8.172589817657721e-06, "epoch": 0.8187392007134496, "percentage": 81.87, "elapsed_time": "1 day, 10:46:00", "remaining_time": "7:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14690, "total_steps": 17941, "loss": 1.7603, "learning_rate": 8.167711909247766e-06, "epoch": 0.8187949389666128, "percentage": 81.88, "elapsed_time": "1 day, 10:46:09", "remaining_time": "7:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14691, "total_steps": 17941, "loss": 1.8689, "learning_rate": 8.16283532751408e-06, "epoch": 0.8188506772197759, "percentage": 81.89, "elapsed_time": "1 day, 10:46:17", "remaining_time": "7:41:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14692, "total_steps": 17941, "loss": 1.5218, "learning_rate": 8.157960072611326e-06, "epoch": 0.8189064154729391, "percentage": 81.89, "elapsed_time": "1 day, 10:46:26", "remaining_time": "7:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14693, "total_steps": 17941, "loss": 1.676, "learning_rate": 8.153086144694122e-06, "epoch": 0.8189621537261023, "percentage": 81.9, "elapsed_time": "1 day, 10:46:34", "remaining_time": "7:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14694, "total_steps": 17941, "loss": 1.7805, "learning_rate": 8.148213543917055e-06, "epoch": 0.8190178919792653, "percentage": 81.9, "elapsed_time": "1 day, 10:46:43", "remaining_time": "7:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14695, "total_steps": 17941, "loss": 1.524, "learning_rate": 8.143342270434629e-06, "epoch": 0.8190736302324285, "percentage": 81.91, "elapsed_time": "1 day, 10:46:51", "remaining_time": "7:40:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14696, "total_steps": 17941, "loss": 1.3755, "learning_rate": 8.138472324401335e-06, "epoch": 0.8191293684855917, "percentage": 81.91, "elapsed_time": "1 day, 10:47:00", "remaining_time": "7:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14697, "total_steps": 17941, "loss": 1.5122, "learning_rate": 8.133603705971649e-06, "epoch": 0.8191851067387548, "percentage": 81.92, "elapsed_time": "1 day, 10:47:08", "remaining_time": "7:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14698, "total_steps": 17941, "loss": 1.4538, "learning_rate": 8.128736415299948e-06, "epoch": 0.819240844991918, "percentage": 81.92, "elapsed_time": "1 day, 10:47:16", "remaining_time": "7:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14699, "total_steps": 17941, "loss": 1.8112, "learning_rate": 8.1238704525406e-06, "epoch": 0.8192965832450811, "percentage": 81.93, "elapsed_time": "1 day, 10:47:25", "remaining_time": "7:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14700, "total_steps": 17941, "loss": 1.6804, "learning_rate": 8.119005817847924e-06, "epoch": 0.8193523214982442, "percentage": 81.94, "elapsed_time": "1 day, 10:47:33", "remaining_time": "7:40:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14701, "total_steps": 17941, "loss": 1.7354, "learning_rate": 8.114142511376215e-06, "epoch": 0.8194080597514074, "percentage": 81.94, "elapsed_time": "1 day, 10:47:43", "remaining_time": "7:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14702, "total_steps": 17941, "loss": 1.6038, "learning_rate": 8.109280533279684e-06, "epoch": 0.8194637980045706, "percentage": 81.95, "elapsed_time": "1 day, 10:47:51", "remaining_time": "7:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14703, "total_steps": 17941, "loss": 1.7552, "learning_rate": 8.104419883712517e-06, "epoch": 0.8195195362577337, "percentage": 81.95, "elapsed_time": "1 day, 10:48:00", "remaining_time": "7:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14704, "total_steps": 17941, "loss": 1.5637, "learning_rate": 8.099560562828911e-06, "epoch": 0.8195752745108968, "percentage": 81.96, "elapsed_time": "1 day, 10:48:08", "remaining_time": "7:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14705, "total_steps": 17941, "loss": 1.495, "learning_rate": 8.094702570782936e-06, "epoch": 0.81963101276406, "percentage": 81.96, "elapsed_time": "1 day, 10:48:17", "remaining_time": "7:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14706, "total_steps": 17941, "loss": 1.7242, "learning_rate": 8.089845907728682e-06, "epoch": 0.8196867510172231, "percentage": 81.97, "elapsed_time": "1 day, 10:48:25", "remaining_time": "7:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14707, "total_steps": 17941, "loss": 1.4354, "learning_rate": 8.084990573820133e-06, "epoch": 0.8197424892703863, "percentage": 81.97, "elapsed_time": "1 day, 10:48:33", "remaining_time": "7:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14708, "total_steps": 17941, "loss": 1.7557, "learning_rate": 8.080136569211322e-06, "epoch": 0.8197982275235494, "percentage": 81.98, "elapsed_time": "1 day, 10:48:42", "remaining_time": "7:39:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14709, "total_steps": 17941, "loss": 1.6358, "learning_rate": 8.075283894056178e-06, "epoch": 0.8198539657767125, "percentage": 81.99, "elapsed_time": "1 day, 10:48:50", "remaining_time": "7:38:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14710, "total_steps": 17941, "loss": 1.572, "learning_rate": 8.070432548508578e-06, "epoch": 0.8199097040298757, "percentage": 81.99, "elapsed_time": "1 day, 10:48:59", "remaining_time": "7:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14711, "total_steps": 17941, "loss": 1.6363, "learning_rate": 8.065582532722394e-06, "epoch": 0.8199654422830388, "percentage": 82.0, "elapsed_time": "1 day, 10:49:07", "remaining_time": "7:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14712, "total_steps": 17941, "loss": 1.4092, "learning_rate": 8.060733846851432e-06, "epoch": 0.820021180536202, "percentage": 82.0, "elapsed_time": "1 day, 10:49:16", "remaining_time": "7:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14713, "total_steps": 17941, "loss": 1.8248, "learning_rate": 8.055886491049486e-06, "epoch": 0.8200769187893652, "percentage": 82.01, "elapsed_time": "1 day, 10:49:24", "remaining_time": "7:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14714, "total_steps": 17941, "loss": 1.517, "learning_rate": 8.051040465470245e-06, "epoch": 0.8201326570425282, "percentage": 82.01, "elapsed_time": "1 day, 10:49:32", "remaining_time": "7:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14715, "total_steps": 17941, "loss": 1.7852, "learning_rate": 8.046195770267428e-06, "epoch": 0.8201883952956914, "percentage": 82.02, "elapsed_time": "1 day, 10:49:41", "remaining_time": "7:38:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14716, "total_steps": 17941, "loss": 1.615, "learning_rate": 8.041352405594692e-06, "epoch": 0.8202441335488546, "percentage": 82.02, "elapsed_time": "1 day, 10:49:49", "remaining_time": "7:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14717, "total_steps": 17941, "loss": 1.6671, "learning_rate": 8.03651037160561e-06, "epoch": 0.8202998718020177, "percentage": 82.03, "elapsed_time": "1 day, 10:49:58", "remaining_time": "7:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14718, "total_steps": 17941, "loss": 1.682, "learning_rate": 8.031669668453752e-06, "epoch": 0.8203556100551809, "percentage": 82.04, "elapsed_time": "1 day, 10:50:06", "remaining_time": "7:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14719, "total_steps": 17941, "loss": 1.762, "learning_rate": 8.026830296292636e-06, "epoch": 0.8204113483083441, "percentage": 82.04, "elapsed_time": "1 day, 10:50:15", "remaining_time": "7:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14720, "total_steps": 17941, "loss": 1.73, "learning_rate": 8.021992255275763e-06, "epoch": 0.8204670865615071, "percentage": 82.05, "elapsed_time": "1 day, 10:50:23", "remaining_time": "7:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14721, "total_steps": 17941, "loss": 1.6057, "learning_rate": 8.017155545556527e-06, "epoch": 0.8205228248146703, "percentage": 82.05, "elapsed_time": "1 day, 10:50:32", "remaining_time": "7:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14722, "total_steps": 17941, "loss": 1.4836, "learning_rate": 8.012320167288334e-06, "epoch": 0.8205785630678335, "percentage": 82.06, "elapsed_time": "1 day, 10:50:40", "remaining_time": "7:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14723, "total_steps": 17941, "loss": 1.8501, "learning_rate": 8.007486120624559e-06, "epoch": 0.8206343013209966, "percentage": 82.06, "elapsed_time": "1 day, 10:50:48", "remaining_time": "7:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14724, "total_steps": 17941, "loss": 1.6392, "learning_rate": 8.002653405718485e-06, "epoch": 0.8206900395741598, "percentage": 82.07, "elapsed_time": "1 day, 10:50:57", "remaining_time": "7:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14725, "total_steps": 17941, "loss": 1.5372, "learning_rate": 7.997822022723378e-06, "epoch": 0.8207457778273229, "percentage": 82.07, "elapsed_time": "1 day, 10:51:05", "remaining_time": "7:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14726, "total_steps": 17941, "loss": 1.6999, "learning_rate": 7.992991971792469e-06, "epoch": 0.820801516080486, "percentage": 82.08, "elapsed_time": "1 day, 10:51:14", "remaining_time": "7:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14727, "total_steps": 17941, "loss": 1.6596, "learning_rate": 7.988163253078952e-06, "epoch": 0.8208572543336492, "percentage": 82.09, "elapsed_time": "1 day, 10:51:23", "remaining_time": "7:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14728, "total_steps": 17941, "loss": 1.4913, "learning_rate": 7.98333586673593e-06, "epoch": 0.8209129925868124, "percentage": 82.09, "elapsed_time": "1 day, 10:51:31", "remaining_time": "7:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14729, "total_steps": 17941, "loss": 1.7483, "learning_rate": 7.978509812916513e-06, "epoch": 0.8209687308399755, "percentage": 82.1, "elapsed_time": "1 day, 10:51:40", "remaining_time": "7:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14730, "total_steps": 17941, "loss": 1.5914, "learning_rate": 7.973685091773792e-06, "epoch": 0.8210244690931386, "percentage": 82.1, "elapsed_time": "1 day, 10:51:48", "remaining_time": "7:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14731, "total_steps": 17941, "loss": 1.5902, "learning_rate": 7.968861703460728e-06, "epoch": 0.8210802073463017, "percentage": 82.11, "elapsed_time": "1 day, 10:51:56", "remaining_time": "7:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14732, "total_steps": 17941, "loss": 1.6152, "learning_rate": 7.964039648130328e-06, "epoch": 0.8211359455994649, "percentage": 82.11, "elapsed_time": "1 day, 10:52:05", "remaining_time": "7:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14733, "total_steps": 17941, "loss": 1.3945, "learning_rate": 7.95921892593548e-06, "epoch": 0.8211916838526281, "percentage": 82.12, "elapsed_time": "1 day, 10:52:13", "remaining_time": "7:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14734, "total_steps": 17941, "loss": 1.5801, "learning_rate": 7.954399537029106e-06, "epoch": 0.8212474221057912, "percentage": 82.12, "elapsed_time": "1 day, 10:52:23", "remaining_time": "7:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14735, "total_steps": 17941, "loss": 1.56, "learning_rate": 7.94958148156405e-06, "epoch": 0.8213031603589543, "percentage": 82.13, "elapsed_time": "1 day, 10:52:31", "remaining_time": "7:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14736, "total_steps": 17941, "loss": 1.6339, "learning_rate": 7.94476475969308e-06, "epoch": 0.8213588986121175, "percentage": 82.14, "elapsed_time": "1 day, 10:52:40", "remaining_time": "7:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14737, "total_steps": 17941, "loss": 1.7142, "learning_rate": 7.939949371568977e-06, "epoch": 0.8214146368652806, "percentage": 82.14, "elapsed_time": "1 day, 10:52:48", "remaining_time": "7:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14738, "total_steps": 17941, "loss": 1.5694, "learning_rate": 7.935135317344455e-06, "epoch": 0.8214703751184438, "percentage": 82.15, "elapsed_time": "1 day, 10:52:57", "remaining_time": "7:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14739, "total_steps": 17941, "loss": 1.5784, "learning_rate": 7.930322597172191e-06, "epoch": 0.821526113371607, "percentage": 82.15, "elapsed_time": "1 day, 10:53:05", "remaining_time": "7:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14740, "total_steps": 17941, "loss": 1.6162, "learning_rate": 7.925511211204795e-06, "epoch": 0.82158185162477, "percentage": 82.16, "elapsed_time": "1 day, 10:53:13", "remaining_time": "7:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14741, "total_steps": 17941, "loss": 1.6094, "learning_rate": 7.92070115959488e-06, "epoch": 0.8216375898779332, "percentage": 82.16, "elapsed_time": "1 day, 10:53:23", "remaining_time": "7:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14742, "total_steps": 17941, "loss": 1.6552, "learning_rate": 7.915892442494994e-06, "epoch": 0.8216933281310964, "percentage": 82.17, "elapsed_time": "1 day, 10:53:31", "remaining_time": "7:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14743, "total_steps": 17941, "loss": 1.7177, "learning_rate": 7.911085060057621e-06, "epoch": 0.8217490663842595, "percentage": 82.17, "elapsed_time": "1 day, 10:53:40", "remaining_time": "7:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14744, "total_steps": 17941, "loss": 1.8521, "learning_rate": 7.906279012435237e-06, "epoch": 0.8218048046374227, "percentage": 82.18, "elapsed_time": "1 day, 10:53:48", "remaining_time": "7:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14745, "total_steps": 17941, "loss": 1.3688, "learning_rate": 7.901474299780258e-06, "epoch": 0.8218605428905859, "percentage": 82.19, "elapsed_time": "1 day, 10:53:57", "remaining_time": "7:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14746, "total_steps": 17941, "loss": 1.7278, "learning_rate": 7.89667092224508e-06, "epoch": 0.8219162811437489, "percentage": 82.19, "elapsed_time": "1 day, 10:54:05", "remaining_time": "7:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14747, "total_steps": 17941, "loss": 1.5499, "learning_rate": 7.891868879982001e-06, "epoch": 0.8219720193969121, "percentage": 82.2, "elapsed_time": "1 day, 10:54:13", "remaining_time": "7:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14748, "total_steps": 17941, "loss": 1.5249, "learning_rate": 7.887068173143325e-06, "epoch": 0.8220277576500753, "percentage": 82.2, "elapsed_time": "1 day, 10:54:22", "remaining_time": "7:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14749, "total_steps": 17941, "loss": 1.4663, "learning_rate": 7.882268801881337e-06, "epoch": 0.8220834959032384, "percentage": 82.21, "elapsed_time": "1 day, 10:54:30", "remaining_time": "7:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14750, "total_steps": 17941, "loss": 1.3222, "learning_rate": 7.877470766348206e-06, "epoch": 0.8221392341564016, "percentage": 82.21, "elapsed_time": "1 day, 10:54:39", "remaining_time": "7:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14751, "total_steps": 17941, "loss": 1.6223, "learning_rate": 7.872674066696112e-06, "epoch": 0.8221949724095647, "percentage": 82.22, "elapsed_time": "1 day, 10:54:47", "remaining_time": "7:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14752, "total_steps": 17941, "loss": 1.6545, "learning_rate": 7.867878703077175e-06, "epoch": 0.8222507106627278, "percentage": 82.23, "elapsed_time": "1 day, 10:54:56", "remaining_time": "7:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14753, "total_steps": 17941, "loss": 1.5277, "learning_rate": 7.86308467564349e-06, "epoch": 0.822306448915891, "percentage": 82.23, "elapsed_time": "1 day, 10:55:04", "remaining_time": "7:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14754, "total_steps": 17941, "loss": 1.6744, "learning_rate": 7.858291984547072e-06, "epoch": 0.8223621871690541, "percentage": 82.24, "elapsed_time": "1 day, 10:55:13", "remaining_time": "7:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14755, "total_steps": 17941, "loss": 1.7234, "learning_rate": 7.85350062993992e-06, "epoch": 0.8224179254222173, "percentage": 82.24, "elapsed_time": "1 day, 10:55:21", "remaining_time": "7:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14756, "total_steps": 17941, "loss": 1.6461, "learning_rate": 7.848710611974019e-06, "epoch": 0.8224736636753804, "percentage": 82.25, "elapsed_time": "1 day, 10:55:29", "remaining_time": "7:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14757, "total_steps": 17941, "loss": 1.427, "learning_rate": 7.843921930801245e-06, "epoch": 0.8225294019285435, "percentage": 82.25, "elapsed_time": "1 day, 10:55:38", "remaining_time": "7:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14758, "total_steps": 17941, "loss": 1.5931, "learning_rate": 7.839134586573493e-06, "epoch": 0.8225851401817067, "percentage": 82.26, "elapsed_time": "1 day, 10:55:46", "remaining_time": "7:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14759, "total_steps": 17941, "loss": 1.6162, "learning_rate": 7.834348579442553e-06, "epoch": 0.8226408784348699, "percentage": 82.26, "elapsed_time": "1 day, 10:55:55", "remaining_time": "7:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14760, "total_steps": 17941, "loss": 1.6442, "learning_rate": 7.829563909560256e-06, "epoch": 0.822696616688033, "percentage": 82.27, "elapsed_time": "1 day, 10:56:04", "remaining_time": "7:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14761, "total_steps": 17941, "loss": 1.7833, "learning_rate": 7.824780577078311e-06, "epoch": 0.8227523549411961, "percentage": 82.28, "elapsed_time": "1 day, 10:56:12", "remaining_time": "7:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14762, "total_steps": 17941, "loss": 1.7263, "learning_rate": 7.81999858214843e-06, "epoch": 0.8228080931943593, "percentage": 82.28, "elapsed_time": "1 day, 10:56:21", "remaining_time": "7:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14763, "total_steps": 17941, "loss": 1.6074, "learning_rate": 7.815217924922264e-06, "epoch": 0.8228638314475224, "percentage": 82.29, "elapsed_time": "1 day, 10:56:29", "remaining_time": "7:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14764, "total_steps": 17941, "loss": 1.7478, "learning_rate": 7.81043860555143e-06, "epoch": 0.8229195697006856, "percentage": 82.29, "elapsed_time": "1 day, 10:56:37", "remaining_time": "7:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14765, "total_steps": 17941, "loss": 1.6435, "learning_rate": 7.805660624187516e-06, "epoch": 0.8229753079538488, "percentage": 82.3, "elapsed_time": "1 day, 10:56:46", "remaining_time": "7:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14766, "total_steps": 17941, "loss": 1.5407, "learning_rate": 7.80088398098201e-06, "epoch": 0.8230310462070118, "percentage": 82.3, "elapsed_time": "1 day, 10:56:54", "remaining_time": "7:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14767, "total_steps": 17941, "loss": 1.7211, "learning_rate": 7.796108676086445e-06, "epoch": 0.823086784460175, "percentage": 82.31, "elapsed_time": "1 day, 10:57:03", "remaining_time": "7:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14768, "total_steps": 17941, "loss": 1.6505, "learning_rate": 7.791334709652254e-06, "epoch": 0.8231425227133382, "percentage": 82.31, "elapsed_time": "1 day, 10:57:12", "remaining_time": "7:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14769, "total_steps": 17941, "loss": 1.6837, "learning_rate": 7.786562081830817e-06, "epoch": 0.8231982609665013, "percentage": 82.32, "elapsed_time": "1 day, 10:57:20", "remaining_time": "7:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14770, "total_steps": 17941, "loss": 1.642, "learning_rate": 7.781790792773514e-06, "epoch": 0.8232539992196645, "percentage": 82.33, "elapsed_time": "1 day, 10:57:29", "remaining_time": "7:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14771, "total_steps": 17941, "loss": 1.6248, "learning_rate": 7.777020842631656e-06, "epoch": 0.8233097374728277, "percentage": 82.33, "elapsed_time": "1 day, 10:57:37", "remaining_time": "7:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14772, "total_steps": 17941, "loss": 1.7027, "learning_rate": 7.772252231556531e-06, "epoch": 0.8233654757259907, "percentage": 82.34, "elapsed_time": "1 day, 10:57:45", "remaining_time": "7:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14773, "total_steps": 17941, "loss": 1.5712, "learning_rate": 7.76748495969935e-06, "epoch": 0.8234212139791539, "percentage": 82.34, "elapsed_time": "1 day, 10:57:54", "remaining_time": "7:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14774, "total_steps": 17941, "loss": 1.3786, "learning_rate": 7.762719027211308e-06, "epoch": 0.8234769522323171, "percentage": 82.35, "elapsed_time": "1 day, 10:58:03", "remaining_time": "7:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14775, "total_steps": 17941, "loss": 1.5349, "learning_rate": 7.75795443424357e-06, "epoch": 0.8235326904854802, "percentage": 82.35, "elapsed_time": "1 day, 10:58:11", "remaining_time": "7:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14776, "total_steps": 17941, "loss": 1.7259, "learning_rate": 7.753191180947223e-06, "epoch": 0.8235884287386434, "percentage": 82.36, "elapsed_time": "1 day, 10:58:20", "remaining_time": "7:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14777, "total_steps": 17941, "loss": 1.5049, "learning_rate": 7.74842926747334e-06, "epoch": 0.8236441669918064, "percentage": 82.36, "elapsed_time": "1 day, 10:58:29", "remaining_time": "7:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14778, "total_steps": 17941, "loss": 1.5613, "learning_rate": 7.743668693972927e-06, "epoch": 0.8236999052449696, "percentage": 82.37, "elapsed_time": "1 day, 10:58:38", "remaining_time": "7:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14779, "total_steps": 17941, "loss": 1.744, "learning_rate": 7.738909460596994e-06, "epoch": 0.8237556434981328, "percentage": 82.38, "elapsed_time": "1 day, 10:58:46", "remaining_time": "7:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14780, "total_steps": 17941, "loss": 1.5413, "learning_rate": 7.734151567496434e-06, "epoch": 0.8238113817512959, "percentage": 82.38, "elapsed_time": "1 day, 10:58:55", "remaining_time": "7:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14781, "total_steps": 17941, "loss": 1.6224, "learning_rate": 7.729395014822149e-06, "epoch": 0.823867120004459, "percentage": 82.39, "elapsed_time": "1 day, 10:59:03", "remaining_time": "7:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14782, "total_steps": 17941, "loss": 1.7152, "learning_rate": 7.724639802725025e-06, "epoch": 0.8239228582576222, "percentage": 82.39, "elapsed_time": "1 day, 10:59:12", "remaining_time": "7:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14783, "total_steps": 17941, "loss": 1.7338, "learning_rate": 7.71988593135583e-06, "epoch": 0.8239785965107853, "percentage": 82.4, "elapsed_time": "1 day, 10:59:20", "remaining_time": "7:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14784, "total_steps": 17941, "loss": 1.735, "learning_rate": 7.715133400865342e-06, "epoch": 0.8240343347639485, "percentage": 82.4, "elapsed_time": "1 day, 10:59:29", "remaining_time": "7:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14785, "total_steps": 17941, "loss": 1.7797, "learning_rate": 7.710382211404288e-06, "epoch": 0.8240900730171117, "percentage": 82.41, "elapsed_time": "1 day, 10:59:37", "remaining_time": "7:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14786, "total_steps": 17941, "loss": 1.7308, "learning_rate": 7.705632363123355e-06, "epoch": 0.8241458112702748, "percentage": 82.41, "elapsed_time": "1 day, 10:59:46", "remaining_time": "7:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14787, "total_steps": 17941, "loss": 1.4567, "learning_rate": 7.700883856173164e-06, "epoch": 0.8242015495234379, "percentage": 82.42, "elapsed_time": "1 day, 10:59:55", "remaining_time": "7:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14788, "total_steps": 17941, "loss": 1.3691, "learning_rate": 7.696136690704309e-06, "epoch": 0.8242572877766011, "percentage": 82.43, "elapsed_time": "1 day, 11:00:04", "remaining_time": "7:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14789, "total_steps": 17941, "loss": 1.578, "learning_rate": 7.691390866867348e-06, "epoch": 0.8243130260297642, "percentage": 82.43, "elapsed_time": "1 day, 11:00:12", "remaining_time": "7:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14790, "total_steps": 17941, "loss": 1.5294, "learning_rate": 7.686646384812802e-06, "epoch": 0.8243687642829274, "percentage": 82.44, "elapsed_time": "1 day, 11:00:21", "remaining_time": "7:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14791, "total_steps": 17941, "loss": 1.6699, "learning_rate": 7.68190324469113e-06, "epoch": 0.8244245025360906, "percentage": 82.44, "elapsed_time": "1 day, 11:00:29", "remaining_time": "7:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14792, "total_steps": 17941, "loss": 1.6154, "learning_rate": 7.677161446652736e-06, "epoch": 0.8244802407892536, "percentage": 82.45, "elapsed_time": "1 day, 11:00:37", "remaining_time": "7:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14793, "total_steps": 17941, "loss": 1.7302, "learning_rate": 7.672420990848033e-06, "epoch": 0.8245359790424168, "percentage": 82.45, "elapsed_time": "1 day, 11:00:46", "remaining_time": "7:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14794, "total_steps": 17941, "loss": 1.5814, "learning_rate": 7.667681877427363e-06, "epoch": 0.82459171729558, "percentage": 82.46, "elapsed_time": "1 day, 11:00:55", "remaining_time": "7:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14795, "total_steps": 17941, "loss": 1.6489, "learning_rate": 7.662944106540998e-06, "epoch": 0.8246474555487431, "percentage": 82.46, "elapsed_time": "1 day, 11:01:03", "remaining_time": "7:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14796, "total_steps": 17941, "loss": 1.8268, "learning_rate": 7.658207678339202e-06, "epoch": 0.8247031938019063, "percentage": 82.47, "elapsed_time": "1 day, 11:01:12", "remaining_time": "7:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14797, "total_steps": 17941, "loss": 1.6168, "learning_rate": 7.653472592972188e-06, "epoch": 0.8247589320550694, "percentage": 82.48, "elapsed_time": "1 day, 11:01:20", "remaining_time": "7:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14798, "total_steps": 17941, "loss": 1.5265, "learning_rate": 7.648738850590137e-06, "epoch": 0.8248146703082325, "percentage": 82.48, "elapsed_time": "1 day, 11:01:29", "remaining_time": "7:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14799, "total_steps": 17941, "loss": 1.774, "learning_rate": 7.644006451343156e-06, "epoch": 0.8248704085613957, "percentage": 82.49, "elapsed_time": "1 day, 11:01:37", "remaining_time": "7:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14800, "total_steps": 17941, "loss": 1.5918, "learning_rate": 7.639275395381324e-06, "epoch": 0.8249261468145588, "percentage": 82.49, "elapsed_time": "1 day, 11:01:46", "remaining_time": "7:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14801, "total_steps": 17941, "loss": 1.5562, "learning_rate": 7.63454568285472e-06, "epoch": 0.824981885067722, "percentage": 82.5, "elapsed_time": "1 day, 11:01:54", "remaining_time": "7:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14802, "total_steps": 17941, "loss": 1.6387, "learning_rate": 7.629817313913306e-06, "epoch": 0.8250376233208851, "percentage": 82.5, "elapsed_time": "1 day, 11:02:03", "remaining_time": "7:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14803, "total_steps": 17941, "loss": 1.5421, "learning_rate": 7.625090288707054e-06, "epoch": 0.8250933615740482, "percentage": 82.51, "elapsed_time": "1 day, 11:02:11", "remaining_time": "7:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14804, "total_steps": 17941, "loss": 1.6407, "learning_rate": 7.620364607385877e-06, "epoch": 0.8251490998272114, "percentage": 82.51, "elapsed_time": "1 day, 11:02:20", "remaining_time": "7:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14805, "total_steps": 17941, "loss": 1.7231, "learning_rate": 7.61564027009965e-06, "epoch": 0.8252048380803746, "percentage": 82.52, "elapsed_time": "1 day, 11:02:28", "remaining_time": "7:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14806, "total_steps": 17941, "loss": 1.4615, "learning_rate": 7.610917276998192e-06, "epoch": 0.8252605763335377, "percentage": 82.53, "elapsed_time": "1 day, 11:02:37", "remaining_time": "7:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14807, "total_steps": 17941, "loss": 1.6183, "learning_rate": 7.606195628231272e-06, "epoch": 0.8253163145867008, "percentage": 82.53, "elapsed_time": "1 day, 11:02:45", "remaining_time": "7:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14808, "total_steps": 17941, "loss": 1.4315, "learning_rate": 7.6014753239486815e-06, "epoch": 0.825372052839864, "percentage": 82.54, "elapsed_time": "1 day, 11:02:54", "remaining_time": "7:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14809, "total_steps": 17941, "loss": 1.7067, "learning_rate": 7.596756364300084e-06, "epoch": 0.8254277910930271, "percentage": 82.54, "elapsed_time": "1 day, 11:03:02", "remaining_time": "7:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14810, "total_steps": 17941, "loss": 1.7114, "learning_rate": 7.592038749435143e-06, "epoch": 0.8254835293461903, "percentage": 82.55, "elapsed_time": "1 day, 11:03:11", "remaining_time": "7:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14811, "total_steps": 17941, "loss": 1.5799, "learning_rate": 7.587322479503478e-06, "epoch": 0.8255392675993535, "percentage": 82.55, "elapsed_time": "1 day, 11:03:19", "remaining_time": "7:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14812, "total_steps": 17941, "loss": 1.6757, "learning_rate": 7.582607554654669e-06, "epoch": 0.8255950058525166, "percentage": 82.56, "elapsed_time": "1 day, 11:03:29", "remaining_time": "7:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14813, "total_steps": 17941, "loss": 1.6212, "learning_rate": 7.577893975038231e-06, "epoch": 0.8256507441056797, "percentage": 82.57, "elapsed_time": "1 day, 11:03:37", "remaining_time": "7:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14814, "total_steps": 17941, "loss": 1.5161, "learning_rate": 7.573181740803659e-06, "epoch": 0.8257064823588429, "percentage": 82.57, "elapsed_time": "1 day, 11:03:46", "remaining_time": "7:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14815, "total_steps": 17941, "loss": 1.2616, "learning_rate": 7.568470852100396e-06, "epoch": 0.825762220612006, "percentage": 82.58, "elapsed_time": "1 day, 11:03:54", "remaining_time": "7:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14816, "total_steps": 17941, "loss": 1.7431, "learning_rate": 7.563761309077838e-06, "epoch": 0.8258179588651692, "percentage": 82.58, "elapsed_time": "1 day, 11:04:02", "remaining_time": "7:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14817, "total_steps": 17941, "loss": 1.5336, "learning_rate": 7.559053111885372e-06, "epoch": 0.8258736971183324, "percentage": 82.59, "elapsed_time": "1 day, 11:04:11", "remaining_time": "7:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14818, "total_steps": 17941, "loss": 1.5636, "learning_rate": 7.5543462606722624e-06, "epoch": 0.8259294353714954, "percentage": 82.59, "elapsed_time": "1 day, 11:04:19", "remaining_time": "7:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14819, "total_steps": 17941, "loss": 1.6993, "learning_rate": 7.5496407555878276e-06, "epoch": 0.8259851736246586, "percentage": 82.6, "elapsed_time": "1 day, 11:04:28", "remaining_time": "7:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14820, "total_steps": 17941, "loss": 1.4985, "learning_rate": 7.544936596781299e-06, "epoch": 0.8260409118778218, "percentage": 82.6, "elapsed_time": "1 day, 11:04:36", "remaining_time": "7:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14821, "total_steps": 17941, "loss": 1.4959, "learning_rate": 7.54023378440184e-06, "epoch": 0.8260966501309849, "percentage": 82.61, "elapsed_time": "1 day, 11:04:45", "remaining_time": "7:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14822, "total_steps": 17941, "loss": 1.5709, "learning_rate": 7.535532318598609e-06, "epoch": 0.8261523883841481, "percentage": 82.62, "elapsed_time": "1 day, 11:04:53", "remaining_time": "7:22:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14823, "total_steps": 17941, "loss": 1.8395, "learning_rate": 7.530832199520705e-06, "epoch": 0.8262081266373111, "percentage": 82.62, "elapsed_time": "1 day, 11:05:02", "remaining_time": "7:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14824, "total_steps": 17941, "loss": 1.7728, "learning_rate": 7.5261334273172e-06, "epoch": 0.8262638648904743, "percentage": 82.63, "elapsed_time": "1 day, 11:05:10", "remaining_time": "7:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14825, "total_steps": 17941, "loss": 1.6189, "learning_rate": 7.5214360021371e-06, "epoch": 0.8263196031436375, "percentage": 82.63, "elapsed_time": "1 day, 11:05:19", "remaining_time": "7:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14826, "total_steps": 17941, "loss": 1.4719, "learning_rate": 7.516739924129362e-06, "epoch": 0.8263753413968006, "percentage": 82.64, "elapsed_time": "1 day, 11:05:27", "remaining_time": "7:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14827, "total_steps": 17941, "loss": 1.6933, "learning_rate": 7.512045193442968e-06, "epoch": 0.8264310796499638, "percentage": 82.64, "elapsed_time": "1 day, 11:05:36", "remaining_time": "7:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14828, "total_steps": 17941, "loss": 1.9048, "learning_rate": 7.507351810226765e-06, "epoch": 0.826486817903127, "percentage": 82.65, "elapsed_time": "1 day, 11:05:44", "remaining_time": "7:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14829, "total_steps": 17941, "loss": 1.6225, "learning_rate": 7.502659774629612e-06, "epoch": 0.82654255615629, "percentage": 82.65, "elapsed_time": "1 day, 11:05:53", "remaining_time": "7:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14830, "total_steps": 17941, "loss": 1.6123, "learning_rate": 7.4979690868003165e-06, "epoch": 0.8265982944094532, "percentage": 82.66, "elapsed_time": "1 day, 11:06:01", "remaining_time": "7:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14831, "total_steps": 17941, "loss": 1.5044, "learning_rate": 7.493279746887649e-06, "epoch": 0.8266540326626164, "percentage": 82.67, "elapsed_time": "1 day, 11:06:10", "remaining_time": "7:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14832, "total_steps": 17941, "loss": 1.4167, "learning_rate": 7.488591755040303e-06, "epoch": 0.8267097709157795, "percentage": 82.67, "elapsed_time": "1 day, 11:06:18", "remaining_time": "7:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14833, "total_steps": 17941, "loss": 1.565, "learning_rate": 7.483905111406958e-06, "epoch": 0.8267655091689426, "percentage": 82.68, "elapsed_time": "1 day, 11:06:27", "remaining_time": "7:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14834, "total_steps": 17941, "loss": 1.503, "learning_rate": 7.479219816136279e-06, "epoch": 0.8268212474221058, "percentage": 82.68, "elapsed_time": "1 day, 11:06:35", "remaining_time": "7:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14835, "total_steps": 17941, "loss": 1.4863, "learning_rate": 7.474535869376819e-06, "epoch": 0.8268769856752689, "percentage": 82.69, "elapsed_time": "1 day, 11:06:43", "remaining_time": "7:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14836, "total_steps": 17941, "loss": 1.5387, "learning_rate": 7.46985327127715e-06, "epoch": 0.8269327239284321, "percentage": 82.69, "elapsed_time": "1 day, 11:06:52", "remaining_time": "7:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14837, "total_steps": 17941, "loss": 1.6446, "learning_rate": 7.465172021985761e-06, "epoch": 0.8269884621815953, "percentage": 82.7, "elapsed_time": "1 day, 11:07:00", "remaining_time": "7:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14838, "total_steps": 17941, "loss": 1.3285, "learning_rate": 7.46049212165113e-06, "epoch": 0.8270442004347583, "percentage": 82.7, "elapsed_time": "1 day, 11:07:09", "remaining_time": "7:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14839, "total_steps": 17941, "loss": 1.6796, "learning_rate": 7.45581357042166e-06, "epoch": 0.8270999386879215, "percentage": 82.71, "elapsed_time": "1 day, 11:07:18", "remaining_time": "7:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14840, "total_steps": 17941, "loss": 1.513, "learning_rate": 7.451136368445727e-06, "epoch": 0.8271556769410847, "percentage": 82.72, "elapsed_time": "1 day, 11:07:26", "remaining_time": "7:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14841, "total_steps": 17941, "loss": 1.4862, "learning_rate": 7.446460515871678e-06, "epoch": 0.8272114151942478, "percentage": 82.72, "elapsed_time": "1 day, 11:07:35", "remaining_time": "7:20:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14842, "total_steps": 17941, "loss": 1.6166, "learning_rate": 7.441786012847795e-06, "epoch": 0.827267153447411, "percentage": 82.73, "elapsed_time": "1 day, 11:07:43", "remaining_time": "7:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14843, "total_steps": 17941, "loss": 1.7089, "learning_rate": 7.437112859522339e-06, "epoch": 0.8273228917005742, "percentage": 82.73, "elapsed_time": "1 day, 11:07:52", "remaining_time": "7:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14844, "total_steps": 17941, "loss": 1.6842, "learning_rate": 7.4324410560434825e-06, "epoch": 0.8273786299537372, "percentage": 82.74, "elapsed_time": "1 day, 11:08:01", "remaining_time": "7:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14845, "total_steps": 17941, "loss": 1.7236, "learning_rate": 7.42777060255942e-06, "epoch": 0.8274343682069004, "percentage": 82.74, "elapsed_time": "1 day, 11:08:09", "remaining_time": "7:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14846, "total_steps": 17941, "loss": 1.7382, "learning_rate": 7.423101499218272e-06, "epoch": 0.8274901064600635, "percentage": 82.75, "elapsed_time": "1 day, 11:08:18", "remaining_time": "7:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14847, "total_steps": 17941, "loss": 1.5124, "learning_rate": 7.4184337461680905e-06, "epoch": 0.8275458447132267, "percentage": 82.75, "elapsed_time": "1 day, 11:08:26", "remaining_time": "7:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14848, "total_steps": 17941, "loss": 1.5824, "learning_rate": 7.4137673435569266e-06, "epoch": 0.8276015829663899, "percentage": 82.76, "elapsed_time": "1 day, 11:08:35", "remaining_time": "7:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14849, "total_steps": 17941, "loss": 1.5791, "learning_rate": 7.409102291532766e-06, "epoch": 0.8276573212195529, "percentage": 82.77, "elapsed_time": "1 day, 11:08:43", "remaining_time": "7:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14850, "total_steps": 17941, "loss": 1.69, "learning_rate": 7.404438590243568e-06, "epoch": 0.8277130594727161, "percentage": 82.77, "elapsed_time": "1 day, 11:08:51", "remaining_time": "7:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14851, "total_steps": 17941, "loss": 1.9097, "learning_rate": 7.399776239837208e-06, "epoch": 0.8277687977258793, "percentage": 82.78, "elapsed_time": "1 day, 11:09:00", "remaining_time": "7:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14852, "total_steps": 17941, "loss": 1.6214, "learning_rate": 7.395115240461581e-06, "epoch": 0.8278245359790424, "percentage": 82.78, "elapsed_time": "1 day, 11:09:08", "remaining_time": "7:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14853, "total_steps": 17941, "loss": 1.8655, "learning_rate": 7.390455592264506e-06, "epoch": 0.8278802742322056, "percentage": 82.79, "elapsed_time": "1 day, 11:09:17", "remaining_time": "7:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14854, "total_steps": 17941, "loss": 1.6002, "learning_rate": 7.385797295393732e-06, "epoch": 0.8279360124853687, "percentage": 82.79, "elapsed_time": "1 day, 11:09:25", "remaining_time": "7:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14855, "total_steps": 17941, "loss": 1.7274, "learning_rate": 7.381140349997018e-06, "epoch": 0.8279917507385318, "percentage": 82.8, "elapsed_time": "1 day, 11:09:34", "remaining_time": "7:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14856, "total_steps": 17941, "loss": 1.8171, "learning_rate": 7.376484756222041e-06, "epoch": 0.828047488991695, "percentage": 82.8, "elapsed_time": "1 day, 11:09:42", "remaining_time": "7:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14857, "total_steps": 17941, "loss": 1.6465, "learning_rate": 7.371830514216471e-06, "epoch": 0.8281032272448582, "percentage": 82.81, "elapsed_time": "1 day, 11:09:51", "remaining_time": "7:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14858, "total_steps": 17941, "loss": 1.5607, "learning_rate": 7.3671776241278856e-06, "epoch": 0.8281589654980213, "percentage": 82.82, "elapsed_time": "1 day, 11:09:59", "remaining_time": "7:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14859, "total_steps": 17941, "loss": 1.7207, "learning_rate": 7.362526086103844e-06, "epoch": 0.8282147037511844, "percentage": 82.82, "elapsed_time": "1 day, 11:10:08", "remaining_time": "7:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14860, "total_steps": 17941, "loss": 1.5266, "learning_rate": 7.357875900291905e-06, "epoch": 0.8282704420043476, "percentage": 82.83, "elapsed_time": "1 day, 11:10:16", "remaining_time": "7:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14861, "total_steps": 17941, "loss": 1.6808, "learning_rate": 7.353227066839513e-06, "epoch": 0.8283261802575107, "percentage": 82.83, "elapsed_time": "1 day, 11:10:25", "remaining_time": "7:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14862, "total_steps": 17941, "loss": 1.5349, "learning_rate": 7.348579585894111e-06, "epoch": 0.8283819185106739, "percentage": 82.84, "elapsed_time": "1 day, 11:10:34", "remaining_time": "7:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14863, "total_steps": 17941, "loss": 1.7059, "learning_rate": 7.3439334576030864e-06, "epoch": 0.8284376567638371, "percentage": 82.84, "elapsed_time": "1 day, 11:10:42", "remaining_time": "7:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14864, "total_steps": 17941, "loss": 1.7997, "learning_rate": 7.339288682113804e-06, "epoch": 0.8284933950170001, "percentage": 82.85, "elapsed_time": "1 day, 11:10:51", "remaining_time": "7:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14865, "total_steps": 17941, "loss": 1.4615, "learning_rate": 7.334645259573541e-06, "epoch": 0.8285491332701633, "percentage": 82.85, "elapsed_time": "1 day, 11:10:59", "remaining_time": "7:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14866, "total_steps": 17941, "loss": 1.6691, "learning_rate": 7.330003190129575e-06, "epoch": 0.8286048715233265, "percentage": 82.86, "elapsed_time": "1 day, 11:11:08", "remaining_time": "7:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14867, "total_steps": 17941, "loss": 1.6924, "learning_rate": 7.325362473929126e-06, "epoch": 0.8286606097764896, "percentage": 82.87, "elapsed_time": "1 day, 11:11:16", "remaining_time": "7:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14868, "total_steps": 17941, "loss": 1.8302, "learning_rate": 7.320723111119371e-06, "epoch": 0.8287163480296528, "percentage": 82.87, "elapsed_time": "1 day, 11:11:25", "remaining_time": "7:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14869, "total_steps": 17941, "loss": 1.5856, "learning_rate": 7.316085101847453e-06, "epoch": 0.8287720862828158, "percentage": 82.88, "elapsed_time": "1 day, 11:11:33", "remaining_time": "7:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14870, "total_steps": 17941, "loss": 1.5342, "learning_rate": 7.311448446260422e-06, "epoch": 0.828827824535979, "percentage": 82.88, "elapsed_time": "1 day, 11:11:42", "remaining_time": "7:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14871, "total_steps": 17941, "loss": 1.4847, "learning_rate": 7.306813144505381e-06, "epoch": 0.8288835627891422, "percentage": 82.89, "elapsed_time": "1 day, 11:11:51", "remaining_time": "7:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14872, "total_steps": 17941, "loss": 1.8871, "learning_rate": 7.3021791967292976e-06, "epoch": 0.8289393010423053, "percentage": 82.89, "elapsed_time": "1 day, 11:11:59", "remaining_time": "7:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14873, "total_steps": 17941, "loss": 1.5112, "learning_rate": 7.297546603079147e-06, "epoch": 0.8289950392954685, "percentage": 82.9, "elapsed_time": "1 day, 11:12:07", "remaining_time": "7:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14874, "total_steps": 17941, "loss": 1.2755, "learning_rate": 7.292915363701841e-06, "epoch": 0.8290507775486317, "percentage": 82.91, "elapsed_time": "1 day, 11:12:16", "remaining_time": "7:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14875, "total_steps": 17941, "loss": 1.5412, "learning_rate": 7.288285478744261e-06, "epoch": 0.8291065158017947, "percentage": 82.91, "elapsed_time": "1 day, 11:12:24", "remaining_time": "7:15:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14876, "total_steps": 17941, "loss": 1.7214, "learning_rate": 7.283656948353251e-06, "epoch": 0.8291622540549579, "percentage": 82.92, "elapsed_time": "1 day, 11:12:33", "remaining_time": "7:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14877, "total_steps": 17941, "loss": 1.9109, "learning_rate": 7.2790297726755716e-06, "epoch": 0.8292179923081211, "percentage": 82.92, "elapsed_time": "1 day, 11:12:41", "remaining_time": "7:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14878, "total_steps": 17941, "loss": 1.5359, "learning_rate": 7.274403951857994e-06, "epoch": 0.8292737305612842, "percentage": 82.93, "elapsed_time": "1 day, 11:12:50", "remaining_time": "7:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14879, "total_steps": 17941, "loss": 1.6992, "learning_rate": 7.2697794860472235e-06, "epoch": 0.8293294688144474, "percentage": 82.93, "elapsed_time": "1 day, 11:12:58", "remaining_time": "7:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14880, "total_steps": 17941, "loss": 1.6467, "learning_rate": 7.265156375389909e-06, "epoch": 0.8293852070676105, "percentage": 82.94, "elapsed_time": "1 day, 11:13:06", "remaining_time": "7:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14881, "total_steps": 17941, "loss": 1.7689, "learning_rate": 7.260534620032667e-06, "epoch": 0.8294409453207736, "percentage": 82.94, "elapsed_time": "1 day, 11:13:15", "remaining_time": "7:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14882, "total_steps": 17941, "loss": 1.7601, "learning_rate": 7.255914220122078e-06, "epoch": 0.8294966835739368, "percentage": 82.95, "elapsed_time": "1 day, 11:13:24", "remaining_time": "7:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14883, "total_steps": 17941, "loss": 1.731, "learning_rate": 7.25129517580469e-06, "epoch": 0.8295524218271, "percentage": 82.96, "elapsed_time": "1 day, 11:13:32", "remaining_time": "7:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14884, "total_steps": 17941, "loss": 1.6389, "learning_rate": 7.246677487226966e-06, "epoch": 0.8296081600802631, "percentage": 82.96, "elapsed_time": "1 day, 11:13:41", "remaining_time": "7:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14885, "total_steps": 17941, "loss": 1.6421, "learning_rate": 7.242061154535346e-06, "epoch": 0.8296638983334262, "percentage": 82.97, "elapsed_time": "1 day, 11:13:49", "remaining_time": "7:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14886, "total_steps": 17941, "loss": 1.4844, "learning_rate": 7.237446177876278e-06, "epoch": 0.8297196365865894, "percentage": 82.97, "elapsed_time": "1 day, 11:13:58", "remaining_time": "7:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14887, "total_steps": 17941, "loss": 1.478, "learning_rate": 7.23283255739608e-06, "epoch": 0.8297753748397525, "percentage": 82.98, "elapsed_time": "1 day, 11:14:06", "remaining_time": "7:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14888, "total_steps": 17941, "loss": 1.7255, "learning_rate": 7.228220293241084e-06, "epoch": 0.8298311130929157, "percentage": 82.98, "elapsed_time": "1 day, 11:14:15", "remaining_time": "7:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14889, "total_steps": 17941, "loss": 1.4374, "learning_rate": 7.223609385557567e-06, "epoch": 0.8298868513460789, "percentage": 82.99, "elapsed_time": "1 day, 11:14:23", "remaining_time": "7:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14890, "total_steps": 17941, "loss": 1.5534, "learning_rate": 7.2189998344917635e-06, "epoch": 0.8299425895992419, "percentage": 82.99, "elapsed_time": "1 day, 11:14:32", "remaining_time": "7:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14891, "total_steps": 17941, "loss": 1.683, "learning_rate": 7.214391640189844e-06, "epoch": 0.8299983278524051, "percentage": 83.0, "elapsed_time": "1 day, 11:14:41", "remaining_time": "7:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14892, "total_steps": 17941, "loss": 1.6317, "learning_rate": 7.209784802797964e-06, "epoch": 0.8300540661055682, "percentage": 83.01, "elapsed_time": "1 day, 11:14:50", "remaining_time": "7:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14893, "total_steps": 17941, "loss": 1.8489, "learning_rate": 7.20517932246223e-06, "epoch": 0.8301098043587314, "percentage": 83.01, "elapsed_time": "1 day, 11:14:59", "remaining_time": "7:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14894, "total_steps": 17941, "loss": 1.6475, "learning_rate": 7.200575199328691e-06, "epoch": 0.8301655426118946, "percentage": 83.02, "elapsed_time": "1 day, 11:15:08", "remaining_time": "7:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14895, "total_steps": 17941, "loss": 1.5613, "learning_rate": 7.195972433543386e-06, "epoch": 0.8302212808650576, "percentage": 83.02, "elapsed_time": "1 day, 11:15:17", "remaining_time": "7:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14896, "total_steps": 17941, "loss": 1.5859, "learning_rate": 7.191371025252242e-06, "epoch": 0.8302770191182208, "percentage": 83.03, "elapsed_time": "1 day, 11:15:25", "remaining_time": "7:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14897, "total_steps": 17941, "loss": 1.7449, "learning_rate": 7.186770974601242e-06, "epoch": 0.830332757371384, "percentage": 83.03, "elapsed_time": "1 day, 11:15:34", "remaining_time": "7:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14898, "total_steps": 17941, "loss": 1.6864, "learning_rate": 7.182172281736244e-06, "epoch": 0.8303884956245471, "percentage": 83.04, "elapsed_time": "1 day, 11:15:42", "remaining_time": "7:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14899, "total_steps": 17941, "loss": 1.752, "learning_rate": 7.177574946803084e-06, "epoch": 0.8304442338777103, "percentage": 83.04, "elapsed_time": "1 day, 11:15:51", "remaining_time": "7:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14900, "total_steps": 17941, "loss": 1.5253, "learning_rate": 7.172978969947586e-06, "epoch": 0.8304999721308735, "percentage": 83.05, "elapsed_time": "1 day, 11:16:00", "remaining_time": "7:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14901, "total_steps": 17941, "loss": 1.7083, "learning_rate": 7.168384351315488e-06, "epoch": 0.8305557103840365, "percentage": 83.06, "elapsed_time": "1 day, 11:16:09", "remaining_time": "7:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14902, "total_steps": 17941, "loss": 1.5918, "learning_rate": 7.163791091052524e-06, "epoch": 0.8306114486371997, "percentage": 83.06, "elapsed_time": "1 day, 11:16:17", "remaining_time": "7:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14903, "total_steps": 17941, "loss": 1.673, "learning_rate": 7.1591991893043384e-06, "epoch": 0.8306671868903629, "percentage": 83.07, "elapsed_time": "1 day, 11:16:26", "remaining_time": "7:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14904, "total_steps": 17941, "loss": 1.837, "learning_rate": 7.1546086462165816e-06, "epoch": 0.830722925143526, "percentage": 83.07, "elapsed_time": "1 day, 11:16:34", "remaining_time": "7:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14905, "total_steps": 17941, "loss": 1.7407, "learning_rate": 7.150019461934843e-06, "epoch": 0.8307786633966892, "percentage": 83.08, "elapsed_time": "1 day, 11:16:43", "remaining_time": "7:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14906, "total_steps": 17941, "loss": 1.4998, "learning_rate": 7.145431636604644e-06, "epoch": 0.8308344016498523, "percentage": 83.08, "elapsed_time": "1 day, 11:16:51", "remaining_time": "7:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14907, "total_steps": 17941, "loss": 1.5029, "learning_rate": 7.140845170371496e-06, "epoch": 0.8308901399030154, "percentage": 83.09, "elapsed_time": "1 day, 11:17:00", "remaining_time": "7:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14908, "total_steps": 17941, "loss": 1.5846, "learning_rate": 7.136260063380851e-06, "epoch": 0.8309458781561786, "percentage": 83.09, "elapsed_time": "1 day, 11:17:08", "remaining_time": "7:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14909, "total_steps": 17941, "loss": 1.749, "learning_rate": 7.131676315778135e-06, "epoch": 0.8310016164093418, "percentage": 83.1, "elapsed_time": "1 day, 11:17:17", "remaining_time": "7:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14910, "total_steps": 17941, "loss": 1.6114, "learning_rate": 7.1270939277087e-06, "epoch": 0.8310573546625049, "percentage": 83.11, "elapsed_time": "1 day, 11:17:25", "remaining_time": "7:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14911, "total_steps": 17941, "loss": 1.7493, "learning_rate": 7.122512899317862e-06, "epoch": 0.831113092915668, "percentage": 83.11, "elapsed_time": "1 day, 11:17:33", "remaining_time": "7:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14912, "total_steps": 17941, "loss": 1.5338, "learning_rate": 7.11793323075095e-06, "epoch": 0.8311688311688312, "percentage": 83.12, "elapsed_time": "1 day, 11:17:42", "remaining_time": "7:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14913, "total_steps": 17941, "loss": 1.6078, "learning_rate": 7.113354922153159e-06, "epoch": 0.8312245694219943, "percentage": 83.12, "elapsed_time": "1 day, 11:17:51", "remaining_time": "7:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14914, "total_steps": 17941, "loss": 1.8323, "learning_rate": 7.108777973669706e-06, "epoch": 0.8312803076751575, "percentage": 83.13, "elapsed_time": "1 day, 11:17:59", "remaining_time": "7:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14915, "total_steps": 17941, "loss": 1.6329, "learning_rate": 7.104202385445741e-06, "epoch": 0.8313360459283206, "percentage": 83.13, "elapsed_time": "1 day, 11:18:08", "remaining_time": "7:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14916, "total_steps": 17941, "loss": 1.5872, "learning_rate": 7.099628157626392e-06, "epoch": 0.8313917841814837, "percentage": 83.14, "elapsed_time": "1 day, 11:18:17", "remaining_time": "7:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14917, "total_steps": 17941, "loss": 1.6175, "learning_rate": 7.095055290356694e-06, "epoch": 0.8314475224346469, "percentage": 83.14, "elapsed_time": "1 day, 11:18:26", "remaining_time": "7:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14918, "total_steps": 17941, "loss": 1.5957, "learning_rate": 7.090483783781693e-06, "epoch": 0.83150326068781, "percentage": 83.15, "elapsed_time": "1 day, 11:18:34", "remaining_time": "7:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14919, "total_steps": 17941, "loss": 1.3375, "learning_rate": 7.085913638046366e-06, "epoch": 0.8315589989409732, "percentage": 83.16, "elapsed_time": "1 day, 11:18:43", "remaining_time": "7:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14920, "total_steps": 17941, "loss": 1.6729, "learning_rate": 7.081344853295652e-06, "epoch": 0.8316147371941364, "percentage": 83.16, "elapsed_time": "1 day, 11:18:51", "remaining_time": "7:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14921, "total_steps": 17941, "loss": 1.5751, "learning_rate": 7.076777429674458e-06, "epoch": 0.8316704754472994, "percentage": 83.17, "elapsed_time": "1 day, 11:19:00", "remaining_time": "7:08:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14922, "total_steps": 17941, "loss": 1.6183, "learning_rate": 7.072211367327603e-06, "epoch": 0.8317262137004626, "percentage": 83.17, "elapsed_time": "1 day, 11:19:08", "remaining_time": "7:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14923, "total_steps": 17941, "loss": 1.5727, "learning_rate": 7.0676466663999355e-06, "epoch": 0.8317819519536258, "percentage": 83.18, "elapsed_time": "1 day, 11:19:17", "remaining_time": "7:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14924, "total_steps": 17941, "loss": 1.8146, "learning_rate": 7.063083327036191e-06, "epoch": 0.8318376902067889, "percentage": 83.18, "elapsed_time": "1 day, 11:19:25", "remaining_time": "7:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14925, "total_steps": 17941, "loss": 1.8472, "learning_rate": 7.058521349381109e-06, "epoch": 0.8318934284599521, "percentage": 83.19, "elapsed_time": "1 day, 11:19:34", "remaining_time": "7:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14926, "total_steps": 17941, "loss": 1.5908, "learning_rate": 7.0539607335793565e-06, "epoch": 0.8319491667131153, "percentage": 83.19, "elapsed_time": "1 day, 11:19:42", "remaining_time": "7:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14927, "total_steps": 17941, "loss": 1.7789, "learning_rate": 7.04940147977558e-06, "epoch": 0.8320049049662783, "percentage": 83.2, "elapsed_time": "1 day, 11:19:51", "remaining_time": "7:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14928, "total_steps": 17941, "loss": 1.7592, "learning_rate": 7.044843588114386e-06, "epoch": 0.8320606432194415, "percentage": 83.21, "elapsed_time": "1 day, 11:19:59", "remaining_time": "7:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14929, "total_steps": 17941, "loss": 1.8732, "learning_rate": 7.04028705874028e-06, "epoch": 0.8321163814726047, "percentage": 83.21, "elapsed_time": "1 day, 11:20:08", "remaining_time": "7:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14930, "total_steps": 17941, "loss": 1.7596, "learning_rate": 7.035731891797803e-06, "epoch": 0.8321721197257678, "percentage": 83.22, "elapsed_time": "1 day, 11:20:17", "remaining_time": "7:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14931, "total_steps": 17941, "loss": 1.738, "learning_rate": 7.031178087431428e-06, "epoch": 0.832227857978931, "percentage": 83.22, "elapsed_time": "1 day, 11:20:26", "remaining_time": "7:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14932, "total_steps": 17941, "loss": 1.5169, "learning_rate": 7.026625645785551e-06, "epoch": 0.8322835962320941, "percentage": 83.23, "elapsed_time": "1 day, 11:20:35", "remaining_time": "7:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14933, "total_steps": 17941, "loss": 1.7271, "learning_rate": 7.022074567004549e-06, "epoch": 0.8323393344852572, "percentage": 83.23, "elapsed_time": "1 day, 11:20:43", "remaining_time": "7:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14934, "total_steps": 17941, "loss": 1.6145, "learning_rate": 7.017524851232765e-06, "epoch": 0.8323950727384204, "percentage": 83.24, "elapsed_time": "1 day, 11:20:52", "remaining_time": "7:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14935, "total_steps": 17941, "loss": 1.6458, "learning_rate": 7.012976498614498e-06, "epoch": 0.8324508109915836, "percentage": 83.25, "elapsed_time": "1 day, 11:21:00", "remaining_time": "7:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14936, "total_steps": 17941, "loss": 1.5222, "learning_rate": 7.008429509293979e-06, "epoch": 0.8325065492447467, "percentage": 83.25, "elapsed_time": "1 day, 11:21:09", "remaining_time": "7:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14937, "total_steps": 17941, "loss": 1.6804, "learning_rate": 7.003883883415402e-06, "epoch": 0.8325622874979098, "percentage": 83.26, "elapsed_time": "1 day, 11:21:18", "remaining_time": "7:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14938, "total_steps": 17941, "loss": 1.4962, "learning_rate": 6.9993396211229635e-06, "epoch": 0.8326180257510729, "percentage": 83.26, "elapsed_time": "1 day, 11:21:26", "remaining_time": "7:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14939, "total_steps": 17941, "loss": 1.9543, "learning_rate": 6.994796722560754e-06, "epoch": 0.8326737640042361, "percentage": 83.27, "elapsed_time": "1 day, 11:21:35", "remaining_time": "7:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14940, "total_steps": 17941, "loss": 1.6622, "learning_rate": 6.990255187872851e-06, "epoch": 0.8327295022573993, "percentage": 83.27, "elapsed_time": "1 day, 11:21:43", "remaining_time": "7:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14941, "total_steps": 17941, "loss": 1.4973, "learning_rate": 6.985715017203293e-06, "epoch": 0.8327852405105624, "percentage": 83.28, "elapsed_time": "1 day, 11:21:52", "remaining_time": "7:06:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14942, "total_steps": 17941, "loss": 1.7641, "learning_rate": 6.981176210696077e-06, "epoch": 0.8328409787637255, "percentage": 83.28, "elapsed_time": "1 day, 11:22:00", "remaining_time": "7:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14943, "total_steps": 17941, "loss": 1.6925, "learning_rate": 6.97663876849512e-06, "epoch": 0.8328967170168887, "percentage": 83.29, "elapsed_time": "1 day, 11:22:09", "remaining_time": "7:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14944, "total_steps": 17941, "loss": 1.7473, "learning_rate": 6.972102690744325e-06, "epoch": 0.8329524552700518, "percentage": 83.3, "elapsed_time": "1 day, 11:22:17", "remaining_time": "7:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14945, "total_steps": 17941, "loss": 1.7243, "learning_rate": 6.967567977587586e-06, "epoch": 0.833008193523215, "percentage": 83.3, "elapsed_time": "1 day, 11:22:26", "remaining_time": "7:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14946, "total_steps": 17941, "loss": 1.4805, "learning_rate": 6.963034629168685e-06, "epoch": 0.8330639317763782, "percentage": 83.31, "elapsed_time": "1 day, 11:22:34", "remaining_time": "7:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14947, "total_steps": 17941, "loss": 0.9261, "learning_rate": 6.958502645631409e-06, "epoch": 0.8331196700295412, "percentage": 83.31, "elapsed_time": "1 day, 11:22:43", "remaining_time": "7:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14948, "total_steps": 17941, "loss": 1.5988, "learning_rate": 6.953972027119466e-06, "epoch": 0.8331754082827044, "percentage": 83.32, "elapsed_time": "1 day, 11:22:51", "remaining_time": "7:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14949, "total_steps": 17941, "loss": 1.399, "learning_rate": 6.949442773776571e-06, "epoch": 0.8332311465358676, "percentage": 83.32, "elapsed_time": "1 day, 11:23:00", "remaining_time": "7:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14950, "total_steps": 17941, "loss": 1.6314, "learning_rate": 6.944914885746334e-06, "epoch": 0.8332868847890307, "percentage": 83.33, "elapsed_time": "1 day, 11:23:08", "remaining_time": "7:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14951, "total_steps": 17941, "loss": 1.5388, "learning_rate": 6.940388363172373e-06, "epoch": 0.8333426230421939, "percentage": 83.33, "elapsed_time": "1 day, 11:23:17", "remaining_time": "7:04:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14952, "total_steps": 17941, "loss": 1.5226, "learning_rate": 6.93586320619824e-06, "epoch": 0.833398361295357, "percentage": 83.34, "elapsed_time": "1 day, 11:23:25", "remaining_time": "7:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14953, "total_steps": 17941, "loss": 1.4901, "learning_rate": 6.931339414967441e-06, "epoch": 0.8334540995485201, "percentage": 83.35, "elapsed_time": "1 day, 11:23:33", "remaining_time": "7:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14954, "total_steps": 17941, "loss": 1.5107, "learning_rate": 6.926816989623464e-06, "epoch": 0.8335098378016833, "percentage": 83.35, "elapsed_time": "1 day, 11:23:42", "remaining_time": "7:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14955, "total_steps": 17941, "loss": 1.5848, "learning_rate": 6.922295930309691e-06, "epoch": 0.8335655760548465, "percentage": 83.36, "elapsed_time": "1 day, 11:23:50", "remaining_time": "7:04:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14956, "total_steps": 17941, "loss": 1.5865, "learning_rate": 6.917776237169543e-06, "epoch": 0.8336213143080096, "percentage": 83.36, "elapsed_time": "1 day, 11:23:59", "remaining_time": "7:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14957, "total_steps": 17941, "loss": 1.6705, "learning_rate": 6.91325791034636e-06, "epoch": 0.8336770525611727, "percentage": 83.37, "elapsed_time": "1 day, 11:24:07", "remaining_time": "7:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14958, "total_steps": 17941, "loss": 1.5818, "learning_rate": 6.908740949983411e-06, "epoch": 0.8337327908143359, "percentage": 83.37, "elapsed_time": "1 day, 11:24:16", "remaining_time": "7:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14959, "total_steps": 17941, "loss": 1.6364, "learning_rate": 6.904225356223954e-06, "epoch": 0.833788529067499, "percentage": 83.38, "elapsed_time": "1 day, 11:24:24", "remaining_time": "7:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14960, "total_steps": 17941, "loss": 1.5349, "learning_rate": 6.899711129211206e-06, "epoch": 0.8338442673206622, "percentage": 83.38, "elapsed_time": "1 day, 11:24:32", "remaining_time": "7:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14961, "total_steps": 17941, "loss": 1.6409, "learning_rate": 6.895198269088343e-06, "epoch": 0.8339000055738253, "percentage": 83.39, "elapsed_time": "1 day, 11:24:41", "remaining_time": "7:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14962, "total_steps": 17941, "loss": 1.8578, "learning_rate": 6.890686775998462e-06, "epoch": 0.8339557438269884, "percentage": 83.4, "elapsed_time": "1 day, 11:24:49", "remaining_time": "7:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14963, "total_steps": 17941, "loss": 1.4316, "learning_rate": 6.8861766500846356e-06, "epoch": 0.8340114820801516, "percentage": 83.4, "elapsed_time": "1 day, 11:24:58", "remaining_time": "7:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14964, "total_steps": 17941, "loss": 1.6223, "learning_rate": 6.88166789148994e-06, "epoch": 0.8340672203333147, "percentage": 83.41, "elapsed_time": "1 day, 11:25:06", "remaining_time": "7:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14965, "total_steps": 17941, "loss": 1.5812, "learning_rate": 6.877160500357327e-06, "epoch": 0.8341229585864779, "percentage": 83.41, "elapsed_time": "1 day, 11:25:14", "remaining_time": "7:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14966, "total_steps": 17941, "loss": 1.6649, "learning_rate": 6.872654476829765e-06, "epoch": 0.8341786968396411, "percentage": 83.42, "elapsed_time": "1 day, 11:25:23", "remaining_time": "7:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14967, "total_steps": 17941, "loss": 1.6446, "learning_rate": 6.868149821050152e-06, "epoch": 0.8342344350928041, "percentage": 83.42, "elapsed_time": "1 day, 11:25:31", "remaining_time": "7:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14968, "total_steps": 17941, "loss": 1.702, "learning_rate": 6.8636465331613555e-06, "epoch": 0.8342901733459673, "percentage": 83.43, "elapsed_time": "1 day, 11:25:40", "remaining_time": "7:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14969, "total_steps": 17941, "loss": 1.8365, "learning_rate": 6.859144613306185e-06, "epoch": 0.8343459115991305, "percentage": 83.43, "elapsed_time": "1 day, 11:25:48", "remaining_time": "7:02:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14970, "total_steps": 17941, "loss": 1.6186, "learning_rate": 6.8546440616274024e-06, "epoch": 0.8344016498522936, "percentage": 83.44, "elapsed_time": "1 day, 11:25:57", "remaining_time": "7:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14971, "total_steps": 17941, "loss": 1.6608, "learning_rate": 6.850144878267784e-06, "epoch": 0.8344573881054568, "percentage": 83.45, "elapsed_time": "1 day, 11:26:05", "remaining_time": "7:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14972, "total_steps": 17941, "loss": 1.4615, "learning_rate": 6.84564706336997e-06, "epoch": 0.83451312635862, "percentage": 83.45, "elapsed_time": "1 day, 11:26:14", "remaining_time": "7:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14973, "total_steps": 17941, "loss": 1.7102, "learning_rate": 6.841150617076636e-06, "epoch": 0.834568864611783, "percentage": 83.46, "elapsed_time": "1 day, 11:26:22", "remaining_time": "7:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14974, "total_steps": 17941, "loss": 1.5415, "learning_rate": 6.836655539530351e-06, "epoch": 0.8346246028649462, "percentage": 83.46, "elapsed_time": "1 day, 11:26:30", "remaining_time": "7:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14975, "total_steps": 17941, "loss": 1.6088, "learning_rate": 6.832161830873718e-06, "epoch": 0.8346803411181094, "percentage": 83.47, "elapsed_time": "1 day, 11:26:39", "remaining_time": "7:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14976, "total_steps": 17941, "loss": 1.5481, "learning_rate": 6.827669491249211e-06, "epoch": 0.8347360793712725, "percentage": 83.47, "elapsed_time": "1 day, 11:26:47", "remaining_time": "7:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14977, "total_steps": 17941, "loss": 1.6031, "learning_rate": 6.823178520799317e-06, "epoch": 0.8347918176244357, "percentage": 83.48, "elapsed_time": "1 day, 11:26:56", "remaining_time": "7:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14978, "total_steps": 17941, "loss": 1.647, "learning_rate": 6.8186889196664605e-06, "epoch": 0.8348475558775988, "percentage": 83.48, "elapsed_time": "1 day, 11:27:04", "remaining_time": "7:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14979, "total_steps": 17941, "loss": 1.5902, "learning_rate": 6.814200687993028e-06, "epoch": 0.8349032941307619, "percentage": 83.49, "elapsed_time": "1 day, 11:27:13", "remaining_time": "7:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14980, "total_steps": 17941, "loss": 1.5765, "learning_rate": 6.809713825921371e-06, "epoch": 0.8349590323839251, "percentage": 83.5, "elapsed_time": "1 day, 11:27:21", "remaining_time": "7:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14981, "total_steps": 17941, "loss": 1.6666, "learning_rate": 6.80522833359375e-06, "epoch": 0.8350147706370883, "percentage": 83.5, "elapsed_time": "1 day, 11:27:29", "remaining_time": "7:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14982, "total_steps": 17941, "loss": 1.7652, "learning_rate": 6.800744211152454e-06, "epoch": 0.8350705088902514, "percentage": 83.51, "elapsed_time": "1 day, 11:27:38", "remaining_time": "7:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14983, "total_steps": 17941, "loss": 1.6158, "learning_rate": 6.796261458739695e-06, "epoch": 0.8351262471434145, "percentage": 83.51, "elapsed_time": "1 day, 11:27:47", "remaining_time": "7:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14984, "total_steps": 17941, "loss": 1.6253, "learning_rate": 6.791780076497617e-06, "epoch": 0.8351819853965776, "percentage": 83.52, "elapsed_time": "1 day, 11:27:55", "remaining_time": "6:59:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14985, "total_steps": 17941, "loss": 1.7899, "learning_rate": 6.787300064568353e-06, "epoch": 0.8352377236497408, "percentage": 83.52, "elapsed_time": "1 day, 11:28:04", "remaining_time": "6:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14986, "total_steps": 17941, "loss": 1.8485, "learning_rate": 6.7828214230939825e-06, "epoch": 0.835293461902904, "percentage": 83.53, "elapsed_time": "1 day, 11:28:12", "remaining_time": "6:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14987, "total_steps": 17941, "loss": 1.5262, "learning_rate": 6.778344152216553e-06, "epoch": 0.8353492001560671, "percentage": 83.53, "elapsed_time": "1 day, 11:28:21", "remaining_time": "6:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14988, "total_steps": 17941, "loss": 1.6569, "learning_rate": 6.7738682520780415e-06, "epoch": 0.8354049384092302, "percentage": 83.54, "elapsed_time": "1 day, 11:28:29", "remaining_time": "6:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14989, "total_steps": 17941, "loss": 1.7483, "learning_rate": 6.7693937228203885e-06, "epoch": 0.8354606766623934, "percentage": 83.55, "elapsed_time": "1 day, 11:28:38", "remaining_time": "6:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14990, "total_steps": 17941, "loss": 1.708, "learning_rate": 6.764920564585536e-06, "epoch": 0.8355164149155565, "percentage": 83.55, "elapsed_time": "1 day, 11:28:46", "remaining_time": "6:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14991, "total_steps": 17941, "loss": 1.9626, "learning_rate": 6.760448777515316e-06, "epoch": 0.8355721531687197, "percentage": 83.56, "elapsed_time": "1 day, 11:28:55", "remaining_time": "6:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14992, "total_steps": 17941, "loss": 1.2251, "learning_rate": 6.755978361751553e-06, "epoch": 0.8356278914218829, "percentage": 83.56, "elapsed_time": "1 day, 11:29:03", "remaining_time": "6:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14993, "total_steps": 17941, "loss": 1.7765, "learning_rate": 6.7515093174360275e-06, "epoch": 0.835683629675046, "percentage": 83.57, "elapsed_time": "1 day, 11:29:12", "remaining_time": "6:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14994, "total_steps": 17941, "loss": 1.777, "learning_rate": 6.7470416447104834e-06, "epoch": 0.8357393679282091, "percentage": 83.57, "elapsed_time": "1 day, 11:29:21", "remaining_time": "6:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14995, "total_steps": 17941, "loss": 1.695, "learning_rate": 6.742575343716584e-06, "epoch": 0.8357951061813723, "percentage": 83.58, "elapsed_time": "1 day, 11:29:29", "remaining_time": "6:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14996, "total_steps": 17941, "loss": 1.6019, "learning_rate": 6.738110414595977e-06, "epoch": 0.8358508444345354, "percentage": 83.59, "elapsed_time": "1 day, 11:29:38", "remaining_time": "6:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14997, "total_steps": 17941, "loss": 1.4083, "learning_rate": 6.733646857490294e-06, "epoch": 0.8359065826876986, "percentage": 83.59, "elapsed_time": "1 day, 11:29:46", "remaining_time": "6:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14998, "total_steps": 17941, "loss": 1.5974, "learning_rate": 6.729184672541061e-06, "epoch": 0.8359623209408618, "percentage": 83.6, "elapsed_time": "1 day, 11:29:55", "remaining_time": "6:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14999, "total_steps": 17941, "loss": 1.5756, "learning_rate": 6.7247238598898145e-06, "epoch": 0.8360180591940248, "percentage": 83.6, "elapsed_time": "1 day, 11:30:03", "remaining_time": "6:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15000, "total_steps": 17941, "loss": 1.8554, "learning_rate": 6.720264419677996e-06, "epoch": 0.836073797447188, "percentage": 83.61, "elapsed_time": "1 day, 11:30:12", "remaining_time": "6:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15001, "total_steps": 17941, "loss": 1.5994, "learning_rate": 6.715806352047072e-06, "epoch": 0.8361295357003512, "percentage": 83.61, "elapsed_time": "1 day, 11:30:21", "remaining_time": "6:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15002, "total_steps": 17941, "loss": 1.6864, "learning_rate": 6.711349657138394e-06, "epoch": 0.8361852739535143, "percentage": 83.62, "elapsed_time": "1 day, 11:30:30", "remaining_time": "6:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15003, "total_steps": 17941, "loss": 1.7365, "learning_rate": 6.706894335093311e-06, "epoch": 0.8362410122066775, "percentage": 83.62, "elapsed_time": "1 day, 11:30:38", "remaining_time": "6:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15004, "total_steps": 17941, "loss": 1.8279, "learning_rate": 6.702440386053127e-06, "epoch": 0.8362967504598406, "percentage": 83.63, "elapsed_time": "1 day, 11:30:47", "remaining_time": "6:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15005, "total_steps": 17941, "loss": 1.5776, "learning_rate": 6.697987810159095e-06, "epoch": 0.8363524887130037, "percentage": 83.64, "elapsed_time": "1 day, 11:30:55", "remaining_time": "6:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15006, "total_steps": 17941, "loss": 1.7631, "learning_rate": 6.6935366075524305e-06, "epoch": 0.8364082269661669, "percentage": 83.64, "elapsed_time": "1 day, 11:31:04", "remaining_time": "6:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15007, "total_steps": 17941, "loss": 1.757, "learning_rate": 6.689086778374265e-06, "epoch": 0.83646396521933, "percentage": 83.65, "elapsed_time": "1 day, 11:31:12", "remaining_time": "6:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15008, "total_steps": 17941, "loss": 1.5883, "learning_rate": 6.684638322765774e-06, "epoch": 0.8365197034724932, "percentage": 83.65, "elapsed_time": "1 day, 11:31:21", "remaining_time": "6:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15009, "total_steps": 17941, "loss": 1.5605, "learning_rate": 6.680191240867995e-06, "epoch": 0.8365754417256563, "percentage": 83.66, "elapsed_time": "1 day, 11:31:29", "remaining_time": "6:56:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15010, "total_steps": 17941, "loss": 1.2555, "learning_rate": 6.675745532821975e-06, "epoch": 0.8366311799788194, "percentage": 83.66, "elapsed_time": "1 day, 11:31:38", "remaining_time": "6:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15011, "total_steps": 17941, "loss": 1.7833, "learning_rate": 6.671301198768715e-06, "epoch": 0.8366869182319826, "percentage": 83.67, "elapsed_time": "1 day, 11:31:46", "remaining_time": "6:56:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15012, "total_steps": 17941, "loss": 1.4817, "learning_rate": 6.666858238849155e-06, "epoch": 0.8367426564851458, "percentage": 83.67, "elapsed_time": "1 day, 11:31:55", "remaining_time": "6:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15013, "total_steps": 17941, "loss": 1.8673, "learning_rate": 6.662416653204212e-06, "epoch": 0.8367983947383089, "percentage": 83.68, "elapsed_time": "1 day, 11:32:03", "remaining_time": "6:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15014, "total_steps": 17941, "loss": 1.5881, "learning_rate": 6.657976441974722e-06, "epoch": 0.836854132991472, "percentage": 83.69, "elapsed_time": "1 day, 11:32:12", "remaining_time": "6:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15015, "total_steps": 17941, "loss": 1.6088, "learning_rate": 6.653537605301513e-06, "epoch": 0.8369098712446352, "percentage": 83.69, "elapsed_time": "1 day, 11:32:21", "remaining_time": "6:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15016, "total_steps": 17941, "loss": 2.0219, "learning_rate": 6.6491001433253875e-06, "epoch": 0.8369656094977983, "percentage": 83.7, "elapsed_time": "1 day, 11:32:29", "remaining_time": "6:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15017, "total_steps": 17941, "loss": 1.6178, "learning_rate": 6.6446640561870335e-06, "epoch": 0.8370213477509615, "percentage": 83.7, "elapsed_time": "1 day, 11:32:38", "remaining_time": "6:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15018, "total_steps": 17941, "loss": 1.7283, "learning_rate": 6.64022934402716e-06, "epoch": 0.8370770860041247, "percentage": 83.71, "elapsed_time": "1 day, 11:32:46", "remaining_time": "6:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15019, "total_steps": 17941, "loss": 1.8185, "learning_rate": 6.635796006986411e-06, "epoch": 0.8371328242572877, "percentage": 83.71, "elapsed_time": "1 day, 11:32:55", "remaining_time": "6:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15020, "total_steps": 17941, "loss": 1.3608, "learning_rate": 6.631364045205391e-06, "epoch": 0.8371885625104509, "percentage": 83.72, "elapsed_time": "1 day, 11:33:04", "remaining_time": "6:54:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15021, "total_steps": 17941, "loss": 1.6448, "learning_rate": 6.62693345882463e-06, "epoch": 0.8372443007636141, "percentage": 83.72, "elapsed_time": "1 day, 11:33:13", "remaining_time": "6:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15022, "total_steps": 17941, "loss": 1.5787, "learning_rate": 6.622504247984651e-06, "epoch": 0.8373000390167772, "percentage": 83.73, "elapsed_time": "1 day, 11:33:22", "remaining_time": "6:54:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15023, "total_steps": 17941, "loss": 1.6616, "learning_rate": 6.618076412825952e-06, "epoch": 0.8373557772699404, "percentage": 83.74, "elapsed_time": "1 day, 11:33:30", "remaining_time": "6:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15024, "total_steps": 17941, "loss": 1.7556, "learning_rate": 6.613649953488921e-06, "epoch": 0.8374115155231036, "percentage": 83.74, "elapsed_time": "1 day, 11:33:39", "remaining_time": "6:54:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15025, "total_steps": 17941, "loss": 1.7979, "learning_rate": 6.6092248701139556e-06, "epoch": 0.8374672537762666, "percentage": 83.75, "elapsed_time": "1 day, 11:33:47", "remaining_time": "6:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15026, "total_steps": 17941, "loss": 1.3892, "learning_rate": 6.60480116284139e-06, "epoch": 0.8375229920294298, "percentage": 83.75, "elapsed_time": "1 day, 11:33:56", "remaining_time": "6:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15027, "total_steps": 17941, "loss": 1.554, "learning_rate": 6.6003788318115265e-06, "epoch": 0.837578730282593, "percentage": 83.76, "elapsed_time": "1 day, 11:34:04", "remaining_time": "6:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15028, "total_steps": 17941, "loss": 1.3891, "learning_rate": 6.595957877164604e-06, "epoch": 0.8376344685357561, "percentage": 83.76, "elapsed_time": "1 day, 11:34:13", "remaining_time": "6:53:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15029, "total_steps": 17941, "loss": 1.6932, "learning_rate": 6.591538299040833e-06, "epoch": 0.8376902067889193, "percentage": 83.77, "elapsed_time": "1 day, 11:34:21", "remaining_time": "6:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15030, "total_steps": 17941, "loss": 1.6175, "learning_rate": 6.587120097580379e-06, "epoch": 0.8377459450420823, "percentage": 83.77, "elapsed_time": "1 day, 11:34:29", "remaining_time": "6:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15031, "total_steps": 17941, "loss": 1.7834, "learning_rate": 6.582703272923363e-06, "epoch": 0.8378016832952455, "percentage": 83.78, "elapsed_time": "1 day, 11:34:38", "remaining_time": "6:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15032, "total_steps": 17941, "loss": 1.6085, "learning_rate": 6.578287825209866e-06, "epoch": 0.8378574215484087, "percentage": 83.79, "elapsed_time": "1 day, 11:34:46", "remaining_time": "6:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15033, "total_steps": 17941, "loss": 1.562, "learning_rate": 6.573873754579896e-06, "epoch": 0.8379131598015718, "percentage": 83.79, "elapsed_time": "1 day, 11:34:55", "remaining_time": "6:52:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15034, "total_steps": 17941, "loss": 1.7156, "learning_rate": 6.569461061173476e-06, "epoch": 0.837968898054735, "percentage": 83.8, "elapsed_time": "1 day, 11:35:04", "remaining_time": "6:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15035, "total_steps": 17941, "loss": 1.7941, "learning_rate": 6.5650497451305246e-06, "epoch": 0.8380246363078981, "percentage": 83.8, "elapsed_time": "1 day, 11:35:12", "remaining_time": "6:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15036, "total_steps": 17941, "loss": 1.5525, "learning_rate": 6.560639806590951e-06, "epoch": 0.8380803745610612, "percentage": 83.81, "elapsed_time": "1 day, 11:35:21", "remaining_time": "6:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15037, "total_steps": 17941, "loss": 1.8809, "learning_rate": 6.556231245694611e-06, "epoch": 0.8381361128142244, "percentage": 83.81, "elapsed_time": "1 day, 11:35:29", "remaining_time": "6:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15038, "total_steps": 17941, "loss": 1.7528, "learning_rate": 6.5518240625813246e-06, "epoch": 0.8381918510673876, "percentage": 83.82, "elapsed_time": "1 day, 11:35:37", "remaining_time": "6:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15039, "total_steps": 17941, "loss": 1.7202, "learning_rate": 6.547418257390869e-06, "epoch": 0.8382475893205507, "percentage": 83.82, "elapsed_time": "1 day, 11:35:46", "remaining_time": "6:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15040, "total_steps": 17941, "loss": 1.5567, "learning_rate": 6.543013830262951e-06, "epoch": 0.8383033275737138, "percentage": 83.83, "elapsed_time": "1 day, 11:35:54", "remaining_time": "6:51:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15041, "total_steps": 17941, "loss": 1.4171, "learning_rate": 6.538610781337246e-06, "epoch": 0.838359065826877, "percentage": 83.84, "elapsed_time": "1 day, 11:36:03", "remaining_time": "6:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15042, "total_steps": 17941, "loss": 1.5516, "learning_rate": 6.534209110753436e-06, "epoch": 0.8384148040800401, "percentage": 83.84, "elapsed_time": "1 day, 11:36:11", "remaining_time": "6:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15043, "total_steps": 17941, "loss": 1.5619, "learning_rate": 6.529808818651079e-06, "epoch": 0.8384705423332033, "percentage": 83.85, "elapsed_time": "1 day, 11:36:20", "remaining_time": "6:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15044, "total_steps": 17941, "loss": 1.5283, "learning_rate": 6.525409905169733e-06, "epoch": 0.8385262805863665, "percentage": 83.85, "elapsed_time": "1 day, 11:36:29", "remaining_time": "6:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15045, "total_steps": 17941, "loss": 1.6015, "learning_rate": 6.5210123704489144e-06, "epoch": 0.8385820188395295, "percentage": 83.86, "elapsed_time": "1 day, 11:36:38", "remaining_time": "6:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15046, "total_steps": 17941, "loss": 1.8035, "learning_rate": 6.516616214628096e-06, "epoch": 0.8386377570926927, "percentage": 83.86, "elapsed_time": "1 day, 11:36:46", "remaining_time": "6:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15047, "total_steps": 17941, "loss": 1.5109, "learning_rate": 6.512221437846672e-06, "epoch": 0.8386934953458559, "percentage": 83.87, "elapsed_time": "1 day, 11:36:55", "remaining_time": "6:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15048, "total_steps": 17941, "loss": 1.7845, "learning_rate": 6.507828040244018e-06, "epoch": 0.838749233599019, "percentage": 83.87, "elapsed_time": "1 day, 11:37:03", "remaining_time": "6:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15049, "total_steps": 17941, "loss": 1.625, "learning_rate": 6.503436021959508e-06, "epoch": 0.8388049718521822, "percentage": 83.88, "elapsed_time": "1 day, 11:37:12", "remaining_time": "6:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15050, "total_steps": 17941, "loss": 1.6112, "learning_rate": 6.499045383132396e-06, "epoch": 0.8388607101053454, "percentage": 83.89, "elapsed_time": "1 day, 11:37:20", "remaining_time": "6:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15051, "total_steps": 17941, "loss": 1.4907, "learning_rate": 6.494656123901932e-06, "epoch": 0.8389164483585084, "percentage": 83.89, "elapsed_time": "1 day, 11:37:29", "remaining_time": "6:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15052, "total_steps": 17941, "loss": 1.2179, "learning_rate": 6.490268244407321e-06, "epoch": 0.8389721866116716, "percentage": 83.9, "elapsed_time": "1 day, 11:37:37", "remaining_time": "6:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15053, "total_steps": 17941, "loss": 1.6479, "learning_rate": 6.485881744787736e-06, "epoch": 0.8390279248648347, "percentage": 83.9, "elapsed_time": "1 day, 11:37:46", "remaining_time": "6:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15054, "total_steps": 17941, "loss": 1.6279, "learning_rate": 6.481496625182271e-06, "epoch": 0.8390836631179979, "percentage": 83.91, "elapsed_time": "1 day, 11:37:54", "remaining_time": "6:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15055, "total_steps": 17941, "loss": 1.4366, "learning_rate": 6.477112885729997e-06, "epoch": 0.839139401371161, "percentage": 83.91, "elapsed_time": "1 day, 11:38:03", "remaining_time": "6:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15056, "total_steps": 17941, "loss": 1.4023, "learning_rate": 6.472730526569942e-06, "epoch": 0.8391951396243241, "percentage": 83.92, "elapsed_time": "1 day, 11:38:12", "remaining_time": "6:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15057, "total_steps": 17941, "loss": 1.6455, "learning_rate": 6.468349547841102e-06, "epoch": 0.8392508778774873, "percentage": 83.93, "elapsed_time": "1 day, 11:38:20", "remaining_time": "6:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15058, "total_steps": 17941, "loss": 1.7753, "learning_rate": 6.463969949682413e-06, "epoch": 0.8393066161306505, "percentage": 83.93, "elapsed_time": "1 day, 11:38:29", "remaining_time": "6:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15059, "total_steps": 17941, "loss": 1.7581, "learning_rate": 6.459591732232739e-06, "epoch": 0.8393623543838136, "percentage": 83.94, "elapsed_time": "1 day, 11:38:38", "remaining_time": "6:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15060, "total_steps": 17941, "loss": 1.6923, "learning_rate": 6.4552148956309845e-06, "epoch": 0.8394180926369768, "percentage": 83.94, "elapsed_time": "1 day, 11:38:46", "remaining_time": "6:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15061, "total_steps": 17941, "loss": 1.3142, "learning_rate": 6.450839440015921e-06, "epoch": 0.8394738308901399, "percentage": 83.95, "elapsed_time": "1 day, 11:38:55", "remaining_time": "6:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15062, "total_steps": 17941, "loss": 1.4404, "learning_rate": 6.446465365526316e-06, "epoch": 0.839529569143303, "percentage": 83.95, "elapsed_time": "1 day, 11:39:03", "remaining_time": "6:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15063, "total_steps": 17941, "loss": 1.5676, "learning_rate": 6.442092672300898e-06, "epoch": 0.8395853073964662, "percentage": 83.96, "elapsed_time": "1 day, 11:39:12", "remaining_time": "6:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15064, "total_steps": 17941, "loss": 1.6463, "learning_rate": 6.437721360478338e-06, "epoch": 0.8396410456496294, "percentage": 83.96, "elapsed_time": "1 day, 11:39:20", "remaining_time": "6:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15065, "total_steps": 17941, "loss": 1.6032, "learning_rate": 6.433351430197282e-06, "epoch": 0.8396967839027925, "percentage": 83.97, "elapsed_time": "1 day, 11:39:29", "remaining_time": "6:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15066, "total_steps": 17941, "loss": 1.7303, "learning_rate": 6.428982881596296e-06, "epoch": 0.8397525221559556, "percentage": 83.98, "elapsed_time": "1 day, 11:39:37", "remaining_time": "6:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15067, "total_steps": 17941, "loss": 1.771, "learning_rate": 6.42461571481393e-06, "epoch": 0.8398082604091188, "percentage": 83.98, "elapsed_time": "1 day, 11:39:45", "remaining_time": "6:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15068, "total_steps": 17941, "loss": 1.6365, "learning_rate": 6.420249929988709e-06, "epoch": 0.8398639986622819, "percentage": 83.99, "elapsed_time": "1 day, 11:39:54", "remaining_time": "6:48:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15069, "total_steps": 17941, "loss": 1.7606, "learning_rate": 6.415885527259064e-06, "epoch": 0.8399197369154451, "percentage": 83.99, "elapsed_time": "1 day, 11:40:02", "remaining_time": "6:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15070, "total_steps": 17941, "loss": 1.4675, "learning_rate": 6.411522506763412e-06, "epoch": 0.8399754751686083, "percentage": 84.0, "elapsed_time": "1 day, 11:40:11", "remaining_time": "6:47:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15071, "total_steps": 17941, "loss": 1.7661, "learning_rate": 6.407160868640133e-06, "epoch": 0.8400312134217713, "percentage": 84.0, "elapsed_time": "1 day, 11:40:19", "remaining_time": "6:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15072, "total_steps": 17941, "loss": 1.5774, "learning_rate": 6.402800613027554e-06, "epoch": 0.8400869516749345, "percentage": 84.01, "elapsed_time": "1 day, 11:40:28", "remaining_time": "6:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15073, "total_steps": 17941, "loss": 1.46, "learning_rate": 6.398441740063943e-06, "epoch": 0.8401426899280977, "percentage": 84.01, "elapsed_time": "1 day, 11:40:36", "remaining_time": "6:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15074, "total_steps": 17941, "loss": 1.5676, "learning_rate": 6.394084249887533e-06, "epoch": 0.8401984281812608, "percentage": 84.02, "elapsed_time": "1 day, 11:40:45", "remaining_time": "6:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15075, "total_steps": 17941, "loss": 1.5891, "learning_rate": 6.389728142636553e-06, "epoch": 0.840254166434424, "percentage": 84.03, "elapsed_time": "1 day, 11:40:53", "remaining_time": "6:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15076, "total_steps": 17941, "loss": 1.5158, "learning_rate": 6.3853734184491195e-06, "epoch": 0.840309904687587, "percentage": 84.03, "elapsed_time": "1 day, 11:41:01", "remaining_time": "6:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15077, "total_steps": 17941, "loss": 1.4915, "learning_rate": 6.381020077463351e-06, "epoch": 0.8403656429407502, "percentage": 84.04, "elapsed_time": "1 day, 11:41:10", "remaining_time": "6:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15078, "total_steps": 17941, "loss": 1.9049, "learning_rate": 6.376668119817308e-06, "epoch": 0.8404213811939134, "percentage": 84.04, "elapsed_time": "1 day, 11:41:18", "remaining_time": "6:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15079, "total_steps": 17941, "loss": 1.5713, "learning_rate": 6.37231754564902e-06, "epoch": 0.8404771194470765, "percentage": 84.05, "elapsed_time": "1 day, 11:41:27", "remaining_time": "6:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15080, "total_steps": 17941, "loss": 1.5207, "learning_rate": 6.367968355096449e-06, "epoch": 0.8405328577002397, "percentage": 84.05, "elapsed_time": "1 day, 11:41:35", "remaining_time": "6:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15081, "total_steps": 17941, "loss": 1.8841, "learning_rate": 6.363620548297522e-06, "epoch": 0.8405885959534029, "percentage": 84.06, "elapsed_time": "1 day, 11:41:44", "remaining_time": "6:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15082, "total_steps": 17941, "loss": 1.7406, "learning_rate": 6.359274125390135e-06, "epoch": 0.8406443342065659, "percentage": 84.06, "elapsed_time": "1 day, 11:41:52", "remaining_time": "6:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15083, "total_steps": 17941, "loss": 1.7603, "learning_rate": 6.3549290865121294e-06, "epoch": 0.8407000724597291, "percentage": 84.07, "elapsed_time": "1 day, 11:42:01", "remaining_time": "6:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15084, "total_steps": 17941, "loss": 1.5523, "learning_rate": 6.350585431801314e-06, "epoch": 0.8407558107128923, "percentage": 84.08, "elapsed_time": "1 day, 11:42:09", "remaining_time": "6:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15085, "total_steps": 17941, "loss": 1.5157, "learning_rate": 6.346243161395421e-06, "epoch": 0.8408115489660554, "percentage": 84.08, "elapsed_time": "1 day, 11:42:18", "remaining_time": "6:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15086, "total_steps": 17941, "loss": 1.685, "learning_rate": 6.341902275432188e-06, "epoch": 0.8408672872192186, "percentage": 84.09, "elapsed_time": "1 day, 11:42:26", "remaining_time": "6:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15087, "total_steps": 17941, "loss": 1.6276, "learning_rate": 6.337562774049266e-06, "epoch": 0.8409230254723817, "percentage": 84.09, "elapsed_time": "1 day, 11:42:35", "remaining_time": "6:45:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15088, "total_steps": 17941, "loss": 1.5399, "learning_rate": 6.333224657384279e-06, "epoch": 0.8409787637255448, "percentage": 84.1, "elapsed_time": "1 day, 11:42:43", "remaining_time": "6:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15089, "total_steps": 17941, "loss": 1.6095, "learning_rate": 6.328887925574812e-06, "epoch": 0.841034501978708, "percentage": 84.1, "elapsed_time": "1 day, 11:42:52", "remaining_time": "6:45:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15090, "total_steps": 17941, "loss": 1.6613, "learning_rate": 6.324552578758403e-06, "epoch": 0.8410902402318712, "percentage": 84.11, "elapsed_time": "1 day, 11:43:00", "remaining_time": "6:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15091, "total_steps": 17941, "loss": 1.8106, "learning_rate": 6.3202186170725485e-06, "epoch": 0.8411459784850343, "percentage": 84.11, "elapsed_time": "1 day, 11:43:09", "remaining_time": "6:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15092, "total_steps": 17941, "loss": 1.6608, "learning_rate": 6.315886040654679e-06, "epoch": 0.8412017167381974, "percentage": 84.12, "elapsed_time": "1 day, 11:43:17", "remaining_time": "6:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15093, "total_steps": 17941, "loss": 1.6227, "learning_rate": 6.311554849642198e-06, "epoch": 0.8412574549913606, "percentage": 84.13, "elapsed_time": "1 day, 11:43:25", "remaining_time": "6:44:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15094, "total_steps": 17941, "loss": 1.7769, "learning_rate": 6.307225044172493e-06, "epoch": 0.8413131932445237, "percentage": 84.13, "elapsed_time": "1 day, 11:43:34", "remaining_time": "6:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15095, "total_steps": 17941, "loss": 1.6509, "learning_rate": 6.302896624382859e-06, "epoch": 0.8413689314976869, "percentage": 84.14, "elapsed_time": "1 day, 11:43:42", "remaining_time": "6:44:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15096, "total_steps": 17941, "loss": 1.8361, "learning_rate": 6.298569590410569e-06, "epoch": 0.8414246697508501, "percentage": 84.14, "elapsed_time": "1 day, 11:43:51", "remaining_time": "6:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15097, "total_steps": 17941, "loss": 1.426, "learning_rate": 6.294243942392852e-06, "epoch": 0.8414804080040131, "percentage": 84.15, "elapsed_time": "1 day, 11:43:59", "remaining_time": "6:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15098, "total_steps": 17941, "loss": 1.6749, "learning_rate": 6.28991968046691e-06, "epoch": 0.8415361462571763, "percentage": 84.15, "elapsed_time": "1 day, 11:44:08", "remaining_time": "6:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15099, "total_steps": 17941, "loss": 1.442, "learning_rate": 6.285596804769856e-06, "epoch": 0.8415918845103394, "percentage": 84.16, "elapsed_time": "1 day, 11:44:16", "remaining_time": "6:43:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15100, "total_steps": 17941, "loss": 1.6696, "learning_rate": 6.281275315438784e-06, "epoch": 0.8416476227635026, "percentage": 84.16, "elapsed_time": "1 day, 11:44:25", "remaining_time": "6:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15101, "total_steps": 17941, "loss": 1.6203, "learning_rate": 6.276955212610785e-06, "epoch": 0.8417033610166658, "percentage": 84.17, "elapsed_time": "1 day, 11:44:33", "remaining_time": "6:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15102, "total_steps": 17941, "loss": 1.5446, "learning_rate": 6.272636496422835e-06, "epoch": 0.8417590992698288, "percentage": 84.18, "elapsed_time": "1 day, 11:44:42", "remaining_time": "6:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15103, "total_steps": 17941, "loss": 1.7728, "learning_rate": 6.2683191670119105e-06, "epoch": 0.841814837522992, "percentage": 84.18, "elapsed_time": "1 day, 11:44:50", "remaining_time": "6:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15104, "total_steps": 17941, "loss": 1.7175, "learning_rate": 6.264003224514925e-06, "epoch": 0.8418705757761552, "percentage": 84.19, "elapsed_time": "1 day, 11:44:58", "remaining_time": "6:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15105, "total_steps": 17941, "loss": 1.6456, "learning_rate": 6.259688669068764e-06, "epoch": 0.8419263140293183, "percentage": 84.19, "elapsed_time": "1 day, 11:45:07", "remaining_time": "6:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15106, "total_steps": 17941, "loss": 1.429, "learning_rate": 6.255375500810251e-06, "epoch": 0.8419820522824815, "percentage": 84.2, "elapsed_time": "1 day, 11:45:15", "remaining_time": "6:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15107, "total_steps": 17941, "loss": 1.4268, "learning_rate": 6.251063719876177e-06, "epoch": 0.8420377905356446, "percentage": 84.2, "elapsed_time": "1 day, 11:45:24", "remaining_time": "6:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15108, "total_steps": 17941, "loss": 1.6279, "learning_rate": 6.246753326403287e-06, "epoch": 0.8420935287888077, "percentage": 84.21, "elapsed_time": "1 day, 11:45:33", "remaining_time": "6:42:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15109, "total_steps": 17941, "loss": 1.5042, "learning_rate": 6.242444320528279e-06, "epoch": 0.8421492670419709, "percentage": 84.21, "elapsed_time": "1 day, 11:45:41", "remaining_time": "6:42:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15110, "total_steps": 17941, "loss": 1.6186, "learning_rate": 6.238136702387831e-06, "epoch": 0.8422050052951341, "percentage": 84.22, "elapsed_time": "1 day, 11:45:50", "remaining_time": "6:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15111, "total_steps": 17941, "loss": 1.5597, "learning_rate": 6.233830472118507e-06, "epoch": 0.8422607435482972, "percentage": 84.23, "elapsed_time": "1 day, 11:45:58", "remaining_time": "6:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15112, "total_steps": 17941, "loss": 1.5839, "learning_rate": 6.229525629856936e-06, "epoch": 0.8423164818014603, "percentage": 84.23, "elapsed_time": "1 day, 11:46:07", "remaining_time": "6:41:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15113, "total_steps": 17941, "loss": 1.5685, "learning_rate": 6.225222175739598e-06, "epoch": 0.8423722200546235, "percentage": 84.24, "elapsed_time": "1 day, 11:46:15", "remaining_time": "6:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15114, "total_steps": 17941, "loss": 1.7948, "learning_rate": 6.220920109902989e-06, "epoch": 0.8424279583077866, "percentage": 84.24, "elapsed_time": "1 day, 11:46:23", "remaining_time": "6:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15115, "total_steps": 17941, "loss": 1.5943, "learning_rate": 6.216619432483539e-06, "epoch": 0.8424836965609498, "percentage": 84.25, "elapsed_time": "1 day, 11:46:32", "remaining_time": "6:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15116, "total_steps": 17941, "loss": 1.6435, "learning_rate": 6.21232014361765e-06, "epoch": 0.842539434814113, "percentage": 84.25, "elapsed_time": "1 day, 11:46:40", "remaining_time": "6:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15117, "total_steps": 17941, "loss": 1.712, "learning_rate": 6.20802224344168e-06, "epoch": 0.842595173067276, "percentage": 84.26, "elapsed_time": "1 day, 11:46:49", "remaining_time": "6:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15118, "total_steps": 17941, "loss": 1.8713, "learning_rate": 6.203725732091891e-06, "epoch": 0.8426509113204392, "percentage": 84.27, "elapsed_time": "1 day, 11:46:57", "remaining_time": "6:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15119, "total_steps": 17941, "loss": 1.7247, "learning_rate": 6.199430609704598e-06, "epoch": 0.8427066495736024, "percentage": 84.27, "elapsed_time": "1 day, 11:47:06", "remaining_time": "6:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15120, "total_steps": 17941, "loss": 1.093, "learning_rate": 6.19513687641598e-06, "epoch": 0.8427623878267655, "percentage": 84.28, "elapsed_time": "1 day, 11:47:14", "remaining_time": "6:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15121, "total_steps": 17941, "loss": 1.6697, "learning_rate": 6.190844532362222e-06, "epoch": 0.8428181260799287, "percentage": 84.28, "elapsed_time": "1 day, 11:47:23", "remaining_time": "6:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15122, "total_steps": 17941, "loss": 1.6949, "learning_rate": 6.186553577679449e-06, "epoch": 0.8428738643330917, "percentage": 84.29, "elapsed_time": "1 day, 11:47:31", "remaining_time": "6:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15123, "total_steps": 17941, "loss": 1.8087, "learning_rate": 6.182264012503741e-06, "epoch": 0.8429296025862549, "percentage": 84.29, "elapsed_time": "1 day, 11:47:40", "remaining_time": "6:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15124, "total_steps": 17941, "loss": 1.6954, "learning_rate": 6.177975836971161e-06, "epoch": 0.8429853408394181, "percentage": 84.3, "elapsed_time": "1 day, 11:47:49", "remaining_time": "6:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15125, "total_steps": 17941, "loss": 1.6088, "learning_rate": 6.173689051217674e-06, "epoch": 0.8430410790925812, "percentage": 84.3, "elapsed_time": "1 day, 11:47:57", "remaining_time": "6:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15126, "total_steps": 17941, "loss": 1.5706, "learning_rate": 6.169403655379235e-06, "epoch": 0.8430968173457444, "percentage": 84.31, "elapsed_time": "1 day, 11:48:05", "remaining_time": "6:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15127, "total_steps": 17941, "loss": 1.4777, "learning_rate": 6.165119649591783e-06, "epoch": 0.8431525555989076, "percentage": 84.32, "elapsed_time": "1 day, 11:48:14", "remaining_time": "6:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15128, "total_steps": 17941, "loss": 1.676, "learning_rate": 6.160837033991152e-06, "epoch": 0.8432082938520706, "percentage": 84.32, "elapsed_time": "1 day, 11:48:22", "remaining_time": "6:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15129, "total_steps": 17941, "loss": 1.6371, "learning_rate": 6.156555808713166e-06, "epoch": 0.8432640321052338, "percentage": 84.33, "elapsed_time": "1 day, 11:48:31", "remaining_time": "6:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15130, "total_steps": 17941, "loss": 1.4938, "learning_rate": 6.1522759738936066e-06, "epoch": 0.843319770358397, "percentage": 84.33, "elapsed_time": "1 day, 11:48:39", "remaining_time": "6:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15131, "total_steps": 17941, "loss": 1.7965, "learning_rate": 6.147997529668214e-06, "epoch": 0.8433755086115601, "percentage": 84.34, "elapsed_time": "1 day, 11:48:48", "remaining_time": "6:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15132, "total_steps": 17941, "loss": 1.4601, "learning_rate": 6.143720476172654e-06, "epoch": 0.8434312468647233, "percentage": 84.34, "elapsed_time": "1 day, 11:48:57", "remaining_time": "6:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15133, "total_steps": 17941, "loss": 1.4532, "learning_rate": 6.139444813542583e-06, "epoch": 0.8434869851178864, "percentage": 84.35, "elapsed_time": "1 day, 11:49:05", "remaining_time": "6:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15134, "total_steps": 17941, "loss": 1.7473, "learning_rate": 6.135170541913599e-06, "epoch": 0.8435427233710495, "percentage": 84.35, "elapsed_time": "1 day, 11:49:14", "remaining_time": "6:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15135, "total_steps": 17941, "loss": 1.7668, "learning_rate": 6.130897661421248e-06, "epoch": 0.8435984616242127, "percentage": 84.36, "elapsed_time": "1 day, 11:49:22", "remaining_time": "6:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15136, "total_steps": 17941, "loss": 1.4973, "learning_rate": 6.1266261722010666e-06, "epoch": 0.8436541998773759, "percentage": 84.37, "elapsed_time": "1 day, 11:49:31", "remaining_time": "6:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15137, "total_steps": 17941, "loss": 1.4502, "learning_rate": 6.12235607438848e-06, "epoch": 0.843709938130539, "percentage": 84.37, "elapsed_time": "1 day, 11:49:39", "remaining_time": "6:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15138, "total_steps": 17941, "loss": 1.7002, "learning_rate": 6.118087368118952e-06, "epoch": 0.8437656763837021, "percentage": 84.38, "elapsed_time": "1 day, 11:49:47", "remaining_time": "6:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15139, "total_steps": 17941, "loss": 1.8362, "learning_rate": 6.113820053527836e-06, "epoch": 0.8438214146368653, "percentage": 84.38, "elapsed_time": "1 day, 11:49:56", "remaining_time": "6:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15140, "total_steps": 17941, "loss": 1.8748, "learning_rate": 6.109554130750472e-06, "epoch": 0.8438771528900284, "percentage": 84.39, "elapsed_time": "1 day, 11:50:04", "remaining_time": "6:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15141, "total_steps": 17941, "loss": 1.6823, "learning_rate": 6.105289599922154e-06, "epoch": 0.8439328911431916, "percentage": 84.39, "elapsed_time": "1 day, 11:50:13", "remaining_time": "6:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15142, "total_steps": 17941, "loss": 1.2737, "learning_rate": 6.1010264611781275e-06, "epoch": 0.8439886293963548, "percentage": 84.4, "elapsed_time": "1 day, 11:50:21", "remaining_time": "6:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15143, "total_steps": 17941, "loss": 1.5777, "learning_rate": 6.096764714653602e-06, "epoch": 0.8440443676495178, "percentage": 84.4, "elapsed_time": "1 day, 11:50:30", "remaining_time": "6:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15144, "total_steps": 17941, "loss": 1.9725, "learning_rate": 6.092504360483703e-06, "epoch": 0.844100105902681, "percentage": 84.41, "elapsed_time": "1 day, 11:50:38", "remaining_time": "6:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15145, "total_steps": 17941, "loss": 1.2087, "learning_rate": 6.088245398803588e-06, "epoch": 0.8441558441558441, "percentage": 84.42, "elapsed_time": "1 day, 11:50:47", "remaining_time": "6:37:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15146, "total_steps": 17941, "loss": 1.6881, "learning_rate": 6.0839878297483e-06, "epoch": 0.8442115824090073, "percentage": 84.42, "elapsed_time": "1 day, 11:50:55", "remaining_time": "6:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15147, "total_steps": 17941, "loss": 1.5091, "learning_rate": 6.0797316534528636e-06, "epoch": 0.8442673206621705, "percentage": 84.43, "elapsed_time": "1 day, 11:51:04", "remaining_time": "6:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15148, "total_steps": 17941, "loss": 1.5777, "learning_rate": 6.075476870052271e-06, "epoch": 0.8443230589153335, "percentage": 84.43, "elapsed_time": "1 day, 11:51:12", "remaining_time": "6:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15149, "total_steps": 17941, "loss": 1.7263, "learning_rate": 6.071223479681454e-06, "epoch": 0.8443787971684967, "percentage": 84.44, "elapsed_time": "1 day, 11:51:21", "remaining_time": "6:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15150, "total_steps": 17941, "loss": 1.6941, "learning_rate": 6.0669714824753144e-06, "epoch": 0.8444345354216599, "percentage": 84.44, "elapsed_time": "1 day, 11:51:29", "remaining_time": "6:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15151, "total_steps": 17941, "loss": 1.6013, "learning_rate": 6.062720878568684e-06, "epoch": 0.844490273674823, "percentage": 84.45, "elapsed_time": "1 day, 11:51:38", "remaining_time": "6:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15152, "total_steps": 17941, "loss": 1.6914, "learning_rate": 6.058471668096361e-06, "epoch": 0.8445460119279862, "percentage": 84.45, "elapsed_time": "1 day, 11:51:46", "remaining_time": "6:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15153, "total_steps": 17941, "loss": 1.7909, "learning_rate": 6.054223851193141e-06, "epoch": 0.8446017501811494, "percentage": 84.46, "elapsed_time": "1 day, 11:51:55", "remaining_time": "6:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15154, "total_steps": 17941, "loss": 1.6129, "learning_rate": 6.049977427993714e-06, "epoch": 0.8446574884343124, "percentage": 84.47, "elapsed_time": "1 day, 11:52:03", "remaining_time": "6:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15155, "total_steps": 17941, "loss": 1.6981, "learning_rate": 6.045732398632753e-06, "epoch": 0.8447132266874756, "percentage": 84.47, "elapsed_time": "1 day, 11:52:11", "remaining_time": "6:35:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15156, "total_steps": 17941, "loss": 1.6413, "learning_rate": 6.0414887632448845e-06, "epoch": 0.8447689649406388, "percentage": 84.48, "elapsed_time": "1 day, 11:52:20", "remaining_time": "6:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15157, "total_steps": 17941, "loss": 1.5987, "learning_rate": 6.037246521964712e-06, "epoch": 0.8448247031938019, "percentage": 84.48, "elapsed_time": "1 day, 11:52:28", "remaining_time": "6:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15158, "total_steps": 17941, "loss": 1.625, "learning_rate": 6.03300567492675e-06, "epoch": 0.8448804414469651, "percentage": 84.49, "elapsed_time": "1 day, 11:52:37", "remaining_time": "6:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15159, "total_steps": 17941, "loss": 1.4054, "learning_rate": 6.028766222265498e-06, "epoch": 0.8449361797001282, "percentage": 84.49, "elapsed_time": "1 day, 11:52:45", "remaining_time": "6:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15160, "total_steps": 17941, "loss": 1.6633, "learning_rate": 6.024528164115417e-06, "epoch": 0.8449919179532913, "percentage": 84.5, "elapsed_time": "1 day, 11:52:54", "remaining_time": "6:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15161, "total_steps": 17941, "loss": 1.62, "learning_rate": 6.020291500610903e-06, "epoch": 0.8450476562064545, "percentage": 84.5, "elapsed_time": "1 day, 11:53:02", "remaining_time": "6:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15162, "total_steps": 17941, "loss": 1.5042, "learning_rate": 6.016056231886335e-06, "epoch": 0.8451033944596177, "percentage": 84.51, "elapsed_time": "1 day, 11:53:10", "remaining_time": "6:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15163, "total_steps": 17941, "loss": 1.6623, "learning_rate": 6.011822358075997e-06, "epoch": 0.8451591327127808, "percentage": 84.52, "elapsed_time": "1 day, 11:53:19", "remaining_time": "6:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15164, "total_steps": 17941, "loss": 1.5602, "learning_rate": 6.007589879314207e-06, "epoch": 0.8452148709659439, "percentage": 84.52, "elapsed_time": "1 day, 11:53:27", "remaining_time": "6:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15165, "total_steps": 17941, "loss": 1.4476, "learning_rate": 6.003358795735164e-06, "epoch": 0.8452706092191071, "percentage": 84.53, "elapsed_time": "1 day, 11:53:36", "remaining_time": "6:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15166, "total_steps": 17941, "loss": 1.7579, "learning_rate": 5.999129107473062e-06, "epoch": 0.8453263474722702, "percentage": 84.53, "elapsed_time": "1 day, 11:53:44", "remaining_time": "6:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15167, "total_steps": 17941, "loss": 1.49, "learning_rate": 5.994900814662041e-06, "epoch": 0.8453820857254334, "percentage": 84.54, "elapsed_time": "1 day, 11:53:53", "remaining_time": "6:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15168, "total_steps": 17941, "loss": 1.6362, "learning_rate": 5.990673917436196e-06, "epoch": 0.8454378239785965, "percentage": 84.54, "elapsed_time": "1 day, 11:54:02", "remaining_time": "6:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15169, "total_steps": 17941, "loss": 1.573, "learning_rate": 5.986448415929597e-06, "epoch": 0.8454935622317596, "percentage": 84.55, "elapsed_time": "1 day, 11:54:10", "remaining_time": "6:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15170, "total_steps": 17941, "loss": 1.5352, "learning_rate": 5.982224310276214e-06, "epoch": 0.8455493004849228, "percentage": 84.55, "elapsed_time": "1 day, 11:54:19", "remaining_time": "6:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15171, "total_steps": 17941, "loss": 1.7468, "learning_rate": 5.97800160061005e-06, "epoch": 0.8456050387380859, "percentage": 84.56, "elapsed_time": "1 day, 11:54:27", "remaining_time": "6:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15172, "total_steps": 17941, "loss": 1.5021, "learning_rate": 5.973780287065006e-06, "epoch": 0.8456607769912491, "percentage": 84.57, "elapsed_time": "1 day, 11:54:36", "remaining_time": "6:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15173, "total_steps": 17941, "loss": 1.6955, "learning_rate": 5.969560369774957e-06, "epoch": 0.8457165152444123, "percentage": 84.57, "elapsed_time": "1 day, 11:54:44", "remaining_time": "6:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15174, "total_steps": 17941, "loss": 1.5456, "learning_rate": 5.96534184887374e-06, "epoch": 0.8457722534975753, "percentage": 84.58, "elapsed_time": "1 day, 11:54:53", "remaining_time": "6:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15175, "total_steps": 17941, "loss": 1.4469, "learning_rate": 5.961124724495137e-06, "epoch": 0.8458279917507385, "percentage": 84.58, "elapsed_time": "1 day, 11:55:01", "remaining_time": "6:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15176, "total_steps": 17941, "loss": 1.5972, "learning_rate": 5.956908996772909e-06, "epoch": 0.8458837300039017, "percentage": 84.59, "elapsed_time": "1 day, 11:55:09", "remaining_time": "6:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15177, "total_steps": 17941, "loss": 1.8852, "learning_rate": 5.9526946658407245e-06, "epoch": 0.8459394682570648, "percentage": 84.59, "elapsed_time": "1 day, 11:55:18", "remaining_time": "6:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15178, "total_steps": 17941, "loss": 1.4465, "learning_rate": 5.948481731832239e-06, "epoch": 0.845995206510228, "percentage": 84.6, "elapsed_time": "1 day, 11:55:26", "remaining_time": "6:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15179, "total_steps": 17941, "loss": 1.5702, "learning_rate": 5.9442701948811015e-06, "epoch": 0.8460509447633912, "percentage": 84.61, "elapsed_time": "1 day, 11:55:35", "remaining_time": "6:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15180, "total_steps": 17941, "loss": 1.7079, "learning_rate": 5.940060055120838e-06, "epoch": 0.8461066830165542, "percentage": 84.61, "elapsed_time": "1 day, 11:55:43", "remaining_time": "6:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15181, "total_steps": 17941, "loss": 1.5781, "learning_rate": 5.935851312684981e-06, "epoch": 0.8461624212697174, "percentage": 84.62, "elapsed_time": "1 day, 11:55:52", "remaining_time": "6:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15182, "total_steps": 17941, "loss": 1.645, "learning_rate": 5.9316439677070066e-06, "epoch": 0.8462181595228806, "percentage": 84.62, "elapsed_time": "1 day, 11:56:00", "remaining_time": "6:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15183, "total_steps": 17941, "loss": 1.5638, "learning_rate": 5.927438020320364e-06, "epoch": 0.8462738977760437, "percentage": 84.63, "elapsed_time": "1 day, 11:56:09", "remaining_time": "6:31:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15184, "total_steps": 17941, "loss": 1.7303, "learning_rate": 5.923233470658412e-06, "epoch": 0.8463296360292069, "percentage": 84.63, "elapsed_time": "1 day, 11:56:17", "remaining_time": "6:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15185, "total_steps": 17941, "loss": 1.2655, "learning_rate": 5.919030318854513e-06, "epoch": 0.84638537428237, "percentage": 84.64, "elapsed_time": "1 day, 11:56:26", "remaining_time": "6:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15186, "total_steps": 17941, "loss": 1.6171, "learning_rate": 5.914828565041958e-06, "epoch": 0.8464411125355331, "percentage": 84.64, "elapsed_time": "1 day, 11:56:34", "remaining_time": "6:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15187, "total_steps": 17941, "loss": 1.8041, "learning_rate": 5.910628209354008e-06, "epoch": 0.8464968507886963, "percentage": 84.65, "elapsed_time": "1 day, 11:56:42", "remaining_time": "6:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15188, "total_steps": 17941, "loss": 1.6288, "learning_rate": 5.906429251923884e-06, "epoch": 0.8465525890418595, "percentage": 84.66, "elapsed_time": "1 day, 11:56:51", "remaining_time": "6:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15189, "total_steps": 17941, "loss": 1.4974, "learning_rate": 5.9022316928847185e-06, "epoch": 0.8466083272950226, "percentage": 84.66, "elapsed_time": "1 day, 11:56:59", "remaining_time": "6:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15190, "total_steps": 17941, "loss": 1.652, "learning_rate": 5.898035532369678e-06, "epoch": 0.8466640655481857, "percentage": 84.67, "elapsed_time": "1 day, 11:57:08", "remaining_time": "6:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15191, "total_steps": 17941, "loss": 1.7512, "learning_rate": 5.89384077051181e-06, "epoch": 0.8467198038013488, "percentage": 84.67, "elapsed_time": "1 day, 11:57:16", "remaining_time": "6:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15192, "total_steps": 17941, "loss": 1.4862, "learning_rate": 5.8896474074441545e-06, "epoch": 0.846775542054512, "percentage": 84.68, "elapsed_time": "1 day, 11:57:25", "remaining_time": "6:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15193, "total_steps": 17941, "loss": 1.7256, "learning_rate": 5.885455443299698e-06, "epoch": 0.8468312803076752, "percentage": 84.68, "elapsed_time": "1 day, 11:57:33", "remaining_time": "6:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15194, "total_steps": 17941, "loss": 1.8113, "learning_rate": 5.8812648782113955e-06, "epoch": 0.8468870185608383, "percentage": 84.69, "elapsed_time": "1 day, 11:57:42", "remaining_time": "6:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15195, "total_steps": 17941, "loss": 1.7658, "learning_rate": 5.877075712312147e-06, "epoch": 0.8469427568140014, "percentage": 84.69, "elapsed_time": "1 day, 11:57:50", "remaining_time": "6:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15196, "total_steps": 17941, "loss": 1.5032, "learning_rate": 5.872887945734784e-06, "epoch": 0.8469984950671646, "percentage": 84.7, "elapsed_time": "1 day, 11:57:58", "remaining_time": "6:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15197, "total_steps": 17941, "loss": 1.6255, "learning_rate": 5.8687015786121565e-06, "epoch": 0.8470542333203277, "percentage": 84.71, "elapsed_time": "1 day, 11:58:07", "remaining_time": "6:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15198, "total_steps": 17941, "loss": 2.0318, "learning_rate": 5.8645166110769976e-06, "epoch": 0.8471099715734909, "percentage": 84.71, "elapsed_time": "1 day, 11:58:15", "remaining_time": "6:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15199, "total_steps": 17941, "loss": 1.5605, "learning_rate": 5.860333043262045e-06, "epoch": 0.8471657098266541, "percentage": 84.72, "elapsed_time": "1 day, 11:58:24", "remaining_time": "6:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15200, "total_steps": 17941, "loss": 1.7965, "learning_rate": 5.8561508752999815e-06, "epoch": 0.8472214480798171, "percentage": 84.72, "elapsed_time": "1 day, 11:58:32", "remaining_time": "6:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15201, "total_steps": 17941, "loss": 1.6465, "learning_rate": 5.851970107323435e-06, "epoch": 0.8472771863329803, "percentage": 84.73, "elapsed_time": "1 day, 11:58:42", "remaining_time": "6:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15202, "total_steps": 17941, "loss": 1.6753, "learning_rate": 5.847790739465003e-06, "epoch": 0.8473329245861435, "percentage": 84.73, "elapsed_time": "1 day, 11:58:50", "remaining_time": "6:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15203, "total_steps": 17941, "loss": 1.5499, "learning_rate": 5.84361277185721e-06, "epoch": 0.8473886628393066, "percentage": 84.74, "elapsed_time": "1 day, 11:58:59", "remaining_time": "6:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15204, "total_steps": 17941, "loss": 1.9306, "learning_rate": 5.839436204632564e-06, "epoch": 0.8474444010924698, "percentage": 84.74, "elapsed_time": "1 day, 11:59:07", "remaining_time": "6:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15205, "total_steps": 17941, "loss": 1.4509, "learning_rate": 5.83526103792355e-06, "epoch": 0.847500139345633, "percentage": 84.75, "elapsed_time": "1 day, 11:59:15", "remaining_time": "6:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15206, "total_steps": 17941, "loss": 1.5115, "learning_rate": 5.8310872718625456e-06, "epoch": 0.847555877598796, "percentage": 84.76, "elapsed_time": "1 day, 11:59:24", "remaining_time": "6:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15207, "total_steps": 17941, "loss": 1.7621, "learning_rate": 5.826914906581932e-06, "epoch": 0.8476116158519592, "percentage": 84.76, "elapsed_time": "1 day, 11:59:32", "remaining_time": "6:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15208, "total_steps": 17941, "loss": 1.6684, "learning_rate": 5.822743942214026e-06, "epoch": 0.8476673541051224, "percentage": 84.77, "elapsed_time": "1 day, 11:59:41", "remaining_time": "6:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15209, "total_steps": 17941, "loss": 1.784, "learning_rate": 5.818574378891123e-06, "epoch": 0.8477230923582855, "percentage": 84.77, "elapsed_time": "1 day, 11:59:49", "remaining_time": "6:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15210, "total_steps": 17941, "loss": 1.5706, "learning_rate": 5.814406216745438e-06, "epoch": 0.8477788306114487, "percentage": 84.78, "elapsed_time": "1 day, 11:59:58", "remaining_time": "6:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15211, "total_steps": 17941, "loss": 1.541, "learning_rate": 5.8102394559091556e-06, "epoch": 0.8478345688646118, "percentage": 84.78, "elapsed_time": "1 day, 12:00:06", "remaining_time": "6:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15212, "total_steps": 17941, "loss": 1.6359, "learning_rate": 5.8060740965144525e-06, "epoch": 0.8478903071177749, "percentage": 84.79, "elapsed_time": "1 day, 12:00:15", "remaining_time": "6:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15213, "total_steps": 17941, "loss": 1.599, "learning_rate": 5.8019101386934e-06, "epoch": 0.8479460453709381, "percentage": 84.79, "elapsed_time": "1 day, 12:00:23", "remaining_time": "6:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15214, "total_steps": 17941, "loss": 1.7939, "learning_rate": 5.797747582578078e-06, "epoch": 0.8480017836241012, "percentage": 84.8, "elapsed_time": "1 day, 12:00:32", "remaining_time": "6:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15215, "total_steps": 17941, "loss": 1.3147, "learning_rate": 5.793586428300468e-06, "epoch": 0.8480575218772644, "percentage": 84.81, "elapsed_time": "1 day, 12:00:40", "remaining_time": "6:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15216, "total_steps": 17941, "loss": 1.4693, "learning_rate": 5.7894266759925705e-06, "epoch": 0.8481132601304275, "percentage": 84.81, "elapsed_time": "1 day, 12:00:49", "remaining_time": "6:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15217, "total_steps": 17941, "loss": 1.5794, "learning_rate": 5.785268325786286e-06, "epoch": 0.8481689983835906, "percentage": 84.82, "elapsed_time": "1 day, 12:00:57", "remaining_time": "6:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15218, "total_steps": 17941, "loss": 1.7335, "learning_rate": 5.781111377813498e-06, "epoch": 0.8482247366367538, "percentage": 84.82, "elapsed_time": "1 day, 12:01:06", "remaining_time": "6:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15219, "total_steps": 17941, "loss": 1.7115, "learning_rate": 5.776955832206044e-06, "epoch": 0.848280474889917, "percentage": 84.83, "elapsed_time": "1 day, 12:01:14", "remaining_time": "6:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15220, "total_steps": 17941, "loss": 1.626, "learning_rate": 5.7728016890957136e-06, "epoch": 0.84833621314308, "percentage": 84.83, "elapsed_time": "1 day, 12:01:23", "remaining_time": "6:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15221, "total_steps": 17941, "loss": 1.5939, "learning_rate": 5.768648948614258e-06, "epoch": 0.8483919513962432, "percentage": 84.84, "elapsed_time": "1 day, 12:01:31", "remaining_time": "6:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15222, "total_steps": 17941, "loss": 1.3716, "learning_rate": 5.764497610893355e-06, "epoch": 0.8484476896494064, "percentage": 84.84, "elapsed_time": "1 day, 12:01:40", "remaining_time": "6:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15223, "total_steps": 17941, "loss": 1.6838, "learning_rate": 5.7603476760646924e-06, "epoch": 0.8485034279025695, "percentage": 84.85, "elapsed_time": "1 day, 12:01:48", "remaining_time": "6:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15224, "total_steps": 17941, "loss": 1.6622, "learning_rate": 5.756199144259861e-06, "epoch": 0.8485591661557327, "percentage": 84.86, "elapsed_time": "1 day, 12:01:57", "remaining_time": "6:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15225, "total_steps": 17941, "loss": 1.626, "learning_rate": 5.752052015610432e-06, "epoch": 0.8486149044088959, "percentage": 84.86, "elapsed_time": "1 day, 12:02:05", "remaining_time": "6:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15226, "total_steps": 17941, "loss": 1.4526, "learning_rate": 5.7479062902479285e-06, "epoch": 0.8486706426620589, "percentage": 84.87, "elapsed_time": "1 day, 12:02:15", "remaining_time": "6:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15227, "total_steps": 17941, "loss": 1.4646, "learning_rate": 5.743761968303835e-06, "epoch": 0.8487263809152221, "percentage": 84.87, "elapsed_time": "1 day, 12:02:23", "remaining_time": "6:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15228, "total_steps": 17941, "loss": 1.4568, "learning_rate": 5.739619049909584e-06, "epoch": 0.8487821191683853, "percentage": 84.88, "elapsed_time": "1 day, 12:02:31", "remaining_time": "6:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15229, "total_steps": 17941, "loss": 1.539, "learning_rate": 5.735477535196554e-06, "epoch": 0.8488378574215484, "percentage": 84.88, "elapsed_time": "1 day, 12:02:40", "remaining_time": "6:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15230, "total_steps": 17941, "loss": 1.3992, "learning_rate": 5.7313374242960845e-06, "epoch": 0.8488935956747116, "percentage": 84.89, "elapsed_time": "1 day, 12:02:48", "remaining_time": "6:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15231, "total_steps": 17941, "loss": 1.7422, "learning_rate": 5.727198717339511e-06, "epoch": 0.8489493339278747, "percentage": 84.89, "elapsed_time": "1 day, 12:02:57", "remaining_time": "6:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15232, "total_steps": 17941, "loss": 1.6997, "learning_rate": 5.723061414458053e-06, "epoch": 0.8490050721810378, "percentage": 84.9, "elapsed_time": "1 day, 12:03:05", "remaining_time": "6:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15233, "total_steps": 17941, "loss": 1.854, "learning_rate": 5.718925515782936e-06, "epoch": 0.849060810434201, "percentage": 84.91, "elapsed_time": "1 day, 12:03:14", "remaining_time": "6:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15234, "total_steps": 17941, "loss": 1.6647, "learning_rate": 5.71479102144532e-06, "epoch": 0.8491165486873642, "percentage": 84.91, "elapsed_time": "1 day, 12:03:22", "remaining_time": "6:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15235, "total_steps": 17941, "loss": 1.6021, "learning_rate": 5.710657931576347e-06, "epoch": 0.8491722869405273, "percentage": 84.92, "elapsed_time": "1 day, 12:03:31", "remaining_time": "6:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15236, "total_steps": 17941, "loss": 1.7062, "learning_rate": 5.70652624630707e-06, "epoch": 0.8492280251936905, "percentage": 84.92, "elapsed_time": "1 day, 12:03:39", "remaining_time": "6:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15237, "total_steps": 17941, "loss": 1.6983, "learning_rate": 5.70239596576852e-06, "epoch": 0.8492837634468535, "percentage": 84.93, "elapsed_time": "1 day, 12:03:48", "remaining_time": "6:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15238, "total_steps": 17941, "loss": 1.6402, "learning_rate": 5.698267090091719e-06, "epoch": 0.8493395017000167, "percentage": 84.93, "elapsed_time": "1 day, 12:03:56", "remaining_time": "6:23:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15239, "total_steps": 17941, "loss": 1.5863, "learning_rate": 5.694139619407574e-06, "epoch": 0.8493952399531799, "percentage": 84.94, "elapsed_time": "1 day, 12:04:05", "remaining_time": "6:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15240, "total_steps": 17941, "loss": 1.6958, "learning_rate": 5.690013553847013e-06, "epoch": 0.849450978206343, "percentage": 84.95, "elapsed_time": "1 day, 12:04:13", "remaining_time": "6:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15241, "total_steps": 17941, "loss": 1.6198, "learning_rate": 5.685888893540858e-06, "epoch": 0.8495067164595062, "percentage": 84.95, "elapsed_time": "1 day, 12:04:22", "remaining_time": "6:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15242, "total_steps": 17941, "loss": 1.5416, "learning_rate": 5.681765638619957e-06, "epoch": 0.8495624547126693, "percentage": 84.96, "elapsed_time": "1 day, 12:04:30", "remaining_time": "6:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15243, "total_steps": 17941, "loss": 1.6824, "learning_rate": 5.677643789215042e-06, "epoch": 0.8496181929658324, "percentage": 84.96, "elapsed_time": "1 day, 12:04:39", "remaining_time": "6:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15244, "total_steps": 17941, "loss": 1.4865, "learning_rate": 5.673523345456855e-06, "epoch": 0.8496739312189956, "percentage": 84.97, "elapsed_time": "1 day, 12:04:48", "remaining_time": "6:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15245, "total_steps": 17941, "loss": 1.6201, "learning_rate": 5.669404307476067e-06, "epoch": 0.8497296694721588, "percentage": 84.97, "elapsed_time": "1 day, 12:04:56", "remaining_time": "6:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15246, "total_steps": 17941, "loss": 1.8477, "learning_rate": 5.665286675403303e-06, "epoch": 0.8497854077253219, "percentage": 84.98, "elapsed_time": "1 day, 12:05:05", "remaining_time": "6:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15247, "total_steps": 17941, "loss": 1.5675, "learning_rate": 5.661170449369168e-06, "epoch": 0.849841145978485, "percentage": 84.98, "elapsed_time": "1 day, 12:05:13", "remaining_time": "6:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15248, "total_steps": 17941, "loss": 1.6843, "learning_rate": 5.657055629504176e-06, "epoch": 0.8498968842316482, "percentage": 84.99, "elapsed_time": "1 day, 12:05:22", "remaining_time": "6:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15249, "total_steps": 17941, "loss": 1.5339, "learning_rate": 5.6529422159388615e-06, "epoch": 0.8499526224848113, "percentage": 85.0, "elapsed_time": "1 day, 12:05:30", "remaining_time": "6:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15250, "total_steps": 17941, "loss": 1.4031, "learning_rate": 5.648830208803646e-06, "epoch": 0.8500083607379745, "percentage": 85.0, "elapsed_time": "1 day, 12:05:39", "remaining_time": "6:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15251, "total_steps": 17941, "loss": 1.7687, "learning_rate": 5.644719608228954e-06, "epoch": 0.8500640989911377, "percentage": 85.01, "elapsed_time": "1 day, 12:05:47", "remaining_time": "6:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15252, "total_steps": 17941, "loss": 1.4767, "learning_rate": 5.640610414345149e-06, "epoch": 0.8501198372443007, "percentage": 85.01, "elapsed_time": "1 day, 12:05:55", "remaining_time": "6:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15253, "total_steps": 17941, "loss": 1.713, "learning_rate": 5.636502627282542e-06, "epoch": 0.8501755754974639, "percentage": 85.02, "elapsed_time": "1 day, 12:06:04", "remaining_time": "6:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15254, "total_steps": 17941, "loss": 1.7735, "learning_rate": 5.6323962471714286e-06, "epoch": 0.8502313137506271, "percentage": 85.02, "elapsed_time": "1 day, 12:06:13", "remaining_time": "6:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15255, "total_steps": 17941, "loss": 1.4571, "learning_rate": 5.628291274142017e-06, "epoch": 0.8502870520037902, "percentage": 85.03, "elapsed_time": "1 day, 12:06:21", "remaining_time": "6:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15256, "total_steps": 17941, "loss": 1.7026, "learning_rate": 5.624187708324497e-06, "epoch": 0.8503427902569534, "percentage": 85.03, "elapsed_time": "1 day, 12:06:29", "remaining_time": "6:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15257, "total_steps": 17941, "loss": 1.5978, "learning_rate": 5.620085549849013e-06, "epoch": 0.8503985285101165, "percentage": 85.04, "elapsed_time": "1 day, 12:06:38", "remaining_time": "6:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15258, "total_steps": 17941, "loss": 1.4557, "learning_rate": 5.6159847988456694e-06, "epoch": 0.8504542667632796, "percentage": 85.05, "elapsed_time": "1 day, 12:06:46", "remaining_time": "6:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15259, "total_steps": 17941, "loss": 1.7215, "learning_rate": 5.611885455444504e-06, "epoch": 0.8505100050164428, "percentage": 85.05, "elapsed_time": "1 day, 12:06:55", "remaining_time": "6:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15260, "total_steps": 17941, "loss": 1.7734, "learning_rate": 5.6077875197755316e-06, "epoch": 0.8505657432696059, "percentage": 85.06, "elapsed_time": "1 day, 12:07:03", "remaining_time": "6:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15261, "total_steps": 17941, "loss": 1.5654, "learning_rate": 5.60369099196873e-06, "epoch": 0.8506214815227691, "percentage": 85.06, "elapsed_time": "1 day, 12:07:12", "remaining_time": "6:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15262, "total_steps": 17941, "loss": 1.4452, "learning_rate": 5.59959587215399e-06, "epoch": 0.8506772197759322, "percentage": 85.07, "elapsed_time": "1 day, 12:07:20", "remaining_time": "6:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15263, "total_steps": 17941, "loss": 1.5936, "learning_rate": 5.595502160461186e-06, "epoch": 0.8507329580290953, "percentage": 85.07, "elapsed_time": "1 day, 12:07:29", "remaining_time": "6:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15264, "total_steps": 17941, "loss": 1.6409, "learning_rate": 5.591409857020175e-06, "epoch": 0.8507886962822585, "percentage": 85.08, "elapsed_time": "1 day, 12:07:37", "remaining_time": "6:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15265, "total_steps": 17941, "loss": 1.5613, "learning_rate": 5.587318961960714e-06, "epoch": 0.8508444345354217, "percentage": 85.08, "elapsed_time": "1 day, 12:07:46", "remaining_time": "6:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15266, "total_steps": 17941, "loss": 1.5431, "learning_rate": 5.583229475412561e-06, "epoch": 0.8509001727885848, "percentage": 85.09, "elapsed_time": "1 day, 12:07:54", "remaining_time": "6:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15267, "total_steps": 17941, "loss": 1.7616, "learning_rate": 5.579141397505383e-06, "epoch": 0.850955911041748, "percentage": 85.1, "elapsed_time": "1 day, 12:08:03", "remaining_time": "6:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15268, "total_steps": 17941, "loss": 1.3921, "learning_rate": 5.575054728368867e-06, "epoch": 0.8510116492949111, "percentage": 85.1, "elapsed_time": "1 day, 12:08:11", "remaining_time": "6:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15269, "total_steps": 17941, "loss": 1.4879, "learning_rate": 5.570969468132592e-06, "epoch": 0.8510673875480742, "percentage": 85.11, "elapsed_time": "1 day, 12:08:20", "remaining_time": "6:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15270, "total_steps": 17941, "loss": 1.5854, "learning_rate": 5.566885616926127e-06, "epoch": 0.8511231258012374, "percentage": 85.11, "elapsed_time": "1 day, 12:08:28", "remaining_time": "6:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15271, "total_steps": 17941, "loss": 1.664, "learning_rate": 5.562803174878983e-06, "epoch": 0.8511788640544006, "percentage": 85.12, "elapsed_time": "1 day, 12:08:37", "remaining_time": "6:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15272, "total_steps": 17941, "loss": 1.7785, "learning_rate": 5.558722142120637e-06, "epoch": 0.8512346023075636, "percentage": 85.12, "elapsed_time": "1 day, 12:08:45", "remaining_time": "6:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15273, "total_steps": 17941, "loss": 1.6459, "learning_rate": 5.554642518780529e-06, "epoch": 0.8512903405607268, "percentage": 85.13, "elapsed_time": "1 day, 12:08:54", "remaining_time": "6:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15274, "total_steps": 17941, "loss": 1.5275, "learning_rate": 5.550564304987999e-06, "epoch": 0.85134607881389, "percentage": 85.13, "elapsed_time": "1 day, 12:09:02", "remaining_time": "6:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15275, "total_steps": 17941, "loss": 1.6295, "learning_rate": 5.546487500872432e-06, "epoch": 0.8514018170670531, "percentage": 85.14, "elapsed_time": "1 day, 12:09:11", "remaining_time": "6:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15276, "total_steps": 17941, "loss": 1.6804, "learning_rate": 5.542412106563094e-06, "epoch": 0.8514575553202163, "percentage": 85.15, "elapsed_time": "1 day, 12:09:19", "remaining_time": "6:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15277, "total_steps": 17941, "loss": 1.8148, "learning_rate": 5.538338122189235e-06, "epoch": 0.8515132935733795, "percentage": 85.15, "elapsed_time": "1 day, 12:09:28", "remaining_time": "6:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15278, "total_steps": 17941, "loss": 1.7574, "learning_rate": 5.534265547880063e-06, "epoch": 0.8515690318265425, "percentage": 85.16, "elapsed_time": "1 day, 12:09:36", "remaining_time": "6:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15279, "total_steps": 17941, "loss": 1.3945, "learning_rate": 5.530194383764731e-06, "epoch": 0.8516247700797057, "percentage": 85.16, "elapsed_time": "1 day, 12:09:44", "remaining_time": "6:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15280, "total_steps": 17941, "loss": 1.8844, "learning_rate": 5.526124629972368e-06, "epoch": 0.8516805083328689, "percentage": 85.17, "elapsed_time": "1 day, 12:09:53", "remaining_time": "6:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15281, "total_steps": 17941, "loss": 1.7102, "learning_rate": 5.522056286632021e-06, "epoch": 0.851736246586032, "percentage": 85.17, "elapsed_time": "1 day, 12:10:01", "remaining_time": "6:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15282, "total_steps": 17941, "loss": 1.5469, "learning_rate": 5.517989353872727e-06, "epoch": 0.8517919848391952, "percentage": 85.18, "elapsed_time": "1 day, 12:10:10", "remaining_time": "6:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15283, "total_steps": 17941, "loss": 1.3507, "learning_rate": 5.513923831823459e-06, "epoch": 0.8518477230923582, "percentage": 85.18, "elapsed_time": "1 day, 12:10:18", "remaining_time": "6:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15284, "total_steps": 17941, "loss": 1.8035, "learning_rate": 5.509859720613159e-06, "epoch": 0.8519034613455214, "percentage": 85.19, "elapsed_time": "1 day, 12:10:27", "remaining_time": "6:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15285, "total_steps": 17941, "loss": 1.7747, "learning_rate": 5.505797020370706e-06, "epoch": 0.8519591995986846, "percentage": 85.2, "elapsed_time": "1 day, 12:10:35", "remaining_time": "6:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15286, "total_steps": 17941, "loss": 1.7629, "learning_rate": 5.50173573122496e-06, "epoch": 0.8520149378518477, "percentage": 85.2, "elapsed_time": "1 day, 12:10:43", "remaining_time": "6:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15287, "total_steps": 17941, "loss": 1.7322, "learning_rate": 5.497675853304718e-06, "epoch": 0.8520706761050109, "percentage": 85.21, "elapsed_time": "1 day, 12:10:52", "remaining_time": "6:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15288, "total_steps": 17941, "loss": 1.6233, "learning_rate": 5.493617386738725e-06, "epoch": 0.852126414358174, "percentage": 85.21, "elapsed_time": "1 day, 12:11:00", "remaining_time": "6:16:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15289, "total_steps": 17941, "loss": 1.1728, "learning_rate": 5.489560331655691e-06, "epoch": 0.8521821526113371, "percentage": 85.22, "elapsed_time": "1 day, 12:11:09", "remaining_time": "6:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15290, "total_steps": 17941, "loss": 1.8366, "learning_rate": 5.485504688184306e-06, "epoch": 0.8522378908645003, "percentage": 85.22, "elapsed_time": "1 day, 12:11:17", "remaining_time": "6:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15291, "total_steps": 17941, "loss": 1.7631, "learning_rate": 5.481450456453163e-06, "epoch": 0.8522936291176635, "percentage": 85.23, "elapsed_time": "1 day, 12:11:26", "remaining_time": "6:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15292, "total_steps": 17941, "loss": 1.4881, "learning_rate": 5.477397636590853e-06, "epoch": 0.8523493673708266, "percentage": 85.23, "elapsed_time": "1 day, 12:11:34", "remaining_time": "6:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15293, "total_steps": 17941, "loss": 1.7177, "learning_rate": 5.473346228725901e-06, "epoch": 0.8524051056239897, "percentage": 85.24, "elapsed_time": "1 day, 12:11:43", "remaining_time": "6:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15294, "total_steps": 17941, "loss": 1.7936, "learning_rate": 5.469296232986815e-06, "epoch": 0.8524608438771529, "percentage": 85.25, "elapsed_time": "1 day, 12:11:52", "remaining_time": "6:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15295, "total_steps": 17941, "loss": 1.846, "learning_rate": 5.4652476495020035e-06, "epoch": 0.852516582130316, "percentage": 85.25, "elapsed_time": "1 day, 12:12:00", "remaining_time": "6:15:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15296, "total_steps": 17941, "loss": 1.5868, "learning_rate": 5.461200478399886e-06, "epoch": 0.8525723203834792, "percentage": 85.26, "elapsed_time": "1 day, 12:12:09", "remaining_time": "6:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15297, "total_steps": 17941, "loss": 1.6317, "learning_rate": 5.45715471980881e-06, "epoch": 0.8526280586366424, "percentage": 85.26, "elapsed_time": "1 day, 12:12:17", "remaining_time": "6:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15298, "total_steps": 17941, "loss": 1.8102, "learning_rate": 5.4531103738570785e-06, "epoch": 0.8526837968898054, "percentage": 85.27, "elapsed_time": "1 day, 12:12:26", "remaining_time": "6:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15299, "total_steps": 17941, "loss": 1.4936, "learning_rate": 5.4490674406729724e-06, "epoch": 0.8527395351429686, "percentage": 85.27, "elapsed_time": "1 day, 12:12:34", "remaining_time": "6:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15300, "total_steps": 17941, "loss": 1.5057, "learning_rate": 5.445025920384678e-06, "epoch": 0.8527952733961318, "percentage": 85.28, "elapsed_time": "1 day, 12:12:43", "remaining_time": "6:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15301, "total_steps": 17941, "loss": 1.5193, "learning_rate": 5.4409858131204085e-06, "epoch": 0.8528510116492949, "percentage": 85.29, "elapsed_time": "1 day, 12:12:51", "remaining_time": "6:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15302, "total_steps": 17941, "loss": 1.6733, "learning_rate": 5.436947119008262e-06, "epoch": 0.8529067499024581, "percentage": 85.29, "elapsed_time": "1 day, 12:13:00", "remaining_time": "6:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15303, "total_steps": 17941, "loss": 1.5138, "learning_rate": 5.432909838176331e-06, "epoch": 0.8529624881556213, "percentage": 85.3, "elapsed_time": "1 day, 12:13:08", "remaining_time": "6:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15304, "total_steps": 17941, "loss": 1.5927, "learning_rate": 5.4288739707526574e-06, "epoch": 0.8530182264087843, "percentage": 85.3, "elapsed_time": "1 day, 12:13:17", "remaining_time": "6:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15305, "total_steps": 17941, "loss": 1.9848, "learning_rate": 5.424839516865232e-06, "epoch": 0.8530739646619475, "percentage": 85.31, "elapsed_time": "1 day, 12:13:25", "remaining_time": "6:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15306, "total_steps": 17941, "loss": 1.8113, "learning_rate": 5.4208064766420154e-06, "epoch": 0.8531297029151106, "percentage": 85.31, "elapsed_time": "1 day, 12:13:33", "remaining_time": "6:14:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15307, "total_steps": 17941, "loss": 1.5934, "learning_rate": 5.416774850210893e-06, "epoch": 0.8531854411682738, "percentage": 85.32, "elapsed_time": "1 day, 12:13:43", "remaining_time": "6:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15308, "total_steps": 17941, "loss": 1.6988, "learning_rate": 5.412744637699735e-06, "epoch": 0.853241179421437, "percentage": 85.32, "elapsed_time": "1 day, 12:13:51", "remaining_time": "6:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15309, "total_steps": 17941, "loss": 1.7733, "learning_rate": 5.408715839236356e-06, "epoch": 0.8532969176746, "percentage": 85.33, "elapsed_time": "1 day, 12:14:00", "remaining_time": "6:13:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15310, "total_steps": 17941, "loss": 1.5969, "learning_rate": 5.404688454948525e-06, "epoch": 0.8533526559277632, "percentage": 85.34, "elapsed_time": "1 day, 12:14:08", "remaining_time": "6:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15311, "total_steps": 17941, "loss": 2.1357, "learning_rate": 5.400662484963964e-06, "epoch": 0.8534083941809264, "percentage": 85.34, "elapsed_time": "1 day, 12:14:17", "remaining_time": "6:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15312, "total_steps": 17941, "loss": 1.5925, "learning_rate": 5.3966379294103646e-06, "epoch": 0.8534641324340895, "percentage": 85.35, "elapsed_time": "1 day, 12:14:25", "remaining_time": "6:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15313, "total_steps": 17941, "loss": 1.4044, "learning_rate": 5.392614788415357e-06, "epoch": 0.8535198706872527, "percentage": 85.35, "elapsed_time": "1 day, 12:14:33", "remaining_time": "6:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15314, "total_steps": 17941, "loss": 1.986, "learning_rate": 5.388593062106523e-06, "epoch": 0.8535756089404158, "percentage": 85.36, "elapsed_time": "1 day, 12:14:42", "remaining_time": "6:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15315, "total_steps": 17941, "loss": 1.6102, "learning_rate": 5.384572750611405e-06, "epoch": 0.8536313471935789, "percentage": 85.36, "elapsed_time": "1 day, 12:14:50", "remaining_time": "6:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15316, "total_steps": 17941, "loss": 1.5741, "learning_rate": 5.38055385405753e-06, "epoch": 0.8536870854467421, "percentage": 85.37, "elapsed_time": "1 day, 12:14:59", "remaining_time": "6:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15317, "total_steps": 17941, "loss": 1.7797, "learning_rate": 5.376536372572327e-06, "epoch": 0.8537428236999053, "percentage": 85.37, "elapsed_time": "1 day, 12:15:07", "remaining_time": "6:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15318, "total_steps": 17941, "loss": 1.6347, "learning_rate": 5.372520306283219e-06, "epoch": 0.8537985619530684, "percentage": 85.38, "elapsed_time": "1 day, 12:15:16", "remaining_time": "6:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15319, "total_steps": 17941, "loss": 1.6654, "learning_rate": 5.368505655317574e-06, "epoch": 0.8538543002062315, "percentage": 85.39, "elapsed_time": "1 day, 12:15:24", "remaining_time": "6:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15320, "total_steps": 17941, "loss": 1.6386, "learning_rate": 5.364492419802713e-06, "epoch": 0.8539100384593947, "percentage": 85.39, "elapsed_time": "1 day, 12:15:33", "remaining_time": "6:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15321, "total_steps": 17941, "loss": 1.5141, "learning_rate": 5.360480599865908e-06, "epoch": 0.8539657767125578, "percentage": 85.4, "elapsed_time": "1 day, 12:15:41", "remaining_time": "6:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15322, "total_steps": 17941, "loss": 1.6536, "learning_rate": 5.3564701956343835e-06, "epoch": 0.854021514965721, "percentage": 85.4, "elapsed_time": "1 day, 12:15:50", "remaining_time": "6:11:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15323, "total_steps": 17941, "loss": 1.5392, "learning_rate": 5.3524612072353434e-06, "epoch": 0.8540772532188842, "percentage": 85.41, "elapsed_time": "1 day, 12:15:58", "remaining_time": "6:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15324, "total_steps": 17941, "loss": 1.622, "learning_rate": 5.3484536347959135e-06, "epoch": 0.8541329914720472, "percentage": 85.41, "elapsed_time": "1 day, 12:16:06", "remaining_time": "6:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15325, "total_steps": 17941, "loss": 1.6824, "learning_rate": 5.34444747844321e-06, "epoch": 0.8541887297252104, "percentage": 85.42, "elapsed_time": "1 day, 12:16:15", "remaining_time": "6:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15326, "total_steps": 17941, "loss": 1.7105, "learning_rate": 5.340442738304252e-06, "epoch": 0.8542444679783736, "percentage": 85.42, "elapsed_time": "1 day, 12:16:24", "remaining_time": "6:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15327, "total_steps": 17941, "loss": 1.8319, "learning_rate": 5.336439414506089e-06, "epoch": 0.8543002062315367, "percentage": 85.43, "elapsed_time": "1 day, 12:16:32", "remaining_time": "6:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15328, "total_steps": 17941, "loss": 1.6904, "learning_rate": 5.332437507175647e-06, "epoch": 0.8543559444846999, "percentage": 85.44, "elapsed_time": "1 day, 12:16:41", "remaining_time": "6:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15329, "total_steps": 17941, "loss": 1.7488, "learning_rate": 5.3284370164398575e-06, "epoch": 0.8544116827378629, "percentage": 85.44, "elapsed_time": "1 day, 12:16:49", "remaining_time": "6:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15330, "total_steps": 17941, "loss": 1.5471, "learning_rate": 5.324437942425598e-06, "epoch": 0.8544674209910261, "percentage": 85.45, "elapsed_time": "1 day, 12:16:58", "remaining_time": "6:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15331, "total_steps": 17941, "loss": 1.5594, "learning_rate": 5.320440285259687e-06, "epoch": 0.8545231592441893, "percentage": 85.45, "elapsed_time": "1 day, 12:17:06", "remaining_time": "6:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15332, "total_steps": 17941, "loss": 1.3393, "learning_rate": 5.316444045068919e-06, "epoch": 0.8545788974973524, "percentage": 85.46, "elapsed_time": "1 day, 12:17:15", "remaining_time": "6:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15333, "total_steps": 17941, "loss": 1.523, "learning_rate": 5.3124492219800145e-06, "epoch": 0.8546346357505156, "percentage": 85.46, "elapsed_time": "1 day, 12:17:23", "remaining_time": "6:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15334, "total_steps": 17941, "loss": 1.9166, "learning_rate": 5.308455816119673e-06, "epoch": 0.8546903740036788, "percentage": 85.47, "elapsed_time": "1 day, 12:17:31", "remaining_time": "6:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15335, "total_steps": 17941, "loss": 1.8974, "learning_rate": 5.304463827614548e-06, "epoch": 0.8547461122568418, "percentage": 85.47, "elapsed_time": "1 day, 12:17:40", "remaining_time": "6:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15336, "total_steps": 17941, "loss": 1.5165, "learning_rate": 5.300473256591232e-06, "epoch": 0.854801850510005, "percentage": 85.48, "elapsed_time": "1 day, 12:17:49", "remaining_time": "6:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15337, "total_steps": 17941, "loss": 1.5878, "learning_rate": 5.296484103176291e-06, "epoch": 0.8548575887631682, "percentage": 85.49, "elapsed_time": "1 day, 12:17:57", "remaining_time": "6:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15338, "total_steps": 17941, "loss": 1.5214, "learning_rate": 5.292496367496231e-06, "epoch": 0.8549133270163313, "percentage": 85.49, "elapsed_time": "1 day, 12:18:07", "remaining_time": "6:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15339, "total_steps": 17941, "loss": 1.6509, "learning_rate": 5.288510049677536e-06, "epoch": 0.8549690652694945, "percentage": 85.5, "elapsed_time": "1 day, 12:18:15", "remaining_time": "6:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15340, "total_steps": 17941, "loss": 1.4928, "learning_rate": 5.284525149846609e-06, "epoch": 0.8550248035226576, "percentage": 85.5, "elapsed_time": "1 day, 12:18:23", "remaining_time": "6:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15341, "total_steps": 17941, "loss": 1.5425, "learning_rate": 5.2805416681298184e-06, "epoch": 0.8550805417758207, "percentage": 85.51, "elapsed_time": "1 day, 12:18:32", "remaining_time": "6:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15342, "total_steps": 17941, "loss": 1.3634, "learning_rate": 5.276559604653536e-06, "epoch": 0.8551362800289839, "percentage": 85.51, "elapsed_time": "1 day, 12:18:40", "remaining_time": "6:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15343, "total_steps": 17941, "loss": 1.5259, "learning_rate": 5.272578959544017e-06, "epoch": 0.8551920182821471, "percentage": 85.52, "elapsed_time": "1 day, 12:18:50", "remaining_time": "6:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15344, "total_steps": 17941, "loss": 1.5523, "learning_rate": 5.268599732927521e-06, "epoch": 0.8552477565353102, "percentage": 85.52, "elapsed_time": "1 day, 12:18:58", "remaining_time": "6:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15345, "total_steps": 17941, "loss": 1.6618, "learning_rate": 5.26462192493023e-06, "epoch": 0.8553034947884733, "percentage": 85.53, "elapsed_time": "1 day, 12:19:07", "remaining_time": "6:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15346, "total_steps": 17941, "loss": 1.8076, "learning_rate": 5.2606455356783215e-06, "epoch": 0.8553592330416365, "percentage": 85.54, "elapsed_time": "1 day, 12:19:15", "remaining_time": "6:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15347, "total_steps": 17941, "loss": 1.7027, "learning_rate": 5.256670565297878e-06, "epoch": 0.8554149712947996, "percentage": 85.54, "elapsed_time": "1 day, 12:19:23", "remaining_time": "6:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15348, "total_steps": 17941, "loss": 1.7644, "learning_rate": 5.25269701391497e-06, "epoch": 0.8554707095479628, "percentage": 85.55, "elapsed_time": "1 day, 12:19:33", "remaining_time": "6:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15349, "total_steps": 17941, "loss": 1.6903, "learning_rate": 5.24872488165562e-06, "epoch": 0.855526447801126, "percentage": 85.55, "elapsed_time": "1 day, 12:19:41", "remaining_time": "6:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15350, "total_steps": 17941, "loss": 1.6964, "learning_rate": 5.244754168645793e-06, "epoch": 0.855582186054289, "percentage": 85.56, "elapsed_time": "1 day, 12:19:49", "remaining_time": "6:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15351, "total_steps": 17941, "loss": 1.6683, "learning_rate": 5.240784875011439e-06, "epoch": 0.8556379243074522, "percentage": 85.56, "elapsed_time": "1 day, 12:19:58", "remaining_time": "6:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15352, "total_steps": 17941, "loss": 1.3393, "learning_rate": 5.236817000878402e-06, "epoch": 0.8556936625606153, "percentage": 85.57, "elapsed_time": "1 day, 12:20:06", "remaining_time": "6:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15353, "total_steps": 17941, "loss": 1.6366, "learning_rate": 5.232850546372564e-06, "epoch": 0.8557494008137785, "percentage": 85.57, "elapsed_time": "1 day, 12:20:15", "remaining_time": "6:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15354, "total_steps": 17941, "loss": 1.6016, "learning_rate": 5.228885511619686e-06, "epoch": 0.8558051390669417, "percentage": 85.58, "elapsed_time": "1 day, 12:20:23", "remaining_time": "6:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15355, "total_steps": 17941, "loss": 1.3442, "learning_rate": 5.2249218967455215e-06, "epoch": 0.8558608773201047, "percentage": 85.59, "elapsed_time": "1 day, 12:20:32", "remaining_time": "6:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15356, "total_steps": 17941, "loss": 1.7464, "learning_rate": 5.220959701875783e-06, "epoch": 0.8559166155732679, "percentage": 85.59, "elapsed_time": "1 day, 12:20:40", "remaining_time": "6:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15357, "total_steps": 17941, "loss": 1.5449, "learning_rate": 5.216998927136118e-06, "epoch": 0.8559723538264311, "percentage": 85.6, "elapsed_time": "1 day, 12:20:49", "remaining_time": "6:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15358, "total_steps": 17941, "loss": 1.5248, "learning_rate": 5.213039572652162e-06, "epoch": 0.8560280920795942, "percentage": 85.6, "elapsed_time": "1 day, 12:20:57", "remaining_time": "6:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15359, "total_steps": 17941, "loss": 1.7179, "learning_rate": 5.209081638549446e-06, "epoch": 0.8560838303327574, "percentage": 85.61, "elapsed_time": "1 day, 12:21:06", "remaining_time": "6:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15360, "total_steps": 17941, "loss": 1.5125, "learning_rate": 5.205125124953514e-06, "epoch": 0.8561395685859206, "percentage": 85.61, "elapsed_time": "1 day, 12:21:14", "remaining_time": "6:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15361, "total_steps": 17941, "loss": 1.6392, "learning_rate": 5.201170031989844e-06, "epoch": 0.8561953068390836, "percentage": 85.62, "elapsed_time": "1 day, 12:21:23", "remaining_time": "6:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15362, "total_steps": 17941, "loss": 1.709, "learning_rate": 5.197216359783863e-06, "epoch": 0.8562510450922468, "percentage": 85.63, "elapsed_time": "1 day, 12:21:31", "remaining_time": "6:06:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15363, "total_steps": 17941, "loss": 1.5904, "learning_rate": 5.19326410846096e-06, "epoch": 0.85630678334541, "percentage": 85.63, "elapsed_time": "1 day, 12:21:40", "remaining_time": "6:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15364, "total_steps": 17941, "loss": 1.6574, "learning_rate": 5.18931327814648e-06, "epoch": 0.8563625215985731, "percentage": 85.64, "elapsed_time": "1 day, 12:21:48", "remaining_time": "6:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15365, "total_steps": 17941, "loss": 1.6079, "learning_rate": 5.185363868965726e-06, "epoch": 0.8564182598517363, "percentage": 85.64, "elapsed_time": "1 day, 12:21:56", "remaining_time": "6:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15366, "total_steps": 17941, "loss": 1.6236, "learning_rate": 5.181415881043933e-06, "epoch": 0.8564739981048994, "percentage": 85.65, "elapsed_time": "1 day, 12:22:05", "remaining_time": "6:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15367, "total_steps": 17941, "loss": 1.7752, "learning_rate": 5.177469314506317e-06, "epoch": 0.8565297363580625, "percentage": 85.65, "elapsed_time": "1 day, 12:22:13", "remaining_time": "6:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15368, "total_steps": 17941, "loss": 1.4805, "learning_rate": 5.173524169478045e-06, "epoch": 0.8565854746112257, "percentage": 85.66, "elapsed_time": "1 day, 12:22:22", "remaining_time": "6:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15369, "total_steps": 17941, "loss": 1.4595, "learning_rate": 5.1695804460842264e-06, "epoch": 0.8566412128643889, "percentage": 85.66, "elapsed_time": "1 day, 12:22:30", "remaining_time": "6:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15370, "total_steps": 17941, "loss": 1.714, "learning_rate": 5.165638144449936e-06, "epoch": 0.856696951117552, "percentage": 85.67, "elapsed_time": "1 day, 12:22:39", "remaining_time": "6:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15371, "total_steps": 17941, "loss": 1.5827, "learning_rate": 5.161697264700205e-06, "epoch": 0.8567526893707151, "percentage": 85.68, "elapsed_time": "1 day, 12:22:47", "remaining_time": "6:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15372, "total_steps": 17941, "loss": 1.6936, "learning_rate": 5.1577578069600174e-06, "epoch": 0.8568084276238783, "percentage": 85.68, "elapsed_time": "1 day, 12:22:56", "remaining_time": "6:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15373, "total_steps": 17941, "loss": 1.5163, "learning_rate": 5.153819771354296e-06, "epoch": 0.8568641658770414, "percentage": 85.69, "elapsed_time": "1 day, 12:23:05", "remaining_time": "6:04:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15374, "total_steps": 17941, "loss": 1.3902, "learning_rate": 5.14988315800794e-06, "epoch": 0.8569199041302046, "percentage": 85.69, "elapsed_time": "1 day, 12:23:14", "remaining_time": "6:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15375, "total_steps": 17941, "loss": 1.443, "learning_rate": 5.145947967045794e-06, "epoch": 0.8569756423833677, "percentage": 85.7, "elapsed_time": "1 day, 12:23:22", "remaining_time": "6:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15376, "total_steps": 17941, "loss": 1.8804, "learning_rate": 5.142014198592665e-06, "epoch": 0.8570313806365308, "percentage": 85.7, "elapsed_time": "1 day, 12:23:31", "remaining_time": "6:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15377, "total_steps": 17941, "loss": 1.5493, "learning_rate": 5.138081852773313e-06, "epoch": 0.857087118889694, "percentage": 85.71, "elapsed_time": "1 day, 12:23:40", "remaining_time": "6:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15378, "total_steps": 17941, "loss": 1.8992, "learning_rate": 5.134150929712417e-06, "epoch": 0.8571428571428571, "percentage": 85.71, "elapsed_time": "1 day, 12:23:48", "remaining_time": "6:03:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15379, "total_steps": 17941, "loss": 1.6225, "learning_rate": 5.130221429534693e-06, "epoch": 0.8571985953960203, "percentage": 85.72, "elapsed_time": "1 day, 12:23:57", "remaining_time": "6:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15380, "total_steps": 17941, "loss": 1.7471, "learning_rate": 5.126293352364725e-06, "epoch": 0.8572543336491835, "percentage": 85.73, "elapsed_time": "1 day, 12:24:05", "remaining_time": "6:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15381, "total_steps": 17941, "loss": 1.6856, "learning_rate": 5.1223666983271025e-06, "epoch": 0.8573100719023465, "percentage": 85.73, "elapsed_time": "1 day, 12:24:14", "remaining_time": "6:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15382, "total_steps": 17941, "loss": 1.5704, "learning_rate": 5.118441467546348e-06, "epoch": 0.8573658101555097, "percentage": 85.74, "elapsed_time": "1 day, 12:24:22", "remaining_time": "6:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15383, "total_steps": 17941, "loss": 1.6813, "learning_rate": 5.114517660146956e-06, "epoch": 0.8574215484086729, "percentage": 85.74, "elapsed_time": "1 day, 12:24:32", "remaining_time": "6:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15384, "total_steps": 17941, "loss": 1.54, "learning_rate": 5.110595276253377e-06, "epoch": 0.857477286661836, "percentage": 85.75, "elapsed_time": "1 day, 12:24:40", "remaining_time": "6:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15385, "total_steps": 17941, "loss": 1.4813, "learning_rate": 5.106674315989968e-06, "epoch": 0.8575330249149992, "percentage": 85.75, "elapsed_time": "1 day, 12:24:48", "remaining_time": "6:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15386, "total_steps": 17941, "loss": 1.7306, "learning_rate": 5.102754779481122e-06, "epoch": 0.8575887631681623, "percentage": 85.76, "elapsed_time": "1 day, 12:24:57", "remaining_time": "6:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15387, "total_steps": 17941, "loss": 1.5453, "learning_rate": 5.09883666685112e-06, "epoch": 0.8576445014213254, "percentage": 85.76, "elapsed_time": "1 day, 12:25:05", "remaining_time": "6:02:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15388, "total_steps": 17941, "loss": 1.5683, "learning_rate": 5.094919978224222e-06, "epoch": 0.8577002396744886, "percentage": 85.77, "elapsed_time": "1 day, 12:25:14", "remaining_time": "6:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15389, "total_steps": 17941, "loss": 1.706, "learning_rate": 5.091004713724651e-06, "epoch": 0.8577559779276518, "percentage": 85.78, "elapsed_time": "1 day, 12:25:22", "remaining_time": "6:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15390, "total_steps": 17941, "loss": 1.7164, "learning_rate": 5.087090873476569e-06, "epoch": 0.8578117161808149, "percentage": 85.78, "elapsed_time": "1 day, 12:25:31", "remaining_time": "6:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15391, "total_steps": 17941, "loss": 1.4208, "learning_rate": 5.083178457604115e-06, "epoch": 0.857867454433978, "percentage": 85.79, "elapsed_time": "1 day, 12:25:39", "remaining_time": "6:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15392, "total_steps": 17941, "loss": 1.5262, "learning_rate": 5.079267466231352e-06, "epoch": 0.8579231926871412, "percentage": 85.79, "elapsed_time": "1 day, 12:25:48", "remaining_time": "6:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15393, "total_steps": 17941, "loss": 1.6433, "learning_rate": 5.075357899482314e-06, "epoch": 0.8579789309403043, "percentage": 85.8, "elapsed_time": "1 day, 12:25:57", "remaining_time": "6:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15394, "total_steps": 17941, "loss": 1.4153, "learning_rate": 5.071449757480995e-06, "epoch": 0.8580346691934675, "percentage": 85.8, "elapsed_time": "1 day, 12:26:05", "remaining_time": "6:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15395, "total_steps": 17941, "loss": 1.7719, "learning_rate": 5.067543040351341e-06, "epoch": 0.8580904074466307, "percentage": 85.81, "elapsed_time": "1 day, 12:26:14", "remaining_time": "6:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15396, "total_steps": 17941, "loss": 1.6683, "learning_rate": 5.063637748217248e-06, "epoch": 0.8581461456997937, "percentage": 85.81, "elapsed_time": "1 day, 12:26:22", "remaining_time": "6:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15397, "total_steps": 17941, "loss": 1.8132, "learning_rate": 5.059733881202567e-06, "epoch": 0.8582018839529569, "percentage": 85.82, "elapsed_time": "1 day, 12:26:30", "remaining_time": "6:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15398, "total_steps": 17941, "loss": 1.4149, "learning_rate": 5.055831439431114e-06, "epoch": 0.85825762220612, "percentage": 85.83, "elapsed_time": "1 day, 12:26:39", "remaining_time": "6:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15399, "total_steps": 17941, "loss": 1.7472, "learning_rate": 5.051930423026641e-06, "epoch": 0.8583133604592832, "percentage": 85.83, "elapsed_time": "1 day, 12:26:47", "remaining_time": "6:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15400, "total_steps": 17941, "loss": 1.7392, "learning_rate": 5.048030832112865e-06, "epoch": 0.8583690987124464, "percentage": 85.84, "elapsed_time": "1 day, 12:26:56", "remaining_time": "6:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15401, "total_steps": 17941, "loss": 1.6323, "learning_rate": 5.044132666813461e-06, "epoch": 0.8584248369656095, "percentage": 85.84, "elapsed_time": "1 day, 12:27:04", "remaining_time": "6:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15402, "total_steps": 17941, "loss": 1.7079, "learning_rate": 5.040235927252063e-06, "epoch": 0.8584805752187726, "percentage": 85.85, "elapsed_time": "1 day, 12:27:13", "remaining_time": "6:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15403, "total_steps": 17941, "loss": 1.7767, "learning_rate": 5.036340613552254e-06, "epoch": 0.8585363134719358, "percentage": 85.85, "elapsed_time": "1 day, 12:27:21", "remaining_time": "6:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15404, "total_steps": 17941, "loss": 1.487, "learning_rate": 5.032446725837547e-06, "epoch": 0.8585920517250989, "percentage": 85.86, "elapsed_time": "1 day, 12:27:30", "remaining_time": "6:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15405, "total_steps": 17941, "loss": 1.5984, "learning_rate": 5.028554264231472e-06, "epoch": 0.8586477899782621, "percentage": 85.86, "elapsed_time": "1 day, 12:27:38", "remaining_time": "6:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15406, "total_steps": 17941, "loss": 1.5717, "learning_rate": 5.02466322885744e-06, "epoch": 0.8587035282314253, "percentage": 85.87, "elapsed_time": "1 day, 12:27:47", "remaining_time": "5:59:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15407, "total_steps": 17941, "loss": 1.3869, "learning_rate": 5.02077361983887e-06, "epoch": 0.8587592664845883, "percentage": 85.88, "elapsed_time": "1 day, 12:27:55", "remaining_time": "5:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15408, "total_steps": 17941, "loss": 1.4508, "learning_rate": 5.0168854372991125e-06, "epoch": 0.8588150047377515, "percentage": 85.88, "elapsed_time": "1 day, 12:28:04", "remaining_time": "5:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15409, "total_steps": 17941, "loss": 1.617, "learning_rate": 5.012998681361475e-06, "epoch": 0.8588707429909147, "percentage": 85.89, "elapsed_time": "1 day, 12:28:12", "remaining_time": "5:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15410, "total_steps": 17941, "loss": 1.6986, "learning_rate": 5.0091133521492415e-06, "epoch": 0.8589264812440778, "percentage": 85.89, "elapsed_time": "1 day, 12:28:21", "remaining_time": "5:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15411, "total_steps": 17941, "loss": 1.4624, "learning_rate": 5.005229449785598e-06, "epoch": 0.858982219497241, "percentage": 85.9, "elapsed_time": "1 day, 12:28:29", "remaining_time": "5:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15412, "total_steps": 17941, "loss": 1.6463, "learning_rate": 5.001346974393755e-06, "epoch": 0.8590379577504041, "percentage": 85.9, "elapsed_time": "1 day, 12:28:38", "remaining_time": "5:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15413, "total_steps": 17941, "loss": 1.6815, "learning_rate": 4.997465926096817e-06, "epoch": 0.8590936960035672, "percentage": 85.91, "elapsed_time": "1 day, 12:28:46", "remaining_time": "5:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15414, "total_steps": 17941, "loss": 1.575, "learning_rate": 4.993586305017878e-06, "epoch": 0.8591494342567304, "percentage": 85.91, "elapsed_time": "1 day, 12:28:55", "remaining_time": "5:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15415, "total_steps": 17941, "loss": 1.5276, "learning_rate": 4.9897081112799725e-06, "epoch": 0.8592051725098936, "percentage": 85.92, "elapsed_time": "1 day, 12:29:03", "remaining_time": "5:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15416, "total_steps": 17941, "loss": 1.6019, "learning_rate": 4.985831345006103e-06, "epoch": 0.8592609107630567, "percentage": 85.93, "elapsed_time": "1 day, 12:29:12", "remaining_time": "5:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15417, "total_steps": 17941, "loss": 1.5506, "learning_rate": 4.981956006319216e-06, "epoch": 0.8593166490162198, "percentage": 85.93, "elapsed_time": "1 day, 12:29:20", "remaining_time": "5:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15418, "total_steps": 17941, "loss": 1.6915, "learning_rate": 4.978082095342207e-06, "epoch": 0.859372387269383, "percentage": 85.94, "elapsed_time": "1 day, 12:29:28", "remaining_time": "5:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15419, "total_steps": 17941, "loss": 1.7283, "learning_rate": 4.974209612197933e-06, "epoch": 0.8594281255225461, "percentage": 85.94, "elapsed_time": "1 day, 12:29:37", "remaining_time": "5:58:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15420, "total_steps": 17941, "loss": 1.575, "learning_rate": 4.970338557009219e-06, "epoch": 0.8594838637757093, "percentage": 85.95, "elapsed_time": "1 day, 12:29:46", "remaining_time": "5:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15421, "total_steps": 17941, "loss": 1.4879, "learning_rate": 4.9664689298988155e-06, "epoch": 0.8595396020288724, "percentage": 85.95, "elapsed_time": "1 day, 12:29:54", "remaining_time": "5:57:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15422, "total_steps": 17941, "loss": 1.5325, "learning_rate": 4.962600730989459e-06, "epoch": 0.8595953402820355, "percentage": 85.96, "elapsed_time": "1 day, 12:30:03", "remaining_time": "5:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15423, "total_steps": 17941, "loss": 1.7003, "learning_rate": 4.958733960403822e-06, "epoch": 0.8596510785351987, "percentage": 85.97, "elapsed_time": "1 day, 12:30:11", "remaining_time": "5:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15424, "total_steps": 17941, "loss": 1.6402, "learning_rate": 4.954868618264541e-06, "epoch": 0.8597068167883618, "percentage": 85.97, "elapsed_time": "1 day, 12:30:19", "remaining_time": "5:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15425, "total_steps": 17941, "loss": 1.5105, "learning_rate": 4.95100470469419e-06, "epoch": 0.859762555041525, "percentage": 85.98, "elapsed_time": "1 day, 12:30:28", "remaining_time": "5:57:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15426, "total_steps": 17941, "loss": 1.6836, "learning_rate": 4.947142219815315e-06, "epoch": 0.8598182932946882, "percentage": 85.98, "elapsed_time": "1 day, 12:30:37", "remaining_time": "5:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15427, "total_steps": 17941, "loss": 1.4754, "learning_rate": 4.943281163750413e-06, "epoch": 0.8598740315478512, "percentage": 85.99, "elapsed_time": "1 day, 12:30:45", "remaining_time": "5:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15428, "total_steps": 17941, "loss": 1.7882, "learning_rate": 4.9394215366219296e-06, "epoch": 0.8599297698010144, "percentage": 85.99, "elapsed_time": "1 day, 12:30:54", "remaining_time": "5:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15429, "total_steps": 17941, "loss": 1.8442, "learning_rate": 4.9355633385522905e-06, "epoch": 0.8599855080541776, "percentage": 86.0, "elapsed_time": "1 day, 12:31:02", "remaining_time": "5:56:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15430, "total_steps": 17941, "loss": 1.6857, "learning_rate": 4.931706569663813e-06, "epoch": 0.8600412463073407, "percentage": 86.0, "elapsed_time": "1 day, 12:31:11", "remaining_time": "5:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15431, "total_steps": 17941, "loss": 1.5753, "learning_rate": 4.9278512300788556e-06, "epoch": 0.8600969845605039, "percentage": 86.01, "elapsed_time": "1 day, 12:31:19", "remaining_time": "5:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15432, "total_steps": 17941, "loss": 1.5379, "learning_rate": 4.92399731991966e-06, "epoch": 0.8601527228136671, "percentage": 86.02, "elapsed_time": "1 day, 12:31:27", "remaining_time": "5:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15433, "total_steps": 17941, "loss": 1.6328, "learning_rate": 4.92014483930846e-06, "epoch": 0.8602084610668301, "percentage": 86.02, "elapsed_time": "1 day, 12:31:36", "remaining_time": "5:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15434, "total_steps": 17941, "loss": 1.6785, "learning_rate": 4.916293788367432e-06, "epoch": 0.8602641993199933, "percentage": 86.03, "elapsed_time": "1 day, 12:31:44", "remaining_time": "5:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15435, "total_steps": 17941, "loss": 1.8026, "learning_rate": 4.912444167218705e-06, "epoch": 0.8603199375731565, "percentage": 86.03, "elapsed_time": "1 day, 12:31:53", "remaining_time": "5:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15436, "total_steps": 17941, "loss": 1.5967, "learning_rate": 4.908595975984387e-06, "epoch": 0.8603756758263196, "percentage": 86.04, "elapsed_time": "1 day, 12:32:01", "remaining_time": "5:55:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15437, "total_steps": 17941, "loss": 1.3421, "learning_rate": 4.904749214786475e-06, "epoch": 0.8604314140794828, "percentage": 86.04, "elapsed_time": "1 day, 12:32:10", "remaining_time": "5:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15438, "total_steps": 17941, "loss": 1.7279, "learning_rate": 4.900903883747021e-06, "epoch": 0.8604871523326459, "percentage": 86.05, "elapsed_time": "1 day, 12:32:18", "remaining_time": "5:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15439, "total_steps": 17941, "loss": 1.6473, "learning_rate": 4.897059982987939e-06, "epoch": 0.860542890585809, "percentage": 86.05, "elapsed_time": "1 day, 12:32:27", "remaining_time": "5:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15440, "total_steps": 17941, "loss": 1.7516, "learning_rate": 4.893217512631143e-06, "epoch": 0.8605986288389722, "percentage": 86.06, "elapsed_time": "1 day, 12:32:35", "remaining_time": "5:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15441, "total_steps": 17941, "loss": 1.8468, "learning_rate": 4.889376472798502e-06, "epoch": 0.8606543670921354, "percentage": 86.07, "elapsed_time": "1 day, 12:32:43", "remaining_time": "5:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15442, "total_steps": 17941, "loss": 1.6379, "learning_rate": 4.8855368636118175e-06, "epoch": 0.8607101053452985, "percentage": 86.07, "elapsed_time": "1 day, 12:32:52", "remaining_time": "5:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15443, "total_steps": 17941, "loss": 1.6127, "learning_rate": 4.881698685192887e-06, "epoch": 0.8607658435984616, "percentage": 86.08, "elapsed_time": "1 day, 12:33:00", "remaining_time": "5:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15444, "total_steps": 17941, "loss": 1.487, "learning_rate": 4.877861937663397e-06, "epoch": 0.8608215818516247, "percentage": 86.08, "elapsed_time": "1 day, 12:33:09", "remaining_time": "5:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15445, "total_steps": 17941, "loss": 1.4375, "learning_rate": 4.874026621145055e-06, "epoch": 0.8608773201047879, "percentage": 86.09, "elapsed_time": "1 day, 12:33:17", "remaining_time": "5:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15446, "total_steps": 17941, "loss": 1.7431, "learning_rate": 4.870192735759482e-06, "epoch": 0.8609330583579511, "percentage": 86.09, "elapsed_time": "1 day, 12:33:26", "remaining_time": "5:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15447, "total_steps": 17941, "loss": 1.5807, "learning_rate": 4.866360281628268e-06, "epoch": 0.8609887966111142, "percentage": 86.1, "elapsed_time": "1 day, 12:33:34", "remaining_time": "5:54:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15448, "total_steps": 17941, "loss": 1.8166, "learning_rate": 4.862529258872961e-06, "epoch": 0.8610445348642773, "percentage": 86.1, "elapsed_time": "1 day, 12:33:43", "remaining_time": "5:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15449, "total_steps": 17941, "loss": 1.4941, "learning_rate": 4.858699667615057e-06, "epoch": 0.8611002731174405, "percentage": 86.11, "elapsed_time": "1 day, 12:33:51", "remaining_time": "5:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15450, "total_steps": 17941, "loss": 1.8157, "learning_rate": 4.8548715079760166e-06, "epoch": 0.8611560113706036, "percentage": 86.12, "elapsed_time": "1 day, 12:34:00", "remaining_time": "5:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15451, "total_steps": 17941, "loss": 1.641, "learning_rate": 4.85104478007723e-06, "epoch": 0.8612117496237668, "percentage": 86.12, "elapsed_time": "1 day, 12:34:08", "remaining_time": "5:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15452, "total_steps": 17941, "loss": 1.7062, "learning_rate": 4.847219484040055e-06, "epoch": 0.86126748787693, "percentage": 86.13, "elapsed_time": "1 day, 12:34:17", "remaining_time": "5:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15453, "total_steps": 17941, "loss": 1.5513, "learning_rate": 4.843395619985836e-06, "epoch": 0.861323226130093, "percentage": 86.13, "elapsed_time": "1 day, 12:34:25", "remaining_time": "5:53:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15454, "total_steps": 17941, "loss": 1.7844, "learning_rate": 4.839573188035818e-06, "epoch": 0.8613789643832562, "percentage": 86.14, "elapsed_time": "1 day, 12:34:34", "remaining_time": "5:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15455, "total_steps": 17941, "loss": 1.6284, "learning_rate": 4.835752188311249e-06, "epoch": 0.8614347026364194, "percentage": 86.14, "elapsed_time": "1 day, 12:34:42", "remaining_time": "5:53:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15456, "total_steps": 17941, "loss": 1.7408, "learning_rate": 4.8319326209332715e-06, "epoch": 0.8614904408895825, "percentage": 86.15, "elapsed_time": "1 day, 12:34:51", "remaining_time": "5:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15457, "total_steps": 17941, "loss": 1.6529, "learning_rate": 4.828114486023061e-06, "epoch": 0.8615461791427457, "percentage": 86.15, "elapsed_time": "1 day, 12:34:59", "remaining_time": "5:52:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15458, "total_steps": 17941, "loss": 1.429, "learning_rate": 4.824297783701681e-06, "epoch": 0.8616019173959089, "percentage": 86.16, "elapsed_time": "1 day, 12:35:08", "remaining_time": "5:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15459, "total_steps": 17941, "loss": 1.7355, "learning_rate": 4.82048251409018e-06, "epoch": 0.8616576556490719, "percentage": 86.17, "elapsed_time": "1 day, 12:35:16", "remaining_time": "5:52:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15460, "total_steps": 17941, "loss": 1.6579, "learning_rate": 4.816668677309566e-06, "epoch": 0.8617133939022351, "percentage": 86.17, "elapsed_time": "1 day, 12:35:24", "remaining_time": "5:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15461, "total_steps": 17941, "loss": 1.8092, "learning_rate": 4.812856273480776e-06, "epoch": 0.8617691321553983, "percentage": 86.18, "elapsed_time": "1 day, 12:35:33", "remaining_time": "5:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15462, "total_steps": 17941, "loss": 1.6346, "learning_rate": 4.80904530272474e-06, "epoch": 0.8618248704085614, "percentage": 86.18, "elapsed_time": "1 day, 12:35:41", "remaining_time": "5:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15463, "total_steps": 17941, "loss": 1.4948, "learning_rate": 4.805235765162286e-06, "epoch": 0.8618806086617246, "percentage": 86.19, "elapsed_time": "1 day, 12:35:50", "remaining_time": "5:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15464, "total_steps": 17941, "loss": 1.5347, "learning_rate": 4.801427660914265e-06, "epoch": 0.8619363469148877, "percentage": 86.19, "elapsed_time": "1 day, 12:35:58", "remaining_time": "5:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15465, "total_steps": 17941, "loss": 1.9691, "learning_rate": 4.797620990101431e-06, "epoch": 0.8619920851680508, "percentage": 86.2, "elapsed_time": "1 day, 12:36:07", "remaining_time": "5:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15466, "total_steps": 17941, "loss": 1.7786, "learning_rate": 4.793815752844505e-06, "epoch": 0.862047823421214, "percentage": 86.2, "elapsed_time": "1 day, 12:36:15", "remaining_time": "5:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15467, "total_steps": 17941, "loss": 1.4825, "learning_rate": 4.7900119492641726e-06, "epoch": 0.8621035616743771, "percentage": 86.21, "elapsed_time": "1 day, 12:36:24", "remaining_time": "5:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15468, "total_steps": 17941, "loss": 1.445, "learning_rate": 4.786209579481072e-06, "epoch": 0.8621592999275403, "percentage": 86.22, "elapsed_time": "1 day, 12:36:32", "remaining_time": "5:51:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15469, "total_steps": 17941, "loss": 1.4002, "learning_rate": 4.782408643615799e-06, "epoch": 0.8622150381807034, "percentage": 86.22, "elapsed_time": "1 day, 12:36:41", "remaining_time": "5:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15470, "total_steps": 17941, "loss": 1.4445, "learning_rate": 4.77860914178887e-06, "epoch": 0.8622707764338665, "percentage": 86.23, "elapsed_time": "1 day, 12:36:49", "remaining_time": "5:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15471, "total_steps": 17941, "loss": 1.6644, "learning_rate": 4.774811074120805e-06, "epoch": 0.8623265146870297, "percentage": 86.23, "elapsed_time": "1 day, 12:36:58", "remaining_time": "5:50:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15472, "total_steps": 17941, "loss": 1.62, "learning_rate": 4.771014440732052e-06, "epoch": 0.8623822529401929, "percentage": 86.24, "elapsed_time": "1 day, 12:37:06", "remaining_time": "5:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15473, "total_steps": 17941, "loss": 1.7278, "learning_rate": 4.76721924174302e-06, "epoch": 0.862437991193356, "percentage": 86.24, "elapsed_time": "1 day, 12:37:15", "remaining_time": "5:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15474, "total_steps": 17941, "loss": 1.4852, "learning_rate": 4.763425477274064e-06, "epoch": 0.8624937294465191, "percentage": 86.25, "elapsed_time": "1 day, 12:37:23", "remaining_time": "5:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15475, "total_steps": 17941, "loss": 1.7785, "learning_rate": 4.759633147445508e-06, "epoch": 0.8625494676996823, "percentage": 86.25, "elapsed_time": "1 day, 12:37:32", "remaining_time": "5:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15476, "total_steps": 17941, "loss": 1.7309, "learning_rate": 4.755842252377629e-06, "epoch": 0.8626052059528454, "percentage": 86.26, "elapsed_time": "1 day, 12:37:40", "remaining_time": "5:50:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15477, "total_steps": 17941, "loss": 1.6361, "learning_rate": 4.752052792190625e-06, "epoch": 0.8626609442060086, "percentage": 86.27, "elapsed_time": "1 day, 12:37:49", "remaining_time": "5:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15478, "total_steps": 17941, "loss": 1.7223, "learning_rate": 4.748264767004701e-06, "epoch": 0.8627166824591718, "percentage": 86.27, "elapsed_time": "1 day, 12:37:58", "remaining_time": "5:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15479, "total_steps": 17941, "loss": 1.8503, "learning_rate": 4.744478176939976e-06, "epoch": 0.8627724207123348, "percentage": 86.28, "elapsed_time": "1 day, 12:38:06", "remaining_time": "5:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15480, "total_steps": 17941, "loss": 1.8527, "learning_rate": 4.740693022116549e-06, "epoch": 0.862828158965498, "percentage": 86.28, "elapsed_time": "1 day, 12:38:14", "remaining_time": "5:49:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15481, "total_steps": 17941, "loss": 1.5862, "learning_rate": 4.736909302654469e-06, "epoch": 0.8628838972186612, "percentage": 86.29, "elapsed_time": "1 day, 12:38:23", "remaining_time": "5:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15482, "total_steps": 17941, "loss": 1.3339, "learning_rate": 4.7331270186737055e-06, "epoch": 0.8629396354718243, "percentage": 86.29, "elapsed_time": "1 day, 12:38:31", "remaining_time": "5:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15483, "total_steps": 17941, "loss": 1.6642, "learning_rate": 4.729346170294247e-06, "epoch": 0.8629953737249875, "percentage": 86.3, "elapsed_time": "1 day, 12:38:40", "remaining_time": "5:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15484, "total_steps": 17941, "loss": 1.4468, "learning_rate": 4.725566757635969e-06, "epoch": 0.8630511119781507, "percentage": 86.31, "elapsed_time": "1 day, 12:38:48", "remaining_time": "5:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15485, "total_steps": 17941, "loss": 1.6472, "learning_rate": 4.721788780818748e-06, "epoch": 0.8631068502313137, "percentage": 86.31, "elapsed_time": "1 day, 12:38:57", "remaining_time": "5:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15486, "total_steps": 17941, "loss": 1.5244, "learning_rate": 4.718012239962399e-06, "epoch": 0.8631625884844769, "percentage": 86.32, "elapsed_time": "1 day, 12:39:05", "remaining_time": "5:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15487, "total_steps": 17941, "loss": 2.0101, "learning_rate": 4.714237135186689e-06, "epoch": 0.8632183267376401, "percentage": 86.32, "elapsed_time": "1 day, 12:39:14", "remaining_time": "5:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15488, "total_steps": 17941, "loss": 1.5559, "learning_rate": 4.710463466611348e-06, "epoch": 0.8632740649908032, "percentage": 86.33, "elapsed_time": "1 day, 12:39:22", "remaining_time": "5:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15489, "total_steps": 17941, "loss": 1.485, "learning_rate": 4.706691234356031e-06, "epoch": 0.8633298032439664, "percentage": 86.33, "elapsed_time": "1 day, 12:39:30", "remaining_time": "5:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15490, "total_steps": 17941, "loss": 1.6059, "learning_rate": 4.702920438540409e-06, "epoch": 0.8633855414971294, "percentage": 86.34, "elapsed_time": "1 day, 12:39:39", "remaining_time": "5:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15491, "total_steps": 17941, "loss": 1.5789, "learning_rate": 4.699151079284042e-06, "epoch": 0.8634412797502926, "percentage": 86.34, "elapsed_time": "1 day, 12:39:47", "remaining_time": "5:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15492, "total_steps": 17941, "loss": 1.675, "learning_rate": 4.695383156706484e-06, "epoch": 0.8634970180034558, "percentage": 86.35, "elapsed_time": "1 day, 12:39:56", "remaining_time": "5:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15493, "total_steps": 17941, "loss": 1.5333, "learning_rate": 4.691616670927224e-06, "epoch": 0.8635527562566189, "percentage": 86.36, "elapsed_time": "1 day, 12:40:05", "remaining_time": "5:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15494, "total_steps": 17941, "loss": 1.4639, "learning_rate": 4.68785162206572e-06, "epoch": 0.863608494509782, "percentage": 86.36, "elapsed_time": "1 day, 12:40:14", "remaining_time": "5:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15495, "total_steps": 17941, "loss": 1.79, "learning_rate": 4.684088010241377e-06, "epoch": 0.8636642327629452, "percentage": 86.37, "elapsed_time": "1 day, 12:40:22", "remaining_time": "5:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15496, "total_steps": 17941, "loss": 1.6528, "learning_rate": 4.680325835573551e-06, "epoch": 0.8637199710161083, "percentage": 86.37, "elapsed_time": "1 day, 12:40:30", "remaining_time": "5:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15497, "total_steps": 17941, "loss": 1.7418, "learning_rate": 4.676565098181551e-06, "epoch": 0.8637757092692715, "percentage": 86.38, "elapsed_time": "1 day, 12:40:39", "remaining_time": "5:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15498, "total_steps": 17941, "loss": 1.8748, "learning_rate": 4.6728057981846596e-06, "epoch": 0.8638314475224347, "percentage": 86.38, "elapsed_time": "1 day, 12:40:47", "remaining_time": "5:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15499, "total_steps": 17941, "loss": 1.599, "learning_rate": 4.669047935702087e-06, "epoch": 0.8638871857755978, "percentage": 86.39, "elapsed_time": "1 day, 12:40:56", "remaining_time": "5:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15500, "total_steps": 17941, "loss": 1.6501, "learning_rate": 4.665291510853015e-06, "epoch": 0.8639429240287609, "percentage": 86.39, "elapsed_time": "1 day, 12:41:04", "remaining_time": "5:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15501, "total_steps": 17941, "loss": 1.7524, "learning_rate": 4.661536523756576e-06, "epoch": 0.8639986622819241, "percentage": 86.4, "elapsed_time": "1 day, 12:41:13", "remaining_time": "5:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15502, "total_steps": 17941, "loss": 1.5037, "learning_rate": 4.6577829745318714e-06, "epoch": 0.8640544005350872, "percentage": 86.41, "elapsed_time": "1 day, 12:41:21", "remaining_time": "5:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15503, "total_steps": 17941, "loss": 1.6441, "learning_rate": 4.654030863297915e-06, "epoch": 0.8641101387882504, "percentage": 86.41, "elapsed_time": "1 day, 12:41:29", "remaining_time": "5:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15504, "total_steps": 17941, "loss": 1.593, "learning_rate": 4.650280190173717e-06, "epoch": 0.8641658770414136, "percentage": 86.42, "elapsed_time": "1 day, 12:41:38", "remaining_time": "5:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15505, "total_steps": 17941, "loss": 1.7073, "learning_rate": 4.6465309552782224e-06, "epoch": 0.8642216152945766, "percentage": 86.42, "elapsed_time": "1 day, 12:41:46", "remaining_time": "5:45:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15506, "total_steps": 17941, "loss": 1.6903, "learning_rate": 4.642783158730335e-06, "epoch": 0.8642773535477398, "percentage": 86.43, "elapsed_time": "1 day, 12:41:55", "remaining_time": "5:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15507, "total_steps": 17941, "loss": 1.8398, "learning_rate": 4.639036800648927e-06, "epoch": 0.864333091800903, "percentage": 86.43, "elapsed_time": "1 day, 12:42:03", "remaining_time": "5:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15508, "total_steps": 17941, "loss": 1.5834, "learning_rate": 4.635291881152776e-06, "epoch": 0.8643888300540661, "percentage": 86.44, "elapsed_time": "1 day, 12:42:12", "remaining_time": "5:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15509, "total_steps": 17941, "loss": 1.6087, "learning_rate": 4.631548400360697e-06, "epoch": 0.8644445683072293, "percentage": 86.44, "elapsed_time": "1 day, 12:42:20", "remaining_time": "5:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15510, "total_steps": 17941, "loss": 1.5439, "learning_rate": 4.627806358391374e-06, "epoch": 0.8645003065603925, "percentage": 86.45, "elapsed_time": "1 day, 12:42:29", "remaining_time": "5:45:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15511, "total_steps": 17941, "loss": 1.7105, "learning_rate": 4.624065755363494e-06, "epoch": 0.8645560448135555, "percentage": 86.46, "elapsed_time": "1 day, 12:42:37", "remaining_time": "5:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15512, "total_steps": 17941, "loss": 1.5566, "learning_rate": 4.620326591395685e-06, "epoch": 0.8646117830667187, "percentage": 86.46, "elapsed_time": "1 day, 12:42:45", "remaining_time": "5:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15513, "total_steps": 17941, "loss": 1.6774, "learning_rate": 4.616588866606542e-06, "epoch": 0.8646675213198818, "percentage": 86.47, "elapsed_time": "1 day, 12:42:54", "remaining_time": "5:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15514, "total_steps": 17941, "loss": 1.4555, "learning_rate": 4.612852581114602e-06, "epoch": 0.864723259573045, "percentage": 86.47, "elapsed_time": "1 day, 12:43:02", "remaining_time": "5:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15515, "total_steps": 17941, "loss": 1.6735, "learning_rate": 4.609117735038332e-06, "epoch": 0.8647789978262082, "percentage": 86.48, "elapsed_time": "1 day, 12:43:11", "remaining_time": "5:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15516, "total_steps": 17941, "loss": 1.8024, "learning_rate": 4.605384328496221e-06, "epoch": 0.8648347360793712, "percentage": 86.48, "elapsed_time": "1 day, 12:43:19", "remaining_time": "5:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15517, "total_steps": 17941, "loss": 1.4956, "learning_rate": 4.60165236160664e-06, "epoch": 0.8648904743325344, "percentage": 86.49, "elapsed_time": "1 day, 12:43:28", "remaining_time": "5:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15518, "total_steps": 17941, "loss": 1.8077, "learning_rate": 4.597921834487956e-06, "epoch": 0.8649462125856976, "percentage": 86.49, "elapsed_time": "1 day, 12:43:36", "remaining_time": "5:44:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15519, "total_steps": 17941, "loss": 1.5009, "learning_rate": 4.59419274725848e-06, "epoch": 0.8650019508388607, "percentage": 86.5, "elapsed_time": "1 day, 12:43:45", "remaining_time": "5:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15520, "total_steps": 17941, "loss": 1.6073, "learning_rate": 4.590465100036473e-06, "epoch": 0.8650576890920239, "percentage": 86.51, "elapsed_time": "1 day, 12:43:53", "remaining_time": "5:43:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15521, "total_steps": 17941, "loss": 1.594, "learning_rate": 4.586738892940173e-06, "epoch": 0.865113427345187, "percentage": 86.51, "elapsed_time": "1 day, 12:44:02", "remaining_time": "5:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15522, "total_steps": 17941, "loss": 1.2062, "learning_rate": 4.58301412608772e-06, "epoch": 0.8651691655983501, "percentage": 86.52, "elapsed_time": "1 day, 12:44:11", "remaining_time": "5:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15523, "total_steps": 17941, "loss": 1.5692, "learning_rate": 4.579290799597263e-06, "epoch": 0.8652249038515133, "percentage": 86.52, "elapsed_time": "1 day, 12:44:19", "remaining_time": "5:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15524, "total_steps": 17941, "loss": 1.7171, "learning_rate": 4.57556891358688e-06, "epoch": 0.8652806421046765, "percentage": 86.53, "elapsed_time": "1 day, 12:44:28", "remaining_time": "5:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15525, "total_steps": 17941, "loss": 1.475, "learning_rate": 4.571848468174611e-06, "epoch": 0.8653363803578396, "percentage": 86.53, "elapsed_time": "1 day, 12:44:36", "remaining_time": "5:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15526, "total_steps": 17941, "loss": 1.5265, "learning_rate": 4.568129463478443e-06, "epoch": 0.8653921186110027, "percentage": 86.54, "elapsed_time": "1 day, 12:44:45", "remaining_time": "5:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15527, "total_steps": 17941, "loss": 1.5385, "learning_rate": 4.564411899616322e-06, "epoch": 0.8654478568641659, "percentage": 86.54, "elapsed_time": "1 day, 12:44:53", "remaining_time": "5:42:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15528, "total_steps": 17941, "loss": 1.8107, "learning_rate": 4.560695776706159e-06, "epoch": 0.865503595117329, "percentage": 86.55, "elapsed_time": "1 day, 12:45:02", "remaining_time": "5:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15529, "total_steps": 17941, "loss": 1.8119, "learning_rate": 4.556981094865781e-06, "epoch": 0.8655593333704922, "percentage": 86.56, "elapsed_time": "1 day, 12:45:10", "remaining_time": "5:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15530, "total_steps": 17941, "loss": 1.8444, "learning_rate": 4.553267854213017e-06, "epoch": 0.8656150716236554, "percentage": 86.56, "elapsed_time": "1 day, 12:45:19", "remaining_time": "5:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15531, "total_steps": 17941, "loss": 1.3499, "learning_rate": 4.5495560548656224e-06, "epoch": 0.8656708098768184, "percentage": 86.57, "elapsed_time": "1 day, 12:45:27", "remaining_time": "5:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15532, "total_steps": 17941, "loss": 1.6111, "learning_rate": 4.545845696941314e-06, "epoch": 0.8657265481299816, "percentage": 86.57, "elapsed_time": "1 day, 12:45:35", "remaining_time": "5:42:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15533, "total_steps": 17941, "loss": 1.6156, "learning_rate": 4.542136780557776e-06, "epoch": 0.8657822863831448, "percentage": 86.58, "elapsed_time": "1 day, 12:45:44", "remaining_time": "5:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15534, "total_steps": 17941, "loss": 1.7633, "learning_rate": 4.538429305832597e-06, "epoch": 0.8658380246363079, "percentage": 86.58, "elapsed_time": "1 day, 12:45:52", "remaining_time": "5:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15535, "total_steps": 17941, "loss": 1.7511, "learning_rate": 4.534723272883407e-06, "epoch": 0.8658937628894711, "percentage": 86.59, "elapsed_time": "1 day, 12:46:01", "remaining_time": "5:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15536, "total_steps": 17941, "loss": 1.7555, "learning_rate": 4.5310186818277035e-06, "epoch": 0.8659495011426341, "percentage": 86.59, "elapsed_time": "1 day, 12:46:09", "remaining_time": "5:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15537, "total_steps": 17941, "loss": 1.5834, "learning_rate": 4.527315532782983e-06, "epoch": 0.8660052393957973, "percentage": 86.6, "elapsed_time": "1 day, 12:46:18", "remaining_time": "5:41:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15538, "total_steps": 17941, "loss": 1.9246, "learning_rate": 4.523613825866685e-06, "epoch": 0.8660609776489605, "percentage": 86.61, "elapsed_time": "1 day, 12:46:27", "remaining_time": "5:41:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15539, "total_steps": 17941, "loss": 1.5153, "learning_rate": 4.519913561196215e-06, "epoch": 0.8661167159021236, "percentage": 86.61, "elapsed_time": "1 day, 12:46:35", "remaining_time": "5:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15540, "total_steps": 17941, "loss": 1.5956, "learning_rate": 4.51621473888893e-06, "epoch": 0.8661724541552868, "percentage": 86.62, "elapsed_time": "1 day, 12:46:44", "remaining_time": "5:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15541, "total_steps": 17941, "loss": 1.649, "learning_rate": 4.512517359062107e-06, "epoch": 0.86622819240845, "percentage": 86.62, "elapsed_time": "1 day, 12:46:52", "remaining_time": "5:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15542, "total_steps": 17941, "loss": 1.5356, "learning_rate": 4.508821421833037e-06, "epoch": 0.866283930661613, "percentage": 86.63, "elapsed_time": "1 day, 12:47:00", "remaining_time": "5:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15543, "total_steps": 17941, "loss": 1.7055, "learning_rate": 4.505126927318915e-06, "epoch": 0.8663396689147762, "percentage": 86.63, "elapsed_time": "1 day, 12:47:10", "remaining_time": "5:40:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15544, "total_steps": 17941, "loss": 1.6176, "learning_rate": 4.501433875636912e-06, "epoch": 0.8663954071679394, "percentage": 86.64, "elapsed_time": "1 day, 12:47:18", "remaining_time": "5:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15545, "total_steps": 17941, "loss": 1.6723, "learning_rate": 4.497742266904148e-06, "epoch": 0.8664511454211025, "percentage": 86.65, "elapsed_time": "1 day, 12:47:27", "remaining_time": "5:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15546, "total_steps": 17941, "loss": 1.712, "learning_rate": 4.494052101237706e-06, "epoch": 0.8665068836742656, "percentage": 86.65, "elapsed_time": "1 day, 12:47:35", "remaining_time": "5:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15547, "total_steps": 17941, "loss": 1.5149, "learning_rate": 4.490363378754625e-06, "epoch": 0.8665626219274288, "percentage": 86.66, "elapsed_time": "1 day, 12:47:44", "remaining_time": "5:39:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15548, "total_steps": 17941, "loss": 1.7661, "learning_rate": 4.486676099571863e-06, "epoch": 0.8666183601805919, "percentage": 86.66, "elapsed_time": "1 day, 12:47:52", "remaining_time": "5:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15549, "total_steps": 17941, "loss": 1.6221, "learning_rate": 4.4829902638063746e-06, "epoch": 0.8666740984337551, "percentage": 86.67, "elapsed_time": "1 day, 12:48:00", "remaining_time": "5:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15550, "total_steps": 17941, "loss": 1.7164, "learning_rate": 4.479305871575057e-06, "epoch": 0.8667298366869183, "percentage": 86.67, "elapsed_time": "1 day, 12:48:09", "remaining_time": "5:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15551, "total_steps": 17941, "loss": 1.4664, "learning_rate": 4.475622922994749e-06, "epoch": 0.8667855749400813, "percentage": 86.68, "elapsed_time": "1 day, 12:48:17", "remaining_time": "5:39:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15552, "total_steps": 17941, "loss": 1.5011, "learning_rate": 4.471941418182257e-06, "epoch": 0.8668413131932445, "percentage": 86.68, "elapsed_time": "1 day, 12:48:26", "remaining_time": "5:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15553, "total_steps": 17941, "loss": 1.8066, "learning_rate": 4.468261357254339e-06, "epoch": 0.8668970514464077, "percentage": 86.69, "elapsed_time": "1 day, 12:48:34", "remaining_time": "5:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15554, "total_steps": 17941, "loss": 1.5738, "learning_rate": 4.46458274032771e-06, "epoch": 0.8669527896995708, "percentage": 86.7, "elapsed_time": "1 day, 12:48:43", "remaining_time": "5:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15555, "total_steps": 17941, "loss": 1.749, "learning_rate": 4.460905567519019e-06, "epoch": 0.867008527952734, "percentage": 86.7, "elapsed_time": "1 day, 12:48:52", "remaining_time": "5:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15556, "total_steps": 17941, "loss": 1.6565, "learning_rate": 4.457229838944888e-06, "epoch": 0.8670642662058972, "percentage": 86.71, "elapsed_time": "1 day, 12:49:00", "remaining_time": "5:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15557, "total_steps": 17941, "loss": 1.7361, "learning_rate": 4.453555554721894e-06, "epoch": 0.8671200044590602, "percentage": 86.71, "elapsed_time": "1 day, 12:49:09", "remaining_time": "5:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15558, "total_steps": 17941, "loss": 1.6593, "learning_rate": 4.449882714966569e-06, "epoch": 0.8671757427122234, "percentage": 86.72, "elapsed_time": "1 day, 12:49:17", "remaining_time": "5:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15559, "total_steps": 17941, "loss": 1.6871, "learning_rate": 4.446211319795385e-06, "epoch": 0.8672314809653865, "percentage": 86.72, "elapsed_time": "1 day, 12:49:25", "remaining_time": "5:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15560, "total_steps": 17941, "loss": 1.7918, "learning_rate": 4.442541369324782e-06, "epoch": 0.8672872192185497, "percentage": 86.73, "elapsed_time": "1 day, 12:49:34", "remaining_time": "5:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15561, "total_steps": 17941, "loss": 1.6794, "learning_rate": 4.438872863671156e-06, "epoch": 0.8673429574717129, "percentage": 86.73, "elapsed_time": "1 day, 12:49:42", "remaining_time": "5:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15562, "total_steps": 17941, "loss": 1.7128, "learning_rate": 4.435205802950832e-06, "epoch": 0.8673986957248759, "percentage": 86.74, "elapsed_time": "1 day, 12:49:51", "remaining_time": "5:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15563, "total_steps": 17941, "loss": 1.7655, "learning_rate": 4.431540187280126e-06, "epoch": 0.8674544339780391, "percentage": 86.75, "elapsed_time": "1 day, 12:50:00", "remaining_time": "5:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15564, "total_steps": 17941, "loss": 1.5178, "learning_rate": 4.427876016775273e-06, "epoch": 0.8675101722312023, "percentage": 86.75, "elapsed_time": "1 day, 12:50:08", "remaining_time": "5:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15565, "total_steps": 17941, "loss": 1.435, "learning_rate": 4.424213291552498e-06, "epoch": 0.8675659104843654, "percentage": 86.76, "elapsed_time": "1 day, 12:50:17", "remaining_time": "5:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15566, "total_steps": 17941, "loss": 1.6849, "learning_rate": 4.420552011727952e-06, "epoch": 0.8676216487375286, "percentage": 86.76, "elapsed_time": "1 day, 12:50:25", "remaining_time": "5:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15567, "total_steps": 17941, "loss": 1.428, "learning_rate": 4.416892177417736e-06, "epoch": 0.8676773869906917, "percentage": 86.77, "elapsed_time": "1 day, 12:50:33", "remaining_time": "5:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15568, "total_steps": 17941, "loss": 2.1306, "learning_rate": 4.413233788737953e-06, "epoch": 0.8677331252438548, "percentage": 86.77, "elapsed_time": "1 day, 12:50:42", "remaining_time": "5:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15569, "total_steps": 17941, "loss": 1.6757, "learning_rate": 4.409576845804591e-06, "epoch": 0.867788863497018, "percentage": 86.78, "elapsed_time": "1 day, 12:50:50", "remaining_time": "5:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15570, "total_steps": 17941, "loss": 1.6635, "learning_rate": 4.405921348733644e-06, "epoch": 0.8678446017501812, "percentage": 86.78, "elapsed_time": "1 day, 12:50:59", "remaining_time": "5:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15571, "total_steps": 17941, "loss": 1.6816, "learning_rate": 4.402267297641044e-06, "epoch": 0.8679003400033443, "percentage": 86.79, "elapsed_time": "1 day, 12:51:07", "remaining_time": "5:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15572, "total_steps": 17941, "loss": 1.7229, "learning_rate": 4.398614692642666e-06, "epoch": 0.8679560782565074, "percentage": 86.8, "elapsed_time": "1 day, 12:51:16", "remaining_time": "5:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15573, "total_steps": 17941, "loss": 1.5502, "learning_rate": 4.394963533854362e-06, "epoch": 0.8680118165096706, "percentage": 86.8, "elapsed_time": "1 day, 12:51:24", "remaining_time": "5:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15574, "total_steps": 17941, "loss": 1.6453, "learning_rate": 4.391313821391918e-06, "epoch": 0.8680675547628337, "percentage": 86.81, "elapsed_time": "1 day, 12:51:33", "remaining_time": "5:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15575, "total_steps": 17941, "loss": 1.4136, "learning_rate": 4.387665555371079e-06, "epoch": 0.8681232930159969, "percentage": 86.81, "elapsed_time": "1 day, 12:51:41", "remaining_time": "5:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15576, "total_steps": 17941, "loss": 1.7267, "learning_rate": 4.384018735907547e-06, "epoch": 0.8681790312691601, "percentage": 86.82, "elapsed_time": "1 day, 12:51:50", "remaining_time": "5:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15577, "total_steps": 17941, "loss": 1.313, "learning_rate": 4.380373363116985e-06, "epoch": 0.8682347695223231, "percentage": 86.82, "elapsed_time": "1 day, 12:51:58", "remaining_time": "5:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15578, "total_steps": 17941, "loss": 1.7581, "learning_rate": 4.376729437114996e-06, "epoch": 0.8682905077754863, "percentage": 86.83, "elapsed_time": "1 day, 12:52:06", "remaining_time": "5:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15579, "total_steps": 17941, "loss": 1.7934, "learning_rate": 4.373086958017147e-06, "epoch": 0.8683462460286495, "percentage": 86.83, "elapsed_time": "1 day, 12:52:15", "remaining_time": "5:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15580, "total_steps": 17941, "loss": 1.5457, "learning_rate": 4.3694459259389696e-06, "epoch": 0.8684019842818126, "percentage": 86.84, "elapsed_time": "1 day, 12:52:23", "remaining_time": "5:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15581, "total_steps": 17941, "loss": 1.5551, "learning_rate": 4.3658063409959095e-06, "epoch": 0.8684577225349758, "percentage": 86.85, "elapsed_time": "1 day, 12:52:32", "remaining_time": "5:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15582, "total_steps": 17941, "loss": 1.6441, "learning_rate": 4.3621682033034075e-06, "epoch": 0.8685134607881388, "percentage": 86.85, "elapsed_time": "1 day, 12:52:40", "remaining_time": "5:34:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15583, "total_steps": 17941, "loss": 1.3928, "learning_rate": 4.358531512976849e-06, "epoch": 0.868569199041302, "percentage": 86.86, "elapsed_time": "1 day, 12:52:49", "remaining_time": "5:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15584, "total_steps": 17941, "loss": 1.6283, "learning_rate": 4.354896270131553e-06, "epoch": 0.8686249372944652, "percentage": 86.86, "elapsed_time": "1 day, 12:52:57", "remaining_time": "5:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15585, "total_steps": 17941, "loss": 2.1723, "learning_rate": 4.351262474882822e-06, "epoch": 0.8686806755476283, "percentage": 86.87, "elapsed_time": "1 day, 12:53:06", "remaining_time": "5:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15586, "total_steps": 17941, "loss": 1.6998, "learning_rate": 4.347630127345897e-06, "epoch": 0.8687364138007915, "percentage": 86.87, "elapsed_time": "1 day, 12:53:14", "remaining_time": "5:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15587, "total_steps": 17941, "loss": 1.5729, "learning_rate": 4.343999227635981e-06, "epoch": 0.8687921520539547, "percentage": 86.88, "elapsed_time": "1 day, 12:53:23", "remaining_time": "5:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15588, "total_steps": 17941, "loss": 1.9269, "learning_rate": 4.340369775868203e-06, "epoch": 0.8688478903071177, "percentage": 86.88, "elapsed_time": "1 day, 12:53:32", "remaining_time": "5:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15589, "total_steps": 17941, "loss": 1.6061, "learning_rate": 4.336741772157688e-06, "epoch": 0.8689036285602809, "percentage": 86.89, "elapsed_time": "1 day, 12:53:40", "remaining_time": "5:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15590, "total_steps": 17941, "loss": 1.6895, "learning_rate": 4.333115216619482e-06, "epoch": 0.8689593668134441, "percentage": 86.9, "elapsed_time": "1 day, 12:53:50", "remaining_time": "5:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15591, "total_steps": 17941, "loss": 1.6801, "learning_rate": 4.329490109368611e-06, "epoch": 0.8690151050666072, "percentage": 86.9, "elapsed_time": "1 day, 12:53:58", "remaining_time": "5:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15592, "total_steps": 17941, "loss": 1.4233, "learning_rate": 4.325866450520044e-06, "epoch": 0.8690708433197704, "percentage": 86.91, "elapsed_time": "1 day, 12:54:07", "remaining_time": "5:33:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15593, "total_steps": 17941, "loss": 1.6267, "learning_rate": 4.322244240188672e-06, "epoch": 0.8691265815729335, "percentage": 86.91, "elapsed_time": "1 day, 12:54:15", "remaining_time": "5:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15594, "total_steps": 17941, "loss": 1.8838, "learning_rate": 4.318623478489414e-06, "epoch": 0.8691823198260966, "percentage": 86.92, "elapsed_time": "1 day, 12:54:24", "remaining_time": "5:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15595, "total_steps": 17941, "loss": 1.7112, "learning_rate": 4.315004165537073e-06, "epoch": 0.8692380580792598, "percentage": 86.92, "elapsed_time": "1 day, 12:54:32", "remaining_time": "5:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15596, "total_steps": 17941, "loss": 1.513, "learning_rate": 4.311386301446435e-06, "epoch": 0.869293796332423, "percentage": 86.93, "elapsed_time": "1 day, 12:54:40", "remaining_time": "5:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15597, "total_steps": 17941, "loss": 1.6379, "learning_rate": 4.307769886332236e-06, "epoch": 0.8693495345855861, "percentage": 86.93, "elapsed_time": "1 day, 12:54:49", "remaining_time": "5:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15598, "total_steps": 17941, "loss": 1.4164, "learning_rate": 4.304154920309178e-06, "epoch": 0.8694052728387492, "percentage": 86.94, "elapsed_time": "1 day, 12:54:57", "remaining_time": "5:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15599, "total_steps": 17941, "loss": 1.5725, "learning_rate": 4.3005414034919086e-06, "epoch": 0.8694610110919124, "percentage": 86.95, "elapsed_time": "1 day, 12:55:06", "remaining_time": "5:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15600, "total_steps": 17941, "loss": 1.6476, "learning_rate": 4.296929335995009e-06, "epoch": 0.8695167493450755, "percentage": 86.95, "elapsed_time": "1 day, 12:55:14", "remaining_time": "5:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15601, "total_steps": 17941, "loss": 1.8728, "learning_rate": 4.2933187179330424e-06, "epoch": 0.8695724875982387, "percentage": 86.96, "elapsed_time": "1 day, 12:55:23", "remaining_time": "5:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15602, "total_steps": 17941, "loss": 1.7015, "learning_rate": 4.2897095494205176e-06, "epoch": 0.8696282258514019, "percentage": 86.96, "elapsed_time": "1 day, 12:55:31", "remaining_time": "5:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15603, "total_steps": 17941, "loss": 1.7217, "learning_rate": 4.2861018305718984e-06, "epoch": 0.8696839641045649, "percentage": 86.97, "elapsed_time": "1 day, 12:55:39", "remaining_time": "5:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15604, "total_steps": 17941, "loss": 1.8056, "learning_rate": 4.282495561501598e-06, "epoch": 0.8697397023577281, "percentage": 86.97, "elapsed_time": "1 day, 12:55:48", "remaining_time": "5:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15605, "total_steps": 17941, "loss": 1.8375, "learning_rate": 4.278890742323988e-06, "epoch": 0.8697954406108912, "percentage": 86.98, "elapsed_time": "1 day, 12:55:57", "remaining_time": "5:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15606, "total_steps": 17941, "loss": 1.5903, "learning_rate": 4.275287373153403e-06, "epoch": 0.8698511788640544, "percentage": 86.99, "elapsed_time": "1 day, 12:56:06", "remaining_time": "5:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15607, "total_steps": 17941, "loss": 1.6892, "learning_rate": 4.271685454104091e-06, "epoch": 0.8699069171172176, "percentage": 86.99, "elapsed_time": "1 day, 12:56:14", "remaining_time": "5:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15608, "total_steps": 17941, "loss": 1.5293, "learning_rate": 4.26808498529031e-06, "epoch": 0.8699626553703806, "percentage": 87.0, "elapsed_time": "1 day, 12:56:23", "remaining_time": "5:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15609, "total_steps": 17941, "loss": 1.6881, "learning_rate": 4.264485966826231e-06, "epoch": 0.8700183936235438, "percentage": 87.0, "elapsed_time": "1 day, 12:56:31", "remaining_time": "5:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15610, "total_steps": 17941, "loss": 1.5591, "learning_rate": 4.260888398826008e-06, "epoch": 0.870074131876707, "percentage": 87.01, "elapsed_time": "1 day, 12:56:40", "remaining_time": "5:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15611, "total_steps": 17941, "loss": 1.4014, "learning_rate": 4.257292281403724e-06, "epoch": 0.8701298701298701, "percentage": 87.01, "elapsed_time": "1 day, 12:56:48", "remaining_time": "5:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15612, "total_steps": 17941, "loss": 1.6571, "learning_rate": 4.25369761467343e-06, "epoch": 0.8701856083830333, "percentage": 87.02, "elapsed_time": "1 day, 12:56:57", "remaining_time": "5:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15613, "total_steps": 17941, "loss": 1.5419, "learning_rate": 4.250104398749138e-06, "epoch": 0.8702413466361965, "percentage": 87.02, "elapsed_time": "1 day, 12:57:06", "remaining_time": "5:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15614, "total_steps": 17941, "loss": 1.7289, "learning_rate": 4.246512633744781e-06, "epoch": 0.8702970848893595, "percentage": 87.03, "elapsed_time": "1 day, 12:57:14", "remaining_time": "5:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15615, "total_steps": 17941, "loss": 1.6259, "learning_rate": 4.242922319774284e-06, "epoch": 0.8703528231425227, "percentage": 87.04, "elapsed_time": "1 day, 12:57:23", "remaining_time": "5:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15616, "total_steps": 17941, "loss": 1.7026, "learning_rate": 4.239333456951511e-06, "epoch": 0.8704085613956859, "percentage": 87.04, "elapsed_time": "1 day, 12:57:31", "remaining_time": "5:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15617, "total_steps": 17941, "loss": 1.673, "learning_rate": 4.235746045390276e-06, "epoch": 0.870464299648849, "percentage": 87.05, "elapsed_time": "1 day, 12:57:40", "remaining_time": "5:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15618, "total_steps": 17941, "loss": 1.4717, "learning_rate": 4.232160085204362e-06, "epoch": 0.8705200379020122, "percentage": 87.05, "elapsed_time": "1 day, 12:57:48", "remaining_time": "5:29:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15619, "total_steps": 17941, "loss": 1.5752, "learning_rate": 4.228575576507471e-06, "epoch": 0.8705757761551753, "percentage": 87.06, "elapsed_time": "1 day, 12:57:57", "remaining_time": "5:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15620, "total_steps": 17941, "loss": 1.8164, "learning_rate": 4.224992519413307e-06, "epoch": 0.8706315144083384, "percentage": 87.06, "elapsed_time": "1 day, 12:58:05", "remaining_time": "5:29:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15621, "total_steps": 17941, "loss": 1.6512, "learning_rate": 4.221410914035489e-06, "epoch": 0.8706872526615016, "percentage": 87.07, "elapsed_time": "1 day, 12:58:14", "remaining_time": "5:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15622, "total_steps": 17941, "loss": 1.8409, "learning_rate": 4.217830760487607e-06, "epoch": 0.8707429909146648, "percentage": 87.07, "elapsed_time": "1 day, 12:58:22", "remaining_time": "5:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15623, "total_steps": 17941, "loss": 1.4412, "learning_rate": 4.2142520588832055e-06, "epoch": 0.8707987291678279, "percentage": 87.08, "elapsed_time": "1 day, 12:58:31", "remaining_time": "5:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15624, "total_steps": 17941, "loss": 1.7831, "learning_rate": 4.210674809335785e-06, "epoch": 0.870854467420991, "percentage": 87.09, "elapsed_time": "1 day, 12:58:39", "remaining_time": "5:29:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15625, "total_steps": 17941, "loss": 1.8052, "learning_rate": 4.207099011958793e-06, "epoch": 0.8709102056741542, "percentage": 87.09, "elapsed_time": "1 day, 12:58:48", "remaining_time": "5:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15626, "total_steps": 17941, "loss": 1.6564, "learning_rate": 4.20352466686561e-06, "epoch": 0.8709659439273173, "percentage": 87.1, "elapsed_time": "1 day, 12:58:56", "remaining_time": "5:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15627, "total_steps": 17941, "loss": 1.4838, "learning_rate": 4.19995177416963e-06, "epoch": 0.8710216821804805, "percentage": 87.1, "elapsed_time": "1 day, 12:59:05", "remaining_time": "5:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15628, "total_steps": 17941, "loss": 1.7513, "learning_rate": 4.19638033398414e-06, "epoch": 0.8710774204336436, "percentage": 87.11, "elapsed_time": "1 day, 12:59:14", "remaining_time": "5:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15629, "total_steps": 17941, "loss": 1.6848, "learning_rate": 4.192810346422415e-06, "epoch": 0.8711331586868067, "percentage": 87.11, "elapsed_time": "1 day, 12:59:23", "remaining_time": "5:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15630, "total_steps": 17941, "loss": 1.7092, "learning_rate": 4.189241811597666e-06, "epoch": 0.8711888969399699, "percentage": 87.12, "elapsed_time": "1 day, 12:59:32", "remaining_time": "5:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15631, "total_steps": 17941, "loss": 1.7318, "learning_rate": 4.185674729623074e-06, "epoch": 0.871244635193133, "percentage": 87.12, "elapsed_time": "1 day, 12:59:40", "remaining_time": "5:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15632, "total_steps": 17941, "loss": 1.6107, "learning_rate": 4.182109100611775e-06, "epoch": 0.8713003734462962, "percentage": 87.13, "elapsed_time": "1 day, 12:59:49", "remaining_time": "5:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15633, "total_steps": 17941, "loss": 1.6532, "learning_rate": 4.178544924676825e-06, "epoch": 0.8713561116994594, "percentage": 87.14, "elapsed_time": "1 day, 12:59:57", "remaining_time": "5:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15634, "total_steps": 17941, "loss": 1.2978, "learning_rate": 4.174982201931271e-06, "epoch": 0.8714118499526224, "percentage": 87.14, "elapsed_time": "1 day, 13:00:06", "remaining_time": "5:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15635, "total_steps": 17941, "loss": 1.4143, "learning_rate": 4.171420932488107e-06, "epoch": 0.8714675882057856, "percentage": 87.15, "elapsed_time": "1 day, 13:00:14", "remaining_time": "5:27:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15636, "total_steps": 17941, "loss": 1.515, "learning_rate": 4.1678611164602755e-06, "epoch": 0.8715233264589488, "percentage": 87.15, "elapsed_time": "1 day, 13:00:24", "remaining_time": "5:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15637, "total_steps": 17941, "loss": 1.7191, "learning_rate": 4.1643027539606635e-06, "epoch": 0.8715790647121119, "percentage": 87.16, "elapsed_time": "1 day, 13:00:32", "remaining_time": "5:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15638, "total_steps": 17941, "loss": 1.5287, "learning_rate": 4.160745845102127e-06, "epoch": 0.8716348029652751, "percentage": 87.16, "elapsed_time": "1 day, 13:00:41", "remaining_time": "5:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15639, "total_steps": 17941, "loss": 1.6858, "learning_rate": 4.157190389997484e-06, "epoch": 0.8716905412184383, "percentage": 87.17, "elapsed_time": "1 day, 13:00:49", "remaining_time": "5:26:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15640, "total_steps": 17941, "loss": 1.8478, "learning_rate": 4.153636388759469e-06, "epoch": 0.8717462794716013, "percentage": 87.17, "elapsed_time": "1 day, 13:00:58", "remaining_time": "5:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15641, "total_steps": 17941, "loss": 1.3555, "learning_rate": 4.150083841500807e-06, "epoch": 0.8718020177247645, "percentage": 87.18, "elapsed_time": "1 day, 13:01:07", "remaining_time": "5:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15642, "total_steps": 17941, "loss": 1.7335, "learning_rate": 4.1465327483341585e-06, "epoch": 0.8718577559779277, "percentage": 87.19, "elapsed_time": "1 day, 13:01:15", "remaining_time": "5:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15643, "total_steps": 17941, "loss": 1.4399, "learning_rate": 4.142983109372145e-06, "epoch": 0.8719134942310908, "percentage": 87.19, "elapsed_time": "1 day, 13:01:24", "remaining_time": "5:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15644, "total_steps": 17941, "loss": 1.5743, "learning_rate": 4.139434924727359e-06, "epoch": 0.871969232484254, "percentage": 87.2, "elapsed_time": "1 day, 13:01:32", "remaining_time": "5:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15645, "total_steps": 17941, "loss": 1.9219, "learning_rate": 4.135888194512289e-06, "epoch": 0.8720249707374171, "percentage": 87.2, "elapsed_time": "1 day, 13:01:40", "remaining_time": "5:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15646, "total_steps": 17941, "loss": 1.5456, "learning_rate": 4.132342918839455e-06, "epoch": 0.8720807089905802, "percentage": 87.21, "elapsed_time": "1 day, 13:01:49", "remaining_time": "5:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15647, "total_steps": 17941, "loss": 1.5484, "learning_rate": 4.128799097821268e-06, "epoch": 0.8721364472437434, "percentage": 87.21, "elapsed_time": "1 day, 13:01:58", "remaining_time": "5:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15648, "total_steps": 17941, "loss": 1.6531, "learning_rate": 4.125256731570132e-06, "epoch": 0.8721921854969066, "percentage": 87.22, "elapsed_time": "1 day, 13:02:06", "remaining_time": "5:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15649, "total_steps": 17941, "loss": 1.3986, "learning_rate": 4.121715820198379e-06, "epoch": 0.8722479237500697, "percentage": 87.22, "elapsed_time": "1 day, 13:02:15", "remaining_time": "5:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15650, "total_steps": 17941, "loss": 1.4709, "learning_rate": 4.11817636381831e-06, "epoch": 0.8723036620032328, "percentage": 87.23, "elapsed_time": "1 day, 13:02:25", "remaining_time": "5:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15651, "total_steps": 17941, "loss": 1.6281, "learning_rate": 4.114638362542189e-06, "epoch": 0.8723594002563959, "percentage": 87.24, "elapsed_time": "1 day, 13:02:33", "remaining_time": "5:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15652, "total_steps": 17941, "loss": 1.5158, "learning_rate": 4.111101816482193e-06, "epoch": 0.8724151385095591, "percentage": 87.24, "elapsed_time": "1 day, 13:02:42", "remaining_time": "5:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15653, "total_steps": 17941, "loss": 1.598, "learning_rate": 4.107566725750512e-06, "epoch": 0.8724708767627223, "percentage": 87.25, "elapsed_time": "1 day, 13:02:50", "remaining_time": "5:24:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15654, "total_steps": 17941, "loss": 1.5373, "learning_rate": 4.10403309045923e-06, "epoch": 0.8725266150158854, "percentage": 87.25, "elapsed_time": "1 day, 13:02:58", "remaining_time": "5:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15655, "total_steps": 17941, "loss": 1.5468, "learning_rate": 4.100500910720434e-06, "epoch": 0.8725823532690485, "percentage": 87.26, "elapsed_time": "1 day, 13:03:07", "remaining_time": "5:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15656, "total_steps": 17941, "loss": 1.742, "learning_rate": 4.096970186646132e-06, "epoch": 0.8726380915222117, "percentage": 87.26, "elapsed_time": "1 day, 13:03:16", "remaining_time": "5:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15657, "total_steps": 17941, "loss": 1.5131, "learning_rate": 4.093440918348302e-06, "epoch": 0.8726938297753748, "percentage": 87.27, "elapsed_time": "1 day, 13:03:24", "remaining_time": "5:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15658, "total_steps": 17941, "loss": 1.345, "learning_rate": 4.089913105938881e-06, "epoch": 0.872749568028538, "percentage": 87.27, "elapsed_time": "1 day, 13:03:33", "remaining_time": "5:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15659, "total_steps": 17941, "loss": 1.6515, "learning_rate": 4.086386749529736e-06, "epoch": 0.8728053062817012, "percentage": 87.28, "elapsed_time": "1 day, 13:03:41", "remaining_time": "5:24:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15660, "total_steps": 17941, "loss": 1.668, "learning_rate": 4.082861849232706e-06, "epoch": 0.8728610445348642, "percentage": 87.29, "elapsed_time": "1 day, 13:03:49", "remaining_time": "5:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15661, "total_steps": 17941, "loss": 1.6234, "learning_rate": 4.079338405159583e-06, "epoch": 0.8729167827880274, "percentage": 87.29, "elapsed_time": "1 day, 13:03:58", "remaining_time": "5:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15662, "total_steps": 17941, "loss": 1.6388, "learning_rate": 4.075816417422113e-06, "epoch": 0.8729725210411906, "percentage": 87.3, "elapsed_time": "1 day, 13:04:06", "remaining_time": "5:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15663, "total_steps": 17941, "loss": 1.5423, "learning_rate": 4.072295886131983e-06, "epoch": 0.8730282592943537, "percentage": 87.3, "elapsed_time": "1 day, 13:04:15", "remaining_time": "5:23:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15664, "total_steps": 17941, "loss": 1.4875, "learning_rate": 4.068776811400854e-06, "epoch": 0.8730839975475169, "percentage": 87.31, "elapsed_time": "1 day, 13:04:23", "remaining_time": "5:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15665, "total_steps": 17941, "loss": 1.5053, "learning_rate": 4.065259193340337e-06, "epoch": 0.87313973580068, "percentage": 87.31, "elapsed_time": "1 day, 13:04:32", "remaining_time": "5:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15666, "total_steps": 17941, "loss": 1.7788, "learning_rate": 4.061743032061971e-06, "epoch": 0.8731954740538431, "percentage": 87.32, "elapsed_time": "1 day, 13:04:40", "remaining_time": "5:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15667, "total_steps": 17941, "loss": 1.4898, "learning_rate": 4.058228327677277e-06, "epoch": 0.8732512123070063, "percentage": 87.33, "elapsed_time": "1 day, 13:04:49", "remaining_time": "5:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15668, "total_steps": 17941, "loss": 1.5606, "learning_rate": 4.054715080297722e-06, "epoch": 0.8733069505601695, "percentage": 87.33, "elapsed_time": "1 day, 13:04:57", "remaining_time": "5:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15669, "total_steps": 17941, "loss": 1.8127, "learning_rate": 4.051203290034722e-06, "epoch": 0.8733626888133326, "percentage": 87.34, "elapsed_time": "1 day, 13:05:05", "remaining_time": "5:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15670, "total_steps": 17941, "loss": 1.6833, "learning_rate": 4.047692956999665e-06, "epoch": 0.8734184270664958, "percentage": 87.34, "elapsed_time": "1 day, 13:05:14", "remaining_time": "5:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15671, "total_steps": 17941, "loss": 1.6853, "learning_rate": 4.044184081303848e-06, "epoch": 0.8734741653196589, "percentage": 87.35, "elapsed_time": "1 day, 13:05:22", "remaining_time": "5:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15672, "total_steps": 17941, "loss": 1.7173, "learning_rate": 4.04067666305859e-06, "epoch": 0.873529903572822, "percentage": 87.35, "elapsed_time": "1 day, 13:05:32", "remaining_time": "5:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15673, "total_steps": 17941, "loss": 1.6507, "learning_rate": 4.037170702375098e-06, "epoch": 0.8735856418259852, "percentage": 87.36, "elapsed_time": "1 day, 13:05:40", "remaining_time": "5:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15674, "total_steps": 17941, "loss": 1.4363, "learning_rate": 4.033666199364572e-06, "epoch": 0.8736413800791483, "percentage": 87.36, "elapsed_time": "1 day, 13:05:49", "remaining_time": "5:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15675, "total_steps": 17941, "loss": 1.6504, "learning_rate": 4.030163154138144e-06, "epoch": 0.8736971183323115, "percentage": 87.37, "elapsed_time": "1 day, 13:05:57", "remaining_time": "5:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15676, "total_steps": 17941, "loss": 1.5737, "learning_rate": 4.026661566806927e-06, "epoch": 0.8737528565854746, "percentage": 87.38, "elapsed_time": "1 day, 13:06:05", "remaining_time": "5:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15677, "total_steps": 17941, "loss": 1.438, "learning_rate": 4.023161437481965e-06, "epoch": 0.8738085948386377, "percentage": 87.38, "elapsed_time": "1 day, 13:06:14", "remaining_time": "5:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15678, "total_steps": 17941, "loss": 1.5465, "learning_rate": 4.01966276627424e-06, "epoch": 0.8738643330918009, "percentage": 87.39, "elapsed_time": "1 day, 13:06:22", "remaining_time": "5:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15679, "total_steps": 17941, "loss": 1.5558, "learning_rate": 4.0161655532947485e-06, "epoch": 0.8739200713449641, "percentage": 87.39, "elapsed_time": "1 day, 13:06:31", "remaining_time": "5:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15680, "total_steps": 17941, "loss": 1.3105, "learning_rate": 4.012669798654372e-06, "epoch": 0.8739758095981272, "percentage": 87.4, "elapsed_time": "1 day, 13:06:39", "remaining_time": "5:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15681, "total_steps": 17941, "loss": 1.6766, "learning_rate": 4.009175502463985e-06, "epoch": 0.8740315478512903, "percentage": 87.4, "elapsed_time": "1 day, 13:06:48", "remaining_time": "5:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15682, "total_steps": 17941, "loss": 1.6375, "learning_rate": 4.005682664834409e-06, "epoch": 0.8740872861044535, "percentage": 87.41, "elapsed_time": "1 day, 13:06:56", "remaining_time": "5:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15683, "total_steps": 17941, "loss": 1.5017, "learning_rate": 4.002191285876411e-06, "epoch": 0.8741430243576166, "percentage": 87.41, "elapsed_time": "1 day, 13:07:04", "remaining_time": "5:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15684, "total_steps": 17941, "loss": 1.6714, "learning_rate": 3.998701365700724e-06, "epoch": 0.8741987626107798, "percentage": 87.42, "elapsed_time": "1 day, 13:07:13", "remaining_time": "5:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15685, "total_steps": 17941, "loss": 1.6666, "learning_rate": 3.995212904418022e-06, "epoch": 0.874254500863943, "percentage": 87.43, "elapsed_time": "1 day, 13:07:21", "remaining_time": "5:20:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15686, "total_steps": 17941, "loss": 1.6705, "learning_rate": 3.991725902138932e-06, "epoch": 0.874310239117106, "percentage": 87.43, "elapsed_time": "1 day, 13:07:30", "remaining_time": "5:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15687, "total_steps": 17941, "loss": 1.5875, "learning_rate": 3.988240358974054e-06, "epoch": 0.8743659773702692, "percentage": 87.44, "elapsed_time": "1 day, 13:07:38", "remaining_time": "5:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15688, "total_steps": 17941, "loss": 1.4768, "learning_rate": 3.98475627503393e-06, "epoch": 0.8744217156234324, "percentage": 87.44, "elapsed_time": "1 day, 13:07:47", "remaining_time": "5:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15689, "total_steps": 17941, "loss": 1.6493, "learning_rate": 3.98127365042904e-06, "epoch": 0.8744774538765955, "percentage": 87.45, "elapsed_time": "1 day, 13:07:55", "remaining_time": "5:19:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15690, "total_steps": 17941, "loss": 1.7767, "learning_rate": 3.977792485269849e-06, "epoch": 0.8745331921297587, "percentage": 87.45, "elapsed_time": "1 day, 13:08:03", "remaining_time": "5:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15691, "total_steps": 17941, "loss": 1.8401, "learning_rate": 3.974312779666756e-06, "epoch": 0.8745889303829218, "percentage": 87.46, "elapsed_time": "1 day, 13:08:12", "remaining_time": "5:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15692, "total_steps": 17941, "loss": 1.7548, "learning_rate": 3.970834533730106e-06, "epoch": 0.8746446686360849, "percentage": 87.46, "elapsed_time": "1 day, 13:08:20", "remaining_time": "5:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15693, "total_steps": 17941, "loss": 1.7338, "learning_rate": 3.967357747570216e-06, "epoch": 0.8747004068892481, "percentage": 87.47, "elapsed_time": "1 day, 13:08:29", "remaining_time": "5:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15694, "total_steps": 17941, "loss": 1.5358, "learning_rate": 3.963882421297354e-06, "epoch": 0.8747561451424113, "percentage": 87.48, "elapsed_time": "1 day, 13:08:37", "remaining_time": "5:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15695, "total_steps": 17941, "loss": 1.6326, "learning_rate": 3.960408555021727e-06, "epoch": 0.8748118833955744, "percentage": 87.48, "elapsed_time": "1 day, 13:08:46", "remaining_time": "5:18:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15696, "total_steps": 17941, "loss": 1.6002, "learning_rate": 3.956936148853518e-06, "epoch": 0.8748676216487375, "percentage": 87.49, "elapsed_time": "1 day, 13:08:54", "remaining_time": "5:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15697, "total_steps": 17941, "loss": 1.4552, "learning_rate": 3.953465202902834e-06, "epoch": 0.8749233599019006, "percentage": 87.49, "elapsed_time": "1 day, 13:09:03", "remaining_time": "5:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15698, "total_steps": 17941, "loss": 1.7802, "learning_rate": 3.949995717279775e-06, "epoch": 0.8749790981550638, "percentage": 87.5, "elapsed_time": "1 day, 13:09:11", "remaining_time": "5:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15699, "total_steps": 17941, "loss": 1.7097, "learning_rate": 3.94652769209436e-06, "epoch": 0.875034836408227, "percentage": 87.5, "elapsed_time": "1 day, 13:09:20", "remaining_time": "5:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15700, "total_steps": 17941, "loss": 1.7576, "learning_rate": 3.943061127456571e-06, "epoch": 0.8750905746613901, "percentage": 87.51, "elapsed_time": "1 day, 13:09:28", "remaining_time": "5:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15701, "total_steps": 17941, "loss": 1.6516, "learning_rate": 3.939596023476355e-06, "epoch": 0.8751463129145532, "percentage": 87.51, "elapsed_time": "1 day, 13:09:38", "remaining_time": "5:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15702, "total_steps": 17941, "loss": 1.7933, "learning_rate": 3.936132380263596e-06, "epoch": 0.8752020511677164, "percentage": 87.52, "elapsed_time": "1 day, 13:09:47", "remaining_time": "5:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15703, "total_steps": 17941, "loss": 1.6893, "learning_rate": 3.9326701979281624e-06, "epoch": 0.8752577894208795, "percentage": 87.53, "elapsed_time": "1 day, 13:09:55", "remaining_time": "5:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15704, "total_steps": 17941, "loss": 1.6717, "learning_rate": 3.929209476579821e-06, "epoch": 0.8753135276740427, "percentage": 87.53, "elapsed_time": "1 day, 13:10:04", "remaining_time": "5:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15705, "total_steps": 17941, "loss": 1.5763, "learning_rate": 3.925750216328361e-06, "epoch": 0.8753692659272059, "percentage": 87.54, "elapsed_time": "1 day, 13:10:12", "remaining_time": "5:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15706, "total_steps": 17941, "loss": 1.7637, "learning_rate": 3.922292417283463e-06, "epoch": 0.875425004180369, "percentage": 87.54, "elapsed_time": "1 day, 13:10:21", "remaining_time": "5:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15707, "total_steps": 17941, "loss": 1.4888, "learning_rate": 3.918836079554794e-06, "epoch": 0.8754807424335321, "percentage": 87.55, "elapsed_time": "1 day, 13:10:29", "remaining_time": "5:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15708, "total_steps": 17941, "loss": 1.4943, "learning_rate": 3.915381203251977e-06, "epoch": 0.8755364806866953, "percentage": 87.55, "elapsed_time": "1 day, 13:10:37", "remaining_time": "5:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15709, "total_steps": 17941, "loss": 1.709, "learning_rate": 3.911927788484576e-06, "epoch": 0.8755922189398584, "percentage": 87.56, "elapsed_time": "1 day, 13:10:46", "remaining_time": "5:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15710, "total_steps": 17941, "loss": 1.6748, "learning_rate": 3.908475835362124e-06, "epoch": 0.8756479571930216, "percentage": 87.56, "elapsed_time": "1 day, 13:10:55", "remaining_time": "5:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15711, "total_steps": 17941, "loss": 1.6158, "learning_rate": 3.905025343994073e-06, "epoch": 0.8757036954461848, "percentage": 87.57, "elapsed_time": "1 day, 13:11:04", "remaining_time": "5:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15712, "total_steps": 17941, "loss": 1.6543, "learning_rate": 3.901576314489869e-06, "epoch": 0.8757594336993478, "percentage": 87.58, "elapsed_time": "1 day, 13:11:12", "remaining_time": "5:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15713, "total_steps": 17941, "loss": 1.617, "learning_rate": 3.89812874695889e-06, "epoch": 0.875815171952511, "percentage": 87.58, "elapsed_time": "1 day, 13:11:21", "remaining_time": "5:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15714, "total_steps": 17941, "loss": 1.5324, "learning_rate": 3.894682641510477e-06, "epoch": 0.8758709102056742, "percentage": 87.59, "elapsed_time": "1 day, 13:11:29", "remaining_time": "5:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15715, "total_steps": 17941, "loss": 1.6526, "learning_rate": 3.891237998253916e-06, "epoch": 0.8759266484588373, "percentage": 87.59, "elapsed_time": "1 day, 13:11:38", "remaining_time": "5:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15716, "total_steps": 17941, "loss": 1.5923, "learning_rate": 3.887794817298452e-06, "epoch": 0.8759823867120005, "percentage": 87.6, "elapsed_time": "1 day, 13:11:46", "remaining_time": "5:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15717, "total_steps": 17941, "loss": 1.6028, "learning_rate": 3.884353098753296e-06, "epoch": 0.8760381249651636, "percentage": 87.6, "elapsed_time": "1 day, 13:11:54", "remaining_time": "5:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15718, "total_steps": 17941, "loss": 1.6405, "learning_rate": 3.880912842727574e-06, "epoch": 0.8760938632183267, "percentage": 87.61, "elapsed_time": "1 day, 13:12:03", "remaining_time": "5:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15719, "total_steps": 17941, "loss": 1.5182, "learning_rate": 3.877474049330404e-06, "epoch": 0.8761496014714899, "percentage": 87.61, "elapsed_time": "1 day, 13:12:11", "remaining_time": "5:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15720, "total_steps": 17941, "loss": 1.4649, "learning_rate": 3.8740367186708485e-06, "epoch": 0.876205339724653, "percentage": 87.62, "elapsed_time": "1 day, 13:12:20", "remaining_time": "5:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15721, "total_steps": 17941, "loss": 1.5252, "learning_rate": 3.870600850857914e-06, "epoch": 0.8762610779778162, "percentage": 87.63, "elapsed_time": "1 day, 13:12:28", "remaining_time": "5:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15722, "total_steps": 17941, "loss": 1.7815, "learning_rate": 3.86716644600057e-06, "epoch": 0.8763168162309793, "percentage": 87.63, "elapsed_time": "1 day, 13:12:37", "remaining_time": "5:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15723, "total_steps": 17941, "loss": 1.6557, "learning_rate": 3.8637335042077225e-06, "epoch": 0.8763725544841424, "percentage": 87.64, "elapsed_time": "1 day, 13:12:45", "remaining_time": "5:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15724, "total_steps": 17941, "loss": 1.7001, "learning_rate": 3.86030202558827e-06, "epoch": 0.8764282927373056, "percentage": 87.64, "elapsed_time": "1 day, 13:12:54", "remaining_time": "5:14:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15725, "total_steps": 17941, "loss": 1.7792, "learning_rate": 3.856872010251017e-06, "epoch": 0.8764840309904688, "percentage": 87.65, "elapsed_time": "1 day, 13:13:02", "remaining_time": "5:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15726, "total_steps": 17941, "loss": 1.6699, "learning_rate": 3.853443458304751e-06, "epoch": 0.8765397692436319, "percentage": 87.65, "elapsed_time": "1 day, 13:13:10", "remaining_time": "5:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15727, "total_steps": 17941, "loss": 1.5898, "learning_rate": 3.8500163698582e-06, "epoch": 0.876595507496795, "percentage": 87.66, "elapsed_time": "1 day, 13:13:19", "remaining_time": "5:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15728, "total_steps": 17941, "loss": 1.5957, "learning_rate": 3.846590745020062e-06, "epoch": 0.8766512457499582, "percentage": 87.67, "elapsed_time": "1 day, 13:13:28", "remaining_time": "5:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15729, "total_steps": 17941, "loss": 1.6312, "learning_rate": 3.843166583898983e-06, "epoch": 0.8767069840031213, "percentage": 87.67, "elapsed_time": "1 day, 13:13:36", "remaining_time": "5:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15730, "total_steps": 17941, "loss": 1.7032, "learning_rate": 3.839743886603525e-06, "epoch": 0.8767627222562845, "percentage": 87.68, "elapsed_time": "1 day, 13:13:45", "remaining_time": "5:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15731, "total_steps": 17941, "loss": 1.8931, "learning_rate": 3.836322653242275e-06, "epoch": 0.8768184605094477, "percentage": 87.68, "elapsed_time": "1 day, 13:13:53", "remaining_time": "5:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15732, "total_steps": 17941, "loss": 1.4354, "learning_rate": 3.832902883923711e-06, "epoch": 0.8768741987626107, "percentage": 87.69, "elapsed_time": "1 day, 13:14:02", "remaining_time": "5:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15733, "total_steps": 17941, "loss": 1.5042, "learning_rate": 3.829484578756298e-06, "epoch": 0.8769299370157739, "percentage": 87.69, "elapsed_time": "1 day, 13:14:10", "remaining_time": "5:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15734, "total_steps": 17941, "loss": 1.4766, "learning_rate": 3.826067737848438e-06, "epoch": 0.8769856752689371, "percentage": 87.7, "elapsed_time": "1 day, 13:14:19", "remaining_time": "5:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15735, "total_steps": 17941, "loss": 1.568, "learning_rate": 3.822652361308493e-06, "epoch": 0.8770414135221002, "percentage": 87.7, "elapsed_time": "1 day, 13:14:28", "remaining_time": "5:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15736, "total_steps": 17941, "loss": 1.7266, "learning_rate": 3.819238449244794e-06, "epoch": 0.8770971517752634, "percentage": 87.71, "elapsed_time": "1 day, 13:14:36", "remaining_time": "5:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15737, "total_steps": 17941, "loss": 1.6284, "learning_rate": 3.815826001765593e-06, "epoch": 0.8771528900284266, "percentage": 87.72, "elapsed_time": "1 day, 13:14:45", "remaining_time": "5:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15738, "total_steps": 17941, "loss": 1.5299, "learning_rate": 3.812415018979115e-06, "epoch": 0.8772086282815896, "percentage": 87.72, "elapsed_time": "1 day, 13:14:53", "remaining_time": "5:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15739, "total_steps": 17941, "loss": 1.6306, "learning_rate": 3.8090055009935454e-06, "epoch": 0.8772643665347528, "percentage": 87.73, "elapsed_time": "1 day, 13:15:02", "remaining_time": "5:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15740, "total_steps": 17941, "loss": 1.4984, "learning_rate": 3.805597447917003e-06, "epoch": 0.877320104787916, "percentage": 87.73, "elapsed_time": "1 day, 13:15:10", "remaining_time": "5:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15741, "total_steps": 17941, "loss": 1.5862, "learning_rate": 3.8021908598575795e-06, "epoch": 0.8773758430410791, "percentage": 87.74, "elapsed_time": "1 day, 13:15:18", "remaining_time": "5:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15742, "total_steps": 17941, "loss": 1.7315, "learning_rate": 3.7987857369233103e-06, "epoch": 0.8774315812942423, "percentage": 87.74, "elapsed_time": "1 day, 13:15:27", "remaining_time": "5:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15743, "total_steps": 17941, "loss": 1.6165, "learning_rate": 3.7953820792221984e-06, "epoch": 0.8774873195474053, "percentage": 87.75, "elapsed_time": "1 day, 13:15:35", "remaining_time": "5:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15744, "total_steps": 17941, "loss": 1.4986, "learning_rate": 3.7919798868621626e-06, "epoch": 0.8775430578005685, "percentage": 87.75, "elapsed_time": "1 day, 13:15:44", "remaining_time": "5:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15745, "total_steps": 17941, "loss": 1.6291, "learning_rate": 3.788579159951111e-06, "epoch": 0.8775987960537317, "percentage": 87.76, "elapsed_time": "1 day, 13:15:52", "remaining_time": "5:11:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15746, "total_steps": 17941, "loss": 1.5745, "learning_rate": 3.7851798985969023e-06, "epoch": 0.8776545343068948, "percentage": 87.77, "elapsed_time": "1 day, 13:16:01", "remaining_time": "5:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15747, "total_steps": 17941, "loss": 1.6791, "learning_rate": 3.781782102907333e-06, "epoch": 0.877710272560058, "percentage": 87.77, "elapsed_time": "1 day, 13:16:09", "remaining_time": "5:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15748, "total_steps": 17941, "loss": 1.666, "learning_rate": 3.778385772990173e-06, "epoch": 0.8777660108132211, "percentage": 87.78, "elapsed_time": "1 day, 13:16:18", "remaining_time": "5:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15749, "total_steps": 17941, "loss": 1.5475, "learning_rate": 3.7749909089531076e-06, "epoch": 0.8778217490663842, "percentage": 87.78, "elapsed_time": "1 day, 13:16:26", "remaining_time": "5:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15750, "total_steps": 17941, "loss": 1.8361, "learning_rate": 3.7715975109038406e-06, "epoch": 0.8778774873195474, "percentage": 87.79, "elapsed_time": "1 day, 13:16:35", "remaining_time": "5:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15751, "total_steps": 17941, "loss": 1.6891, "learning_rate": 3.7682055789499626e-06, "epoch": 0.8779332255727106, "percentage": 87.79, "elapsed_time": "1 day, 13:16:43", "remaining_time": "5:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15752, "total_steps": 17941, "loss": 1.5066, "learning_rate": 3.7648151131990494e-06, "epoch": 0.8779889638258737, "percentage": 87.8, "elapsed_time": "1 day, 13:16:52", "remaining_time": "5:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15753, "total_steps": 17941, "loss": 1.6471, "learning_rate": 3.7614261137586314e-06, "epoch": 0.8780447020790368, "percentage": 87.8, "elapsed_time": "1 day, 13:17:00", "remaining_time": "5:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15754, "total_steps": 17941, "loss": 1.5962, "learning_rate": 3.7580385807361894e-06, "epoch": 0.8781004403322, "percentage": 87.81, "elapsed_time": "1 day, 13:17:08", "remaining_time": "5:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15755, "total_steps": 17941, "loss": 1.5955, "learning_rate": 3.7546525142391654e-06, "epoch": 0.8781561785853631, "percentage": 87.82, "elapsed_time": "1 day, 13:17:17", "remaining_time": "5:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15756, "total_steps": 17941, "loss": 1.6844, "learning_rate": 3.751267914374912e-06, "epoch": 0.8782119168385263, "percentage": 87.82, "elapsed_time": "1 day, 13:17:26", "remaining_time": "5:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15757, "total_steps": 17941, "loss": 1.4976, "learning_rate": 3.74788478125081e-06, "epoch": 0.8782676550916895, "percentage": 87.83, "elapsed_time": "1 day, 13:17:34", "remaining_time": "5:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15758, "total_steps": 17941, "loss": 1.4495, "learning_rate": 3.7445031149741294e-06, "epoch": 0.8783233933448525, "percentage": 87.83, "elapsed_time": "1 day, 13:17:42", "remaining_time": "5:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15759, "total_steps": 17941, "loss": 1.7237, "learning_rate": 3.741122915652118e-06, "epoch": 0.8783791315980157, "percentage": 87.84, "elapsed_time": "1 day, 13:17:51", "remaining_time": "5:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15760, "total_steps": 17941, "loss": 1.5868, "learning_rate": 3.737744183391978e-06, "epoch": 0.8784348698511789, "percentage": 87.84, "elapsed_time": "1 day, 13:17:59", "remaining_time": "5:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15761, "total_steps": 17941, "loss": 1.6997, "learning_rate": 3.734366918300869e-06, "epoch": 0.878490608104342, "percentage": 87.85, "elapsed_time": "1 day, 13:18:08", "remaining_time": "5:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15762, "total_steps": 17941, "loss": 1.8069, "learning_rate": 3.7309911204858995e-06, "epoch": 0.8785463463575052, "percentage": 87.85, "elapsed_time": "1 day, 13:18:16", "remaining_time": "5:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15763, "total_steps": 17941, "loss": 1.7699, "learning_rate": 3.727616790054117e-06, "epoch": 0.8786020846106684, "percentage": 87.86, "elapsed_time": "1 day, 13:18:25", "remaining_time": "5:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15764, "total_steps": 17941, "loss": 1.6868, "learning_rate": 3.7242439271125474e-06, "epoch": 0.8786578228638314, "percentage": 87.87, "elapsed_time": "1 day, 13:18:33", "remaining_time": "5:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15765, "total_steps": 17941, "loss": 1.6907, "learning_rate": 3.720872531768149e-06, "epoch": 0.8787135611169946, "percentage": 87.87, "elapsed_time": "1 day, 13:18:42", "remaining_time": "5:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15766, "total_steps": 17941, "loss": 1.7177, "learning_rate": 3.7175026041278483e-06, "epoch": 0.8787692993701577, "percentage": 87.88, "elapsed_time": "1 day, 13:18:50", "remaining_time": "5:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15767, "total_steps": 17941, "loss": 1.6994, "learning_rate": 3.71413414429852e-06, "epoch": 0.8788250376233209, "percentage": 87.88, "elapsed_time": "1 day, 13:18:59", "remaining_time": "5:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15768, "total_steps": 17941, "loss": 1.5811, "learning_rate": 3.7107671523869903e-06, "epoch": 0.878880775876484, "percentage": 87.89, "elapsed_time": "1 day, 13:19:07", "remaining_time": "5:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15769, "total_steps": 17941, "loss": 1.6197, "learning_rate": 3.7074016285000512e-06, "epoch": 0.8789365141296471, "percentage": 87.89, "elapsed_time": "1 day, 13:19:16", "remaining_time": "5:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15770, "total_steps": 17941, "loss": 1.657, "learning_rate": 3.7040375727444233e-06, "epoch": 0.8789922523828103, "percentage": 87.9, "elapsed_time": "1 day, 13:19:24", "remaining_time": "5:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15771, "total_steps": 17941, "loss": 1.8687, "learning_rate": 3.700674985226793e-06, "epoch": 0.8790479906359735, "percentage": 87.9, "elapsed_time": "1 day, 13:19:33", "remaining_time": "5:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15772, "total_steps": 17941, "loss": 1.6434, "learning_rate": 3.6973138660538144e-06, "epoch": 0.8791037288891366, "percentage": 87.91, "elapsed_time": "1 day, 13:19:42", "remaining_time": "5:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15773, "total_steps": 17941, "loss": 1.6503, "learning_rate": 3.693954215332074e-06, "epoch": 0.8791594671422998, "percentage": 87.92, "elapsed_time": "1 day, 13:19:50", "remaining_time": "5:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15774, "total_steps": 17941, "loss": 1.8172, "learning_rate": 3.6905960331681256e-06, "epoch": 0.8792152053954629, "percentage": 87.92, "elapsed_time": "1 day, 13:19:58", "remaining_time": "5:07:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15775, "total_steps": 17941, "loss": 1.7368, "learning_rate": 3.687239319668462e-06, "epoch": 0.879270943648626, "percentage": 87.93, "elapsed_time": "1 day, 13:20:07", "remaining_time": "5:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15776, "total_steps": 17941, "loss": 1.5331, "learning_rate": 3.683884074939553e-06, "epoch": 0.8793266819017892, "percentage": 87.93, "elapsed_time": "1 day, 13:20:15", "remaining_time": "5:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15777, "total_steps": 17941, "loss": 1.6661, "learning_rate": 3.6805302990877976e-06, "epoch": 0.8793824201549524, "percentage": 87.94, "elapsed_time": "1 day, 13:20:24", "remaining_time": "5:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15778, "total_steps": 17941, "loss": 1.608, "learning_rate": 3.6771779922195547e-06, "epoch": 0.8794381584081155, "percentage": 87.94, "elapsed_time": "1 day, 13:20:32", "remaining_time": "5:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15779, "total_steps": 17941, "loss": 1.9745, "learning_rate": 3.6738271544411453e-06, "epoch": 0.8794938966612786, "percentage": 87.95, "elapsed_time": "1 day, 13:20:41", "remaining_time": "5:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15780, "total_steps": 17941, "loss": 1.6281, "learning_rate": 3.6704777858588444e-06, "epoch": 0.8795496349144418, "percentage": 87.95, "elapsed_time": "1 day, 13:20:49", "remaining_time": "5:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15781, "total_steps": 17941, "loss": 1.6116, "learning_rate": 3.6671298865788685e-06, "epoch": 0.8796053731676049, "percentage": 87.96, "elapsed_time": "1 day, 13:20:58", "remaining_time": "5:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15782, "total_steps": 17941, "loss": 1.7403, "learning_rate": 3.6637834567073815e-06, "epoch": 0.8796611114207681, "percentage": 87.97, "elapsed_time": "1 day, 13:21:06", "remaining_time": "5:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15783, "total_steps": 17941, "loss": 1.617, "learning_rate": 3.6604384963505433e-06, "epoch": 0.8797168496739313, "percentage": 87.97, "elapsed_time": "1 day, 13:21:14", "remaining_time": "5:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15784, "total_steps": 17941, "loss": 1.5354, "learning_rate": 3.6570950056144026e-06, "epoch": 0.8797725879270943, "percentage": 87.98, "elapsed_time": "1 day, 13:21:23", "remaining_time": "5:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15785, "total_steps": 17941, "loss": 1.5775, "learning_rate": 3.6537529846050134e-06, "epoch": 0.8798283261802575, "percentage": 87.98, "elapsed_time": "1 day, 13:21:31", "remaining_time": "5:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15786, "total_steps": 17941, "loss": 1.7492, "learning_rate": 3.650412433428363e-06, "epoch": 0.8798840644334207, "percentage": 87.99, "elapsed_time": "1 day, 13:21:40", "remaining_time": "5:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15787, "total_steps": 17941, "loss": 1.6341, "learning_rate": 3.6470733521903945e-06, "epoch": 0.8799398026865838, "percentage": 87.99, "elapsed_time": "1 day, 13:21:48", "remaining_time": "5:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15788, "total_steps": 17941, "loss": 1.7935, "learning_rate": 3.643735740997012e-06, "epoch": 0.879995540939747, "percentage": 88.0, "elapsed_time": "1 day, 13:21:57", "remaining_time": "5:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15789, "total_steps": 17941, "loss": 1.7948, "learning_rate": 3.640399599954042e-06, "epoch": 0.88005127919291, "percentage": 88.01, "elapsed_time": "1 day, 13:22:05", "remaining_time": "5:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15790, "total_steps": 17941, "loss": 1.7953, "learning_rate": 3.6370649291673055e-06, "epoch": 0.8801070174460732, "percentage": 88.01, "elapsed_time": "1 day, 13:22:14", "remaining_time": "5:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15791, "total_steps": 17941, "loss": 1.6587, "learning_rate": 3.6337317287425565e-06, "epoch": 0.8801627556992364, "percentage": 88.02, "elapsed_time": "1 day, 13:22:22", "remaining_time": "5:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15792, "total_steps": 17941, "loss": 1.6646, "learning_rate": 3.6303999987854996e-06, "epoch": 0.8802184939523995, "percentage": 88.02, "elapsed_time": "1 day, 13:22:31", "remaining_time": "5:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15793, "total_steps": 17941, "loss": 1.6545, "learning_rate": 3.6270697394018007e-06, "epoch": 0.8802742322055627, "percentage": 88.03, "elapsed_time": "1 day, 13:22:39", "remaining_time": "5:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15794, "total_steps": 17941, "loss": 1.5467, "learning_rate": 3.62374095069708e-06, "epoch": 0.8803299704587259, "percentage": 88.03, "elapsed_time": "1 day, 13:22:48", "remaining_time": "5:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15795, "total_steps": 17941, "loss": 1.641, "learning_rate": 3.6204136327769088e-06, "epoch": 0.8803857087118889, "percentage": 88.04, "elapsed_time": "1 day, 13:22:56", "remaining_time": "5:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15796, "total_steps": 17941, "loss": 1.7804, "learning_rate": 3.6170877857467977e-06, "epoch": 0.8804414469650521, "percentage": 88.04, "elapsed_time": "1 day, 13:23:04", "remaining_time": "5:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15797, "total_steps": 17941, "loss": 1.7916, "learning_rate": 3.613763409712234e-06, "epoch": 0.8804971852182153, "percentage": 88.05, "elapsed_time": "1 day, 13:23:13", "remaining_time": "5:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15798, "total_steps": 17941, "loss": 1.6742, "learning_rate": 3.610440504778645e-06, "epoch": 0.8805529234713784, "percentage": 88.06, "elapsed_time": "1 day, 13:23:21", "remaining_time": "5:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15799, "total_steps": 17941, "loss": 1.7098, "learning_rate": 3.607119071051407e-06, "epoch": 0.8806086617245416, "percentage": 88.06, "elapsed_time": "1 day, 13:23:30", "remaining_time": "5:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15800, "total_steps": 17941, "loss": 1.4523, "learning_rate": 3.603799108635869e-06, "epoch": 0.8806643999777047, "percentage": 88.07, "elapsed_time": "1 day, 13:23:39", "remaining_time": "5:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15801, "total_steps": 17941, "loss": 1.655, "learning_rate": 3.600480617637314e-06, "epoch": 0.8807201382308678, "percentage": 88.07, "elapsed_time": "1 day, 13:23:47", "remaining_time": "5:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15802, "total_steps": 17941, "loss": 1.4806, "learning_rate": 3.597163598160991e-06, "epoch": 0.880775876484031, "percentage": 88.08, "elapsed_time": "1 day, 13:23:56", "remaining_time": "5:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15803, "total_steps": 17941, "loss": 1.7873, "learning_rate": 3.593848050312082e-06, "epoch": 0.8808316147371942, "percentage": 88.08, "elapsed_time": "1 day, 13:24:04", "remaining_time": "5:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15804, "total_steps": 17941, "loss": 1.6772, "learning_rate": 3.5905339741957535e-06, "epoch": 0.8808873529903573, "percentage": 88.09, "elapsed_time": "1 day, 13:24:13", "remaining_time": "5:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15805, "total_steps": 17941, "loss": 1.3347, "learning_rate": 3.5872213699170932e-06, "epoch": 0.8809430912435204, "percentage": 88.09, "elapsed_time": "1 day, 13:24:22", "remaining_time": "5:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15806, "total_steps": 17941, "loss": 1.6325, "learning_rate": 3.5839102375811674e-06, "epoch": 0.8809988294966836, "percentage": 88.1, "elapsed_time": "1 day, 13:24:31", "remaining_time": "5:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15807, "total_steps": 17941, "loss": 1.7944, "learning_rate": 3.5806005772929975e-06, "epoch": 0.8810545677498467, "percentage": 88.11, "elapsed_time": "1 day, 13:24:39", "remaining_time": "5:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15808, "total_steps": 17941, "loss": 1.6031, "learning_rate": 3.5772923891575107e-06, "epoch": 0.8811103060030099, "percentage": 88.11, "elapsed_time": "1 day, 13:24:48", "remaining_time": "5:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15809, "total_steps": 17941, "loss": 1.6244, "learning_rate": 3.5739856732796674e-06, "epoch": 0.8811660442561731, "percentage": 88.12, "elapsed_time": "1 day, 13:24:57", "remaining_time": "5:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15810, "total_steps": 17941, "loss": 1.819, "learning_rate": 3.570680429764306e-06, "epoch": 0.8812217825093361, "percentage": 88.12, "elapsed_time": "1 day, 13:25:05", "remaining_time": "5:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15811, "total_steps": 17941, "loss": 1.4932, "learning_rate": 3.5673766587162593e-06, "epoch": 0.8812775207624993, "percentage": 88.13, "elapsed_time": "1 day, 13:25:14", "remaining_time": "5:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15812, "total_steps": 17941, "loss": 1.5483, "learning_rate": 3.564074360240305e-06, "epoch": 0.8813332590156624, "percentage": 88.13, "elapsed_time": "1 day, 13:25:22", "remaining_time": "5:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15813, "total_steps": 17941, "loss": 1.4245, "learning_rate": 3.560773534441175e-06, "epoch": 0.8813889972688256, "percentage": 88.14, "elapsed_time": "1 day, 13:25:31", "remaining_time": "5:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15814, "total_steps": 17941, "loss": 1.9034, "learning_rate": 3.5574741814235534e-06, "epoch": 0.8814447355219888, "percentage": 88.14, "elapsed_time": "1 day, 13:25:39", "remaining_time": "5:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15815, "total_steps": 17941, "loss": 1.5504, "learning_rate": 3.5541763012920613e-06, "epoch": 0.8815004737751518, "percentage": 88.15, "elapsed_time": "1 day, 13:25:48", "remaining_time": "5:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15816, "total_steps": 17941, "loss": 1.5131, "learning_rate": 3.5508798941513045e-06, "epoch": 0.881556212028315, "percentage": 88.16, "elapsed_time": "1 day, 13:25:56", "remaining_time": "5:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15817, "total_steps": 17941, "loss": 1.5225, "learning_rate": 3.5475849601058154e-06, "epoch": 0.8816119502814782, "percentage": 88.16, "elapsed_time": "1 day, 13:26:04", "remaining_time": "5:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15818, "total_steps": 17941, "loss": 1.5951, "learning_rate": 3.5442914992600995e-06, "epoch": 0.8816676885346413, "percentage": 88.17, "elapsed_time": "1 day, 13:26:13", "remaining_time": "5:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15819, "total_steps": 17941, "loss": 1.6046, "learning_rate": 3.5409995117185957e-06, "epoch": 0.8817234267878045, "percentage": 88.17, "elapsed_time": "1 day, 13:26:21", "remaining_time": "5:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15820, "total_steps": 17941, "loss": 1.6479, "learning_rate": 3.5377089975857148e-06, "epoch": 0.8817791650409676, "percentage": 88.18, "elapsed_time": "1 day, 13:26:30", "remaining_time": "5:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15821, "total_steps": 17941, "loss": 1.467, "learning_rate": 3.5344199569658233e-06, "epoch": 0.8818349032941307, "percentage": 88.18, "elapsed_time": "1 day, 13:26:38", "remaining_time": "5:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15822, "total_steps": 17941, "loss": 1.7529, "learning_rate": 3.5311323899632044e-06, "epoch": 0.8818906415472939, "percentage": 88.19, "elapsed_time": "1 day, 13:26:47", "remaining_time": "5:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15823, "total_steps": 17941, "loss": 1.5552, "learning_rate": 3.5278462966821357e-06, "epoch": 0.8819463798004571, "percentage": 88.19, "elapsed_time": "1 day, 13:26:55", "remaining_time": "5:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15824, "total_steps": 17941, "loss": 1.4434, "learning_rate": 3.524561677226834e-06, "epoch": 0.8820021180536202, "percentage": 88.2, "elapsed_time": "1 day, 13:27:03", "remaining_time": "5:00:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15825, "total_steps": 17941, "loss": 1.4434, "learning_rate": 3.521278531701461e-06, "epoch": 0.8820578563067833, "percentage": 88.21, "elapsed_time": "1 day, 13:27:12", "remaining_time": "5:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15826, "total_steps": 17941, "loss": 1.489, "learning_rate": 3.517996860210143e-06, "epoch": 0.8821135945599465, "percentage": 88.21, "elapsed_time": "1 day, 13:27:20", "remaining_time": "5:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15827, "total_steps": 17941, "loss": 1.5887, "learning_rate": 3.5147166628569594e-06, "epoch": 0.8821693328131096, "percentage": 88.22, "elapsed_time": "1 day, 13:27:29", "remaining_time": "5:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15828, "total_steps": 17941, "loss": 1.7832, "learning_rate": 3.511437939745943e-06, "epoch": 0.8822250710662728, "percentage": 88.22, "elapsed_time": "1 day, 13:27:38", "remaining_time": "5:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15829, "total_steps": 17941, "loss": 1.5757, "learning_rate": 3.508160690981055e-06, "epoch": 0.882280809319436, "percentage": 88.23, "elapsed_time": "1 day, 13:27:46", "remaining_time": "4:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15830, "total_steps": 17941, "loss": 1.5776, "learning_rate": 3.5048849166662456e-06, "epoch": 0.882336547572599, "percentage": 88.23, "elapsed_time": "1 day, 13:27:55", "remaining_time": "4:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15831, "total_steps": 17941, "loss": 1.582, "learning_rate": 3.501610616905404e-06, "epoch": 0.8823922858257622, "percentage": 88.24, "elapsed_time": "1 day, 13:28:04", "remaining_time": "4:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15832, "total_steps": 17941, "loss": 1.6043, "learning_rate": 3.4983377918023698e-06, "epoch": 0.8824480240789254, "percentage": 88.24, "elapsed_time": "1 day, 13:28:12", "remaining_time": "4:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15833, "total_steps": 17941, "loss": 1.6977, "learning_rate": 3.4950664414609425e-06, "epoch": 0.8825037623320885, "percentage": 88.25, "elapsed_time": "1 day, 13:28:21", "remaining_time": "4:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15834, "total_steps": 17941, "loss": 1.5686, "learning_rate": 3.4917965659848506e-06, "epoch": 0.8825595005852517, "percentage": 88.26, "elapsed_time": "1 day, 13:28:29", "remaining_time": "4:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15835, "total_steps": 17941, "loss": 1.4928, "learning_rate": 3.4885281654778224e-06, "epoch": 0.8826152388384148, "percentage": 88.26, "elapsed_time": "1 day, 13:28:38", "remaining_time": "4:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15836, "total_steps": 17941, "loss": 1.8674, "learning_rate": 3.485261240043497e-06, "epoch": 0.8826709770915779, "percentage": 88.27, "elapsed_time": "1 day, 13:28:46", "remaining_time": "4:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15837, "total_steps": 17941, "loss": 1.5629, "learning_rate": 3.4819957897854805e-06, "epoch": 0.8827267153447411, "percentage": 88.27, "elapsed_time": "1 day, 13:28:55", "remaining_time": "4:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15838, "total_steps": 17941, "loss": 1.7014, "learning_rate": 3.4787318148073455e-06, "epoch": 0.8827824535979042, "percentage": 88.28, "elapsed_time": "1 day, 13:29:03", "remaining_time": "4:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15839, "total_steps": 17941, "loss": 1.8721, "learning_rate": 3.4754693152125928e-06, "epoch": 0.8828381918510674, "percentage": 88.28, "elapsed_time": "1 day, 13:29:12", "remaining_time": "4:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15840, "total_steps": 17941, "loss": 1.72, "learning_rate": 3.4722082911047116e-06, "epoch": 0.8828939301042306, "percentage": 88.29, "elapsed_time": "1 day, 13:29:20", "remaining_time": "4:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15841, "total_steps": 17941, "loss": 1.5737, "learning_rate": 3.4689487425870916e-06, "epoch": 0.8829496683573936, "percentage": 88.29, "elapsed_time": "1 day, 13:29:28", "remaining_time": "4:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15842, "total_steps": 17941, "loss": 1.7312, "learning_rate": 3.4656906697631276e-06, "epoch": 0.8830054066105568, "percentage": 88.3, "elapsed_time": "1 day, 13:29:37", "remaining_time": "4:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15843, "total_steps": 17941, "loss": 1.7947, "learning_rate": 3.462434072736143e-06, "epoch": 0.88306114486372, "percentage": 88.31, "elapsed_time": "1 day, 13:29:45", "remaining_time": "4:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15844, "total_steps": 17941, "loss": 1.7457, "learning_rate": 3.4591789516094095e-06, "epoch": 0.8831168831168831, "percentage": 88.31, "elapsed_time": "1 day, 13:29:54", "remaining_time": "4:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15845, "total_steps": 17941, "loss": 1.5253, "learning_rate": 3.455925306486174e-06, "epoch": 0.8831726213700463, "percentage": 88.32, "elapsed_time": "1 day, 13:30:02", "remaining_time": "4:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15846, "total_steps": 17941, "loss": 1.5557, "learning_rate": 3.452673137469614e-06, "epoch": 0.8832283596232094, "percentage": 88.32, "elapsed_time": "1 day, 13:30:11", "remaining_time": "4:57:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15847, "total_steps": 17941, "loss": 1.8283, "learning_rate": 3.4494224446628863e-06, "epoch": 0.8832840978763725, "percentage": 88.33, "elapsed_time": "1 day, 13:30:20", "remaining_time": "4:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15848, "total_steps": 17941, "loss": 1.5048, "learning_rate": 3.4461732281690585e-06, "epoch": 0.8833398361295357, "percentage": 88.33, "elapsed_time": "1 day, 13:30:28", "remaining_time": "4:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15849, "total_steps": 17941, "loss": 1.3804, "learning_rate": 3.4429254880911867e-06, "epoch": 0.8833955743826989, "percentage": 88.34, "elapsed_time": "1 day, 13:30:37", "remaining_time": "4:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15850, "total_steps": 17941, "loss": 1.5334, "learning_rate": 3.4396792245322716e-06, "epoch": 0.883451312635862, "percentage": 88.35, "elapsed_time": "1 day, 13:30:45", "remaining_time": "4:56:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15851, "total_steps": 17941, "loss": 1.6218, "learning_rate": 3.4364344375952652e-06, "epoch": 0.8835070508890251, "percentage": 88.35, "elapsed_time": "1 day, 13:30:54", "remaining_time": "4:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15852, "total_steps": 17941, "loss": 1.4603, "learning_rate": 3.4331911273830784e-06, "epoch": 0.8835627891421883, "percentage": 88.36, "elapsed_time": "1 day, 13:31:02", "remaining_time": "4:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15853, "total_steps": 17941, "loss": 1.3335, "learning_rate": 3.4299492939985633e-06, "epoch": 0.8836185273953514, "percentage": 88.36, "elapsed_time": "1 day, 13:31:11", "remaining_time": "4:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15854, "total_steps": 17941, "loss": 1.5551, "learning_rate": 3.4267089375445425e-06, "epoch": 0.8836742656485146, "percentage": 88.37, "elapsed_time": "1 day, 13:31:19", "remaining_time": "4:56:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15855, "total_steps": 17941, "loss": 1.9433, "learning_rate": 3.423470058123762e-06, "epoch": 0.8837300039016778, "percentage": 88.37, "elapsed_time": "1 day, 13:31:27", "remaining_time": "4:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15856, "total_steps": 17941, "loss": 1.6007, "learning_rate": 3.4202326558389563e-06, "epoch": 0.8837857421548408, "percentage": 88.38, "elapsed_time": "1 day, 13:31:36", "remaining_time": "4:56:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15857, "total_steps": 17941, "loss": 1.7967, "learning_rate": 3.4169967307927875e-06, "epoch": 0.883841480408004, "percentage": 88.38, "elapsed_time": "1 day, 13:31:44", "remaining_time": "4:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15858, "total_steps": 17941, "loss": 1.607, "learning_rate": 3.41376228308789e-06, "epoch": 0.8838972186611671, "percentage": 88.39, "elapsed_time": "1 day, 13:31:53", "remaining_time": "4:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15859, "total_steps": 17941, "loss": 1.6588, "learning_rate": 3.410529312826838e-06, "epoch": 0.8839529569143303, "percentage": 88.4, "elapsed_time": "1 day, 13:32:01", "remaining_time": "4:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15860, "total_steps": 17941, "loss": 1.8458, "learning_rate": 3.4072978201121485e-06, "epoch": 0.8840086951674935, "percentage": 88.4, "elapsed_time": "1 day, 13:32:10", "remaining_time": "4:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15861, "total_steps": 17941, "loss": 1.7582, "learning_rate": 3.404067805046335e-06, "epoch": 0.8840644334206565, "percentage": 88.41, "elapsed_time": "1 day, 13:32:18", "remaining_time": "4:55:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15862, "total_steps": 17941, "loss": 1.633, "learning_rate": 3.4008392677318034e-06, "epoch": 0.8841201716738197, "percentage": 88.41, "elapsed_time": "1 day, 13:32:27", "remaining_time": "4:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15863, "total_steps": 17941, "loss": 1.5867, "learning_rate": 3.3976122082709672e-06, "epoch": 0.8841759099269829, "percentage": 88.42, "elapsed_time": "1 day, 13:32:35", "remaining_time": "4:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15864, "total_steps": 17941, "loss": 1.5209, "learning_rate": 3.394386626766155e-06, "epoch": 0.884231648180146, "percentage": 88.42, "elapsed_time": "1 day, 13:32:44", "remaining_time": "4:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15865, "total_steps": 17941, "loss": 1.6386, "learning_rate": 3.3911625233196685e-06, "epoch": 0.8842873864333092, "percentage": 88.43, "elapsed_time": "1 day, 13:32:52", "remaining_time": "4:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15866, "total_steps": 17941, "loss": 1.5442, "learning_rate": 3.3879398980337707e-06, "epoch": 0.8843431246864724, "percentage": 88.43, "elapsed_time": "1 day, 13:33:00", "remaining_time": "4:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15867, "total_steps": 17941, "loss": 1.6252, "learning_rate": 3.3847187510106403e-06, "epoch": 0.8843988629396354, "percentage": 88.44, "elapsed_time": "1 day, 13:33:09", "remaining_time": "4:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15868, "total_steps": 17941, "loss": 1.5251, "learning_rate": 3.381499082352446e-06, "epoch": 0.8844546011927986, "percentage": 88.45, "elapsed_time": "1 day, 13:33:18", "remaining_time": "4:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15869, "total_steps": 17941, "loss": 1.6025, "learning_rate": 3.3782808921613005e-06, "epoch": 0.8845103394459618, "percentage": 88.45, "elapsed_time": "1 day, 13:33:26", "remaining_time": "4:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15870, "total_steps": 17941, "loss": 1.7369, "learning_rate": 3.3750641805392557e-06, "epoch": 0.8845660776991249, "percentage": 88.46, "elapsed_time": "1 day, 13:33:34", "remaining_time": "4:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15871, "total_steps": 17941, "loss": 1.7343, "learning_rate": 3.3718489475883354e-06, "epoch": 0.8846218159522881, "percentage": 88.46, "elapsed_time": "1 day, 13:33:43", "remaining_time": "4:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15872, "total_steps": 17941, "loss": 1.5965, "learning_rate": 3.3686351934105076e-06, "epoch": 0.8846775542054512, "percentage": 88.47, "elapsed_time": "1 day, 13:33:51", "remaining_time": "4:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15873, "total_steps": 17941, "loss": 1.677, "learning_rate": 3.3654229181076968e-06, "epoch": 0.8847332924586143, "percentage": 88.47, "elapsed_time": "1 day, 13:34:00", "remaining_time": "4:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15874, "total_steps": 17941, "loss": 1.5953, "learning_rate": 3.362212121781766e-06, "epoch": 0.8847890307117775, "percentage": 88.48, "elapsed_time": "1 day, 13:34:08", "remaining_time": "4:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15875, "total_steps": 17941, "loss": 1.5175, "learning_rate": 3.35900280453455e-06, "epoch": 0.8848447689649407, "percentage": 88.48, "elapsed_time": "1 day, 13:34:17", "remaining_time": "4:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15876, "total_steps": 17941, "loss": 1.7415, "learning_rate": 3.355794966467829e-06, "epoch": 0.8849005072181038, "percentage": 88.49, "elapsed_time": "1 day, 13:34:25", "remaining_time": "4:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15877, "total_steps": 17941, "loss": 1.7925, "learning_rate": 3.3525886076833326e-06, "epoch": 0.884956245471267, "percentage": 88.5, "elapsed_time": "1 day, 13:34:34", "remaining_time": "4:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15878, "total_steps": 17941, "loss": 1.7262, "learning_rate": 3.349383728282757e-06, "epoch": 0.8850119837244301, "percentage": 88.5, "elapsed_time": "1 day, 13:34:42", "remaining_time": "4:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15879, "total_steps": 17941, "loss": 1.5908, "learning_rate": 3.3461803283677373e-06, "epoch": 0.8850677219775932, "percentage": 88.51, "elapsed_time": "1 day, 13:34:51", "remaining_time": "4:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15880, "total_steps": 17941, "loss": 1.6122, "learning_rate": 3.3429784080398762e-06, "epoch": 0.8851234602307564, "percentage": 88.51, "elapsed_time": "1 day, 13:34:59", "remaining_time": "4:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15881, "total_steps": 17941, "loss": 1.7489, "learning_rate": 3.339777967400698e-06, "epoch": 0.8851791984839195, "percentage": 88.52, "elapsed_time": "1 day, 13:35:08", "remaining_time": "4:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15882, "total_steps": 17941, "loss": 1.5237, "learning_rate": 3.3365790065517156e-06, "epoch": 0.8852349367370826, "percentage": 88.52, "elapsed_time": "1 day, 13:35:16", "remaining_time": "4:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15883, "total_steps": 17941, "loss": 1.7946, "learning_rate": 3.3333815255943867e-06, "epoch": 0.8852906749902458, "percentage": 88.53, "elapsed_time": "1 day, 13:35:25", "remaining_time": "4:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15884, "total_steps": 17941, "loss": 1.7742, "learning_rate": 3.3301855246301026e-06, "epoch": 0.8853464132434089, "percentage": 88.53, "elapsed_time": "1 day, 13:35:34", "remaining_time": "4:52:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15885, "total_steps": 17941, "loss": 1.6423, "learning_rate": 3.3269910037602436e-06, "epoch": 0.8854021514965721, "percentage": 88.54, "elapsed_time": "1 day, 13:35:42", "remaining_time": "4:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15886, "total_steps": 17941, "loss": 1.5558, "learning_rate": 3.3237979630860892e-06, "epoch": 0.8854578897497353, "percentage": 88.55, "elapsed_time": "1 day, 13:35:51", "remaining_time": "4:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15887, "total_steps": 17941, "loss": 1.6937, "learning_rate": 3.3206064027089367e-06, "epoch": 0.8855136280028983, "percentage": 88.55, "elapsed_time": "1 day, 13:35:59", "remaining_time": "4:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15888, "total_steps": 17941, "loss": 1.776, "learning_rate": 3.3174163227299826e-06, "epoch": 0.8855693662560615, "percentage": 88.56, "elapsed_time": "1 day, 13:36:07", "remaining_time": "4:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15889, "total_steps": 17941, "loss": 1.7548, "learning_rate": 3.314227723250407e-06, "epoch": 0.8856251045092247, "percentage": 88.56, "elapsed_time": "1 day, 13:36:16", "remaining_time": "4:51:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15890, "total_steps": 17941, "loss": 1.8775, "learning_rate": 3.3110406043713296e-06, "epoch": 0.8856808427623878, "percentage": 88.57, "elapsed_time": "1 day, 13:36:24", "remaining_time": "4:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15891, "total_steps": 17941, "loss": 1.7155, "learning_rate": 3.307854966193824e-06, "epoch": 0.885736581015551, "percentage": 88.57, "elapsed_time": "1 day, 13:36:33", "remaining_time": "4:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15892, "total_steps": 17941, "loss": 1.6435, "learning_rate": 3.304670808818938e-06, "epoch": 0.8857923192687142, "percentage": 88.58, "elapsed_time": "1 day, 13:36:41", "remaining_time": "4:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15893, "total_steps": 17941, "loss": 1.4476, "learning_rate": 3.3014881323476242e-06, "epoch": 0.8858480575218772, "percentage": 88.58, "elapsed_time": "1 day, 13:36:50", "remaining_time": "4:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15894, "total_steps": 17941, "loss": 1.8098, "learning_rate": 3.2983069368808516e-06, "epoch": 0.8859037957750404, "percentage": 88.59, "elapsed_time": "1 day, 13:36:59", "remaining_time": "4:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15895, "total_steps": 17941, "loss": 1.4949, "learning_rate": 3.295127222519484e-06, "epoch": 0.8859595340282036, "percentage": 88.6, "elapsed_time": "1 day, 13:37:08", "remaining_time": "4:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15896, "total_steps": 17941, "loss": 1.5185, "learning_rate": 3.291948989364374e-06, "epoch": 0.8860152722813667, "percentage": 88.6, "elapsed_time": "1 day, 13:37:16", "remaining_time": "4:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15897, "total_steps": 17941, "loss": 1.7169, "learning_rate": 3.2887722375163133e-06, "epoch": 0.8860710105345299, "percentage": 88.61, "elapsed_time": "1 day, 13:37:24", "remaining_time": "4:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15898, "total_steps": 17941, "loss": 1.5604, "learning_rate": 3.2855969670760543e-06, "epoch": 0.886126748787693, "percentage": 88.61, "elapsed_time": "1 day, 13:37:33", "remaining_time": "4:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15899, "total_steps": 17941, "loss": 1.7701, "learning_rate": 3.282423178144306e-06, "epoch": 0.8861824870408561, "percentage": 88.62, "elapsed_time": "1 day, 13:37:41", "remaining_time": "4:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15900, "total_steps": 17941, "loss": 1.6685, "learning_rate": 3.2792508708216986e-06, "epoch": 0.8862382252940193, "percentage": 88.62, "elapsed_time": "1 day, 13:37:50", "remaining_time": "4:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15901, "total_steps": 17941, "loss": 1.6324, "learning_rate": 3.276080045208857e-06, "epoch": 0.8862939635471825, "percentage": 88.63, "elapsed_time": "1 day, 13:37:59", "remaining_time": "4:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15902, "total_steps": 17941, "loss": 1.5295, "learning_rate": 3.272910701406334e-06, "epoch": 0.8863497018003456, "percentage": 88.63, "elapsed_time": "1 day, 13:38:08", "remaining_time": "4:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15903, "total_steps": 17941, "loss": 1.6449, "learning_rate": 3.2697428395146444e-06, "epoch": 0.8864054400535087, "percentage": 88.64, "elapsed_time": "1 day, 13:38:16", "remaining_time": "4:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15904, "total_steps": 17941, "loss": 1.6511, "learning_rate": 3.2665764596342575e-06, "epoch": 0.8864611783066718, "percentage": 88.65, "elapsed_time": "1 day, 13:38:24", "remaining_time": "4:49:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15905, "total_steps": 17941, "loss": 1.4201, "learning_rate": 3.2634115618655926e-06, "epoch": 0.886516916559835, "percentage": 88.65, "elapsed_time": "1 day, 13:38:34", "remaining_time": "4:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15906, "total_steps": 17941, "loss": 1.708, "learning_rate": 3.2602481463090252e-06, "epoch": 0.8865726548129982, "percentage": 88.66, "elapsed_time": "1 day, 13:38:42", "remaining_time": "4:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15907, "total_steps": 17941, "loss": 1.8314, "learning_rate": 3.2570862130648696e-06, "epoch": 0.8866283930661613, "percentage": 88.66, "elapsed_time": "1 day, 13:38:51", "remaining_time": "4:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15908, "total_steps": 17941, "loss": 1.7611, "learning_rate": 3.2539257622334062e-06, "epoch": 0.8866841313193244, "percentage": 88.67, "elapsed_time": "1 day, 13:38:59", "remaining_time": "4:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15909, "total_steps": 17941, "loss": 1.7406, "learning_rate": 3.2507667939148722e-06, "epoch": 0.8867398695724876, "percentage": 88.67, "elapsed_time": "1 day, 13:39:07", "remaining_time": "4:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15910, "total_steps": 17941, "loss": 1.5265, "learning_rate": 3.247609308209443e-06, "epoch": 0.8867956078256507, "percentage": 88.68, "elapsed_time": "1 day, 13:39:16", "remaining_time": "4:48:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15911, "total_steps": 17941, "loss": 1.661, "learning_rate": 3.2444533052172766e-06, "epoch": 0.8868513460788139, "percentage": 88.69, "elapsed_time": "1 day, 13:39:24", "remaining_time": "4:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15912, "total_steps": 17941, "loss": 1.5103, "learning_rate": 3.241298785038427e-06, "epoch": 0.8869070843319771, "percentage": 88.69, "elapsed_time": "1 day, 13:39:33", "remaining_time": "4:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15913, "total_steps": 17941, "loss": 1.6671, "learning_rate": 3.2381457477729747e-06, "epoch": 0.8869628225851401, "percentage": 88.7, "elapsed_time": "1 day, 13:39:41", "remaining_time": "4:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15914, "total_steps": 17941, "loss": 1.7058, "learning_rate": 3.2349941935208905e-06, "epoch": 0.8870185608383033, "percentage": 88.7, "elapsed_time": "1 day, 13:39:50", "remaining_time": "4:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15915, "total_steps": 17941, "loss": 1.7952, "learning_rate": 3.231844122382133e-06, "epoch": 0.8870742990914665, "percentage": 88.71, "elapsed_time": "1 day, 13:39:58", "remaining_time": "4:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15916, "total_steps": 17941, "loss": 1.6081, "learning_rate": 3.2286955344565993e-06, "epoch": 0.8871300373446296, "percentage": 88.71, "elapsed_time": "1 day, 13:40:07", "remaining_time": "4:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15917, "total_steps": 17941, "loss": 1.7535, "learning_rate": 3.2255484298441497e-06, "epoch": 0.8871857755977928, "percentage": 88.72, "elapsed_time": "1 day, 13:40:15", "remaining_time": "4:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15918, "total_steps": 17941, "loss": 1.4049, "learning_rate": 3.222402808644598e-06, "epoch": 0.887241513850956, "percentage": 88.72, "elapsed_time": "1 day, 13:40:24", "remaining_time": "4:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15919, "total_steps": 17941, "loss": 1.4825, "learning_rate": 3.219258670957681e-06, "epoch": 0.887297252104119, "percentage": 88.73, "elapsed_time": "1 day, 13:40:32", "remaining_time": "4:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15920, "total_steps": 17941, "loss": 1.4344, "learning_rate": 3.216116016883147e-06, "epoch": 0.8873529903572822, "percentage": 88.74, "elapsed_time": "1 day, 13:40:40", "remaining_time": "4:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15921, "total_steps": 17941, "loss": 1.6976, "learning_rate": 3.2129748465206335e-06, "epoch": 0.8874087286104454, "percentage": 88.74, "elapsed_time": "1 day, 13:40:49", "remaining_time": "4:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15922, "total_steps": 17941, "loss": 1.6668, "learning_rate": 3.209835159969771e-06, "epoch": 0.8874644668636085, "percentage": 88.75, "elapsed_time": "1 day, 13:40:58", "remaining_time": "4:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15923, "total_steps": 17941, "loss": 1.8659, "learning_rate": 3.20669695733013e-06, "epoch": 0.8875202051167717, "percentage": 88.75, "elapsed_time": "1 day, 13:41:06", "remaining_time": "4:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15924, "total_steps": 17941, "loss": 1.7998, "learning_rate": 3.2035602387012367e-06, "epoch": 0.8875759433699348, "percentage": 88.76, "elapsed_time": "1 day, 13:41:15", "remaining_time": "4:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15925, "total_steps": 17941, "loss": 1.6054, "learning_rate": 3.2004250041825834e-06, "epoch": 0.8876316816230979, "percentage": 88.76, "elapsed_time": "1 day, 13:41:23", "remaining_time": "4:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15926, "total_steps": 17941, "loss": 1.6876, "learning_rate": 3.1972912538735745e-06, "epoch": 0.8876874198762611, "percentage": 88.77, "elapsed_time": "1 day, 13:41:31", "remaining_time": "4:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15927, "total_steps": 17941, "loss": 1.6825, "learning_rate": 3.1941589878736135e-06, "epoch": 0.8877431581294242, "percentage": 88.77, "elapsed_time": "1 day, 13:41:40", "remaining_time": "4:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15928, "total_steps": 17941, "loss": 1.6847, "learning_rate": 3.191028206282032e-06, "epoch": 0.8877988963825874, "percentage": 88.78, "elapsed_time": "1 day, 13:41:48", "remaining_time": "4:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15929, "total_steps": 17941, "loss": 1.5833, "learning_rate": 3.187898909198117e-06, "epoch": 0.8878546346357505, "percentage": 88.79, "elapsed_time": "1 day, 13:41:57", "remaining_time": "4:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15930, "total_steps": 17941, "loss": 1.5762, "learning_rate": 3.1847710967211174e-06, "epoch": 0.8879103728889136, "percentage": 88.79, "elapsed_time": "1 day, 13:42:05", "remaining_time": "4:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15931, "total_steps": 17941, "loss": 1.6475, "learning_rate": 3.181644768950226e-06, "epoch": 0.8879661111420768, "percentage": 88.8, "elapsed_time": "1 day, 13:42:14", "remaining_time": "4:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15932, "total_steps": 17941, "loss": 1.6052, "learning_rate": 3.178519925984602e-06, "epoch": 0.88802184939524, "percentage": 88.8, "elapsed_time": "1 day, 13:42:22", "remaining_time": "4:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15933, "total_steps": 17941, "loss": 1.571, "learning_rate": 3.175396567923328e-06, "epoch": 0.888077587648403, "percentage": 88.81, "elapsed_time": "1 day, 13:42:31", "remaining_time": "4:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15934, "total_steps": 17941, "loss": 1.6819, "learning_rate": 3.172274694865468e-06, "epoch": 0.8881333259015662, "percentage": 88.81, "elapsed_time": "1 day, 13:42:39", "remaining_time": "4:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15935, "total_steps": 17941, "loss": 1.704, "learning_rate": 3.169154306910033e-06, "epoch": 0.8881890641547294, "percentage": 88.82, "elapsed_time": "1 day, 13:42:48", "remaining_time": "4:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15936, "total_steps": 17941, "loss": 1.6457, "learning_rate": 3.166035404155976e-06, "epoch": 0.8882448024078925, "percentage": 88.82, "elapsed_time": "1 day, 13:42:56", "remaining_time": "4:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15937, "total_steps": 17941, "loss": 1.7127, "learning_rate": 3.1629179867022298e-06, "epoch": 0.8883005406610557, "percentage": 88.83, "elapsed_time": "1 day, 13:43:04", "remaining_time": "4:44:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15938, "total_steps": 17941, "loss": 1.5, "learning_rate": 3.159802054647626e-06, "epoch": 0.8883562789142189, "percentage": 88.84, "elapsed_time": "1 day, 13:43:13", "remaining_time": "4:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15939, "total_steps": 17941, "loss": 1.6278, "learning_rate": 3.156687608091019e-06, "epoch": 0.8884120171673819, "percentage": 88.84, "elapsed_time": "1 day, 13:43:21", "remaining_time": "4:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15940, "total_steps": 17941, "loss": 1.7275, "learning_rate": 3.1535746471311578e-06, "epoch": 0.8884677554205451, "percentage": 88.85, "elapsed_time": "1 day, 13:43:30", "remaining_time": "4:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15941, "total_steps": 17941, "loss": 1.6617, "learning_rate": 3.1504631718667744e-06, "epoch": 0.8885234936737083, "percentage": 88.85, "elapsed_time": "1 day, 13:43:39", "remaining_time": "4:44:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15942, "total_steps": 17941, "loss": 1.7402, "learning_rate": 3.1473531823965507e-06, "epoch": 0.8885792319268714, "percentage": 88.86, "elapsed_time": "1 day, 13:43:47", "remaining_time": "4:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15943, "total_steps": 17941, "loss": 1.45, "learning_rate": 3.144244678819114e-06, "epoch": 0.8886349701800346, "percentage": 88.86, "elapsed_time": "1 day, 13:43:56", "remaining_time": "4:43:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15944, "total_steps": 17941, "loss": 1.4243, "learning_rate": 3.1411376612330514e-06, "epoch": 0.8886907084331978, "percentage": 88.87, "elapsed_time": "1 day, 13:44:04", "remaining_time": "4:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15945, "total_steps": 17941, "loss": 1.7704, "learning_rate": 3.138032129736884e-06, "epoch": 0.8887464466863608, "percentage": 88.87, "elapsed_time": "1 day, 13:44:13", "remaining_time": "4:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15946, "total_steps": 17941, "loss": 1.6739, "learning_rate": 3.1349280844291286e-06, "epoch": 0.888802184939524, "percentage": 88.88, "elapsed_time": "1 day, 13:44:22", "remaining_time": "4:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15947, "total_steps": 17941, "loss": 1.5555, "learning_rate": 3.131825525408205e-06, "epoch": 0.8888579231926872, "percentage": 88.89, "elapsed_time": "1 day, 13:44:30", "remaining_time": "4:43:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15948, "total_steps": 17941, "loss": 1.512, "learning_rate": 3.1287244527725135e-06, "epoch": 0.8889136614458503, "percentage": 88.89, "elapsed_time": "1 day, 13:44:39", "remaining_time": "4:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15949, "total_steps": 17941, "loss": 1.658, "learning_rate": 3.125624866620408e-06, "epoch": 0.8889693996990135, "percentage": 88.9, "elapsed_time": "1 day, 13:44:48", "remaining_time": "4:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15950, "total_steps": 17941, "loss": 1.4094, "learning_rate": 3.122526767050177e-06, "epoch": 0.8890251379521765, "percentage": 88.9, "elapsed_time": "1 day, 13:44:56", "remaining_time": "4:42:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15951, "total_steps": 17941, "loss": 1.6805, "learning_rate": 3.119430154160097e-06, "epoch": 0.8890808762053397, "percentage": 88.91, "elapsed_time": "1 day, 13:45:05", "remaining_time": "4:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15952, "total_steps": 17941, "loss": 1.7003, "learning_rate": 3.1163350280483505e-06, "epoch": 0.8891366144585029, "percentage": 88.91, "elapsed_time": "1 day, 13:45:13", "remaining_time": "4:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15953, "total_steps": 17941, "loss": 1.5728, "learning_rate": 3.113241388813104e-06, "epoch": 0.889192352711666, "percentage": 88.92, "elapsed_time": "1 day, 13:45:22", "remaining_time": "4:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15954, "total_steps": 17941, "loss": 1.6875, "learning_rate": 3.110149236552473e-06, "epoch": 0.8892480909648292, "percentage": 88.92, "elapsed_time": "1 day, 13:45:30", "remaining_time": "4:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15955, "total_steps": 17941, "loss": 1.4887, "learning_rate": 3.107058571364524e-06, "epoch": 0.8893038292179923, "percentage": 88.93, "elapsed_time": "1 day, 13:45:39", "remaining_time": "4:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15956, "total_steps": 17941, "loss": 1.6033, "learning_rate": 3.103969393347267e-06, "epoch": 0.8893595674711554, "percentage": 88.94, "elapsed_time": "1 day, 13:45:47", "remaining_time": "4:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15957, "total_steps": 17941, "loss": 1.4675, "learning_rate": 3.1008817025986847e-06, "epoch": 0.8894153057243186, "percentage": 88.94, "elapsed_time": "1 day, 13:45:56", "remaining_time": "4:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15958, "total_steps": 17941, "loss": 1.7095, "learning_rate": 3.097795499216699e-06, "epoch": 0.8894710439774818, "percentage": 88.95, "elapsed_time": "1 day, 13:46:04", "remaining_time": "4:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15959, "total_steps": 17941, "loss": 1.5529, "learning_rate": 3.094710783299171e-06, "epoch": 0.8895267822306449, "percentage": 88.95, "elapsed_time": "1 day, 13:46:13", "remaining_time": "4:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15960, "total_steps": 17941, "loss": 1.8335, "learning_rate": 3.0916275549439432e-06, "epoch": 0.889582520483808, "percentage": 88.96, "elapsed_time": "1 day, 13:46:21", "remaining_time": "4:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15961, "total_steps": 17941, "loss": 1.7716, "learning_rate": 3.0885458142487944e-06, "epoch": 0.8896382587369712, "percentage": 88.96, "elapsed_time": "1 day, 13:46:29", "remaining_time": "4:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15962, "total_steps": 17941, "loss": 1.3397, "learning_rate": 3.085465561311457e-06, "epoch": 0.8896939969901343, "percentage": 88.97, "elapsed_time": "1 day, 13:46:38", "remaining_time": "4:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15963, "total_steps": 17941, "loss": 1.6436, "learning_rate": 3.0823867962296305e-06, "epoch": 0.8897497352432975, "percentage": 88.97, "elapsed_time": "1 day, 13:46:47", "remaining_time": "4:40:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15964, "total_steps": 17941, "loss": 1.7821, "learning_rate": 3.0793095191009314e-06, "epoch": 0.8898054734964607, "percentage": 88.98, "elapsed_time": "1 day, 13:46:55", "remaining_time": "4:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15965, "total_steps": 17941, "loss": 1.7467, "learning_rate": 3.0762337300229817e-06, "epoch": 0.8898612117496237, "percentage": 88.99, "elapsed_time": "1 day, 13:47:04", "remaining_time": "4:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15966, "total_steps": 17941, "loss": 1.5924, "learning_rate": 3.0731594290933085e-06, "epoch": 0.8899169500027869, "percentage": 88.99, "elapsed_time": "1 day, 13:47:12", "remaining_time": "4:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15967, "total_steps": 17941, "loss": 1.5698, "learning_rate": 3.0700866164094123e-06, "epoch": 0.8899726882559501, "percentage": 89.0, "elapsed_time": "1 day, 13:47:21", "remaining_time": "4:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15968, "total_steps": 17941, "loss": 1.6342, "learning_rate": 3.0670152920687478e-06, "epoch": 0.8900284265091132, "percentage": 89.0, "elapsed_time": "1 day, 13:47:29", "remaining_time": "4:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15969, "total_steps": 17941, "loss": 1.7048, "learning_rate": 3.063945456168721e-06, "epoch": 0.8900841647622764, "percentage": 89.01, "elapsed_time": "1 day, 13:47:38", "remaining_time": "4:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15970, "total_steps": 17941, "loss": 1.8074, "learning_rate": 3.060877108806698e-06, "epoch": 0.8901399030154395, "percentage": 89.01, "elapsed_time": "1 day, 13:47:46", "remaining_time": "4:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15971, "total_steps": 17941, "loss": 1.5402, "learning_rate": 3.0578102500799623e-06, "epoch": 0.8901956412686026, "percentage": 89.02, "elapsed_time": "1 day, 13:47:55", "remaining_time": "4:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15972, "total_steps": 17941, "loss": 1.7861, "learning_rate": 3.054744880085808e-06, "epoch": 0.8902513795217658, "percentage": 89.03, "elapsed_time": "1 day, 13:48:04", "remaining_time": "4:39:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15973, "total_steps": 17941, "loss": 1.5309, "learning_rate": 3.0516809989214302e-06, "epoch": 0.8903071177749289, "percentage": 89.03, "elapsed_time": "1 day, 13:48:12", "remaining_time": "4:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15974, "total_steps": 17941, "loss": 1.6472, "learning_rate": 3.048618606684006e-06, "epoch": 0.8903628560280921, "percentage": 89.04, "elapsed_time": "1 day, 13:48:21", "remaining_time": "4:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15975, "total_steps": 17941, "loss": 1.4459, "learning_rate": 3.045557703470647e-06, "epoch": 0.8904185942812552, "percentage": 89.04, "elapsed_time": "1 day, 13:48:29", "remaining_time": "4:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15976, "total_steps": 17941, "loss": 1.481, "learning_rate": 3.0424982893784426e-06, "epoch": 0.8904743325344183, "percentage": 89.05, "elapsed_time": "1 day, 13:48:37", "remaining_time": "4:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15977, "total_steps": 17941, "loss": 1.6715, "learning_rate": 3.0394403645044144e-06, "epoch": 0.8905300707875815, "percentage": 89.05, "elapsed_time": "1 day, 13:48:46", "remaining_time": "4:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15978, "total_steps": 17941, "loss": 1.8429, "learning_rate": 3.0363839289455297e-06, "epoch": 0.8905858090407447, "percentage": 89.06, "elapsed_time": "1 day, 13:48:54", "remaining_time": "4:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15979, "total_steps": 17941, "loss": 1.7792, "learning_rate": 3.033328982798733e-06, "epoch": 0.8906415472939078, "percentage": 89.06, "elapsed_time": "1 day, 13:49:03", "remaining_time": "4:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15980, "total_steps": 17941, "loss": 1.6636, "learning_rate": 3.0302755261609028e-06, "epoch": 0.890697285547071, "percentage": 89.07, "elapsed_time": "1 day, 13:49:11", "remaining_time": "4:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15981, "total_steps": 17941, "loss": 1.6162, "learning_rate": 3.0272235591288833e-06, "epoch": 0.8907530238002341, "percentage": 89.08, "elapsed_time": "1 day, 13:49:20", "remaining_time": "4:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15982, "total_steps": 17941, "loss": 1.9301, "learning_rate": 3.0241730817994583e-06, "epoch": 0.8908087620533972, "percentage": 89.08, "elapsed_time": "1 day, 13:49:28", "remaining_time": "4:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15983, "total_steps": 17941, "loss": 1.5951, "learning_rate": 3.0211240942693786e-06, "epoch": 0.8908645003065604, "percentage": 89.09, "elapsed_time": "1 day, 13:49:37", "remaining_time": "4:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15984, "total_steps": 17941, "loss": 1.5957, "learning_rate": 3.0180765966353443e-06, "epoch": 0.8909202385597236, "percentage": 89.09, "elapsed_time": "1 day, 13:49:45", "remaining_time": "4:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15985, "total_steps": 17941, "loss": 1.5814, "learning_rate": 3.015030588993989e-06, "epoch": 0.8909759768128866, "percentage": 89.1, "elapsed_time": "1 day, 13:49:54", "remaining_time": "4:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15986, "total_steps": 17941, "loss": 1.5555, "learning_rate": 3.0119860714419247e-06, "epoch": 0.8910317150660498, "percentage": 89.1, "elapsed_time": "1 day, 13:50:02", "remaining_time": "4:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15987, "total_steps": 17941, "loss": 1.6901, "learning_rate": 3.008943044075696e-06, "epoch": 0.891087453319213, "percentage": 89.11, "elapsed_time": "1 day, 13:50:11", "remaining_time": "4:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15988, "total_steps": 17941, "loss": 1.7219, "learning_rate": 3.005901506991826e-06, "epoch": 0.8911431915723761, "percentage": 89.11, "elapsed_time": "1 day, 13:50:20", "remaining_time": "4:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15989, "total_steps": 17941, "loss": 1.9941, "learning_rate": 3.0028614602867656e-06, "epoch": 0.8911989298255393, "percentage": 89.12, "elapsed_time": "1 day, 13:50:28", "remaining_time": "4:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15990, "total_steps": 17941, "loss": 1.7898, "learning_rate": 2.999822904056915e-06, "epoch": 0.8912546680787025, "percentage": 89.13, "elapsed_time": "1 day, 13:50:37", "remaining_time": "4:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15991, "total_steps": 17941, "loss": 1.7062, "learning_rate": 2.996785838398669e-06, "epoch": 0.8913104063318655, "percentage": 89.13, "elapsed_time": "1 day, 13:50:45", "remaining_time": "4:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15992, "total_steps": 17941, "loss": 1.6367, "learning_rate": 2.9937502634083183e-06, "epoch": 0.8913661445850287, "percentage": 89.14, "elapsed_time": "1 day, 13:50:54", "remaining_time": "4:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15993, "total_steps": 17941, "loss": 1.7481, "learning_rate": 2.990716179182146e-06, "epoch": 0.8914218828381919, "percentage": 89.14, "elapsed_time": "1 day, 13:51:02", "remaining_time": "4:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15994, "total_steps": 17941, "loss": 1.5891, "learning_rate": 2.9876835858163698e-06, "epoch": 0.891477621091355, "percentage": 89.15, "elapsed_time": "1 day, 13:51:11", "remaining_time": "4:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15995, "total_steps": 17941, "loss": 1.7217, "learning_rate": 2.984652483407169e-06, "epoch": 0.8915333593445182, "percentage": 89.15, "elapsed_time": "1 day, 13:51:19", "remaining_time": "4:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15996, "total_steps": 17941, "loss": 1.7456, "learning_rate": 2.981622872050682e-06, "epoch": 0.8915890975976812, "percentage": 89.16, "elapsed_time": "1 day, 13:51:28", "remaining_time": "4:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15997, "total_steps": 17941, "loss": 1.5291, "learning_rate": 2.978594751842967e-06, "epoch": 0.8916448358508444, "percentage": 89.16, "elapsed_time": "1 day, 13:51:36", "remaining_time": "4:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15998, "total_steps": 17941, "loss": 1.5079, "learning_rate": 2.9755681228800902e-06, "epoch": 0.8917005741040076, "percentage": 89.17, "elapsed_time": "1 day, 13:51:45", "remaining_time": "4:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15999, "total_steps": 17941, "loss": 1.6639, "learning_rate": 2.972542985258009e-06, "epoch": 0.8917563123571707, "percentage": 89.18, "elapsed_time": "1 day, 13:51:53", "remaining_time": "4:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16000, "total_steps": 17941, "loss": 1.776, "learning_rate": 2.9695193390726793e-06, "epoch": 0.8918120506103339, "percentage": 89.18, "elapsed_time": "1 day, 13:52:02", "remaining_time": "4:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16001, "total_steps": 17941, "loss": 1.4699, "learning_rate": 2.9664971844199863e-06, "epoch": 0.891867788863497, "percentage": 89.19, "elapsed_time": "1 day, 13:52:10", "remaining_time": "4:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16002, "total_steps": 17941, "loss": 1.7631, "learning_rate": 2.9634765213957803e-06, "epoch": 0.8919235271166601, "percentage": 89.19, "elapsed_time": "1 day, 13:52:19", "remaining_time": "4:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16003, "total_steps": 17941, "loss": 1.4175, "learning_rate": 2.9604573500958633e-06, "epoch": 0.8919792653698233, "percentage": 89.2, "elapsed_time": "1 day, 13:52:28", "remaining_time": "4:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16004, "total_steps": 17941, "loss": 1.5931, "learning_rate": 2.9574396706159746e-06, "epoch": 0.8920350036229865, "percentage": 89.2, "elapsed_time": "1 day, 13:52:36", "remaining_time": "4:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16005, "total_steps": 17941, "loss": 1.7791, "learning_rate": 2.9544234830518213e-06, "epoch": 0.8920907418761496, "percentage": 89.21, "elapsed_time": "1 day, 13:52:45", "remaining_time": "4:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16006, "total_steps": 17941, "loss": 1.7419, "learning_rate": 2.9514087874990604e-06, "epoch": 0.8921464801293127, "percentage": 89.21, "elapsed_time": "1 day, 13:52:53", "remaining_time": "4:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16007, "total_steps": 17941, "loss": 1.7437, "learning_rate": 2.9483955840532984e-06, "epoch": 0.8922022183824759, "percentage": 89.22, "elapsed_time": "1 day, 13:53:02", "remaining_time": "4:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16008, "total_steps": 17941, "loss": 1.5056, "learning_rate": 2.945383872810098e-06, "epoch": 0.892257956635639, "percentage": 89.23, "elapsed_time": "1 day, 13:53:10", "remaining_time": "4:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16009, "total_steps": 17941, "loss": 1.6407, "learning_rate": 2.942373653864977e-06, "epoch": 0.8923136948888022, "percentage": 89.23, "elapsed_time": "1 day, 13:53:18", "remaining_time": "4:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16010, "total_steps": 17941, "loss": 1.6579, "learning_rate": 2.939364927313404e-06, "epoch": 0.8923694331419654, "percentage": 89.24, "elapsed_time": "1 day, 13:53:27", "remaining_time": "4:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16011, "total_steps": 17941, "loss": 1.4188, "learning_rate": 2.9363576932507854e-06, "epoch": 0.8924251713951284, "percentage": 89.24, "elapsed_time": "1 day, 13:53:35", "remaining_time": "4:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16012, "total_steps": 17941, "loss": 1.583, "learning_rate": 2.9333519517725004e-06, "epoch": 0.8924809096482916, "percentage": 89.25, "elapsed_time": "1 day, 13:53:44", "remaining_time": "4:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16013, "total_steps": 17941, "loss": 1.6154, "learning_rate": 2.9303477029738793e-06, "epoch": 0.8925366479014548, "percentage": 89.25, "elapsed_time": "1 day, 13:53:52", "remaining_time": "4:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16014, "total_steps": 17941, "loss": 1.7656, "learning_rate": 2.927344946950189e-06, "epoch": 0.8925923861546179, "percentage": 89.26, "elapsed_time": "1 day, 13:54:01", "remaining_time": "4:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16015, "total_steps": 17941, "loss": 1.8014, "learning_rate": 2.9243436837966708e-06, "epoch": 0.8926481244077811, "percentage": 89.26, "elapsed_time": "1 day, 13:54:09", "remaining_time": "4:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16016, "total_steps": 17941, "loss": 1.7021, "learning_rate": 2.9213439136084875e-06, "epoch": 0.8927038626609443, "percentage": 89.27, "elapsed_time": "1 day, 13:54:18", "remaining_time": "4:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16017, "total_steps": 17941, "loss": 1.7614, "learning_rate": 2.9183456364808013e-06, "epoch": 0.8927596009141073, "percentage": 89.28, "elapsed_time": "1 day, 13:54:26", "remaining_time": "4:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16018, "total_steps": 17941, "loss": 1.6005, "learning_rate": 2.9153488525086814e-06, "epoch": 0.8928153391672705, "percentage": 89.28, "elapsed_time": "1 day, 13:54:35", "remaining_time": "4:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16019, "total_steps": 17941, "loss": 1.6781, "learning_rate": 2.9123535617871734e-06, "epoch": 0.8928710774204336, "percentage": 89.29, "elapsed_time": "1 day, 13:54:43", "remaining_time": "4:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16020, "total_steps": 17941, "loss": 1.5218, "learning_rate": 2.909359764411268e-06, "epoch": 0.8929268156735968, "percentage": 89.29, "elapsed_time": "1 day, 13:54:52", "remaining_time": "4:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16021, "total_steps": 17941, "loss": 1.7996, "learning_rate": 2.9063674604759118e-06, "epoch": 0.89298255392676, "percentage": 89.3, "elapsed_time": "1 day, 13:55:00", "remaining_time": "4:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16022, "total_steps": 17941, "loss": 1.5145, "learning_rate": 2.903376650076017e-06, "epoch": 0.893038292179923, "percentage": 89.3, "elapsed_time": "1 day, 13:55:08", "remaining_time": "4:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16023, "total_steps": 17941, "loss": 1.7649, "learning_rate": 2.9003873333064035e-06, "epoch": 0.8930940304330862, "percentage": 89.31, "elapsed_time": "1 day, 13:55:17", "remaining_time": "4:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16024, "total_steps": 17941, "loss": 2.0282, "learning_rate": 2.897399510261911e-06, "epoch": 0.8931497686862494, "percentage": 89.31, "elapsed_time": "1 day, 13:55:25", "remaining_time": "4:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16025, "total_steps": 17941, "loss": 1.4677, "learning_rate": 2.8944131810372754e-06, "epoch": 0.8932055069394125, "percentage": 89.32, "elapsed_time": "1 day, 13:55:34", "remaining_time": "4:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16026, "total_steps": 17941, "loss": 1.885, "learning_rate": 2.891428345727204e-06, "epoch": 0.8932612451925757, "percentage": 89.33, "elapsed_time": "1 day, 13:55:42", "remaining_time": "4:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16027, "total_steps": 17941, "loss": 1.8177, "learning_rate": 2.8884450044263654e-06, "epoch": 0.8933169834457388, "percentage": 89.33, "elapsed_time": "1 day, 13:55:51", "remaining_time": "4:31:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16028, "total_steps": 17941, "loss": 1.7025, "learning_rate": 2.885463157229368e-06, "epoch": 0.8933727216989019, "percentage": 89.34, "elapsed_time": "1 day, 13:55:59", "remaining_time": "4:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16029, "total_steps": 17941, "loss": 1.5729, "learning_rate": 2.882482804230796e-06, "epoch": 0.8934284599520651, "percentage": 89.34, "elapsed_time": "1 day, 13:56:07", "remaining_time": "4:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16030, "total_steps": 17941, "loss": 1.619, "learning_rate": 2.8795039455251417e-06, "epoch": 0.8934841982052283, "percentage": 89.35, "elapsed_time": "1 day, 13:56:16", "remaining_time": "4:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16031, "total_steps": 17941, "loss": 1.6816, "learning_rate": 2.8765265812068955e-06, "epoch": 0.8935399364583914, "percentage": 89.35, "elapsed_time": "1 day, 13:56:24", "remaining_time": "4:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16032, "total_steps": 17941, "loss": 1.4816, "learning_rate": 2.8735507113704765e-06, "epoch": 0.8935956747115545, "percentage": 89.36, "elapsed_time": "1 day, 13:56:33", "remaining_time": "4:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16033, "total_steps": 17941, "loss": 1.6472, "learning_rate": 2.870576336110259e-06, "epoch": 0.8936514129647177, "percentage": 89.37, "elapsed_time": "1 day, 13:56:41", "remaining_time": "4:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16034, "total_steps": 17941, "loss": 1.5764, "learning_rate": 2.867603455520579e-06, "epoch": 0.8937071512178808, "percentage": 89.37, "elapsed_time": "1 day, 13:56:50", "remaining_time": "4:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16035, "total_steps": 17941, "loss": 1.5398, "learning_rate": 2.8646320696957163e-06, "epoch": 0.893762889471044, "percentage": 89.38, "elapsed_time": "1 day, 13:56:58", "remaining_time": "4:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16036, "total_steps": 17941, "loss": 1.5303, "learning_rate": 2.8616621787299182e-06, "epoch": 0.8938186277242072, "percentage": 89.38, "elapsed_time": "1 day, 13:57:07", "remaining_time": "4:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16037, "total_steps": 17941, "loss": 1.6509, "learning_rate": 2.8586937827173475e-06, "epoch": 0.8938743659773702, "percentage": 89.39, "elapsed_time": "1 day, 13:57:15", "remaining_time": "4:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16038, "total_steps": 17941, "loss": 1.4169, "learning_rate": 2.8557268817521577e-06, "epoch": 0.8939301042305334, "percentage": 89.39, "elapsed_time": "1 day, 13:57:24", "remaining_time": "4:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16039, "total_steps": 17941, "loss": 1.6065, "learning_rate": 2.8527614759284393e-06, "epoch": 0.8939858424836966, "percentage": 89.4, "elapsed_time": "1 day, 13:57:32", "remaining_time": "4:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16040, "total_steps": 17941, "loss": 1.498, "learning_rate": 2.8497975653402398e-06, "epoch": 0.8940415807368597, "percentage": 89.4, "elapsed_time": "1 day, 13:57:41", "remaining_time": "4:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16041, "total_steps": 17941, "loss": 1.5735, "learning_rate": 2.846835150081567e-06, "epoch": 0.8940973189900229, "percentage": 89.41, "elapsed_time": "1 day, 13:57:49", "remaining_time": "4:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16042, "total_steps": 17941, "loss": 1.4585, "learning_rate": 2.8438742302463463e-06, "epoch": 0.894153057243186, "percentage": 89.42, "elapsed_time": "1 day, 13:57:57", "remaining_time": "4:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16043, "total_steps": 17941, "loss": 1.5987, "learning_rate": 2.8409148059285074e-06, "epoch": 0.8942087954963491, "percentage": 89.42, "elapsed_time": "1 day, 13:58:06", "remaining_time": "4:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16044, "total_steps": 17941, "loss": 1.6512, "learning_rate": 2.8379568772218925e-06, "epoch": 0.8942645337495123, "percentage": 89.43, "elapsed_time": "1 day, 13:58:15", "remaining_time": "4:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16045, "total_steps": 17941, "loss": 1.5096, "learning_rate": 2.8350004442203093e-06, "epoch": 0.8943202720026754, "percentage": 89.43, "elapsed_time": "1 day, 13:58:23", "remaining_time": "4:29:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16046, "total_steps": 17941, "loss": 1.6152, "learning_rate": 2.832045507017517e-06, "epoch": 0.8943760102558386, "percentage": 89.44, "elapsed_time": "1 day, 13:58:31", "remaining_time": "4:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16047, "total_steps": 17941, "loss": 1.6592, "learning_rate": 2.8290920657072395e-06, "epoch": 0.8944317485090018, "percentage": 89.44, "elapsed_time": "1 day, 13:58:40", "remaining_time": "4:28:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16048, "total_steps": 17941, "loss": 1.6614, "learning_rate": 2.826140120383136e-06, "epoch": 0.8944874867621648, "percentage": 89.45, "elapsed_time": "1 day, 13:58:49", "remaining_time": "4:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16049, "total_steps": 17941, "loss": 1.7733, "learning_rate": 2.823189671138815e-06, "epoch": 0.894543225015328, "percentage": 89.45, "elapsed_time": "1 day, 13:58:57", "remaining_time": "4:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16050, "total_steps": 17941, "loss": 1.8013, "learning_rate": 2.8202407180678734e-06, "epoch": 0.8945989632684912, "percentage": 89.46, "elapsed_time": "1 day, 13:59:06", "remaining_time": "4:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16051, "total_steps": 17941, "loss": 1.6324, "learning_rate": 2.8172932612638094e-06, "epoch": 0.8946547015216543, "percentage": 89.47, "elapsed_time": "1 day, 13:59:14", "remaining_time": "4:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16052, "total_steps": 17941, "loss": 1.5339, "learning_rate": 2.8143473008201083e-06, "epoch": 0.8947104397748175, "percentage": 89.47, "elapsed_time": "1 day, 13:59:23", "remaining_time": "4:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16053, "total_steps": 17941, "loss": 1.4765, "learning_rate": 2.8114028368302016e-06, "epoch": 0.8947661780279806, "percentage": 89.48, "elapsed_time": "1 day, 13:59:31", "remaining_time": "4:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16054, "total_steps": 17941, "loss": 1.5913, "learning_rate": 2.8084598693874696e-06, "epoch": 0.8948219162811437, "percentage": 89.48, "elapsed_time": "1 day, 13:59:40", "remaining_time": "4:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16055, "total_steps": 17941, "loss": 1.4893, "learning_rate": 2.8055183985852495e-06, "epoch": 0.8948776545343069, "percentage": 89.49, "elapsed_time": "1 day, 13:59:49", "remaining_time": "4:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16056, "total_steps": 17941, "loss": 1.6404, "learning_rate": 2.8025784245168165e-06, "epoch": 0.8949333927874701, "percentage": 89.49, "elapsed_time": "1 day, 13:59:57", "remaining_time": "4:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16057, "total_steps": 17941, "loss": 1.6021, "learning_rate": 2.799639947275412e-06, "epoch": 0.8949891310406332, "percentage": 89.5, "elapsed_time": "1 day, 14:00:06", "remaining_time": "4:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16058, "total_steps": 17941, "loss": 1.5734, "learning_rate": 2.79670296695424e-06, "epoch": 0.8950448692937963, "percentage": 89.5, "elapsed_time": "1 day, 14:00:15", "remaining_time": "4:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16059, "total_steps": 17941, "loss": 1.7043, "learning_rate": 2.7937674836464256e-06, "epoch": 0.8951006075469595, "percentage": 89.51, "elapsed_time": "1 day, 14:00:23", "remaining_time": "4:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16060, "total_steps": 17941, "loss": 1.5945, "learning_rate": 2.7908334974450835e-06, "epoch": 0.8951563458001226, "percentage": 89.52, "elapsed_time": "1 day, 14:00:32", "remaining_time": "4:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16061, "total_steps": 17941, "loss": 1.8713, "learning_rate": 2.78790100844325e-06, "epoch": 0.8952120840532858, "percentage": 89.52, "elapsed_time": "1 day, 14:00:40", "remaining_time": "4:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16062, "total_steps": 17941, "loss": 1.5255, "learning_rate": 2.7849700167339397e-06, "epoch": 0.895267822306449, "percentage": 89.53, "elapsed_time": "1 day, 14:00:49", "remaining_time": "4:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16063, "total_steps": 17941, "loss": 1.5041, "learning_rate": 2.7820405224100898e-06, "epoch": 0.895323560559612, "percentage": 89.53, "elapsed_time": "1 day, 14:00:57", "remaining_time": "4:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16064, "total_steps": 17941, "loss": 1.7677, "learning_rate": 2.7791125255646146e-06, "epoch": 0.8953792988127752, "percentage": 89.54, "elapsed_time": "1 day, 14:01:06", "remaining_time": "4:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16065, "total_steps": 17941, "loss": 1.7189, "learning_rate": 2.7761860262903728e-06, "epoch": 0.8954350370659383, "percentage": 89.54, "elapsed_time": "1 day, 14:01:14", "remaining_time": "4:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16066, "total_steps": 17941, "loss": 1.5225, "learning_rate": 2.7732610246801737e-06, "epoch": 0.8954907753191015, "percentage": 89.55, "elapsed_time": "1 day, 14:01:23", "remaining_time": "4:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16067, "total_steps": 17941, "loss": 1.7542, "learning_rate": 2.7703375208267877e-06, "epoch": 0.8955465135722647, "percentage": 89.55, "elapsed_time": "1 day, 14:01:31", "remaining_time": "4:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16068, "total_steps": 17941, "loss": 1.5417, "learning_rate": 2.767415514822924e-06, "epoch": 0.8956022518254277, "percentage": 89.56, "elapsed_time": "1 day, 14:01:40", "remaining_time": "4:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16069, "total_steps": 17941, "loss": 1.7285, "learning_rate": 2.7644950067612694e-06, "epoch": 0.8956579900785909, "percentage": 89.57, "elapsed_time": "1 day, 14:01:48", "remaining_time": "4:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16070, "total_steps": 17941, "loss": 1.6136, "learning_rate": 2.7615759967344167e-06, "epoch": 0.8957137283317541, "percentage": 89.57, "elapsed_time": "1 day, 14:01:57", "remaining_time": "4:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16071, "total_steps": 17941, "loss": 2.0667, "learning_rate": 2.758658484834958e-06, "epoch": 0.8957694665849172, "percentage": 89.58, "elapsed_time": "1 day, 14:02:05", "remaining_time": "4:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16072, "total_steps": 17941, "loss": 1.5887, "learning_rate": 2.7557424711554146e-06, "epoch": 0.8958252048380804, "percentage": 89.58, "elapsed_time": "1 day, 14:02:14", "remaining_time": "4:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16073, "total_steps": 17941, "loss": 1.7353, "learning_rate": 2.7528279557882675e-06, "epoch": 0.8958809430912436, "percentage": 89.59, "elapsed_time": "1 day, 14:02:22", "remaining_time": "4:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16074, "total_steps": 17941, "loss": 1.6566, "learning_rate": 2.7499149388259536e-06, "epoch": 0.8959366813444066, "percentage": 89.59, "elapsed_time": "1 day, 14:02:32", "remaining_time": "4:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16075, "total_steps": 17941, "loss": 1.536, "learning_rate": 2.7470034203608384e-06, "epoch": 0.8959924195975698, "percentage": 89.6, "elapsed_time": "1 day, 14:02:40", "remaining_time": "4:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16076, "total_steps": 17941, "loss": 1.563, "learning_rate": 2.7440934004852816e-06, "epoch": 0.896048157850733, "percentage": 89.6, "elapsed_time": "1 day, 14:02:48", "remaining_time": "4:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16077, "total_steps": 17941, "loss": 1.8413, "learning_rate": 2.7411848792915585e-06, "epoch": 0.8961038961038961, "percentage": 89.61, "elapsed_time": "1 day, 14:02:57", "remaining_time": "4:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16078, "total_steps": 17941, "loss": 1.7377, "learning_rate": 2.7382778568719127e-06, "epoch": 0.8961596343570593, "percentage": 89.62, "elapsed_time": "1 day, 14:03:06", "remaining_time": "4:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16079, "total_steps": 17941, "loss": 1.5769, "learning_rate": 2.7353723333185365e-06, "epoch": 0.8962153726102224, "percentage": 89.62, "elapsed_time": "1 day, 14:03:14", "remaining_time": "4:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16080, "total_steps": 17941, "loss": 1.1935, "learning_rate": 2.7324683087235736e-06, "epoch": 0.8962711108633855, "percentage": 89.63, "elapsed_time": "1 day, 14:03:22", "remaining_time": "4:24:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16081, "total_steps": 17941, "loss": 1.5682, "learning_rate": 2.7295657831791387e-06, "epoch": 0.8963268491165487, "percentage": 89.63, "elapsed_time": "1 day, 14:03:31", "remaining_time": "4:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16082, "total_steps": 17941, "loss": 1.4302, "learning_rate": 2.7266647567772643e-06, "epoch": 0.8963825873697119, "percentage": 89.64, "elapsed_time": "1 day, 14:03:39", "remaining_time": "4:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16083, "total_steps": 17941, "loss": 1.7366, "learning_rate": 2.7237652296099646e-06, "epoch": 0.896438325622875, "percentage": 89.64, "elapsed_time": "1 day, 14:03:48", "remaining_time": "4:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16084, "total_steps": 17941, "loss": 1.5471, "learning_rate": 2.7208672017691893e-06, "epoch": 0.8964940638760381, "percentage": 89.65, "elapsed_time": "1 day, 14:03:56", "remaining_time": "4:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16085, "total_steps": 17941, "loss": 1.8768, "learning_rate": 2.717970673346848e-06, "epoch": 0.8965498021292013, "percentage": 89.65, "elapsed_time": "1 day, 14:04:05", "remaining_time": "4:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16086, "total_steps": 17941, "loss": 1.725, "learning_rate": 2.715075644434806e-06, "epoch": 0.8966055403823644, "percentage": 89.66, "elapsed_time": "1 day, 14:04:13", "remaining_time": "4:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16087, "total_steps": 17941, "loss": 1.4072, "learning_rate": 2.7121821151248726e-06, "epoch": 0.8966612786355276, "percentage": 89.67, "elapsed_time": "1 day, 14:04:22", "remaining_time": "4:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16088, "total_steps": 17941, "loss": 1.6065, "learning_rate": 2.70929008550882e-06, "epoch": 0.8967170168886907, "percentage": 89.67, "elapsed_time": "1 day, 14:04:30", "remaining_time": "4:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16089, "total_steps": 17941, "loss": 1.5687, "learning_rate": 2.706399555678357e-06, "epoch": 0.8967727551418538, "percentage": 89.68, "elapsed_time": "1 day, 14:04:39", "remaining_time": "4:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16090, "total_steps": 17941, "loss": 1.7931, "learning_rate": 2.7035105257251614e-06, "epoch": 0.896828493395017, "percentage": 89.68, "elapsed_time": "1 day, 14:04:47", "remaining_time": "4:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16091, "total_steps": 17941, "loss": 1.4986, "learning_rate": 2.7006229957408537e-06, "epoch": 0.8968842316481801, "percentage": 89.69, "elapsed_time": "1 day, 14:04:56", "remaining_time": "4:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16092, "total_steps": 17941, "loss": 1.5404, "learning_rate": 2.6977369658170105e-06, "epoch": 0.8969399699013433, "percentage": 89.69, "elapsed_time": "1 day, 14:05:04", "remaining_time": "4:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16093, "total_steps": 17941, "loss": 1.6416, "learning_rate": 2.6948524360451588e-06, "epoch": 0.8969957081545065, "percentage": 89.7, "elapsed_time": "1 day, 14:05:13", "remaining_time": "4:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16094, "total_steps": 17941, "loss": 1.3168, "learning_rate": 2.6919694065167756e-06, "epoch": 0.8970514464076695, "percentage": 89.71, "elapsed_time": "1 day, 14:05:21", "remaining_time": "4:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16095, "total_steps": 17941, "loss": 1.3254, "learning_rate": 2.6890878773233097e-06, "epoch": 0.8971071846608327, "percentage": 89.71, "elapsed_time": "1 day, 14:05:30", "remaining_time": "4:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16096, "total_steps": 17941, "loss": 1.7026, "learning_rate": 2.686207848556127e-06, "epoch": 0.8971629229139959, "percentage": 89.72, "elapsed_time": "1 day, 14:05:38", "remaining_time": "4:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16097, "total_steps": 17941, "loss": 1.8391, "learning_rate": 2.683329320306571e-06, "epoch": 0.897218661167159, "percentage": 89.72, "elapsed_time": "1 day, 14:05:47", "remaining_time": "4:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16098, "total_steps": 17941, "loss": 1.7414, "learning_rate": 2.6804522926659358e-06, "epoch": 0.8972743994203222, "percentage": 89.73, "elapsed_time": "1 day, 14:05:55", "remaining_time": "4:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16099, "total_steps": 17941, "loss": 1.8649, "learning_rate": 2.677576765725459e-06, "epoch": 0.8973301376734854, "percentage": 89.73, "elapsed_time": "1 day, 14:06:04", "remaining_time": "4:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16100, "total_steps": 17941, "loss": 1.6357, "learning_rate": 2.674702739576351e-06, "epoch": 0.8973858759266484, "percentage": 89.74, "elapsed_time": "1 day, 14:06:13", "remaining_time": "4:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16101, "total_steps": 17941, "loss": 1.6912, "learning_rate": 2.6718302143097283e-06, "epoch": 0.8974416141798116, "percentage": 89.74, "elapsed_time": "1 day, 14:06:21", "remaining_time": "4:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16102, "total_steps": 17941, "loss": 1.4666, "learning_rate": 2.668959190016723e-06, "epoch": 0.8974973524329748, "percentage": 89.75, "elapsed_time": "1 day, 14:06:29", "remaining_time": "4:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16103, "total_steps": 17941, "loss": 1.5336, "learning_rate": 2.666089666788363e-06, "epoch": 0.8975530906861379, "percentage": 89.76, "elapsed_time": "1 day, 14:06:38", "remaining_time": "4:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16104, "total_steps": 17941, "loss": 1.3672, "learning_rate": 2.6632216447156686e-06, "epoch": 0.897608828939301, "percentage": 89.76, "elapsed_time": "1 day, 14:06:47", "remaining_time": "4:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16105, "total_steps": 17941, "loss": 2.1044, "learning_rate": 2.6603551238895853e-06, "epoch": 0.8976645671924642, "percentage": 89.77, "elapsed_time": "1 day, 14:06:55", "remaining_time": "4:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16106, "total_steps": 17941, "loss": 1.8391, "learning_rate": 2.6574901044010337e-06, "epoch": 0.8977203054456273, "percentage": 89.77, "elapsed_time": "1 day, 14:07:04", "remaining_time": "4:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16107, "total_steps": 17941, "loss": 1.4328, "learning_rate": 2.654626586340875e-06, "epoch": 0.8977760436987905, "percentage": 89.78, "elapsed_time": "1 day, 14:07:12", "remaining_time": "4:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16108, "total_steps": 17941, "loss": 1.6311, "learning_rate": 2.651764569799908e-06, "epoch": 0.8978317819519537, "percentage": 89.78, "elapsed_time": "1 day, 14:07:21", "remaining_time": "4:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16109, "total_steps": 17941, "loss": 1.7373, "learning_rate": 2.648904054868917e-06, "epoch": 0.8978875202051168, "percentage": 89.79, "elapsed_time": "1 day, 14:07:29", "remaining_time": "4:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16110, "total_steps": 17941, "loss": 1.779, "learning_rate": 2.646045041638606e-06, "epoch": 0.8979432584582799, "percentage": 89.79, "elapsed_time": "1 day, 14:07:38", "remaining_time": "4:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16111, "total_steps": 17941, "loss": 1.683, "learning_rate": 2.6431875301996645e-06, "epoch": 0.897998996711443, "percentage": 89.8, "elapsed_time": "1 day, 14:07:46", "remaining_time": "4:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16112, "total_steps": 17941, "loss": 1.5908, "learning_rate": 2.6403315206426917e-06, "epoch": 0.8980547349646062, "percentage": 89.81, "elapsed_time": "1 day, 14:07:55", "remaining_time": "4:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16113, "total_steps": 17941, "loss": 1.7345, "learning_rate": 2.6374770130582815e-06, "epoch": 0.8981104732177694, "percentage": 89.81, "elapsed_time": "1 day, 14:08:03", "remaining_time": "4:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16114, "total_steps": 17941, "loss": 1.6287, "learning_rate": 2.6346240075369677e-06, "epoch": 0.8981662114709325, "percentage": 89.82, "elapsed_time": "1 day, 14:08:12", "remaining_time": "4:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16115, "total_steps": 17941, "loss": 1.5898, "learning_rate": 2.631772504169211e-06, "epoch": 0.8982219497240956, "percentage": 89.82, "elapsed_time": "1 day, 14:08:20", "remaining_time": "4:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16116, "total_steps": 17941, "loss": 1.8715, "learning_rate": 2.6289225030454555e-06, "epoch": 0.8982776879772588, "percentage": 89.83, "elapsed_time": "1 day, 14:08:29", "remaining_time": "4:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16117, "total_steps": 17941, "loss": 1.6249, "learning_rate": 2.626074004256085e-06, "epoch": 0.8983334262304219, "percentage": 89.83, "elapsed_time": "1 day, 14:08:37", "remaining_time": "4:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16118, "total_steps": 17941, "loss": 1.7873, "learning_rate": 2.6232270078914378e-06, "epoch": 0.8983891644835851, "percentage": 89.84, "elapsed_time": "1 day, 14:08:46", "remaining_time": "4:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16119, "total_steps": 17941, "loss": 1.4625, "learning_rate": 2.620381514041803e-06, "epoch": 0.8984449027367483, "percentage": 89.84, "elapsed_time": "1 day, 14:08:54", "remaining_time": "4:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16120, "total_steps": 17941, "loss": 1.7089, "learning_rate": 2.617537522797431e-06, "epoch": 0.8985006409899113, "percentage": 89.85, "elapsed_time": "1 day, 14:09:02", "remaining_time": "4:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16121, "total_steps": 17941, "loss": 1.8189, "learning_rate": 2.61469503424851e-06, "epoch": 0.8985563792430745, "percentage": 89.86, "elapsed_time": "1 day, 14:09:11", "remaining_time": "4:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16122, "total_steps": 17941, "loss": 1.8311, "learning_rate": 2.611854048485185e-06, "epoch": 0.8986121174962377, "percentage": 89.86, "elapsed_time": "1 day, 14:09:20", "remaining_time": "4:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16123, "total_steps": 17941, "loss": 1.6892, "learning_rate": 2.6090145655975505e-06, "epoch": 0.8986678557494008, "percentage": 89.87, "elapsed_time": "1 day, 14:09:28", "remaining_time": "4:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16124, "total_steps": 17941, "loss": 1.7123, "learning_rate": 2.6061765856756737e-06, "epoch": 0.898723594002564, "percentage": 89.87, "elapsed_time": "1 day, 14:09:37", "remaining_time": "4:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16125, "total_steps": 17941, "loss": 1.7274, "learning_rate": 2.603340108809543e-06, "epoch": 0.8987793322557271, "percentage": 89.88, "elapsed_time": "1 day, 14:09:45", "remaining_time": "4:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16126, "total_steps": 17941, "loss": 1.6002, "learning_rate": 2.600505135089132e-06, "epoch": 0.8988350705088902, "percentage": 89.88, "elapsed_time": "1 day, 14:09:53", "remaining_time": "4:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16127, "total_steps": 17941, "loss": 1.7723, "learning_rate": 2.5976716646043286e-06, "epoch": 0.8988908087620534, "percentage": 89.89, "elapsed_time": "1 day, 14:10:02", "remaining_time": "4:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16128, "total_steps": 17941, "loss": 1.4776, "learning_rate": 2.594839697445017e-06, "epoch": 0.8989465470152166, "percentage": 89.89, "elapsed_time": "1 day, 14:10:11", "remaining_time": "4:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16129, "total_steps": 17941, "loss": 1.7196, "learning_rate": 2.592009233700993e-06, "epoch": 0.8990022852683797, "percentage": 89.9, "elapsed_time": "1 day, 14:10:19", "remaining_time": "4:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16130, "total_steps": 17941, "loss": 1.7536, "learning_rate": 2.5891802734620273e-06, "epoch": 0.8990580235215428, "percentage": 89.91, "elapsed_time": "1 day, 14:10:27", "remaining_time": "4:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16131, "total_steps": 17941, "loss": 1.7116, "learning_rate": 2.5863528168178385e-06, "epoch": 0.899113761774706, "percentage": 89.91, "elapsed_time": "1 day, 14:10:36", "remaining_time": "4:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16132, "total_steps": 17941, "loss": 1.6725, "learning_rate": 2.583526863858099e-06, "epoch": 0.8991695000278691, "percentage": 89.92, "elapsed_time": "1 day, 14:10:44", "remaining_time": "4:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16133, "total_steps": 17941, "loss": 1.9008, "learning_rate": 2.5807024146724368e-06, "epoch": 0.8992252382810323, "percentage": 89.92, "elapsed_time": "1 day, 14:10:53", "remaining_time": "4:16:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16134, "total_steps": 17941, "loss": 1.6693, "learning_rate": 2.5778794693504136e-06, "epoch": 0.8992809765341954, "percentage": 89.93, "elapsed_time": "1 day, 14:11:01", "remaining_time": "4:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16135, "total_steps": 17941, "loss": 1.5989, "learning_rate": 2.575058027981564e-06, "epoch": 0.8993367147873585, "percentage": 89.93, "elapsed_time": "1 day, 14:11:10", "remaining_time": "4:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16136, "total_steps": 17941, "loss": 1.6231, "learning_rate": 2.5722380906553655e-06, "epoch": 0.8993924530405217, "percentage": 89.94, "elapsed_time": "1 day, 14:11:18", "remaining_time": "4:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16137, "total_steps": 17941, "loss": 1.5986, "learning_rate": 2.5694196574612585e-06, "epoch": 0.8994481912936848, "percentage": 89.94, "elapsed_time": "1 day, 14:11:27", "remaining_time": "4:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16138, "total_steps": 17941, "loss": 1.6638, "learning_rate": 2.5666027284886095e-06, "epoch": 0.899503929546848, "percentage": 89.95, "elapsed_time": "1 day, 14:11:35", "remaining_time": "4:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16139, "total_steps": 17941, "loss": 1.5928, "learning_rate": 2.56378730382677e-06, "epoch": 0.8995596678000112, "percentage": 89.96, "elapsed_time": "1 day, 14:11:44", "remaining_time": "4:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16140, "total_steps": 17941, "loss": 1.8026, "learning_rate": 2.560973383565035e-06, "epoch": 0.8996154060531742, "percentage": 89.96, "elapsed_time": "1 day, 14:11:52", "remaining_time": "4:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16141, "total_steps": 17941, "loss": 1.6094, "learning_rate": 2.558160967792622e-06, "epoch": 0.8996711443063374, "percentage": 89.97, "elapsed_time": "1 day, 14:12:01", "remaining_time": "4:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16142, "total_steps": 17941, "loss": 1.5472, "learning_rate": 2.5553500565987433e-06, "epoch": 0.8997268825595006, "percentage": 89.97, "elapsed_time": "1 day, 14:12:09", "remaining_time": "4:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16143, "total_steps": 17941, "loss": 1.5912, "learning_rate": 2.5525406500725378e-06, "epoch": 0.8997826208126637, "percentage": 89.98, "elapsed_time": "1 day, 14:12:18", "remaining_time": "4:15:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16144, "total_steps": 17941, "loss": 1.5085, "learning_rate": 2.5497327483031075e-06, "epoch": 0.8998383590658269, "percentage": 89.98, "elapsed_time": "1 day, 14:12:26", "remaining_time": "4:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16145, "total_steps": 17941, "loss": 1.0702, "learning_rate": 2.546926351379497e-06, "epoch": 0.8998940973189901, "percentage": 89.99, "elapsed_time": "1 day, 14:12:35", "remaining_time": "4:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16146, "total_steps": 17941, "loss": 1.78, "learning_rate": 2.544121459390714e-06, "epoch": 0.8999498355721531, "percentage": 89.99, "elapsed_time": "1 day, 14:12:44", "remaining_time": "4:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16147, "total_steps": 17941, "loss": 1.7871, "learning_rate": 2.5413180724257192e-06, "epoch": 0.9000055738253163, "percentage": 90.0, "elapsed_time": "1 day, 14:12:52", "remaining_time": "4:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16148, "total_steps": 17941, "loss": 1.626, "learning_rate": 2.5385161905734036e-06, "epoch": 0.9000613120784795, "percentage": 90.01, "elapsed_time": "1 day, 14:13:01", "remaining_time": "4:14:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16149, "total_steps": 17941, "loss": 1.6934, "learning_rate": 2.5357158139226347e-06, "epoch": 0.9001170503316426, "percentage": 90.01, "elapsed_time": "1 day, 14:13:10", "remaining_time": "4:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16150, "total_steps": 17941, "loss": 1.5418, "learning_rate": 2.5329169425622247e-06, "epoch": 0.9001727885848058, "percentage": 90.02, "elapsed_time": "1 day, 14:13:18", "remaining_time": "4:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16151, "total_steps": 17941, "loss": 1.8433, "learning_rate": 2.530119576580936e-06, "epoch": 0.900228526837969, "percentage": 90.02, "elapsed_time": "1 day, 14:13:27", "remaining_time": "4:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16152, "total_steps": 17941, "loss": 1.665, "learning_rate": 2.5273237160674924e-06, "epoch": 0.900284265091132, "percentage": 90.03, "elapsed_time": "1 day, 14:13:36", "remaining_time": "4:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16153, "total_steps": 17941, "loss": 1.4747, "learning_rate": 2.5245293611105393e-06, "epoch": 0.9003400033442952, "percentage": 90.03, "elapsed_time": "1 day, 14:13:44", "remaining_time": "4:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16154, "total_steps": 17941, "loss": 1.648, "learning_rate": 2.5217365117987334e-06, "epoch": 0.9003957415974584, "percentage": 90.04, "elapsed_time": "1 day, 14:13:53", "remaining_time": "4:13:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16155, "total_steps": 17941, "loss": 1.3829, "learning_rate": 2.5189451682206157e-06, "epoch": 0.9004514798506215, "percentage": 90.05, "elapsed_time": "1 day, 14:14:01", "remaining_time": "4:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16156, "total_steps": 17941, "loss": 1.8415, "learning_rate": 2.5161553304647256e-06, "epoch": 0.9005072181037846, "percentage": 90.05, "elapsed_time": "1 day, 14:14:10", "remaining_time": "4:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16157, "total_steps": 17941, "loss": 1.7705, "learning_rate": 2.513366998619543e-06, "epoch": 0.9005629563569477, "percentage": 90.06, "elapsed_time": "1 day, 14:14:18", "remaining_time": "4:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16158, "total_steps": 17941, "loss": 1.8471, "learning_rate": 2.5105801727734857e-06, "epoch": 0.9006186946101109, "percentage": 90.06, "elapsed_time": "1 day, 14:14:27", "remaining_time": "4:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16159, "total_steps": 17941, "loss": 1.5019, "learning_rate": 2.5077948530149554e-06, "epoch": 0.9006744328632741, "percentage": 90.07, "elapsed_time": "1 day, 14:14:35", "remaining_time": "4:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16160, "total_steps": 17941, "loss": 1.5259, "learning_rate": 2.5050110394322533e-06, "epoch": 0.9007301711164372, "percentage": 90.07, "elapsed_time": "1 day, 14:14:44", "remaining_time": "4:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16161, "total_steps": 17941, "loss": 1.7377, "learning_rate": 2.502228732113704e-06, "epoch": 0.9007859093696003, "percentage": 90.08, "elapsed_time": "1 day, 14:14:52", "remaining_time": "4:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16162, "total_steps": 17941, "loss": 1.6652, "learning_rate": 2.499447931147525e-06, "epoch": 0.9008416476227635, "percentage": 90.08, "elapsed_time": "1 day, 14:15:01", "remaining_time": "4:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16163, "total_steps": 17941, "loss": 1.5852, "learning_rate": 2.4966686366219127e-06, "epoch": 0.9008973858759266, "percentage": 90.09, "elapsed_time": "1 day, 14:15:09", "remaining_time": "4:12:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16164, "total_steps": 17941, "loss": 1.5853, "learning_rate": 2.493890848624991e-06, "epoch": 0.9009531241290898, "percentage": 90.1, "elapsed_time": "1 day, 14:15:17", "remaining_time": "4:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16165, "total_steps": 17941, "loss": 1.6512, "learning_rate": 2.491114567244884e-06, "epoch": 0.901008862382253, "percentage": 90.1, "elapsed_time": "1 day, 14:15:26", "remaining_time": "4:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16166, "total_steps": 17941, "loss": 1.6572, "learning_rate": 2.488339792569633e-06, "epoch": 0.901064600635416, "percentage": 90.11, "elapsed_time": "1 day, 14:15:34", "remaining_time": "4:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16167, "total_steps": 17941, "loss": 1.6004, "learning_rate": 2.4855665246872216e-06, "epoch": 0.9011203388885792, "percentage": 90.11, "elapsed_time": "1 day, 14:15:43", "remaining_time": "4:11:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16168, "total_steps": 17941, "loss": 1.6282, "learning_rate": 2.4827947636856142e-06, "epoch": 0.9011760771417424, "percentage": 90.12, "elapsed_time": "1 day, 14:15:52", "remaining_time": "4:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16169, "total_steps": 17941, "loss": 1.6305, "learning_rate": 2.480024509652712e-06, "epoch": 0.9012318153949055, "percentage": 90.12, "elapsed_time": "1 day, 14:16:00", "remaining_time": "4:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16170, "total_steps": 17941, "loss": 1.6547, "learning_rate": 2.477255762676367e-06, "epoch": 0.9012875536480687, "percentage": 90.13, "elapsed_time": "1 day, 14:16:08", "remaining_time": "4:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16171, "total_steps": 17941, "loss": 1.7767, "learning_rate": 2.474488522844398e-06, "epoch": 0.9013432919012319, "percentage": 90.13, "elapsed_time": "1 day, 14:16:17", "remaining_time": "4:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16172, "total_steps": 17941, "loss": 1.5718, "learning_rate": 2.4717227902445573e-06, "epoch": 0.9013990301543949, "percentage": 90.14, "elapsed_time": "1 day, 14:16:26", "remaining_time": "4:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16173, "total_steps": 17941, "loss": 1.8284, "learning_rate": 2.4689585649645685e-06, "epoch": 0.9014547684075581, "percentage": 90.15, "elapsed_time": "1 day, 14:16:34", "remaining_time": "4:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16174, "total_steps": 17941, "loss": 1.7134, "learning_rate": 2.4661958470920844e-06, "epoch": 0.9015105066607213, "percentage": 90.15, "elapsed_time": "1 day, 14:16:43", "remaining_time": "4:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16175, "total_steps": 17941, "loss": 1.4603, "learning_rate": 2.4634346367147233e-06, "epoch": 0.9015662449138844, "percentage": 90.16, "elapsed_time": "1 day, 14:16:51", "remaining_time": "4:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16176, "total_steps": 17941, "loss": 1.3745, "learning_rate": 2.4606749339200595e-06, "epoch": 0.9016219831670476, "percentage": 90.16, "elapsed_time": "1 day, 14:17:00", "remaining_time": "4:10:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16177, "total_steps": 17941, "loss": 1.5152, "learning_rate": 2.4579167387956127e-06, "epoch": 0.9016777214202107, "percentage": 90.17, "elapsed_time": "1 day, 14:17:08", "remaining_time": "4:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16178, "total_steps": 17941, "loss": 1.8504, "learning_rate": 2.4551600514288674e-06, "epoch": 0.9017334596733738, "percentage": 90.17, "elapsed_time": "1 day, 14:17:17", "remaining_time": "4:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16179, "total_steps": 17941, "loss": 1.5154, "learning_rate": 2.4524048719072214e-06, "epoch": 0.901789197926537, "percentage": 90.18, "elapsed_time": "1 day, 14:17:25", "remaining_time": "4:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16180, "total_steps": 17941, "loss": 1.481, "learning_rate": 2.449651200318087e-06, "epoch": 0.9018449361797001, "percentage": 90.18, "elapsed_time": "1 day, 14:17:34", "remaining_time": "4:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16181, "total_steps": 17941, "loss": 1.5498, "learning_rate": 2.446899036748773e-06, "epoch": 0.9019006744328633, "percentage": 90.19, "elapsed_time": "1 day, 14:17:42", "remaining_time": "4:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16182, "total_steps": 17941, "loss": 1.5103, "learning_rate": 2.444148381286565e-06, "epoch": 0.9019564126860264, "percentage": 90.2, "elapsed_time": "1 day, 14:17:50", "remaining_time": "4:09:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16183, "total_steps": 17941, "loss": 1.6951, "learning_rate": 2.441399234018704e-06, "epoch": 0.9020121509391895, "percentage": 90.2, "elapsed_time": "1 day, 14:17:59", "remaining_time": "4:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16184, "total_steps": 17941, "loss": 1.7548, "learning_rate": 2.4386515950323705e-06, "epoch": 0.9020678891923527, "percentage": 90.21, "elapsed_time": "1 day, 14:18:07", "remaining_time": "4:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16185, "total_steps": 17941, "loss": 1.5964, "learning_rate": 2.4359054644147117e-06, "epoch": 0.9021236274455159, "percentage": 90.21, "elapsed_time": "1 day, 14:18:16", "remaining_time": "4:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16186, "total_steps": 17941, "loss": 1.7819, "learning_rate": 2.433160842252802e-06, "epoch": 0.902179365698679, "percentage": 90.22, "elapsed_time": "1 day, 14:18:25", "remaining_time": "4:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16187, "total_steps": 17941, "loss": 1.5818, "learning_rate": 2.4304177286337102e-06, "epoch": 0.9022351039518421, "percentage": 90.22, "elapsed_time": "1 day, 14:18:33", "remaining_time": "4:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16188, "total_steps": 17941, "loss": 1.6073, "learning_rate": 2.4276761236444125e-06, "epoch": 0.9022908422050053, "percentage": 90.23, "elapsed_time": "1 day, 14:18:42", "remaining_time": "4:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16189, "total_steps": 17941, "loss": 1.696, "learning_rate": 2.4249360273718714e-06, "epoch": 0.9023465804581684, "percentage": 90.23, "elapsed_time": "1 day, 14:18:50", "remaining_time": "4:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16190, "total_steps": 17941, "loss": 1.7948, "learning_rate": 2.4221974399029625e-06, "epoch": 0.9024023187113316, "percentage": 90.24, "elapsed_time": "1 day, 14:18:58", "remaining_time": "4:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16191, "total_steps": 17941, "loss": 1.5173, "learning_rate": 2.4194603613245546e-06, "epoch": 0.9024580569644948, "percentage": 90.25, "elapsed_time": "1 day, 14:19:07", "remaining_time": "4:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16192, "total_steps": 17941, "loss": 1.8802, "learning_rate": 2.4167247917234626e-06, "epoch": 0.9025137952176578, "percentage": 90.25, "elapsed_time": "1 day, 14:19:16", "remaining_time": "4:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16193, "total_steps": 17941, "loss": 1.5677, "learning_rate": 2.413990731186422e-06, "epoch": 0.902569533470821, "percentage": 90.26, "elapsed_time": "1 day, 14:19:24", "remaining_time": "4:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16194, "total_steps": 17941, "loss": 1.5949, "learning_rate": 2.4112581798001464e-06, "epoch": 0.9026252717239842, "percentage": 90.26, "elapsed_time": "1 day, 14:19:33", "remaining_time": "4:08:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16195, "total_steps": 17941, "loss": 1.9555, "learning_rate": 2.4085271376513065e-06, "epoch": 0.9026810099771473, "percentage": 90.27, "elapsed_time": "1 day, 14:19:41", "remaining_time": "4:07:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16196, "total_steps": 17941, "loss": 1.7255, "learning_rate": 2.405797604826504e-06, "epoch": 0.9027367482303105, "percentage": 90.27, "elapsed_time": "1 day, 14:19:50", "remaining_time": "4:07:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16197, "total_steps": 17941, "loss": 1.6104, "learning_rate": 2.4030695814123094e-06, "epoch": 0.9027924864834737, "percentage": 90.28, "elapsed_time": "1 day, 14:19:58", "remaining_time": "4:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16198, "total_steps": 17941, "loss": 1.6265, "learning_rate": 2.4003430674952366e-06, "epoch": 0.9028482247366367, "percentage": 90.28, "elapsed_time": "1 day, 14:20:07", "remaining_time": "4:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16199, "total_steps": 17941, "loss": 1.5713, "learning_rate": 2.3976180631617605e-06, "epoch": 0.9029039629897999, "percentage": 90.29, "elapsed_time": "1 day, 14:20:15", "remaining_time": "4:07:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16200, "total_steps": 17941, "loss": 1.6233, "learning_rate": 2.394894568498296e-06, "epoch": 0.9029597012429631, "percentage": 90.3, "elapsed_time": "1 day, 14:20:24", "remaining_time": "4:07:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16201, "total_steps": 17941, "loss": 1.7263, "learning_rate": 2.392172583591218e-06, "epoch": 0.9030154394961262, "percentage": 90.3, "elapsed_time": "1 day, 14:20:32", "remaining_time": "4:07:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16202, "total_steps": 17941, "loss": 1.6395, "learning_rate": 2.3894521085268516e-06, "epoch": 0.9030711777492894, "percentage": 90.31, "elapsed_time": "1 day, 14:20:41", "remaining_time": "4:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16203, "total_steps": 17941, "loss": 1.4497, "learning_rate": 2.3867331433914787e-06, "epoch": 0.9031269160024524, "percentage": 90.31, "elapsed_time": "1 day, 14:20:50", "remaining_time": "4:06:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16204, "total_steps": 17941, "loss": 1.688, "learning_rate": 2.3840156882713293e-06, "epoch": 0.9031826542556156, "percentage": 90.32, "elapsed_time": "1 day, 14:20:59", "remaining_time": "4:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16205, "total_steps": 17941, "loss": 1.6415, "learning_rate": 2.3812997432525687e-06, "epoch": 0.9032383925087788, "percentage": 90.32, "elapsed_time": "1 day, 14:21:07", "remaining_time": "4:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16206, "total_steps": 17941, "loss": 1.5103, "learning_rate": 2.3785853084213604e-06, "epoch": 0.9032941307619419, "percentage": 90.33, "elapsed_time": "1 day, 14:21:16", "remaining_time": "4:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16207, "total_steps": 17941, "loss": 1.7707, "learning_rate": 2.3758723838637643e-06, "epoch": 0.9033498690151051, "percentage": 90.33, "elapsed_time": "1 day, 14:21:24", "remaining_time": "4:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16208, "total_steps": 17941, "loss": 1.6635, "learning_rate": 2.373160969665833e-06, "epoch": 0.9034056072682682, "percentage": 90.34, "elapsed_time": "1 day, 14:21:33", "remaining_time": "4:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16209, "total_steps": 17941, "loss": 1.7736, "learning_rate": 2.370451065913548e-06, "epoch": 0.9034613455214313, "percentage": 90.35, "elapsed_time": "1 day, 14:21:41", "remaining_time": "4:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16210, "total_steps": 17941, "loss": 1.4639, "learning_rate": 2.367742672692852e-06, "epoch": 0.9035170837745945, "percentage": 90.35, "elapsed_time": "1 day, 14:21:50", "remaining_time": "4:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16211, "total_steps": 17941, "loss": 1.6669, "learning_rate": 2.3650357900896536e-06, "epoch": 0.9035728220277577, "percentage": 90.36, "elapsed_time": "1 day, 14:21:58", "remaining_time": "4:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16212, "total_steps": 17941, "loss": 1.8263, "learning_rate": 2.362330418189779e-06, "epoch": 0.9036285602809208, "percentage": 90.36, "elapsed_time": "1 day, 14:22:07", "remaining_time": "4:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16213, "total_steps": 17941, "loss": 1.5759, "learning_rate": 2.359626557079042e-06, "epoch": 0.9036842985340839, "percentage": 90.37, "elapsed_time": "1 day, 14:22:16", "remaining_time": "4:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16214, "total_steps": 17941, "loss": 1.4883, "learning_rate": 2.3569242068431863e-06, "epoch": 0.9037400367872471, "percentage": 90.37, "elapsed_time": "1 day, 14:22:24", "remaining_time": "4:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16215, "total_steps": 17941, "loss": 1.7013, "learning_rate": 2.354223367567926e-06, "epoch": 0.9037957750404102, "percentage": 90.38, "elapsed_time": "1 day, 14:22:33", "remaining_time": "4:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16216, "total_steps": 17941, "loss": 1.737, "learning_rate": 2.351524039338887e-06, "epoch": 0.9038515132935734, "percentage": 90.39, "elapsed_time": "1 day, 14:22:42", "remaining_time": "4:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16217, "total_steps": 17941, "loss": 1.7467, "learning_rate": 2.3488262222417067e-06, "epoch": 0.9039072515467366, "percentage": 90.39, "elapsed_time": "1 day, 14:22:50", "remaining_time": "4:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16218, "total_steps": 17941, "loss": 1.6631, "learning_rate": 2.346129916361939e-06, "epoch": 0.9039629897998996, "percentage": 90.4, "elapsed_time": "1 day, 14:22:59", "remaining_time": "4:04:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16219, "total_steps": 17941, "loss": 1.7187, "learning_rate": 2.3434351217850815e-06, "epoch": 0.9040187280530628, "percentage": 90.4, "elapsed_time": "1 day, 14:23:07", "remaining_time": "4:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16220, "total_steps": 17941, "loss": 1.5157, "learning_rate": 2.340741838596605e-06, "epoch": 0.904074466306226, "percentage": 90.41, "elapsed_time": "1 day, 14:23:16", "remaining_time": "4:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16221, "total_steps": 17941, "loss": 1.5417, "learning_rate": 2.3380500668819193e-06, "epoch": 0.9041302045593891, "percentage": 90.41, "elapsed_time": "1 day, 14:23:25", "remaining_time": "4:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16222, "total_steps": 17941, "loss": 1.6474, "learning_rate": 2.3353598067264114e-06, "epoch": 0.9041859428125523, "percentage": 90.42, "elapsed_time": "1 day, 14:23:34", "remaining_time": "4:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16223, "total_steps": 17941, "loss": 1.5528, "learning_rate": 2.3326710582153687e-06, "epoch": 0.9042416810657155, "percentage": 90.42, "elapsed_time": "1 day, 14:23:43", "remaining_time": "4:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16224, "total_steps": 17941, "loss": 1.7656, "learning_rate": 2.3299838214340898e-06, "epoch": 0.9042974193188785, "percentage": 90.43, "elapsed_time": "1 day, 14:23:51", "remaining_time": "4:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16225, "total_steps": 17941, "loss": 1.5688, "learning_rate": 2.3272980964677947e-06, "epoch": 0.9043531575720417, "percentage": 90.44, "elapsed_time": "1 day, 14:24:00", "remaining_time": "4:03:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16226, "total_steps": 17941, "loss": 1.4842, "learning_rate": 2.324613883401644e-06, "epoch": 0.9044088958252048, "percentage": 90.44, "elapsed_time": "1 day, 14:24:08", "remaining_time": "4:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16227, "total_steps": 17941, "loss": 1.5161, "learning_rate": 2.3219311823207748e-06, "epoch": 0.904464634078368, "percentage": 90.45, "elapsed_time": "1 day, 14:24:17", "remaining_time": "4:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16228, "total_steps": 17941, "loss": 1.6988, "learning_rate": 2.3192499933102683e-06, "epoch": 0.9045203723315312, "percentage": 90.45, "elapsed_time": "1 day, 14:24:26", "remaining_time": "4:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16229, "total_steps": 17941, "loss": 1.5747, "learning_rate": 2.316570316455152e-06, "epoch": 0.9045761105846942, "percentage": 90.46, "elapsed_time": "1 day, 14:24:34", "remaining_time": "4:03:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16230, "total_steps": 17941, "loss": 1.5106, "learning_rate": 2.313892151840419e-06, "epoch": 0.9046318488378574, "percentage": 90.46, "elapsed_time": "1 day, 14:24:42", "remaining_time": "4:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16231, "total_steps": 17941, "loss": 1.5141, "learning_rate": 2.311215499550984e-06, "epoch": 0.9046875870910206, "percentage": 90.47, "elapsed_time": "1 day, 14:24:51", "remaining_time": "4:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16232, "total_steps": 17941, "loss": 1.6803, "learning_rate": 2.3085403596717623e-06, "epoch": 0.9047433253441837, "percentage": 90.47, "elapsed_time": "1 day, 14:25:00", "remaining_time": "4:02:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16233, "total_steps": 17941, "loss": 1.718, "learning_rate": 2.3058667322875705e-06, "epoch": 0.9047990635973469, "percentage": 90.48, "elapsed_time": "1 day, 14:25:09", "remaining_time": "4:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16234, "total_steps": 17941, "loss": 1.7267, "learning_rate": 2.303194617483212e-06, "epoch": 0.90485480185051, "percentage": 90.49, "elapsed_time": "1 day, 14:25:17", "remaining_time": "4:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16235, "total_steps": 17941, "loss": 1.8153, "learning_rate": 2.3005240153434306e-06, "epoch": 0.9049105401036731, "percentage": 90.49, "elapsed_time": "1 day, 14:25:26", "remaining_time": "4:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16236, "total_steps": 17941, "loss": 1.5595, "learning_rate": 2.2978549259529137e-06, "epoch": 0.9049662783568363, "percentage": 90.5, "elapsed_time": "1 day, 14:25:34", "remaining_time": "4:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16237, "total_steps": 17941, "loss": 1.6735, "learning_rate": 2.2951873493963274e-06, "epoch": 0.9050220166099995, "percentage": 90.5, "elapsed_time": "1 day, 14:25:43", "remaining_time": "4:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16238, "total_steps": 17941, "loss": 1.4991, "learning_rate": 2.292521285758248e-06, "epoch": 0.9050777548631626, "percentage": 90.51, "elapsed_time": "1 day, 14:25:51", "remaining_time": "4:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16239, "total_steps": 17941, "loss": 1.5668, "learning_rate": 2.2898567351232524e-06, "epoch": 0.9051334931163257, "percentage": 90.51, "elapsed_time": "1 day, 14:26:00", "remaining_time": "4:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16240, "total_steps": 17941, "loss": 1.8032, "learning_rate": 2.2871936975758234e-06, "epoch": 0.9051892313694889, "percentage": 90.52, "elapsed_time": "1 day, 14:26:08", "remaining_time": "4:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16241, "total_steps": 17941, "loss": 1.8109, "learning_rate": 2.2845321732004267e-06, "epoch": 0.905244969622652, "percentage": 90.52, "elapsed_time": "1 day, 14:26:17", "remaining_time": "4:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16242, "total_steps": 17941, "loss": 1.6465, "learning_rate": 2.2818721620814665e-06, "epoch": 0.9053007078758152, "percentage": 90.53, "elapsed_time": "1 day, 14:26:25", "remaining_time": "4:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16243, "total_steps": 17941, "loss": 1.9135, "learning_rate": 2.2792136643033036e-06, "epoch": 0.9053564461289784, "percentage": 90.54, "elapsed_time": "1 day, 14:26:34", "remaining_time": "4:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16244, "total_steps": 17941, "loss": 1.4893, "learning_rate": 2.2765566799502647e-06, "epoch": 0.9054121843821414, "percentage": 90.54, "elapsed_time": "1 day, 14:26:42", "remaining_time": "4:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16245, "total_steps": 17941, "loss": 1.6798, "learning_rate": 2.273901209106588e-06, "epoch": 0.9054679226353046, "percentage": 90.55, "elapsed_time": "1 day, 14:26:50", "remaining_time": "4:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16246, "total_steps": 17941, "loss": 1.6062, "learning_rate": 2.2712472518565065e-06, "epoch": 0.9055236608884678, "percentage": 90.55, "elapsed_time": "1 day, 14:26:59", "remaining_time": "4:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16247, "total_steps": 17941, "loss": 1.3619, "learning_rate": 2.268594808284186e-06, "epoch": 0.9055793991416309, "percentage": 90.56, "elapsed_time": "1 day, 14:27:07", "remaining_time": "4:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16248, "total_steps": 17941, "loss": 1.8227, "learning_rate": 2.2659438784737476e-06, "epoch": 0.9056351373947941, "percentage": 90.56, "elapsed_time": "1 day, 14:27:16", "remaining_time": "4:00:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16249, "total_steps": 17941, "loss": 1.7411, "learning_rate": 2.263294462509247e-06, "epoch": 0.9056908756479571, "percentage": 90.57, "elapsed_time": "1 day, 14:27:24", "remaining_time": "4:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16250, "total_steps": 17941, "loss": 1.694, "learning_rate": 2.260646560474733e-06, "epoch": 0.9057466139011203, "percentage": 90.57, "elapsed_time": "1 day, 14:27:33", "remaining_time": "4:00:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16251, "total_steps": 17941, "loss": 1.6663, "learning_rate": 2.2580001724541723e-06, "epoch": 0.9058023521542835, "percentage": 90.58, "elapsed_time": "1 day, 14:27:41", "remaining_time": "3:59:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16252, "total_steps": 17941, "loss": 1.7592, "learning_rate": 2.2553552985314864e-06, "epoch": 0.9058580904074466, "percentage": 90.59, "elapsed_time": "1 day, 14:27:50", "remaining_time": "3:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16253, "total_steps": 17941, "loss": 1.5501, "learning_rate": 2.2527119387905582e-06, "epoch": 0.9059138286606098, "percentage": 90.59, "elapsed_time": "1 day, 14:27:58", "remaining_time": "3:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16254, "total_steps": 17941, "loss": 1.4766, "learning_rate": 2.2500700933152264e-06, "epoch": 0.905969566913773, "percentage": 90.6, "elapsed_time": "1 day, 14:28:07", "remaining_time": "3:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16255, "total_steps": 17941, "loss": 1.4374, "learning_rate": 2.2474297621892628e-06, "epoch": 0.906025305166936, "percentage": 90.6, "elapsed_time": "1 day, 14:28:15", "remaining_time": "3:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16256, "total_steps": 17941, "loss": 1.4, "learning_rate": 2.244790945496422e-06, "epoch": 0.9060810434200992, "percentage": 90.61, "elapsed_time": "1 day, 14:28:24", "remaining_time": "3:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16257, "total_steps": 17941, "loss": 1.5911, "learning_rate": 2.242153643320366e-06, "epoch": 0.9061367816732624, "percentage": 90.61, "elapsed_time": "1 day, 14:28:32", "remaining_time": "3:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16258, "total_steps": 17941, "loss": 1.6573, "learning_rate": 2.2395178557447605e-06, "epoch": 0.9061925199264255, "percentage": 90.62, "elapsed_time": "1 day, 14:28:41", "remaining_time": "3:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16259, "total_steps": 17941, "loss": 1.6426, "learning_rate": 2.2368835828531774e-06, "epoch": 0.9062482581795887, "percentage": 90.62, "elapsed_time": "1 day, 14:28:49", "remaining_time": "3:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16260, "total_steps": 17941, "loss": 1.6886, "learning_rate": 2.234250824729173e-06, "epoch": 0.9063039964327518, "percentage": 90.63, "elapsed_time": "1 day, 14:28:58", "remaining_time": "3:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16261, "total_steps": 17941, "loss": 1.5702, "learning_rate": 2.2316195814562345e-06, "epoch": 0.9063597346859149, "percentage": 90.64, "elapsed_time": "1 day, 14:29:06", "remaining_time": "3:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16262, "total_steps": 17941, "loss": 1.6387, "learning_rate": 2.228989853117819e-06, "epoch": 0.9064154729390781, "percentage": 90.64, "elapsed_time": "1 day, 14:29:15", "remaining_time": "3:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16263, "total_steps": 17941, "loss": 1.5259, "learning_rate": 2.226361639797325e-06, "epoch": 0.9064712111922413, "percentage": 90.65, "elapsed_time": "1 day, 14:29:23", "remaining_time": "3:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16264, "total_steps": 17941, "loss": 1.6076, "learning_rate": 2.2237349415780873e-06, "epoch": 0.9065269494454044, "percentage": 90.65, "elapsed_time": "1 day, 14:29:32", "remaining_time": "3:58:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16265, "total_steps": 17941, "loss": 1.6696, "learning_rate": 2.2211097585434324e-06, "epoch": 0.9065826876985675, "percentage": 90.66, "elapsed_time": "1 day, 14:29:40", "remaining_time": "3:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16266, "total_steps": 17941, "loss": 1.6529, "learning_rate": 2.2184860907766e-06, "epoch": 0.9066384259517307, "percentage": 90.66, "elapsed_time": "1 day, 14:29:49", "remaining_time": "3:57:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16267, "total_steps": 17941, "loss": 1.5219, "learning_rate": 2.215863938360807e-06, "epoch": 0.9066941642048938, "percentage": 90.67, "elapsed_time": "1 day, 14:29:58", "remaining_time": "3:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16268, "total_steps": 17941, "loss": 1.5906, "learning_rate": 2.2132433013792087e-06, "epoch": 0.906749902458057, "percentage": 90.67, "elapsed_time": "1 day, 14:30:07", "remaining_time": "3:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16269, "total_steps": 17941, "loss": 1.6548, "learning_rate": 2.2106241799149165e-06, "epoch": 0.9068056407112202, "percentage": 90.68, "elapsed_time": "1 day, 14:30:15", "remaining_time": "3:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16270, "total_steps": 17941, "loss": 1.6273, "learning_rate": 2.208006574050997e-06, "epoch": 0.9068613789643832, "percentage": 90.69, "elapsed_time": "1 day, 14:30:24", "remaining_time": "3:57:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16271, "total_steps": 17941, "loss": 1.6253, "learning_rate": 2.2053904838704564e-06, "epoch": 0.9069171172175464, "percentage": 90.69, "elapsed_time": "1 day, 14:30:33", "remaining_time": "3:57:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16272, "total_steps": 17941, "loss": 1.5816, "learning_rate": 2.2027759094562726e-06, "epoch": 0.9069728554707095, "percentage": 90.7, "elapsed_time": "1 day, 14:30:41", "remaining_time": "3:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16273, "total_steps": 17941, "loss": 1.8245, "learning_rate": 2.200162850891352e-06, "epoch": 0.9070285937238727, "percentage": 90.7, "elapsed_time": "1 day, 14:30:50", "remaining_time": "3:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16274, "total_steps": 17941, "loss": 1.6826, "learning_rate": 2.1975513082585885e-06, "epoch": 0.9070843319770359, "percentage": 90.71, "elapsed_time": "1 day, 14:30:58", "remaining_time": "3:56:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16275, "total_steps": 17941, "loss": 1.4705, "learning_rate": 2.194941281640772e-06, "epoch": 0.9071400702301989, "percentage": 90.71, "elapsed_time": "1 day, 14:31:06", "remaining_time": "3:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16276, "total_steps": 17941, "loss": 1.8863, "learning_rate": 2.192332771120703e-06, "epoch": 0.9071958084833621, "percentage": 90.72, "elapsed_time": "1 day, 14:31:15", "remaining_time": "3:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16277, "total_steps": 17941, "loss": 1.5036, "learning_rate": 2.189725776781104e-06, "epoch": 0.9072515467365253, "percentage": 90.73, "elapsed_time": "1 day, 14:31:24", "remaining_time": "3:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16278, "total_steps": 17941, "loss": 1.7201, "learning_rate": 2.187120298704648e-06, "epoch": 0.9073072849896884, "percentage": 90.73, "elapsed_time": "1 day, 14:31:32", "remaining_time": "3:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16279, "total_steps": 17941, "loss": 1.4208, "learning_rate": 2.184516336973963e-06, "epoch": 0.9073630232428516, "percentage": 90.74, "elapsed_time": "1 day, 14:31:41", "remaining_time": "3:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16280, "total_steps": 17941, "loss": 1.6301, "learning_rate": 2.1819138916716386e-06, "epoch": 0.9074187614960147, "percentage": 90.74, "elapsed_time": "1 day, 14:31:49", "remaining_time": "3:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16281, "total_steps": 17941, "loss": 1.756, "learning_rate": 2.179312962880209e-06, "epoch": 0.9074744997491778, "percentage": 90.75, "elapsed_time": "1 day, 14:31:58", "remaining_time": "3:55:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16282, "total_steps": 17941, "loss": 1.5911, "learning_rate": 2.1767135506821636e-06, "epoch": 0.907530238002341, "percentage": 90.75, "elapsed_time": "1 day, 14:32:06", "remaining_time": "3:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16283, "total_steps": 17941, "loss": 1.6621, "learning_rate": 2.1741156551599196e-06, "epoch": 0.9075859762555042, "percentage": 90.76, "elapsed_time": "1 day, 14:32:15", "remaining_time": "3:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16284, "total_steps": 17941, "loss": 1.6103, "learning_rate": 2.1715192763959e-06, "epoch": 0.9076417145086673, "percentage": 90.76, "elapsed_time": "1 day, 14:32:23", "remaining_time": "3:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16285, "total_steps": 17941, "loss": 1.8086, "learning_rate": 2.1689244144724173e-06, "epoch": 0.9076974527618304, "percentage": 90.77, "elapsed_time": "1 day, 14:32:32", "remaining_time": "3:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16286, "total_steps": 17941, "loss": 1.7998, "learning_rate": 2.1663310694717832e-06, "epoch": 0.9077531910149936, "percentage": 90.78, "elapsed_time": "1 day, 14:32:41", "remaining_time": "3:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16287, "total_steps": 17941, "loss": 1.4457, "learning_rate": 2.163739241476237e-06, "epoch": 0.9078089292681567, "percentage": 90.78, "elapsed_time": "1 day, 14:32:49", "remaining_time": "3:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16288, "total_steps": 17941, "loss": 1.3774, "learning_rate": 2.1611489305679743e-06, "epoch": 0.9078646675213199, "percentage": 90.79, "elapsed_time": "1 day, 14:32:58", "remaining_time": "3:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16289, "total_steps": 17941, "loss": 1.5493, "learning_rate": 2.1585601368291574e-06, "epoch": 0.9079204057744831, "percentage": 90.79, "elapsed_time": "1 day, 14:33:06", "remaining_time": "3:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16290, "total_steps": 17941, "loss": 1.6492, "learning_rate": 2.155972860341865e-06, "epoch": 0.9079761440276461, "percentage": 90.8, "elapsed_time": "1 day, 14:33:15", "remaining_time": "3:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16291, "total_steps": 17941, "loss": 1.5392, "learning_rate": 2.1533871011881757e-06, "epoch": 0.9080318822808093, "percentage": 90.8, "elapsed_time": "1 day, 14:33:24", "remaining_time": "3:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16292, "total_steps": 17941, "loss": 1.6312, "learning_rate": 2.150802859450074e-06, "epoch": 0.9080876205339725, "percentage": 90.81, "elapsed_time": "1 day, 14:33:32", "remaining_time": "3:54:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16293, "total_steps": 17941, "loss": 1.7963, "learning_rate": 2.1482201352095275e-06, "epoch": 0.9081433587871356, "percentage": 90.81, "elapsed_time": "1 day, 14:33:41", "remaining_time": "3:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16294, "total_steps": 17941, "loss": 1.529, "learning_rate": 2.1456389285484437e-06, "epoch": 0.9081990970402988, "percentage": 90.82, "elapsed_time": "1 day, 14:33:49", "remaining_time": "3:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16295, "total_steps": 17941, "loss": 1.4003, "learning_rate": 2.143059239548678e-06, "epoch": 0.9082548352934618, "percentage": 90.83, "elapsed_time": "1 day, 14:33:58", "remaining_time": "3:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16296, "total_steps": 17941, "loss": 1.6012, "learning_rate": 2.140481068292061e-06, "epoch": 0.908310573546625, "percentage": 90.83, "elapsed_time": "1 day, 14:34:06", "remaining_time": "3:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16297, "total_steps": 17941, "loss": 1.6037, "learning_rate": 2.137904414860331e-06, "epoch": 0.9083663117997882, "percentage": 90.84, "elapsed_time": "1 day, 14:34:15", "remaining_time": "3:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16298, "total_steps": 17941, "loss": 1.5799, "learning_rate": 2.135329279335224e-06, "epoch": 0.9084220500529513, "percentage": 90.84, "elapsed_time": "1 day, 14:34:23", "remaining_time": "3:53:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16299, "total_steps": 17941, "loss": 1.5622, "learning_rate": 2.132755661798397e-06, "epoch": 0.9084777883061145, "percentage": 90.85, "elapsed_time": "1 day, 14:34:32", "remaining_time": "3:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16300, "total_steps": 17941, "loss": 1.6835, "learning_rate": 2.1301835623314836e-06, "epoch": 0.9085335265592777, "percentage": 90.85, "elapsed_time": "1 day, 14:34:40", "remaining_time": "3:53:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16301, "total_steps": 17941, "loss": 1.6256, "learning_rate": 2.127612981016036e-06, "epoch": 0.9085892648124407, "percentage": 90.86, "elapsed_time": "1 day, 14:34:49", "remaining_time": "3:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16302, "total_steps": 17941, "loss": 1.8222, "learning_rate": 2.1250439179335946e-06, "epoch": 0.9086450030656039, "percentage": 90.86, "elapsed_time": "1 day, 14:34:58", "remaining_time": "3:52:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16303, "total_steps": 17941, "loss": 1.7279, "learning_rate": 2.122476373165633e-06, "epoch": 0.9087007413187671, "percentage": 90.87, "elapsed_time": "1 day, 14:35:06", "remaining_time": "3:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16304, "total_steps": 17941, "loss": 1.6672, "learning_rate": 2.1199103467935744e-06, "epoch": 0.9087564795719302, "percentage": 90.88, "elapsed_time": "1 day, 14:35:15", "remaining_time": "3:52:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16305, "total_steps": 17941, "loss": 1.6559, "learning_rate": 2.117345838898793e-06, "epoch": 0.9088122178250934, "percentage": 90.88, "elapsed_time": "1 day, 14:35:23", "remaining_time": "3:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16306, "total_steps": 17941, "loss": 1.5189, "learning_rate": 2.1147828495626298e-06, "epoch": 0.9088679560782565, "percentage": 90.89, "elapsed_time": "1 day, 14:35:32", "remaining_time": "3:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16307, "total_steps": 17941, "loss": 1.6515, "learning_rate": 2.112221378866369e-06, "epoch": 0.9089236943314196, "percentage": 90.89, "elapsed_time": "1 day, 14:35:40", "remaining_time": "3:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16308, "total_steps": 17941, "loss": 1.6793, "learning_rate": 2.109661426891241e-06, "epoch": 0.9089794325845828, "percentage": 90.9, "elapsed_time": "1 day, 14:35:49", "remaining_time": "3:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16309, "total_steps": 17941, "loss": 1.6749, "learning_rate": 2.107102993718424e-06, "epoch": 0.909035170837746, "percentage": 90.9, "elapsed_time": "1 day, 14:35:57", "remaining_time": "3:51:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16310, "total_steps": 17941, "loss": 1.6496, "learning_rate": 2.1045460794290704e-06, "epoch": 0.9090909090909091, "percentage": 90.91, "elapsed_time": "1 day, 14:36:06", "remaining_time": "3:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16311, "total_steps": 17941, "loss": 1.6938, "learning_rate": 2.101990684104266e-06, "epoch": 0.9091466473440722, "percentage": 90.91, "elapsed_time": "1 day, 14:36:14", "remaining_time": "3:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16312, "total_steps": 17941, "loss": 1.7482, "learning_rate": 2.0994368078250503e-06, "epoch": 0.9092023855972354, "percentage": 90.92, "elapsed_time": "1 day, 14:36:23", "remaining_time": "3:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16313, "total_steps": 17941, "loss": 2.0318, "learning_rate": 2.0968844506724204e-06, "epoch": 0.9092581238503985, "percentage": 90.93, "elapsed_time": "1 day, 14:36:31", "remaining_time": "3:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16314, "total_steps": 17941, "loss": 1.63, "learning_rate": 2.094333612727317e-06, "epoch": 0.9093138621035617, "percentage": 90.93, "elapsed_time": "1 day, 14:36:40", "remaining_time": "3:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16315, "total_steps": 17941, "loss": 1.6674, "learning_rate": 2.091784294070653e-06, "epoch": 0.9093696003567249, "percentage": 90.94, "elapsed_time": "1 day, 14:36:48", "remaining_time": "3:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16316, "total_steps": 17941, "loss": 1.6477, "learning_rate": 2.0892364947832534e-06, "epoch": 0.909425338609888, "percentage": 90.94, "elapsed_time": "1 day, 14:36:57", "remaining_time": "3:50:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16317, "total_steps": 17941, "loss": 1.5441, "learning_rate": 2.0866902149459466e-06, "epoch": 0.9094810768630511, "percentage": 90.95, "elapsed_time": "1 day, 14:37:05", "remaining_time": "3:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16318, "total_steps": 17941, "loss": 1.527, "learning_rate": 2.0841454546394633e-06, "epoch": 0.9095368151162142, "percentage": 90.95, "elapsed_time": "1 day, 14:37:14", "remaining_time": "3:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16319, "total_steps": 17941, "loss": 1.7746, "learning_rate": 2.0816022139445167e-06, "epoch": 0.9095925533693774, "percentage": 90.96, "elapsed_time": "1 day, 14:37:23", "remaining_time": "3:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16320, "total_steps": 17941, "loss": 1.6312, "learning_rate": 2.07906049294177e-06, "epoch": 0.9096482916225406, "percentage": 90.96, "elapsed_time": "1 day, 14:37:32", "remaining_time": "3:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16321, "total_steps": 17941, "loss": 1.6555, "learning_rate": 2.0765202917118198e-06, "epoch": 0.9097040298757036, "percentage": 90.97, "elapsed_time": "1 day, 14:37:40", "remaining_time": "3:50:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16322, "total_steps": 17941, "loss": 1.4457, "learning_rate": 2.0739816103352404e-06, "epoch": 0.9097597681288668, "percentage": 90.98, "elapsed_time": "1 day, 14:37:49", "remaining_time": "3:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16323, "total_steps": 17941, "loss": 1.8818, "learning_rate": 2.071444448892529e-06, "epoch": 0.90981550638203, "percentage": 90.98, "elapsed_time": "1 day, 14:37:58", "remaining_time": "3:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16324, "total_steps": 17941, "loss": 1.6588, "learning_rate": 2.0689088074641593e-06, "epoch": 0.9098712446351931, "percentage": 90.99, "elapsed_time": "1 day, 14:38:06", "remaining_time": "3:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16325, "total_steps": 17941, "loss": 1.5367, "learning_rate": 2.0663746861305457e-06, "epoch": 0.9099269828883563, "percentage": 90.99, "elapsed_time": "1 day, 14:38:15", "remaining_time": "3:49:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16326, "total_steps": 17941, "loss": 1.5971, "learning_rate": 2.0638420849720565e-06, "epoch": 0.9099827211415195, "percentage": 91.0, "elapsed_time": "1 day, 14:38:23", "remaining_time": "3:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16327, "total_steps": 17941, "loss": 1.7707, "learning_rate": 2.061311004069e-06, "epoch": 0.9100384593946825, "percentage": 91.0, "elapsed_time": "1 day, 14:38:32", "remaining_time": "3:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16328, "total_steps": 17941, "loss": 1.7856, "learning_rate": 2.058781443501662e-06, "epoch": 0.9100941976478457, "percentage": 91.01, "elapsed_time": "1 day, 14:38:41", "remaining_time": "3:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16329, "total_steps": 17941, "loss": 1.4072, "learning_rate": 2.056253403350267e-06, "epoch": 0.9101499359010089, "percentage": 91.01, "elapsed_time": "1 day, 14:38:50", "remaining_time": "3:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16330, "total_steps": 17941, "loss": 1.6138, "learning_rate": 2.0537268836949784e-06, "epoch": 0.910205674154172, "percentage": 91.02, "elapsed_time": "1 day, 14:38:58", "remaining_time": "3:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16331, "total_steps": 17941, "loss": 1.7281, "learning_rate": 2.051201884615922e-06, "epoch": 0.9102614124073352, "percentage": 91.03, "elapsed_time": "1 day, 14:39:07", "remaining_time": "3:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16332, "total_steps": 17941, "loss": 1.8754, "learning_rate": 2.048678406193183e-06, "epoch": 0.9103171506604983, "percentage": 91.03, "elapsed_time": "1 day, 14:39:15", "remaining_time": "3:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16333, "total_steps": 17941, "loss": 1.6788, "learning_rate": 2.046156448506786e-06, "epoch": 0.9103728889136614, "percentage": 91.04, "elapsed_time": "1 day, 14:39:24", "remaining_time": "3:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16334, "total_steps": 17941, "loss": 1.5839, "learning_rate": 2.0436360116367236e-06, "epoch": 0.9104286271668246, "percentage": 91.04, "elapsed_time": "1 day, 14:39:32", "remaining_time": "3:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16335, "total_steps": 17941, "loss": 1.6303, "learning_rate": 2.0411170956629143e-06, "epoch": 0.9104843654199878, "percentage": 91.05, "elapsed_time": "1 day, 14:39:41", "remaining_time": "3:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16336, "total_steps": 17941, "loss": 1.6719, "learning_rate": 2.0385997006652614e-06, "epoch": 0.9105401036731509, "percentage": 91.05, "elapsed_time": "1 day, 14:39:49", "remaining_time": "3:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16337, "total_steps": 17941, "loss": 1.6495, "learning_rate": 2.0360838267235837e-06, "epoch": 0.910595841926314, "percentage": 91.06, "elapsed_time": "1 day, 14:39:58", "remaining_time": "3:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16338, "total_steps": 17941, "loss": 1.6592, "learning_rate": 2.0335694739176793e-06, "epoch": 0.9106515801794772, "percentage": 91.07, "elapsed_time": "1 day, 14:40:06", "remaining_time": "3:47:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16339, "total_steps": 17941, "loss": 1.6613, "learning_rate": 2.0310566423272893e-06, "epoch": 0.9107073184326403, "percentage": 91.07, "elapsed_time": "1 day, 14:40:15", "remaining_time": "3:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16340, "total_steps": 17941, "loss": 1.4194, "learning_rate": 2.0285453320321003e-06, "epoch": 0.9107630566858035, "percentage": 91.08, "elapsed_time": "1 day, 14:40:23", "remaining_time": "3:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16341, "total_steps": 17941, "loss": 1.4815, "learning_rate": 2.0260355431117707e-06, "epoch": 0.9108187949389666, "percentage": 91.08, "elapsed_time": "1 day, 14:40:32", "remaining_time": "3:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16342, "total_steps": 17941, "loss": 1.6783, "learning_rate": 2.02352727564587e-06, "epoch": 0.9108745331921297, "percentage": 91.09, "elapsed_time": "1 day, 14:40:40", "remaining_time": "3:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16343, "total_steps": 17941, "loss": 1.8243, "learning_rate": 2.0210205297139794e-06, "epoch": 0.9109302714452929, "percentage": 91.09, "elapsed_time": "1 day, 14:40:49", "remaining_time": "3:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16344, "total_steps": 17941, "loss": 1.6776, "learning_rate": 2.0185153053955684e-06, "epoch": 0.910986009698456, "percentage": 91.1, "elapsed_time": "1 day, 14:40:57", "remaining_time": "3:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16345, "total_steps": 17941, "loss": 1.8912, "learning_rate": 2.0160116027701014e-06, "epoch": 0.9110417479516192, "percentage": 91.1, "elapsed_time": "1 day, 14:41:06", "remaining_time": "3:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16346, "total_steps": 17941, "loss": 1.5518, "learning_rate": 2.0135094219169814e-06, "epoch": 0.9110974862047824, "percentage": 91.11, "elapsed_time": "1 day, 14:41:14", "remaining_time": "3:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16347, "total_steps": 17941, "loss": 1.623, "learning_rate": 2.0110087629155614e-06, "epoch": 0.9111532244579454, "percentage": 91.12, "elapsed_time": "1 day, 14:41:23", "remaining_time": "3:46:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16348, "total_steps": 17941, "loss": 1.4222, "learning_rate": 2.0085096258451563e-06, "epoch": 0.9112089627111086, "percentage": 91.12, "elapsed_time": "1 day, 14:41:31", "remaining_time": "3:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16349, "total_steps": 17941, "loss": 1.3592, "learning_rate": 2.0060120107850078e-06, "epoch": 0.9112647009642718, "percentage": 91.13, "elapsed_time": "1 day, 14:41:40", "remaining_time": "3:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16350, "total_steps": 17941, "loss": 1.4282, "learning_rate": 2.0035159178143358e-06, "epoch": 0.9113204392174349, "percentage": 91.13, "elapsed_time": "1 day, 14:41:48", "remaining_time": "3:45:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16351, "total_steps": 17941, "loss": 1.6585, "learning_rate": 2.0010213470123e-06, "epoch": 0.9113761774705981, "percentage": 91.14, "elapsed_time": "1 day, 14:41:57", "remaining_time": "3:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16352, "total_steps": 17941, "loss": 1.548, "learning_rate": 1.998528298458019e-06, "epoch": 0.9114319157237613, "percentage": 91.14, "elapsed_time": "1 day, 14:42:05", "remaining_time": "3:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16353, "total_steps": 17941, "loss": 1.5965, "learning_rate": 1.9960367722305416e-06, "epoch": 0.9114876539769243, "percentage": 91.15, "elapsed_time": "1 day, 14:42:14", "remaining_time": "3:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16354, "total_steps": 17941, "loss": 1.6278, "learning_rate": 1.993546768408899e-06, "epoch": 0.9115433922300875, "percentage": 91.15, "elapsed_time": "1 day, 14:42:22", "remaining_time": "3:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16355, "total_steps": 17941, "loss": 1.5308, "learning_rate": 1.9910582870720616e-06, "epoch": 0.9115991304832507, "percentage": 91.16, "elapsed_time": "1 day, 14:42:31", "remaining_time": "3:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16356, "total_steps": 17941, "loss": 1.7062, "learning_rate": 1.9885713282989383e-06, "epoch": 0.9116548687364138, "percentage": 91.17, "elapsed_time": "1 day, 14:42:39", "remaining_time": "3:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16357, "total_steps": 17941, "loss": 1.5839, "learning_rate": 1.98608589216841e-06, "epoch": 0.911710606989577, "percentage": 91.17, "elapsed_time": "1 day, 14:42:47", "remaining_time": "3:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16358, "total_steps": 17941, "loss": 1.5855, "learning_rate": 1.983601978759292e-06, "epoch": 0.9117663452427401, "percentage": 91.18, "elapsed_time": "1 day, 14:42:57", "remaining_time": "3:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16359, "total_steps": 17941, "loss": 1.5939, "learning_rate": 1.9811195881503707e-06, "epoch": 0.9118220834959032, "percentage": 91.18, "elapsed_time": "1 day, 14:43:05", "remaining_time": "3:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16360, "total_steps": 17941, "loss": 1.8301, "learning_rate": 1.978638720420356e-06, "epoch": 0.9118778217490664, "percentage": 91.19, "elapsed_time": "1 day, 14:43:14", "remaining_time": "3:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16361, "total_steps": 17941, "loss": 1.6721, "learning_rate": 1.976159375647946e-06, "epoch": 0.9119335600022296, "percentage": 91.19, "elapsed_time": "1 day, 14:43:23", "remaining_time": "3:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16362, "total_steps": 17941, "loss": 1.4492, "learning_rate": 1.973681553911766e-06, "epoch": 0.9119892982553927, "percentage": 91.2, "elapsed_time": "1 day, 14:43:31", "remaining_time": "3:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16363, "total_steps": 17941, "loss": 1.3443, "learning_rate": 1.971205255290387e-06, "epoch": 0.9120450365085558, "percentage": 91.2, "elapsed_time": "1 day, 14:43:40", "remaining_time": "3:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16364, "total_steps": 17941, "loss": 1.6671, "learning_rate": 1.9687304798623465e-06, "epoch": 0.9121007747617189, "percentage": 91.21, "elapsed_time": "1 day, 14:43:48", "remaining_time": "3:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16365, "total_steps": 17941, "loss": 1.8718, "learning_rate": 1.966257227706142e-06, "epoch": 0.9121565130148821, "percentage": 91.22, "elapsed_time": "1 day, 14:43:57", "remaining_time": "3:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16366, "total_steps": 17941, "loss": 1.8048, "learning_rate": 1.9637854989001947e-06, "epoch": 0.9122122512680453, "percentage": 91.22, "elapsed_time": "1 day, 14:44:06", "remaining_time": "3:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16367, "total_steps": 17941, "loss": 1.7361, "learning_rate": 1.9613152935229082e-06, "epoch": 0.9122679895212084, "percentage": 91.23, "elapsed_time": "1 day, 14:44:14", "remaining_time": "3:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16368, "total_steps": 17941, "loss": 1.5224, "learning_rate": 1.9588466116526092e-06, "epoch": 0.9123237277743715, "percentage": 91.23, "elapsed_time": "1 day, 14:44:23", "remaining_time": "3:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16369, "total_steps": 17941, "loss": 1.6835, "learning_rate": 1.9563794533676016e-06, "epoch": 0.9123794660275347, "percentage": 91.24, "elapsed_time": "1 day, 14:44:32", "remaining_time": "3:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16370, "total_steps": 17941, "loss": 1.5155, "learning_rate": 1.9539138187461225e-06, "epoch": 0.9124352042806978, "percentage": 91.24, "elapsed_time": "1 day, 14:44:40", "remaining_time": "3:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16371, "total_steps": 17941, "loss": 1.6996, "learning_rate": 1.9514497078663653e-06, "epoch": 0.912490942533861, "percentage": 91.25, "elapsed_time": "1 day, 14:44:49", "remaining_time": "3:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16372, "total_steps": 17941, "loss": 1.6456, "learning_rate": 1.9489871208064835e-06, "epoch": 0.9125466807870242, "percentage": 91.25, "elapsed_time": "1 day, 14:44:57", "remaining_time": "3:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16373, "total_steps": 17941, "loss": 1.8207, "learning_rate": 1.9465260576445708e-06, "epoch": 0.9126024190401872, "percentage": 91.26, "elapsed_time": "1 day, 14:45:06", "remaining_time": "3:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16374, "total_steps": 17941, "loss": 1.8296, "learning_rate": 1.944066518458687e-06, "epoch": 0.9126581572933504, "percentage": 91.27, "elapsed_time": "1 day, 14:45:14", "remaining_time": "3:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16375, "total_steps": 17941, "loss": 1.942, "learning_rate": 1.941608503326825e-06, "epoch": 0.9127138955465136, "percentage": 91.27, "elapsed_time": "1 day, 14:45:22", "remaining_time": "3:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16376, "total_steps": 17941, "loss": 1.792, "learning_rate": 1.939152012326939e-06, "epoch": 0.9127696337996767, "percentage": 91.28, "elapsed_time": "1 day, 14:45:31", "remaining_time": "3:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16377, "total_steps": 17941, "loss": 1.8032, "learning_rate": 1.936697045536934e-06, "epoch": 0.9128253720528399, "percentage": 91.28, "elapsed_time": "1 day, 14:45:40", "remaining_time": "3:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16378, "total_steps": 17941, "loss": 1.9287, "learning_rate": 1.93424360303468e-06, "epoch": 0.912881110306003, "percentage": 91.29, "elapsed_time": "1 day, 14:45:48", "remaining_time": "3:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16379, "total_steps": 17941, "loss": 1.8145, "learning_rate": 1.9317916848979657e-06, "epoch": 0.9129368485591661, "percentage": 91.29, "elapsed_time": "1 day, 14:45:56", "remaining_time": "3:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16380, "total_steps": 17941, "loss": 1.4588, "learning_rate": 1.929341291204567e-06, "epoch": 0.9129925868123293, "percentage": 91.3, "elapsed_time": "1 day, 14:46:05", "remaining_time": "3:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16381, "total_steps": 17941, "loss": 1.8245, "learning_rate": 1.926892422032195e-06, "epoch": 0.9130483250654925, "percentage": 91.3, "elapsed_time": "1 day, 14:46:13", "remaining_time": "3:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16382, "total_steps": 17941, "loss": 1.687, "learning_rate": 1.9244450774585033e-06, "epoch": 0.9131040633186556, "percentage": 91.31, "elapsed_time": "1 day, 14:46:22", "remaining_time": "3:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16383, "total_steps": 17941, "loss": 1.7481, "learning_rate": 1.9219992575611133e-06, "epoch": 0.9131598015718188, "percentage": 91.32, "elapsed_time": "1 day, 14:46:30", "remaining_time": "3:41:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16384, "total_steps": 17941, "loss": 1.7939, "learning_rate": 1.9195549624175967e-06, "epoch": 0.9132155398249819, "percentage": 91.32, "elapsed_time": "1 day, 14:46:39", "remaining_time": "3:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16385, "total_steps": 17941, "loss": 1.5386, "learning_rate": 1.9171121921054747e-06, "epoch": 0.913271278078145, "percentage": 91.33, "elapsed_time": "1 day, 14:46:47", "remaining_time": "3:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16386, "total_steps": 17941, "loss": 1.6413, "learning_rate": 1.914670946702196e-06, "epoch": 0.9133270163313082, "percentage": 91.33, "elapsed_time": "1 day, 14:46:56", "remaining_time": "3:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16387, "total_steps": 17941, "loss": 1.4792, "learning_rate": 1.912231226285205e-06, "epoch": 0.9133827545844713, "percentage": 91.34, "elapsed_time": "1 day, 14:47:04", "remaining_time": "3:40:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16388, "total_steps": 17941, "loss": 1.5589, "learning_rate": 1.9097930309318724e-06, "epoch": 0.9134384928376345, "percentage": 91.34, "elapsed_time": "1 day, 14:47:13", "remaining_time": "3:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16389, "total_steps": 17941, "loss": 1.4047, "learning_rate": 1.9073563607195145e-06, "epoch": 0.9134942310907976, "percentage": 91.35, "elapsed_time": "1 day, 14:47:21", "remaining_time": "3:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16390, "total_steps": 17941, "loss": 1.5307, "learning_rate": 1.9049212157254138e-06, "epoch": 0.9135499693439607, "percentage": 91.35, "elapsed_time": "1 day, 14:47:30", "remaining_time": "3:40:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16391, "total_steps": 17941, "loss": 1.6551, "learning_rate": 1.9024875960267975e-06, "epoch": 0.9136057075971239, "percentage": 91.36, "elapsed_time": "1 day, 14:47:39", "remaining_time": "3:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16392, "total_steps": 17941, "loss": 1.5454, "learning_rate": 1.900055501700848e-06, "epoch": 0.9136614458502871, "percentage": 91.37, "elapsed_time": "1 day, 14:47:47", "remaining_time": "3:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16393, "total_steps": 17941, "loss": 1.8315, "learning_rate": 1.8976249328247042e-06, "epoch": 0.9137171841034502, "percentage": 91.37, "elapsed_time": "1 day, 14:47:55", "remaining_time": "3:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16394, "total_steps": 17941, "loss": 1.6967, "learning_rate": 1.8951958894754264e-06, "epoch": 0.9137729223566133, "percentage": 91.38, "elapsed_time": "1 day, 14:48:05", "remaining_time": "3:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16395, "total_steps": 17941, "loss": 1.5542, "learning_rate": 1.892768371730075e-06, "epoch": 0.9138286606097765, "percentage": 91.38, "elapsed_time": "1 day, 14:48:13", "remaining_time": "3:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16396, "total_steps": 17941, "loss": 1.6167, "learning_rate": 1.8903423796656216e-06, "epoch": 0.9138843988629396, "percentage": 91.39, "elapsed_time": "1 day, 14:48:22", "remaining_time": "3:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16397, "total_steps": 17941, "loss": 1.5031, "learning_rate": 1.8879179133590107e-06, "epoch": 0.9139401371161028, "percentage": 91.39, "elapsed_time": "1 day, 14:48:30", "remaining_time": "3:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16398, "total_steps": 17941, "loss": 1.526, "learning_rate": 1.8854949728871308e-06, "epoch": 0.913995875369266, "percentage": 91.4, "elapsed_time": "1 day, 14:48:39", "remaining_time": "3:39:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16399, "total_steps": 17941, "loss": 1.5379, "learning_rate": 1.88307355832682e-06, "epoch": 0.914051613622429, "percentage": 91.41, "elapsed_time": "1 day, 14:48:48", "remaining_time": "3:38:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16400, "total_steps": 17941, "loss": 1.6934, "learning_rate": 1.8806536697548838e-06, "epoch": 0.9141073518755922, "percentage": 91.41, "elapsed_time": "1 day, 14:48:57", "remaining_time": "3:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16401, "total_steps": 17941, "loss": 1.601, "learning_rate": 1.878235307248044e-06, "epoch": 0.9141630901287554, "percentage": 91.42, "elapsed_time": "1 day, 14:49:05", "remaining_time": "3:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16402, "total_steps": 17941, "loss": 1.4037, "learning_rate": 1.875818470883023e-06, "epoch": 0.9142188283819185, "percentage": 91.42, "elapsed_time": "1 day, 14:49:14", "remaining_time": "3:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16403, "total_steps": 17941, "loss": 1.5897, "learning_rate": 1.8734031607364532e-06, "epoch": 0.9142745666350817, "percentage": 91.43, "elapsed_time": "1 day, 14:49:23", "remaining_time": "3:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16404, "total_steps": 17941, "loss": 1.5717, "learning_rate": 1.8709893768849406e-06, "epoch": 0.9143303048882448, "percentage": 91.43, "elapsed_time": "1 day, 14:49:31", "remaining_time": "3:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16405, "total_steps": 17941, "loss": 1.4539, "learning_rate": 1.868577119405024e-06, "epoch": 0.9143860431414079, "percentage": 91.44, "elapsed_time": "1 day, 14:49:40", "remaining_time": "3:38:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16406, "total_steps": 17941, "loss": 1.5421, "learning_rate": 1.8661663883732195e-06, "epoch": 0.9144417813945711, "percentage": 91.44, "elapsed_time": "1 day, 14:49:48", "remaining_time": "3:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16407, "total_steps": 17941, "loss": 1.1721, "learning_rate": 1.8637571838659828e-06, "epoch": 0.9144975196477343, "percentage": 91.45, "elapsed_time": "1 day, 14:49:57", "remaining_time": "3:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16408, "total_steps": 17941, "loss": 1.6126, "learning_rate": 1.8613495059597086e-06, "epoch": 0.9145532579008974, "percentage": 91.46, "elapsed_time": "1 day, 14:50:05", "remaining_time": "3:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16409, "total_steps": 17941, "loss": 1.7637, "learning_rate": 1.8589433547307633e-06, "epoch": 0.9146089961540605, "percentage": 91.46, "elapsed_time": "1 day, 14:50:14", "remaining_time": "3:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16410, "total_steps": 17941, "loss": 1.7126, "learning_rate": 1.8565387302554527e-06, "epoch": 0.9146647344072236, "percentage": 91.47, "elapsed_time": "1 day, 14:50:23", "remaining_time": "3:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16411, "total_steps": 17941, "loss": 1.4304, "learning_rate": 1.8541356326100433e-06, "epoch": 0.9147204726603868, "percentage": 91.47, "elapsed_time": "1 day, 14:50:31", "remaining_time": "3:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16412, "total_steps": 17941, "loss": 1.2973, "learning_rate": 1.8517340618707247e-06, "epoch": 0.91477621091355, "percentage": 91.48, "elapsed_time": "1 day, 14:50:40", "remaining_time": "3:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16413, "total_steps": 17941, "loss": 1.5642, "learning_rate": 1.8493340181136908e-06, "epoch": 0.9148319491667131, "percentage": 91.48, "elapsed_time": "1 day, 14:50:48", "remaining_time": "3:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16414, "total_steps": 17941, "loss": 1.6875, "learning_rate": 1.846935501415048e-06, "epoch": 0.9148876874198762, "percentage": 91.49, "elapsed_time": "1 day, 14:50:57", "remaining_time": "3:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16415, "total_steps": 17941, "loss": 1.6338, "learning_rate": 1.8445385118508517e-06, "epoch": 0.9149434256730394, "percentage": 91.49, "elapsed_time": "1 day, 14:51:05", "remaining_time": "3:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16416, "total_steps": 17941, "loss": 1.6241, "learning_rate": 1.8421430494971248e-06, "epoch": 0.9149991639262025, "percentage": 91.5, "elapsed_time": "1 day, 14:51:14", "remaining_time": "3:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16417, "total_steps": 17941, "loss": 1.7354, "learning_rate": 1.839749114429845e-06, "epoch": 0.9150549021793657, "percentage": 91.51, "elapsed_time": "1 day, 14:51:22", "remaining_time": "3:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16418, "total_steps": 17941, "loss": 1.7374, "learning_rate": 1.8373567067249298e-06, "epoch": 0.9151106404325289, "percentage": 91.51, "elapsed_time": "1 day, 14:51:31", "remaining_time": "3:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16419, "total_steps": 17941, "loss": 1.7834, "learning_rate": 1.834965826458257e-06, "epoch": 0.915166378685692, "percentage": 91.52, "elapsed_time": "1 day, 14:51:39", "remaining_time": "3:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16420, "total_steps": 17941, "loss": 1.8441, "learning_rate": 1.8325764737056328e-06, "epoch": 0.9152221169388551, "percentage": 91.52, "elapsed_time": "1 day, 14:51:47", "remaining_time": "3:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16421, "total_steps": 17941, "loss": 1.5443, "learning_rate": 1.8301886485428632e-06, "epoch": 0.9152778551920183, "percentage": 91.53, "elapsed_time": "1 day, 14:51:56", "remaining_time": "3:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16422, "total_steps": 17941, "loss": 1.3697, "learning_rate": 1.8278023510456543e-06, "epoch": 0.9153335934451814, "percentage": 91.53, "elapsed_time": "1 day, 14:52:04", "remaining_time": "3:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16423, "total_steps": 17941, "loss": 1.6132, "learning_rate": 1.82541758128969e-06, "epoch": 0.9153893316983446, "percentage": 91.54, "elapsed_time": "1 day, 14:52:13", "remaining_time": "3:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16424, "total_steps": 17941, "loss": 1.7383, "learning_rate": 1.823034339350599e-06, "epoch": 0.9154450699515078, "percentage": 91.54, "elapsed_time": "1 day, 14:52:21", "remaining_time": "3:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16425, "total_steps": 17941, "loss": 1.5158, "learning_rate": 1.8206526253039702e-06, "epoch": 0.9155008082046708, "percentage": 91.55, "elapsed_time": "1 day, 14:52:30", "remaining_time": "3:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16426, "total_steps": 17941, "loss": 1.5575, "learning_rate": 1.8182724392253437e-06, "epoch": 0.915556546457834, "percentage": 91.56, "elapsed_time": "1 day, 14:52:38", "remaining_time": "3:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16427, "total_steps": 17941, "loss": 1.8494, "learning_rate": 1.815893781190181e-06, "epoch": 0.9156122847109972, "percentage": 91.56, "elapsed_time": "1 day, 14:52:47", "remaining_time": "3:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16428, "total_steps": 17941, "loss": 1.489, "learning_rate": 1.81351665127395e-06, "epoch": 0.9156680229641603, "percentage": 91.57, "elapsed_time": "1 day, 14:52:56", "remaining_time": "3:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16429, "total_steps": 17941, "loss": 1.5362, "learning_rate": 1.811141049552012e-06, "epoch": 0.9157237612173235, "percentage": 91.57, "elapsed_time": "1 day, 14:53:04", "remaining_time": "3:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16430, "total_steps": 17941, "loss": 1.6659, "learning_rate": 1.8087669760997295e-06, "epoch": 0.9157794994704866, "percentage": 91.58, "elapsed_time": "1 day, 14:53:13", "remaining_time": "3:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16431, "total_steps": 17941, "loss": 1.6386, "learning_rate": 1.8063944309923752e-06, "epoch": 0.9158352377236497, "percentage": 91.58, "elapsed_time": "1 day, 14:53:21", "remaining_time": "3:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16432, "total_steps": 17941, "loss": 1.6515, "learning_rate": 1.804023414305206e-06, "epoch": 0.9158909759768129, "percentage": 91.59, "elapsed_time": "1 day, 14:53:31", "remaining_time": "3:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16433, "total_steps": 17941, "loss": 1.4344, "learning_rate": 1.8016539261134113e-06, "epoch": 0.915946714229976, "percentage": 91.59, "elapsed_time": "1 day, 14:53:39", "remaining_time": "3:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16434, "total_steps": 17941, "loss": 1.5954, "learning_rate": 1.7992859664921424e-06, "epoch": 0.9160024524831392, "percentage": 91.6, "elapsed_time": "1 day, 14:53:47", "remaining_time": "3:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16435, "total_steps": 17941, "loss": 1.7711, "learning_rate": 1.7969195355164836e-06, "epoch": 0.9160581907363023, "percentage": 91.61, "elapsed_time": "1 day, 14:53:56", "remaining_time": "3:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16436, "total_steps": 17941, "loss": 1.635, "learning_rate": 1.794554633261497e-06, "epoch": 0.9161139289894654, "percentage": 91.61, "elapsed_time": "1 day, 14:54:04", "remaining_time": "3:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16437, "total_steps": 17941, "loss": 1.8298, "learning_rate": 1.7921912598021895e-06, "epoch": 0.9161696672426286, "percentage": 91.62, "elapsed_time": "1 day, 14:54:13", "remaining_time": "3:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16438, "total_steps": 17941, "loss": 1.511, "learning_rate": 1.7898294152134899e-06, "epoch": 0.9162254054957918, "percentage": 91.62, "elapsed_time": "1 day, 14:54:21", "remaining_time": "3:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16439, "total_steps": 17941, "loss": 1.6774, "learning_rate": 1.7874690995703213e-06, "epoch": 0.9162811437489549, "percentage": 91.63, "elapsed_time": "1 day, 14:54:30", "remaining_time": "3:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16440, "total_steps": 17941, "loss": 1.6264, "learning_rate": 1.785110312947541e-06, "epoch": 0.916336882002118, "percentage": 91.63, "elapsed_time": "1 day, 14:54:38", "remaining_time": "3:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16441, "total_steps": 17941, "loss": 1.5843, "learning_rate": 1.7827530554199445e-06, "epoch": 0.9163926202552812, "percentage": 91.64, "elapsed_time": "1 day, 14:54:47", "remaining_time": "3:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16442, "total_steps": 17941, "loss": 1.5035, "learning_rate": 1.7803973270622943e-06, "epoch": 0.9164483585084443, "percentage": 91.64, "elapsed_time": "1 day, 14:54:55", "remaining_time": "3:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16443, "total_steps": 17941, "loss": 1.6238, "learning_rate": 1.7780431279493027e-06, "epoch": 0.9165040967616075, "percentage": 91.65, "elapsed_time": "1 day, 14:55:04", "remaining_time": "3:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16444, "total_steps": 17941, "loss": 1.5588, "learning_rate": 1.7756904581556265e-06, "epoch": 0.9165598350147707, "percentage": 91.66, "elapsed_time": "1 day, 14:55:13", "remaining_time": "3:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16445, "total_steps": 17941, "loss": 1.6715, "learning_rate": 1.77333931775589e-06, "epoch": 0.9166155732679337, "percentage": 91.66, "elapsed_time": "1 day, 14:55:21", "remaining_time": "3:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16446, "total_steps": 17941, "loss": 1.626, "learning_rate": 1.7709897068246385e-06, "epoch": 0.9166713115210969, "percentage": 91.67, "elapsed_time": "1 day, 14:55:30", "remaining_time": "3:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16447, "total_steps": 17941, "loss": 1.622, "learning_rate": 1.7686416254364068e-06, "epoch": 0.9167270497742601, "percentage": 91.67, "elapsed_time": "1 day, 14:55:38", "remaining_time": "3:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16448, "total_steps": 17941, "loss": 1.5325, "learning_rate": 1.7662950736656524e-06, "epoch": 0.9167827880274232, "percentage": 91.68, "elapsed_time": "1 day, 14:55:47", "remaining_time": "3:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16449, "total_steps": 17941, "loss": 1.6706, "learning_rate": 1.7639500515867934e-06, "epoch": 0.9168385262805864, "percentage": 91.68, "elapsed_time": "1 day, 14:55:55", "remaining_time": "3:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16450, "total_steps": 17941, "loss": 1.4834, "learning_rate": 1.7616065592742038e-06, "epoch": 0.9168942645337496, "percentage": 91.69, "elapsed_time": "1 day, 14:56:04", "remaining_time": "3:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16451, "total_steps": 17941, "loss": 1.5534, "learning_rate": 1.7592645968022015e-06, "epoch": 0.9169500027869126, "percentage": 91.7, "elapsed_time": "1 day, 14:56:12", "remaining_time": "3:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16452, "total_steps": 17941, "loss": 1.5757, "learning_rate": 1.7569241642450774e-06, "epoch": 0.9170057410400758, "percentage": 91.7, "elapsed_time": "1 day, 14:56:21", "remaining_time": "3:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16453, "total_steps": 17941, "loss": 1.7064, "learning_rate": 1.754585261677022e-06, "epoch": 0.917061479293239, "percentage": 91.71, "elapsed_time": "1 day, 14:56:29", "remaining_time": "3:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16454, "total_steps": 17941, "loss": 1.5926, "learning_rate": 1.7522478891722483e-06, "epoch": 0.9171172175464021, "percentage": 91.71, "elapsed_time": "1 day, 14:56:38", "remaining_time": "3:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16455, "total_steps": 17941, "loss": 1.6621, "learning_rate": 1.7499120468048635e-06, "epoch": 0.9171729557995653, "percentage": 91.72, "elapsed_time": "1 day, 14:56:46", "remaining_time": "3:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16456, "total_steps": 17941, "loss": 1.6868, "learning_rate": 1.747577734648953e-06, "epoch": 0.9172286940527283, "percentage": 91.72, "elapsed_time": "1 day, 14:56:55", "remaining_time": "3:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16457, "total_steps": 17941, "loss": 1.5867, "learning_rate": 1.7452449527785353e-06, "epoch": 0.9172844323058915, "percentage": 91.73, "elapsed_time": "1 day, 14:57:03", "remaining_time": "3:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16458, "total_steps": 17941, "loss": 1.7146, "learning_rate": 1.7429137012676066e-06, "epoch": 0.9173401705590547, "percentage": 91.73, "elapsed_time": "1 day, 14:57:12", "remaining_time": "3:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16459, "total_steps": 17941, "loss": 1.5809, "learning_rate": 1.7405839801901026e-06, "epoch": 0.9173959088122178, "percentage": 91.74, "elapsed_time": "1 day, 14:57:20", "remaining_time": "3:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16460, "total_steps": 17941, "loss": 1.6357, "learning_rate": 1.7382557896199025e-06, "epoch": 0.917451647065381, "percentage": 91.75, "elapsed_time": "1 day, 14:57:29", "remaining_time": "3:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16461, "total_steps": 17941, "loss": 1.522, "learning_rate": 1.7359291296308365e-06, "epoch": 0.9175073853185441, "percentage": 91.75, "elapsed_time": "1 day, 14:57:37", "remaining_time": "3:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16462, "total_steps": 17941, "loss": 1.5754, "learning_rate": 1.7336040002967069e-06, "epoch": 0.9175631235717072, "percentage": 91.76, "elapsed_time": "1 day, 14:57:46", "remaining_time": "3:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16463, "total_steps": 17941, "loss": 1.514, "learning_rate": 1.7312804016912433e-06, "epoch": 0.9176188618248704, "percentage": 91.76, "elapsed_time": "1 day, 14:57:54", "remaining_time": "3:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16464, "total_steps": 17941, "loss": 1.7679, "learning_rate": 1.7289583338881365e-06, "epoch": 0.9176746000780336, "percentage": 91.77, "elapsed_time": "1 day, 14:58:03", "remaining_time": "3:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16465, "total_steps": 17941, "loss": 1.8285, "learning_rate": 1.7266377969610281e-06, "epoch": 0.9177303383311967, "percentage": 91.77, "elapsed_time": "1 day, 14:58:12", "remaining_time": "3:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16466, "total_steps": 17941, "loss": 1.6595, "learning_rate": 1.7243187909835257e-06, "epoch": 0.9177860765843598, "percentage": 91.78, "elapsed_time": "1 day, 14:58:20", "remaining_time": "3:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16467, "total_steps": 17941, "loss": 1.5281, "learning_rate": 1.7220013160291592e-06, "epoch": 0.917841814837523, "percentage": 91.78, "elapsed_time": "1 day, 14:58:29", "remaining_time": "3:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16468, "total_steps": 17941, "loss": 1.677, "learning_rate": 1.7196853721714313e-06, "epoch": 0.9178975530906861, "percentage": 91.79, "elapsed_time": "1 day, 14:58:37", "remaining_time": "3:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16469, "total_steps": 17941, "loss": 1.8137, "learning_rate": 1.7173709594837884e-06, "epoch": 0.9179532913438493, "percentage": 91.8, "elapsed_time": "1 day, 14:58:46", "remaining_time": "3:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16470, "total_steps": 17941, "loss": 1.6009, "learning_rate": 1.7150580780396387e-06, "epoch": 0.9180090295970125, "percentage": 91.8, "elapsed_time": "1 day, 14:58:54", "remaining_time": "3:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16471, "total_steps": 17941, "loss": 1.7379, "learning_rate": 1.7127467279123232e-06, "epoch": 0.9180647678501755, "percentage": 91.81, "elapsed_time": "1 day, 14:59:03", "remaining_time": "3:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16472, "total_steps": 17941, "loss": 1.5403, "learning_rate": 1.7104369091751337e-06, "epoch": 0.9181205061033387, "percentage": 91.81, "elapsed_time": "1 day, 14:59:11", "remaining_time": "3:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16473, "total_steps": 17941, "loss": 1.5477, "learning_rate": 1.7081286219013559e-06, "epoch": 0.9181762443565019, "percentage": 91.82, "elapsed_time": "1 day, 14:59:20", "remaining_time": "3:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16474, "total_steps": 17941, "loss": 1.5801, "learning_rate": 1.7058218661641645e-06, "epoch": 0.918231982609665, "percentage": 91.82, "elapsed_time": "1 day, 14:59:28", "remaining_time": "3:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16475, "total_steps": 17941, "loss": 1.6562, "learning_rate": 1.7035166420367344e-06, "epoch": 0.9182877208628282, "percentage": 91.83, "elapsed_time": "1 day, 14:59:37", "remaining_time": "3:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16476, "total_steps": 17941, "loss": 1.5919, "learning_rate": 1.7012129495921681e-06, "epoch": 0.9183434591159914, "percentage": 91.83, "elapsed_time": "1 day, 14:59:45", "remaining_time": "3:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16477, "total_steps": 17941, "loss": 1.6926, "learning_rate": 1.6989107889035238e-06, "epoch": 0.9183991973691544, "percentage": 91.84, "elapsed_time": "1 day, 14:59:54", "remaining_time": "3:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16478, "total_steps": 17941, "loss": 1.6333, "learning_rate": 1.696610160043821e-06, "epoch": 0.9184549356223176, "percentage": 91.85, "elapsed_time": "1 day, 15:00:02", "remaining_time": "3:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16479, "total_steps": 17941, "loss": 1.6626, "learning_rate": 1.6943110630860016e-06, "epoch": 0.9185106738754807, "percentage": 91.85, "elapsed_time": "1 day, 15:00:11", "remaining_time": "3:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16480, "total_steps": 17941, "loss": 1.6502, "learning_rate": 1.6920134981030122e-06, "epoch": 0.9185664121286439, "percentage": 91.86, "elapsed_time": "1 day, 15:00:19", "remaining_time": "3:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16481, "total_steps": 17941, "loss": 1.6908, "learning_rate": 1.6897174651676895e-06, "epoch": 0.9186221503818071, "percentage": 91.86, "elapsed_time": "1 day, 15:00:27", "remaining_time": "3:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16482, "total_steps": 17941, "loss": 1.7559, "learning_rate": 1.6874229643528583e-06, "epoch": 0.9186778886349701, "percentage": 91.87, "elapsed_time": "1 day, 15:00:37", "remaining_time": "3:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16483, "total_steps": 17941, "loss": 1.8367, "learning_rate": 1.6851299957312883e-06, "epoch": 0.9187336268881333, "percentage": 91.87, "elapsed_time": "1 day, 15:00:45", "remaining_time": "3:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16484, "total_steps": 17941, "loss": 1.6753, "learning_rate": 1.6828385593757047e-06, "epoch": 0.9187893651412965, "percentage": 91.88, "elapsed_time": "1 day, 15:00:54", "remaining_time": "3:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16485, "total_steps": 17941, "loss": 1.713, "learning_rate": 1.6805486553587712e-06, "epoch": 0.9188451033944596, "percentage": 91.88, "elapsed_time": "1 day, 15:01:02", "remaining_time": "3:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16486, "total_steps": 17941, "loss": 1.6826, "learning_rate": 1.6782602837531136e-06, "epoch": 0.9189008416476228, "percentage": 91.89, "elapsed_time": "1 day, 15:01:11", "remaining_time": "3:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16487, "total_steps": 17941, "loss": 1.5478, "learning_rate": 1.6759734446313014e-06, "epoch": 0.9189565799007859, "percentage": 91.9, "elapsed_time": "1 day, 15:01:19", "remaining_time": "3:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16488, "total_steps": 17941, "loss": 1.6034, "learning_rate": 1.6736881380658654e-06, "epoch": 0.919012318153949, "percentage": 91.9, "elapsed_time": "1 day, 15:01:28", "remaining_time": "3:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16489, "total_steps": 17941, "loss": 1.4609, "learning_rate": 1.6714043641292864e-06, "epoch": 0.9190680564071122, "percentage": 91.91, "elapsed_time": "1 day, 15:01:36", "remaining_time": "3:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16490, "total_steps": 17941, "loss": 1.3554, "learning_rate": 1.669122122893968e-06, "epoch": 0.9191237946602754, "percentage": 91.91, "elapsed_time": "1 day, 15:01:45", "remaining_time": "3:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16491, "total_steps": 17941, "loss": 1.4837, "learning_rate": 1.6668414144323186e-06, "epoch": 0.9191795329134385, "percentage": 91.92, "elapsed_time": "1 day, 15:01:53", "remaining_time": "3:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16492, "total_steps": 17941, "loss": 1.7913, "learning_rate": 1.6645622388166638e-06, "epoch": 0.9192352711666016, "percentage": 91.92, "elapsed_time": "1 day, 15:02:02", "remaining_time": "3:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16493, "total_steps": 17941, "loss": 1.9116, "learning_rate": 1.662284596119268e-06, "epoch": 0.9192910094197648, "percentage": 91.93, "elapsed_time": "1 day, 15:02:10", "remaining_time": "3:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16494, "total_steps": 17941, "loss": 1.6278, "learning_rate": 1.660008486412379e-06, "epoch": 0.9193467476729279, "percentage": 91.93, "elapsed_time": "1 day, 15:02:19", "remaining_time": "3:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16495, "total_steps": 17941, "loss": 1.4077, "learning_rate": 1.6577339097681832e-06, "epoch": 0.9194024859260911, "percentage": 91.94, "elapsed_time": "1 day, 15:02:27", "remaining_time": "3:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16496, "total_steps": 17941, "loss": 1.4824, "learning_rate": 1.655460866258818e-06, "epoch": 0.9194582241792543, "percentage": 91.95, "elapsed_time": "1 day, 15:02:36", "remaining_time": "3:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16497, "total_steps": 17941, "loss": 1.6222, "learning_rate": 1.6531893559563526e-06, "epoch": 0.9195139624324173, "percentage": 91.95, "elapsed_time": "1 day, 15:02:44", "remaining_time": "3:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16498, "total_steps": 17941, "loss": 1.6781, "learning_rate": 1.6509193789328413e-06, "epoch": 0.9195697006855805, "percentage": 91.96, "elapsed_time": "1 day, 15:02:53", "remaining_time": "3:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16499, "total_steps": 17941, "loss": 1.4755, "learning_rate": 1.648650935260282e-06, "epoch": 0.9196254389387437, "percentage": 91.96, "elapsed_time": "1 day, 15:03:01", "remaining_time": "3:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16500, "total_steps": 17941, "loss": 1.755, "learning_rate": 1.6463840250106e-06, "epoch": 0.9196811771919068, "percentage": 91.97, "elapsed_time": "1 day, 15:03:10", "remaining_time": "3:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16501, "total_steps": 17941, "loss": 1.5966, "learning_rate": 1.644118648255699e-06, "epoch": 0.91973691544507, "percentage": 91.97, "elapsed_time": "1 day, 15:03:18", "remaining_time": "3:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16502, "total_steps": 17941, "loss": 1.5313, "learning_rate": 1.6418548050674166e-06, "epoch": 0.919792653698233, "percentage": 91.98, "elapsed_time": "1 day, 15:03:27", "remaining_time": "3:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16503, "total_steps": 17941, "loss": 1.9343, "learning_rate": 1.6395924955175502e-06, "epoch": 0.9198483919513962, "percentage": 91.98, "elapsed_time": "1 day, 15:03:35", "remaining_time": "3:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16504, "total_steps": 17941, "loss": 1.7741, "learning_rate": 1.6373317196778592e-06, "epoch": 0.9199041302045594, "percentage": 91.99, "elapsed_time": "1 day, 15:03:43", "remaining_time": "3:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16505, "total_steps": 17941, "loss": 1.8046, "learning_rate": 1.6350724776200199e-06, "epoch": 0.9199598684577225, "percentage": 92.0, "elapsed_time": "1 day, 15:03:52", "remaining_time": "3:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16506, "total_steps": 17941, "loss": 1.8731, "learning_rate": 1.632814769415708e-06, "epoch": 0.9200156067108857, "percentage": 92.0, "elapsed_time": "1 day, 15:04:00", "remaining_time": "3:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16507, "total_steps": 17941, "loss": 1.7025, "learning_rate": 1.6305585951365e-06, "epoch": 0.9200713449640489, "percentage": 92.01, "elapsed_time": "1 day, 15:04:09", "remaining_time": "3:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16508, "total_steps": 17941, "loss": 1.7016, "learning_rate": 1.6283039548539658e-06, "epoch": 0.9201270832172119, "percentage": 92.01, "elapsed_time": "1 day, 15:04:17", "remaining_time": "3:23:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16509, "total_steps": 17941, "loss": 2.1694, "learning_rate": 1.6260508486395986e-06, "epoch": 0.9201828214703751, "percentage": 92.02, "elapsed_time": "1 day, 15:04:26", "remaining_time": "3:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16510, "total_steps": 17941, "loss": 1.526, "learning_rate": 1.6237992765648636e-06, "epoch": 0.9202385597235383, "percentage": 92.02, "elapsed_time": "1 day, 15:04:34", "remaining_time": "3:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16511, "total_steps": 17941, "loss": 1.6928, "learning_rate": 1.6215492387011643e-06, "epoch": 0.9202942979767014, "percentage": 92.03, "elapsed_time": "1 day, 15:04:43", "remaining_time": "3:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16512, "total_steps": 17941, "loss": 1.4855, "learning_rate": 1.6193007351198553e-06, "epoch": 0.9203500362298646, "percentage": 92.04, "elapsed_time": "1 day, 15:04:51", "remaining_time": "3:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16513, "total_steps": 17941, "loss": 1.5693, "learning_rate": 1.6170537658922457e-06, "epoch": 0.9204057744830277, "percentage": 92.04, "elapsed_time": "1 day, 15:05:00", "remaining_time": "3:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16514, "total_steps": 17941, "loss": 1.9811, "learning_rate": 1.6148083310895956e-06, "epoch": 0.9204615127361908, "percentage": 92.05, "elapsed_time": "1 day, 15:05:08", "remaining_time": "3:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16515, "total_steps": 17941, "loss": 1.7147, "learning_rate": 1.612564430783131e-06, "epoch": 0.920517250989354, "percentage": 92.05, "elapsed_time": "1 day, 15:05:17", "remaining_time": "3:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16516, "total_steps": 17941, "loss": 1.5628, "learning_rate": 1.6103220650439898e-06, "epoch": 0.9205729892425172, "percentage": 92.06, "elapsed_time": "1 day, 15:05:25", "remaining_time": "3:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16517, "total_steps": 17941, "loss": 1.6205, "learning_rate": 1.6080812339433094e-06, "epoch": 0.9206287274956803, "percentage": 92.06, "elapsed_time": "1 day, 15:05:34", "remaining_time": "3:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16518, "total_steps": 17941, "loss": 1.6176, "learning_rate": 1.6058419375521494e-06, "epoch": 0.9206844657488434, "percentage": 92.07, "elapsed_time": "1 day, 15:05:42", "remaining_time": "3:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16519, "total_steps": 17941, "loss": 1.7232, "learning_rate": 1.6036041759415254e-06, "epoch": 0.9207402040020066, "percentage": 92.07, "elapsed_time": "1 day, 15:05:50", "remaining_time": "3:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16520, "total_steps": 17941, "loss": 1.4445, "learning_rate": 1.601367949182403e-06, "epoch": 0.9207959422551697, "percentage": 92.08, "elapsed_time": "1 day, 15:05:59", "remaining_time": "3:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16521, "total_steps": 17941, "loss": 1.4912, "learning_rate": 1.599133257345703e-06, "epoch": 0.9208516805083329, "percentage": 92.09, "elapsed_time": "1 day, 15:06:07", "remaining_time": "3:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16522, "total_steps": 17941, "loss": 1.5366, "learning_rate": 1.5969001005023077e-06, "epoch": 0.9209074187614961, "percentage": 92.09, "elapsed_time": "1 day, 15:06:16", "remaining_time": "3:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16523, "total_steps": 17941, "loss": 1.7946, "learning_rate": 1.594668478723027e-06, "epoch": 0.9209631570146591, "percentage": 92.1, "elapsed_time": "1 day, 15:06:24", "remaining_time": "3:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16524, "total_steps": 17941, "loss": 1.5214, "learning_rate": 1.5924383920786323e-06, "epoch": 0.9210188952678223, "percentage": 92.1, "elapsed_time": "1 day, 15:06:33", "remaining_time": "3:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16525, "total_steps": 17941, "loss": 1.8999, "learning_rate": 1.5902098406398724e-06, "epoch": 0.9210746335209854, "percentage": 92.11, "elapsed_time": "1 day, 15:06:41", "remaining_time": "3:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16526, "total_steps": 17941, "loss": 1.3326, "learning_rate": 1.5879828244773965e-06, "epoch": 0.9211303717741486, "percentage": 92.11, "elapsed_time": "1 day, 15:06:50", "remaining_time": "3:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16527, "total_steps": 17941, "loss": 1.6633, "learning_rate": 1.585757343661848e-06, "epoch": 0.9211861100273118, "percentage": 92.12, "elapsed_time": "1 day, 15:06:58", "remaining_time": "3:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16528, "total_steps": 17941, "loss": 1.6892, "learning_rate": 1.5835333982637978e-06, "epoch": 0.9212418482804748, "percentage": 92.12, "elapsed_time": "1 day, 15:07:07", "remaining_time": "3:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16529, "total_steps": 17941, "loss": 1.4578, "learning_rate": 1.581310988353779e-06, "epoch": 0.921297586533638, "percentage": 92.13, "elapsed_time": "1 day, 15:07:15", "remaining_time": "3:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16530, "total_steps": 17941, "loss": 1.7048, "learning_rate": 1.579090114002285e-06, "epoch": 0.9213533247868012, "percentage": 92.14, "elapsed_time": "1 day, 15:07:24", "remaining_time": "3:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16531, "total_steps": 17941, "loss": 1.724, "learning_rate": 1.5768707752797263e-06, "epoch": 0.9214090630399643, "percentage": 92.14, "elapsed_time": "1 day, 15:07:32", "remaining_time": "3:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16532, "total_steps": 17941, "loss": 1.8385, "learning_rate": 1.574652972256513e-06, "epoch": 0.9214648012931275, "percentage": 92.15, "elapsed_time": "1 day, 15:07:41", "remaining_time": "3:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16533, "total_steps": 17941, "loss": 1.5621, "learning_rate": 1.5724367050029608e-06, "epoch": 0.9215205395462907, "percentage": 92.15, "elapsed_time": "1 day, 15:07:49", "remaining_time": "3:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16534, "total_steps": 17941, "loss": 1.5684, "learning_rate": 1.5702219735893643e-06, "epoch": 0.9215762777994537, "percentage": 92.16, "elapsed_time": "1 day, 15:07:58", "remaining_time": "3:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16535, "total_steps": 17941, "loss": 1.8214, "learning_rate": 1.5680087780859609e-06, "epoch": 0.9216320160526169, "percentage": 92.16, "elapsed_time": "1 day, 15:08:06", "remaining_time": "3:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16536, "total_steps": 17941, "loss": 1.4727, "learning_rate": 1.565797118562945e-06, "epoch": 0.9216877543057801, "percentage": 92.17, "elapsed_time": "1 day, 15:08:15", "remaining_time": "3:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16537, "total_steps": 17941, "loss": 1.8936, "learning_rate": 1.5635869950904547e-06, "epoch": 0.9217434925589432, "percentage": 92.17, "elapsed_time": "1 day, 15:08:23", "remaining_time": "3:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16538, "total_steps": 17941, "loss": 1.7389, "learning_rate": 1.5613784077385785e-06, "epoch": 0.9217992308121064, "percentage": 92.18, "elapsed_time": "1 day, 15:08:32", "remaining_time": "3:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16539, "total_steps": 17941, "loss": 1.902, "learning_rate": 1.5591713565773602e-06, "epoch": 0.9218549690652695, "percentage": 92.19, "elapsed_time": "1 day, 15:08:40", "remaining_time": "3:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16540, "total_steps": 17941, "loss": 1.8112, "learning_rate": 1.556965841676794e-06, "epoch": 0.9219107073184326, "percentage": 92.19, "elapsed_time": "1 day, 15:08:49", "remaining_time": "3:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16541, "total_steps": 17941, "loss": 1.5137, "learning_rate": 1.5547618631068407e-06, "epoch": 0.9219664455715958, "percentage": 92.2, "elapsed_time": "1 day, 15:08:57", "remaining_time": "3:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16542, "total_steps": 17941, "loss": 1.5703, "learning_rate": 1.5525594209373717e-06, "epoch": 0.922022183824759, "percentage": 92.2, "elapsed_time": "1 day, 15:09:06", "remaining_time": "3:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16543, "total_steps": 17941, "loss": 1.5157, "learning_rate": 1.5503585152382538e-06, "epoch": 0.922077922077922, "percentage": 92.21, "elapsed_time": "1 day, 15:09:14", "remaining_time": "3:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16544, "total_steps": 17941, "loss": 1.7501, "learning_rate": 1.5481591460792921e-06, "epoch": 0.9221336603310852, "percentage": 92.21, "elapsed_time": "1 day, 15:09:23", "remaining_time": "3:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16545, "total_steps": 17941, "loss": 1.3828, "learning_rate": 1.5459613135302198e-06, "epoch": 0.9221893985842484, "percentage": 92.22, "elapsed_time": "1 day, 15:09:31", "remaining_time": "3:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16546, "total_steps": 17941, "loss": 1.8228, "learning_rate": 1.5437650176607477e-06, "epoch": 0.9222451368374115, "percentage": 92.22, "elapsed_time": "1 day, 15:09:40", "remaining_time": "3:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16547, "total_steps": 17941, "loss": 1.7252, "learning_rate": 1.5415702585405312e-06, "epoch": 0.9223008750905747, "percentage": 92.23, "elapsed_time": "1 day, 15:09:48", "remaining_time": "3:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16548, "total_steps": 17941, "loss": 1.735, "learning_rate": 1.5393770362391813e-06, "epoch": 0.9223566133437378, "percentage": 92.24, "elapsed_time": "1 day, 15:09:57", "remaining_time": "3:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16549, "total_steps": 17941, "loss": 1.6412, "learning_rate": 1.537185350826237e-06, "epoch": 0.9224123515969009, "percentage": 92.24, "elapsed_time": "1 day, 15:10:05", "remaining_time": "3:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16550, "total_steps": 17941, "loss": 1.7825, "learning_rate": 1.5349952023712144e-06, "epoch": 0.9224680898500641, "percentage": 92.25, "elapsed_time": "1 day, 15:10:14", "remaining_time": "3:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16551, "total_steps": 17941, "loss": 1.535, "learning_rate": 1.5328065909435807e-06, "epoch": 0.9225238281032272, "percentage": 92.25, "elapsed_time": "1 day, 15:10:22", "remaining_time": "3:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16552, "total_steps": 17941, "loss": 1.7134, "learning_rate": 1.5306195166127357e-06, "epoch": 0.9225795663563904, "percentage": 92.26, "elapsed_time": "1 day, 15:10:31", "remaining_time": "3:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16553, "total_steps": 17941, "loss": 1.7493, "learning_rate": 1.5284339794480406e-06, "epoch": 0.9226353046095536, "percentage": 92.26, "elapsed_time": "1 day, 15:10:39", "remaining_time": "3:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16554, "total_steps": 17941, "loss": 1.6107, "learning_rate": 1.5262499795188124e-06, "epoch": 0.9226910428627166, "percentage": 92.27, "elapsed_time": "1 day, 15:10:48", "remaining_time": "3:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16555, "total_steps": 17941, "loss": 1.3162, "learning_rate": 1.5240675168943118e-06, "epoch": 0.9227467811158798, "percentage": 92.27, "elapsed_time": "1 day, 15:10:56", "remaining_time": "3:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16556, "total_steps": 17941, "loss": 1.8181, "learning_rate": 1.521886591643762e-06, "epoch": 0.922802519369043, "percentage": 92.28, "elapsed_time": "1 day, 15:11:05", "remaining_time": "3:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16557, "total_steps": 17941, "loss": 1.7267, "learning_rate": 1.5197072038363125e-06, "epoch": 0.9228582576222061, "percentage": 92.29, "elapsed_time": "1 day, 15:11:13", "remaining_time": "3:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16558, "total_steps": 17941, "loss": 1.4564, "learning_rate": 1.5175293535411028e-06, "epoch": 0.9229139958753693, "percentage": 92.29, "elapsed_time": "1 day, 15:11:22", "remaining_time": "3:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16559, "total_steps": 17941, "loss": 1.5022, "learning_rate": 1.5153530408271832e-06, "epoch": 0.9229697341285324, "percentage": 92.3, "elapsed_time": "1 day, 15:11:30", "remaining_time": "3:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16560, "total_steps": 17941, "loss": 1.6439, "learning_rate": 1.5131782657635763e-06, "epoch": 0.9230254723816955, "percentage": 92.3, "elapsed_time": "1 day, 15:11:38", "remaining_time": "3:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16561, "total_steps": 17941, "loss": 1.8417, "learning_rate": 1.51100502841926e-06, "epoch": 0.9230812106348587, "percentage": 92.31, "elapsed_time": "1 day, 15:11:48", "remaining_time": "3:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16562, "total_steps": 17941, "loss": 1.6319, "learning_rate": 1.5088333288631573e-06, "epoch": 0.9231369488880219, "percentage": 92.31, "elapsed_time": "1 day, 15:11:56", "remaining_time": "3:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16563, "total_steps": 17941, "loss": 1.6145, "learning_rate": 1.5066631671641406e-06, "epoch": 0.923192687141185, "percentage": 92.32, "elapsed_time": "1 day, 15:12:05", "remaining_time": "3:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16564, "total_steps": 17941, "loss": 1.6342, "learning_rate": 1.5044945433910274e-06, "epoch": 0.9232484253943481, "percentage": 92.32, "elapsed_time": "1 day, 15:12:13", "remaining_time": "3:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16565, "total_steps": 17941, "loss": 1.5479, "learning_rate": 1.5023274576125956e-06, "epoch": 0.9233041636475113, "percentage": 92.33, "elapsed_time": "1 day, 15:12:22", "remaining_time": "3:15:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16566, "total_steps": 17941, "loss": 1.6262, "learning_rate": 1.5001619098975795e-06, "epoch": 0.9233599019006744, "percentage": 92.34, "elapsed_time": "1 day, 15:12:31", "remaining_time": "3:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16567, "total_steps": 17941, "loss": 1.4897, "learning_rate": 1.4979979003146572e-06, "epoch": 0.9234156401538376, "percentage": 92.34, "elapsed_time": "1 day, 15:12:39", "remaining_time": "3:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16568, "total_steps": 17941, "loss": 1.6279, "learning_rate": 1.4958354289324462e-06, "epoch": 0.9234713784070008, "percentage": 92.35, "elapsed_time": "1 day, 15:12:48", "remaining_time": "3:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16569, "total_steps": 17941, "loss": 1.5064, "learning_rate": 1.4936744958195415e-06, "epoch": 0.9235271166601638, "percentage": 92.35, "elapsed_time": "1 day, 15:12:56", "remaining_time": "3:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16570, "total_steps": 17941, "loss": 1.7816, "learning_rate": 1.4915151010444716e-06, "epoch": 0.923582854913327, "percentage": 92.36, "elapsed_time": "1 day, 15:13:05", "remaining_time": "3:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16571, "total_steps": 17941, "loss": 1.701, "learning_rate": 1.489357244675721e-06, "epoch": 0.9236385931664901, "percentage": 92.36, "elapsed_time": "1 day, 15:13:13", "remaining_time": "3:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16572, "total_steps": 17941, "loss": 1.6186, "learning_rate": 1.4872009267817177e-06, "epoch": 0.9236943314196533, "percentage": 92.37, "elapsed_time": "1 day, 15:13:22", "remaining_time": "3:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16573, "total_steps": 17941, "loss": 1.684, "learning_rate": 1.485046147430852e-06, "epoch": 0.9237500696728165, "percentage": 92.38, "elapsed_time": "1 day, 15:13:31", "remaining_time": "3:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16574, "total_steps": 17941, "loss": 1.5003, "learning_rate": 1.4828929066914632e-06, "epoch": 0.9238058079259795, "percentage": 92.38, "elapsed_time": "1 day, 15:13:39", "remaining_time": "3:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16575, "total_steps": 17941, "loss": 1.684, "learning_rate": 1.4807412046318303e-06, "epoch": 0.9238615461791427, "percentage": 92.39, "elapsed_time": "1 day, 15:13:48", "remaining_time": "3:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16576, "total_steps": 17941, "loss": 1.5795, "learning_rate": 1.4785910413202042e-06, "epoch": 0.9239172844323059, "percentage": 92.39, "elapsed_time": "1 day, 15:13:56", "remaining_time": "3:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16577, "total_steps": 17941, "loss": 1.5598, "learning_rate": 1.4764424168247747e-06, "epoch": 0.923973022685469, "percentage": 92.4, "elapsed_time": "1 day, 15:14:05", "remaining_time": "3:13:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16578, "total_steps": 17941, "loss": 1.4809, "learning_rate": 1.4742953312136765e-06, "epoch": 0.9240287609386322, "percentage": 92.4, "elapsed_time": "1 day, 15:14:13", "remaining_time": "3:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16579, "total_steps": 17941, "loss": 1.5731, "learning_rate": 1.4721497845550048e-06, "epoch": 0.9240844991917954, "percentage": 92.41, "elapsed_time": "1 day, 15:14:22", "remaining_time": "3:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16580, "total_steps": 17941, "loss": 1.7021, "learning_rate": 1.4700057769168053e-06, "epoch": 0.9241402374449584, "percentage": 92.41, "elapsed_time": "1 day, 15:14:30", "remaining_time": "3:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16581, "total_steps": 17941, "loss": 1.7689, "learning_rate": 1.4678633083670734e-06, "epoch": 0.9241959756981216, "percentage": 92.42, "elapsed_time": "1 day, 15:14:38", "remaining_time": "3:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16582, "total_steps": 17941, "loss": 1.0948, "learning_rate": 1.4657223789737606e-06, "epoch": 0.9242517139512848, "percentage": 92.43, "elapsed_time": "1 day, 15:14:47", "remaining_time": "3:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16583, "total_steps": 17941, "loss": 1.6724, "learning_rate": 1.4635829888047459e-06, "epoch": 0.9243074522044479, "percentage": 92.43, "elapsed_time": "1 day, 15:14:56", "remaining_time": "3:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16584, "total_steps": 17941, "loss": 1.3943, "learning_rate": 1.4614451379279081e-06, "epoch": 0.9243631904576111, "percentage": 92.44, "elapsed_time": "1 day, 15:15:05", "remaining_time": "3:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16585, "total_steps": 17941, "loss": 1.5175, "learning_rate": 1.459308826411021e-06, "epoch": 0.9244189287107742, "percentage": 92.44, "elapsed_time": "1 day, 15:15:13", "remaining_time": "3:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16586, "total_steps": 17941, "loss": 1.6664, "learning_rate": 1.457174054321847e-06, "epoch": 0.9244746669639373, "percentage": 92.45, "elapsed_time": "1 day, 15:15:21", "remaining_time": "3:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16587, "total_steps": 17941, "loss": 1.7089, "learning_rate": 1.4550408217280875e-06, "epoch": 0.9245304052171005, "percentage": 92.45, "elapsed_time": "1 day, 15:15:30", "remaining_time": "3:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16588, "total_steps": 17941, "loss": 1.7767, "learning_rate": 1.4529091286973995e-06, "epoch": 0.9245861434702637, "percentage": 92.46, "elapsed_time": "1 day, 15:15:38", "remaining_time": "3:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16589, "total_steps": 17941, "loss": 1.5851, "learning_rate": 1.4507789752973844e-06, "epoch": 0.9246418817234268, "percentage": 92.46, "elapsed_time": "1 day, 15:15:47", "remaining_time": "3:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16590, "total_steps": 17941, "loss": 1.6937, "learning_rate": 1.4486503615955993e-06, "epoch": 0.92469761997659, "percentage": 92.47, "elapsed_time": "1 day, 15:15:55", "remaining_time": "3:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16591, "total_steps": 17941, "loss": 1.7255, "learning_rate": 1.4465232876595457e-06, "epoch": 0.9247533582297531, "percentage": 92.48, "elapsed_time": "1 day, 15:16:04", "remaining_time": "3:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16592, "total_steps": 17941, "loss": 1.4131, "learning_rate": 1.4443977535566922e-06, "epoch": 0.9248090964829162, "percentage": 92.48, "elapsed_time": "1 day, 15:16:13", "remaining_time": "3:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16593, "total_steps": 17941, "loss": 1.802, "learning_rate": 1.4422737593544455e-06, "epoch": 0.9248648347360794, "percentage": 92.49, "elapsed_time": "1 day, 15:16:22", "remaining_time": "3:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16594, "total_steps": 17941, "loss": 1.5824, "learning_rate": 1.4401513051201521e-06, "epoch": 0.9249205729892425, "percentage": 92.49, "elapsed_time": "1 day, 15:16:30", "remaining_time": "3:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16595, "total_steps": 17941, "loss": 1.5499, "learning_rate": 1.4380303909211413e-06, "epoch": 0.9249763112424056, "percentage": 92.5, "elapsed_time": "1 day, 15:16:39", "remaining_time": "3:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16596, "total_steps": 17941, "loss": 1.5213, "learning_rate": 1.435911016824676e-06, "epoch": 0.9250320494955688, "percentage": 92.5, "elapsed_time": "1 day, 15:16:47", "remaining_time": "3:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16597, "total_steps": 17941, "loss": 1.7629, "learning_rate": 1.4337931828979633e-06, "epoch": 0.9250877877487319, "percentage": 92.51, "elapsed_time": "1 day, 15:16:56", "remaining_time": "3:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16598, "total_steps": 17941, "loss": 1.53, "learning_rate": 1.4316768892081667e-06, "epoch": 0.9251435260018951, "percentage": 92.51, "elapsed_time": "1 day, 15:17:04", "remaining_time": "3:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16599, "total_steps": 17941, "loss": 1.6082, "learning_rate": 1.42956213582241e-06, "epoch": 0.9251992642550583, "percentage": 92.52, "elapsed_time": "1 day, 15:17:13", "remaining_time": "3:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16600, "total_steps": 17941, "loss": 1.6629, "learning_rate": 1.427448922807756e-06, "epoch": 0.9252550025082213, "percentage": 92.53, "elapsed_time": "1 day, 15:17:21", "remaining_time": "3:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16601, "total_steps": 17941, "loss": 1.6067, "learning_rate": 1.425337250231218e-06, "epoch": 0.9253107407613845, "percentage": 92.53, "elapsed_time": "1 day, 15:17:30", "remaining_time": "3:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16602, "total_steps": 17941, "loss": 1.8957, "learning_rate": 1.4232271181597757e-06, "epoch": 0.9253664790145477, "percentage": 92.54, "elapsed_time": "1 day, 15:17:38", "remaining_time": "3:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16603, "total_steps": 17941, "loss": 1.6444, "learning_rate": 1.4211185266603589e-06, "epoch": 0.9254222172677108, "percentage": 92.54, "elapsed_time": "1 day, 15:17:47", "remaining_time": "3:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16604, "total_steps": 17941, "loss": 1.6003, "learning_rate": 1.4190114757998141e-06, "epoch": 0.925477955520874, "percentage": 92.55, "elapsed_time": "1 day, 15:17:55", "remaining_time": "3:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16605, "total_steps": 17941, "loss": 1.5485, "learning_rate": 1.4169059656449824e-06, "epoch": 0.9255336937740372, "percentage": 92.55, "elapsed_time": "1 day, 15:18:04", "remaining_time": "3:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16606, "total_steps": 17941, "loss": 1.4721, "learning_rate": 1.4148019962626323e-06, "epoch": 0.9255894320272002, "percentage": 92.56, "elapsed_time": "1 day, 15:18:13", "remaining_time": "3:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16607, "total_steps": 17941, "loss": 1.7393, "learning_rate": 1.4126995677195e-06, "epoch": 0.9256451702803634, "percentage": 92.56, "elapsed_time": "1 day, 15:18:22", "remaining_time": "3:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16608, "total_steps": 17941, "loss": 1.7286, "learning_rate": 1.410598680082248e-06, "epoch": 0.9257009085335266, "percentage": 92.57, "elapsed_time": "1 day, 15:18:30", "remaining_time": "3:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16609, "total_steps": 17941, "loss": 1.7772, "learning_rate": 1.4084993334175012e-06, "epoch": 0.9257566467866897, "percentage": 92.58, "elapsed_time": "1 day, 15:18:38", "remaining_time": "3:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16610, "total_steps": 17941, "loss": 1.4551, "learning_rate": 1.4064015277918618e-06, "epoch": 0.9258123850398529, "percentage": 92.58, "elapsed_time": "1 day, 15:18:47", "remaining_time": "3:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16611, "total_steps": 17941, "loss": 1.6318, "learning_rate": 1.4043052632718378e-06, "epoch": 0.925868123293016, "percentage": 92.59, "elapsed_time": "1 day, 15:18:55", "remaining_time": "3:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16612, "total_steps": 17941, "loss": 1.5872, "learning_rate": 1.4022105399239206e-06, "epoch": 0.9259238615461791, "percentage": 92.59, "elapsed_time": "1 day, 15:19:04", "remaining_time": "3:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16613, "total_steps": 17941, "loss": 1.5583, "learning_rate": 1.4001173578145398e-06, "epoch": 0.9259795997993423, "percentage": 92.6, "elapsed_time": "1 day, 15:19:12", "remaining_time": "3:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16614, "total_steps": 17941, "loss": 1.635, "learning_rate": 1.3980257170100763e-06, "epoch": 0.9260353380525055, "percentage": 92.6, "elapsed_time": "1 day, 15:19:21", "remaining_time": "3:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16615, "total_steps": 17941, "loss": 1.4499, "learning_rate": 1.3959356175768768e-06, "epoch": 0.9260910763056686, "percentage": 92.61, "elapsed_time": "1 day, 15:19:29", "remaining_time": "3:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16616, "total_steps": 17941, "loss": 1.2255, "learning_rate": 1.3938470595812103e-06, "epoch": 0.9261468145588317, "percentage": 92.61, "elapsed_time": "1 day, 15:19:38", "remaining_time": "3:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16617, "total_steps": 17941, "loss": 1.5682, "learning_rate": 1.391760043089324e-06, "epoch": 0.9262025528119948, "percentage": 92.62, "elapsed_time": "1 day, 15:19:46", "remaining_time": "3:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16618, "total_steps": 17941, "loss": 1.8535, "learning_rate": 1.3896745681674039e-06, "epoch": 0.926258291065158, "percentage": 92.63, "elapsed_time": "1 day, 15:19:55", "remaining_time": "3:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16619, "total_steps": 17941, "loss": 1.5544, "learning_rate": 1.3875906348815914e-06, "epoch": 0.9263140293183212, "percentage": 92.63, "elapsed_time": "1 day, 15:20:03", "remaining_time": "3:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16620, "total_steps": 17941, "loss": 1.5231, "learning_rate": 1.3855082432979672e-06, "epoch": 0.9263697675714843, "percentage": 92.64, "elapsed_time": "1 day, 15:20:12", "remaining_time": "3:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16621, "total_steps": 17941, "loss": 1.6676, "learning_rate": 1.383427393482578e-06, "epoch": 0.9264255058246474, "percentage": 92.64, "elapsed_time": "1 day, 15:20:20", "remaining_time": "3:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16622, "total_steps": 17941, "loss": 1.5498, "learning_rate": 1.381348085501427e-06, "epoch": 0.9264812440778106, "percentage": 92.65, "elapsed_time": "1 day, 15:20:29", "remaining_time": "3:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16623, "total_steps": 17941, "loss": 1.7304, "learning_rate": 1.3792703194204448e-06, "epoch": 0.9265369823309737, "percentage": 92.65, "elapsed_time": "1 day, 15:20:37", "remaining_time": "3:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16624, "total_steps": 17941, "loss": 1.73, "learning_rate": 1.3771940953055284e-06, "epoch": 0.9265927205841369, "percentage": 92.66, "elapsed_time": "1 day, 15:20:46", "remaining_time": "3:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16625, "total_steps": 17941, "loss": 1.653, "learning_rate": 1.3751194132225253e-06, "epoch": 0.9266484588373001, "percentage": 92.66, "elapsed_time": "1 day, 15:20:55", "remaining_time": "3:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16626, "total_steps": 17941, "loss": 1.467, "learning_rate": 1.3730462732372328e-06, "epoch": 0.9267041970904631, "percentage": 92.67, "elapsed_time": "1 day, 15:21:04", "remaining_time": "3:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16627, "total_steps": 17941, "loss": 1.7548, "learning_rate": 1.370974675415393e-06, "epoch": 0.9267599353436263, "percentage": 92.68, "elapsed_time": "1 day, 15:21:12", "remaining_time": "3:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16628, "total_steps": 17941, "loss": 1.8312, "learning_rate": 1.3689046198227086e-06, "epoch": 0.9268156735967895, "percentage": 92.68, "elapsed_time": "1 day, 15:21:21", "remaining_time": "3:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16629, "total_steps": 17941, "loss": 1.6967, "learning_rate": 1.366836106524838e-06, "epoch": 0.9268714118499526, "percentage": 92.69, "elapsed_time": "1 day, 15:21:29", "remaining_time": "3:06:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16630, "total_steps": 17941, "loss": 1.4939, "learning_rate": 1.3647691355873737e-06, "epoch": 0.9269271501031158, "percentage": 92.69, "elapsed_time": "1 day, 15:21:38", "remaining_time": "3:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16631, "total_steps": 17941, "loss": 1.4178, "learning_rate": 1.3627037070758686e-06, "epoch": 0.926982888356279, "percentage": 92.7, "elapsed_time": "1 day, 15:21:46", "remaining_time": "3:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16632, "total_steps": 17941, "loss": 1.5338, "learning_rate": 1.3606398210558202e-06, "epoch": 0.927038626609442, "percentage": 92.7, "elapsed_time": "1 day, 15:21:55", "remaining_time": "3:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16633, "total_steps": 17941, "loss": 1.6177, "learning_rate": 1.3585774775926985e-06, "epoch": 0.9270943648626052, "percentage": 92.71, "elapsed_time": "1 day, 15:22:03", "remaining_time": "3:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16634, "total_steps": 17941, "loss": 1.6417, "learning_rate": 1.3565166767519012e-06, "epoch": 0.9271501031157684, "percentage": 92.72, "elapsed_time": "1 day, 15:22:12", "remaining_time": "3:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16635, "total_steps": 17941, "loss": 1.5803, "learning_rate": 1.3544574185987702e-06, "epoch": 0.9272058413689315, "percentage": 92.72, "elapsed_time": "1 day, 15:22:20", "remaining_time": "3:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16636, "total_steps": 17941, "loss": 1.5008, "learning_rate": 1.3523997031986424e-06, "epoch": 0.9272615796220947, "percentage": 92.73, "elapsed_time": "1 day, 15:22:28", "remaining_time": "3:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16637, "total_steps": 17941, "loss": 1.5865, "learning_rate": 1.350343530616749e-06, "epoch": 0.9273173178752578, "percentage": 92.73, "elapsed_time": "1 day, 15:22:37", "remaining_time": "3:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16638, "total_steps": 17941, "loss": 1.8265, "learning_rate": 1.3482889009183153e-06, "epoch": 0.9273730561284209, "percentage": 92.74, "elapsed_time": "1 day, 15:22:46", "remaining_time": "3:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16639, "total_steps": 17941, "loss": 1.7269, "learning_rate": 1.3462358141685005e-06, "epoch": 0.9274287943815841, "percentage": 92.74, "elapsed_time": "1 day, 15:22:54", "remaining_time": "3:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16640, "total_steps": 17941, "loss": 1.686, "learning_rate": 1.3441842704324136e-06, "epoch": 0.9274845326347472, "percentage": 92.75, "elapsed_time": "1 day, 15:23:02", "remaining_time": "3:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16641, "total_steps": 17941, "loss": 1.7519, "learning_rate": 1.3421342697751249e-06, "epoch": 0.9275402708879104, "percentage": 92.75, "elapsed_time": "1 day, 15:23:11", "remaining_time": "3:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16642, "total_steps": 17941, "loss": 1.8219, "learning_rate": 1.3400858122616323e-06, "epoch": 0.9275960091410735, "percentage": 92.76, "elapsed_time": "1 day, 15:23:19", "remaining_time": "3:04:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16643, "total_steps": 17941, "loss": 1.6694, "learning_rate": 1.338038897956917e-06, "epoch": 0.9276517473942366, "percentage": 92.77, "elapsed_time": "1 day, 15:23:28", "remaining_time": "3:04:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16644, "total_steps": 17941, "loss": 1.396, "learning_rate": 1.3359935269258828e-06, "epoch": 0.9277074856473998, "percentage": 92.77, "elapsed_time": "1 day, 15:23:36", "remaining_time": "3:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16645, "total_steps": 17941, "loss": 1.7887, "learning_rate": 1.333949699233411e-06, "epoch": 0.927763223900563, "percentage": 92.78, "elapsed_time": "1 day, 15:23:45", "remaining_time": "3:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16646, "total_steps": 17941, "loss": 1.6942, "learning_rate": 1.3319074149443057e-06, "epoch": 0.9278189621537261, "percentage": 92.78, "elapsed_time": "1 day, 15:23:53", "remaining_time": "3:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16647, "total_steps": 17941, "loss": 1.7105, "learning_rate": 1.3298666741233424e-06, "epoch": 0.9278747004068892, "percentage": 92.79, "elapsed_time": "1 day, 15:24:02", "remaining_time": "3:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16648, "total_steps": 17941, "loss": 1.6445, "learning_rate": 1.3278274768352473e-06, "epoch": 0.9279304386600524, "percentage": 92.79, "elapsed_time": "1 day, 15:24:10", "remaining_time": "3:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16649, "total_steps": 17941, "loss": 1.6324, "learning_rate": 1.3257898231446797e-06, "epoch": 0.9279861769132155, "percentage": 92.8, "elapsed_time": "1 day, 15:24:19", "remaining_time": "3:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16650, "total_steps": 17941, "loss": 1.611, "learning_rate": 1.3237537131162714e-06, "epoch": 0.9280419151663787, "percentage": 92.8, "elapsed_time": "1 day, 15:24:27", "remaining_time": "3:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16651, "total_steps": 17941, "loss": 1.6696, "learning_rate": 1.3217191468145928e-06, "epoch": 0.9280976534195419, "percentage": 92.81, "elapsed_time": "1 day, 15:24:36", "remaining_time": "3:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16652, "total_steps": 17941, "loss": 1.4856, "learning_rate": 1.3196861243041758e-06, "epoch": 0.9281533916727049, "percentage": 92.82, "elapsed_time": "1 day, 15:24:44", "remaining_time": "3:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16653, "total_steps": 17941, "loss": 1.7154, "learning_rate": 1.3176546456494742e-06, "epoch": 0.9282091299258681, "percentage": 92.82, "elapsed_time": "1 day, 15:24:53", "remaining_time": "3:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16654, "total_steps": 17941, "loss": 1.6028, "learning_rate": 1.3156247109149366e-06, "epoch": 0.9282648681790313, "percentage": 92.83, "elapsed_time": "1 day, 15:25:02", "remaining_time": "3:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16655, "total_steps": 17941, "loss": 1.5997, "learning_rate": 1.3135963201649393e-06, "epoch": 0.9283206064321944, "percentage": 92.83, "elapsed_time": "1 day, 15:25:10", "remaining_time": "3:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16656, "total_steps": 17941, "loss": 1.5001, "learning_rate": 1.3115694734638028e-06, "epoch": 0.9283763446853576, "percentage": 92.84, "elapsed_time": "1 day, 15:25:19", "remaining_time": "3:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16657, "total_steps": 17941, "loss": 1.2605, "learning_rate": 1.3095441708758037e-06, "epoch": 0.9284320829385208, "percentage": 92.84, "elapsed_time": "1 day, 15:25:27", "remaining_time": "3:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16658, "total_steps": 17941, "loss": 1.3539, "learning_rate": 1.307520412465185e-06, "epoch": 0.9284878211916838, "percentage": 92.85, "elapsed_time": "1 day, 15:25:35", "remaining_time": "3:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16659, "total_steps": 17941, "loss": 1.4482, "learning_rate": 1.3054981982961234e-06, "epoch": 0.928543559444847, "percentage": 92.85, "elapsed_time": "1 day, 15:25:44", "remaining_time": "3:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16660, "total_steps": 17941, "loss": 1.5341, "learning_rate": 1.303477528432745e-06, "epoch": 0.9285992976980102, "percentage": 92.86, "elapsed_time": "1 day, 15:25:53", "remaining_time": "3:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16661, "total_steps": 17941, "loss": 1.6272, "learning_rate": 1.301458402939132e-06, "epoch": 0.9286550359511733, "percentage": 92.87, "elapsed_time": "1 day, 15:26:01", "remaining_time": "3:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16662, "total_steps": 17941, "loss": 1.4829, "learning_rate": 1.2994408218793385e-06, "epoch": 0.9287107742043365, "percentage": 92.87, "elapsed_time": "1 day, 15:26:10", "remaining_time": "3:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16663, "total_steps": 17941, "loss": 1.6001, "learning_rate": 1.297424785317336e-06, "epoch": 0.9287665124574995, "percentage": 92.88, "elapsed_time": "1 day, 15:26:19", "remaining_time": "3:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16664, "total_steps": 17941, "loss": 1.7221, "learning_rate": 1.2954102933170564e-06, "epoch": 0.9288222507106627, "percentage": 92.88, "elapsed_time": "1 day, 15:26:27", "remaining_time": "3:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16665, "total_steps": 17941, "loss": 1.6743, "learning_rate": 1.2933973459423987e-06, "epoch": 0.9288779889638259, "percentage": 92.89, "elapsed_time": "1 day, 15:26:36", "remaining_time": "3:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16666, "total_steps": 17941, "loss": 1.741, "learning_rate": 1.2913859432572007e-06, "epoch": 0.928933727216989, "percentage": 92.89, "elapsed_time": "1 day, 15:26:44", "remaining_time": "3:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16667, "total_steps": 17941, "loss": 1.7181, "learning_rate": 1.2893760853252501e-06, "epoch": 0.9289894654701522, "percentage": 92.9, "elapsed_time": "1 day, 15:26:53", "remaining_time": "3:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16668, "total_steps": 17941, "loss": 1.36, "learning_rate": 1.2873677722102795e-06, "epoch": 0.9290452037233153, "percentage": 92.9, "elapsed_time": "1 day, 15:27:01", "remaining_time": "3:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16669, "total_steps": 17941, "loss": 1.4247, "learning_rate": 1.285361003975999e-06, "epoch": 0.9291009419764784, "percentage": 92.91, "elapsed_time": "1 day, 15:27:09", "remaining_time": "3:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16670, "total_steps": 17941, "loss": 1.4759, "learning_rate": 1.2833557806860407e-06, "epoch": 0.9291566802296416, "percentage": 92.92, "elapsed_time": "1 day, 15:27:18", "remaining_time": "3:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16671, "total_steps": 17941, "loss": 1.738, "learning_rate": 1.2813521024039987e-06, "epoch": 0.9292124184828048, "percentage": 92.92, "elapsed_time": "1 day, 15:27:27", "remaining_time": "3:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16672, "total_steps": 17941, "loss": 1.509, "learning_rate": 1.2793499691934107e-06, "epoch": 0.9292681567359679, "percentage": 92.93, "elapsed_time": "1 day, 15:27:35", "remaining_time": "3:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16673, "total_steps": 17941, "loss": 1.555, "learning_rate": 1.2773493811177817e-06, "epoch": 0.929323894989131, "percentage": 92.93, "elapsed_time": "1 day, 15:27:44", "remaining_time": "3:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16674, "total_steps": 17941, "loss": 1.5637, "learning_rate": 1.2753503382405662e-06, "epoch": 0.9293796332422942, "percentage": 92.94, "elapsed_time": "1 day, 15:27:52", "remaining_time": "2:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16675, "total_steps": 17941, "loss": 1.627, "learning_rate": 1.2733528406251471e-06, "epoch": 0.9294353714954573, "percentage": 92.94, "elapsed_time": "1 day, 15:28:01", "remaining_time": "2:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16676, "total_steps": 17941, "loss": 1.1211, "learning_rate": 1.2713568883348848e-06, "epoch": 0.9294911097486205, "percentage": 92.95, "elapsed_time": "1 day, 15:28:09", "remaining_time": "2:59:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16677, "total_steps": 17941, "loss": 1.5907, "learning_rate": 1.2693624814330674e-06, "epoch": 0.9295468480017837, "percentage": 92.95, "elapsed_time": "1 day, 15:28:18", "remaining_time": "2:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16678, "total_steps": 17941, "loss": 1.6616, "learning_rate": 1.267369619982961e-06, "epoch": 0.9296025862549467, "percentage": 92.96, "elapsed_time": "1 day, 15:28:27", "remaining_time": "2:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16679, "total_steps": 17941, "loss": 1.6527, "learning_rate": 1.2653783040477486e-06, "epoch": 0.9296583245081099, "percentage": 92.97, "elapsed_time": "1 day, 15:28:35", "remaining_time": "2:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16680, "total_steps": 17941, "loss": 1.7218, "learning_rate": 1.2633885336906015e-06, "epoch": 0.9297140627612731, "percentage": 92.97, "elapsed_time": "1 day, 15:28:43", "remaining_time": "2:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16681, "total_steps": 17941, "loss": 1.617, "learning_rate": 1.2614003089746196e-06, "epoch": 0.9297698010144362, "percentage": 92.98, "elapsed_time": "1 day, 15:28:52", "remaining_time": "2:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16682, "total_steps": 17941, "loss": 1.8366, "learning_rate": 1.2594136299628467e-06, "epoch": 0.9298255392675994, "percentage": 92.98, "elapsed_time": "1 day, 15:29:00", "remaining_time": "2:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16683, "total_steps": 17941, "loss": 1.4348, "learning_rate": 1.2574284967182992e-06, "epoch": 0.9298812775207626, "percentage": 92.99, "elapsed_time": "1 day, 15:29:09", "remaining_time": "2:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16684, "total_steps": 17941, "loss": 1.7107, "learning_rate": 1.2554449093039267e-06, "epoch": 0.9299370157739256, "percentage": 92.99, "elapsed_time": "1 day, 15:29:17", "remaining_time": "2:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16685, "total_steps": 17941, "loss": 1.6215, "learning_rate": 1.253462867782651e-06, "epoch": 0.9299927540270888, "percentage": 93.0, "elapsed_time": "1 day, 15:29:26", "remaining_time": "2:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16686, "total_steps": 17941, "loss": 1.6611, "learning_rate": 1.2514823722173108e-06, "epoch": 0.9300484922802519, "percentage": 93.0, "elapsed_time": "1 day, 15:29:34", "remaining_time": "2:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16687, "total_steps": 17941, "loss": 1.568, "learning_rate": 1.249503422670728e-06, "epoch": 0.9301042305334151, "percentage": 93.01, "elapsed_time": "1 day, 15:29:43", "remaining_time": "2:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16688, "total_steps": 17941, "loss": 1.752, "learning_rate": 1.2475260192056638e-06, "epoch": 0.9301599687865783, "percentage": 93.02, "elapsed_time": "1 day, 15:29:51", "remaining_time": "2:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16689, "total_steps": 17941, "loss": 1.6086, "learning_rate": 1.2455501618848285e-06, "epoch": 0.9302157070397413, "percentage": 93.02, "elapsed_time": "1 day, 15:30:00", "remaining_time": "2:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16690, "total_steps": 17941, "loss": 1.7463, "learning_rate": 1.243575850770884e-06, "epoch": 0.9302714452929045, "percentage": 93.03, "elapsed_time": "1 day, 15:30:08", "remaining_time": "2:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16691, "total_steps": 17941, "loss": 1.5899, "learning_rate": 1.2416030859264406e-06, "epoch": 0.9303271835460677, "percentage": 93.03, "elapsed_time": "1 day, 15:30:17", "remaining_time": "2:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16692, "total_steps": 17941, "loss": 1.6088, "learning_rate": 1.2396318674140651e-06, "epoch": 0.9303829217992308, "percentage": 93.04, "elapsed_time": "1 day, 15:30:25", "remaining_time": "2:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16693, "total_steps": 17941, "loss": 1.6877, "learning_rate": 1.2376621952962851e-06, "epoch": 0.930438660052394, "percentage": 93.04, "elapsed_time": "1 day, 15:30:34", "remaining_time": "2:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16694, "total_steps": 17941, "loss": 1.6779, "learning_rate": 1.2356940696355401e-06, "epoch": 0.9304943983055571, "percentage": 93.05, "elapsed_time": "1 day, 15:30:43", "remaining_time": "2:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16695, "total_steps": 17941, "loss": 1.7652, "learning_rate": 1.2337274904942796e-06, "epoch": 0.9305501365587202, "percentage": 93.06, "elapsed_time": "1 day, 15:30:51", "remaining_time": "2:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16696, "total_steps": 17941, "loss": 1.7286, "learning_rate": 1.231762457934843e-06, "epoch": 0.9306058748118834, "percentage": 93.06, "elapsed_time": "1 day, 15:30:59", "remaining_time": "2:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16697, "total_steps": 17941, "loss": 1.5344, "learning_rate": 1.2297989720195747e-06, "epoch": 0.9306616130650466, "percentage": 93.07, "elapsed_time": "1 day, 15:31:08", "remaining_time": "2:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16698, "total_steps": 17941, "loss": 1.4956, "learning_rate": 1.2278370328107192e-06, "epoch": 0.9307173513182097, "percentage": 93.07, "elapsed_time": "1 day, 15:31:16", "remaining_time": "2:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16699, "total_steps": 17941, "loss": 1.5858, "learning_rate": 1.2258766403705157e-06, "epoch": 0.9307730895713728, "percentage": 93.08, "elapsed_time": "1 day, 15:31:25", "remaining_time": "2:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16700, "total_steps": 17941, "loss": 1.713, "learning_rate": 1.2239177947611423e-06, "epoch": 0.930828827824536, "percentage": 93.08, "elapsed_time": "1 day, 15:31:34", "remaining_time": "2:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16701, "total_steps": 17941, "loss": 1.8718, "learning_rate": 1.221960496044705e-06, "epoch": 0.9308845660776991, "percentage": 93.09, "elapsed_time": "1 day, 15:31:42", "remaining_time": "2:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16702, "total_steps": 17941, "loss": 1.724, "learning_rate": 1.2200047442832817e-06, "epoch": 0.9309403043308623, "percentage": 93.09, "elapsed_time": "1 day, 15:31:50", "remaining_time": "2:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16703, "total_steps": 17941, "loss": 1.7801, "learning_rate": 1.2180505395389064e-06, "epoch": 0.9309960425840255, "percentage": 93.1, "elapsed_time": "1 day, 15:31:59", "remaining_time": "2:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16704, "total_steps": 17941, "loss": 1.7699, "learning_rate": 1.2160978818735514e-06, "epoch": 0.9310517808371885, "percentage": 93.11, "elapsed_time": "1 day, 15:32:08", "remaining_time": "2:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16705, "total_steps": 17941, "loss": 1.6572, "learning_rate": 1.2141467713491284e-06, "epoch": 0.9311075190903517, "percentage": 93.11, "elapsed_time": "1 day, 15:32:17", "remaining_time": "2:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16706, "total_steps": 17941, "loss": 1.6102, "learning_rate": 1.212197208027538e-06, "epoch": 0.9311632573435149, "percentage": 93.12, "elapsed_time": "1 day, 15:32:25", "remaining_time": "2:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16707, "total_steps": 17941, "loss": 1.3241, "learning_rate": 1.2102491919706027e-06, "epoch": 0.931218995596678, "percentage": 93.12, "elapsed_time": "1 day, 15:32:34", "remaining_time": "2:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16708, "total_steps": 17941, "loss": 1.7006, "learning_rate": 1.2083027232400957e-06, "epoch": 0.9312747338498412, "percentage": 93.13, "elapsed_time": "1 day, 15:32:42", "remaining_time": "2:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16709, "total_steps": 17941, "loss": 1.3477, "learning_rate": 1.2063578018977507e-06, "epoch": 0.9313304721030042, "percentage": 93.13, "elapsed_time": "1 day, 15:32:50", "remaining_time": "2:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16710, "total_steps": 17941, "loss": 1.7295, "learning_rate": 1.2044144280052517e-06, "epoch": 0.9313862103561674, "percentage": 93.14, "elapsed_time": "1 day, 15:32:59", "remaining_time": "2:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16711, "total_steps": 17941, "loss": 1.6229, "learning_rate": 1.2024726016242272e-06, "epoch": 0.9314419486093306, "percentage": 93.14, "elapsed_time": "1 day, 15:33:07", "remaining_time": "2:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16712, "total_steps": 17941, "loss": 1.2124, "learning_rate": 1.2005323228162612e-06, "epoch": 0.9314976868624937, "percentage": 93.15, "elapsed_time": "1 day, 15:33:16", "remaining_time": "2:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16713, "total_steps": 17941, "loss": 1.5589, "learning_rate": 1.198593591642888e-06, "epoch": 0.9315534251156569, "percentage": 93.16, "elapsed_time": "1 day, 15:33:24", "remaining_time": "2:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16714, "total_steps": 17941, "loss": 1.4937, "learning_rate": 1.196656408165603e-06, "epoch": 0.93160916336882, "percentage": 93.16, "elapsed_time": "1 day, 15:33:33", "remaining_time": "2:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16715, "total_steps": 17941, "loss": 1.3918, "learning_rate": 1.1947207724458232e-06, "epoch": 0.9316649016219831, "percentage": 93.17, "elapsed_time": "1 day, 15:33:41", "remaining_time": "2:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16716, "total_steps": 17941, "loss": 1.6976, "learning_rate": 1.1927866845449499e-06, "epoch": 0.9317206398751463, "percentage": 93.17, "elapsed_time": "1 day, 15:33:50", "remaining_time": "2:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16717, "total_steps": 17941, "loss": 1.6336, "learning_rate": 1.190854144524317e-06, "epoch": 0.9317763781283095, "percentage": 93.18, "elapsed_time": "1 day, 15:33:59", "remaining_time": "2:53:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16718, "total_steps": 17941, "loss": 1.8903, "learning_rate": 1.188923152445215e-06, "epoch": 0.9318321163814726, "percentage": 93.18, "elapsed_time": "1 day, 15:34:07", "remaining_time": "2:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16719, "total_steps": 17941, "loss": 1.7302, "learning_rate": 1.1869937083688831e-06, "epoch": 0.9318878546346357, "percentage": 93.19, "elapsed_time": "1 day, 15:34:16", "remaining_time": "2:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16720, "total_steps": 17941, "loss": 1.6667, "learning_rate": 1.1850658123565007e-06, "epoch": 0.9319435928877989, "percentage": 93.19, "elapsed_time": "1 day, 15:34:25", "remaining_time": "2:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16721, "total_steps": 17941, "loss": 1.8157, "learning_rate": 1.183139464469235e-06, "epoch": 0.931999331140962, "percentage": 93.2, "elapsed_time": "1 day, 15:34:33", "remaining_time": "2:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16722, "total_steps": 17941, "loss": 1.4797, "learning_rate": 1.1812146647681543e-06, "epoch": 0.9320550693941252, "percentage": 93.21, "elapsed_time": "1 day, 15:34:42", "remaining_time": "2:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16723, "total_steps": 17941, "loss": 1.7114, "learning_rate": 1.1792914133143208e-06, "epoch": 0.9321108076472884, "percentage": 93.21, "elapsed_time": "1 day, 15:34:50", "remaining_time": "2:52:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16724, "total_steps": 17941, "loss": 1.4327, "learning_rate": 1.177369710168702e-06, "epoch": 0.9321665459004514, "percentage": 93.22, "elapsed_time": "1 day, 15:34:59", "remaining_time": "2:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16725, "total_steps": 17941, "loss": 1.7566, "learning_rate": 1.1754495553922718e-06, "epoch": 0.9322222841536146, "percentage": 93.22, "elapsed_time": "1 day, 15:35:07", "remaining_time": "2:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16726, "total_steps": 17941, "loss": 1.5927, "learning_rate": 1.17353094904592e-06, "epoch": 0.9322780224067778, "percentage": 93.23, "elapsed_time": "1 day, 15:35:16", "remaining_time": "2:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16727, "total_steps": 17941, "loss": 1.7087, "learning_rate": 1.1716138911904816e-06, "epoch": 0.9323337606599409, "percentage": 93.23, "elapsed_time": "1 day, 15:35:24", "remaining_time": "2:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16728, "total_steps": 17941, "loss": 1.1584, "learning_rate": 1.169698381886758e-06, "epoch": 0.9323894989131041, "percentage": 93.24, "elapsed_time": "1 day, 15:35:33", "remaining_time": "2:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16729, "total_steps": 17941, "loss": 1.6593, "learning_rate": 1.1677844211955058e-06, "epoch": 0.9324452371662673, "percentage": 93.24, "elapsed_time": "1 day, 15:35:41", "remaining_time": "2:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16730, "total_steps": 17941, "loss": 1.6306, "learning_rate": 1.1658720091774211e-06, "epoch": 0.9325009754194303, "percentage": 93.25, "elapsed_time": "1 day, 15:35:49", "remaining_time": "2:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16731, "total_steps": 17941, "loss": 1.616, "learning_rate": 1.1639611458931498e-06, "epoch": 0.9325567136725935, "percentage": 93.26, "elapsed_time": "1 day, 15:35:58", "remaining_time": "2:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16732, "total_steps": 17941, "loss": 1.701, "learning_rate": 1.1620518314032935e-06, "epoch": 0.9326124519257566, "percentage": 93.26, "elapsed_time": "1 day, 15:36:06", "remaining_time": "2:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16733, "total_steps": 17941, "loss": 1.727, "learning_rate": 1.1601440657684204e-06, "epoch": 0.9326681901789198, "percentage": 93.27, "elapsed_time": "1 day, 15:36:15", "remaining_time": "2:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16734, "total_steps": 17941, "loss": 1.5478, "learning_rate": 1.1582378490490154e-06, "epoch": 0.932723928432083, "percentage": 93.27, "elapsed_time": "1 day, 15:36:23", "remaining_time": "2:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16735, "total_steps": 17941, "loss": 1.6477, "learning_rate": 1.1563331813055356e-06, "epoch": 0.932779666685246, "percentage": 93.28, "elapsed_time": "1 day, 15:36:32", "remaining_time": "2:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16736, "total_steps": 17941, "loss": 1.7011, "learning_rate": 1.1544300625983884e-06, "epoch": 0.9328354049384092, "percentage": 93.28, "elapsed_time": "1 day, 15:36:40", "remaining_time": "2:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16737, "total_steps": 17941, "loss": 1.7284, "learning_rate": 1.1525284929879364e-06, "epoch": 0.9328911431915724, "percentage": 93.29, "elapsed_time": "1 day, 15:36:49", "remaining_time": "2:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16738, "total_steps": 17941, "loss": 1.5, "learning_rate": 1.1506284725344763e-06, "epoch": 0.9329468814447355, "percentage": 93.29, "elapsed_time": "1 day, 15:36:58", "remaining_time": "2:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16739, "total_steps": 17941, "loss": 1.6443, "learning_rate": 1.1487300012982649e-06, "epoch": 0.9330026196978987, "percentage": 93.3, "elapsed_time": "1 day, 15:37:06", "remaining_time": "2:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16740, "total_steps": 17941, "loss": 1.5057, "learning_rate": 1.1468330793395266e-06, "epoch": 0.9330583579510618, "percentage": 93.31, "elapsed_time": "1 day, 15:37:15", "remaining_time": "2:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16741, "total_steps": 17941, "loss": 1.4323, "learning_rate": 1.144937706718402e-06, "epoch": 0.9331140962042249, "percentage": 93.31, "elapsed_time": "1 day, 15:37:23", "remaining_time": "2:50:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16742, "total_steps": 17941, "loss": 1.5609, "learning_rate": 1.1430438834950096e-06, "epoch": 0.9331698344573881, "percentage": 93.32, "elapsed_time": "1 day, 15:37:32", "remaining_time": "2:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16743, "total_steps": 17941, "loss": 1.6138, "learning_rate": 1.1411516097294073e-06, "epoch": 0.9332255727105513, "percentage": 93.32, "elapsed_time": "1 day, 15:37:40", "remaining_time": "2:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16744, "total_steps": 17941, "loss": 1.4596, "learning_rate": 1.1392608854816133e-06, "epoch": 0.9332813109637144, "percentage": 93.33, "elapsed_time": "1 day, 15:37:49", "remaining_time": "2:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16745, "total_steps": 17941, "loss": 1.635, "learning_rate": 1.1373717108115857e-06, "epoch": 0.9333370492168775, "percentage": 93.33, "elapsed_time": "1 day, 15:37:57", "remaining_time": "2:49:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16746, "total_steps": 17941, "loss": 1.5789, "learning_rate": 1.1354840857792315e-06, "epoch": 0.9333927874700407, "percentage": 93.34, "elapsed_time": "1 day, 15:38:06", "remaining_time": "2:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16747, "total_steps": 17941, "loss": 1.5497, "learning_rate": 1.133598010444431e-06, "epoch": 0.9334485257232038, "percentage": 93.34, "elapsed_time": "1 day, 15:38:15", "remaining_time": "2:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16748, "total_steps": 17941, "loss": 1.6279, "learning_rate": 1.1317134848669864e-06, "epoch": 0.933504263976367, "percentage": 93.35, "elapsed_time": "1 day, 15:38:23", "remaining_time": "2:49:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16749, "total_steps": 17941, "loss": 1.5749, "learning_rate": 1.1298305091066664e-06, "epoch": 0.9335600022295302, "percentage": 93.36, "elapsed_time": "1 day, 15:38:32", "remaining_time": "2:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16750, "total_steps": 17941, "loss": 1.7361, "learning_rate": 1.1279490832231954e-06, "epoch": 0.9336157404826932, "percentage": 93.36, "elapsed_time": "1 day, 15:38:40", "remaining_time": "2:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16751, "total_steps": 17941, "loss": 1.7525, "learning_rate": 1.1260692072762313e-06, "epoch": 0.9336714787358564, "percentage": 93.37, "elapsed_time": "1 day, 15:38:49", "remaining_time": "2:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16752, "total_steps": 17941, "loss": 1.731, "learning_rate": 1.1241908813253987e-06, "epoch": 0.9337272169890196, "percentage": 93.37, "elapsed_time": "1 day, 15:38:57", "remaining_time": "2:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16753, "total_steps": 17941, "loss": 1.6132, "learning_rate": 1.1223141054302665e-06, "epoch": 0.9337829552421827, "percentage": 93.38, "elapsed_time": "1 day, 15:39:06", "remaining_time": "2:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16754, "total_steps": 17941, "loss": 1.8055, "learning_rate": 1.120438879650354e-06, "epoch": 0.9338386934953459, "percentage": 93.38, "elapsed_time": "1 day, 15:39:14", "remaining_time": "2:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16755, "total_steps": 17941, "loss": 1.4531, "learning_rate": 1.11856520404513e-06, "epoch": 0.933894431748509, "percentage": 93.39, "elapsed_time": "1 day, 15:39:23", "remaining_time": "2:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16756, "total_steps": 17941, "loss": 1.7555, "learning_rate": 1.116693078674025e-06, "epoch": 0.9339501700016721, "percentage": 93.4, "elapsed_time": "1 day, 15:39:31", "remaining_time": "2:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16757, "total_steps": 17941, "loss": 1.6048, "learning_rate": 1.1148225035963966e-06, "epoch": 0.9340059082548353, "percentage": 93.4, "elapsed_time": "1 day, 15:39:40", "remaining_time": "2:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16758, "total_steps": 17941, "loss": 1.5587, "learning_rate": 1.1129534788715812e-06, "epoch": 0.9340616465079984, "percentage": 93.41, "elapsed_time": "1 day, 15:39:48", "remaining_time": "2:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16759, "total_steps": 17941, "loss": 1.6526, "learning_rate": 1.1110860045588589e-06, "epoch": 0.9341173847611616, "percentage": 93.41, "elapsed_time": "1 day, 15:39:56", "remaining_time": "2:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16760, "total_steps": 17941, "loss": 1.8698, "learning_rate": 1.109220080717438e-06, "epoch": 0.9341731230143248, "percentage": 93.42, "elapsed_time": "1 day, 15:40:05", "remaining_time": "2:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16761, "total_steps": 17941, "loss": 1.5642, "learning_rate": 1.1073557074065044e-06, "epoch": 0.9342288612674878, "percentage": 93.42, "elapsed_time": "1 day, 15:40:13", "remaining_time": "2:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16762, "total_steps": 17941, "loss": 1.6282, "learning_rate": 1.105492884685183e-06, "epoch": 0.934284599520651, "percentage": 93.43, "elapsed_time": "1 day, 15:40:22", "remaining_time": "2:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16763, "total_steps": 17941, "loss": 1.4938, "learning_rate": 1.10363161261256e-06, "epoch": 0.9343403377738142, "percentage": 93.43, "elapsed_time": "1 day, 15:40:30", "remaining_time": "2:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16764, "total_steps": 17941, "loss": 1.6369, "learning_rate": 1.1017718912476493e-06, "epoch": 0.9343960760269773, "percentage": 93.44, "elapsed_time": "1 day, 15:40:39", "remaining_time": "2:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16765, "total_steps": 17941, "loss": 1.447, "learning_rate": 1.0999137206494314e-06, "epoch": 0.9344518142801405, "percentage": 93.45, "elapsed_time": "1 day, 15:40:47", "remaining_time": "2:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16766, "total_steps": 17941, "loss": 1.6531, "learning_rate": 1.0980571008768592e-06, "epoch": 0.9345075525333036, "percentage": 93.45, "elapsed_time": "1 day, 15:40:56", "remaining_time": "2:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16767, "total_steps": 17941, "loss": 1.6529, "learning_rate": 1.0962020319887856e-06, "epoch": 0.9345632907864667, "percentage": 93.46, "elapsed_time": "1 day, 15:41:04", "remaining_time": "2:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16768, "total_steps": 17941, "loss": 1.7453, "learning_rate": 1.0943485140440578e-06, "epoch": 0.9346190290396299, "percentage": 93.46, "elapsed_time": "1 day, 15:41:12", "remaining_time": "2:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16769, "total_steps": 17941, "loss": 1.9268, "learning_rate": 1.092496547101457e-06, "epoch": 0.9346747672927931, "percentage": 93.47, "elapsed_time": "1 day, 15:41:21", "remaining_time": "2:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16770, "total_steps": 17941, "loss": 1.5568, "learning_rate": 1.0906461312197135e-06, "epoch": 0.9347305055459562, "percentage": 93.47, "elapsed_time": "1 day, 15:41:29", "remaining_time": "2:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16771, "total_steps": 17941, "loss": 1.5729, "learning_rate": 1.0887972664575141e-06, "epoch": 0.9347862437991193, "percentage": 93.48, "elapsed_time": "1 day, 15:41:39", "remaining_time": "2:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16772, "total_steps": 17941, "loss": 1.6663, "learning_rate": 1.0869499528734895e-06, "epoch": 0.9348419820522825, "percentage": 93.48, "elapsed_time": "1 day, 15:41:47", "remaining_time": "2:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16773, "total_steps": 17941, "loss": 1.6167, "learning_rate": 1.0851041905262372e-06, "epoch": 0.9348977203054456, "percentage": 93.49, "elapsed_time": "1 day, 15:41:56", "remaining_time": "2:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16774, "total_steps": 17941, "loss": 1.5327, "learning_rate": 1.0832599794742826e-06, "epoch": 0.9349534585586088, "percentage": 93.5, "elapsed_time": "1 day, 15:42:05", "remaining_time": "2:45:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16775, "total_steps": 17941, "loss": 1.8459, "learning_rate": 1.0814173197761178e-06, "epoch": 0.935009196811772, "percentage": 93.5, "elapsed_time": "1 day, 15:42:13", "remaining_time": "2:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16776, "total_steps": 17941, "loss": 1.6765, "learning_rate": 1.0795762114901742e-06, "epoch": 0.935064935064935, "percentage": 93.51, "elapsed_time": "1 day, 15:42:21", "remaining_time": "2:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16777, "total_steps": 17941, "loss": 1.6937, "learning_rate": 1.0777366546748547e-06, "epoch": 0.9351206733180982, "percentage": 93.51, "elapsed_time": "1 day, 15:42:30", "remaining_time": "2:45:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16778, "total_steps": 17941, "loss": 1.5319, "learning_rate": 1.075898649388496e-06, "epoch": 0.9351764115712613, "percentage": 93.52, "elapsed_time": "1 day, 15:42:38", "remaining_time": "2:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16779, "total_steps": 17941, "loss": 1.5061, "learning_rate": 1.0740621956893736e-06, "epoch": 0.9352321498244245, "percentage": 93.52, "elapsed_time": "1 day, 15:42:47", "remaining_time": "2:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16780, "total_steps": 17941, "loss": 1.623, "learning_rate": 1.072227293635747e-06, "epoch": 0.9352878880775877, "percentage": 93.53, "elapsed_time": "1 day, 15:42:55", "remaining_time": "2:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16781, "total_steps": 17941, "loss": 1.657, "learning_rate": 1.0703939432857969e-06, "epoch": 0.9353436263307507, "percentage": 93.53, "elapsed_time": "1 day, 15:43:04", "remaining_time": "2:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16782, "total_steps": 17941, "loss": 1.6301, "learning_rate": 1.0685621446976823e-06, "epoch": 0.9353993645839139, "percentage": 93.54, "elapsed_time": "1 day, 15:43:12", "remaining_time": "2:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16783, "total_steps": 17941, "loss": 1.738, "learning_rate": 1.0667318979294739e-06, "epoch": 0.9354551028370771, "percentage": 93.55, "elapsed_time": "1 day, 15:43:21", "remaining_time": "2:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16784, "total_steps": 17941, "loss": 1.7667, "learning_rate": 1.0649032030392304e-06, "epoch": 0.9355108410902402, "percentage": 93.55, "elapsed_time": "1 day, 15:43:30", "remaining_time": "2:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16785, "total_steps": 17941, "loss": 1.5402, "learning_rate": 1.0630760600849555e-06, "epoch": 0.9355665793434034, "percentage": 93.56, "elapsed_time": "1 day, 15:43:39", "remaining_time": "2:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16786, "total_steps": 17941, "loss": 1.6312, "learning_rate": 1.0612504691245807e-06, "epoch": 0.9356223175965666, "percentage": 93.56, "elapsed_time": "1 day, 15:43:47", "remaining_time": "2:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16787, "total_steps": 17941, "loss": 1.6652, "learning_rate": 1.059426430216004e-06, "epoch": 0.9356780558497296, "percentage": 93.57, "elapsed_time": "1 day, 15:43:56", "remaining_time": "2:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16788, "total_steps": 17941, "loss": 1.3273, "learning_rate": 1.0576039434170848e-06, "epoch": 0.9357337941028928, "percentage": 93.57, "elapsed_time": "1 day, 15:44:04", "remaining_time": "2:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16789, "total_steps": 17941, "loss": 1.6496, "learning_rate": 1.0557830087856102e-06, "epoch": 0.935789532356056, "percentage": 93.58, "elapsed_time": "1 day, 15:44:12", "remaining_time": "2:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16790, "total_steps": 17941, "loss": 1.872, "learning_rate": 1.0539636263793394e-06, "epoch": 0.9358452706092191, "percentage": 93.58, "elapsed_time": "1 day, 15:44:21", "remaining_time": "2:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16791, "total_steps": 17941, "loss": 1.7581, "learning_rate": 1.0521457962559545e-06, "epoch": 0.9359010088623823, "percentage": 93.59, "elapsed_time": "1 day, 15:44:29", "remaining_time": "2:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16792, "total_steps": 17941, "loss": 1.7107, "learning_rate": 1.050329518473131e-06, "epoch": 0.9359567471155454, "percentage": 93.6, "elapsed_time": "1 day, 15:44:39", "remaining_time": "2:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16793, "total_steps": 17941, "loss": 1.5497, "learning_rate": 1.0485147930884565e-06, "epoch": 0.9360124853687085, "percentage": 93.6, "elapsed_time": "1 day, 15:44:48", "remaining_time": "2:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16794, "total_steps": 17941, "loss": 1.6007, "learning_rate": 1.0467016201594849e-06, "epoch": 0.9360682236218717, "percentage": 93.61, "elapsed_time": "1 day, 15:44:56", "remaining_time": "2:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16795, "total_steps": 17941, "loss": 1.7443, "learning_rate": 1.0448899997437144e-06, "epoch": 0.9361239618750349, "percentage": 93.61, "elapsed_time": "1 day, 15:45:05", "remaining_time": "2:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16796, "total_steps": 17941, "loss": 2.0844, "learning_rate": 1.0430799318986162e-06, "epoch": 0.936179700128198, "percentage": 93.62, "elapsed_time": "1 day, 15:45:13", "remaining_time": "2:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16797, "total_steps": 17941, "loss": 1.6163, "learning_rate": 1.0412714166815773e-06, "epoch": 0.9362354383813611, "percentage": 93.62, "elapsed_time": "1 day, 15:45:22", "remaining_time": "2:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16798, "total_steps": 17941, "loss": 1.7549, "learning_rate": 1.0394644541499576e-06, "epoch": 0.9362911766345243, "percentage": 93.63, "elapsed_time": "1 day, 15:45:30", "remaining_time": "2:42:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16799, "total_steps": 17941, "loss": 1.5603, "learning_rate": 1.0376590443610723e-06, "epoch": 0.9363469148876874, "percentage": 93.63, "elapsed_time": "1 day, 15:45:39", "remaining_time": "2:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16800, "total_steps": 17941, "loss": 1.7288, "learning_rate": 1.0358551873721645e-06, "epoch": 0.9364026531408506, "percentage": 93.64, "elapsed_time": "1 day, 15:45:47", "remaining_time": "2:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16801, "total_steps": 17941, "loss": 1.6673, "learning_rate": 1.034052883240455e-06, "epoch": 0.9364583913940137, "percentage": 93.65, "elapsed_time": "1 day, 15:45:57", "remaining_time": "2:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16802, "total_steps": 17941, "loss": 1.7246, "learning_rate": 1.0322521320230927e-06, "epoch": 0.9365141296471768, "percentage": 93.65, "elapsed_time": "1 day, 15:46:05", "remaining_time": "2:41:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16803, "total_steps": 17941, "loss": 1.6787, "learning_rate": 1.030452933777193e-06, "epoch": 0.93656986790034, "percentage": 93.66, "elapsed_time": "1 day, 15:46:14", "remaining_time": "2:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16804, "total_steps": 17941, "loss": 1.4616, "learning_rate": 1.028655288559821e-06, "epoch": 0.9366256061535031, "percentage": 93.66, "elapsed_time": "1 day, 15:46:22", "remaining_time": "2:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16805, "total_steps": 17941, "loss": 1.5618, "learning_rate": 1.0268591964279707e-06, "epoch": 0.9366813444066663, "percentage": 93.67, "elapsed_time": "1 day, 15:46:31", "remaining_time": "2:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16806, "total_steps": 17941, "loss": 1.5928, "learning_rate": 1.025064657438618e-06, "epoch": 0.9367370826598295, "percentage": 93.67, "elapsed_time": "1 day, 15:46:39", "remaining_time": "2:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16807, "total_steps": 17941, "loss": 1.4486, "learning_rate": 1.0232716716486678e-06, "epoch": 0.9367928209129925, "percentage": 93.68, "elapsed_time": "1 day, 15:46:47", "remaining_time": "2:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16808, "total_steps": 17941, "loss": 1.6045, "learning_rate": 1.0214802391149914e-06, "epoch": 0.9368485591661557, "percentage": 93.68, "elapsed_time": "1 day, 15:46:56", "remaining_time": "2:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16809, "total_steps": 17941, "loss": 1.5062, "learning_rate": 1.0196903598943874e-06, "epoch": 0.9369042974193189, "percentage": 93.69, "elapsed_time": "1 day, 15:47:04", "remaining_time": "2:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16810, "total_steps": 17941, "loss": 1.5983, "learning_rate": 1.0179020340436385e-06, "epoch": 0.936960035672482, "percentage": 93.7, "elapsed_time": "1 day, 15:47:13", "remaining_time": "2:40:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16811, "total_steps": 17941, "loss": 1.5915, "learning_rate": 1.016115261619449e-06, "epoch": 0.9370157739256452, "percentage": 93.7, "elapsed_time": "1 day, 15:47:21", "remaining_time": "2:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16812, "total_steps": 17941, "loss": 1.6147, "learning_rate": 1.0143300426784906e-06, "epoch": 0.9370715121788084, "percentage": 93.71, "elapsed_time": "1 day, 15:47:31", "remaining_time": "2:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16813, "total_steps": 17941, "loss": 1.726, "learning_rate": 1.0125463772773735e-06, "epoch": 0.9371272504319714, "percentage": 93.71, "elapsed_time": "1 day, 15:47:40", "remaining_time": "2:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16814, "total_steps": 17941, "loss": 1.589, "learning_rate": 1.010764265472669e-06, "epoch": 0.9371829886851346, "percentage": 93.72, "elapsed_time": "1 day, 15:47:48", "remaining_time": "2:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16815, "total_steps": 17941, "loss": 1.764, "learning_rate": 1.0089837073208985e-06, "epoch": 0.9372387269382978, "percentage": 93.72, "elapsed_time": "1 day, 15:47:57", "remaining_time": "2:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16816, "total_steps": 17941, "loss": 1.651, "learning_rate": 1.0072047028785224e-06, "epoch": 0.9372944651914609, "percentage": 93.73, "elapsed_time": "1 day, 15:48:05", "remaining_time": "2:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16817, "total_steps": 17941, "loss": 1.5316, "learning_rate": 1.0054272522019626e-06, "epoch": 0.937350203444624, "percentage": 93.74, "elapsed_time": "1 day, 15:48:14", "remaining_time": "2:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16818, "total_steps": 17941, "loss": 1.475, "learning_rate": 1.0036513553476012e-06, "epoch": 0.9374059416977872, "percentage": 93.74, "elapsed_time": "1 day, 15:48:22", "remaining_time": "2:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16819, "total_steps": 17941, "loss": 1.3326, "learning_rate": 1.0018770123717436e-06, "epoch": 0.9374616799509503, "percentage": 93.75, "elapsed_time": "1 day, 15:48:31", "remaining_time": "2:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16820, "total_steps": 17941, "loss": 1.5274, "learning_rate": 1.0001042233306723e-06, "epoch": 0.9375174182041135, "percentage": 93.75, "elapsed_time": "1 day, 15:48:39", "remaining_time": "2:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16821, "total_steps": 17941, "loss": 1.484, "learning_rate": 9.983329882806037e-07, "epoch": 0.9375731564572767, "percentage": 93.76, "elapsed_time": "1 day, 15:48:47", "remaining_time": "2:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16822, "total_steps": 17941, "loss": 1.5763, "learning_rate": 9.965633072777147e-07, "epoch": 0.9376288947104398, "percentage": 93.76, "elapsed_time": "1 day, 15:48:56", "remaining_time": "2:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16823, "total_steps": 17941, "loss": 1.5261, "learning_rate": 9.947951803781274e-07, "epoch": 0.9376846329636029, "percentage": 93.77, "elapsed_time": "1 day, 15:49:04", "remaining_time": "2:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16824, "total_steps": 17941, "loss": 1.6338, "learning_rate": 9.93028607637908e-07, "epoch": 0.9377403712167661, "percentage": 93.77, "elapsed_time": "1 day, 15:49:13", "remaining_time": "2:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16825, "total_steps": 17941, "loss": 1.6033, "learning_rate": 9.91263589113106e-07, "epoch": 0.9377961094699292, "percentage": 93.78, "elapsed_time": "1 day, 15:49:21", "remaining_time": "2:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16826, "total_steps": 17941, "loss": 1.6361, "learning_rate": 9.895001248596714e-07, "epoch": 0.9378518477230924, "percentage": 93.79, "elapsed_time": "1 day, 15:49:30", "remaining_time": "2:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16827, "total_steps": 17941, "loss": 1.6824, "learning_rate": 9.877382149335478e-07, "epoch": 0.9379075859762555, "percentage": 93.79, "elapsed_time": "1 day, 15:49:38", "remaining_time": "2:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16828, "total_steps": 17941, "loss": 1.9127, "learning_rate": 9.859778593906023e-07, "epoch": 0.9379633242294186, "percentage": 93.8, "elapsed_time": "1 day, 15:49:47", "remaining_time": "2:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16829, "total_steps": 17941, "loss": 1.4649, "learning_rate": 9.842190582866672e-07, "epoch": 0.9380190624825818, "percentage": 93.8, "elapsed_time": "1 day, 15:49:55", "remaining_time": "2:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16830, "total_steps": 17941, "loss": 1.6229, "learning_rate": 9.824618116775264e-07, "epoch": 0.9380748007357449, "percentage": 93.81, "elapsed_time": "1 day, 15:50:04", "remaining_time": "2:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16831, "total_steps": 17941, "loss": 1.8311, "learning_rate": 9.807061196189016e-07, "epoch": 0.9381305389889081, "percentage": 93.81, "elapsed_time": "1 day, 15:50:12", "remaining_time": "2:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16832, "total_steps": 17941, "loss": 1.3583, "learning_rate": 9.78951982166476e-07, "epoch": 0.9381862772420713, "percentage": 93.82, "elapsed_time": "1 day, 15:50:21", "remaining_time": "2:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16833, "total_steps": 17941, "loss": 1.5562, "learning_rate": 9.771993993758831e-07, "epoch": 0.9382420154952343, "percentage": 93.82, "elapsed_time": "1 day, 15:50:29", "remaining_time": "2:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16834, "total_steps": 17941, "loss": 1.644, "learning_rate": 9.754483713027063e-07, "epoch": 0.9382977537483975, "percentage": 93.83, "elapsed_time": "1 day, 15:50:38", "remaining_time": "2:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16835, "total_steps": 17941, "loss": 1.5279, "learning_rate": 9.73698898002462e-07, "epoch": 0.9383534920015607, "percentage": 93.84, "elapsed_time": "1 day, 15:50:46", "remaining_time": "2:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16836, "total_steps": 17941, "loss": 1.6109, "learning_rate": 9.719509795306559e-07, "epoch": 0.9384092302547238, "percentage": 93.84, "elapsed_time": "1 day, 15:50:54", "remaining_time": "2:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16837, "total_steps": 17941, "loss": 1.4811, "learning_rate": 9.702046159427104e-07, "epoch": 0.938464968507887, "percentage": 93.85, "elapsed_time": "1 day, 15:51:03", "remaining_time": "2:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16838, "total_steps": 17941, "loss": 1.9212, "learning_rate": 9.684598072940089e-07, "epoch": 0.9385207067610501, "percentage": 93.85, "elapsed_time": "1 day, 15:51:12", "remaining_time": "2:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16839, "total_steps": 17941, "loss": 1.4313, "learning_rate": 9.667165536398904e-07, "epoch": 0.9385764450142132, "percentage": 93.86, "elapsed_time": "1 day, 15:51:20", "remaining_time": "2:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16840, "total_steps": 17941, "loss": 1.5254, "learning_rate": 9.64974855035633e-07, "epoch": 0.9386321832673764, "percentage": 93.86, "elapsed_time": "1 day, 15:51:29", "remaining_time": "2:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16841, "total_steps": 17941, "loss": 1.7144, "learning_rate": 9.632347115364871e-07, "epoch": 0.9386879215205396, "percentage": 93.87, "elapsed_time": "1 day, 15:51:37", "remaining_time": "2:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16842, "total_steps": 17941, "loss": 1.604, "learning_rate": 9.61496123197625e-07, "epoch": 0.9387436597737027, "percentage": 93.87, "elapsed_time": "1 day, 15:51:46", "remaining_time": "2:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16843, "total_steps": 17941, "loss": 1.7027, "learning_rate": 9.597590900741916e-07, "epoch": 0.9387993980268659, "percentage": 93.88, "elapsed_time": "1 day, 15:51:54", "remaining_time": "2:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16844, "total_steps": 17941, "loss": 1.6507, "learning_rate": 9.58023612221287e-07, "epoch": 0.938855136280029, "percentage": 93.89, "elapsed_time": "1 day, 15:52:03", "remaining_time": "2:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16845, "total_steps": 17941, "loss": 1.6674, "learning_rate": 9.562896896939288e-07, "epoch": 0.9389108745331921, "percentage": 93.89, "elapsed_time": "1 day, 15:52:11", "remaining_time": "2:35:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16846, "total_steps": 17941, "loss": 1.7702, "learning_rate": 9.545573225471171e-07, "epoch": 0.9389666127863553, "percentage": 93.9, "elapsed_time": "1 day, 15:52:20", "remaining_time": "2:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16847, "total_steps": 17941, "loss": 1.9243, "learning_rate": 9.528265108357915e-07, "epoch": 0.9390223510395185, "percentage": 93.9, "elapsed_time": "1 day, 15:52:28", "remaining_time": "2:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16848, "total_steps": 17941, "loss": 1.8476, "learning_rate": 9.510972546148522e-07, "epoch": 0.9390780892926816, "percentage": 93.91, "elapsed_time": "1 day, 15:52:37", "remaining_time": "2:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16849, "total_steps": 17941, "loss": 1.6859, "learning_rate": 9.493695539391278e-07, "epoch": 0.9391338275458447, "percentage": 93.91, "elapsed_time": "1 day, 15:52:45", "remaining_time": "2:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16850, "total_steps": 17941, "loss": 1.5396, "learning_rate": 9.476434088634078e-07, "epoch": 0.9391895657990078, "percentage": 93.92, "elapsed_time": "1 day, 15:52:54", "remaining_time": "2:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16851, "total_steps": 17941, "loss": 1.6498, "learning_rate": 9.459188194424595e-07, "epoch": 0.939245304052171, "percentage": 93.92, "elapsed_time": "1 day, 15:53:02", "remaining_time": "2:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16852, "total_steps": 17941, "loss": 1.6658, "learning_rate": 9.441957857309502e-07, "epoch": 0.9393010423053342, "percentage": 93.93, "elapsed_time": "1 day, 15:53:10", "remaining_time": "2:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16853, "total_steps": 17941, "loss": 1.2825, "learning_rate": 9.424743077835363e-07, "epoch": 0.9393567805584973, "percentage": 93.94, "elapsed_time": "1 day, 15:53:19", "remaining_time": "2:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16854, "total_steps": 17941, "loss": 1.8969, "learning_rate": 9.407543856548185e-07, "epoch": 0.9394125188116604, "percentage": 93.94, "elapsed_time": "1 day, 15:53:27", "remaining_time": "2:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16855, "total_steps": 17941, "loss": 1.6525, "learning_rate": 9.390360193993309e-07, "epoch": 0.9394682570648236, "percentage": 93.95, "elapsed_time": "1 day, 15:53:36", "remaining_time": "2:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16856, "total_steps": 17941, "loss": 1.7488, "learning_rate": 9.373192090715799e-07, "epoch": 0.9395239953179867, "percentage": 93.95, "elapsed_time": "1 day, 15:53:44", "remaining_time": "2:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16857, "total_steps": 17941, "loss": 1.4556, "learning_rate": 9.356039547260054e-07, "epoch": 0.9395797335711499, "percentage": 93.96, "elapsed_time": "1 day, 15:53:53", "remaining_time": "2:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16858, "total_steps": 17941, "loss": 1.6622, "learning_rate": 9.338902564170027e-07, "epoch": 0.9396354718243131, "percentage": 93.96, "elapsed_time": "1 day, 15:54:01", "remaining_time": "2:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16859, "total_steps": 17941, "loss": 1.3895, "learning_rate": 9.321781141989339e-07, "epoch": 0.9396912100774761, "percentage": 93.97, "elapsed_time": "1 day, 15:54:09", "remaining_time": "2:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16860, "total_steps": 17941, "loss": 1.6764, "learning_rate": 9.304675281260889e-07, "epoch": 0.9397469483306393, "percentage": 93.97, "elapsed_time": "1 day, 15:54:18", "remaining_time": "2:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16861, "total_steps": 17941, "loss": 1.4854, "learning_rate": 9.287584982527131e-07, "epoch": 0.9398026865838025, "percentage": 93.98, "elapsed_time": "1 day, 15:54:27", "remaining_time": "2:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16862, "total_steps": 17941, "loss": 1.6977, "learning_rate": 9.270510246330188e-07, "epoch": 0.9398584248369656, "percentage": 93.99, "elapsed_time": "1 day, 15:54:35", "remaining_time": "2:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16863, "total_steps": 17941, "loss": 1.5387, "learning_rate": 9.253451073211517e-07, "epoch": 0.9399141630901288, "percentage": 93.99, "elapsed_time": "1 day, 15:54:43", "remaining_time": "2:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16864, "total_steps": 17941, "loss": 1.6416, "learning_rate": 9.236407463712071e-07, "epoch": 0.939969901343292, "percentage": 94.0, "elapsed_time": "1 day, 15:54:52", "remaining_time": "2:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16865, "total_steps": 17941, "loss": 1.722, "learning_rate": 9.219379418372476e-07, "epoch": 0.940025639596455, "percentage": 94.0, "elapsed_time": "1 day, 15:55:00", "remaining_time": "2:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16866, "total_steps": 17941, "loss": 1.5153, "learning_rate": 9.202366937732687e-07, "epoch": 0.9400813778496182, "percentage": 94.01, "elapsed_time": "1 day, 15:55:09", "remaining_time": "2:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16867, "total_steps": 17941, "loss": 1.6314, "learning_rate": 9.185370022332274e-07, "epoch": 0.9401371161027814, "percentage": 94.01, "elapsed_time": "1 day, 15:55:17", "remaining_time": "2:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16868, "total_steps": 17941, "loss": 1.9229, "learning_rate": 9.168388672710248e-07, "epoch": 0.9401928543559445, "percentage": 94.02, "elapsed_time": "1 day, 15:55:26", "remaining_time": "2:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16869, "total_steps": 17941, "loss": 1.6497, "learning_rate": 9.151422889405237e-07, "epoch": 0.9402485926091076, "percentage": 94.02, "elapsed_time": "1 day, 15:55:34", "remaining_time": "2:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16870, "total_steps": 17941, "loss": 1.4396, "learning_rate": 9.134472672955252e-07, "epoch": 0.9403043308622708, "percentage": 94.03, "elapsed_time": "1 day, 15:55:43", "remaining_time": "2:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16871, "total_steps": 17941, "loss": 1.6452, "learning_rate": 9.117538023897809e-07, "epoch": 0.9403600691154339, "percentage": 94.04, "elapsed_time": "1 day, 15:55:51", "remaining_time": "2:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16872, "total_steps": 17941, "loss": 1.6783, "learning_rate": 9.100618942770034e-07, "epoch": 0.9404158073685971, "percentage": 94.04, "elapsed_time": "1 day, 15:55:59", "remaining_time": "2:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16873, "total_steps": 17941, "loss": 1.4322, "learning_rate": 9.083715430108497e-07, "epoch": 0.9404715456217602, "percentage": 94.05, "elapsed_time": "1 day, 15:56:08", "remaining_time": "2:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16874, "total_steps": 17941, "loss": 1.6379, "learning_rate": 9.06682748644927e-07, "epoch": 0.9405272838749233, "percentage": 94.05, "elapsed_time": "1 day, 15:56:16", "remaining_time": "2:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16875, "total_steps": 17941, "loss": 1.7436, "learning_rate": 9.049955112327923e-07, "epoch": 0.9405830221280865, "percentage": 94.06, "elapsed_time": "1 day, 15:56:25", "remaining_time": "2:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16876, "total_steps": 17941, "loss": 1.5094, "learning_rate": 9.033098308279475e-07, "epoch": 0.9406387603812496, "percentage": 94.06, "elapsed_time": "1 day, 15:56:33", "remaining_time": "2:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16877, "total_steps": 17941, "loss": 1.5522, "learning_rate": 9.016257074838775e-07, "epoch": 0.9406944986344128, "percentage": 94.07, "elapsed_time": "1 day, 15:56:42", "remaining_time": "2:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16878, "total_steps": 17941, "loss": 1.5814, "learning_rate": 8.999431412539672e-07, "epoch": 0.940750236887576, "percentage": 94.08, "elapsed_time": "1 day, 15:56:51", "remaining_time": "2:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16879, "total_steps": 17941, "loss": 1.7722, "learning_rate": 8.982621321915852e-07, "epoch": 0.940805975140739, "percentage": 94.08, "elapsed_time": "1 day, 15:56:59", "remaining_time": "2:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16880, "total_steps": 17941, "loss": 1.2975, "learning_rate": 8.965826803500499e-07, "epoch": 0.9408617133939022, "percentage": 94.09, "elapsed_time": "1 day, 15:57:08", "remaining_time": "2:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16881, "total_steps": 17941, "loss": 1.7634, "learning_rate": 8.949047857826242e-07, "epoch": 0.9409174516470654, "percentage": 94.09, "elapsed_time": "1 day, 15:57:16", "remaining_time": "2:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16882, "total_steps": 17941, "loss": 1.6529, "learning_rate": 8.932284485425102e-07, "epoch": 0.9409731899002285, "percentage": 94.1, "elapsed_time": "1 day, 15:57:25", "remaining_time": "2:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16883, "total_steps": 17941, "loss": 1.6217, "learning_rate": 8.915536686828763e-07, "epoch": 0.9410289281533917, "percentage": 94.1, "elapsed_time": "1 day, 15:57:33", "remaining_time": "2:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16884, "total_steps": 17941, "loss": 1.8195, "learning_rate": 8.898804462568355e-07, "epoch": 0.9410846664065549, "percentage": 94.11, "elapsed_time": "1 day, 15:57:42", "remaining_time": "2:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16885, "total_steps": 17941, "loss": 1.6975, "learning_rate": 8.882087813174622e-07, "epoch": 0.9411404046597179, "percentage": 94.11, "elapsed_time": "1 day, 15:57:50", "remaining_time": "2:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16886, "total_steps": 17941, "loss": 1.6651, "learning_rate": 8.865386739177639e-07, "epoch": 0.9411961429128811, "percentage": 94.12, "elapsed_time": "1 day, 15:57:59", "remaining_time": "2:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16887, "total_steps": 17941, "loss": 1.8084, "learning_rate": 8.848701241106982e-07, "epoch": 0.9412518811660443, "percentage": 94.13, "elapsed_time": "1 day, 15:58:07", "remaining_time": "2:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16888, "total_steps": 17941, "loss": 1.5518, "learning_rate": 8.832031319492007e-07, "epoch": 0.9413076194192074, "percentage": 94.13, "elapsed_time": "1 day, 15:58:16", "remaining_time": "2:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16889, "total_steps": 17941, "loss": 1.6356, "learning_rate": 8.815376974861289e-07, "epoch": 0.9413633576723706, "percentage": 94.14, "elapsed_time": "1 day, 15:58:24", "remaining_time": "2:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16890, "total_steps": 17941, "loss": 1.6015, "learning_rate": 8.798738207742963e-07, "epoch": 0.9414190959255337, "percentage": 94.14, "elapsed_time": "1 day, 15:58:32", "remaining_time": "2:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16891, "total_steps": 17941, "loss": 1.5823, "learning_rate": 8.782115018664771e-07, "epoch": 0.9414748341786968, "percentage": 94.15, "elapsed_time": "1 day, 15:58:41", "remaining_time": "2:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16892, "total_steps": 17941, "loss": 1.5989, "learning_rate": 8.765507408153906e-07, "epoch": 0.94153057243186, "percentage": 94.15, "elapsed_time": "1 day, 15:58:49", "remaining_time": "2:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16893, "total_steps": 17941, "loss": 1.8058, "learning_rate": 8.748915376737054e-07, "epoch": 0.9415863106850232, "percentage": 94.16, "elapsed_time": "1 day, 15:58:58", "remaining_time": "2:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16894, "total_steps": 17941, "loss": 1.617, "learning_rate": 8.732338924940353e-07, "epoch": 0.9416420489381863, "percentage": 94.16, "elapsed_time": "1 day, 15:59:06", "remaining_time": "2:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16895, "total_steps": 17941, "loss": 1.554, "learning_rate": 8.715778053289603e-07, "epoch": 0.9416977871913494, "percentage": 94.17, "elapsed_time": "1 day, 15:59:15", "remaining_time": "2:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16896, "total_steps": 17941, "loss": 1.5602, "learning_rate": 8.69923276231005e-07, "epoch": 0.9417535254445125, "percentage": 94.18, "elapsed_time": "1 day, 15:59:23", "remaining_time": "2:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16897, "total_steps": 17941, "loss": 1.7909, "learning_rate": 8.682703052526331e-07, "epoch": 0.9418092636976757, "percentage": 94.18, "elapsed_time": "1 day, 15:59:32", "remaining_time": "2:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16898, "total_steps": 17941, "loss": 1.5703, "learning_rate": 8.666188924462637e-07, "epoch": 0.9418650019508389, "percentage": 94.19, "elapsed_time": "1 day, 15:59:40", "remaining_time": "2:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16899, "total_steps": 17941, "loss": 1.4395, "learning_rate": 8.649690378642772e-07, "epoch": 0.941920740204002, "percentage": 94.19, "elapsed_time": "1 day, 15:59:49", "remaining_time": "2:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16900, "total_steps": 17941, "loss": 1.478, "learning_rate": 8.633207415590039e-07, "epoch": 0.9419764784571651, "percentage": 94.2, "elapsed_time": "1 day, 15:59:57", "remaining_time": "2:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16901, "total_steps": 17941, "loss": 1.8977, "learning_rate": 8.61674003582702e-07, "epoch": 0.9420322167103283, "percentage": 94.2, "elapsed_time": "1 day, 16:00:06", "remaining_time": "2:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16902, "total_steps": 17941, "loss": 1.522, "learning_rate": 8.60028823987602e-07, "epoch": 0.9420879549634914, "percentage": 94.21, "elapsed_time": "1 day, 16:00:15", "remaining_time": "2:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16903, "total_steps": 17941, "loss": 1.6179, "learning_rate": 8.583852028258899e-07, "epoch": 0.9421436932166546, "percentage": 94.21, "elapsed_time": "1 day, 16:00:23", "remaining_time": "2:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16904, "total_steps": 17941, "loss": 1.3213, "learning_rate": 8.567431401496795e-07, "epoch": 0.9421994314698178, "percentage": 94.22, "elapsed_time": "1 day, 16:00:32", "remaining_time": "2:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16905, "total_steps": 17941, "loss": 1.421, "learning_rate": 8.551026360110458e-07, "epoch": 0.9422551697229808, "percentage": 94.23, "elapsed_time": "1 day, 16:00:40", "remaining_time": "2:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16906, "total_steps": 17941, "loss": 1.5467, "learning_rate": 8.534636904620308e-07, "epoch": 0.942310907976144, "percentage": 94.23, "elapsed_time": "1 day, 16:00:49", "remaining_time": "2:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16907, "total_steps": 17941, "loss": 1.7246, "learning_rate": 8.518263035546037e-07, "epoch": 0.9423666462293072, "percentage": 94.24, "elapsed_time": "1 day, 16:00:57", "remaining_time": "2:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16908, "total_steps": 17941, "loss": 1.5566, "learning_rate": 8.501904753406898e-07, "epoch": 0.9424223844824703, "percentage": 94.24, "elapsed_time": "1 day, 16:01:06", "remaining_time": "2:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16909, "total_steps": 17941, "loss": 1.5759, "learning_rate": 8.485562058721641e-07, "epoch": 0.9424781227356335, "percentage": 94.25, "elapsed_time": "1 day, 16:01:14", "remaining_time": "2:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16910, "total_steps": 17941, "loss": 1.6642, "learning_rate": 8.469234952008687e-07, "epoch": 0.9425338609887967, "percentage": 94.25, "elapsed_time": "1 day, 16:01:23", "remaining_time": "2:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16911, "total_steps": 17941, "loss": 1.6105, "learning_rate": 8.452923433785787e-07, "epoch": 0.9425895992419597, "percentage": 94.26, "elapsed_time": "1 day, 16:01:31", "remaining_time": "2:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16912, "total_steps": 17941, "loss": 1.455, "learning_rate": 8.436627504570249e-07, "epoch": 0.9426453374951229, "percentage": 94.26, "elapsed_time": "1 day, 16:01:40", "remaining_time": "2:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16913, "total_steps": 17941, "loss": 1.5826, "learning_rate": 8.420347164878828e-07, "epoch": 0.9427010757482861, "percentage": 94.27, "elapsed_time": "1 day, 16:01:49", "remaining_time": "2:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16914, "total_steps": 17941, "loss": 1.5373, "learning_rate": 8.404082415227887e-07, "epoch": 0.9427568140014492, "percentage": 94.28, "elapsed_time": "1 day, 16:01:57", "remaining_time": "2:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16915, "total_steps": 17941, "loss": 1.5081, "learning_rate": 8.387833256133292e-07, "epoch": 0.9428125522546124, "percentage": 94.28, "elapsed_time": "1 day, 16:02:06", "remaining_time": "2:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16916, "total_steps": 17941, "loss": 1.7214, "learning_rate": 8.371599688110299e-07, "epoch": 0.9428682905077755, "percentage": 94.29, "elapsed_time": "1 day, 16:02:14", "remaining_time": "2:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16917, "total_steps": 17941, "loss": 1.571, "learning_rate": 8.355381711673771e-07, "epoch": 0.9429240287609386, "percentage": 94.29, "elapsed_time": "1 day, 16:02:22", "remaining_time": "2:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16918, "total_steps": 17941, "loss": 1.4953, "learning_rate": 8.339179327338076e-07, "epoch": 0.9429797670141018, "percentage": 94.3, "elapsed_time": "1 day, 16:02:31", "remaining_time": "2:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16919, "total_steps": 17941, "loss": 1.7961, "learning_rate": 8.322992535617025e-07, "epoch": 0.9430355052672649, "percentage": 94.3, "elapsed_time": "1 day, 16:02:39", "remaining_time": "2:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16920, "total_steps": 17941, "loss": 1.8401, "learning_rate": 8.306821337023929e-07, "epoch": 0.9430912435204281, "percentage": 94.31, "elapsed_time": "1 day, 16:02:48", "remaining_time": "2:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16921, "total_steps": 17941, "loss": 1.4785, "learning_rate": 8.290665732071711e-07, "epoch": 0.9431469817735912, "percentage": 94.31, "elapsed_time": "1 day, 16:02:56", "remaining_time": "2:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16922, "total_steps": 17941, "loss": 1.7048, "learning_rate": 8.274525721272741e-07, "epoch": 0.9432027200267543, "percentage": 94.32, "elapsed_time": "1 day, 16:03:05", "remaining_time": "2:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16923, "total_steps": 17941, "loss": 1.508, "learning_rate": 8.258401305138885e-07, "epoch": 0.9432584582799175, "percentage": 94.33, "elapsed_time": "1 day, 16:03:13", "remaining_time": "2:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16924, "total_steps": 17941, "loss": 1.4915, "learning_rate": 8.242292484181402e-07, "epoch": 0.9433141965330807, "percentage": 94.33, "elapsed_time": "1 day, 16:03:21", "remaining_time": "2:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16925, "total_steps": 17941, "loss": 1.6707, "learning_rate": 8.226199258911327e-07, "epoch": 0.9433699347862438, "percentage": 94.34, "elapsed_time": "1 day, 16:03:30", "remaining_time": "2:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16926, "total_steps": 17941, "loss": 1.5004, "learning_rate": 8.210121629838918e-07, "epoch": 0.9434256730394069, "percentage": 94.34, "elapsed_time": "1 day, 16:03:38", "remaining_time": "2:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16927, "total_steps": 17941, "loss": 1.5514, "learning_rate": 8.194059597474158e-07, "epoch": 0.9434814112925701, "percentage": 94.35, "elapsed_time": "1 day, 16:03:47", "remaining_time": "2:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16928, "total_steps": 17941, "loss": 1.7864, "learning_rate": 8.178013162326359e-07, "epoch": 0.9435371495457332, "percentage": 94.35, "elapsed_time": "1 day, 16:03:55", "remaining_time": "2:23:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16929, "total_steps": 17941, "loss": 1.64, "learning_rate": 8.161982324904505e-07, "epoch": 0.9435928877988964, "percentage": 94.36, "elapsed_time": "1 day, 16:04:04", "remaining_time": "2:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16930, "total_steps": 17941, "loss": 1.6564, "learning_rate": 8.14596708571691e-07, "epoch": 0.9436486260520596, "percentage": 94.36, "elapsed_time": "1 day, 16:04:12", "remaining_time": "2:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16931, "total_steps": 17941, "loss": 1.6213, "learning_rate": 8.129967445271558e-07, "epoch": 0.9437043643052226, "percentage": 94.37, "elapsed_time": "1 day, 16:04:21", "remaining_time": "2:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16932, "total_steps": 17941, "loss": 1.7619, "learning_rate": 8.11398340407582e-07, "epoch": 0.9437601025583858, "percentage": 94.38, "elapsed_time": "1 day, 16:04:29", "remaining_time": "2:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16933, "total_steps": 17941, "loss": 1.7034, "learning_rate": 8.09801496263668e-07, "epoch": 0.943815840811549, "percentage": 94.38, "elapsed_time": "1 day, 16:04:38", "remaining_time": "2:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16934, "total_steps": 17941, "loss": 1.632, "learning_rate": 8.08206212146051e-07, "epoch": 0.9438715790647121, "percentage": 94.39, "elapsed_time": "1 day, 16:04:46", "remaining_time": "2:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16935, "total_steps": 17941, "loss": 1.6041, "learning_rate": 8.066124881053183e-07, "epoch": 0.9439273173178753, "percentage": 94.39, "elapsed_time": "1 day, 16:04:54", "remaining_time": "2:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16936, "total_steps": 17941, "loss": 1.5342, "learning_rate": 8.05020324192024e-07, "epoch": 0.9439830555710385, "percentage": 94.4, "elapsed_time": "1 day, 16:05:03", "remaining_time": "2:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16937, "total_steps": 17941, "loss": 1.8362, "learning_rate": 8.03429720456661e-07, "epoch": 0.9440387938242015, "percentage": 94.4, "elapsed_time": "1 day, 16:05:11", "remaining_time": "2:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16938, "total_steps": 17941, "loss": 1.7253, "learning_rate": 8.018406769496722e-07, "epoch": 0.9440945320773647, "percentage": 94.41, "elapsed_time": "1 day, 16:05:20", "remaining_time": "2:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16939, "total_steps": 17941, "loss": 1.7858, "learning_rate": 8.002531937214452e-07, "epoch": 0.9441502703305279, "percentage": 94.42, "elapsed_time": "1 day, 16:05:28", "remaining_time": "2:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16940, "total_steps": 17941, "loss": 1.6108, "learning_rate": 7.986672708223341e-07, "epoch": 0.944206008583691, "percentage": 94.42, "elapsed_time": "1 day, 16:05:37", "remaining_time": "2:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16941, "total_steps": 17941, "loss": 1.4481, "learning_rate": 7.970829083026377e-07, "epoch": 0.9442617468368542, "percentage": 94.43, "elapsed_time": "1 day, 16:05:45", "remaining_time": "2:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16942, "total_steps": 17941, "loss": 1.8286, "learning_rate": 7.955001062125988e-07, "epoch": 0.9443174850900172, "percentage": 94.43, "elapsed_time": "1 day, 16:05:54", "remaining_time": "2:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16943, "total_steps": 17941, "loss": 1.6667, "learning_rate": 7.93918864602411e-07, "epoch": 0.9443732233431804, "percentage": 94.44, "elapsed_time": "1 day, 16:06:02", "remaining_time": "2:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16944, "total_steps": 17941, "loss": 1.6067, "learning_rate": 7.923391835222227e-07, "epoch": 0.9444289615963436, "percentage": 94.44, "elapsed_time": "1 day, 16:06:10", "remaining_time": "2:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16945, "total_steps": 17941, "loss": 1.7842, "learning_rate": 7.90761063022144e-07, "epoch": 0.9444846998495067, "percentage": 94.45, "elapsed_time": "1 day, 16:06:19", "remaining_time": "2:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16946, "total_steps": 17941, "loss": 1.7356, "learning_rate": 7.891845031522072e-07, "epoch": 0.9445404381026699, "percentage": 94.45, "elapsed_time": "1 day, 16:06:27", "remaining_time": "2:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16947, "total_steps": 17941, "loss": 1.3916, "learning_rate": 7.876095039624165e-07, "epoch": 0.944596176355833, "percentage": 94.46, "elapsed_time": "1 day, 16:06:36", "remaining_time": "2:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16948, "total_steps": 17941, "loss": 1.732, "learning_rate": 7.860360655027377e-07, "epoch": 0.9446519146089961, "percentage": 94.47, "elapsed_time": "1 day, 16:06:44", "remaining_time": "2:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16949, "total_steps": 17941, "loss": 1.6551, "learning_rate": 7.844641878230474e-07, "epoch": 0.9447076528621593, "percentage": 94.47, "elapsed_time": "1 day, 16:06:53", "remaining_time": "2:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16950, "total_steps": 17941, "loss": 1.4815, "learning_rate": 7.828938709732059e-07, "epoch": 0.9447633911153225, "percentage": 94.48, "elapsed_time": "1 day, 16:07:01", "remaining_time": "2:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16951, "total_steps": 17941, "loss": 1.5795, "learning_rate": 7.813251150030176e-07, "epoch": 0.9448191293684856, "percentage": 94.48, "elapsed_time": "1 day, 16:07:10", "remaining_time": "2:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16952, "total_steps": 17941, "loss": 1.7019, "learning_rate": 7.797579199622318e-07, "epoch": 0.9448748676216487, "percentage": 94.49, "elapsed_time": "1 day, 16:07:18", "remaining_time": "2:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16953, "total_steps": 17941, "loss": 1.5984, "learning_rate": 7.78192285900553e-07, "epoch": 0.9449306058748119, "percentage": 94.49, "elapsed_time": "1 day, 16:07:26", "remaining_time": "2:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16954, "total_steps": 17941, "loss": 1.6128, "learning_rate": 7.76628212867625e-07, "epoch": 0.944986344127975, "percentage": 94.5, "elapsed_time": "1 day, 16:07:35", "remaining_time": "2:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16955, "total_steps": 17941, "loss": 1.7367, "learning_rate": 7.750657009130635e-07, "epoch": 0.9450420823811382, "percentage": 94.5, "elapsed_time": "1 day, 16:07:43", "remaining_time": "2:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16956, "total_steps": 17941, "loss": 1.4785, "learning_rate": 7.735047500864179e-07, "epoch": 0.9450978206343014, "percentage": 94.51, "elapsed_time": "1 day, 16:07:52", "remaining_time": "2:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16957, "total_steps": 17941, "loss": 1.5787, "learning_rate": 7.719453604371874e-07, "epoch": 0.9451535588874644, "percentage": 94.52, "elapsed_time": "1 day, 16:08:00", "remaining_time": "2:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16958, "total_steps": 17941, "loss": 1.9061, "learning_rate": 7.703875320148323e-07, "epoch": 0.9452092971406276, "percentage": 94.52, "elapsed_time": "1 day, 16:08:09", "remaining_time": "2:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16959, "total_steps": 17941, "loss": 1.681, "learning_rate": 7.688312648687579e-07, "epoch": 0.9452650353937908, "percentage": 94.53, "elapsed_time": "1 day, 16:08:17", "remaining_time": "2:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16960, "total_steps": 17941, "loss": 1.6794, "learning_rate": 7.672765590483133e-07, "epoch": 0.9453207736469539, "percentage": 94.53, "elapsed_time": "1 day, 16:08:26", "remaining_time": "2:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16961, "total_steps": 17941, "loss": 1.6617, "learning_rate": 7.657234146028092e-07, "epoch": 0.9453765119001171, "percentage": 94.54, "elapsed_time": "1 day, 16:08:34", "remaining_time": "2:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16962, "total_steps": 17941, "loss": 1.5476, "learning_rate": 7.641718315815116e-07, "epoch": 0.9454322501532803, "percentage": 94.54, "elapsed_time": "1 day, 16:08:42", "remaining_time": "2:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16963, "total_steps": 17941, "loss": 1.9378, "learning_rate": 7.626218100336091e-07, "epoch": 0.9454879884064433, "percentage": 94.55, "elapsed_time": "1 day, 16:08:51", "remaining_time": "2:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16964, "total_steps": 17941, "loss": 1.3775, "learning_rate": 7.610733500082789e-07, "epoch": 0.9455437266596065, "percentage": 94.55, "elapsed_time": "1 day, 16:08:59", "remaining_time": "2:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16965, "total_steps": 17941, "loss": 1.6954, "learning_rate": 7.595264515546097e-07, "epoch": 0.9455994649127696, "percentage": 94.56, "elapsed_time": "1 day, 16:09:08", "remaining_time": "2:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16966, "total_steps": 17941, "loss": 1.6822, "learning_rate": 7.579811147216731e-07, "epoch": 0.9456552031659328, "percentage": 94.57, "elapsed_time": "1 day, 16:09:16", "remaining_time": "2:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16967, "total_steps": 17941, "loss": 1.6487, "learning_rate": 7.564373395584745e-07, "epoch": 0.945710941419096, "percentage": 94.57, "elapsed_time": "1 day, 16:09:25", "remaining_time": "2:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16968, "total_steps": 17941, "loss": 1.552, "learning_rate": 7.548951261139747e-07, "epoch": 0.945766679672259, "percentage": 94.58, "elapsed_time": "1 day, 16:09:33", "remaining_time": "2:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16969, "total_steps": 17941, "loss": 1.5766, "learning_rate": 7.53354474437079e-07, "epoch": 0.9458224179254222, "percentage": 94.58, "elapsed_time": "1 day, 16:09:41", "remaining_time": "2:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16970, "total_steps": 17941, "loss": 1.519, "learning_rate": 7.51815384576654e-07, "epoch": 0.9458781561785854, "percentage": 94.59, "elapsed_time": "1 day, 16:09:50", "remaining_time": "2:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16971, "total_steps": 17941, "loss": 1.4053, "learning_rate": 7.502778565815105e-07, "epoch": 0.9459338944317485, "percentage": 94.59, "elapsed_time": "1 day, 16:09:58", "remaining_time": "2:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16972, "total_steps": 17941, "loss": 1.5938, "learning_rate": 7.48741890500404e-07, "epoch": 0.9459896326849117, "percentage": 94.6, "elapsed_time": "1 day, 16:10:07", "remaining_time": "2:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16973, "total_steps": 17941, "loss": 1.7217, "learning_rate": 7.472074863820511e-07, "epoch": 0.9460453709380748, "percentage": 94.6, "elapsed_time": "1 day, 16:10:15", "remaining_time": "2:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16974, "total_steps": 17941, "loss": 1.5028, "learning_rate": 7.456746442751129e-07, "epoch": 0.9461011091912379, "percentage": 94.61, "elapsed_time": "1 day, 16:10:24", "remaining_time": "2:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16975, "total_steps": 17941, "loss": 1.5843, "learning_rate": 7.441433642282059e-07, "epoch": 0.9461568474444011, "percentage": 94.62, "elapsed_time": "1 day, 16:10:32", "remaining_time": "2:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16976, "total_steps": 17941, "loss": 1.456, "learning_rate": 7.426136462898859e-07, "epoch": 0.9462125856975643, "percentage": 94.62, "elapsed_time": "1 day, 16:10:41", "remaining_time": "2:17:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16977, "total_steps": 17941, "loss": 1.654, "learning_rate": 7.410854905086695e-07, "epoch": 0.9462683239507274, "percentage": 94.63, "elapsed_time": "1 day, 16:10:49", "remaining_time": "2:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16978, "total_steps": 17941, "loss": 1.5899, "learning_rate": 7.395588969330292e-07, "epoch": 0.9463240622038905, "percentage": 94.63, "elapsed_time": "1 day, 16:10:57", "remaining_time": "2:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16979, "total_steps": 17941, "loss": 1.6535, "learning_rate": 7.38033865611365e-07, "epoch": 0.9463798004570537, "percentage": 94.64, "elapsed_time": "1 day, 16:11:06", "remaining_time": "2:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16980, "total_steps": 17941, "loss": 1.5952, "learning_rate": 7.365103965920439e-07, "epoch": 0.9464355387102168, "percentage": 94.64, "elapsed_time": "1 day, 16:11:14", "remaining_time": "2:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16981, "total_steps": 17941, "loss": 1.6768, "learning_rate": 7.349884899233994e-07, "epoch": 0.94649127696338, "percentage": 94.65, "elapsed_time": "1 day, 16:11:23", "remaining_time": "2:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16982, "total_steps": 17941, "loss": 1.7187, "learning_rate": 7.334681456536818e-07, "epoch": 0.9465470152165432, "percentage": 94.65, "elapsed_time": "1 day, 16:11:31", "remaining_time": "2:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16983, "total_steps": 17941, "loss": 1.6883, "learning_rate": 7.319493638311082e-07, "epoch": 0.9466027534697062, "percentage": 94.66, "elapsed_time": "1 day, 16:11:40", "remaining_time": "2:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16984, "total_steps": 17941, "loss": 1.2998, "learning_rate": 7.304321445038453e-07, "epoch": 0.9466584917228694, "percentage": 94.67, "elapsed_time": "1 day, 16:11:48", "remaining_time": "2:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16985, "total_steps": 17941, "loss": 1.7541, "learning_rate": 7.289164877200216e-07, "epoch": 0.9467142299760326, "percentage": 94.67, "elapsed_time": "1 day, 16:11:56", "remaining_time": "2:15:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16986, "total_steps": 17941, "loss": 1.6901, "learning_rate": 7.27402393527693e-07, "epoch": 0.9467699682291957, "percentage": 94.68, "elapsed_time": "1 day, 16:12:05", "remaining_time": "2:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16987, "total_steps": 17941, "loss": 1.3803, "learning_rate": 7.258898619748767e-07, "epoch": 0.9468257064823589, "percentage": 94.68, "elapsed_time": "1 day, 16:12:13", "remaining_time": "2:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16988, "total_steps": 17941, "loss": 1.6025, "learning_rate": 7.243788931095508e-07, "epoch": 0.9468814447355219, "percentage": 94.69, "elapsed_time": "1 day, 16:12:22", "remaining_time": "2:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16989, "total_steps": 17941, "loss": 1.5792, "learning_rate": 7.228694869796271e-07, "epoch": 0.9469371829886851, "percentage": 94.69, "elapsed_time": "1 day, 16:12:30", "remaining_time": "2:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16990, "total_steps": 17941, "loss": 1.8059, "learning_rate": 7.21361643632984e-07, "epoch": 0.9469929212418483, "percentage": 94.7, "elapsed_time": "1 day, 16:12:39", "remaining_time": "2:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16991, "total_steps": 17941, "loss": 1.9646, "learning_rate": 7.198553631174221e-07, "epoch": 0.9470486594950114, "percentage": 94.7, "elapsed_time": "1 day, 16:12:48", "remaining_time": "2:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16992, "total_steps": 17941, "loss": 1.7726, "learning_rate": 7.183506454807365e-07, "epoch": 0.9471043977481746, "percentage": 94.71, "elapsed_time": "1 day, 16:12:56", "remaining_time": "2:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16993, "total_steps": 17941, "loss": 1.645, "learning_rate": 7.168474907706335e-07, "epoch": 0.9471601360013377, "percentage": 94.72, "elapsed_time": "1 day, 16:13:05", "remaining_time": "2:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16994, "total_steps": 17941, "loss": 1.4872, "learning_rate": 7.153458990347861e-07, "epoch": 0.9472158742545008, "percentage": 94.72, "elapsed_time": "1 day, 16:13:13", "remaining_time": "2:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16995, "total_steps": 17941, "loss": 1.6738, "learning_rate": 7.138458703208173e-07, "epoch": 0.947271612507664, "percentage": 94.73, "elapsed_time": "1 day, 16:13:22", "remaining_time": "2:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16996, "total_steps": 17941, "loss": 1.7239, "learning_rate": 7.123474046763002e-07, "epoch": 0.9473273507608272, "percentage": 94.73, "elapsed_time": "1 day, 16:13:30", "remaining_time": "2:14:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16997, "total_steps": 17941, "loss": 1.6759, "learning_rate": 7.108505021487577e-07, "epoch": 0.9473830890139903, "percentage": 94.74, "elapsed_time": "1 day, 16:13:39", "remaining_time": "2:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16998, "total_steps": 17941, "loss": 1.5727, "learning_rate": 7.093551627856576e-07, "epoch": 0.9474388272671534, "percentage": 94.74, "elapsed_time": "1 day, 16:13:48", "remaining_time": "2:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16999, "total_steps": 17941, "loss": 1.6551, "learning_rate": 7.078613866344286e-07, "epoch": 0.9474945655203166, "percentage": 94.75, "elapsed_time": "1 day, 16:13:57", "remaining_time": "2:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17000, "total_steps": 17941, "loss": 1.4096, "learning_rate": 7.063691737424494e-07, "epoch": 0.9475503037734797, "percentage": 94.76, "elapsed_time": "1 day, 16:14:05", "remaining_time": "2:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17001, "total_steps": 17941, "loss": 1.5989, "learning_rate": 7.048785241570321e-07, "epoch": 0.9476060420266429, "percentage": 94.76, "elapsed_time": "1 day, 16:14:14", "remaining_time": "2:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17002, "total_steps": 17941, "loss": 1.4911, "learning_rate": 7.033894379254557e-07, "epoch": 0.9476617802798061, "percentage": 94.77, "elapsed_time": "1 day, 16:14:22", "remaining_time": "2:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17003, "total_steps": 17941, "loss": 1.6911, "learning_rate": 7.019019150949546e-07, "epoch": 0.9477175185329691, "percentage": 94.77, "elapsed_time": "1 day, 16:14:31", "remaining_time": "2:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17004, "total_steps": 17941, "loss": 1.3522, "learning_rate": 7.00415955712691e-07, "epoch": 0.9477732567861323, "percentage": 94.78, "elapsed_time": "1 day, 16:14:40", "remaining_time": "2:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17005, "total_steps": 17941, "loss": 1.6699, "learning_rate": 6.989315598257995e-07, "epoch": 0.9478289950392955, "percentage": 94.78, "elapsed_time": "1 day, 16:14:48", "remaining_time": "2:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17006, "total_steps": 17941, "loss": 1.6929, "learning_rate": 6.974487274813479e-07, "epoch": 0.9478847332924586, "percentage": 94.79, "elapsed_time": "1 day, 16:14:56", "remaining_time": "2:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17007, "total_steps": 17941, "loss": 1.6404, "learning_rate": 6.959674587263765e-07, "epoch": 0.9479404715456218, "percentage": 94.79, "elapsed_time": "1 day, 16:15:05", "remaining_time": "2:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17008, "total_steps": 17941, "loss": 1.5798, "learning_rate": 6.944877536078531e-07, "epoch": 0.947996209798785, "percentage": 94.8, "elapsed_time": "1 day, 16:15:14", "remaining_time": "2:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17009, "total_steps": 17941, "loss": 1.4725, "learning_rate": 6.93009612172707e-07, "epoch": 0.948051948051948, "percentage": 94.81, "elapsed_time": "1 day, 16:15:23", "remaining_time": "2:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17010, "total_steps": 17941, "loss": 1.5175, "learning_rate": 6.915330344678117e-07, "epoch": 0.9481076863051112, "percentage": 94.81, "elapsed_time": "1 day, 16:15:31", "remaining_time": "2:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17011, "total_steps": 17941, "loss": 1.7627, "learning_rate": 6.900580205400076e-07, "epoch": 0.9481634245582743, "percentage": 94.82, "elapsed_time": "1 day, 16:15:39", "remaining_time": "2:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17012, "total_steps": 17941, "loss": 1.494, "learning_rate": 6.885845704360627e-07, "epoch": 0.9482191628114375, "percentage": 94.82, "elapsed_time": "1 day, 16:15:48", "remaining_time": "2:11:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17013, "total_steps": 17941, "loss": 1.5726, "learning_rate": 6.871126842027064e-07, "epoch": 0.9482749010646007, "percentage": 94.83, "elapsed_time": "1 day, 16:15:57", "remaining_time": "2:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17014, "total_steps": 17941, "loss": 1.7376, "learning_rate": 6.856423618866237e-07, "epoch": 0.9483306393177637, "percentage": 94.83, "elapsed_time": "1 day, 16:16:05", "remaining_time": "2:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17015, "total_steps": 17941, "loss": 1.6236, "learning_rate": 6.841736035344437e-07, "epoch": 0.9483863775709269, "percentage": 94.84, "elapsed_time": "1 day, 16:16:14", "remaining_time": "2:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17016, "total_steps": 17941, "loss": 1.583, "learning_rate": 6.82706409192746e-07, "epoch": 0.9484421158240901, "percentage": 94.84, "elapsed_time": "1 day, 16:16:22", "remaining_time": "2:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17017, "total_steps": 17941, "loss": 1.5396, "learning_rate": 6.812407789080599e-07, "epoch": 0.9484978540772532, "percentage": 94.85, "elapsed_time": "1 day, 16:16:31", "remaining_time": "2:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17018, "total_steps": 17941, "loss": 1.5526, "learning_rate": 6.797767127268706e-07, "epoch": 0.9485535923304164, "percentage": 94.86, "elapsed_time": "1 day, 16:16:39", "remaining_time": "2:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17019, "total_steps": 17941, "loss": 1.5421, "learning_rate": 6.783142106956075e-07, "epoch": 0.9486093305835795, "percentage": 94.86, "elapsed_time": "1 day, 16:16:48", "remaining_time": "2:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17020, "total_steps": 17941, "loss": 1.6919, "learning_rate": 6.768532728606502e-07, "epoch": 0.9486650688367426, "percentage": 94.87, "elapsed_time": "1 day, 16:16:56", "remaining_time": "2:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17021, "total_steps": 17941, "loss": 1.7134, "learning_rate": 6.753938992683339e-07, "epoch": 0.9487208070899058, "percentage": 94.87, "elapsed_time": "1 day, 16:17:05", "remaining_time": "2:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17022, "total_steps": 17941, "loss": 1.7222, "learning_rate": 6.739360899649383e-07, "epoch": 0.948776545343069, "percentage": 94.88, "elapsed_time": "1 day, 16:17:13", "remaining_time": "2:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17023, "total_steps": 17941, "loss": 1.631, "learning_rate": 6.724798449967041e-07, "epoch": 0.9488322835962321, "percentage": 94.88, "elapsed_time": "1 day, 16:17:22", "remaining_time": "2:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17024, "total_steps": 17941, "loss": 1.8997, "learning_rate": 6.710251644097998e-07, "epoch": 0.9488880218493952, "percentage": 94.89, "elapsed_time": "1 day, 16:17:30", "remaining_time": "2:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17025, "total_steps": 17941, "loss": 1.7108, "learning_rate": 6.695720482503776e-07, "epoch": 0.9489437601025584, "percentage": 94.89, "elapsed_time": "1 day, 16:17:39", "remaining_time": "2:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17026, "total_steps": 17941, "loss": 1.7563, "learning_rate": 6.681204965645171e-07, "epoch": 0.9489994983557215, "percentage": 94.9, "elapsed_time": "1 day, 16:17:48", "remaining_time": "2:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17027, "total_steps": 17941, "loss": 1.6225, "learning_rate": 6.666705093982428e-07, "epoch": 0.9490552366088847, "percentage": 94.91, "elapsed_time": "1 day, 16:17:56", "remaining_time": "2:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17028, "total_steps": 17941, "loss": 1.5518, "learning_rate": 6.652220867975456e-07, "epoch": 0.9491109748620479, "percentage": 94.91, "elapsed_time": "1 day, 16:18:05", "remaining_time": "2:09:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17029, "total_steps": 17941, "loss": 1.6425, "learning_rate": 6.637752288083666e-07, "epoch": 0.949166713115211, "percentage": 94.92, "elapsed_time": "1 day, 16:18:13", "remaining_time": "2:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17030, "total_steps": 17941, "loss": 1.45, "learning_rate": 6.623299354765911e-07, "epoch": 0.9492224513683741, "percentage": 94.92, "elapsed_time": "1 day, 16:18:22", "remaining_time": "2:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17031, "total_steps": 17941, "loss": 1.4817, "learning_rate": 6.608862068480437e-07, "epoch": 0.9492781896215373, "percentage": 94.93, "elapsed_time": "1 day, 16:18:30", "remaining_time": "2:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17032, "total_steps": 17941, "loss": 1.4503, "learning_rate": 6.594440429685156e-07, "epoch": 0.9493339278747004, "percentage": 94.93, "elapsed_time": "1 day, 16:18:38", "remaining_time": "2:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17033, "total_steps": 17941, "loss": 1.7839, "learning_rate": 6.58003443883759e-07, "epoch": 0.9493896661278636, "percentage": 94.94, "elapsed_time": "1 day, 16:18:47", "remaining_time": "2:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17034, "total_steps": 17941, "loss": 1.8742, "learning_rate": 6.56564409639443e-07, "epoch": 0.9494454043810266, "percentage": 94.94, "elapsed_time": "1 day, 16:18:55", "remaining_time": "2:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17035, "total_steps": 17941, "loss": 1.7448, "learning_rate": 6.551269402812088e-07, "epoch": 0.9495011426341898, "percentage": 94.95, "elapsed_time": "1 day, 16:19:04", "remaining_time": "2:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17036, "total_steps": 17941, "loss": 1.5972, "learning_rate": 6.536910358546477e-07, "epoch": 0.949556880887353, "percentage": 94.96, "elapsed_time": "1 day, 16:19:12", "remaining_time": "2:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17037, "total_steps": 17941, "loss": 1.8572, "learning_rate": 6.522566964053068e-07, "epoch": 0.9496126191405161, "percentage": 94.96, "elapsed_time": "1 day, 16:19:21", "remaining_time": "2:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17038, "total_steps": 17941, "loss": 1.4599, "learning_rate": 6.508239219786605e-07, "epoch": 0.9496683573936793, "percentage": 94.97, "elapsed_time": "1 day, 16:19:29", "remaining_time": "2:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17039, "total_steps": 17941, "loss": 1.5872, "learning_rate": 6.493927126201504e-07, "epoch": 0.9497240956468425, "percentage": 94.97, "elapsed_time": "1 day, 16:19:37", "remaining_time": "2:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17040, "total_steps": 17941, "loss": 1.6558, "learning_rate": 6.479630683751736e-07, "epoch": 0.9497798339000055, "percentage": 94.98, "elapsed_time": "1 day, 16:19:46", "remaining_time": "2:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17041, "total_steps": 17941, "loss": 1.4328, "learning_rate": 6.465349892890659e-07, "epoch": 0.9498355721531687, "percentage": 94.98, "elapsed_time": "1 day, 16:19:54", "remaining_time": "2:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17042, "total_steps": 17941, "loss": 1.5492, "learning_rate": 6.451084754071135e-07, "epoch": 0.9498913104063319, "percentage": 94.99, "elapsed_time": "1 day, 16:20:03", "remaining_time": "2:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17043, "total_steps": 17941, "loss": 1.567, "learning_rate": 6.436835267745634e-07, "epoch": 0.949947048659495, "percentage": 94.99, "elapsed_time": "1 day, 16:20:11", "remaining_time": "2:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17044, "total_steps": 17941, "loss": 1.667, "learning_rate": 6.422601434366071e-07, "epoch": 0.9500027869126582, "percentage": 95.0, "elapsed_time": "1 day, 16:20:19", "remaining_time": "2:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17045, "total_steps": 17941, "loss": 1.4466, "learning_rate": 6.408383254383809e-07, "epoch": 0.9500585251658213, "percentage": 95.01, "elapsed_time": "1 day, 16:20:28", "remaining_time": "2:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17046, "total_steps": 17941, "loss": 1.9481, "learning_rate": 6.394180728249821e-07, "epoch": 0.9501142634189844, "percentage": 95.01, "elapsed_time": "1 day, 16:20:36", "remaining_time": "2:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17047, "total_steps": 17941, "loss": 1.6337, "learning_rate": 6.379993856414468e-07, "epoch": 0.9501700016721476, "percentage": 95.02, "elapsed_time": "1 day, 16:20:45", "remaining_time": "2:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17048, "total_steps": 17941, "loss": 1.55, "learning_rate": 6.365822639327723e-07, "epoch": 0.9502257399253108, "percentage": 95.02, "elapsed_time": "1 day, 16:20:53", "remaining_time": "2:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17049, "total_steps": 17941, "loss": 1.5785, "learning_rate": 6.351667077439006e-07, "epoch": 0.9502814781784739, "percentage": 95.03, "elapsed_time": "1 day, 16:21:02", "remaining_time": "2:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17050, "total_steps": 17941, "loss": 1.7686, "learning_rate": 6.337527171197177e-07, "epoch": 0.950337216431637, "percentage": 95.03, "elapsed_time": "1 day, 16:21:10", "remaining_time": "2:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17051, "total_steps": 17941, "loss": 1.4871, "learning_rate": 6.32340292105077e-07, "epoch": 0.9503929546848002, "percentage": 95.04, "elapsed_time": "1 day, 16:21:19", "remaining_time": "2:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17052, "total_steps": 17941, "loss": 1.3882, "learning_rate": 6.309294327447756e-07, "epoch": 0.9504486929379633, "percentage": 95.04, "elapsed_time": "1 day, 16:21:27", "remaining_time": "2:06:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17053, "total_steps": 17941, "loss": 1.7842, "learning_rate": 6.295201390835448e-07, "epoch": 0.9505044311911265, "percentage": 95.05, "elapsed_time": "1 day, 16:21:36", "remaining_time": "2:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17054, "total_steps": 17941, "loss": 1.5399, "learning_rate": 6.281124111660875e-07, "epoch": 0.9505601694442897, "percentage": 95.06, "elapsed_time": "1 day, 16:21:44", "remaining_time": "2:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17055, "total_steps": 17941, "loss": 1.4698, "learning_rate": 6.267062490370401e-07, "epoch": 0.9506159076974527, "percentage": 95.06, "elapsed_time": "1 day, 16:21:53", "remaining_time": "2:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17056, "total_steps": 17941, "loss": 2.0197, "learning_rate": 6.253016527410116e-07, "epoch": 0.9506716459506159, "percentage": 95.07, "elapsed_time": "1 day, 16:22:02", "remaining_time": "2:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17057, "total_steps": 17941, "loss": 1.6629, "learning_rate": 6.238986223225384e-07, "epoch": 0.950727384203779, "percentage": 95.07, "elapsed_time": "1 day, 16:22:10", "remaining_time": "2:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17058, "total_steps": 17941, "loss": 1.758, "learning_rate": 6.22497157826113e-07, "epoch": 0.9507831224569422, "percentage": 95.08, "elapsed_time": "1 day, 16:22:19", "remaining_time": "2:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17059, "total_steps": 17941, "loss": 1.6158, "learning_rate": 6.210972592961938e-07, "epoch": 0.9508388607101054, "percentage": 95.08, "elapsed_time": "1 day, 16:22:27", "remaining_time": "2:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17060, "total_steps": 17941, "loss": 1.7162, "learning_rate": 6.19698926777168e-07, "epoch": 0.9508945989632684, "percentage": 95.09, "elapsed_time": "1 day, 16:22:36", "remaining_time": "2:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17061, "total_steps": 17941, "loss": 1.8092, "learning_rate": 6.183021603133887e-07, "epoch": 0.9509503372164316, "percentage": 95.1, "elapsed_time": "1 day, 16:22:44", "remaining_time": "2:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17062, "total_steps": 17941, "loss": 1.4472, "learning_rate": 6.169069599491428e-07, "epoch": 0.9510060754695948, "percentage": 95.1, "elapsed_time": "1 day, 16:22:53", "remaining_time": "2:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17063, "total_steps": 17941, "loss": 1.598, "learning_rate": 6.155133257286893e-07, "epoch": 0.9510618137227579, "percentage": 95.11, "elapsed_time": "1 day, 16:23:01", "remaining_time": "2:04:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17064, "total_steps": 17941, "loss": 1.5263, "learning_rate": 6.141212576962207e-07, "epoch": 0.9511175519759211, "percentage": 95.11, "elapsed_time": "1 day, 16:23:10", "remaining_time": "2:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17065, "total_steps": 17941, "loss": 1.7322, "learning_rate": 6.12730755895885e-07, "epoch": 0.9511732902290843, "percentage": 95.12, "elapsed_time": "1 day, 16:23:19", "remaining_time": "2:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17066, "total_steps": 17941, "loss": 1.6605, "learning_rate": 6.113418203717858e-07, "epoch": 0.9512290284822473, "percentage": 95.12, "elapsed_time": "1 day, 16:23:27", "remaining_time": "2:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17067, "total_steps": 17941, "loss": 1.8248, "learning_rate": 6.0995445116796e-07, "epoch": 0.9512847667354105, "percentage": 95.13, "elapsed_time": "1 day, 16:23:36", "remaining_time": "2:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17068, "total_steps": 17941, "loss": 1.4618, "learning_rate": 6.085686483284225e-07, "epoch": 0.9513405049885737, "percentage": 95.13, "elapsed_time": "1 day, 16:23:44", "remaining_time": "2:03:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17069, "total_steps": 17941, "loss": 1.6171, "learning_rate": 6.071844118971104e-07, "epoch": 0.9513962432417368, "percentage": 95.14, "elapsed_time": "1 day, 16:23:53", "remaining_time": "2:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17070, "total_steps": 17941, "loss": 1.6565, "learning_rate": 6.058017419179384e-07, "epoch": 0.9514519814949, "percentage": 95.15, "elapsed_time": "1 day, 16:24:01", "remaining_time": "2:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17071, "total_steps": 17941, "loss": 1.5644, "learning_rate": 6.044206384347384e-07, "epoch": 0.9515077197480631, "percentage": 95.15, "elapsed_time": "1 day, 16:24:10", "remaining_time": "2:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17072, "total_steps": 17941, "loss": 1.6023, "learning_rate": 6.030411014913196e-07, "epoch": 0.9515634580012262, "percentage": 95.16, "elapsed_time": "1 day, 16:24:18", "remaining_time": "2:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17073, "total_steps": 17941, "loss": 1.3485, "learning_rate": 6.016631311314358e-07, "epoch": 0.9516191962543894, "percentage": 95.16, "elapsed_time": "1 day, 16:24:27", "remaining_time": "2:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17074, "total_steps": 17941, "loss": 1.6505, "learning_rate": 6.0028672739878e-07, "epoch": 0.9516749345075526, "percentage": 95.17, "elapsed_time": "1 day, 16:24:35", "remaining_time": "2:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17075, "total_steps": 17941, "loss": 1.5776, "learning_rate": 5.989118903370172e-07, "epoch": 0.9517306727607157, "percentage": 95.17, "elapsed_time": "1 day, 16:24:44", "remaining_time": "2:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17076, "total_steps": 17941, "loss": 1.6576, "learning_rate": 5.975386199897348e-07, "epoch": 0.9517864110138788, "percentage": 95.18, "elapsed_time": "1 day, 16:24:52", "remaining_time": "2:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17077, "total_steps": 17941, "loss": 1.5698, "learning_rate": 5.961669164004924e-07, "epoch": 0.951842149267042, "percentage": 95.18, "elapsed_time": "1 day, 16:25:01", "remaining_time": "2:02:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17078, "total_steps": 17941, "loss": 1.5342, "learning_rate": 5.94796779612794e-07, "epoch": 0.9518978875202051, "percentage": 95.19, "elapsed_time": "1 day, 16:25:09", "remaining_time": "2:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17079, "total_steps": 17941, "loss": 1.7001, "learning_rate": 5.934282096700827e-07, "epoch": 0.9519536257733683, "percentage": 95.2, "elapsed_time": "1 day, 16:25:18", "remaining_time": "2:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17080, "total_steps": 17941, "loss": 1.3442, "learning_rate": 5.920612066157738e-07, "epoch": 0.9520093640265314, "percentage": 95.2, "elapsed_time": "1 day, 16:25:26", "remaining_time": "2:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17081, "total_steps": 17941, "loss": 1.55, "learning_rate": 5.906957704932104e-07, "epoch": 0.9520651022796945, "percentage": 95.21, "elapsed_time": "1 day, 16:25:35", "remaining_time": "2:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17082, "total_steps": 17941, "loss": 1.8351, "learning_rate": 5.893319013457077e-07, "epoch": 0.9521208405328577, "percentage": 95.21, "elapsed_time": "1 day, 16:25:43", "remaining_time": "2:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17083, "total_steps": 17941, "loss": 1.6878, "learning_rate": 5.879695992165091e-07, "epoch": 0.9521765787860208, "percentage": 95.22, "elapsed_time": "1 day, 16:25:52", "remaining_time": "2:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17084, "total_steps": 17941, "loss": 1.7578, "learning_rate": 5.866088641488188e-07, "epoch": 0.952232317039184, "percentage": 95.22, "elapsed_time": "1 day, 16:26:00", "remaining_time": "2:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17085, "total_steps": 17941, "loss": 1.8184, "learning_rate": 5.852496961858023e-07, "epoch": 0.9522880552923472, "percentage": 95.23, "elapsed_time": "1 day, 16:26:09", "remaining_time": "2:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17086, "total_steps": 17941, "loss": 1.4511, "learning_rate": 5.838920953705584e-07, "epoch": 0.9523437935455102, "percentage": 95.23, "elapsed_time": "1 day, 16:26:17", "remaining_time": "2:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17087, "total_steps": 17941, "loss": 1.6303, "learning_rate": 5.825360617461362e-07, "epoch": 0.9523995317986734, "percentage": 95.24, "elapsed_time": "1 day, 16:26:26", "remaining_time": "2:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17088, "total_steps": 17941, "loss": 1.6204, "learning_rate": 5.811815953555456e-07, "epoch": 0.9524552700518366, "percentage": 95.25, "elapsed_time": "1 day, 16:26:34", "remaining_time": "2:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17089, "total_steps": 17941, "loss": 1.7111, "learning_rate": 5.798286962417465e-07, "epoch": 0.9525110083049997, "percentage": 95.25, "elapsed_time": "1 day, 16:26:42", "remaining_time": "2:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17090, "total_steps": 17941, "loss": 1.6455, "learning_rate": 5.784773644476438e-07, "epoch": 0.9525667465581629, "percentage": 95.26, "elapsed_time": "1 day, 16:26:51", "remaining_time": "2:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17091, "total_steps": 17941, "loss": 1.4845, "learning_rate": 5.771276000160808e-07, "epoch": 0.952622484811326, "percentage": 95.26, "elapsed_time": "1 day, 16:26:59", "remaining_time": "2:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17092, "total_steps": 17941, "loss": 1.7556, "learning_rate": 5.757794029898844e-07, "epoch": 0.9526782230644891, "percentage": 95.27, "elapsed_time": "1 day, 16:27:08", "remaining_time": "2:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17093, "total_steps": 17941, "loss": 1.5055, "learning_rate": 5.744327734118037e-07, "epoch": 0.9527339613176523, "percentage": 95.27, "elapsed_time": "1 day, 16:27:16", "remaining_time": "2:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17094, "total_steps": 17941, "loss": 1.7597, "learning_rate": 5.730877113245381e-07, "epoch": 0.9527896995708155, "percentage": 95.28, "elapsed_time": "1 day, 16:27:25", "remaining_time": "2:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17095, "total_steps": 17941, "loss": 1.6878, "learning_rate": 5.717442167707531e-07, "epoch": 0.9528454378239786, "percentage": 95.28, "elapsed_time": "1 day, 16:27:33", "remaining_time": "2:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17096, "total_steps": 17941, "loss": 1.5908, "learning_rate": 5.704022897930594e-07, "epoch": 0.9529011760771418, "percentage": 95.29, "elapsed_time": "1 day, 16:27:42", "remaining_time": "1:59:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17097, "total_steps": 17941, "loss": 1.7469, "learning_rate": 5.690619304340061e-07, "epoch": 0.9529569143303049, "percentage": 95.3, "elapsed_time": "1 day, 16:27:50", "remaining_time": "1:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17098, "total_steps": 17941, "loss": 1.8152, "learning_rate": 5.677231387361093e-07, "epoch": 0.953012652583468, "percentage": 95.3, "elapsed_time": "1 day, 16:27:59", "remaining_time": "1:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17099, "total_steps": 17941, "loss": 1.6877, "learning_rate": 5.663859147418183e-07, "epoch": 0.9530683908366312, "percentage": 95.31, "elapsed_time": "1 day, 16:28:07", "remaining_time": "1:59:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17100, "total_steps": 17941, "loss": 1.964, "learning_rate": 5.650502584935546e-07, "epoch": 0.9531241290897944, "percentage": 95.31, "elapsed_time": "1 day, 16:28:16", "remaining_time": "1:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17101, "total_steps": 17941, "loss": 1.6014, "learning_rate": 5.63716170033668e-07, "epoch": 0.9531798673429575, "percentage": 95.32, "elapsed_time": "1 day, 16:28:24", "remaining_time": "1:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17102, "total_steps": 17941, "loss": 1.805, "learning_rate": 5.623836494044687e-07, "epoch": 0.9532356055961206, "percentage": 95.32, "elapsed_time": "1 day, 16:28:33", "remaining_time": "1:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17103, "total_steps": 17941, "loss": 1.463, "learning_rate": 5.610526966482232e-07, "epoch": 0.9532913438492837, "percentage": 95.33, "elapsed_time": "1 day, 16:28:41", "remaining_time": "1:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17104, "total_steps": 17941, "loss": 1.8894, "learning_rate": 5.597233118071365e-07, "epoch": 0.9533470821024469, "percentage": 95.33, "elapsed_time": "1 day, 16:28:50", "remaining_time": "1:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17105, "total_steps": 17941, "loss": 1.6705, "learning_rate": 5.583954949233638e-07, "epoch": 0.9534028203556101, "percentage": 95.34, "elapsed_time": "1 day, 16:28:58", "remaining_time": "1:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17106, "total_steps": 17941, "loss": 1.6637, "learning_rate": 5.57069246039027e-07, "epoch": 0.9534585586087732, "percentage": 95.35, "elapsed_time": "1 day, 16:29:07", "remaining_time": "1:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17107, "total_steps": 17941, "loss": 1.5197, "learning_rate": 5.557445651961812e-07, "epoch": 0.9535142968619363, "percentage": 95.35, "elapsed_time": "1 day, 16:29:15", "remaining_time": "1:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17108, "total_steps": 17941, "loss": 1.5722, "learning_rate": 5.544214524368374e-07, "epoch": 0.9535700351150995, "percentage": 95.36, "elapsed_time": "1 day, 16:29:24", "remaining_time": "1:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17109, "total_steps": 17941, "loss": 1.7963, "learning_rate": 5.530999078029563e-07, "epoch": 0.9536257733682626, "percentage": 95.36, "elapsed_time": "1 day, 16:29:32", "remaining_time": "1:58:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17110, "total_steps": 17941, "loss": 1.5337, "learning_rate": 5.517799313364491e-07, "epoch": 0.9536815116214258, "percentage": 95.37, "elapsed_time": "1 day, 16:29:41", "remaining_time": "1:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17111, "total_steps": 17941, "loss": 1.7755, "learning_rate": 5.504615230791821e-07, "epoch": 0.953737249874589, "percentage": 95.37, "elapsed_time": "1 day, 16:29:49", "remaining_time": "1:57:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17112, "total_steps": 17941, "loss": 1.7108, "learning_rate": 5.491446830729663e-07, "epoch": 0.953792988127752, "percentage": 95.38, "elapsed_time": "1 day, 16:29:57", "remaining_time": "1:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17113, "total_steps": 17941, "loss": 1.7004, "learning_rate": 5.478294113595573e-07, "epoch": 0.9538487263809152, "percentage": 95.38, "elapsed_time": "1 day, 16:30:06", "remaining_time": "1:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17114, "total_steps": 17941, "loss": 1.7245, "learning_rate": 5.465157079806771e-07, "epoch": 0.9539044646340784, "percentage": 95.39, "elapsed_time": "1 day, 16:30:15", "remaining_time": "1:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17115, "total_steps": 17941, "loss": 1.5044, "learning_rate": 5.452035729779869e-07, "epoch": 0.9539602028872415, "percentage": 95.4, "elapsed_time": "1 day, 16:30:23", "remaining_time": "1:57:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17116, "total_steps": 17941, "loss": 1.5727, "learning_rate": 5.438930063930925e-07, "epoch": 0.9540159411404047, "percentage": 95.4, "elapsed_time": "1 day, 16:30:32", "remaining_time": "1:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17117, "total_steps": 17941, "loss": 1.7628, "learning_rate": 5.42584008267566e-07, "epoch": 0.9540716793935679, "percentage": 95.41, "elapsed_time": "1 day, 16:30:40", "remaining_time": "1:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17118, "total_steps": 17941, "loss": 1.644, "learning_rate": 5.412765786429186e-07, "epoch": 0.9541274176467309, "percentage": 95.41, "elapsed_time": "1 day, 16:30:48", "remaining_time": "1:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17119, "total_steps": 17941, "loss": 1.456, "learning_rate": 5.399707175606117e-07, "epoch": 0.9541831558998941, "percentage": 95.42, "elapsed_time": "1 day, 16:30:57", "remaining_time": "1:56:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17120, "total_steps": 17941, "loss": 1.5407, "learning_rate": 5.386664250620621e-07, "epoch": 0.9542388941530573, "percentage": 95.42, "elapsed_time": "1 day, 16:31:05", "remaining_time": "1:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17121, "total_steps": 17941, "loss": 1.7538, "learning_rate": 5.373637011886312e-07, "epoch": 0.9542946324062204, "percentage": 95.43, "elapsed_time": "1 day, 16:31:14", "remaining_time": "1:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17122, "total_steps": 17941, "loss": 1.6037, "learning_rate": 5.36062545981647e-07, "epoch": 0.9543503706593836, "percentage": 95.44, "elapsed_time": "1 day, 16:31:23", "remaining_time": "1:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17123, "total_steps": 17941, "loss": 1.6391, "learning_rate": 5.347629594823544e-07, "epoch": 0.9544061089125467, "percentage": 95.44, "elapsed_time": "1 day, 16:31:31", "remaining_time": "1:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17124, "total_steps": 17941, "loss": 1.692, "learning_rate": 5.334649417319815e-07, "epoch": 0.9544618471657098, "percentage": 95.45, "elapsed_time": "1 day, 16:31:39", "remaining_time": "1:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17125, "total_steps": 17941, "loss": 1.6215, "learning_rate": 5.321684927716897e-07, "epoch": 0.954517585418873, "percentage": 95.45, "elapsed_time": "1 day, 16:31:48", "remaining_time": "1:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17126, "total_steps": 17941, "loss": 1.7474, "learning_rate": 5.308736126425962e-07, "epoch": 0.9545733236720361, "percentage": 95.46, "elapsed_time": "1 day, 16:31:56", "remaining_time": "1:55:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17127, "total_steps": 17941, "loss": 1.6767, "learning_rate": 5.295803013857681e-07, "epoch": 0.9546290619251993, "percentage": 95.46, "elapsed_time": "1 day, 16:32:05", "remaining_time": "1:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17128, "total_steps": 17941, "loss": 1.4194, "learning_rate": 5.282885590422171e-07, "epoch": 0.9546848001783624, "percentage": 95.47, "elapsed_time": "1 day, 16:32:13", "remaining_time": "1:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17129, "total_steps": 17941, "loss": 1.4386, "learning_rate": 5.269983856529159e-07, "epoch": 0.9547405384315255, "percentage": 95.47, "elapsed_time": "1 day, 16:32:22", "remaining_time": "1:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17130, "total_steps": 17941, "loss": 1.6629, "learning_rate": 5.257097812587763e-07, "epoch": 0.9547962766846887, "percentage": 95.48, "elapsed_time": "1 day, 16:32:31", "remaining_time": "1:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17131, "total_steps": 17941, "loss": 1.6166, "learning_rate": 5.244227459006656e-07, "epoch": 0.9548520149378519, "percentage": 95.49, "elapsed_time": "1 day, 16:32:40", "remaining_time": "1:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17132, "total_steps": 17941, "loss": 1.588, "learning_rate": 5.231372796194068e-07, "epoch": 0.954907753191015, "percentage": 95.49, "elapsed_time": "1 day, 16:32:49", "remaining_time": "1:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17133, "total_steps": 17941, "loss": 1.4972, "learning_rate": 5.218533824557614e-07, "epoch": 0.9549634914441781, "percentage": 95.5, "elapsed_time": "1 day, 16:32:57", "remaining_time": "1:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17134, "total_steps": 17941, "loss": 1.6878, "learning_rate": 5.205710544504527e-07, "epoch": 0.9550192296973413, "percentage": 95.5, "elapsed_time": "1 day, 16:33:05", "remaining_time": "1:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17135, "total_steps": 17941, "loss": 1.4775, "learning_rate": 5.19290295644137e-07, "epoch": 0.9550749679505044, "percentage": 95.51, "elapsed_time": "1 day, 16:33:14", "remaining_time": "1:54:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17136, "total_steps": 17941, "loss": 1.6239, "learning_rate": 5.180111060774429e-07, "epoch": 0.9551307062036676, "percentage": 95.51, "elapsed_time": "1 day, 16:33:22", "remaining_time": "1:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17137, "total_steps": 17941, "loss": 1.6065, "learning_rate": 5.167334857909434e-07, "epoch": 0.9551864444568308, "percentage": 95.52, "elapsed_time": "1 day, 16:33:31", "remaining_time": "1:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17138, "total_steps": 17941, "loss": 1.6714, "learning_rate": 5.15457434825145e-07, "epoch": 0.9552421827099938, "percentage": 95.52, "elapsed_time": "1 day, 16:33:39", "remaining_time": "1:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17139, "total_steps": 17941, "loss": 2.0025, "learning_rate": 5.141829532205211e-07, "epoch": 0.955297920963157, "percentage": 95.53, "elapsed_time": "1 day, 16:33:48", "remaining_time": "1:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17140, "total_steps": 17941, "loss": 1.6201, "learning_rate": 5.129100410174947e-07, "epoch": 0.9553536592163202, "percentage": 95.54, "elapsed_time": "1 day, 16:33:56", "remaining_time": "1:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17141, "total_steps": 17941, "loss": 1.5489, "learning_rate": 5.116386982564336e-07, "epoch": 0.9554093974694833, "percentage": 95.54, "elapsed_time": "1 day, 16:34:05", "remaining_time": "1:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17142, "total_steps": 17941, "loss": 1.5875, "learning_rate": 5.103689249776555e-07, "epoch": 0.9554651357226465, "percentage": 95.55, "elapsed_time": "1 day, 16:34:13", "remaining_time": "1:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17143, "total_steps": 17941, "loss": 1.6044, "learning_rate": 5.091007212214227e-07, "epoch": 0.9555208739758096, "percentage": 95.55, "elapsed_time": "1 day, 16:34:22", "remaining_time": "1:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17144, "total_steps": 17941, "loss": 1.7169, "learning_rate": 5.078340870279697e-07, "epoch": 0.9555766122289727, "percentage": 95.56, "elapsed_time": "1 day, 16:34:31", "remaining_time": "1:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17145, "total_steps": 17941, "loss": 1.2724, "learning_rate": 5.065690224374587e-07, "epoch": 0.9556323504821359, "percentage": 95.56, "elapsed_time": "1 day, 16:34:40", "remaining_time": "1:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17146, "total_steps": 17941, "loss": 1.6387, "learning_rate": 5.053055274900131e-07, "epoch": 0.9556880887352991, "percentage": 95.57, "elapsed_time": "1 day, 16:34:48", "remaining_time": "1:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17147, "total_steps": 17941, "loss": 2.1196, "learning_rate": 5.040436022256956e-07, "epoch": 0.9557438269884622, "percentage": 95.57, "elapsed_time": "1 day, 16:34:57", "remaining_time": "1:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17148, "total_steps": 17941, "loss": 1.5834, "learning_rate": 5.027832466845462e-07, "epoch": 0.9557995652416253, "percentage": 95.58, "elapsed_time": "1 day, 16:35:05", "remaining_time": "1:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17149, "total_steps": 17941, "loss": 1.5055, "learning_rate": 5.015244609065106e-07, "epoch": 0.9558553034947884, "percentage": 95.59, "elapsed_time": "1 day, 16:35:14", "remaining_time": "1:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17150, "total_steps": 17941, "loss": 1.4226, "learning_rate": 5.002672449315293e-07, "epoch": 0.9559110417479516, "percentage": 95.59, "elapsed_time": "1 day, 16:35:22", "remaining_time": "1:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17151, "total_steps": 17941, "loss": 1.7643, "learning_rate": 4.990115987994648e-07, "epoch": 0.9559667800011148, "percentage": 95.6, "elapsed_time": "1 day, 16:35:31", "remaining_time": "1:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17152, "total_steps": 17941, "loss": 1.418, "learning_rate": 4.977575225501463e-07, "epoch": 0.9560225182542779, "percentage": 95.6, "elapsed_time": "1 day, 16:35:39", "remaining_time": "1:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17153, "total_steps": 17941, "loss": 1.7449, "learning_rate": 4.965050162233365e-07, "epoch": 0.956078256507441, "percentage": 95.61, "elapsed_time": "1 day, 16:35:48", "remaining_time": "1:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17154, "total_steps": 17941, "loss": 1.8759, "learning_rate": 4.952540798587646e-07, "epoch": 0.9561339947606042, "percentage": 95.61, "elapsed_time": "1 day, 16:35:56", "remaining_time": "1:51:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17155, "total_steps": 17941, "loss": 1.8904, "learning_rate": 4.94004713496099e-07, "epoch": 0.9561897330137673, "percentage": 95.62, "elapsed_time": "1 day, 16:36:05", "remaining_time": "1:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17156, "total_steps": 17941, "loss": 1.4976, "learning_rate": 4.927569171749635e-07, "epoch": 0.9562454712669305, "percentage": 95.62, "elapsed_time": "1 day, 16:36:13", "remaining_time": "1:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17157, "total_steps": 17941, "loss": 1.6972, "learning_rate": 4.915106909349321e-07, "epoch": 0.9563012095200937, "percentage": 95.63, "elapsed_time": "1 day, 16:36:22", "remaining_time": "1:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17158, "total_steps": 17941, "loss": 1.6761, "learning_rate": 4.902660348155285e-07, "epoch": 0.9563569477732567, "percentage": 95.64, "elapsed_time": "1 day, 16:36:31", "remaining_time": "1:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17159, "total_steps": 17941, "loss": 1.6926, "learning_rate": 4.890229488562215e-07, "epoch": 0.9564126860264199, "percentage": 95.64, "elapsed_time": "1 day, 16:36:39", "remaining_time": "1:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17160, "total_steps": 17941, "loss": 1.5531, "learning_rate": 4.877814330964458e-07, "epoch": 0.9564684242795831, "percentage": 95.65, "elapsed_time": "1 day, 16:36:47", "remaining_time": "1:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17161, "total_steps": 17941, "loss": 1.7092, "learning_rate": 4.865414875755537e-07, "epoch": 0.9565241625327462, "percentage": 95.65, "elapsed_time": "1 day, 16:36:56", "remaining_time": "1:50:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17162, "total_steps": 17941, "loss": 1.6221, "learning_rate": 4.85303112332891e-07, "epoch": 0.9565799007859094, "percentage": 95.66, "elapsed_time": "1 day, 16:37:04", "remaining_time": "1:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17163, "total_steps": 17941, "loss": 1.7214, "learning_rate": 4.840663074077212e-07, "epoch": 0.9566356390390726, "percentage": 95.66, "elapsed_time": "1 day, 16:37:13", "remaining_time": "1:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17164, "total_steps": 17941, "loss": 1.5189, "learning_rate": 4.828310728392682e-07, "epoch": 0.9566913772922356, "percentage": 95.67, "elapsed_time": "1 day, 16:37:21", "remaining_time": "1:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17165, "total_steps": 17941, "loss": 1.6799, "learning_rate": 4.815974086667119e-07, "epoch": 0.9567471155453988, "percentage": 95.67, "elapsed_time": "1 day, 16:37:30", "remaining_time": "1:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17166, "total_steps": 17941, "loss": 1.7674, "learning_rate": 4.80365314929171e-07, "epoch": 0.956802853798562, "percentage": 95.68, "elapsed_time": "1 day, 16:37:38", "remaining_time": "1:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17167, "total_steps": 17941, "loss": 1.8631, "learning_rate": 4.791347916657252e-07, "epoch": 0.9568585920517251, "percentage": 95.69, "elapsed_time": "1 day, 16:37:47", "remaining_time": "1:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17168, "total_steps": 17941, "loss": 1.6842, "learning_rate": 4.779058389153934e-07, "epoch": 0.9569143303048883, "percentage": 95.69, "elapsed_time": "1 day, 16:37:55", "remaining_time": "1:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17169, "total_steps": 17941, "loss": 1.9205, "learning_rate": 4.766784567171556e-07, "epoch": 0.9569700685580514, "percentage": 95.7, "elapsed_time": "1 day, 16:38:04", "remaining_time": "1:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17170, "total_steps": 17941, "loss": 1.7295, "learning_rate": 4.754526451099417e-07, "epoch": 0.9570258068112145, "percentage": 95.7, "elapsed_time": "1 day, 16:38:12", "remaining_time": "1:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17171, "total_steps": 17941, "loss": 1.5759, "learning_rate": 4.7422840413261504e-07, "epoch": 0.9570815450643777, "percentage": 95.71, "elapsed_time": "1 day, 16:38:21", "remaining_time": "1:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17172, "total_steps": 17941, "loss": 1.8294, "learning_rate": 4.7300573382401123e-07, "epoch": 0.9571372833175408, "percentage": 95.71, "elapsed_time": "1 day, 16:38:29", "remaining_time": "1:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17173, "total_steps": 17941, "loss": 1.6738, "learning_rate": 4.717846342228993e-07, "epoch": 0.957193021570704, "percentage": 95.72, "elapsed_time": "1 day, 16:38:38", "remaining_time": "1:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17174, "total_steps": 17941, "loss": 1.4396, "learning_rate": 4.705651053680149e-07, "epoch": 0.9572487598238671, "percentage": 95.72, "elapsed_time": "1 day, 16:38:47", "remaining_time": "1:48:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17175, "total_steps": 17941, "loss": 1.6577, "learning_rate": 4.693471472980271e-07, "epoch": 0.9573044980770302, "percentage": 95.73, "elapsed_time": "1 day, 16:38:55", "remaining_time": "1:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17176, "total_steps": 17941, "loss": 1.6601, "learning_rate": 4.6813076005156054e-07, "epoch": 0.9573602363301934, "percentage": 95.74, "elapsed_time": "1 day, 16:39:04", "remaining_time": "1:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17177, "total_steps": 17941, "loss": 1.769, "learning_rate": 4.6691594366719547e-07, "epoch": 0.9574159745833566, "percentage": 95.74, "elapsed_time": "1 day, 16:39:12", "remaining_time": "1:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17178, "total_steps": 17941, "loss": 1.394, "learning_rate": 4.6570269818346224e-07, "epoch": 0.9574717128365197, "percentage": 95.75, "elapsed_time": "1 day, 16:39:21", "remaining_time": "1:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17179, "total_steps": 17941, "loss": 1.6643, "learning_rate": 4.644910236388356e-07, "epoch": 0.9575274510896828, "percentage": 95.75, "elapsed_time": "1 day, 16:39:29", "remaining_time": "1:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17180, "total_steps": 17941, "loss": 1.8785, "learning_rate": 4.6328092007173475e-07, "epoch": 0.957583189342846, "percentage": 95.76, "elapsed_time": "1 day, 16:39:38", "remaining_time": "1:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17181, "total_steps": 17941, "loss": 1.8076, "learning_rate": 4.620723875205513e-07, "epoch": 0.9576389275960091, "percentage": 95.76, "elapsed_time": "1 day, 16:39:47", "remaining_time": "1:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17182, "total_steps": 17941, "loss": 1.1926, "learning_rate": 4.608654260236045e-07, "epoch": 0.9576946658491723, "percentage": 95.77, "elapsed_time": "1 day, 16:39:56", "remaining_time": "1:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17183, "total_steps": 17941, "loss": 1.4759, "learning_rate": 4.596600356191694e-07, "epoch": 0.9577504041023355, "percentage": 95.78, "elapsed_time": "1 day, 16:40:04", "remaining_time": "1:47:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17184, "total_steps": 17941, "loss": 1.6676, "learning_rate": 4.5845621634548195e-07, "epoch": 0.9578061423554985, "percentage": 95.78, "elapsed_time": "1 day, 16:40:13", "remaining_time": "1:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17185, "total_steps": 17941, "loss": 1.6399, "learning_rate": 4.5725396824071177e-07, "epoch": 0.9578618806086617, "percentage": 95.79, "elapsed_time": "1 day, 16:40:21", "remaining_time": "1:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17186, "total_steps": 17941, "loss": 1.7609, "learning_rate": 4.560532913429949e-07, "epoch": 0.9579176188618249, "percentage": 95.79, "elapsed_time": "1 day, 16:40:30", "remaining_time": "1:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17187, "total_steps": 17941, "loss": 1.5248, "learning_rate": 4.5485418569040095e-07, "epoch": 0.957973357114988, "percentage": 95.8, "elapsed_time": "1 day, 16:40:38", "remaining_time": "1:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17188, "total_steps": 17941, "loss": 1.7189, "learning_rate": 4.536566513209717e-07, "epoch": 0.9580290953681512, "percentage": 95.8, "elapsed_time": "1 day, 16:40:47", "remaining_time": "1:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17189, "total_steps": 17941, "loss": 1.7432, "learning_rate": 4.524606882726767e-07, "epoch": 0.9580848336213144, "percentage": 95.81, "elapsed_time": "1 day, 16:40:55", "remaining_time": "1:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17190, "total_steps": 17941, "loss": 1.7686, "learning_rate": 4.512662965834413e-07, "epoch": 0.9581405718744774, "percentage": 95.81, "elapsed_time": "1 day, 16:41:04", "remaining_time": "1:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17191, "total_steps": 17941, "loss": 1.7781, "learning_rate": 4.500734762911518e-07, "epoch": 0.9581963101276406, "percentage": 95.82, "elapsed_time": "1 day, 16:41:12", "remaining_time": "1:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17192, "total_steps": 17941, "loss": 2.2384, "learning_rate": 4.4888222743363906e-07, "epoch": 0.9582520483808038, "percentage": 95.83, "elapsed_time": "1 day, 16:41:21", "remaining_time": "1:46:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17193, "total_steps": 17941, "loss": 1.6351, "learning_rate": 4.476925500486784e-07, "epoch": 0.9583077866339669, "percentage": 95.83, "elapsed_time": "1 day, 16:41:29", "remaining_time": "1:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17194, "total_steps": 17941, "loss": 1.4533, "learning_rate": 4.4650444417400075e-07, "epoch": 0.9583635248871301, "percentage": 95.84, "elapsed_time": "1 day, 16:41:38", "remaining_time": "1:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17195, "total_steps": 17941, "loss": 1.6649, "learning_rate": 4.4531790984727594e-07, "epoch": 0.9584192631402931, "percentage": 95.84, "elapsed_time": "1 day, 16:41:46", "remaining_time": "1:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17196, "total_steps": 17941, "loss": 1.7243, "learning_rate": 4.441329471061517e-07, "epoch": 0.9584750013934563, "percentage": 95.85, "elapsed_time": "1 day, 16:41:55", "remaining_time": "1:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17197, "total_steps": 17941, "loss": 1.8475, "learning_rate": 4.42949555988198e-07, "epoch": 0.9585307396466195, "percentage": 95.85, "elapsed_time": "1 day, 16:42:03", "remaining_time": "1:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17198, "total_steps": 17941, "loss": 1.4875, "learning_rate": 4.4176773653094583e-07, "epoch": 0.9585864778997826, "percentage": 95.86, "elapsed_time": "1 day, 16:42:12", "remaining_time": "1:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17199, "total_steps": 17941, "loss": 1.821, "learning_rate": 4.4058748877188196e-07, "epoch": 0.9586422161529458, "percentage": 95.86, "elapsed_time": "1 day, 16:42:20", "remaining_time": "1:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17200, "total_steps": 17941, "loss": 1.6276, "learning_rate": 4.3940881274842637e-07, "epoch": 0.9586979544061089, "percentage": 95.87, "elapsed_time": "1 day, 16:42:28", "remaining_time": "1:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17201, "total_steps": 17941, "loss": 1.4243, "learning_rate": 4.3823170849796593e-07, "epoch": 0.958753692659272, "percentage": 95.88, "elapsed_time": "1 day, 16:42:37", "remaining_time": "1:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17202, "total_steps": 17941, "loss": 1.7216, "learning_rate": 4.370561760578262e-07, "epoch": 0.9588094309124352, "percentage": 95.88, "elapsed_time": "1 day, 16:42:45", "remaining_time": "1:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17203, "total_steps": 17941, "loss": 1.5975, "learning_rate": 4.358822154652997e-07, "epoch": 0.9588651691655984, "percentage": 95.89, "elapsed_time": "1 day, 16:42:54", "remaining_time": "1:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17204, "total_steps": 17941, "loss": 1.468, "learning_rate": 4.347098267576066e-07, "epoch": 0.9589209074187615, "percentage": 95.89, "elapsed_time": "1 day, 16:43:03", "remaining_time": "1:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17205, "total_steps": 17941, "loss": 1.586, "learning_rate": 4.3353900997193384e-07, "epoch": 0.9589766456719246, "percentage": 95.9, "elapsed_time": "1 day, 16:43:12", "remaining_time": "1:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17206, "total_steps": 17941, "loss": 1.4871, "learning_rate": 4.323697651454073e-07, "epoch": 0.9590323839250878, "percentage": 95.9, "elapsed_time": "1 day, 16:43:20", "remaining_time": "1:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17207, "total_steps": 17941, "loss": 1.6051, "learning_rate": 4.3120209231511946e-07, "epoch": 0.9590881221782509, "percentage": 95.91, "elapsed_time": "1 day, 16:43:28", "remaining_time": "1:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17208, "total_steps": 17941, "loss": 1.5162, "learning_rate": 4.300359915180907e-07, "epoch": 0.9591438604314141, "percentage": 95.91, "elapsed_time": "1 day, 16:43:37", "remaining_time": "1:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17209, "total_steps": 17941, "loss": 1.6967, "learning_rate": 4.288714627913082e-07, "epoch": 0.9591995986845773, "percentage": 95.92, "elapsed_time": "1 day, 16:43:45", "remaining_time": "1:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17210, "total_steps": 17941, "loss": 1.6838, "learning_rate": 4.277085061716979e-07, "epoch": 0.9592553369377403, "percentage": 95.93, "elapsed_time": "1 day, 16:43:54", "remaining_time": "1:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17211, "total_steps": 17941, "loss": 1.5101, "learning_rate": 4.265471216961525e-07, "epoch": 0.9593110751909035, "percentage": 95.93, "elapsed_time": "1 day, 16:44:02", "remaining_time": "1:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17212, "total_steps": 17941, "loss": 1.8355, "learning_rate": 4.2538730940150373e-07, "epoch": 0.9593668134440667, "percentage": 95.94, "elapsed_time": "1 day, 16:44:11", "remaining_time": "1:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17213, "total_steps": 17941, "loss": 1.4289, "learning_rate": 4.242290693245221e-07, "epoch": 0.9594225516972298, "percentage": 95.94, "elapsed_time": "1 day, 16:44:20", "remaining_time": "1:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17214, "total_steps": 17941, "loss": 1.6346, "learning_rate": 4.2307240150195047e-07, "epoch": 0.959478289950393, "percentage": 95.95, "elapsed_time": "1 day, 16:44:28", "remaining_time": "1:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17215, "total_steps": 17941, "loss": 1.6333, "learning_rate": 4.219173059704651e-07, "epoch": 0.9595340282035562, "percentage": 95.95, "elapsed_time": "1 day, 16:44:37", "remaining_time": "1:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17216, "total_steps": 17941, "loss": 1.6506, "learning_rate": 4.207637827667088e-07, "epoch": 0.9595897664567192, "percentage": 95.96, "elapsed_time": "1 day, 16:44:45", "remaining_time": "1:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17217, "total_steps": 17941, "loss": 1.6314, "learning_rate": 4.196118319272524e-07, "epoch": 0.9596455047098824, "percentage": 95.96, "elapsed_time": "1 day, 16:44:53", "remaining_time": "1:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17218, "total_steps": 17941, "loss": 1.3523, "learning_rate": 4.1846145348863883e-07, "epoch": 0.9597012429630455, "percentage": 95.97, "elapsed_time": "1 day, 16:45:02", "remaining_time": "1:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17219, "total_steps": 17941, "loss": 1.4213, "learning_rate": 4.173126474873501e-07, "epoch": 0.9597569812162087, "percentage": 95.98, "elapsed_time": "1 day, 16:45:10", "remaining_time": "1:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17220, "total_steps": 17941, "loss": 1.4499, "learning_rate": 4.1616541395981256e-07, "epoch": 0.9598127194693719, "percentage": 95.98, "elapsed_time": "1 day, 16:45:19", "remaining_time": "1:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17221, "total_steps": 17941, "loss": 1.9351, "learning_rate": 4.1501975294240824e-07, "epoch": 0.9598684577225349, "percentage": 95.99, "elapsed_time": "1 day, 16:45:27", "remaining_time": "1:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17222, "total_steps": 17941, "loss": 1.6842, "learning_rate": 4.1387566447148585e-07, "epoch": 0.9599241959756981, "percentage": 95.99, "elapsed_time": "1 day, 16:45:36", "remaining_time": "1:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17223, "total_steps": 17941, "loss": 1.6548, "learning_rate": 4.127331485833219e-07, "epoch": 0.9599799342288613, "percentage": 96.0, "elapsed_time": "1 day, 16:45:44", "remaining_time": "1:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17224, "total_steps": 17941, "loss": 1.7442, "learning_rate": 4.1159220531414297e-07, "epoch": 0.9600356724820244, "percentage": 96.0, "elapsed_time": "1 day, 16:45:52", "remaining_time": "1:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17225, "total_steps": 17941, "loss": 1.6952, "learning_rate": 4.104528347001368e-07, "epoch": 0.9600914107351876, "percentage": 96.01, "elapsed_time": "1 day, 16:46:01", "remaining_time": "1:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17226, "total_steps": 17941, "loss": 1.5481, "learning_rate": 4.0931503677744676e-07, "epoch": 0.9601471489883507, "percentage": 96.01, "elapsed_time": "1 day, 16:46:09", "remaining_time": "1:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17227, "total_steps": 17941, "loss": 1.7855, "learning_rate": 4.0817881158214946e-07, "epoch": 0.9602028872415138, "percentage": 96.02, "elapsed_time": "1 day, 16:46:18", "remaining_time": "1:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17228, "total_steps": 17941, "loss": 1.5109, "learning_rate": 4.070441591502716e-07, "epoch": 0.960258625494677, "percentage": 96.03, "elapsed_time": "1 day, 16:46:26", "remaining_time": "1:41:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17229, "total_steps": 17941, "loss": 1.6554, "learning_rate": 4.0591107951781227e-07, "epoch": 0.9603143637478402, "percentage": 96.03, "elapsed_time": "1 day, 16:46:35", "remaining_time": "1:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17230, "total_steps": 17941, "loss": 1.7827, "learning_rate": 4.047795727207038e-07, "epoch": 0.9603701020010033, "percentage": 96.04, "elapsed_time": "1 day, 16:46:43", "remaining_time": "1:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17231, "total_steps": 17941, "loss": 1.6885, "learning_rate": 4.03649638794823e-07, "epoch": 0.9604258402541664, "percentage": 96.04, "elapsed_time": "1 day, 16:46:52", "remaining_time": "1:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17232, "total_steps": 17941, "loss": 1.6805, "learning_rate": 4.0252127777600236e-07, "epoch": 0.9604815785073296, "percentage": 96.05, "elapsed_time": "1 day, 16:47:01", "remaining_time": "1:40:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17233, "total_steps": 17941, "loss": 1.552, "learning_rate": 4.01394489700041e-07, "epoch": 0.9605373167604927, "percentage": 96.05, "elapsed_time": "1 day, 16:47:10", "remaining_time": "1:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17234, "total_steps": 17941, "loss": 1.6936, "learning_rate": 4.0026927460266594e-07, "epoch": 0.9605930550136559, "percentage": 96.06, "elapsed_time": "1 day, 16:47:18", "remaining_time": "1:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17235, "total_steps": 17941, "loss": 1.5903, "learning_rate": 3.9914563251956525e-07, "epoch": 0.9606487932668191, "percentage": 96.06, "elapsed_time": "1 day, 16:47:27", "remaining_time": "1:40:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17236, "total_steps": 17941, "loss": 1.8814, "learning_rate": 3.98023563486366e-07, "epoch": 0.9607045315199821, "percentage": 96.07, "elapsed_time": "1 day, 16:47:35", "remaining_time": "1:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17237, "total_steps": 17941, "loss": 1.4595, "learning_rate": 3.96903067538662e-07, "epoch": 0.9607602697731453, "percentage": 96.08, "elapsed_time": "1 day, 16:47:44", "remaining_time": "1:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17238, "total_steps": 17941, "loss": 1.4028, "learning_rate": 3.9578414471199145e-07, "epoch": 0.9608160080263085, "percentage": 96.08, "elapsed_time": "1 day, 16:47:52", "remaining_time": "1:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17239, "total_steps": 17941, "loss": 1.3832, "learning_rate": 3.946667950418259e-07, "epoch": 0.9608717462794716, "percentage": 96.09, "elapsed_time": "1 day, 16:48:00", "remaining_time": "1:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17240, "total_steps": 17941, "loss": 1.5302, "learning_rate": 3.935510185636149e-07, "epoch": 0.9609274845326348, "percentage": 96.09, "elapsed_time": "1 day, 16:48:09", "remaining_time": "1:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17241, "total_steps": 17941, "loss": 1.5696, "learning_rate": 3.924368153127411e-07, "epoch": 0.9609832227857978, "percentage": 96.1, "elapsed_time": "1 day, 16:48:17", "remaining_time": "1:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17242, "total_steps": 17941, "loss": 1.5546, "learning_rate": 3.913241853245375e-07, "epoch": 0.961038961038961, "percentage": 96.1, "elapsed_time": "1 day, 16:48:26", "remaining_time": "1:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17243, "total_steps": 17941, "loss": 1.8268, "learning_rate": 3.902131286342925e-07, "epoch": 0.9610946992921242, "percentage": 96.11, "elapsed_time": "1 day, 16:48:34", "remaining_time": "1:39:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17244, "total_steps": 17941, "loss": 1.7141, "learning_rate": 3.891036452772445e-07, "epoch": 0.9611504375452873, "percentage": 96.12, "elapsed_time": "1 day, 16:48:43", "remaining_time": "1:38:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17245, "total_steps": 17941, "loss": 1.6503, "learning_rate": 3.879957352885766e-07, "epoch": 0.9612061757984505, "percentage": 96.12, "elapsed_time": "1 day, 16:48:51", "remaining_time": "1:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17246, "total_steps": 17941, "loss": 1.6333, "learning_rate": 3.868893987034272e-07, "epoch": 0.9612619140516137, "percentage": 96.13, "elapsed_time": "1 day, 16:49:00", "remaining_time": "1:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17247, "total_steps": 17941, "loss": 1.8458, "learning_rate": 3.8578463555687396e-07, "epoch": 0.9613176523047767, "percentage": 96.13, "elapsed_time": "1 day, 16:49:08", "remaining_time": "1:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17248, "total_steps": 17941, "loss": 1.7948, "learning_rate": 3.8468144588396647e-07, "epoch": 0.9613733905579399, "percentage": 96.14, "elapsed_time": "1 day, 16:49:17", "remaining_time": "1:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17249, "total_steps": 17941, "loss": 1.6938, "learning_rate": 3.8357982971968796e-07, "epoch": 0.9614291288111031, "percentage": 96.14, "elapsed_time": "1 day, 16:49:25", "remaining_time": "1:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17250, "total_steps": 17941, "loss": 1.7462, "learning_rate": 3.824797870989716e-07, "epoch": 0.9614848670642662, "percentage": 96.15, "elapsed_time": "1 day, 16:49:33", "remaining_time": "1:38:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17251, "total_steps": 17941, "loss": 1.5328, "learning_rate": 3.8138131805670606e-07, "epoch": 0.9615406053174294, "percentage": 96.15, "elapsed_time": "1 day, 16:49:42", "remaining_time": "1:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17252, "total_steps": 17941, "loss": 1.8171, "learning_rate": 3.8028442262773026e-07, "epoch": 0.9615963435705925, "percentage": 96.16, "elapsed_time": "1 day, 16:49:50", "remaining_time": "1:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17253, "total_steps": 17941, "loss": 1.6913, "learning_rate": 3.7918910084682734e-07, "epoch": 0.9616520818237556, "percentage": 96.17, "elapsed_time": "1 day, 16:49:59", "remaining_time": "1:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17254, "total_steps": 17941, "loss": 1.6028, "learning_rate": 3.780953527487363e-07, "epoch": 0.9617078200769188, "percentage": 96.17, "elapsed_time": "1 day, 16:50:07", "remaining_time": "1:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17255, "total_steps": 17941, "loss": 1.6237, "learning_rate": 3.77003178368146e-07, "epoch": 0.961763558330082, "percentage": 96.18, "elapsed_time": "1 day, 16:50:16", "remaining_time": "1:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17256, "total_steps": 17941, "loss": 1.6616, "learning_rate": 3.759125777396899e-07, "epoch": 0.961819296583245, "percentage": 96.18, "elapsed_time": "1 day, 16:50:24", "remaining_time": "1:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17257, "total_steps": 17941, "loss": 1.5478, "learning_rate": 3.7482355089796253e-07, "epoch": 0.9618750348364082, "percentage": 96.19, "elapsed_time": "1 day, 16:50:33", "remaining_time": "1:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17258, "total_steps": 17941, "loss": 1.6128, "learning_rate": 3.737360978774973e-07, "epoch": 0.9619307730895714, "percentage": 96.19, "elapsed_time": "1 day, 16:50:42", "remaining_time": "1:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17259, "total_steps": 17941, "loss": 1.5874, "learning_rate": 3.726502187127834e-07, "epoch": 0.9619865113427345, "percentage": 96.2, "elapsed_time": "1 day, 16:50:50", "remaining_time": "1:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17260, "total_steps": 17941, "loss": 1.6423, "learning_rate": 3.7156591343824874e-07, "epoch": 0.9620422495958977, "percentage": 96.2, "elapsed_time": "1 day, 16:50:59", "remaining_time": "1:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17261, "total_steps": 17941, "loss": 1.4805, "learning_rate": 3.7048318208829924e-07, "epoch": 0.9620979878490609, "percentage": 96.21, "elapsed_time": "1 day, 16:51:08", "remaining_time": "1:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17262, "total_steps": 17941, "loss": 1.646, "learning_rate": 3.694020246972574e-07, "epoch": 0.9621537261022239, "percentage": 96.22, "elapsed_time": "1 day, 16:51:16", "remaining_time": "1:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17263, "total_steps": 17941, "loss": 1.8116, "learning_rate": 3.6832244129941796e-07, "epoch": 0.9622094643553871, "percentage": 96.22, "elapsed_time": "1 day, 16:51:25", "remaining_time": "1:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17264, "total_steps": 17941, "loss": 1.5197, "learning_rate": 3.6724443192902026e-07, "epoch": 0.9622652026085502, "percentage": 96.23, "elapsed_time": "1 day, 16:51:33", "remaining_time": "1:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17265, "total_steps": 17941, "loss": 1.5514, "learning_rate": 3.6616799662024246e-07, "epoch": 0.9623209408617134, "percentage": 96.23, "elapsed_time": "1 day, 16:51:42", "remaining_time": "1:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17266, "total_steps": 17941, "loss": 1.6777, "learning_rate": 3.6509313540724067e-07, "epoch": 0.9623766791148766, "percentage": 96.24, "elapsed_time": "1 day, 16:51:51", "remaining_time": "1:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17267, "total_steps": 17941, "loss": 1.644, "learning_rate": 3.6401984832408754e-07, "epoch": 0.9624324173680396, "percentage": 96.24, "elapsed_time": "1 day, 16:51:59", "remaining_time": "1:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17268, "total_steps": 17941, "loss": 1.6234, "learning_rate": 3.629481354048281e-07, "epoch": 0.9624881556212028, "percentage": 96.25, "elapsed_time": "1 day, 16:52:09", "remaining_time": "1:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17269, "total_steps": 17941, "loss": 1.4791, "learning_rate": 3.6187799668344626e-07, "epoch": 0.962543893874366, "percentage": 96.25, "elapsed_time": "1 day, 16:52:17", "remaining_time": "1:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17270, "total_steps": 17941, "loss": 1.8732, "learning_rate": 3.608094321938871e-07, "epoch": 0.9625996321275291, "percentage": 96.26, "elapsed_time": "1 day, 16:52:26", "remaining_time": "1:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17271, "total_steps": 17941, "loss": 1.686, "learning_rate": 3.5974244197004016e-07, "epoch": 0.9626553703806923, "percentage": 96.27, "elapsed_time": "1 day, 16:52:34", "remaining_time": "1:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17272, "total_steps": 17941, "loss": 1.4681, "learning_rate": 3.5867702604573395e-07, "epoch": 0.9627111086338555, "percentage": 96.27, "elapsed_time": "1 day, 16:52:42", "remaining_time": "1:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17273, "total_steps": 17941, "loss": 1.6921, "learning_rate": 3.5761318445476367e-07, "epoch": 0.9627668468870185, "percentage": 96.28, "elapsed_time": "1 day, 16:52:51", "remaining_time": "1:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17274, "total_steps": 17941, "loss": 1.821, "learning_rate": 3.56550917230869e-07, "epoch": 0.9628225851401817, "percentage": 96.28, "elapsed_time": "1 day, 16:52:59", "remaining_time": "1:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17275, "total_steps": 17941, "loss": 1.4901, "learning_rate": 3.554902244077396e-07, "epoch": 0.9628783233933449, "percentage": 96.29, "elapsed_time": "1 day, 16:53:08", "remaining_time": "1:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17276, "total_steps": 17941, "loss": 1.3337, "learning_rate": 3.5443110601901533e-07, "epoch": 0.962934061646508, "percentage": 96.29, "elapsed_time": "1 day, 16:53:16", "remaining_time": "1:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17277, "total_steps": 17941, "loss": 1.5836, "learning_rate": 3.5337356209827477e-07, "epoch": 0.9629897998996712, "percentage": 96.3, "elapsed_time": "1 day, 16:53:25", "remaining_time": "1:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17278, "total_steps": 17941, "loss": 1.3261, "learning_rate": 3.523175926790745e-07, "epoch": 0.9630455381528343, "percentage": 96.3, "elapsed_time": "1 day, 16:53:33", "remaining_time": "1:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17279, "total_steps": 17941, "loss": 1.7087, "learning_rate": 3.512631977948877e-07, "epoch": 0.9631012764059974, "percentage": 96.31, "elapsed_time": "1 day, 16:53:42", "remaining_time": "1:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17280, "total_steps": 17941, "loss": 1.6478, "learning_rate": 3.5021037747915987e-07, "epoch": 0.9631570146591606, "percentage": 96.32, "elapsed_time": "1 day, 16:53:51", "remaining_time": "1:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17281, "total_steps": 17941, "loss": 1.8982, "learning_rate": 3.4915913176528094e-07, "epoch": 0.9632127529123238, "percentage": 96.32, "elapsed_time": "1 day, 16:53:59", "remaining_time": "1:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17282, "total_steps": 17941, "loss": 1.5759, "learning_rate": 3.481094606865909e-07, "epoch": 0.9632684911654869, "percentage": 96.33, "elapsed_time": "1 day, 16:54:08", "remaining_time": "1:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17283, "total_steps": 17941, "loss": 1.6012, "learning_rate": 3.470613642763798e-07, "epoch": 0.96332422941865, "percentage": 96.33, "elapsed_time": "1 day, 16:54:16", "remaining_time": "1:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17284, "total_steps": 17941, "loss": 1.7879, "learning_rate": 3.460148425678822e-07, "epoch": 0.9633799676718132, "percentage": 96.34, "elapsed_time": "1 day, 16:54:25", "remaining_time": "1:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17285, "total_steps": 17941, "loss": 1.6797, "learning_rate": 3.449698955942937e-07, "epoch": 0.9634357059249763, "percentage": 96.34, "elapsed_time": "1 day, 16:54:33", "remaining_time": "1:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17286, "total_steps": 17941, "loss": 1.6003, "learning_rate": 3.4392652338875453e-07, "epoch": 0.9634914441781395, "percentage": 96.35, "elapsed_time": "1 day, 16:54:41", "remaining_time": "1:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17287, "total_steps": 17941, "loss": 1.4621, "learning_rate": 3.428847259843437e-07, "epoch": 0.9635471824313026, "percentage": 96.35, "elapsed_time": "1 day, 16:54:50", "remaining_time": "1:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17288, "total_steps": 17941, "loss": 1.6383, "learning_rate": 3.418445034141127e-07, "epoch": 0.9636029206844657, "percentage": 96.36, "elapsed_time": "1 day, 16:54:58", "remaining_time": "1:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17289, "total_steps": 17941, "loss": 1.5645, "learning_rate": 3.408058557110461e-07, "epoch": 0.9636586589376289, "percentage": 96.37, "elapsed_time": "1 day, 16:55:07", "remaining_time": "1:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17290, "total_steps": 17941, "loss": 1.7982, "learning_rate": 3.3976878290808423e-07, "epoch": 0.963714397190792, "percentage": 96.37, "elapsed_time": "1 day, 16:55:15", "remaining_time": "1:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17291, "total_steps": 17941, "loss": 1.5192, "learning_rate": 3.3873328503811195e-07, "epoch": 0.9637701354439552, "percentage": 96.38, "elapsed_time": "1 day, 16:55:24", "remaining_time": "1:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17292, "total_steps": 17941, "loss": 1.4408, "learning_rate": 3.3769936213398635e-07, "epoch": 0.9638258736971184, "percentage": 96.38, "elapsed_time": "1 day, 16:55:33", "remaining_time": "1:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17293, "total_steps": 17941, "loss": 1.6641, "learning_rate": 3.366670142284756e-07, "epoch": 0.9638816119502814, "percentage": 96.39, "elapsed_time": "1 day, 16:55:42", "remaining_time": "1:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17294, "total_steps": 17941, "loss": 1.5355, "learning_rate": 3.356362413543313e-07, "epoch": 0.9639373502034446, "percentage": 96.39, "elapsed_time": "1 day, 16:55:50", "remaining_time": "1:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17295, "total_steps": 17941, "loss": 1.7866, "learning_rate": 3.346070435442439e-07, "epoch": 0.9639930884566078, "percentage": 96.4, "elapsed_time": "1 day, 16:55:59", "remaining_time": "1:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17296, "total_steps": 17941, "loss": 1.725, "learning_rate": 3.3357942083085405e-07, "epoch": 0.9640488267097709, "percentage": 96.4, "elapsed_time": "1 day, 16:56:07", "remaining_time": "1:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17297, "total_steps": 17941, "loss": 1.6818, "learning_rate": 3.325533732467523e-07, "epoch": 0.9641045649629341, "percentage": 96.41, "elapsed_time": "1 day, 16:56:15", "remaining_time": "1:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17298, "total_steps": 17941, "loss": 1.634, "learning_rate": 3.315289008244682e-07, "epoch": 0.9641603032160972, "percentage": 96.42, "elapsed_time": "1 day, 16:56:24", "remaining_time": "1:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17299, "total_steps": 17941, "loss": 1.6775, "learning_rate": 3.3050600359650354e-07, "epoch": 0.9642160414692603, "percentage": 96.42, "elapsed_time": "1 day, 16:56:32", "remaining_time": "1:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17300, "total_steps": 17941, "loss": 1.7811, "learning_rate": 3.2948468159529343e-07, "epoch": 0.9642717797224235, "percentage": 96.43, "elapsed_time": "1 day, 16:56:41", "remaining_time": "1:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17301, "total_steps": 17941, "loss": 1.6629, "learning_rate": 3.2846493485323426e-07, "epoch": 0.9643275179755867, "percentage": 96.43, "elapsed_time": "1 day, 16:56:50", "remaining_time": "1:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17302, "total_steps": 17941, "loss": 1.5419, "learning_rate": 3.274467634026557e-07, "epoch": 0.9643832562287498, "percentage": 96.44, "elapsed_time": "1 day, 16:56:58", "remaining_time": "1:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17303, "total_steps": 17941, "loss": 1.4743, "learning_rate": 3.2643016727585964e-07, "epoch": 0.964438994481913, "percentage": 96.44, "elapsed_time": "1 day, 16:57:07", "remaining_time": "1:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17304, "total_steps": 17941, "loss": 1.7358, "learning_rate": 3.2541514650508144e-07, "epoch": 0.9644947327350761, "percentage": 96.45, "elapsed_time": "1 day, 16:57:15", "remaining_time": "1:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17305, "total_steps": 17941, "loss": 1.7541, "learning_rate": 3.24401701122512e-07, "epoch": 0.9645504709882392, "percentage": 96.46, "elapsed_time": "1 day, 16:57:24", "remaining_time": "1:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17306, "total_steps": 17941, "loss": 1.6517, "learning_rate": 3.233898311602923e-07, "epoch": 0.9646062092414024, "percentage": 96.46, "elapsed_time": "1 day, 16:57:32", "remaining_time": "1:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17307, "total_steps": 17941, "loss": 1.3316, "learning_rate": 3.223795366505133e-07, "epoch": 0.9646619474945656, "percentage": 96.47, "elapsed_time": "1 day, 16:57:41", "remaining_time": "1:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17308, "total_steps": 17941, "loss": 1.8486, "learning_rate": 3.213708176252106e-07, "epoch": 0.9647176857477286, "percentage": 96.47, "elapsed_time": "1 day, 16:57:49", "remaining_time": "1:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17309, "total_steps": 17941, "loss": 1.6671, "learning_rate": 3.2036367411638066e-07, "epoch": 0.9647734240008918, "percentage": 96.48, "elapsed_time": "1 day, 16:57:58", "remaining_time": "1:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17310, "total_steps": 17941, "loss": 1.636, "learning_rate": 3.193581061559592e-07, "epoch": 0.9648291622540549, "percentage": 96.48, "elapsed_time": "1 day, 16:58:06", "remaining_time": "1:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17311, "total_steps": 17941, "loss": 1.6163, "learning_rate": 3.1835411377584833e-07, "epoch": 0.9648849005072181, "percentage": 96.49, "elapsed_time": "1 day, 16:58:14", "remaining_time": "1:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17312, "total_steps": 17941, "loss": 1.7554, "learning_rate": 3.1735169700787823e-07, "epoch": 0.9649406387603813, "percentage": 96.49, "elapsed_time": "1 day, 16:58:23", "remaining_time": "1:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17313, "total_steps": 17941, "loss": 1.5399, "learning_rate": 3.1635085588384016e-07, "epoch": 0.9649963770135443, "percentage": 96.5, "elapsed_time": "1 day, 16:58:31", "remaining_time": "1:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17314, "total_steps": 17941, "loss": 1.5671, "learning_rate": 3.1535159043547533e-07, "epoch": 0.9650521152667075, "percentage": 96.51, "elapsed_time": "1 day, 16:58:40", "remaining_time": "1:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17315, "total_steps": 17941, "loss": 1.6985, "learning_rate": 3.143539006944807e-07, "epoch": 0.9651078535198707, "percentage": 96.51, "elapsed_time": "1 day, 16:58:48", "remaining_time": "1:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17316, "total_steps": 17941, "loss": 1.3725, "learning_rate": 3.1335778669249196e-07, "epoch": 0.9651635917730338, "percentage": 96.52, "elapsed_time": "1 day, 16:58:57", "remaining_time": "1:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17317, "total_steps": 17941, "loss": 1.7234, "learning_rate": 3.1236324846110055e-07, "epoch": 0.965219330026197, "percentage": 96.52, "elapsed_time": "1 day, 16:59:05", "remaining_time": "1:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17318, "total_steps": 17941, "loss": 1.5436, "learning_rate": 3.113702860318479e-07, "epoch": 0.9652750682793602, "percentage": 96.53, "elapsed_time": "1 day, 16:59:14", "remaining_time": "1:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17319, "total_steps": 17941, "loss": 1.7209, "learning_rate": 3.1037889943622555e-07, "epoch": 0.9653308065325232, "percentage": 96.53, "elapsed_time": "1 day, 16:59:22", "remaining_time": "1:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17320, "total_steps": 17941, "loss": 1.6455, "learning_rate": 3.093890887056694e-07, "epoch": 0.9653865447856864, "percentage": 96.54, "elapsed_time": "1 day, 16:59:30", "remaining_time": "1:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17321, "total_steps": 17941, "loss": 1.4525, "learning_rate": 3.0840085387158214e-07, "epoch": 0.9654422830388496, "percentage": 96.54, "elapsed_time": "1 day, 16:59:40", "remaining_time": "1:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17322, "total_steps": 17941, "loss": 1.6845, "learning_rate": 3.074141949652942e-07, "epoch": 0.9654980212920127, "percentage": 96.55, "elapsed_time": "1 day, 16:59:48", "remaining_time": "1:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17323, "total_steps": 17941, "loss": 1.6338, "learning_rate": 3.064291120180973e-07, "epoch": 0.9655537595451759, "percentage": 96.56, "elapsed_time": "1 day, 16:59:57", "remaining_time": "1:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17324, "total_steps": 17941, "loss": 1.788, "learning_rate": 3.0544560506123865e-07, "epoch": 0.965609497798339, "percentage": 96.56, "elapsed_time": "1 day, 17:00:06", "remaining_time": "1:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17325, "total_steps": 17941, "loss": 1.6008, "learning_rate": 3.0446367412590435e-07, "epoch": 0.9656652360515021, "percentage": 96.57, "elapsed_time": "1 day, 17:00:14", "remaining_time": "1:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17326, "total_steps": 17941, "loss": 1.4603, "learning_rate": 3.034833192432418e-07, "epoch": 0.9657209743046653, "percentage": 96.57, "elapsed_time": "1 day, 17:00:23", "remaining_time": "1:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17327, "total_steps": 17941, "loss": 1.5596, "learning_rate": 3.0250454044433164e-07, "epoch": 0.9657767125578285, "percentage": 96.58, "elapsed_time": "1 day, 17:00:31", "remaining_time": "1:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17328, "total_steps": 17941, "loss": 1.4737, "learning_rate": 3.015273377602268e-07, "epoch": 0.9658324508109916, "percentage": 96.58, "elapsed_time": "1 day, 17:00:40", "remaining_time": "1:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17329, "total_steps": 17941, "loss": 1.6263, "learning_rate": 3.0055171122190806e-07, "epoch": 0.9658881890641547, "percentage": 96.59, "elapsed_time": "1 day, 17:00:48", "remaining_time": "1:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17330, "total_steps": 17941, "loss": 1.6034, "learning_rate": 2.995776608603229e-07, "epoch": 0.9659439273173179, "percentage": 96.59, "elapsed_time": "1 day, 17:00:57", "remaining_time": "1:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17331, "total_steps": 17941, "loss": 1.4754, "learning_rate": 2.986051867063577e-07, "epoch": 0.965999665570481, "percentage": 96.6, "elapsed_time": "1 day, 17:01:05", "remaining_time": "1:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17332, "total_steps": 17941, "loss": 1.6227, "learning_rate": 2.976342887908601e-07, "epoch": 0.9660554038236442, "percentage": 96.61, "elapsed_time": "1 day, 17:01:13", "remaining_time": "1:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17333, "total_steps": 17941, "loss": 1.9817, "learning_rate": 2.9666496714461645e-07, "epoch": 0.9661111420768073, "percentage": 96.61, "elapsed_time": "1 day, 17:01:22", "remaining_time": "1:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17334, "total_steps": 17941, "loss": 1.6725, "learning_rate": 2.956972217983689e-07, "epoch": 0.9661668803299704, "percentage": 96.62, "elapsed_time": "1 day, 17:01:30", "remaining_time": "1:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17335, "total_steps": 17941, "loss": 1.6861, "learning_rate": 2.947310527828151e-07, "epoch": 0.9662226185831336, "percentage": 96.62, "elapsed_time": "1 day, 17:01:39", "remaining_time": "1:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17336, "total_steps": 17941, "loss": 1.5534, "learning_rate": 2.937664601285861e-07, "epoch": 0.9662783568362967, "percentage": 96.63, "elapsed_time": "1 day, 17:01:47", "remaining_time": "1:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17337, "total_steps": 17941, "loss": 1.7596, "learning_rate": 2.928034438662797e-07, "epoch": 0.9663340950894599, "percentage": 96.63, "elapsed_time": "1 day, 17:01:56", "remaining_time": "1:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17338, "total_steps": 17941, "loss": 1.6954, "learning_rate": 2.9184200402643247e-07, "epoch": 0.9663898333426231, "percentage": 96.64, "elapsed_time": "1 day, 17:02:04", "remaining_time": "1:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17339, "total_steps": 17941, "loss": 1.6415, "learning_rate": 2.9088214063953677e-07, "epoch": 0.9664455715957861, "percentage": 96.64, "elapsed_time": "1 day, 17:02:14", "remaining_time": "1:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17340, "total_steps": 17941, "loss": 2.1054, "learning_rate": 2.8992385373603494e-07, "epoch": 0.9665013098489493, "percentage": 96.65, "elapsed_time": "1 day, 17:02:22", "remaining_time": "1:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17341, "total_steps": 17941, "loss": 1.5307, "learning_rate": 2.8896714334631925e-07, "epoch": 0.9665570481021125, "percentage": 96.66, "elapsed_time": "1 day, 17:02:30", "remaining_time": "1:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17342, "total_steps": 17941, "loss": 1.6503, "learning_rate": 2.880120095007377e-07, "epoch": 0.9666127863552756, "percentage": 96.66, "elapsed_time": "1 day, 17:02:39", "remaining_time": "1:25:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17343, "total_steps": 17941, "loss": 1.9174, "learning_rate": 2.8705845222956607e-07, "epoch": 0.9666685246084388, "percentage": 96.67, "elapsed_time": "1 day, 17:02:47", "remaining_time": "1:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17344, "total_steps": 17941, "loss": 1.422, "learning_rate": 2.861064715630579e-07, "epoch": 0.966724262861602, "percentage": 96.67, "elapsed_time": "1 day, 17:02:56", "remaining_time": "1:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17345, "total_steps": 17941, "loss": 1.5975, "learning_rate": 2.8515606753139466e-07, "epoch": 0.966780001114765, "percentage": 96.68, "elapsed_time": "1 day, 17:03:04", "remaining_time": "1:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17346, "total_steps": 17941, "loss": 1.6251, "learning_rate": 2.8420724016473e-07, "epoch": 0.9668357393679282, "percentage": 96.68, "elapsed_time": "1 day, 17:03:13", "remaining_time": "1:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17347, "total_steps": 17941, "loss": 1.6007, "learning_rate": 2.8325998949314536e-07, "epoch": 0.9668914776210914, "percentage": 96.69, "elapsed_time": "1 day, 17:03:21", "remaining_time": "1:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17348, "total_steps": 17941, "loss": 1.5968, "learning_rate": 2.823143155466834e-07, "epoch": 0.9669472158742545, "percentage": 96.69, "elapsed_time": "1 day, 17:03:30", "remaining_time": "1:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17349, "total_steps": 17941, "loss": 1.6994, "learning_rate": 2.8137021835534237e-07, "epoch": 0.9670029541274177, "percentage": 96.7, "elapsed_time": "1 day, 17:03:38", "remaining_time": "1:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17350, "total_steps": 17941, "loss": 1.6549, "learning_rate": 2.8042769794905387e-07, "epoch": 0.9670586923805808, "percentage": 96.71, "elapsed_time": "1 day, 17:03:46", "remaining_time": "1:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17351, "total_steps": 17941, "loss": 1.5995, "learning_rate": 2.794867543577162e-07, "epoch": 0.9671144306337439, "percentage": 96.71, "elapsed_time": "1 day, 17:03:55", "remaining_time": "1:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17352, "total_steps": 17941, "loss": 1.6002, "learning_rate": 2.7854738761116663e-07, "epoch": 0.9671701688869071, "percentage": 96.72, "elapsed_time": "1 day, 17:04:03", "remaining_time": "1:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17353, "total_steps": 17941, "loss": 1.9395, "learning_rate": 2.776095977391979e-07, "epoch": 0.9672259071400703, "percentage": 96.72, "elapsed_time": "1 day, 17:04:12", "remaining_time": "1:23:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17354, "total_steps": 17941, "loss": 1.6846, "learning_rate": 2.766733847715475e-07, "epoch": 0.9672816453932334, "percentage": 96.73, "elapsed_time": "1 day, 17:04:20", "remaining_time": "1:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17355, "total_steps": 17941, "loss": 1.4772, "learning_rate": 2.7573874873791373e-07, "epoch": 0.9673373836463965, "percentage": 96.73, "elapsed_time": "1 day, 17:04:29", "remaining_time": "1:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17356, "total_steps": 17941, "loss": 1.5267, "learning_rate": 2.7480568966793407e-07, "epoch": 0.9673931218995596, "percentage": 96.74, "elapsed_time": "1 day, 17:04:38", "remaining_time": "1:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17357, "total_steps": 17941, "loss": 1.6162, "learning_rate": 2.7387420759120154e-07, "epoch": 0.9674488601527228, "percentage": 96.74, "elapsed_time": "1 day, 17:04:46", "remaining_time": "1:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17358, "total_steps": 17941, "loss": 1.237, "learning_rate": 2.7294430253725357e-07, "epoch": 0.967504598405886, "percentage": 96.75, "elapsed_time": "1 day, 17:04:55", "remaining_time": "1:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17359, "total_steps": 17941, "loss": 1.5605, "learning_rate": 2.7201597453558325e-07, "epoch": 0.9675603366590491, "percentage": 96.76, "elapsed_time": "1 day, 17:05:03", "remaining_time": "1:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17360, "total_steps": 17941, "loss": 1.6469, "learning_rate": 2.710892236156337e-07, "epoch": 0.9676160749122122, "percentage": 96.76, "elapsed_time": "1 day, 17:05:12", "remaining_time": "1:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17361, "total_steps": 17941, "loss": 1.759, "learning_rate": 2.7016404980679253e-07, "epoch": 0.9676718131653754, "percentage": 96.77, "elapsed_time": "1 day, 17:05:20", "remaining_time": "1:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17362, "total_steps": 17941, "loss": 1.6129, "learning_rate": 2.6924045313840296e-07, "epoch": 0.9677275514185385, "percentage": 96.77, "elapsed_time": "1 day, 17:05:29", "remaining_time": "1:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17363, "total_steps": 17941, "loss": 1.5556, "learning_rate": 2.6831843363975815e-07, "epoch": 0.9677832896717017, "percentage": 96.78, "elapsed_time": "1 day, 17:05:37", "remaining_time": "1:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17364, "total_steps": 17941, "loss": 1.5573, "learning_rate": 2.673979913400959e-07, "epoch": 0.9678390279248649, "percentage": 96.78, "elapsed_time": "1 day, 17:05:45", "remaining_time": "1:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17365, "total_steps": 17941, "loss": 1.6159, "learning_rate": 2.664791262686095e-07, "epoch": 0.9678947661780279, "percentage": 96.79, "elapsed_time": "1 day, 17:05:54", "remaining_time": "1:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17366, "total_steps": 17941, "loss": 1.7405, "learning_rate": 2.655618384544367e-07, "epoch": 0.9679505044311911, "percentage": 96.8, "elapsed_time": "1 day, 17:06:02", "remaining_time": "1:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17367, "total_steps": 17941, "loss": 1.3257, "learning_rate": 2.6464612792666544e-07, "epoch": 0.9680062426843543, "percentage": 96.8, "elapsed_time": "1 day, 17:06:11", "remaining_time": "1:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17368, "total_steps": 17941, "loss": 1.5611, "learning_rate": 2.637319947143502e-07, "epoch": 0.9680619809375174, "percentage": 96.81, "elapsed_time": "1 day, 17:06:20", "remaining_time": "1:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17369, "total_steps": 17941, "loss": 1.795, "learning_rate": 2.6281943884646776e-07, "epoch": 0.9681177191906806, "percentage": 96.81, "elapsed_time": "1 day, 17:06:28", "remaining_time": "1:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17370, "total_steps": 17941, "loss": 1.7284, "learning_rate": 2.6190846035196725e-07, "epoch": 0.9681734574438438, "percentage": 96.82, "elapsed_time": "1 day, 17:06:37", "remaining_time": "1:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17371, "total_steps": 17941, "loss": 1.8973, "learning_rate": 2.609990592597422e-07, "epoch": 0.9682291956970068, "percentage": 96.82, "elapsed_time": "1 day, 17:06:45", "remaining_time": "1:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17372, "total_steps": 17941, "loss": 1.2629, "learning_rate": 2.600912355986196e-07, "epoch": 0.96828493395017, "percentage": 96.83, "elapsed_time": "1 day, 17:06:53", "remaining_time": "1:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17373, "total_steps": 17941, "loss": 1.6609, "learning_rate": 2.591849893974041e-07, "epoch": 0.9683406722033332, "percentage": 96.83, "elapsed_time": "1 day, 17:07:02", "remaining_time": "1:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17374, "total_steps": 17941, "loss": 1.7628, "learning_rate": 2.582803206848283e-07, "epoch": 0.9683964104564963, "percentage": 96.84, "elapsed_time": "1 day, 17:07:10", "remaining_time": "1:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17375, "total_steps": 17941, "loss": 1.3498, "learning_rate": 2.5737722948959155e-07, "epoch": 0.9684521487096595, "percentage": 96.85, "elapsed_time": "1 day, 17:07:19", "remaining_time": "1:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17376, "total_steps": 17941, "loss": 1.6097, "learning_rate": 2.5647571584032635e-07, "epoch": 0.9685078869628226, "percentage": 96.85, "elapsed_time": "1 day, 17:07:27", "remaining_time": "1:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17377, "total_steps": 17941, "loss": 1.4861, "learning_rate": 2.555757797656266e-07, "epoch": 0.9685636252159857, "percentage": 96.86, "elapsed_time": "1 day, 17:07:36", "remaining_time": "1:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17378, "total_steps": 17941, "loss": 1.6977, "learning_rate": 2.546774212940306e-07, "epoch": 0.9686193634691489, "percentage": 96.86, "elapsed_time": "1 day, 17:07:44", "remaining_time": "1:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17379, "total_steps": 17941, "loss": 1.5545, "learning_rate": 2.537806404540377e-07, "epoch": 0.968675101722312, "percentage": 96.87, "elapsed_time": "1 day, 17:07:52", "remaining_time": "1:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17380, "total_steps": 17941, "loss": 1.827, "learning_rate": 2.528854372740752e-07, "epoch": 0.9687308399754752, "percentage": 96.87, "elapsed_time": "1 day, 17:08:01", "remaining_time": "1:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17381, "total_steps": 17941, "loss": 1.4785, "learning_rate": 2.5199181178254814e-07, "epoch": 0.9687865782286383, "percentage": 96.88, "elapsed_time": "1 day, 17:08:09", "remaining_time": "1:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17382, "total_steps": 17941, "loss": 1.6028, "learning_rate": 2.510997640077839e-07, "epoch": 0.9688423164818014, "percentage": 96.88, "elapsed_time": "1 day, 17:08:18", "remaining_time": "1:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17383, "total_steps": 17941, "loss": 1.6416, "learning_rate": 2.50209293978082e-07, "epoch": 0.9688980547349646, "percentage": 96.89, "elapsed_time": "1 day, 17:08:26", "remaining_time": "1:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17384, "total_steps": 17941, "loss": 1.5737, "learning_rate": 2.493204017216755e-07, "epoch": 0.9689537929881278, "percentage": 96.9, "elapsed_time": "1 day, 17:08:35", "remaining_time": "1:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17385, "total_steps": 17941, "loss": 1.6412, "learning_rate": 2.4843308726676396e-07, "epoch": 0.9690095312412909, "percentage": 96.9, "elapsed_time": "1 day, 17:08:43", "remaining_time": "1:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17386, "total_steps": 17941, "loss": 1.6683, "learning_rate": 2.475473506414805e-07, "epoch": 0.969065269494454, "percentage": 96.91, "elapsed_time": "1 day, 17:08:52", "remaining_time": "1:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17387, "total_steps": 17941, "loss": 1.6574, "learning_rate": 2.466631918739193e-07, "epoch": 0.9691210077476172, "percentage": 96.91, "elapsed_time": "1 day, 17:09:00", "remaining_time": "1:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17388, "total_steps": 17941, "loss": 1.7983, "learning_rate": 2.45780610992119e-07, "epoch": 0.9691767460007803, "percentage": 96.92, "elapsed_time": "1 day, 17:09:09", "remaining_time": "1:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17389, "total_steps": 17941, "loss": 1.8562, "learning_rate": 2.44899608024074e-07, "epoch": 0.9692324842539435, "percentage": 96.92, "elapsed_time": "1 day, 17:09:17", "remaining_time": "1:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17390, "total_steps": 17941, "loss": 1.2506, "learning_rate": 2.4402018299771736e-07, "epoch": 0.9692882225071067, "percentage": 96.93, "elapsed_time": "1 day, 17:09:26", "remaining_time": "1:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17391, "total_steps": 17941, "loss": 1.6392, "learning_rate": 2.4314233594094904e-07, "epoch": 0.9693439607602697, "percentage": 96.93, "elapsed_time": "1 day, 17:09:34", "remaining_time": "1:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17392, "total_steps": 17941, "loss": 1.6612, "learning_rate": 2.422660668815968e-07, "epoch": 0.9693996990134329, "percentage": 96.94, "elapsed_time": "1 day, 17:09:42", "remaining_time": "1:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17393, "total_steps": 17941, "loss": 1.6994, "learning_rate": 2.4139137584745507e-07, "epoch": 0.9694554372665961, "percentage": 96.95, "elapsed_time": "1 day, 17:09:51", "remaining_time": "1:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17394, "total_steps": 17941, "loss": 1.5613, "learning_rate": 2.4051826286627386e-07, "epoch": 0.9695111755197592, "percentage": 96.95, "elapsed_time": "1 day, 17:10:00", "remaining_time": "1:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17395, "total_steps": 17941, "loss": 1.5602, "learning_rate": 2.396467279657255e-07, "epoch": 0.9695669137729224, "percentage": 96.96, "elapsed_time": "1 day, 17:10:08", "remaining_time": "1:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17396, "total_steps": 17941, "loss": 1.6979, "learning_rate": 2.387767711734712e-07, "epoch": 0.9696226520260856, "percentage": 96.96, "elapsed_time": "1 day, 17:10:16", "remaining_time": "1:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17397, "total_steps": 17941, "loss": 1.5671, "learning_rate": 2.379083925170833e-07, "epoch": 0.9696783902792486, "percentage": 96.97, "elapsed_time": "1 day, 17:10:25", "remaining_time": "1:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17398, "total_steps": 17941, "loss": 1.728, "learning_rate": 2.3704159202410647e-07, "epoch": 0.9697341285324118, "percentage": 96.97, "elapsed_time": "1 day, 17:10:34", "remaining_time": "1:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17399, "total_steps": 17941, "loss": 1.612, "learning_rate": 2.361763697220354e-07, "epoch": 0.969789866785575, "percentage": 96.98, "elapsed_time": "1 day, 17:10:42", "remaining_time": "1:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17400, "total_steps": 17941, "loss": 1.7587, "learning_rate": 2.3531272563830364e-07, "epoch": 0.9698456050387381, "percentage": 96.98, "elapsed_time": "1 day, 17:10:52", "remaining_time": "1:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17401, "total_steps": 17941, "loss": 1.6518, "learning_rate": 2.3445065980031156e-07, "epoch": 0.9699013432919013, "percentage": 96.99, "elapsed_time": "1 day, 17:11:00", "remaining_time": "1:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17402, "total_steps": 17941, "loss": 1.7213, "learning_rate": 2.335901722353817e-07, "epoch": 0.9699570815450643, "percentage": 97.0, "elapsed_time": "1 day, 17:11:08", "remaining_time": "1:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17403, "total_steps": 17941, "loss": 1.5702, "learning_rate": 2.3273126297082003e-07, "epoch": 0.9700128197982275, "percentage": 97.0, "elapsed_time": "1 day, 17:11:17", "remaining_time": "1:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17404, "total_steps": 17941, "loss": 1.7451, "learning_rate": 2.3187393203385476e-07, "epoch": 0.9700685580513907, "percentage": 97.01, "elapsed_time": "1 day, 17:11:25", "remaining_time": "1:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17405, "total_steps": 17941, "loss": 1.7603, "learning_rate": 2.310181794516808e-07, "epoch": 0.9701242963045538, "percentage": 97.01, "elapsed_time": "1 day, 17:11:34", "remaining_time": "1:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17406, "total_steps": 17941, "loss": 1.701, "learning_rate": 2.301640052514431e-07, "epoch": 0.970180034557717, "percentage": 97.02, "elapsed_time": "1 day, 17:11:42", "remaining_time": "1:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17407, "total_steps": 17941, "loss": 1.5951, "learning_rate": 2.2931140946021445e-07, "epoch": 0.9702357728108801, "percentage": 97.02, "elapsed_time": "1 day, 17:11:51", "remaining_time": "1:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17408, "total_steps": 17941, "loss": 1.5476, "learning_rate": 2.2846039210505653e-07, "epoch": 0.9702915110640432, "percentage": 97.03, "elapsed_time": "1 day, 17:11:59", "remaining_time": "1:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17409, "total_steps": 17941, "loss": 1.5117, "learning_rate": 2.2761095321293667e-07, "epoch": 0.9703472493172064, "percentage": 97.03, "elapsed_time": "1 day, 17:12:07", "remaining_time": "1:15:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17410, "total_steps": 17941, "loss": 1.5716, "learning_rate": 2.2676309281080555e-07, "epoch": 0.9704029875703696, "percentage": 97.04, "elapsed_time": "1 day, 17:12:16", "remaining_time": "1:15:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17411, "total_steps": 17941, "loss": 1.7473, "learning_rate": 2.2591681092555827e-07, "epoch": 0.9704587258235327, "percentage": 97.05, "elapsed_time": "1 day, 17:12:24", "remaining_time": "1:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17412, "total_steps": 17941, "loss": 1.954, "learning_rate": 2.2507210758401787e-07, "epoch": 0.9705144640766958, "percentage": 97.05, "elapsed_time": "1 day, 17:12:33", "remaining_time": "1:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17413, "total_steps": 17941, "loss": 1.4049, "learning_rate": 2.2422898281299064e-07, "epoch": 0.970570202329859, "percentage": 97.06, "elapsed_time": "1 day, 17:12:41", "remaining_time": "1:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17414, "total_steps": 17941, "loss": 1.6264, "learning_rate": 2.233874366391997e-07, "epoch": 0.9706259405830221, "percentage": 97.06, "elapsed_time": "1 day, 17:12:50", "remaining_time": "1:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17415, "total_steps": 17941, "loss": 1.4372, "learning_rate": 2.2254746908934588e-07, "epoch": 0.9706816788361853, "percentage": 97.07, "elapsed_time": "1 day, 17:12:59", "remaining_time": "1:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17416, "total_steps": 17941, "loss": 1.4728, "learning_rate": 2.2170908019006344e-07, "epoch": 0.9707374170893485, "percentage": 97.07, "elapsed_time": "1 day, 17:13:07", "remaining_time": "1:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17417, "total_steps": 17941, "loss": 1.7119, "learning_rate": 2.2087226996794218e-07, "epoch": 0.9707931553425115, "percentage": 97.08, "elapsed_time": "1 day, 17:13:16", "remaining_time": "1:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17418, "total_steps": 17941, "loss": 1.5581, "learning_rate": 2.200370384495165e-07, "epoch": 0.9708488935956747, "percentage": 97.08, "elapsed_time": "1 day, 17:13:24", "remaining_time": "1:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17419, "total_steps": 17941, "loss": 1.4902, "learning_rate": 2.1920338566128185e-07, "epoch": 0.9709046318488379, "percentage": 97.09, "elapsed_time": "1 day, 17:13:32", "remaining_time": "1:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17420, "total_steps": 17941, "loss": 1.5332, "learning_rate": 2.1837131162967263e-07, "epoch": 0.970960370102001, "percentage": 97.1, "elapsed_time": "1 day, 17:13:41", "remaining_time": "1:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17421, "total_steps": 17941, "loss": 1.7266, "learning_rate": 2.1754081638107326e-07, "epoch": 0.9710161083551642, "percentage": 97.1, "elapsed_time": "1 day, 17:13:50", "remaining_time": "1:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17422, "total_steps": 17941, "loss": 1.7387, "learning_rate": 2.1671189994183493e-07, "epoch": 0.9710718466083273, "percentage": 97.11, "elapsed_time": "1 day, 17:13:58", "remaining_time": "1:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17423, "total_steps": 17941, "loss": 1.6106, "learning_rate": 2.1588456233823662e-07, "epoch": 0.9711275848614904, "percentage": 97.11, "elapsed_time": "1 day, 17:14:06", "remaining_time": "1:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17424, "total_steps": 17941, "loss": 1.6707, "learning_rate": 2.1505880359651842e-07, "epoch": 0.9711833231146536, "percentage": 97.12, "elapsed_time": "1 day, 17:14:15", "remaining_time": "1:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17425, "total_steps": 17941, "loss": 1.5115, "learning_rate": 2.1423462374286496e-07, "epoch": 0.9712390613678167, "percentage": 97.12, "elapsed_time": "1 day, 17:14:23", "remaining_time": "1:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17426, "total_steps": 17941, "loss": 1.4976, "learning_rate": 2.1341202280342198e-07, "epoch": 0.9712947996209799, "percentage": 97.13, "elapsed_time": "1 day, 17:14:32", "remaining_time": "1:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17427, "total_steps": 17941, "loss": 1.6415, "learning_rate": 2.125910008042742e-07, "epoch": 0.971350537874143, "percentage": 97.14, "elapsed_time": "1 day, 17:14:40", "remaining_time": "1:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17428, "total_steps": 17941, "loss": 1.8922, "learning_rate": 2.1177155777145075e-07, "epoch": 0.9714062761273061, "percentage": 97.14, "elapsed_time": "1 day, 17:14:50", "remaining_time": "1:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17429, "total_steps": 17941, "loss": 1.7416, "learning_rate": 2.1095369373095864e-07, "epoch": 0.9714620143804693, "percentage": 97.15, "elapsed_time": "1 day, 17:14:58", "remaining_time": "1:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17430, "total_steps": 17941, "loss": 1.6385, "learning_rate": 2.1013740870872157e-07, "epoch": 0.9715177526336325, "percentage": 97.15, "elapsed_time": "1 day, 17:15:07", "remaining_time": "1:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17431, "total_steps": 17941, "loss": 1.6032, "learning_rate": 2.0932270273062993e-07, "epoch": 0.9715734908867956, "percentage": 97.16, "elapsed_time": "1 day, 17:15:15", "remaining_time": "1:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17432, "total_steps": 17941, "loss": 1.8481, "learning_rate": 2.0850957582252418e-07, "epoch": 0.9716292291399587, "percentage": 97.16, "elapsed_time": "1 day, 17:15:24", "remaining_time": "1:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17433, "total_steps": 17941, "loss": 1.6074, "learning_rate": 2.0769802801018923e-07, "epoch": 0.9716849673931219, "percentage": 97.17, "elapsed_time": "1 day, 17:15:32", "remaining_time": "1:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17434, "total_steps": 17941, "loss": 1.6911, "learning_rate": 2.0688805931936006e-07, "epoch": 0.971740705646285, "percentage": 97.17, "elapsed_time": "1 day, 17:15:40", "remaining_time": "1:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17435, "total_steps": 17941, "loss": 1.805, "learning_rate": 2.0607966977573278e-07, "epoch": 0.9717964438994482, "percentage": 97.18, "elapsed_time": "1 day, 17:15:49", "remaining_time": "1:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17436, "total_steps": 17941, "loss": 1.5898, "learning_rate": 2.052728594049369e-07, "epoch": 0.9718521821526114, "percentage": 97.19, "elapsed_time": "1 day, 17:15:57", "remaining_time": "1:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17437, "total_steps": 17941, "loss": 1.556, "learning_rate": 2.0446762823256304e-07, "epoch": 0.9719079204057745, "percentage": 97.19, "elapsed_time": "1 day, 17:16:06", "remaining_time": "1:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17438, "total_steps": 17941, "loss": 1.7866, "learning_rate": 2.0366397628414634e-07, "epoch": 0.9719636586589376, "percentage": 97.2, "elapsed_time": "1 day, 17:16:15", "remaining_time": "1:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17439, "total_steps": 17941, "loss": 1.6995, "learning_rate": 2.0286190358517753e-07, "epoch": 0.9720193969121008, "percentage": 97.2, "elapsed_time": "1 day, 17:16:23", "remaining_time": "1:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17440, "total_steps": 17941, "loss": 1.2878, "learning_rate": 2.020614101610918e-07, "epoch": 0.9720751351652639, "percentage": 97.21, "elapsed_time": "1 day, 17:16:32", "remaining_time": "1:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17441, "total_steps": 17941, "loss": 1.5829, "learning_rate": 2.0126249603727998e-07, "epoch": 0.9721308734184271, "percentage": 97.21, "elapsed_time": "1 day, 17:16:41", "remaining_time": "1:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17442, "total_steps": 17941, "loss": 1.535, "learning_rate": 2.0046516123906623e-07, "epoch": 0.9721866116715903, "percentage": 97.22, "elapsed_time": "1 day, 17:16:49", "remaining_time": "1:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17443, "total_steps": 17941, "loss": 1.5099, "learning_rate": 1.9966940579175253e-07, "epoch": 0.9722423499247533, "percentage": 97.22, "elapsed_time": "1 day, 17:16:58", "remaining_time": "1:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17444, "total_steps": 17941, "loss": 1.5699, "learning_rate": 1.988752297205687e-07, "epoch": 0.9722980881779165, "percentage": 97.23, "elapsed_time": "1 day, 17:17:06", "remaining_time": "1:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17445, "total_steps": 17941, "loss": 1.4562, "learning_rate": 1.980826330507002e-07, "epoch": 0.9723538264310797, "percentage": 97.24, "elapsed_time": "1 day, 17:17:15", "remaining_time": "1:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17446, "total_steps": 17941, "loss": 1.5444, "learning_rate": 1.9729161580728794e-07, "epoch": 0.9724095646842428, "percentage": 97.24, "elapsed_time": "1 day, 17:17:24", "remaining_time": "1:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17447, "total_steps": 17941, "loss": 1.7887, "learning_rate": 1.9650217801540637e-07, "epoch": 0.972465302937406, "percentage": 97.25, "elapsed_time": "1 day, 17:17:32", "remaining_time": "1:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17448, "total_steps": 17941, "loss": 1.3856, "learning_rate": 1.9571431970011322e-07, "epoch": 0.972521041190569, "percentage": 97.25, "elapsed_time": "1 day, 17:17:42", "remaining_time": "1:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17449, "total_steps": 17941, "loss": 1.621, "learning_rate": 1.9492804088637739e-07, "epoch": 0.9725767794437322, "percentage": 97.26, "elapsed_time": "1 day, 17:17:50", "remaining_time": "1:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17450, "total_steps": 17941, "loss": 1.5547, "learning_rate": 1.9414334159914006e-07, "epoch": 0.9726325176968954, "percentage": 97.26, "elapsed_time": "1 day, 17:17:58", "remaining_time": "1:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17451, "total_steps": 17941, "loss": 1.7351, "learning_rate": 1.9336022186328683e-07, "epoch": 0.9726882559500585, "percentage": 97.27, "elapsed_time": "1 day, 17:18:07", "remaining_time": "1:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17452, "total_steps": 17941, "loss": 1.4511, "learning_rate": 1.9257868170365346e-07, "epoch": 0.9727439942032217, "percentage": 97.27, "elapsed_time": "1 day, 17:18:16", "remaining_time": "1:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17453, "total_steps": 17941, "loss": 1.5941, "learning_rate": 1.9179872114503118e-07, "epoch": 0.9727997324563848, "percentage": 97.28, "elapsed_time": "1 day, 17:18:24", "remaining_time": "1:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17454, "total_steps": 17941, "loss": 1.5145, "learning_rate": 1.9102034021215022e-07, "epoch": 0.9728554707095479, "percentage": 97.29, "elapsed_time": "1 day, 17:18:33", "remaining_time": "1:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17455, "total_steps": 17941, "loss": 1.8374, "learning_rate": 1.9024353892969639e-07, "epoch": 0.9729112089627111, "percentage": 97.29, "elapsed_time": "1 day, 17:18:41", "remaining_time": "1:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17456, "total_steps": 17941, "loss": 1.6687, "learning_rate": 1.8946831732231107e-07, "epoch": 0.9729669472158743, "percentage": 97.3, "elapsed_time": "1 day, 17:18:50", "remaining_time": "1:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17457, "total_steps": 17941, "loss": 1.7319, "learning_rate": 1.886946754145691e-07, "epoch": 0.9730226854690374, "percentage": 97.3, "elapsed_time": "1 day, 17:18:58", "remaining_time": "1:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17458, "total_steps": 17941, "loss": 1.7592, "learning_rate": 1.879226132310119e-07, "epoch": 0.9730784237222005, "percentage": 97.31, "elapsed_time": "1 day, 17:19:07", "remaining_time": "1:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17459, "total_steps": 17941, "loss": 1.7894, "learning_rate": 1.8715213079612548e-07, "epoch": 0.9731341619753637, "percentage": 97.31, "elapsed_time": "1 day, 17:19:15", "remaining_time": "1:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17460, "total_steps": 17941, "loss": 1.751, "learning_rate": 1.8638322813435138e-07, "epoch": 0.9731899002285268, "percentage": 97.32, "elapsed_time": "1 day, 17:19:23", "remaining_time": "1:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17461, "total_steps": 17941, "loss": 1.8523, "learning_rate": 1.85615905270059e-07, "epoch": 0.97324563848169, "percentage": 97.32, "elapsed_time": "1 day, 17:19:32", "remaining_time": "1:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17462, "total_steps": 17941, "loss": 1.7618, "learning_rate": 1.8485016222759555e-07, "epoch": 0.9733013767348532, "percentage": 97.33, "elapsed_time": "1 day, 17:19:41", "remaining_time": "1:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17463, "total_steps": 17941, "loss": 1.5608, "learning_rate": 1.8408599903124156e-07, "epoch": 0.9733571149880162, "percentage": 97.34, "elapsed_time": "1 day, 17:19:49", "remaining_time": "1:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17464, "total_steps": 17941, "loss": 1.2819, "learning_rate": 1.8332341570523326e-07, "epoch": 0.9734128532411794, "percentage": 97.34, "elapsed_time": "1 day, 17:19:58", "remaining_time": "1:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17465, "total_steps": 17941, "loss": 1.7922, "learning_rate": 1.8256241227375682e-07, "epoch": 0.9734685914943426, "percentage": 97.35, "elapsed_time": "1 day, 17:20:07", "remaining_time": "1:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17466, "total_steps": 17941, "loss": 1.6168, "learning_rate": 1.8180298876094294e-07, "epoch": 0.9735243297475057, "percentage": 97.35, "elapsed_time": "1 day, 17:20:15", "remaining_time": "1:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17467, "total_steps": 17941, "loss": 1.6254, "learning_rate": 1.810451451908779e-07, "epoch": 0.9735800680006689, "percentage": 97.36, "elapsed_time": "1 day, 17:20:25", "remaining_time": "1:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17468, "total_steps": 17941, "loss": 1.3905, "learning_rate": 1.8028888158759806e-07, "epoch": 0.9736358062538321, "percentage": 97.36, "elapsed_time": "1 day, 17:20:33", "remaining_time": "1:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17469, "total_steps": 17941, "loss": 1.7984, "learning_rate": 1.7953419797508418e-07, "epoch": 0.9736915445069951, "percentage": 97.37, "elapsed_time": "1 day, 17:20:42", "remaining_time": "1:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17470, "total_steps": 17941, "loss": 1.5176, "learning_rate": 1.7878109437727275e-07, "epoch": 0.9737472827601583, "percentage": 97.37, "elapsed_time": "1 day, 17:20:50", "remaining_time": "1:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17471, "total_steps": 17941, "loss": 1.5487, "learning_rate": 1.780295708180446e-07, "epoch": 0.9738030210133214, "percentage": 97.38, "elapsed_time": "1 day, 17:20:59", "remaining_time": "1:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17472, "total_steps": 17941, "loss": 1.1495, "learning_rate": 1.772796273212418e-07, "epoch": 0.9738587592664846, "percentage": 97.39, "elapsed_time": "1 day, 17:21:07", "remaining_time": "1:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17473, "total_steps": 17941, "loss": 1.4882, "learning_rate": 1.7653126391063422e-07, "epoch": 0.9739144975196478, "percentage": 97.39, "elapsed_time": "1 day, 17:21:15", "remaining_time": "1:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17474, "total_steps": 17941, "loss": 1.449, "learning_rate": 1.757844806099751e-07, "epoch": 0.9739702357728108, "percentage": 97.4, "elapsed_time": "1 day, 17:21:24", "remaining_time": "1:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17475, "total_steps": 17941, "loss": 1.6215, "learning_rate": 1.750392774429288e-07, "epoch": 0.974025974025974, "percentage": 97.4, "elapsed_time": "1 day, 17:21:33", "remaining_time": "1:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17476, "total_steps": 17941, "loss": 1.6578, "learning_rate": 1.7429565443313755e-07, "epoch": 0.9740817122791372, "percentage": 97.41, "elapsed_time": "1 day, 17:21:41", "remaining_time": "1:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17477, "total_steps": 17941, "loss": 1.4979, "learning_rate": 1.735536116041825e-07, "epoch": 0.9741374505323003, "percentage": 97.41, "elapsed_time": "1 day, 17:21:49", "remaining_time": "1:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17478, "total_steps": 17941, "loss": 1.406, "learning_rate": 1.7281314897960587e-07, "epoch": 0.9741931887854635, "percentage": 97.42, "elapsed_time": "1 day, 17:21:58", "remaining_time": "1:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17479, "total_steps": 17941, "loss": 1.8241, "learning_rate": 1.7207426658287783e-07, "epoch": 0.9742489270386266, "percentage": 97.42, "elapsed_time": "1 day, 17:22:07", "remaining_time": "1:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17480, "total_steps": 17941, "loss": 1.4602, "learning_rate": 1.7133696443743518e-07, "epoch": 0.9743046652917897, "percentage": 97.43, "elapsed_time": "1 day, 17:22:15", "remaining_time": "1:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17481, "total_steps": 17941, "loss": 1.4693, "learning_rate": 1.7060124256667032e-07, "epoch": 0.9743604035449529, "percentage": 97.44, "elapsed_time": "1 day, 17:22:24", "remaining_time": "1:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17482, "total_steps": 17941, "loss": 1.5575, "learning_rate": 1.6986710099390347e-07, "epoch": 0.9744161417981161, "percentage": 97.44, "elapsed_time": "1 day, 17:22:33", "remaining_time": "1:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17483, "total_steps": 17941, "loss": 1.3921, "learning_rate": 1.6913453974242155e-07, "epoch": 0.9744718800512792, "percentage": 97.45, "elapsed_time": "1 day, 17:22:42", "remaining_time": "1:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17484, "total_steps": 17941, "loss": 1.8316, "learning_rate": 1.6840355883546154e-07, "epoch": 0.9745276183044423, "percentage": 97.45, "elapsed_time": "1 day, 17:22:50", "remaining_time": "1:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17485, "total_steps": 17941, "loss": 1.7087, "learning_rate": 1.6767415829619936e-07, "epoch": 0.9745833565576055, "percentage": 97.46, "elapsed_time": "1 day, 17:22:58", "remaining_time": "1:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17486, "total_steps": 17941, "loss": 1.8712, "learning_rate": 1.6694633814777204e-07, "epoch": 0.9746390948107686, "percentage": 97.46, "elapsed_time": "1 day, 17:23:07", "remaining_time": "1:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17487, "total_steps": 17941, "loss": 1.6848, "learning_rate": 1.662200984132556e-07, "epoch": 0.9746948330639318, "percentage": 97.47, "elapsed_time": "1 day, 17:23:15", "remaining_time": "1:04:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17488, "total_steps": 17941, "loss": 1.5194, "learning_rate": 1.6549543911569265e-07, "epoch": 0.974750571317095, "percentage": 97.48, "elapsed_time": "1 day, 17:23:25", "remaining_time": "1:04:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17489, "total_steps": 17941, "loss": 1.6262, "learning_rate": 1.6477236027805376e-07, "epoch": 0.974806309570258, "percentage": 97.48, "elapsed_time": "1 day, 17:23:34", "remaining_time": "1:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17490, "total_steps": 17941, "loss": 1.6148, "learning_rate": 1.6405086192328168e-07, "epoch": 0.9748620478234212, "percentage": 97.49, "elapsed_time": "1 day, 17:23:42", "remaining_time": "1:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17491, "total_steps": 17941, "loss": 1.8156, "learning_rate": 1.63330944074247e-07, "epoch": 0.9749177860765844, "percentage": 97.49, "elapsed_time": "1 day, 17:23:50", "remaining_time": "1:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17492, "total_steps": 17941, "loss": 1.5922, "learning_rate": 1.6261260675379254e-07, "epoch": 0.9749735243297475, "percentage": 97.5, "elapsed_time": "1 day, 17:23:59", "remaining_time": "1:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17493, "total_steps": 17941, "loss": 1.6144, "learning_rate": 1.6189584998468897e-07, "epoch": 0.9750292625829107, "percentage": 97.5, "elapsed_time": "1 day, 17:24:07", "remaining_time": "1:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17494, "total_steps": 17941, "loss": 1.4621, "learning_rate": 1.6118067378967373e-07, "epoch": 0.9750850008360737, "percentage": 97.51, "elapsed_time": "1 day, 17:24:16", "remaining_time": "1:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17495, "total_steps": 17941, "loss": 1.6115, "learning_rate": 1.604670781914286e-07, "epoch": 0.9751407390892369, "percentage": 97.51, "elapsed_time": "1 day, 17:24:24", "remaining_time": "1:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17496, "total_steps": 17941, "loss": 1.7181, "learning_rate": 1.5975506321257995e-07, "epoch": 0.9751964773424001, "percentage": 97.52, "elapsed_time": "1 day, 17:24:34", "remaining_time": "1:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17497, "total_steps": 17941, "loss": 1.6811, "learning_rate": 1.5904462887571526e-07, "epoch": 0.9752522155955632, "percentage": 97.53, "elapsed_time": "1 day, 17:24:42", "remaining_time": "1:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17498, "total_steps": 17941, "loss": 1.6505, "learning_rate": 1.5833577520336652e-07, "epoch": 0.9753079538487264, "percentage": 97.53, "elapsed_time": "1 day, 17:24:50", "remaining_time": "1:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17499, "total_steps": 17941, "loss": 1.5923, "learning_rate": 1.5762850221799908e-07, "epoch": 0.9753636921018896, "percentage": 97.54, "elapsed_time": "1 day, 17:24:59", "remaining_time": "1:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17500, "total_steps": 17941, "loss": 1.5352, "learning_rate": 1.5692280994206166e-07, "epoch": 0.9754194303550526, "percentage": 97.54, "elapsed_time": "1 day, 17:25:07", "remaining_time": "1:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17501, "total_steps": 17941, "loss": 1.6762, "learning_rate": 1.5621869839792525e-07, "epoch": 0.9754751686082158, "percentage": 97.55, "elapsed_time": "1 day, 17:25:16", "remaining_time": "1:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17502, "total_steps": 17941, "loss": 1.6437, "learning_rate": 1.5551616760792198e-07, "epoch": 0.975530906861379, "percentage": 97.55, "elapsed_time": "1 day, 17:25:24", "remaining_time": "1:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17503, "total_steps": 17941, "loss": 1.8254, "learning_rate": 1.5481521759433403e-07, "epoch": 0.9755866451145421, "percentage": 97.56, "elapsed_time": "1 day, 17:25:33", "remaining_time": "1:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17504, "total_steps": 17941, "loss": 1.7997, "learning_rate": 1.5411584837938808e-07, "epoch": 0.9756423833677053, "percentage": 97.56, "elapsed_time": "1 day, 17:25:41", "remaining_time": "1:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17505, "total_steps": 17941, "loss": 1.4193, "learning_rate": 1.5341805998526638e-07, "epoch": 0.9756981216208684, "percentage": 97.57, "elapsed_time": "1 day, 17:25:50", "remaining_time": "1:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17506, "total_steps": 17941, "loss": 1.8292, "learning_rate": 1.527218524341012e-07, "epoch": 0.9757538598740315, "percentage": 97.58, "elapsed_time": "1 day, 17:25:58", "remaining_time": "1:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17507, "total_steps": 17941, "loss": 1.6791, "learning_rate": 1.520272257479638e-07, "epoch": 0.9758095981271947, "percentage": 97.58, "elapsed_time": "1 day, 17:26:07", "remaining_time": "1:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17508, "total_steps": 17941, "loss": 1.6145, "learning_rate": 1.5133417994889208e-07, "epoch": 0.9758653363803579, "percentage": 97.59, "elapsed_time": "1 day, 17:26:16", "remaining_time": "1:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17509, "total_steps": 17941, "loss": 1.5854, "learning_rate": 1.5064271505886297e-07, "epoch": 0.975921074633521, "percentage": 97.59, "elapsed_time": "1 day, 17:26:24", "remaining_time": "1:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17510, "total_steps": 17941, "loss": 1.7567, "learning_rate": 1.4995283109980329e-07, "epoch": 0.9759768128866841, "percentage": 97.6, "elapsed_time": "1 day, 17:26:33", "remaining_time": "1:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17511, "total_steps": 17941, "loss": 1.4395, "learning_rate": 1.4926452809359004e-07, "epoch": 0.9760325511398473, "percentage": 97.6, "elapsed_time": "1 day, 17:26:41", "remaining_time": "1:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17512, "total_steps": 17941, "loss": 1.6581, "learning_rate": 1.4857780606206685e-07, "epoch": 0.9760882893930104, "percentage": 97.61, "elapsed_time": "1 day, 17:26:50", "remaining_time": "1:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17513, "total_steps": 17941, "loss": 1.6412, "learning_rate": 1.4789266502699406e-07, "epoch": 0.9761440276461736, "percentage": 97.61, "elapsed_time": "1 day, 17:26:59", "remaining_time": "1:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17514, "total_steps": 17941, "loss": 1.7759, "learning_rate": 1.4720910501010432e-07, "epoch": 0.9761997658993368, "percentage": 97.62, "elapsed_time": "1 day, 17:27:07", "remaining_time": "1:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17515, "total_steps": 17941, "loss": 1.4624, "learning_rate": 1.4652712603308583e-07, "epoch": 0.9762555041524998, "percentage": 97.63, "elapsed_time": "1 day, 17:27:16", "remaining_time": "1:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17516, "total_steps": 17941, "loss": 1.7039, "learning_rate": 1.4584672811756017e-07, "epoch": 0.976311242405663, "percentage": 97.63, "elapsed_time": "1 day, 17:27:24", "remaining_time": "1:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17517, "total_steps": 17941, "loss": 1.5521, "learning_rate": 1.4516791128510453e-07, "epoch": 0.9763669806588261, "percentage": 97.64, "elapsed_time": "1 day, 17:27:33", "remaining_time": "1:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17518, "total_steps": 17941, "loss": 1.688, "learning_rate": 1.444906755572517e-07, "epoch": 0.9764227189119893, "percentage": 97.64, "elapsed_time": "1 day, 17:27:41", "remaining_time": "1:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17519, "total_steps": 17941, "loss": 1.3975, "learning_rate": 1.438150209554734e-07, "epoch": 0.9764784571651525, "percentage": 97.65, "elapsed_time": "1 day, 17:27:50", "remaining_time": "0:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17520, "total_steps": 17941, "loss": 1.686, "learning_rate": 1.4314094750120244e-07, "epoch": 0.9765341954183155, "percentage": 97.65, "elapsed_time": "1 day, 17:27:58", "remaining_time": "0:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17521, "total_steps": 17941, "loss": 1.7495, "learning_rate": 1.424684552158162e-07, "epoch": 0.9765899336714787, "percentage": 97.66, "elapsed_time": "1 day, 17:28:06", "remaining_time": "0:59:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17522, "total_steps": 17941, "loss": 1.6879, "learning_rate": 1.4179754412064205e-07, "epoch": 0.9766456719246419, "percentage": 97.66, "elapsed_time": "1 day, 17:28:15", "remaining_time": "0:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17523, "total_steps": 17941, "loss": 1.643, "learning_rate": 1.4112821423695188e-07, "epoch": 0.976701410177805, "percentage": 97.67, "elapsed_time": "1 day, 17:28:23", "remaining_time": "0:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17524, "total_steps": 17941, "loss": 1.7498, "learning_rate": 1.4046046558598424e-07, "epoch": 0.9767571484309682, "percentage": 97.68, "elapsed_time": "1 day, 17:28:32", "remaining_time": "0:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17525, "total_steps": 17941, "loss": 1.4685, "learning_rate": 1.397942981889e-07, "epoch": 0.9768128866841314, "percentage": 97.68, "elapsed_time": "1 day, 17:28:40", "remaining_time": "0:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17526, "total_steps": 17941, "loss": 1.5475, "learning_rate": 1.3912971206684333e-07, "epoch": 0.9768686249372944, "percentage": 97.69, "elapsed_time": "1 day, 17:28:49", "remaining_time": "0:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17527, "total_steps": 17941, "loss": 1.6087, "learning_rate": 1.3846670724088073e-07, "epoch": 0.9769243631904576, "percentage": 97.69, "elapsed_time": "1 day, 17:28:57", "remaining_time": "0:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17528, "total_steps": 17941, "loss": 1.8259, "learning_rate": 1.3780528373203984e-07, "epoch": 0.9769801014436208, "percentage": 97.7, "elapsed_time": "1 day, 17:29:06", "remaining_time": "0:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17529, "total_steps": 17941, "loss": 1.5683, "learning_rate": 1.3714544156129828e-07, "epoch": 0.9770358396967839, "percentage": 97.7, "elapsed_time": "1 day, 17:29:14", "remaining_time": "0:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17530, "total_steps": 17941, "loss": 1.84, "learning_rate": 1.3648718074958378e-07, "epoch": 0.977091577949947, "percentage": 97.71, "elapsed_time": "1 day, 17:29:23", "remaining_time": "0:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17531, "total_steps": 17941, "loss": 1.6083, "learning_rate": 1.3583050131777408e-07, "epoch": 0.9771473162031102, "percentage": 97.71, "elapsed_time": "1 day, 17:29:32", "remaining_time": "0:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17532, "total_steps": 17941, "loss": 1.6145, "learning_rate": 1.3517540328669143e-07, "epoch": 0.9772030544562733, "percentage": 97.72, "elapsed_time": "1 day, 17:29:40", "remaining_time": "0:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17533, "total_steps": 17941, "loss": 1.6176, "learning_rate": 1.3452188667711364e-07, "epoch": 0.9772587927094365, "percentage": 97.73, "elapsed_time": "1 day, 17:29:49", "remaining_time": "0:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17534, "total_steps": 17941, "loss": 1.6213, "learning_rate": 1.33869951509763e-07, "epoch": 0.9773145309625997, "percentage": 97.73, "elapsed_time": "1 day, 17:29:57", "remaining_time": "0:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17535, "total_steps": 17941, "loss": 1.476, "learning_rate": 1.3321959780531747e-07, "epoch": 0.9773702692157628, "percentage": 97.74, "elapsed_time": "1 day, 17:30:06", "remaining_time": "0:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17536, "total_steps": 17941, "loss": 1.5191, "learning_rate": 1.3257082558440493e-07, "epoch": 0.9774260074689259, "percentage": 97.74, "elapsed_time": "1 day, 17:30:15", "remaining_time": "0:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17537, "total_steps": 17941, "loss": 1.5931, "learning_rate": 1.319236348675923e-07, "epoch": 0.9774817457220891, "percentage": 97.75, "elapsed_time": "1 day, 17:30:23", "remaining_time": "0:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17538, "total_steps": 17941, "loss": 1.5943, "learning_rate": 1.312780256754187e-07, "epoch": 0.9775374839752522, "percentage": 97.75, "elapsed_time": "1 day, 17:30:32", "remaining_time": "0:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17539, "total_steps": 17941, "loss": 1.6834, "learning_rate": 1.306339980283511e-07, "epoch": 0.9775932222284154, "percentage": 97.76, "elapsed_time": "1 day, 17:30:40", "remaining_time": "0:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17540, "total_steps": 17941, "loss": 1.6299, "learning_rate": 1.29991551946812e-07, "epoch": 0.9776489604815785, "percentage": 97.76, "elapsed_time": "1 day, 17:30:48", "remaining_time": "0:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17541, "total_steps": 17941, "loss": 1.5637, "learning_rate": 1.2935068745117962e-07, "epoch": 0.9777046987347416, "percentage": 97.77, "elapsed_time": "1 day, 17:30:57", "remaining_time": "0:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17542, "total_steps": 17941, "loss": 1.7262, "learning_rate": 1.28711404561771e-07, "epoch": 0.9777604369879048, "percentage": 97.78, "elapsed_time": "1 day, 17:31:05", "remaining_time": "0:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17543, "total_steps": 17941, "loss": 1.6842, "learning_rate": 1.2807370329887546e-07, "epoch": 0.9778161752410679, "percentage": 97.78, "elapsed_time": "1 day, 17:31:14", "remaining_time": "0:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17544, "total_steps": 17941, "loss": 1.7178, "learning_rate": 1.2743758368270464e-07, "epoch": 0.9778719134942311, "percentage": 97.79, "elapsed_time": "1 day, 17:31:22", "remaining_time": "0:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17545, "total_steps": 17941, "loss": 1.4419, "learning_rate": 1.268030457334368e-07, "epoch": 0.9779276517473943, "percentage": 97.79, "elapsed_time": "1 day, 17:31:31", "remaining_time": "0:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17546, "total_steps": 17941, "loss": 1.5456, "learning_rate": 1.261700894711948e-07, "epoch": 0.9779833900005573, "percentage": 97.8, "elapsed_time": "1 day, 17:31:39", "remaining_time": "0:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17547, "total_steps": 17941, "loss": 1.6811, "learning_rate": 1.2553871491605697e-07, "epoch": 0.9780391282537205, "percentage": 97.8, "elapsed_time": "1 day, 17:31:48", "remaining_time": "0:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17548, "total_steps": 17941, "loss": 1.5014, "learning_rate": 1.249089220880406e-07, "epoch": 0.9780948665068837, "percentage": 97.81, "elapsed_time": "1 day, 17:31:57", "remaining_time": "0:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17549, "total_steps": 17941, "loss": 1.6858, "learning_rate": 1.2428071100711869e-07, "epoch": 0.9781506047600468, "percentage": 97.82, "elapsed_time": "1 day, 17:32:06", "remaining_time": "0:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17550, "total_steps": 17941, "loss": 1.5579, "learning_rate": 1.2365408169321968e-07, "epoch": 0.97820634301321, "percentage": 97.82, "elapsed_time": "1 day, 17:32:14", "remaining_time": "0:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17551, "total_steps": 17941, "loss": 1.5839, "learning_rate": 1.2302903416621103e-07, "epoch": 0.9782620812663732, "percentage": 97.83, "elapsed_time": "1 day, 17:32:23", "remaining_time": "0:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17552, "total_steps": 17941, "loss": 1.5508, "learning_rate": 1.2240556844592133e-07, "epoch": 0.9783178195195362, "percentage": 97.83, "elapsed_time": "1 day, 17:32:31", "remaining_time": "0:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17553, "total_steps": 17941, "loss": 1.7075, "learning_rate": 1.217836845521181e-07, "epoch": 0.9783735577726994, "percentage": 97.84, "elapsed_time": "1 day, 17:32:39", "remaining_time": "0:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17554, "total_steps": 17941, "loss": 1.8348, "learning_rate": 1.2116338250452995e-07, "epoch": 0.9784292960258626, "percentage": 97.84, "elapsed_time": "1 day, 17:32:48", "remaining_time": "0:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17555, "total_steps": 17941, "loss": 1.9305, "learning_rate": 1.2054466232282457e-07, "epoch": 0.9784850342790257, "percentage": 97.85, "elapsed_time": "1 day, 17:32:57", "remaining_time": "0:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17556, "total_steps": 17941, "loss": 1.5773, "learning_rate": 1.199275240266251e-07, "epoch": 0.9785407725321889, "percentage": 97.85, "elapsed_time": "1 day, 17:33:06", "remaining_time": "0:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17557, "total_steps": 17941, "loss": 1.493, "learning_rate": 1.1931196763549924e-07, "epoch": 0.978596510785352, "percentage": 97.86, "elapsed_time": "1 day, 17:33:14", "remaining_time": "0:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17558, "total_steps": 17941, "loss": 1.4702, "learning_rate": 1.1869799316897579e-07, "epoch": 0.9786522490385151, "percentage": 97.87, "elapsed_time": "1 day, 17:33:23", "remaining_time": "0:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17559, "total_steps": 17941, "loss": 1.7745, "learning_rate": 1.1808560064652807e-07, "epoch": 0.9787079872916783, "percentage": 97.87, "elapsed_time": "1 day, 17:33:31", "remaining_time": "0:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17560, "total_steps": 17941, "loss": 1.6221, "learning_rate": 1.1747479008756835e-07, "epoch": 0.9787637255448415, "percentage": 97.88, "elapsed_time": "1 day, 17:33:40", "remaining_time": "0:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17561, "total_steps": 17941, "loss": 1.5683, "learning_rate": 1.1686556151147554e-07, "epoch": 0.9788194637980046, "percentage": 97.88, "elapsed_time": "1 day, 17:33:48", "remaining_time": "0:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17562, "total_steps": 17941, "loss": 1.5488, "learning_rate": 1.1625791493756755e-07, "epoch": 0.9788752020511677, "percentage": 97.89, "elapsed_time": "1 day, 17:33:56", "remaining_time": "0:53:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17563, "total_steps": 17941, "loss": 1.6573, "learning_rate": 1.1565185038511229e-07, "epoch": 0.9789309403043308, "percentage": 97.89, "elapsed_time": "1 day, 17:34:05", "remaining_time": "0:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17564, "total_steps": 17941, "loss": 1.8614, "learning_rate": 1.150473678733388e-07, "epoch": 0.978986678557494, "percentage": 97.9, "elapsed_time": "1 day, 17:34:13", "remaining_time": "0:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17565, "total_steps": 17941, "loss": 1.281, "learning_rate": 1.1444446742141512e-07, "epoch": 0.9790424168106572, "percentage": 97.9, "elapsed_time": "1 day, 17:34:22", "remaining_time": "0:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17566, "total_steps": 17941, "loss": 1.7311, "learning_rate": 1.1384314904845372e-07, "epoch": 0.9790981550638203, "percentage": 97.91, "elapsed_time": "1 day, 17:34:30", "remaining_time": "0:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17567, "total_steps": 17941, "loss": 1.5461, "learning_rate": 1.1324341277353378e-07, "epoch": 0.9791538933169834, "percentage": 97.92, "elapsed_time": "1 day, 17:34:39", "remaining_time": "0:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17568, "total_steps": 17941, "loss": 1.6261, "learning_rate": 1.1264525861567344e-07, "epoch": 0.9792096315701466, "percentage": 97.92, "elapsed_time": "1 day, 17:34:47", "remaining_time": "0:52:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17569, "total_steps": 17941, "loss": 1.5654, "learning_rate": 1.1204868659384082e-07, "epoch": 0.9792653698233097, "percentage": 97.93, "elapsed_time": "1 day, 17:34:56", "remaining_time": "0:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17570, "total_steps": 17941, "loss": 1.4733, "learning_rate": 1.1145369672695971e-07, "epoch": 0.9793211080764729, "percentage": 97.93, "elapsed_time": "1 day, 17:35:04", "remaining_time": "0:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17571, "total_steps": 17941, "loss": 1.724, "learning_rate": 1.1086028903389833e-07, "epoch": 0.9793768463296361, "percentage": 97.94, "elapsed_time": "1 day, 17:35:13", "remaining_time": "0:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17572, "total_steps": 17941, "loss": 1.6512, "learning_rate": 1.1026846353346943e-07, "epoch": 0.9794325845827991, "percentage": 97.94, "elapsed_time": "1 day, 17:35:21", "remaining_time": "0:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17573, "total_steps": 17941, "loss": 1.7214, "learning_rate": 1.096782202444524e-07, "epoch": 0.9794883228359623, "percentage": 97.95, "elapsed_time": "1 day, 17:35:30", "remaining_time": "0:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17574, "total_steps": 17941, "loss": 1.6191, "learning_rate": 1.0908955918556007e-07, "epoch": 0.9795440610891255, "percentage": 97.95, "elapsed_time": "1 day, 17:35:38", "remaining_time": "0:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17575, "total_steps": 17941, "loss": 1.5329, "learning_rate": 1.0850248037546085e-07, "epoch": 0.9795997993422886, "percentage": 97.96, "elapsed_time": "1 day, 17:35:47", "remaining_time": "0:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17576, "total_steps": 17941, "loss": 1.6629, "learning_rate": 1.0791698383277315e-07, "epoch": 0.9796555375954518, "percentage": 97.97, "elapsed_time": "1 day, 17:35:56", "remaining_time": "0:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17577, "total_steps": 17941, "loss": 1.6974, "learning_rate": 1.0733306957607104e-07, "epoch": 0.979711275848615, "percentage": 97.97, "elapsed_time": "1 day, 17:36:04", "remaining_time": "0:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17578, "total_steps": 17941, "loss": 1.6688, "learning_rate": 1.06750737623873e-07, "epoch": 0.979767014101778, "percentage": 97.98, "elapsed_time": "1 day, 17:36:13", "remaining_time": "0:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17579, "total_steps": 17941, "loss": 1.7467, "learning_rate": 1.0616998799463651e-07, "epoch": 0.9798227523549412, "percentage": 97.98, "elapsed_time": "1 day, 17:36:22", "remaining_time": "0:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17580, "total_steps": 17941, "loss": 1.8833, "learning_rate": 1.0559082070679127e-07, "epoch": 0.9798784906081044, "percentage": 97.99, "elapsed_time": "1 day, 17:36:30", "remaining_time": "0:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17581, "total_steps": 17941, "loss": 1.5387, "learning_rate": 1.0501323577870037e-07, "epoch": 0.9799342288612675, "percentage": 97.99, "elapsed_time": "1 day, 17:36:39", "remaining_time": "0:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17582, "total_steps": 17941, "loss": 1.6262, "learning_rate": 1.0443723322868248e-07, "epoch": 0.9799899671144306, "percentage": 98.0, "elapsed_time": "1 day, 17:36:47", "remaining_time": "0:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17583, "total_steps": 17941, "loss": 1.5699, "learning_rate": 1.0386281307500079e-07, "epoch": 0.9800457053675938, "percentage": 98.0, "elapsed_time": "1 day, 17:36:55", "remaining_time": "0:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17584, "total_steps": 17941, "loss": 1.6014, "learning_rate": 1.0328997533587958e-07, "epoch": 0.9801014436207569, "percentage": 98.01, "elapsed_time": "1 day, 17:37:04", "remaining_time": "0:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17585, "total_steps": 17941, "loss": 1.7115, "learning_rate": 1.0271872002948213e-07, "epoch": 0.9801571818739201, "percentage": 98.02, "elapsed_time": "1 day, 17:37:13", "remaining_time": "0:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17586, "total_steps": 17941, "loss": 1.6098, "learning_rate": 1.0214904717392171e-07, "epoch": 0.9802129201270832, "percentage": 98.02, "elapsed_time": "1 day, 17:37:22", "remaining_time": "0:50:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17587, "total_steps": 17941, "loss": 1.4817, "learning_rate": 1.0158095678727275e-07, "epoch": 0.9802686583802463, "percentage": 98.03, "elapsed_time": "1 day, 17:37:30", "remaining_time": "0:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17588, "total_steps": 17941, "loss": 1.4595, "learning_rate": 1.0101444888754308e-07, "epoch": 0.9803243966334095, "percentage": 98.03, "elapsed_time": "1 day, 17:37:38", "remaining_time": "0:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17589, "total_steps": 17941, "loss": 1.6758, "learning_rate": 1.004495234927072e-07, "epoch": 0.9803801348865726, "percentage": 98.04, "elapsed_time": "1 day, 17:37:47", "remaining_time": "0:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17590, "total_steps": 17941, "loss": 1.9659, "learning_rate": 9.988618062068411e-08, "epoch": 0.9804358731397358, "percentage": 98.04, "elapsed_time": "1 day, 17:37:55", "remaining_time": "0:49:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17591, "total_steps": 17941, "loss": 1.8171, "learning_rate": 9.93244202893262e-08, "epoch": 0.980491611392899, "percentage": 98.05, "elapsed_time": "1 day, 17:38:04", "remaining_time": "0:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17592, "total_steps": 17941, "loss": 1.6474, "learning_rate": 9.87642425164581e-08, "epoch": 0.980547349646062, "percentage": 98.05, "elapsed_time": "1 day, 17:38:12", "remaining_time": "0:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17593, "total_steps": 17941, "loss": 1.7013, "learning_rate": 9.820564731984339e-08, "epoch": 0.9806030878992252, "percentage": 98.06, "elapsed_time": "1 day, 17:38:21", "remaining_time": "0:49:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17594, "total_steps": 17941, "loss": 1.7987, "learning_rate": 9.764863471719565e-08, "epoch": 0.9806588261523884, "percentage": 98.07, "elapsed_time": "1 day, 17:38:30", "remaining_time": "0:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17595, "total_steps": 17941, "loss": 1.6046, "learning_rate": 9.70932047261841e-08, "epoch": 0.9807145644055515, "percentage": 98.07, "elapsed_time": "1 day, 17:38:39", "remaining_time": "0:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17596, "total_steps": 17941, "loss": 1.7104, "learning_rate": 9.653935736442244e-08, "epoch": 0.9807703026587147, "percentage": 98.08, "elapsed_time": "1 day, 17:38:47", "remaining_time": "0:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17597, "total_steps": 17941, "loss": 1.4238, "learning_rate": 9.598709264947436e-08, "epoch": 0.9808260409118779, "percentage": 98.08, "elapsed_time": "1 day, 17:38:56", "remaining_time": "0:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17598, "total_steps": 17941, "loss": 1.8799, "learning_rate": 9.543641059885922e-08, "epoch": 0.9808817791650409, "percentage": 98.09, "elapsed_time": "1 day, 17:39:04", "remaining_time": "0:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17599, "total_steps": 17941, "loss": 1.4658, "learning_rate": 9.48873112300297e-08, "epoch": 0.9809375174182041, "percentage": 98.09, "elapsed_time": "1 day, 17:39:13", "remaining_time": "0:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17600, "total_steps": 17941, "loss": 1.5968, "learning_rate": 9.433979456041631e-08, "epoch": 0.9809932556713673, "percentage": 98.1, "elapsed_time": "1 day, 17:39:21", "remaining_time": "0:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17601, "total_steps": 17941, "loss": 1.655, "learning_rate": 9.379386060736628e-08, "epoch": 0.9810489939245304, "percentage": 98.1, "elapsed_time": "1 day, 17:39:30", "remaining_time": "0:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17602, "total_steps": 17941, "loss": 1.6373, "learning_rate": 9.324950938820465e-08, "epoch": 0.9811047321776936, "percentage": 98.11, "elapsed_time": "1 day, 17:39:38", "remaining_time": "0:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17603, "total_steps": 17941, "loss": 1.5491, "learning_rate": 9.270674092019537e-08, "epoch": 0.9811604704308567, "percentage": 98.12, "elapsed_time": "1 day, 17:39:47", "remaining_time": "0:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17604, "total_steps": 17941, "loss": 1.5259, "learning_rate": 9.216555522054692e-08, "epoch": 0.9812162086840198, "percentage": 98.12, "elapsed_time": "1 day, 17:39:56", "remaining_time": "0:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17605, "total_steps": 17941, "loss": 1.589, "learning_rate": 9.162595230642334e-08, "epoch": 0.981271946937183, "percentage": 98.13, "elapsed_time": "1 day, 17:40:04", "remaining_time": "0:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17606, "total_steps": 17941, "loss": 1.5886, "learning_rate": 9.108793219493872e-08, "epoch": 0.9813276851903462, "percentage": 98.13, "elapsed_time": "1 day, 17:40:13", "remaining_time": "0:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17607, "total_steps": 17941, "loss": 1.4713, "learning_rate": 9.055149490315163e-08, "epoch": 0.9813834234435093, "percentage": 98.14, "elapsed_time": "1 day, 17:40:21", "remaining_time": "0:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17608, "total_steps": 17941, "loss": 1.5119, "learning_rate": 9.001664044808733e-08, "epoch": 0.9814391616966724, "percentage": 98.14, "elapsed_time": "1 day, 17:40:30", "remaining_time": "0:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17609, "total_steps": 17941, "loss": 1.5986, "learning_rate": 8.94833688466934e-08, "epoch": 0.9814948999498355, "percentage": 98.15, "elapsed_time": "1 day, 17:40:39", "remaining_time": "0:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17610, "total_steps": 17941, "loss": 1.6371, "learning_rate": 8.895168011588961e-08, "epoch": 0.9815506382029987, "percentage": 98.16, "elapsed_time": "1 day, 17:40:47", "remaining_time": "0:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17611, "total_steps": 17941, "loss": 1.4524, "learning_rate": 8.842157427254027e-08, "epoch": 0.9816063764561619, "percentage": 98.16, "elapsed_time": "1 day, 17:40:56", "remaining_time": "0:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17612, "total_steps": 17941, "loss": 1.5316, "learning_rate": 8.78930513334486e-08, "epoch": 0.981662114709325, "percentage": 98.17, "elapsed_time": "1 day, 17:41:04", "remaining_time": "0:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17613, "total_steps": 17941, "loss": 1.6934, "learning_rate": 8.736611131538452e-08, "epoch": 0.9817178529624881, "percentage": 98.17, "elapsed_time": "1 day, 17:41:12", "remaining_time": "0:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17614, "total_steps": 17941, "loss": 1.676, "learning_rate": 8.684075423505688e-08, "epoch": 0.9817735912156513, "percentage": 98.18, "elapsed_time": "1 day, 17:41:21", "remaining_time": "0:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17615, "total_steps": 17941, "loss": 1.5567, "learning_rate": 8.631698010912459e-08, "epoch": 0.9818293294688144, "percentage": 98.18, "elapsed_time": "1 day, 17:41:29", "remaining_time": "0:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17616, "total_steps": 17941, "loss": 1.5866, "learning_rate": 8.579478895420212e-08, "epoch": 0.9818850677219776, "percentage": 98.19, "elapsed_time": "1 day, 17:41:38", "remaining_time": "0:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17617, "total_steps": 17941, "loss": 1.729, "learning_rate": 8.527418078684845e-08, "epoch": 0.9819408059751408, "percentage": 98.19, "elapsed_time": "1 day, 17:41:47", "remaining_time": "0:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17618, "total_steps": 17941, "loss": 1.5519, "learning_rate": 8.475515562357816e-08, "epoch": 0.9819965442283038, "percentage": 98.2, "elapsed_time": "1 day, 17:41:55", "remaining_time": "0:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17619, "total_steps": 17941, "loss": 1.3238, "learning_rate": 8.423771348084474e-08, "epoch": 0.982052282481467, "percentage": 98.21, "elapsed_time": "1 day, 17:42:03", "remaining_time": "0:45:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17620, "total_steps": 17941, "loss": 1.6958, "learning_rate": 8.372185437506285e-08, "epoch": 0.9821080207346302, "percentage": 98.21, "elapsed_time": "1 day, 17:42:12", "remaining_time": "0:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17621, "total_steps": 17941, "loss": 1.5099, "learning_rate": 8.320757832259163e-08, "epoch": 0.9821637589877933, "percentage": 98.22, "elapsed_time": "1 day, 17:42:20", "remaining_time": "0:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17622, "total_steps": 17941, "loss": 1.8139, "learning_rate": 8.269488533974024e-08, "epoch": 0.9822194972409565, "percentage": 98.22, "elapsed_time": "1 day, 17:42:29", "remaining_time": "0:45:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17623, "total_steps": 17941, "loss": 1.7761, "learning_rate": 8.21837754427679e-08, "epoch": 0.9822752354941197, "percentage": 98.23, "elapsed_time": "1 day, 17:42:37", "remaining_time": "0:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17624, "total_steps": 17941, "loss": 1.5626, "learning_rate": 8.167424864788942e-08, "epoch": 0.9823309737472827, "percentage": 98.23, "elapsed_time": "1 day, 17:42:46", "remaining_time": "0:45:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17625, "total_steps": 17941, "loss": 1.29, "learning_rate": 8.1166304971253e-08, "epoch": 0.9823867120004459, "percentage": 98.24, "elapsed_time": "1 day, 17:42:54", "remaining_time": "0:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17626, "total_steps": 17941, "loss": 1.779, "learning_rate": 8.065994442897906e-08, "epoch": 0.9824424502536091, "percentage": 98.24, "elapsed_time": "1 day, 17:43:03", "remaining_time": "0:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17627, "total_steps": 17941, "loss": 1.5287, "learning_rate": 8.015516703712145e-08, "epoch": 0.9824981885067722, "percentage": 98.25, "elapsed_time": "1 day, 17:43:11", "remaining_time": "0:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17628, "total_steps": 17941, "loss": 1.6058, "learning_rate": 7.965197281168957e-08, "epoch": 0.9825539267599354, "percentage": 98.26, "elapsed_time": "1 day, 17:43:19", "remaining_time": "0:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17629, "total_steps": 17941, "loss": 1.5269, "learning_rate": 7.915036176864288e-08, "epoch": 0.9826096650130985, "percentage": 98.26, "elapsed_time": "1 day, 17:43:28", "remaining_time": "0:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17630, "total_steps": 17941, "loss": 1.6304, "learning_rate": 7.865033392388533e-08, "epoch": 0.9826654032662616, "percentage": 98.27, "elapsed_time": "1 day, 17:43:36", "remaining_time": "0:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17631, "total_steps": 17941, "loss": 1.6169, "learning_rate": 7.815188929327644e-08, "epoch": 0.9827211415194248, "percentage": 98.27, "elapsed_time": "1 day, 17:43:45", "remaining_time": "0:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17632, "total_steps": 17941, "loss": 1.4114, "learning_rate": 7.76550278926258e-08, "epoch": 0.9827768797725879, "percentage": 98.28, "elapsed_time": "1 day, 17:43:53", "remaining_time": "0:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17633, "total_steps": 17941, "loss": 1.5866, "learning_rate": 7.715974973769302e-08, "epoch": 0.9828326180257511, "percentage": 98.28, "elapsed_time": "1 day, 17:44:02", "remaining_time": "0:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17634, "total_steps": 17941, "loss": 1.4801, "learning_rate": 7.666605484417666e-08, "epoch": 0.9828883562789142, "percentage": 98.29, "elapsed_time": "1 day, 17:44:10", "remaining_time": "0:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17635, "total_steps": 17941, "loss": 1.5682, "learning_rate": 7.617394322774752e-08, "epoch": 0.9829440945320773, "percentage": 98.29, "elapsed_time": "1 day, 17:44:18", "remaining_time": "0:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17636, "total_steps": 17941, "loss": 1.7344, "learning_rate": 7.568341490399866e-08, "epoch": 0.9829998327852405, "percentage": 98.3, "elapsed_time": "1 day, 17:44:27", "remaining_time": "0:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17637, "total_steps": 17941, "loss": 1.6406, "learning_rate": 7.519446988849543e-08, "epoch": 0.9830555710384037, "percentage": 98.31, "elapsed_time": "1 day, 17:44:36", "remaining_time": "0:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17638, "total_steps": 17941, "loss": 1.6992, "learning_rate": 7.470710819674209e-08, "epoch": 0.9831113092915668, "percentage": 98.31, "elapsed_time": "1 day, 17:44:44", "remaining_time": "0:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17639, "total_steps": 17941, "loss": 1.5221, "learning_rate": 7.422132984419294e-08, "epoch": 0.9831670475447299, "percentage": 98.32, "elapsed_time": "1 day, 17:44:52", "remaining_time": "0:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17640, "total_steps": 17941, "loss": 1.9106, "learning_rate": 7.373713484625789e-08, "epoch": 0.9832227857978931, "percentage": 98.32, "elapsed_time": "1 day, 17:45:01", "remaining_time": "0:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17641, "total_steps": 17941, "loss": 2.0823, "learning_rate": 7.325452321828574e-08, "epoch": 0.9832785240510562, "percentage": 98.33, "elapsed_time": "1 day, 17:45:10", "remaining_time": "0:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17642, "total_steps": 17941, "loss": 1.5629, "learning_rate": 7.277349497559205e-08, "epoch": 0.9833342623042194, "percentage": 98.33, "elapsed_time": "1 day, 17:45:18", "remaining_time": "0:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17643, "total_steps": 17941, "loss": 1.4567, "learning_rate": 7.229405013342572e-08, "epoch": 0.9833900005573826, "percentage": 98.34, "elapsed_time": "1 day, 17:45:27", "remaining_time": "0:42:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17644, "total_steps": 17941, "loss": 1.6365, "learning_rate": 7.18161887069968e-08, "epoch": 0.9834457388105456, "percentage": 98.34, "elapsed_time": "1 day, 17:45:36", "remaining_time": "0:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17645, "total_steps": 17941, "loss": 1.6963, "learning_rate": 7.133991071145429e-08, "epoch": 0.9835014770637088, "percentage": 98.35, "elapsed_time": "1 day, 17:45:44", "remaining_time": "0:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17646, "total_steps": 17941, "loss": 1.8795, "learning_rate": 7.086521616190279e-08, "epoch": 0.983557215316872, "percentage": 98.36, "elapsed_time": "1 day, 17:45:52", "remaining_time": "0:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17647, "total_steps": 17941, "loss": 1.7972, "learning_rate": 7.039210507340244e-08, "epoch": 0.9836129535700351, "percentage": 98.36, "elapsed_time": "1 day, 17:46:01", "remaining_time": "0:41:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17648, "total_steps": 17941, "loss": 1.6461, "learning_rate": 6.992057746095237e-08, "epoch": 0.9836686918231983, "percentage": 98.37, "elapsed_time": "1 day, 17:46:09", "remaining_time": "0:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17649, "total_steps": 17941, "loss": 1.5296, "learning_rate": 6.945063333951285e-08, "epoch": 0.9837244300763615, "percentage": 98.37, "elapsed_time": "1 day, 17:46:18", "remaining_time": "0:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17650, "total_steps": 17941, "loss": 1.7309, "learning_rate": 6.898227272398305e-08, "epoch": 0.9837801683295245, "percentage": 98.38, "elapsed_time": "1 day, 17:46:27", "remaining_time": "0:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17651, "total_steps": 17941, "loss": 1.4404, "learning_rate": 6.851549562921223e-08, "epoch": 0.9838359065826877, "percentage": 98.38, "elapsed_time": "1 day, 17:46:35", "remaining_time": "0:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17652, "total_steps": 17941, "loss": 1.515, "learning_rate": 6.805030207001629e-08, "epoch": 0.9838916448358509, "percentage": 98.39, "elapsed_time": "1 day, 17:46:44", "remaining_time": "0:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17653, "total_steps": 17941, "loss": 1.7107, "learning_rate": 6.758669206113899e-08, "epoch": 0.983947383089014, "percentage": 98.39, "elapsed_time": "1 day, 17:46:52", "remaining_time": "0:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17654, "total_steps": 17941, "loss": 1.7174, "learning_rate": 6.71246656172797e-08, "epoch": 0.9840031213421772, "percentage": 98.4, "elapsed_time": "1 day, 17:47:01", "remaining_time": "0:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17655, "total_steps": 17941, "loss": 1.7076, "learning_rate": 6.666422275310446e-08, "epoch": 0.9840588595953402, "percentage": 98.41, "elapsed_time": "1 day, 17:47:09", "remaining_time": "0:40:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17656, "total_steps": 17941, "loss": 1.5258, "learning_rate": 6.620536348320716e-08, "epoch": 0.9841145978485034, "percentage": 98.41, "elapsed_time": "1 day, 17:47:18", "remaining_time": "0:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17657, "total_steps": 17941, "loss": 1.6819, "learning_rate": 6.574808782214282e-08, "epoch": 0.9841703361016666, "percentage": 98.42, "elapsed_time": "1 day, 17:47:26", "remaining_time": "0:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17658, "total_steps": 17941, "loss": 1.5465, "learning_rate": 6.529239578440539e-08, "epoch": 0.9842260743548297, "percentage": 98.42, "elapsed_time": "1 day, 17:47:34", "remaining_time": "0:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17659, "total_steps": 17941, "loss": 1.7137, "learning_rate": 6.483828738446107e-08, "epoch": 0.9842818126079929, "percentage": 98.43, "elapsed_time": "1 day, 17:47:43", "remaining_time": "0:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17660, "total_steps": 17941, "loss": 1.4516, "learning_rate": 6.438576263669838e-08, "epoch": 0.984337550861156, "percentage": 98.43, "elapsed_time": "1 day, 17:47:52", "remaining_time": "0:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17661, "total_steps": 17941, "loss": 1.5397, "learning_rate": 6.393482155547803e-08, "epoch": 0.9843932891143191, "percentage": 98.44, "elapsed_time": "1 day, 17:48:00", "remaining_time": "0:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17662, "total_steps": 17941, "loss": 1.6758, "learning_rate": 6.34854641550997e-08, "epoch": 0.9844490273674823, "percentage": 98.44, "elapsed_time": "1 day, 17:48:09", "remaining_time": "0:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17663, "total_steps": 17941, "loss": 1.4918, "learning_rate": 6.303769044980757e-08, "epoch": 0.9845047656206455, "percentage": 98.45, "elapsed_time": "1 day, 17:48:17", "remaining_time": "0:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17664, "total_steps": 17941, "loss": 1.7168, "learning_rate": 6.259150045381245e-08, "epoch": 0.9845605038738086, "percentage": 98.46, "elapsed_time": "1 day, 17:48:26", "remaining_time": "0:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17665, "total_steps": 17941, "loss": 1.562, "learning_rate": 6.214689418125308e-08, "epoch": 0.9846162421269717, "percentage": 98.46, "elapsed_time": "1 day, 17:48:35", "remaining_time": "0:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17666, "total_steps": 17941, "loss": 1.4466, "learning_rate": 6.170387164624036e-08, "epoch": 0.9846719803801349, "percentage": 98.47, "elapsed_time": "1 day, 17:48:43", "remaining_time": "0:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17667, "total_steps": 17941, "loss": 1.3996, "learning_rate": 6.126243286281863e-08, "epoch": 0.984727718633298, "percentage": 98.47, "elapsed_time": "1 day, 17:48:51", "remaining_time": "0:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17668, "total_steps": 17941, "loss": 1.4558, "learning_rate": 6.082257784499335e-08, "epoch": 0.9847834568864612, "percentage": 98.48, "elapsed_time": "1 day, 17:49:00", "remaining_time": "0:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17669, "total_steps": 17941, "loss": 1.5282, "learning_rate": 6.038430660670891e-08, "epoch": 0.9848391951396244, "percentage": 98.48, "elapsed_time": "1 day, 17:49:08", "remaining_time": "0:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17670, "total_steps": 17941, "loss": 1.5312, "learning_rate": 5.99476191618653e-08, "epoch": 0.9848949333927874, "percentage": 98.49, "elapsed_time": "1 day, 17:49:17", "remaining_time": "0:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17671, "total_steps": 17941, "loss": 1.6531, "learning_rate": 5.9512515524312586e-08, "epoch": 0.9849506716459506, "percentage": 98.5, "elapsed_time": "1 day, 17:49:25", "remaining_time": "0:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17672, "total_steps": 17941, "loss": 1.3456, "learning_rate": 5.9078995707845255e-08, "epoch": 0.9850064098991138, "percentage": 98.5, "elapsed_time": "1 day, 17:49:34", "remaining_time": "0:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17673, "total_steps": 17941, "loss": 1.581, "learning_rate": 5.864705972622453e-08, "epoch": 0.9850621481522769, "percentage": 98.51, "elapsed_time": "1 day, 17:49:43", "remaining_time": "0:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17674, "total_steps": 17941, "loss": 1.5573, "learning_rate": 5.8216707593133915e-08, "epoch": 0.9851178864054401, "percentage": 98.51, "elapsed_time": "1 day, 17:49:52", "remaining_time": "0:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17675, "total_steps": 17941, "loss": 1.4311, "learning_rate": 5.77879393222347e-08, "epoch": 0.9851736246586033, "percentage": 98.52, "elapsed_time": "1 day, 17:50:00", "remaining_time": "0:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17676, "total_steps": 17941, "loss": 1.5767, "learning_rate": 5.7360754927110464e-08, "epoch": 0.9852293629117663, "percentage": 98.52, "elapsed_time": "1 day, 17:50:09", "remaining_time": "0:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17677, "total_steps": 17941, "loss": 1.7955, "learning_rate": 5.693515442132258e-08, "epoch": 0.9852851011649295, "percentage": 98.53, "elapsed_time": "1 day, 17:50:17", "remaining_time": "0:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17678, "total_steps": 17941, "loss": 1.5223, "learning_rate": 5.651113781836581e-08, "epoch": 0.9853408394180926, "percentage": 98.53, "elapsed_time": "1 day, 17:50:26", "remaining_time": "0:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17679, "total_steps": 17941, "loss": 1.6272, "learning_rate": 5.6088705131679407e-08, "epoch": 0.9853965776712558, "percentage": 98.54, "elapsed_time": "1 day, 17:50:34", "remaining_time": "0:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17680, "total_steps": 17941, "loss": 1.5475, "learning_rate": 5.5667856374669314e-08, "epoch": 0.985452315924419, "percentage": 98.55, "elapsed_time": "1 day, 17:50:43", "remaining_time": "0:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17681, "total_steps": 17941, "loss": 1.7325, "learning_rate": 5.524859156068041e-08, "epoch": 0.985508054177582, "percentage": 98.55, "elapsed_time": "1 day, 17:50:52", "remaining_time": "0:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17682, "total_steps": 17941, "loss": 1.4162, "learning_rate": 5.483091070300761e-08, "epoch": 0.9855637924307452, "percentage": 98.56, "elapsed_time": "1 day, 17:51:00", "remaining_time": "0:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17683, "total_steps": 17941, "loss": 1.5781, "learning_rate": 5.441481381489588e-08, "epoch": 0.9856195306839084, "percentage": 98.56, "elapsed_time": "1 day, 17:51:09", "remaining_time": "0:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17684, "total_steps": 17941, "loss": 1.6112, "learning_rate": 5.4000300909540224e-08, "epoch": 0.9856752689370715, "percentage": 98.57, "elapsed_time": "1 day, 17:51:17", "remaining_time": "0:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17685, "total_steps": 17941, "loss": 1.4819, "learning_rate": 5.358737200009678e-08, "epoch": 0.9857310071902347, "percentage": 98.57, "elapsed_time": "1 day, 17:51:26", "remaining_time": "0:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17686, "total_steps": 17941, "loss": 1.6226, "learning_rate": 5.3176027099649526e-08, "epoch": 0.9857867454433978, "percentage": 98.58, "elapsed_time": "1 day, 17:51:35", "remaining_time": "0:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17687, "total_steps": 17941, "loss": 1.6784, "learning_rate": 5.276626622124914e-08, "epoch": 0.9858424836965609, "percentage": 98.58, "elapsed_time": "1 day, 17:51:43", "remaining_time": "0:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17688, "total_steps": 17941, "loss": 1.8073, "learning_rate": 5.2358089377890776e-08, "epoch": 0.9858982219497241, "percentage": 98.59, "elapsed_time": "1 day, 17:51:52", "remaining_time": "0:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17689, "total_steps": 17941, "loss": 1.6573, "learning_rate": 5.195149658251963e-08, "epoch": 0.9859539602028873, "percentage": 98.6, "elapsed_time": "1 day, 17:52:00", "remaining_time": "0:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17690, "total_steps": 17941, "loss": 1.473, "learning_rate": 5.15464878480254e-08, "epoch": 0.9860096984560504, "percentage": 98.6, "elapsed_time": "1 day, 17:52:09", "remaining_time": "0:35:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17691, "total_steps": 17941, "loss": 1.6588, "learning_rate": 5.114306318726447e-08, "epoch": 0.9860654367092135, "percentage": 98.61, "elapsed_time": "1 day, 17:52:17", "remaining_time": "0:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17692, "total_steps": 17941, "loss": 1.6358, "learning_rate": 5.074122261301551e-08, "epoch": 0.9861211749623767, "percentage": 98.61, "elapsed_time": "1 day, 17:52:26", "remaining_time": "0:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17693, "total_steps": 17941, "loss": 1.8155, "learning_rate": 5.034096613803496e-08, "epoch": 0.9861769132155398, "percentage": 98.62, "elapsed_time": "1 day, 17:52:34", "remaining_time": "0:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17694, "total_steps": 17941, "loss": 1.4193, "learning_rate": 4.9942293775012696e-08, "epoch": 0.986232651468703, "percentage": 98.62, "elapsed_time": "1 day, 17:52:43", "remaining_time": "0:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17695, "total_steps": 17941, "loss": 1.7525, "learning_rate": 4.954520553658859e-08, "epoch": 0.9862883897218662, "percentage": 98.63, "elapsed_time": "1 day, 17:52:51", "remaining_time": "0:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17696, "total_steps": 17941, "loss": 1.4906, "learning_rate": 4.914970143536368e-08, "epoch": 0.9863441279750292, "percentage": 98.63, "elapsed_time": "1 day, 17:53:00", "remaining_time": "0:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17697, "total_steps": 17941, "loss": 1.789, "learning_rate": 4.875578148387794e-08, "epoch": 0.9863998662281924, "percentage": 98.64, "elapsed_time": "1 day, 17:53:08", "remaining_time": "0:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17698, "total_steps": 17941, "loss": 1.7271, "learning_rate": 4.8363445694615814e-08, "epoch": 0.9864556044813556, "percentage": 98.65, "elapsed_time": "1 day, 17:53:17", "remaining_time": "0:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17699, "total_steps": 17941, "loss": 1.9038, "learning_rate": 4.797269408002847e-08, "epoch": 0.9865113427345187, "percentage": 98.65, "elapsed_time": "1 day, 17:53:26", "remaining_time": "0:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17700, "total_steps": 17941, "loss": 1.6516, "learning_rate": 4.758352665251153e-08, "epoch": 0.9865670809876819, "percentage": 98.66, "elapsed_time": "1 day, 17:53:34", "remaining_time": "0:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17701, "total_steps": 17941, "loss": 1.6106, "learning_rate": 4.719594342439959e-08, "epoch": 0.9866228192408449, "percentage": 98.66, "elapsed_time": "1 day, 17:53:43", "remaining_time": "0:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17702, "total_steps": 17941, "loss": 1.5687, "learning_rate": 4.680994440798836e-08, "epoch": 0.9866785574940081, "percentage": 98.67, "elapsed_time": "1 day, 17:53:51", "remaining_time": "0:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17703, "total_steps": 17941, "loss": 1.7888, "learning_rate": 4.642552961551805e-08, "epoch": 0.9867342957471713, "percentage": 98.67, "elapsed_time": "1 day, 17:54:00", "remaining_time": "0:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17704, "total_steps": 17941, "loss": 1.4133, "learning_rate": 4.604269905917891e-08, "epoch": 0.9867900340003344, "percentage": 98.68, "elapsed_time": "1 day, 17:54:08", "remaining_time": "0:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17705, "total_steps": 17941, "loss": 1.7083, "learning_rate": 4.5661452751111223e-08, "epoch": 0.9868457722534976, "percentage": 98.68, "elapsed_time": "1 day, 17:54:17", "remaining_time": "0:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17706, "total_steps": 17941, "loss": 1.6912, "learning_rate": 4.5281790703410875e-08, "epoch": 0.9869015105066608, "percentage": 98.69, "elapsed_time": "1 day, 17:54:25", "remaining_time": "0:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17707, "total_steps": 17941, "loss": 1.115, "learning_rate": 4.490371292811824e-08, "epoch": 0.9869572487598238, "percentage": 98.7, "elapsed_time": "1 day, 17:54:34", "remaining_time": "0:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17708, "total_steps": 17941, "loss": 1.6267, "learning_rate": 4.452721943721816e-08, "epoch": 0.987012987012987, "percentage": 98.7, "elapsed_time": "1 day, 17:54:42", "remaining_time": "0:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17709, "total_steps": 17941, "loss": 1.8893, "learning_rate": 4.4152310242656646e-08, "epoch": 0.9870687252661502, "percentage": 98.71, "elapsed_time": "1 day, 17:54:51", "remaining_time": "0:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17710, "total_steps": 17941, "loss": 1.7032, "learning_rate": 4.377898535631863e-08, "epoch": 0.9871244635193133, "percentage": 98.71, "elapsed_time": "1 day, 17:54:59", "remaining_time": "0:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17711, "total_steps": 17941, "loss": 1.5622, "learning_rate": 4.3407244790050207e-08, "epoch": 0.9871802017724765, "percentage": 98.72, "elapsed_time": "1 day, 17:55:07", "remaining_time": "0:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17712, "total_steps": 17941, "loss": 1.5024, "learning_rate": 4.303708855563082e-08, "epoch": 0.9872359400256396, "percentage": 98.72, "elapsed_time": "1 day, 17:55:16", "remaining_time": "0:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17713, "total_steps": 17941, "loss": 1.6252, "learning_rate": 4.26685166648122e-08, "epoch": 0.9872916782788027, "percentage": 98.73, "elapsed_time": "1 day, 17:55:24", "remaining_time": "0:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17714, "total_steps": 17941, "loss": 1.5022, "learning_rate": 4.230152912927387e-08, "epoch": 0.9873474165319659, "percentage": 98.73, "elapsed_time": "1 day, 17:55:34", "remaining_time": "0:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17715, "total_steps": 17941, "loss": 1.3451, "learning_rate": 4.193612596065655e-08, "epoch": 0.9874031547851291, "percentage": 98.74, "elapsed_time": "1 day, 17:55:43", "remaining_time": "0:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17716, "total_steps": 17941, "loss": 1.4555, "learning_rate": 4.1572307170550936e-08, "epoch": 0.9874588930382922, "percentage": 98.75, "elapsed_time": "1 day, 17:55:51", "remaining_time": "0:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17717, "total_steps": 17941, "loss": 1.4166, "learning_rate": 4.121007277049227e-08, "epoch": 0.9875146312914553, "percentage": 98.75, "elapsed_time": "1 day, 17:56:00", "remaining_time": "0:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17718, "total_steps": 17941, "loss": 1.5581, "learning_rate": 4.084942277197135e-08, "epoch": 0.9875703695446185, "percentage": 98.76, "elapsed_time": "1 day, 17:56:09", "remaining_time": "0:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17719, "total_steps": 17941, "loss": 1.6954, "learning_rate": 4.049035718642347e-08, "epoch": 0.9876261077977816, "percentage": 98.76, "elapsed_time": "1 day, 17:56:17", "remaining_time": "0:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17720, "total_steps": 17941, "loss": 1.5224, "learning_rate": 4.013287602523952e-08, "epoch": 0.9876818460509448, "percentage": 98.77, "elapsed_time": "1 day, 17:56:26", "remaining_time": "0:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17721, "total_steps": 17941, "loss": 1.6119, "learning_rate": 3.9776979299749326e-08, "epoch": 0.987737584304108, "percentage": 98.77, "elapsed_time": "1 day, 17:56:35", "remaining_time": "0:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17722, "total_steps": 17941, "loss": 1.9024, "learning_rate": 3.9422667021249414e-08, "epoch": 0.987793322557271, "percentage": 98.78, "elapsed_time": "1 day, 17:56:43", "remaining_time": "0:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17723, "total_steps": 17941, "loss": 1.7866, "learning_rate": 3.906993920097524e-08, "epoch": 0.9878490608104342, "percentage": 98.78, "elapsed_time": "1 day, 17:56:52", "remaining_time": "0:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17724, "total_steps": 17941, "loss": 1.4668, "learning_rate": 3.871879585010674e-08, "epoch": 0.9879047990635973, "percentage": 98.79, "elapsed_time": "1 day, 17:57:00", "remaining_time": "0:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17725, "total_steps": 17941, "loss": 1.5639, "learning_rate": 3.8369236979779455e-08, "epoch": 0.9879605373167605, "percentage": 98.8, "elapsed_time": "1 day, 17:57:08", "remaining_time": "0:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17726, "total_steps": 17941, "loss": 1.6867, "learning_rate": 3.8021262601090066e-08, "epoch": 0.9880162755699237, "percentage": 98.8, "elapsed_time": "1 day, 17:57:17", "remaining_time": "0:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17727, "total_steps": 17941, "loss": 1.4791, "learning_rate": 3.767487272506309e-08, "epoch": 0.9880720138230867, "percentage": 98.81, "elapsed_time": "1 day, 17:57:25", "remaining_time": "0:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17728, "total_steps": 17941, "loss": 1.482, "learning_rate": 3.7330067362689736e-08, "epoch": 0.9881277520762499, "percentage": 98.81, "elapsed_time": "1 day, 17:57:35", "remaining_time": "0:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17729, "total_steps": 17941, "loss": 1.7269, "learning_rate": 3.698684652490569e-08, "epoch": 0.9881834903294131, "percentage": 98.82, "elapsed_time": "1 day, 17:57:43", "remaining_time": "0:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17730, "total_steps": 17941, "loss": 1.8449, "learning_rate": 3.664521022259671e-08, "epoch": 0.9882392285825762, "percentage": 98.82, "elapsed_time": "1 day, 17:57:52", "remaining_time": "0:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17731, "total_steps": 17941, "loss": 1.8374, "learning_rate": 3.630515846658744e-08, "epoch": 0.9882949668357394, "percentage": 98.83, "elapsed_time": "1 day, 17:58:00", "remaining_time": "0:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17732, "total_steps": 17941, "loss": 1.5831, "learning_rate": 3.5966691267674824e-08, "epoch": 0.9883507050889025, "percentage": 98.84, "elapsed_time": "1 day, 17:58:09", "remaining_time": "0:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17733, "total_steps": 17941, "loss": 1.541, "learning_rate": 3.5629808636589154e-08, "epoch": 0.9884064433420656, "percentage": 98.84, "elapsed_time": "1 day, 17:58:18", "remaining_time": "0:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17734, "total_steps": 17941, "loss": 1.3535, "learning_rate": 3.529451058401079e-08, "epoch": 0.9884621815952288, "percentage": 98.85, "elapsed_time": "1 day, 17:58:26", "remaining_time": "0:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17735, "total_steps": 17941, "loss": 1.6024, "learning_rate": 3.4960797120581204e-08, "epoch": 0.988517919848392, "percentage": 98.85, "elapsed_time": "1 day, 17:58:35", "remaining_time": "0:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17736, "total_steps": 17941, "loss": 1.532, "learning_rate": 3.4628668256875273e-08, "epoch": 0.9885736581015551, "percentage": 98.86, "elapsed_time": "1 day, 17:58:44", "remaining_time": "0:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17737, "total_steps": 17941, "loss": 1.7255, "learning_rate": 3.429812400342902e-08, "epoch": 0.9886293963547182, "percentage": 98.86, "elapsed_time": "1 day, 17:58:52", "remaining_time": "0:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17738, "total_steps": 17941, "loss": 1.6464, "learning_rate": 3.396916437072295e-08, "epoch": 0.9886851346078814, "percentage": 98.87, "elapsed_time": "1 day, 17:59:01", "remaining_time": "0:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17739, "total_steps": 17941, "loss": 1.6756, "learning_rate": 3.3641789369198706e-08, "epoch": 0.9887408728610445, "percentage": 98.87, "elapsed_time": "1 day, 17:59:09", "remaining_time": "0:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17740, "total_steps": 17941, "loss": 1.7003, "learning_rate": 3.3315999009231324e-08, "epoch": 0.9887966111142077, "percentage": 98.88, "elapsed_time": "1 day, 17:59:18", "remaining_time": "0:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17741, "total_steps": 17941, "loss": 1.5417, "learning_rate": 3.299179330115143e-08, "epoch": 0.9888523493673709, "percentage": 98.89, "elapsed_time": "1 day, 17:59:27", "remaining_time": "0:28:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17742, "total_steps": 17941, "loss": 1.8359, "learning_rate": 3.266917225524524e-08, "epoch": 0.988908087620534, "percentage": 98.89, "elapsed_time": "1 day, 17:59:35", "remaining_time": "0:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17743, "total_steps": 17941, "loss": 1.7218, "learning_rate": 3.234813588174346e-08, "epoch": 0.9889638258736971, "percentage": 98.9, "elapsed_time": "1 day, 17:59:44", "remaining_time": "0:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17744, "total_steps": 17941, "loss": 1.8224, "learning_rate": 3.202868419082683e-08, "epoch": 0.9890195641268603, "percentage": 98.9, "elapsed_time": "1 day, 17:59:52", "remaining_time": "0:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17745, "total_steps": 17941, "loss": 2.0053, "learning_rate": 3.1710817192631693e-08, "epoch": 0.9890753023800234, "percentage": 98.91, "elapsed_time": "1 day, 18:00:01", "remaining_time": "0:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17746, "total_steps": 17941, "loss": 1.4328, "learning_rate": 3.139453489722777e-08, "epoch": 0.9891310406331866, "percentage": 98.91, "elapsed_time": "1 day, 18:00:09", "remaining_time": "0:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17747, "total_steps": 17941, "loss": 1.8279, "learning_rate": 3.1079837314657025e-08, "epoch": 0.9891867788863496, "percentage": 98.92, "elapsed_time": "1 day, 18:00:18", "remaining_time": "0:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17748, "total_steps": 17941, "loss": 1.6699, "learning_rate": 3.076672445488926e-08, "epoch": 0.9892425171395128, "percentage": 98.92, "elapsed_time": "1 day, 18:00:26", "remaining_time": "0:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17749, "total_steps": 17941, "loss": 1.4811, "learning_rate": 3.045519632786653e-08, "epoch": 0.989298255392676, "percentage": 98.93, "elapsed_time": "1 day, 18:00:35", "remaining_time": "0:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17750, "total_steps": 17941, "loss": 1.2753, "learning_rate": 3.014525294345871e-08, "epoch": 0.9893539936458391, "percentage": 98.94, "elapsed_time": "1 day, 18:00:43", "remaining_time": "0:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17751, "total_steps": 17941, "loss": 1.6277, "learning_rate": 2.983689431149683e-08, "epoch": 0.9894097318990023, "percentage": 98.94, "elapsed_time": "1 day, 18:00:52", "remaining_time": "0:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17752, "total_steps": 17941, "loss": 1.5578, "learning_rate": 2.9530120441761956e-08, "epoch": 0.9894654701521655, "percentage": 98.95, "elapsed_time": "1 day, 18:01:00", "remaining_time": "0:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17753, "total_steps": 17941, "loss": 1.4695, "learning_rate": 2.9224931343990737e-08, "epoch": 0.9895212084053285, "percentage": 98.95, "elapsed_time": "1 day, 18:01:09", "remaining_time": "0:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17754, "total_steps": 17941, "loss": 1.9163, "learning_rate": 2.8921327027847667e-08, "epoch": 0.9895769466584917, "percentage": 98.96, "elapsed_time": "1 day, 18:01:17", "remaining_time": "0:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17755, "total_steps": 17941, "loss": 1.5151, "learning_rate": 2.8619307502975035e-08, "epoch": 0.9896326849116549, "percentage": 98.96, "elapsed_time": "1 day, 18:01:26", "remaining_time": "0:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17756, "total_steps": 17941, "loss": 1.7624, "learning_rate": 2.831887277893741e-08, "epoch": 0.989688423164818, "percentage": 98.97, "elapsed_time": "1 day, 18:01:34", "remaining_time": "0:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17757, "total_steps": 17941, "loss": 1.6216, "learning_rate": 2.8020022865277163e-08, "epoch": 0.9897441614179812, "percentage": 98.97, "elapsed_time": "1 day, 18:01:42", "remaining_time": "0:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17758, "total_steps": 17941, "loss": 1.7067, "learning_rate": 2.7722757771458942e-08, "epoch": 0.9897998996711443, "percentage": 98.98, "elapsed_time": "1 day, 18:01:52", "remaining_time": "0:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17759, "total_steps": 17941, "loss": 1.6443, "learning_rate": 2.7427077506919642e-08, "epoch": 0.9898556379243074, "percentage": 98.99, "elapsed_time": "1 day, 18:02:00", "remaining_time": "0:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17760, "total_steps": 17941, "loss": 1.6573, "learning_rate": 2.7132982081029544e-08, "epoch": 0.9899113761774706, "percentage": 98.99, "elapsed_time": "1 day, 18:02:08", "remaining_time": "0:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17761, "total_steps": 17941, "loss": 1.8253, "learning_rate": 2.684047150312563e-08, "epoch": 0.9899671144306338, "percentage": 99.0, "elapsed_time": "1 day, 18:02:17", "remaining_time": "0:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17762, "total_steps": 17941, "loss": 1.581, "learning_rate": 2.6549545782472708e-08, "epoch": 0.9900228526837969, "percentage": 99.0, "elapsed_time": "1 day, 18:02:25", "remaining_time": "0:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17763, "total_steps": 17941, "loss": 1.7049, "learning_rate": 2.6260204928302278e-08, "epoch": 0.99007859093696, "percentage": 99.01, "elapsed_time": "1 day, 18:02:34", "remaining_time": "0:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17764, "total_steps": 17941, "loss": 1.6109, "learning_rate": 2.597244894979589e-08, "epoch": 0.9901343291901232, "percentage": 99.01, "elapsed_time": "1 day, 18:02:42", "remaining_time": "0:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17765, "total_steps": 17941, "loss": 1.6352, "learning_rate": 2.5686277856074026e-08, "epoch": 0.9901900674432863, "percentage": 99.02, "elapsed_time": "1 day, 18:02:51", "remaining_time": "0:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17766, "total_steps": 17941, "loss": 1.4389, "learning_rate": 2.5401691656207206e-08, "epoch": 0.9902458056964495, "percentage": 99.02, "elapsed_time": "1 day, 18:03:00", "remaining_time": "0:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17767, "total_steps": 17941, "loss": 1.8776, "learning_rate": 2.5118690359232644e-08, "epoch": 0.9903015439496127, "percentage": 99.03, "elapsed_time": "1 day, 18:03:08", "remaining_time": "0:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17768, "total_steps": 17941, "loss": 1.6979, "learning_rate": 2.4837273974115395e-08, "epoch": 0.9903572822027757, "percentage": 99.04, "elapsed_time": "1 day, 18:03:16", "remaining_time": "0:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17769, "total_steps": 17941, "loss": 1.6877, "learning_rate": 2.4557442509787198e-08, "epoch": 0.9904130204559389, "percentage": 99.04, "elapsed_time": "1 day, 18:03:25", "remaining_time": "0:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17770, "total_steps": 17941, "loss": 1.7037, "learning_rate": 2.427919597511874e-08, "epoch": 0.990468758709102, "percentage": 99.05, "elapsed_time": "1 day, 18:03:33", "remaining_time": "0:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17771, "total_steps": 17941, "loss": 1.7178, "learning_rate": 2.4002534378936293e-08, "epoch": 0.9905244969622652, "percentage": 99.05, "elapsed_time": "1 day, 18:03:42", "remaining_time": "0:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17772, "total_steps": 17941, "loss": 1.6152, "learning_rate": 2.3727457730010616e-08, "epoch": 0.9905802352154284, "percentage": 99.06, "elapsed_time": "1 day, 18:03:50", "remaining_time": "0:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17773, "total_steps": 17941, "loss": 1.7571, "learning_rate": 2.3453966037068066e-08, "epoch": 0.9906359734685914, "percentage": 99.06, "elapsed_time": "1 day, 18:04:00", "remaining_time": "0:23:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17774, "total_steps": 17941, "loss": 1.9999, "learning_rate": 2.318205930878503e-08, "epoch": 0.9906917117217546, "percentage": 99.07, "elapsed_time": "1 day, 18:04:08", "remaining_time": "0:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17775, "total_steps": 17941, "loss": 1.6135, "learning_rate": 2.2911737553782398e-08, "epoch": 0.9907474499749178, "percentage": 99.07, "elapsed_time": "1 day, 18:04:17", "remaining_time": "0:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17776, "total_steps": 17941, "loss": 1.5198, "learning_rate": 2.2643000780631086e-08, "epoch": 0.9908031882280809, "percentage": 99.08, "elapsed_time": "1 day, 18:04:25", "remaining_time": "0:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17777, "total_steps": 17941, "loss": 1.653, "learning_rate": 2.2375848997857608e-08, "epoch": 0.9908589264812441, "percentage": 99.09, "elapsed_time": "1 day, 18:04:34", "remaining_time": "0:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17778, "total_steps": 17941, "loss": 1.77, "learning_rate": 2.2110282213927413e-08, "epoch": 0.9909146647344073, "percentage": 99.09, "elapsed_time": "1 day, 18:04:42", "remaining_time": "0:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17779, "total_steps": 17941, "loss": 1.5992, "learning_rate": 2.1846300437272648e-08, "epoch": 0.9909704029875703, "percentage": 99.1, "elapsed_time": "1 day, 18:04:50", "remaining_time": "0:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17780, "total_steps": 17941, "loss": 1.8138, "learning_rate": 2.1583903676258842e-08, "epoch": 0.9910261412407335, "percentage": 99.1, "elapsed_time": "1 day, 18:04:59", "remaining_time": "0:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17781, "total_steps": 17941, "loss": 1.4731, "learning_rate": 2.132309193921267e-08, "epoch": 0.9910818794938967, "percentage": 99.11, "elapsed_time": "1 day, 18:05:07", "remaining_time": "0:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17782, "total_steps": 17941, "loss": 1.4826, "learning_rate": 2.1063865234399738e-08, "epoch": 0.9911376177470598, "percentage": 99.11, "elapsed_time": "1 day, 18:05:16", "remaining_time": "0:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17783, "total_steps": 17941, "loss": 1.5009, "learning_rate": 2.080622357004125e-08, "epoch": 0.991193356000223, "percentage": 99.12, "elapsed_time": "1 day, 18:05:24", "remaining_time": "0:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17784, "total_steps": 17941, "loss": 1.6499, "learning_rate": 2.0550166954308448e-08, "epoch": 0.9912490942533861, "percentage": 99.12, "elapsed_time": "1 day, 18:05:33", "remaining_time": "0:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17785, "total_steps": 17941, "loss": 1.608, "learning_rate": 2.0295695395328164e-08, "epoch": 0.9913048325065492, "percentage": 99.13, "elapsed_time": "1 day, 18:05:41", "remaining_time": "0:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17786, "total_steps": 17941, "loss": 1.7485, "learning_rate": 2.0042808901166166e-08, "epoch": 0.9913605707597124, "percentage": 99.14, "elapsed_time": "1 day, 18:05:50", "remaining_time": "0:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17787, "total_steps": 17941, "loss": 1.6374, "learning_rate": 1.979150747984382e-08, "epoch": 0.9914163090128756, "percentage": 99.14, "elapsed_time": "1 day, 18:05:58", "remaining_time": "0:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17788, "total_steps": 17941, "loss": 1.6544, "learning_rate": 1.954179113932697e-08, "epoch": 0.9914720472660387, "percentage": 99.15, "elapsed_time": "1 day, 18:06:06", "remaining_time": "0:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17789, "total_steps": 17941, "loss": 1.7181, "learning_rate": 1.9293659887542613e-08, "epoch": 0.9915277855192018, "percentage": 99.15, "elapsed_time": "1 day, 18:06:15", "remaining_time": "0:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17790, "total_steps": 17941, "loss": 1.6068, "learning_rate": 1.904711373235113e-08, "epoch": 0.991583523772365, "percentage": 99.16, "elapsed_time": "1 day, 18:06:24", "remaining_time": "0:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17791, "total_steps": 17941, "loss": 1.6995, "learning_rate": 1.8802152681579587e-08, "epoch": 0.9916392620255281, "percentage": 99.16, "elapsed_time": "1 day, 18:06:33", "remaining_time": "0:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17792, "total_steps": 17941, "loss": 1.3236, "learning_rate": 1.8558776742988448e-08, "epoch": 0.9916950002786913, "percentage": 99.17, "elapsed_time": "1 day, 18:06:41", "remaining_time": "0:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17793, "total_steps": 17941, "loss": 1.7792, "learning_rate": 1.8316985924304864e-08, "epoch": 0.9917507385318544, "percentage": 99.18, "elapsed_time": "1 day, 18:06:49", "remaining_time": "0:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17794, "total_steps": 17941, "loss": 1.6207, "learning_rate": 1.8076780233194923e-08, "epoch": 0.9918064767850175, "percentage": 99.18, "elapsed_time": "1 day, 18:06:58", "remaining_time": "0:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17795, "total_steps": 17941, "loss": 1.6762, "learning_rate": 1.7838159677269206e-08, "epoch": 0.9918622150381807, "percentage": 99.19, "elapsed_time": "1 day, 18:07:06", "remaining_time": "0:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17796, "total_steps": 17941, "loss": 1.6446, "learning_rate": 1.7601124264104985e-08, "epoch": 0.9919179532913438, "percentage": 99.19, "elapsed_time": "1 day, 18:07:15", "remaining_time": "0:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17797, "total_steps": 17941, "loss": 1.6751, "learning_rate": 1.7365674001212918e-08, "epoch": 0.991973691544507, "percentage": 99.2, "elapsed_time": "1 day, 18:07:23", "remaining_time": "0:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17798, "total_steps": 17941, "loss": 1.3628, "learning_rate": 1.7131808896064805e-08, "epoch": 0.9920294297976702, "percentage": 99.2, "elapsed_time": "1 day, 18:07:32", "remaining_time": "0:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17799, "total_steps": 17941, "loss": 1.7296, "learning_rate": 1.6899528956071387e-08, "epoch": 0.9920851680508332, "percentage": 99.21, "elapsed_time": "1 day, 18:07:40", "remaining_time": "0:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17800, "total_steps": 17941, "loss": 1.5786, "learning_rate": 1.6668834188610096e-08, "epoch": 0.9921409063039964, "percentage": 99.21, "elapsed_time": "1 day, 18:07:49", "remaining_time": "0:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17801, "total_steps": 17941, "loss": 1.5854, "learning_rate": 1.6439724600986196e-08, "epoch": 0.9921966445571596, "percentage": 99.22, "elapsed_time": "1 day, 18:07:57", "remaining_time": "0:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17802, "total_steps": 17941, "loss": 1.5773, "learning_rate": 1.62122002004661e-08, "epoch": 0.9922523828103227, "percentage": 99.23, "elapsed_time": "1 day, 18:08:06", "remaining_time": "0:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17803, "total_steps": 17941, "loss": 1.7926, "learning_rate": 1.5986260994277358e-08, "epoch": 0.9923081210634859, "percentage": 99.23, "elapsed_time": "1 day, 18:08:14", "remaining_time": "0:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17804, "total_steps": 17941, "loss": 1.7704, "learning_rate": 1.5761906989569808e-08, "epoch": 0.992363859316649, "percentage": 99.24, "elapsed_time": "1 day, 18:08:22", "remaining_time": "0:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17805, "total_steps": 17941, "loss": 1.5083, "learning_rate": 1.5539138193471082e-08, "epoch": 0.9924195975698121, "percentage": 99.24, "elapsed_time": "1 day, 18:08:31", "remaining_time": "0:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17806, "total_steps": 17941, "loss": 1.6763, "learning_rate": 1.5317954613042197e-08, "epoch": 0.9924753358229753, "percentage": 99.25, "elapsed_time": "1 day, 18:08:40", "remaining_time": "0:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17807, "total_steps": 17941, "loss": 2.0011, "learning_rate": 1.509835625529421e-08, "epoch": 0.9925310740761385, "percentage": 99.25, "elapsed_time": "1 day, 18:08:48", "remaining_time": "0:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17808, "total_steps": 17941, "loss": 1.2496, "learning_rate": 1.4880343127193774e-08, "epoch": 0.9925868123293016, "percentage": 99.26, "elapsed_time": "1 day, 18:08:57", "remaining_time": "0:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17809, "total_steps": 17941, "loss": 1.6381, "learning_rate": 1.4663915235657577e-08, "epoch": 0.9926425505824648, "percentage": 99.26, "elapsed_time": "1 day, 18:09:05", "remaining_time": "0:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17810, "total_steps": 17941, "loss": 1.7707, "learning_rate": 1.4449072587546797e-08, "epoch": 0.9926982888356279, "percentage": 99.27, "elapsed_time": "1 day, 18:09:14", "remaining_time": "0:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17811, "total_steps": 17941, "loss": 1.7729, "learning_rate": 1.4235815189672652e-08, "epoch": 0.992754027088791, "percentage": 99.28, "elapsed_time": "1 day, 18:09:22", "remaining_time": "0:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17812, "total_steps": 17941, "loss": 1.5435, "learning_rate": 1.4024143048801952e-08, "epoch": 0.9928097653419542, "percentage": 99.28, "elapsed_time": "1 day, 18:09:31", "remaining_time": "0:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17813, "total_steps": 17941, "loss": 1.6541, "learning_rate": 1.3814056171651546e-08, "epoch": 0.9928655035951174, "percentage": 99.29, "elapsed_time": "1 day, 18:09:39", "remaining_time": "0:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17814, "total_steps": 17941, "loss": 1.4937, "learning_rate": 1.3605554564871669e-08, "epoch": 0.9929212418482805, "percentage": 99.29, "elapsed_time": "1 day, 18:09:47", "remaining_time": "0:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17815, "total_steps": 17941, "loss": 1.5573, "learning_rate": 1.3398638235090355e-08, "epoch": 0.9929769801014436, "percentage": 99.3, "elapsed_time": "1 day, 18:09:56", "remaining_time": "0:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17816, "total_steps": 17941, "loss": 1.7921, "learning_rate": 1.3193307188857917e-08, "epoch": 0.9930327183546067, "percentage": 99.3, "elapsed_time": "1 day, 18:10:04", "remaining_time": "0:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17817, "total_steps": 17941, "loss": 1.6022, "learning_rate": 1.2989561432691366e-08, "epoch": 0.9930884566077699, "percentage": 99.31, "elapsed_time": "1 day, 18:10:13", "remaining_time": "0:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17818, "total_steps": 17941, "loss": 1.234, "learning_rate": 1.2787400973052199e-08, "epoch": 0.9931441948609331, "percentage": 99.31, "elapsed_time": "1 day, 18:10:21", "remaining_time": "0:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17819, "total_steps": 17941, "loss": 1.5633, "learning_rate": 1.2586825816351954e-08, "epoch": 0.9931999331140962, "percentage": 99.32, "elapsed_time": "1 day, 18:10:30", "remaining_time": "0:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17820, "total_steps": 17941, "loss": 1.496, "learning_rate": 1.238783596894666e-08, "epoch": 0.9932556713672593, "percentage": 99.33, "elapsed_time": "1 day, 18:10:38", "remaining_time": "0:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17821, "total_steps": 17941, "loss": 1.628, "learning_rate": 1.2190431437153483e-08, "epoch": 0.9933114096204225, "percentage": 99.33, "elapsed_time": "1 day, 18:10:47", "remaining_time": "0:17:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17822, "total_steps": 17941, "loss": 1.6507, "learning_rate": 1.1994612227234081e-08, "epoch": 0.9933671478735856, "percentage": 99.34, "elapsed_time": "1 day, 18:10:55", "remaining_time": "0:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17823, "total_steps": 17941, "loss": 1.8845, "learning_rate": 1.1800378345389051e-08, "epoch": 0.9934228861267488, "percentage": 99.34, "elapsed_time": "1 day, 18:11:03", "remaining_time": "0:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17824, "total_steps": 17941, "loss": 1.7482, "learning_rate": 1.1607729797791233e-08, "epoch": 0.993478624379912, "percentage": 99.35, "elapsed_time": "1 day, 18:11:12", "remaining_time": "0:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17825, "total_steps": 17941, "loss": 1.6669, "learning_rate": 1.1416666590535752e-08, "epoch": 0.993534362633075, "percentage": 99.35, "elapsed_time": "1 day, 18:11:21", "remaining_time": "0:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17826, "total_steps": 17941, "loss": 1.8451, "learning_rate": 1.1227188729695525e-08, "epoch": 0.9935901008862382, "percentage": 99.36, "elapsed_time": "1 day, 18:11:29", "remaining_time": "0:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17827, "total_steps": 17941, "loss": 1.8348, "learning_rate": 1.1039296221276863e-08, "epoch": 0.9936458391394014, "percentage": 99.36, "elapsed_time": "1 day, 18:11:38", "remaining_time": "0:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17828, "total_steps": 17941, "loss": 1.5636, "learning_rate": 1.0852989071230557e-08, "epoch": 0.9937015773925645, "percentage": 99.37, "elapsed_time": "1 day, 18:11:46", "remaining_time": "0:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17829, "total_steps": 17941, "loss": 1.7154, "learning_rate": 1.0668267285474099e-08, "epoch": 0.9937573156457277, "percentage": 99.38, "elapsed_time": "1 day, 18:11:55", "remaining_time": "0:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17830, "total_steps": 17941, "loss": 1.6266, "learning_rate": 1.0485130869858362e-08, "epoch": 0.9938130538988909, "percentage": 99.38, "elapsed_time": "1 day, 18:12:03", "remaining_time": "0:15:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17831, "total_steps": 17941, "loss": 1.4427, "learning_rate": 1.0303579830195364e-08, "epoch": 0.9938687921520539, "percentage": 99.39, "elapsed_time": "1 day, 18:12:12", "remaining_time": "0:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17832, "total_steps": 17941, "loss": 1.5355, "learning_rate": 1.0123614172247164e-08, "epoch": 0.9939245304052171, "percentage": 99.39, "elapsed_time": "1 day, 18:12:20", "remaining_time": "0:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17833, "total_steps": 17941, "loss": 1.7237, "learning_rate": 9.945233901709206e-09, "epoch": 0.9939802686583803, "percentage": 99.4, "elapsed_time": "1 day, 18:12:28", "remaining_time": "0:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17834, "total_steps": 17941, "loss": 1.636, "learning_rate": 9.768439024254727e-09, "epoch": 0.9940360069115434, "percentage": 99.4, "elapsed_time": "1 day, 18:12:37", "remaining_time": "0:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17835, "total_steps": 17941, "loss": 1.624, "learning_rate": 9.593229545473704e-09, "epoch": 0.9940917451647066, "percentage": 99.41, "elapsed_time": "1 day, 18:12:45", "remaining_time": "0:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17836, "total_steps": 17941, "loss": 1.7618, "learning_rate": 9.419605470939452e-09, "epoch": 0.9941474834178697, "percentage": 99.41, "elapsed_time": "1 day, 18:12:54", "remaining_time": "0:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17837, "total_steps": 17941, "loss": 1.6754, "learning_rate": 9.247566806147579e-09, "epoch": 0.9942032216710328, "percentage": 99.42, "elapsed_time": "1 day, 18:13:02", "remaining_time": "0:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17838, "total_steps": 17941, "loss": 1.5919, "learning_rate": 9.077113556554829e-09, "epoch": 0.994258959924196, "percentage": 99.43, "elapsed_time": "1 day, 18:13:11", "remaining_time": "0:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17839, "total_steps": 17941, "loss": 1.6583, "learning_rate": 8.908245727567988e-09, "epoch": 0.9943146981773591, "percentage": 99.43, "elapsed_time": "1 day, 18:13:19", "remaining_time": "0:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17840, "total_steps": 17941, "loss": 1.906, "learning_rate": 8.740963324543883e-09, "epoch": 0.9943704364305223, "percentage": 99.44, "elapsed_time": "1 day, 18:13:28", "remaining_time": "0:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17841, "total_steps": 17941, "loss": 1.6375, "learning_rate": 8.575266352789379e-09, "epoch": 0.9944261746836854, "percentage": 99.44, "elapsed_time": "1 day, 18:13:36", "remaining_time": "0:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17842, "total_steps": 17941, "loss": 1.6561, "learning_rate": 8.411154817550283e-09, "epoch": 0.9944819129368485, "percentage": 99.45, "elapsed_time": "1 day, 18:13:45", "remaining_time": "0:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17843, "total_steps": 17941, "loss": 1.7869, "learning_rate": 8.248628724044637e-09, "epoch": 0.9945376511900117, "percentage": 99.45, "elapsed_time": "1 day, 18:13:53", "remaining_time": "0:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17844, "total_steps": 17941, "loss": 1.5893, "learning_rate": 8.087688077418332e-09, "epoch": 0.9945933894431749, "percentage": 99.46, "elapsed_time": "1 day, 18:14:02", "remaining_time": "0:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17845, "total_steps": 17941, "loss": 1.629, "learning_rate": 7.92833288277839e-09, "epoch": 0.994649127696338, "percentage": 99.46, "elapsed_time": "1 day, 18:14:10", "remaining_time": "0:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17846, "total_steps": 17941, "loss": 1.66, "learning_rate": 7.770563145181874e-09, "epoch": 0.9947048659495011, "percentage": 99.47, "elapsed_time": "1 day, 18:14:19", "remaining_time": "0:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17847, "total_steps": 17941, "loss": 1.6057, "learning_rate": 7.614378869619244e-09, "epoch": 0.9947606042026643, "percentage": 99.48, "elapsed_time": "1 day, 18:14:27", "remaining_time": "0:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17848, "total_steps": 17941, "loss": 1.7555, "learning_rate": 7.45978006105874e-09, "epoch": 0.9948163424558274, "percentage": 99.48, "elapsed_time": "1 day, 18:14:36", "remaining_time": "0:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17849, "total_steps": 17941, "loss": 1.3339, "learning_rate": 7.306766724396452e-09, "epoch": 0.9948720807089906, "percentage": 99.49, "elapsed_time": "1 day, 18:14:45", "remaining_time": "0:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17850, "total_steps": 17941, "loss": 1.7004, "learning_rate": 7.1553388644840515e-09, "epoch": 0.9949278189621538, "percentage": 99.49, "elapsed_time": "1 day, 18:14:54", "remaining_time": "0:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17851, "total_steps": 17941, "loss": 1.571, "learning_rate": 7.005496486128804e-09, "epoch": 0.9949835572153168, "percentage": 99.5, "elapsed_time": "1 day, 18:15:02", "remaining_time": "0:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17852, "total_steps": 17941, "loss": 1.6759, "learning_rate": 6.857239594076914e-09, "epoch": 0.99503929546848, "percentage": 99.5, "elapsed_time": "1 day, 18:15:11", "remaining_time": "0:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17853, "total_steps": 17941, "loss": 1.7104, "learning_rate": 6.710568193035727e-09, "epoch": 0.9950950337216432, "percentage": 99.51, "elapsed_time": "1 day, 18:15:20", "remaining_time": "0:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17854, "total_steps": 17941, "loss": 1.7512, "learning_rate": 6.5654822876515255e-09, "epoch": 0.9951507719748063, "percentage": 99.52, "elapsed_time": "1 day, 18:15:29", "remaining_time": "0:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17855, "total_steps": 17941, "loss": 1.7223, "learning_rate": 6.421981882531736e-09, "epoch": 0.9952065102279695, "percentage": 99.52, "elapsed_time": "1 day, 18:15:38", "remaining_time": "0:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17856, "total_steps": 17941, "loss": 1.7547, "learning_rate": 6.280066982222721e-09, "epoch": 0.9952622484811326, "percentage": 99.53, "elapsed_time": "1 day, 18:15:46", "remaining_time": "0:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17857, "total_steps": 17941, "loss": 1.4622, "learning_rate": 6.139737591226436e-09, "epoch": 0.9953179867342957, "percentage": 99.53, "elapsed_time": "1 day, 18:15:55", "remaining_time": "0:11:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17858, "total_steps": 17941, "loss": 1.7235, "learning_rate": 6.000993713989322e-09, "epoch": 0.9953737249874589, "percentage": 99.54, "elapsed_time": "1 day, 18:16:03", "remaining_time": "0:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17859, "total_steps": 17941, "loss": 1.7357, "learning_rate": 5.863835354918967e-09, "epoch": 0.9954294632406221, "percentage": 99.54, "elapsed_time": "1 day, 18:16:11", "remaining_time": "0:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17860, "total_steps": 17941, "loss": 1.4926, "learning_rate": 5.7282625183618936e-09, "epoch": 0.9954852014937852, "percentage": 99.55, "elapsed_time": "1 day, 18:16:20", "remaining_time": "0:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17861, "total_steps": 17941, "loss": 1.8364, "learning_rate": 5.594275208614663e-09, "epoch": 0.9955409397469484, "percentage": 99.55, "elapsed_time": "1 day, 18:16:29", "remaining_time": "0:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17862, "total_steps": 17941, "loss": 1.6545, "learning_rate": 5.461873429929432e-09, "epoch": 0.9955966780001114, "percentage": 99.56, "elapsed_time": "1 day, 18:16:38", "remaining_time": "0:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17863, "total_steps": 17941, "loss": 1.8837, "learning_rate": 5.331057186508392e-09, "epoch": 0.9956524162532746, "percentage": 99.57, "elapsed_time": "1 day, 18:16:47", "remaining_time": "0:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17864, "total_steps": 17941, "loss": 1.6242, "learning_rate": 5.201826482498229e-09, "epoch": 0.9957081545064378, "percentage": 99.57, "elapsed_time": "1 day, 18:16:55", "remaining_time": "0:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17865, "total_steps": 17941, "loss": 1.6272, "learning_rate": 5.0741813219956634e-09, "epoch": 0.9957638927596009, "percentage": 99.58, "elapsed_time": "1 day, 18:17:04", "remaining_time": "0:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17866, "total_steps": 17941, "loss": 1.656, "learning_rate": 4.94812170904746e-09, "epoch": 0.995819631012764, "percentage": 99.58, "elapsed_time": "1 day, 18:17:12", "remaining_time": "0:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17867, "total_steps": 17941, "loss": 1.6829, "learning_rate": 4.82364764765042e-09, "epoch": 0.9958753692659272, "percentage": 99.59, "elapsed_time": "1 day, 18:17:20", "remaining_time": "0:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17868, "total_steps": 17941, "loss": 1.8201, "learning_rate": 4.700759141756939e-09, "epoch": 0.9959311075190903, "percentage": 99.59, "elapsed_time": "1 day, 18:17:29", "remaining_time": "0:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17869, "total_steps": 17941, "loss": 1.9657, "learning_rate": 4.579456195269449e-09, "epoch": 0.9959868457722535, "percentage": 99.6, "elapsed_time": "1 day, 18:17:37", "remaining_time": "0:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17870, "total_steps": 17941, "loss": 1.8972, "learning_rate": 4.4597388120182215e-09, "epoch": 0.9960425840254167, "percentage": 99.6, "elapsed_time": "1 day, 18:17:46", "remaining_time": "0:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17871, "total_steps": 17941, "loss": 1.5479, "learning_rate": 4.341606995816871e-09, "epoch": 0.9960983222785798, "percentage": 99.61, "elapsed_time": "1 day, 18:17:54", "remaining_time": "0:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17872, "total_steps": 17941, "loss": 1.6797, "learning_rate": 4.225060750401299e-09, "epoch": 0.9961540605317429, "percentage": 99.62, "elapsed_time": "1 day, 18:18:03", "remaining_time": "0:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17873, "total_steps": 17941, "loss": 1.658, "learning_rate": 4.110100079474099e-09, "epoch": 0.9962097987849061, "percentage": 99.62, "elapsed_time": "1 day, 18:18:11", "remaining_time": "0:09:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17874, "total_steps": 17941, "loss": 1.6017, "learning_rate": 3.996724986676803e-09, "epoch": 0.9962655370380692, "percentage": 99.63, "elapsed_time": "1 day, 18:18:20", "remaining_time": "0:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17875, "total_steps": 17941, "loss": 1.5619, "learning_rate": 3.884935475606533e-09, "epoch": 0.9963212752912324, "percentage": 99.63, "elapsed_time": "1 day, 18:18:28", "remaining_time": "0:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17876, "total_steps": 17941, "loss": 1.633, "learning_rate": 3.7747315498049e-09, "epoch": 0.9963770135443956, "percentage": 99.64, "elapsed_time": "1 day, 18:18:37", "remaining_time": "0:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17877, "total_steps": 17941, "loss": 1.3805, "learning_rate": 3.6661132127746577e-09, "epoch": 0.9964327517975586, "percentage": 99.64, "elapsed_time": "1 day, 18:18:45", "remaining_time": "0:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17878, "total_steps": 17941, "loss": 1.5279, "learning_rate": 3.5590804679574986e-09, "epoch": 0.9964884900507218, "percentage": 99.65, "elapsed_time": "1 day, 18:18:54", "remaining_time": "0:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17879, "total_steps": 17941, "loss": 1.6911, "learning_rate": 3.453633318745153e-09, "epoch": 0.996544228303885, "percentage": 99.65, "elapsed_time": "1 day, 18:19:02", "remaining_time": "0:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17880, "total_steps": 17941, "loss": 1.522, "learning_rate": 3.349771768479393e-09, "epoch": 0.9965999665570481, "percentage": 99.66, "elapsed_time": "1 day, 18:19:11", "remaining_time": "0:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17881, "total_steps": 17941, "loss": 1.7007, "learning_rate": 3.247495820463131e-09, "epoch": 0.9966557048102113, "percentage": 99.67, "elapsed_time": "1 day, 18:19:19", "remaining_time": "0:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17882, "total_steps": 17941, "loss": 1.6738, "learning_rate": 3.1468054779326684e-09, "epoch": 0.9967114430633744, "percentage": 99.67, "elapsed_time": "1 day, 18:19:27", "remaining_time": "0:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17883, "total_steps": 17941, "loss": 1.7663, "learning_rate": 3.0477007440854464e-09, "epoch": 0.9967671813165375, "percentage": 99.68, "elapsed_time": "1 day, 18:19:36", "remaining_time": "0:08:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17884, "total_steps": 17941, "loss": 1.6182, "learning_rate": 2.950181622063397e-09, "epoch": 0.9968229195697007, "percentage": 99.68, "elapsed_time": "1 day, 18:19:44", "remaining_time": "0:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17885, "total_steps": 17941, "loss": 1.4883, "learning_rate": 2.854248114958491e-09, "epoch": 0.9968786578228638, "percentage": 99.69, "elapsed_time": "1 day, 18:19:53", "remaining_time": "0:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17886, "total_steps": 17941, "loss": 1.5116, "learning_rate": 2.7599002258127393e-09, "epoch": 0.996934396076027, "percentage": 99.69, "elapsed_time": "1 day, 18:20:01", "remaining_time": "0:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17887, "total_steps": 17941, "loss": 1.7701, "learning_rate": 2.6671379576181934e-09, "epoch": 0.9969901343291901, "percentage": 99.7, "elapsed_time": "1 day, 18:20:10", "remaining_time": "0:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17888, "total_steps": 17941, "loss": 1.758, "learning_rate": 2.5759613133169435e-09, "epoch": 0.9970458725823532, "percentage": 99.7, "elapsed_time": "1 day, 18:20:18", "remaining_time": "0:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17889, "total_steps": 17941, "loss": 1.4548, "learning_rate": 2.4863702958011213e-09, "epoch": 0.9971016108355164, "percentage": 99.71, "elapsed_time": "1 day, 18:20:27", "remaining_time": "0:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17890, "total_steps": 17941, "loss": 1.7625, "learning_rate": 2.3983649079128977e-09, "epoch": 0.9971573490886796, "percentage": 99.72, "elapsed_time": "1 day, 18:20:36", "remaining_time": "0:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17891, "total_steps": 17941, "loss": 1.7275, "learning_rate": 2.3119451524389323e-09, "epoch": 0.9972130873418427, "percentage": 99.72, "elapsed_time": "1 day, 18:20:45", "remaining_time": "0:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17892, "total_steps": 17941, "loss": 1.5049, "learning_rate": 2.227111032127027e-09, "epoch": 0.9972688255950058, "percentage": 99.73, "elapsed_time": "1 day, 18:20:53", "remaining_time": "0:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17893, "total_steps": 17941, "loss": 1.78, "learning_rate": 2.143862549663922e-09, "epoch": 0.997324563848169, "percentage": 99.73, "elapsed_time": "1 day, 18:21:02", "remaining_time": "0:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17894, "total_steps": 17941, "loss": 1.7308, "learning_rate": 2.0621997076863964e-09, "epoch": 0.9973803021013321, "percentage": 99.74, "elapsed_time": "1 day, 18:21:10", "remaining_time": "0:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17895, "total_steps": 17941, "loss": 1.5949, "learning_rate": 1.982122508792372e-09, "epoch": 0.9974360403544953, "percentage": 99.74, "elapsed_time": "1 day, 18:21:20", "remaining_time": "0:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17896, "total_steps": 17941, "loss": 1.6167, "learning_rate": 1.9036309555131582e-09, "epoch": 0.9974917786076585, "percentage": 99.75, "elapsed_time": "1 day, 18:21:28", "remaining_time": "0:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17897, "total_steps": 17941, "loss": 1.6487, "learning_rate": 1.8267250503412048e-09, "epoch": 0.9975475168608215, "percentage": 99.75, "elapsed_time": "1 day, 18:21:37", "remaining_time": "0:06:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17898, "total_steps": 17941, "loss": 1.7007, "learning_rate": 1.7514047957190027e-09, "epoch": 0.9976032551139847, "percentage": 99.76, "elapsed_time": "1 day, 18:21:46", "remaining_time": "0:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17899, "total_steps": 17941, "loss": 1.8813, "learning_rate": 1.6776701940335315e-09, "epoch": 0.9976589933671479, "percentage": 99.77, "elapsed_time": "1 day, 18:21:54", "remaining_time": "0:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17900, "total_steps": 17941, "loss": 1.4914, "learning_rate": 1.6055212476162595e-09, "epoch": 0.997714731620311, "percentage": 99.77, "elapsed_time": "1 day, 18:22:03", "remaining_time": "0:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17901, "total_steps": 17941, "loss": 1.7087, "learning_rate": 1.5349579587653484e-09, "epoch": 0.9977704698734742, "percentage": 99.78, "elapsed_time": "1 day, 18:22:11", "remaining_time": "0:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17902, "total_steps": 17941, "loss": 1.6502, "learning_rate": 1.4659803297123465e-09, "epoch": 0.9978262081266374, "percentage": 99.78, "elapsed_time": "1 day, 18:22:20", "remaining_time": "0:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17903, "total_steps": 17941, "loss": 1.693, "learning_rate": 1.398588362649944e-09, "epoch": 0.9978819463798004, "percentage": 99.79, "elapsed_time": "1 day, 18:22:28", "remaining_time": "0:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17904, "total_steps": 17941, "loss": 1.7254, "learning_rate": 1.3327820597097695e-09, "epoch": 0.9979376846329636, "percentage": 99.79, "elapsed_time": "1 day, 18:22:37", "remaining_time": "0:05:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17905, "total_steps": 17941, "loss": 1.8097, "learning_rate": 1.268561422979042e-09, "epoch": 0.9979934228861268, "percentage": 99.8, "elapsed_time": "1 day, 18:22:45", "remaining_time": "0:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17906, "total_steps": 17941, "loss": 1.5276, "learning_rate": 1.2059264545005721e-09, "epoch": 0.9980491611392899, "percentage": 99.8, "elapsed_time": "1 day, 18:22:53", "remaining_time": "0:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17907, "total_steps": 17941, "loss": 1.5952, "learning_rate": 1.1448771562561078e-09, "epoch": 0.9981048993924531, "percentage": 99.81, "elapsed_time": "1 day, 18:23:02", "remaining_time": "0:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17908, "total_steps": 17941, "loss": 1.7756, "learning_rate": 1.0854135301774372e-09, "epoch": 0.9981606376456161, "percentage": 99.82, "elapsed_time": "1 day, 18:23:10", "remaining_time": "0:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17909, "total_steps": 17941, "loss": 1.6389, "learning_rate": 1.0275355781630415e-09, "epoch": 0.9982163758987793, "percentage": 99.82, "elapsed_time": "1 day, 18:23:19", "remaining_time": "0:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17910, "total_steps": 17941, "loss": 1.6831, "learning_rate": 9.712433020392375e-10, "epoch": 0.9982721141519425, "percentage": 99.83, "elapsed_time": "1 day, 18:23:27", "remaining_time": "0:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17911, "total_steps": 17941, "loss": 1.5888, "learning_rate": 9.165367035879335e-10, "epoch": 0.9983278524051056, "percentage": 99.83, "elapsed_time": "1 day, 18:23:36", "remaining_time": "0:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17912, "total_steps": 17941, "loss": 1.701, "learning_rate": 8.634157845521796e-10, "epoch": 0.9983835906582688, "percentage": 99.84, "elapsed_time": "1 day, 18:23:44", "remaining_time": "0:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17913, "total_steps": 17941, "loss": 1.4631, "learning_rate": 8.118805466139634e-10, "epoch": 0.998439328911432, "percentage": 99.84, "elapsed_time": "1 day, 18:23:53", "remaining_time": "0:03:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17914, "total_steps": 17941, "loss": 1.6177, "learning_rate": 7.619309914108641e-10, "epoch": 0.998495067164595, "percentage": 99.85, "elapsed_time": "1 day, 18:24:02", "remaining_time": "0:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17915, "total_steps": 17941, "loss": 1.5327, "learning_rate": 7.135671205193983e-10, "epoch": 0.9985508054177582, "percentage": 99.86, "elapsed_time": "1 day, 18:24:10", "remaining_time": "0:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17916, "total_steps": 17941, "loss": 1.7842, "learning_rate": 6.667889354772249e-10, "epoch": 0.9986065436709214, "percentage": 99.86, "elapsed_time": "1 day, 18:24:18", "remaining_time": "0:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17917, "total_steps": 17941, "loss": 1.8974, "learning_rate": 6.215964377720429e-10, "epoch": 0.9986622819240845, "percentage": 99.87, "elapsed_time": "1 day, 18:24:27", "remaining_time": "0:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17918, "total_steps": 17941, "loss": 1.7538, "learning_rate": 5.779896288304887e-10, "epoch": 0.9987180201772476, "percentage": 99.87, "elapsed_time": "1 day, 18:24:35", "remaining_time": "0:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17919, "total_steps": 17941, "loss": 1.6867, "learning_rate": 5.359685100403411e-10, "epoch": 0.9987737584304108, "percentage": 99.88, "elapsed_time": "1 day, 18:24:44", "remaining_time": "0:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17920, "total_steps": 17941, "loss": 1.5661, "learning_rate": 4.955330827283167e-10, "epoch": 0.9988294966835739, "percentage": 99.88, "elapsed_time": "1 day, 18:24:52", "remaining_time": "0:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17921, "total_steps": 17941, "loss": 1.5337, "learning_rate": 4.566833481822741e-10, "epoch": 0.9988852349367371, "percentage": 99.89, "elapsed_time": "1 day, 18:25:01", "remaining_time": "0:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17922, "total_steps": 17941, "loss": 1.6745, "learning_rate": 4.1941930763456094e-10, "epoch": 0.9989409731899003, "percentage": 99.89, "elapsed_time": "1 day, 18:25:09", "remaining_time": "0:02:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17923, "total_steps": 17941, "loss": 1.6886, "learning_rate": 3.8374096226201363e-10, "epoch": 0.9989967114430633, "percentage": 99.9, "elapsed_time": "1 day, 18:25:18", "remaining_time": "0:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17924, "total_steps": 17941, "loss": 1.7712, "learning_rate": 3.4964831320261074e-10, "epoch": 0.9990524496962265, "percentage": 99.91, "elapsed_time": "1 day, 18:25:26", "remaining_time": "0:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17925, "total_steps": 17941, "loss": 1.7366, "learning_rate": 3.1714136153326856e-10, "epoch": 0.9991081879493897, "percentage": 99.91, "elapsed_time": "1 day, 18:25:35", "remaining_time": "0:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17926, "total_steps": 17941, "loss": 1.6816, "learning_rate": 2.8622010828094347e-10, "epoch": 0.9991639262025528, "percentage": 99.92, "elapsed_time": "1 day, 18:25:43", "remaining_time": "0:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17927, "total_steps": 17941, "loss": 1.4507, "learning_rate": 2.5688455443928504e-10, "epoch": 0.999219664455716, "percentage": 99.92, "elapsed_time": "1 day, 18:25:52", "remaining_time": "0:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17928, "total_steps": 17941, "loss": 1.5333, "learning_rate": 2.291347009242273e-10, "epoch": 0.9992754027088792, "percentage": 99.93, "elapsed_time": "1 day, 18:26:01", "remaining_time": "0:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17929, "total_steps": 17941, "loss": 1.6289, "learning_rate": 2.029705486239486e-10, "epoch": 0.9993311409620422, "percentage": 99.93, "elapsed_time": "1 day, 18:26:09", "remaining_time": "0:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17930, "total_steps": 17941, "loss": 1.5401, "learning_rate": 1.7839209836556513e-10, "epoch": 0.9993868792152054, "percentage": 99.94, "elapsed_time": "1 day, 18:26:17", "remaining_time": "0:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17931, "total_steps": 17941, "loss": 1.6467, "learning_rate": 1.5539935093178414e-10, "epoch": 0.9994426174683685, "percentage": 99.94, "elapsed_time": "1 day, 18:26:26", "remaining_time": "0:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17932, "total_steps": 17941, "loss": 1.7435, "learning_rate": 1.339923070498017e-10, "epoch": 0.9994983557215317, "percentage": 99.95, "elapsed_time": "1 day, 18:26:34", "remaining_time": "0:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17933, "total_steps": 17941, "loss": 1.7012, "learning_rate": 1.1417096739685385e-10, "epoch": 0.9995540939746949, "percentage": 99.96, "elapsed_time": "1 day, 18:26:43", "remaining_time": "0:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17934, "total_steps": 17941, "loss": 1.7907, "learning_rate": 9.593533260021659e-11, "epoch": 0.9996098322278579, "percentage": 99.96, "elapsed_time": "1 day, 18:26:51", "remaining_time": "0:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17935, "total_steps": 17941, "loss": 1.8255, "learning_rate": 7.928540324275702e-11, "epoch": 0.9996655704810211, "percentage": 99.97, "elapsed_time": "1 day, 18:27:00", "remaining_time": "0:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17936, "total_steps": 17941, "loss": 1.5038, "learning_rate": 6.422117985183107e-11, "epoch": 0.9997213087341843, "percentage": 99.97, "elapsed_time": "1 day, 18:27:08", "remaining_time": "0:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17937, "total_steps": 17941, "loss": 1.6391, "learning_rate": 5.074266290483465e-11, "epoch": 0.9997770469873474, "percentage": 99.98, "elapsed_time": "1 day, 18:27:17", "remaining_time": "0:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17938, "total_steps": 17941, "loss": 1.5529, "learning_rate": 3.88498528236525e-11, "epoch": 0.9998327852405106, "percentage": 99.98, "elapsed_time": "1 day, 18:27:26", "remaining_time": "0:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17939, "total_steps": 17941, "loss": 1.6723, "learning_rate": 2.8542749996862682e-11, "epoch": 0.9998885234936737, "percentage": 99.99, "elapsed_time": "1 day, 18:27:34", "remaining_time": "0:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17940, "total_steps": 17941, "loss": 1.5116, "learning_rate": 1.982135474087876e-11, "epoch": 0.9999442617468368, "percentage": 99.99, "elapsed_time": "1 day, 18:27:43", "remaining_time": "0:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17941, "total_steps": 17941, "loss": 1.6776, "learning_rate": 1.268566733325649e-11, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "1 day, 18:27:51", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17941, "total_steps": 17941, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "1 day, 18:27:52", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}