{"current_steps": 5, "total_steps": 1680, "loss": 2.7425, "learning_rate": 2.9761904761904763e-06, "epoch": 0.0178491744756805, "percentage": 0.3, "elapsed_time": "0:01:00", "remaining_time": "5:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 1680, "loss": 2.861, "learning_rate": 5.9523809523809525e-06, "epoch": 0.035698348951361, "percentage": 0.6, "elapsed_time": "0:02:01", "remaining_time": "5:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 1680, "loss": 2.8281, "learning_rate": 8.92857142857143e-06, "epoch": 0.0535475234270415, "percentage": 0.89, "elapsed_time": "0:03:01", "remaining_time": "5:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 1680, "loss": 3.1888, "learning_rate": 1.1904761904761905e-05, "epoch": 0.071396697902722, "percentage": 1.19, "elapsed_time": "0:03:58", "remaining_time": "5:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 1680, "loss": 2.6461, "learning_rate": 1.4880952380952381e-05, "epoch": 0.0892458723784025, "percentage": 1.49, "elapsed_time": "0:04:58", "remaining_time": "5:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 1680, "loss": 2.3212, "learning_rate": 1.785714285714286e-05, "epoch": 0.107095046854083, "percentage": 1.79, "elapsed_time": "0:05:57", "remaining_time": "5:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 1680, "loss": 1.8036, "learning_rate": 2.0833333333333336e-05, "epoch": 0.1249442213297635, "percentage": 2.08, "elapsed_time": "0:06:55", "remaining_time": "5:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 1680, "loss": 1.5552, "learning_rate": 2.380952380952381e-05, "epoch": 0.142793395805444, "percentage": 2.38, "elapsed_time": "0:07:56", "remaining_time": "5:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 1680, "loss": 1.6626, "learning_rate": 2.6785714285714288e-05, "epoch": 0.1606425702811245, "percentage": 2.68, "elapsed_time": "0:08:55", "remaining_time": "5:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 1680, "loss": 1.4897, "learning_rate": 2.9761904761904762e-05, "epoch": 0.178491744756805, "percentage": 2.98, "elapsed_time": "0:09:54", "remaining_time": "5:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 1680, "loss": 1.5373, "learning_rate": 3.273809523809524e-05, "epoch": 0.1963409192324855, "percentage": 3.27, "elapsed_time": "0:10:54", "remaining_time": "5:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 1680, "loss": 1.4779, "learning_rate": 3.571428571428572e-05, "epoch": 0.214190093708166, "percentage": 3.57, "elapsed_time": "0:11:54", "remaining_time": "5:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 1680, "loss": 1.483, "learning_rate": 3.8690476190476195e-05, "epoch": 0.2320392681838465, "percentage": 3.87, "elapsed_time": "0:12:52", "remaining_time": "5:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 1680, "loss": 1.5022, "learning_rate": 4.166666666666667e-05, "epoch": 0.249888442659527, "percentage": 4.17, "elapsed_time": "0:13:52", "remaining_time": "5:19:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 1680, "eval_loss": 1.451762318611145, "epoch": 0.249888442659527, "percentage": 4.17, "elapsed_time": "0:14:10", "remaining_time": "5:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 1680, "loss": 1.4256, "learning_rate": 4.464285714285715e-05, "epoch": 0.2677376171352075, "percentage": 4.46, "elapsed_time": "0:15:11", "remaining_time": "5:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 1680, "loss": 1.3655, "learning_rate": 4.761904761904762e-05, "epoch": 0.285586791610888, "percentage": 4.76, "elapsed_time": "0:16:11", "remaining_time": "5:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 1680, "loss": 1.4478, "learning_rate": 5.05952380952381e-05, "epoch": 0.3034359660865685, "percentage": 5.06, "elapsed_time": "0:17:11", "remaining_time": "5:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 1680, "loss": 1.3305, "learning_rate": 5.3571428571428575e-05, "epoch": 0.321285140562249, "percentage": 5.36, "elapsed_time": "0:18:10", "remaining_time": "5:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 1680, "loss": 1.4279, "learning_rate": 5.6547619047619046e-05, "epoch": 0.3391343150379295, "percentage": 5.65, "elapsed_time": "0:19:08", "remaining_time": "5:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 1680, "loss": 1.4967, "learning_rate": 5.9523809523809524e-05, "epoch": 0.35698348951361, "percentage": 5.95, "elapsed_time": "0:20:08", "remaining_time": "5:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 1680, "loss": 1.4739, "learning_rate": 6.25e-05, "epoch": 0.3748326639892905, "percentage": 6.25, "elapsed_time": "0:21:07", "remaining_time": "5:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 1680, "loss": 1.3751, "learning_rate": 6.547619047619048e-05, "epoch": 0.392681838464971, "percentage": 6.55, "elapsed_time": "0:22:07", "remaining_time": "5:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 1680, "loss": 1.3699, "learning_rate": 6.845238095238096e-05, "epoch": 0.4105310129406515, "percentage": 6.85, "elapsed_time": "0:23:06", "remaining_time": "5:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 1680, "loss": 1.4696, "learning_rate": 7.142857142857143e-05, "epoch": 0.428380187416332, "percentage": 7.14, "elapsed_time": "0:24:07", "remaining_time": "5:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 1680, "loss": 1.4059, "learning_rate": 7.440476190476191e-05, "epoch": 0.4462293618920125, "percentage": 7.44, "elapsed_time": "0:25:06", "remaining_time": "5:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 1680, "loss": 1.3072, "learning_rate": 7.738095238095239e-05, "epoch": 0.464078536367693, "percentage": 7.74, "elapsed_time": "0:26:04", "remaining_time": "5:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 1680, "loss": 1.4132, "learning_rate": 8.035714285714287e-05, "epoch": 0.4819277108433735, "percentage": 8.04, "elapsed_time": "0:27:03", "remaining_time": "5:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 1680, "loss": 1.4121, "learning_rate": 8.333333333333334e-05, "epoch": 0.499776885319054, "percentage": 8.33, "elapsed_time": "0:28:02", "remaining_time": "5:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 1680, "eval_loss": 1.3727394342422485, "epoch": 0.499776885319054, "percentage": 8.33, "elapsed_time": "0:28:20", "remaining_time": "5:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 1680, "loss": 1.3109, "learning_rate": 8.630952380952382e-05, "epoch": 0.5176260597947345, "percentage": 8.63, "elapsed_time": "0:29:21", "remaining_time": "5:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 1680, "loss": 1.3781, "learning_rate": 8.92857142857143e-05, "epoch": 0.535475234270415, "percentage": 8.93, "elapsed_time": "0:30:21", "remaining_time": "5:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 1680, "loss": 1.3564, "learning_rate": 9.226190476190478e-05, "epoch": 0.5533244087460955, "percentage": 9.23, "elapsed_time": "0:31:20", "remaining_time": "5:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 1680, "loss": 1.2387, "learning_rate": 9.523809523809524e-05, "epoch": 0.571173583221776, "percentage": 9.52, "elapsed_time": "0:32:19", "remaining_time": "5:07:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 1680, "loss": 1.3042, "learning_rate": 9.821428571428572e-05, "epoch": 0.5890227576974565, "percentage": 9.82, "elapsed_time": "0:33:18", "remaining_time": "5:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 1680, "loss": 1.3709, "learning_rate": 9.999956828659095e-05, "epoch": 0.606871932173137, "percentage": 10.12, "elapsed_time": "0:34:18", "remaining_time": "5:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 1680, "loss": 1.3844, "learning_rate": 9.999471159635539e-05, "epoch": 0.6247211066488175, "percentage": 10.42, "elapsed_time": "0:35:18", "remaining_time": "5:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 1680, "loss": 1.2852, "learning_rate": 9.998445910004082e-05, "epoch": 0.642570281124498, "percentage": 10.71, "elapsed_time": "0:36:18", "remaining_time": "5:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 1680, "loss": 1.4652, "learning_rate": 9.996881190417393e-05, "epoch": 0.6604194556001785, "percentage": 11.01, "elapsed_time": "0:37:19", "remaining_time": "5:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 1680, "loss": 1.3743, "learning_rate": 9.994777169751806e-05, "epoch": 0.678268630075859, "percentage": 11.31, "elapsed_time": "0:38:19", "remaining_time": "5:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 1680, "loss": 1.2423, "learning_rate": 9.992134075089084e-05, "epoch": 0.6961178045515395, "percentage": 11.61, "elapsed_time": "0:39:19", "remaining_time": "4:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 1680, "loss": 1.3113, "learning_rate": 9.988952191691925e-05, "epoch": 0.71396697902722, "percentage": 11.9, "elapsed_time": "0:40:17", "remaining_time": "4:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 1680, "loss": 1.3524, "learning_rate": 9.985231862973168e-05, "epoch": 0.7318161535029005, "percentage": 12.2, "elapsed_time": "0:41:16", "remaining_time": "4:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 1680, "loss": 1.4038, "learning_rate": 9.980973490458728e-05, "epoch": 0.749665327978581, "percentage": 12.5, "elapsed_time": "0:42:16", "remaining_time": "4:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 1680, "eval_loss": 1.3051044940948486, "epoch": 0.749665327978581, "percentage": 12.5, "elapsed_time": "0:42:34", "remaining_time": "4:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 1680, "loss": 1.3626, "learning_rate": 9.976177533744261e-05, "epoch": 0.7675145024542614, "percentage": 12.8, "elapsed_time": "0:43:36", "remaining_time": "4:57:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 1680, "loss": 1.3232, "learning_rate": 9.97084451044556e-05, "epoch": 0.785363676929942, "percentage": 13.1, "elapsed_time": "0:44:35", "remaining_time": "4:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 1680, "loss": 1.2826, "learning_rate": 9.964974996142698e-05, "epoch": 0.8032128514056225, "percentage": 13.39, "elapsed_time": "0:45:34", "remaining_time": "4:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 1680, "loss": 1.2794, "learning_rate": 9.958569624317893e-05, "epoch": 0.821062025881303, "percentage": 13.69, "elapsed_time": "0:46:32", "remaining_time": "4:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 1680, "loss": 1.3853, "learning_rate": 9.951629086287151e-05, "epoch": 0.8389112003569835, "percentage": 13.99, "elapsed_time": "0:47:32", "remaining_time": "4:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 1680, "loss": 1.3533, "learning_rate": 9.944154131125642e-05, "epoch": 0.856760374832664, "percentage": 14.29, "elapsed_time": "0:48:31", "remaining_time": "4:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 1680, "loss": 1.3395, "learning_rate": 9.936145565586871e-05, "epoch": 0.8746095493083444, "percentage": 14.58, "elapsed_time": "0:49:30", "remaining_time": "4:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 1680, "loss": 1.443, "learning_rate": 9.927604254015585e-05, "epoch": 0.892458723784025, "percentage": 14.88, "elapsed_time": "0:50:30", "remaining_time": "4:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 1680, "loss": 1.398, "learning_rate": 9.918531118254507e-05, "epoch": 0.9103078982597055, "percentage": 15.18, "elapsed_time": "0:51:29", "remaining_time": "4:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 1680, "loss": 1.346, "learning_rate": 9.90892713754483e-05, "epoch": 0.928157072735386, "percentage": 15.48, "elapsed_time": "0:52:30", "remaining_time": "4:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 1680, "loss": 1.3921, "learning_rate": 9.898793348420536e-05, "epoch": 0.9460062472110665, "percentage": 15.77, "elapsed_time": "0:53:30", "remaining_time": "4:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 1680, "loss": 1.3838, "learning_rate": 9.888130844596524e-05, "epoch": 0.963855421686747, "percentage": 16.07, "elapsed_time": "0:54:30", "remaining_time": "4:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 1680, "loss": 1.3529, "learning_rate": 9.876940776850569e-05, "epoch": 0.9817045961624274, "percentage": 16.37, "elapsed_time": "0:55:31", "remaining_time": "4:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 1680, "loss": 1.2739, "learning_rate": 9.865224352899119e-05, "epoch": 0.999553770638108, "percentage": 16.67, "elapsed_time": "0:56:31", "remaining_time": "4:42:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 1680, "eval_loss": 1.289029836654663, "epoch": 0.999553770638108, "percentage": 16.67, "elapsed_time": "0:56:49", "remaining_time": "4:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 1680, "loss": 1.2339, "learning_rate": 9.852982837266955e-05, "epoch": 1.0174029451137885, "percentage": 16.96, "elapsed_time": "0:57:51", "remaining_time": "4:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 1680, "loss": 1.0982, "learning_rate": 9.840217551150706e-05, "epoch": 1.035252119589469, "percentage": 17.26, "elapsed_time": "0:58:49", "remaining_time": "4:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 1680, "loss": 1.2537, "learning_rate": 9.826929872276255e-05, "epoch": 1.0531012940651494, "percentage": 17.56, "elapsed_time": "0:59:50", "remaining_time": "4:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 1680, "loss": 1.1664, "learning_rate": 9.81312123475006e-05, "epoch": 1.07095046854083, "percentage": 17.86, "elapsed_time": "1:00:49", "remaining_time": "4:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 1680, "loss": 1.08, "learning_rate": 9.798793128904356e-05, "epoch": 1.0887996430165106, "percentage": 18.15, "elapsed_time": "1:01:49", "remaining_time": "4:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 1680, "loss": 1.1029, "learning_rate": 9.78394710113631e-05, "epoch": 1.106648817492191, "percentage": 18.45, "elapsed_time": "1:02:47", "remaining_time": "4:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 1680, "loss": 1.1524, "learning_rate": 9.768584753741134e-05, "epoch": 1.1244979919678715, "percentage": 18.75, "elapsed_time": "1:03:46", "remaining_time": "4:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 1680, "loss": 1.1328, "learning_rate": 9.752707744739145e-05, "epoch": 1.142347166443552, "percentage": 19.05, "elapsed_time": "1:04:46", "remaining_time": "4:35:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 1680, "loss": 1.1174, "learning_rate": 9.736317787696816e-05, "epoch": 1.1601963409192324, "percentage": 19.35, "elapsed_time": "1:05:47", "remaining_time": "4:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 1680, "loss": 1.0493, "learning_rate": 9.719416651541839e-05, "epoch": 1.178045515394913, "percentage": 19.64, "elapsed_time": "1:06:46", "remaining_time": "4:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 1680, "loss": 1.0479, "learning_rate": 9.702006160372209e-05, "epoch": 1.1958946898705936, "percentage": 19.94, "elapsed_time": "1:07:45", "remaining_time": "4:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 1680, "loss": 1.1043, "learning_rate": 9.684088193259355e-05, "epoch": 1.213743864346274, "percentage": 20.24, "elapsed_time": "1:08:43", "remaining_time": "4:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 1680, "loss": 1.1096, "learning_rate": 9.665664684045333e-05, "epoch": 1.2315930388219545, "percentage": 20.54, "elapsed_time": "1:09:43", "remaining_time": "4:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 1680, "loss": 1.1436, "learning_rate": 9.646737621134112e-05, "epoch": 1.249442213297635, "percentage": 20.83, "elapsed_time": "1:10:43", "remaining_time": "4:28:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 1680, "eval_loss": 1.3194608688354492, "epoch": 1.249442213297635, "percentage": 20.83, "elapsed_time": "1:11:01", "remaining_time": "4:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 355, "total_steps": 1680, "loss": 1.0549, "learning_rate": 9.627309047276974e-05, "epoch": 1.2672913877733154, "percentage": 21.13, "elapsed_time": "1:12:05", "remaining_time": "4:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 1680, "loss": 1.1576, "learning_rate": 9.607381059352038e-05, "epoch": 1.285140562248996, "percentage": 21.43, "elapsed_time": "1:13:05", "remaining_time": "4:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 365, "total_steps": 1680, "loss": 1.1246, "learning_rate": 9.586955808137958e-05, "epoch": 1.3029897367246766, "percentage": 21.73, "elapsed_time": "1:14:05", "remaining_time": "4:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 1680, "loss": 1.125, "learning_rate": 9.566035498081784e-05, "epoch": 1.320838911200357, "percentage": 22.02, "elapsed_time": "1:15:05", "remaining_time": "4:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 375, "total_steps": 1680, "loss": 1.1687, "learning_rate": 9.544622387061055e-05, "epoch": 1.3386880856760375, "percentage": 22.32, "elapsed_time": "1:16:05", "remaining_time": "4:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 1680, "loss": 0.9699, "learning_rate": 9.522718786140097e-05, "epoch": 1.356537260151718, "percentage": 22.62, "elapsed_time": "1:17:04", "remaining_time": "4:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 385, "total_steps": 1680, "loss": 1.1379, "learning_rate": 9.500327059320606e-05, "epoch": 1.3743864346273984, "percentage": 22.92, "elapsed_time": "1:18:03", "remaining_time": "4:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 1680, "loss": 1.0511, "learning_rate": 9.477449623286505e-05, "epoch": 1.392235609103079, "percentage": 23.21, "elapsed_time": "1:19:03", "remaining_time": "4:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 395, "total_steps": 1680, "loss": 1.0003, "learning_rate": 9.454088947143116e-05, "epoch": 1.4100847835787595, "percentage": 23.51, "elapsed_time": "1:20:03", "remaining_time": "4:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 1680, "loss": 1.1631, "learning_rate": 9.430247552150673e-05, "epoch": 1.42793395805444, "percentage": 23.81, "elapsed_time": "1:21:03", "remaining_time": "4:19:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 405, "total_steps": 1680, "loss": 1.045, "learning_rate": 9.405928011452211e-05, "epoch": 1.4457831325301205, "percentage": 24.11, "elapsed_time": "1:22:03", "remaining_time": "4:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 1680, "loss": 1.0511, "learning_rate": 9.381132949795861e-05, "epoch": 1.463632307005801, "percentage": 24.4, "elapsed_time": "1:23:04", "remaining_time": "4:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 415, "total_steps": 1680, "loss": 1.1637, "learning_rate": 9.35586504325155e-05, "epoch": 1.4814814814814814, "percentage": 24.7, "elapsed_time": "1:24:05", "remaining_time": "4:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 1680, "loss": 1.0783, "learning_rate": 9.330127018922194e-05, "epoch": 1.499330655957162, "percentage": 25.0, "elapsed_time": "1:25:05", "remaining_time": "4:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 1680, "eval_loss": 1.3106330633163452, "epoch": 1.499330655957162, "percentage": 25.0, "elapsed_time": "1:25:23", "remaining_time": "4:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 425, "total_steps": 1680, "loss": 1.0406, "learning_rate": 9.303921654649362e-05, "epoch": 1.5171798304328425, "percentage": 25.3, "elapsed_time": "1:26:23", "remaining_time": "4:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 1680, "loss": 1.1469, "learning_rate": 9.277251778713474e-05, "epoch": 1.5350290049085231, "percentage": 25.6, "elapsed_time": "1:27:23", "remaining_time": "4:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 435, "total_steps": 1680, "loss": 1.0453, "learning_rate": 9.250120269528546e-05, "epoch": 1.5528781793842035, "percentage": 25.89, "elapsed_time": "1:28:23", "remaining_time": "4:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 1680, "loss": 1.0611, "learning_rate": 9.22253005533154e-05, "epoch": 1.5707273538598838, "percentage": 26.19, "elapsed_time": "1:29:22", "remaining_time": "4:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 445, "total_steps": 1680, "loss": 1.082, "learning_rate": 9.194484113866313e-05, "epoch": 1.5885765283355644, "percentage": 26.49, "elapsed_time": "1:30:21", "remaining_time": "4:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 1680, "loss": 1.2404, "learning_rate": 9.165985472062246e-05, "epoch": 1.606425702811245, "percentage": 26.79, "elapsed_time": "1:31:18", "remaining_time": "4:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 455, "total_steps": 1680, "loss": 1.0436, "learning_rate": 9.137037205707552e-05, "epoch": 1.6242748772869255, "percentage": 27.08, "elapsed_time": "1:32:17", "remaining_time": "4:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 1680, "loss": 1.1227, "learning_rate": 9.107642439117321e-05, "epoch": 1.6421240517626061, "percentage": 27.38, "elapsed_time": "1:33:13", "remaining_time": "4:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 465, "total_steps": 1680, "loss": 1.0858, "learning_rate": 9.077804344796302e-05, "epoch": 1.6599732262382865, "percentage": 27.68, "elapsed_time": "1:34:15", "remaining_time": "4:06:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 1680, "loss": 1.0998, "learning_rate": 9.04752614309652e-05, "epoch": 1.6778224007139668, "percentage": 27.98, "elapsed_time": "1:35:16", "remaining_time": "4:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 475, "total_steps": 1680, "loss": 1.0433, "learning_rate": 9.01681110186971e-05, "epoch": 1.6956715751896474, "percentage": 28.27, "elapsed_time": "1:36:15", "remaining_time": "4:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 1680, "loss": 1.0798, "learning_rate": 8.985662536114613e-05, "epoch": 1.713520749665328, "percentage": 28.57, "elapsed_time": "1:37:14", "remaining_time": "4:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 485, "total_steps": 1680, "loss": 1.1012, "learning_rate": 8.954083807619208e-05, "epoch": 1.7313699241410085, "percentage": 28.87, "elapsed_time": "1:38:13", "remaining_time": "4:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 1680, "loss": 1.1219, "learning_rate": 8.922078324597879e-05, "epoch": 1.7492190986166891, "percentage": 29.17, "elapsed_time": "1:39:13", "remaining_time": "4:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 1680, "eval_loss": 1.3044873476028442, "epoch": 1.7492190986166891, "percentage": 29.17, "elapsed_time": "1:39:31", "remaining_time": "4:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 495, "total_steps": 1680, "loss": 1.16, "learning_rate": 8.889649541323574e-05, "epoch": 1.7670682730923695, "percentage": 29.46, "elapsed_time": "1:40:32", "remaining_time": "4:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 1680, "loss": 1.091, "learning_rate": 8.856800957755e-05, "epoch": 1.7849174475680498, "percentage": 29.76, "elapsed_time": "1:41:32", "remaining_time": "3:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 505, "total_steps": 1680, "loss": 1.072, "learning_rate": 8.823536119158864e-05, "epoch": 1.8027666220437304, "percentage": 30.06, "elapsed_time": "1:42:34", "remaining_time": "3:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 1680, "loss": 1.0635, "learning_rate": 8.789858615727265e-05, "epoch": 1.820615796519411, "percentage": 30.36, "elapsed_time": "1:43:32", "remaining_time": "3:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 515, "total_steps": 1680, "loss": 1.0258, "learning_rate": 8.755772082190194e-05, "epoch": 1.8384649709950915, "percentage": 30.65, "elapsed_time": "1:44:31", "remaining_time": "3:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 1680, "loss": 1.2011, "learning_rate": 8.721280197423258e-05, "epoch": 1.8563141454707721, "percentage": 30.95, "elapsed_time": "1:45:32", "remaining_time": "3:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 525, "total_steps": 1680, "loss": 1.0539, "learning_rate": 8.68638668405062e-05, "epoch": 1.8741633199464525, "percentage": 31.25, "elapsed_time": "1:46:30", "remaining_time": "3:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 1680, "loss": 1.0948, "learning_rate": 8.651095308043232e-05, "epoch": 1.8920124944221328, "percentage": 31.55, "elapsed_time": "1:47:29", "remaining_time": "3:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 535, "total_steps": 1680, "loss": 1.1245, "learning_rate": 8.61540987831238e-05, "epoch": 1.9098616688978134, "percentage": 31.85, "elapsed_time": "1:48:28", "remaining_time": "3:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 1680, "loss": 1.2039, "learning_rate": 8.579334246298593e-05, "epoch": 1.927710843373494, "percentage": 32.14, "elapsed_time": "1:49:28", "remaining_time": "3:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 545, "total_steps": 1680, "loss": 1.1077, "learning_rate": 8.542872305555978e-05, "epoch": 1.9455600178491745, "percentage": 32.44, "elapsed_time": "1:50:27", "remaining_time": "3:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 1680, "loss": 1.0603, "learning_rate": 8.50602799133199e-05, "epoch": 1.9634091923248551, "percentage": 32.74, "elapsed_time": "1:51:26", "remaining_time": "3:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 555, "total_steps": 1680, "loss": 1.1376, "learning_rate": 8.468805280142709e-05, "epoch": 1.9812583668005355, "percentage": 33.04, "elapsed_time": "1:52:27", "remaining_time": "3:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 1680, "loss": 1.0966, "learning_rate": 8.43120818934367e-05, "epoch": 1.9991075412762158, "percentage": 33.33, "elapsed_time": "1:53:26", "remaining_time": "3:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 1680, "eval_loss": 1.3094360828399658, "epoch": 1.9991075412762158, "percentage": 33.33, "elapsed_time": "1:53:44", "remaining_time": "3:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 565, "total_steps": 1680, "loss": 0.6867, "learning_rate": 8.393240776696274e-05, "epoch": 2.0169567157518964, "percentage": 33.63, "elapsed_time": "1:54:44", "remaining_time": "3:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 1680, "loss": 0.6025, "learning_rate": 8.354907139929851e-05, "epoch": 2.034805890227577, "percentage": 33.93, "elapsed_time": "1:55:43", "remaining_time": "3:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 575, "total_steps": 1680, "loss": 0.6497, "learning_rate": 8.316211416299397e-05, "epoch": 2.0526550647032575, "percentage": 34.23, "elapsed_time": "1:56:43", "remaining_time": "3:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 1680, "loss": 0.5803, "learning_rate": 8.27715778213905e-05, "epoch": 2.070504239178938, "percentage": 34.52, "elapsed_time": "1:57:41", "remaining_time": "3:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 585, "total_steps": 1680, "loss": 0.494, "learning_rate": 8.237750452411353e-05, "epoch": 2.0883534136546187, "percentage": 34.82, "elapsed_time": "1:58:39", "remaining_time": "3:42:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 1680, "loss": 0.6428, "learning_rate": 8.197993680252334e-05, "epoch": 2.106202588130299, "percentage": 35.12, "elapsed_time": "1:59:40", "remaining_time": "3:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 595, "total_steps": 1680, "loss": 0.6612, "learning_rate": 8.157891756512488e-05, "epoch": 2.1240517626059794, "percentage": 35.42, "elapsed_time": "2:00:41", "remaining_time": "3:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 1680, "loss": 0.5783, "learning_rate": 8.117449009293668e-05, "epoch": 2.14190093708166, "percentage": 35.71, "elapsed_time": "2:01:41", "remaining_time": "3:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 605, "total_steps": 1680, "loss": 0.5799, "learning_rate": 8.076669803481965e-05, "epoch": 2.1597501115573405, "percentage": 36.01, "elapsed_time": "2:02:40", "remaining_time": "3:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 1680, "loss": 0.5344, "learning_rate": 8.035558540276618e-05, "epoch": 2.177599286033021, "percentage": 36.31, "elapsed_time": "2:03:38", "remaining_time": "3:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 615, "total_steps": 1680, "loss": 0.5605, "learning_rate": 7.994119656715002e-05, "epoch": 2.1954484605087012, "percentage": 36.61, "elapsed_time": "2:04:38", "remaining_time": "3:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 1680, "loss": 0.5923, "learning_rate": 7.952357625193749e-05, "epoch": 2.213297634984382, "percentage": 36.9, "elapsed_time": "2:05:38", "remaining_time": "3:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 625, "total_steps": 1680, "loss": 0.6067, "learning_rate": 7.91027695298606e-05, "epoch": 2.2311468094600624, "percentage": 37.2, "elapsed_time": "2:06:36", "remaining_time": "3:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 1680, "loss": 0.6134, "learning_rate": 7.86788218175523e-05, "epoch": 2.248995983935743, "percentage": 37.5, "elapsed_time": "2:07:36", "remaining_time": "3:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 1680, "eval_loss": 1.4945974349975586, "epoch": 2.248995983935743, "percentage": 37.5, "elapsed_time": "2:07:53", "remaining_time": "3:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 635, "total_steps": 1680, "loss": 0.5798, "learning_rate": 7.8251778870645e-05, "epoch": 2.2668451584114235, "percentage": 37.8, "elapsed_time": "2:08:53", "remaining_time": "3:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 1680, "loss": 0.5705, "learning_rate": 7.782168677883206e-05, "epoch": 2.284694332887104, "percentage": 38.1, "elapsed_time": "2:09:52", "remaining_time": "3:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 645, "total_steps": 1680, "loss": 0.6119, "learning_rate": 7.738859196089358e-05, "epoch": 2.3025435073627847, "percentage": 38.39, "elapsed_time": "2:10:51", "remaining_time": "3:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 1680, "loss": 0.6352, "learning_rate": 7.695254115968648e-05, "epoch": 2.320392681838465, "percentage": 38.69, "elapsed_time": "2:11:49", "remaining_time": "3:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 655, "total_steps": 1680, "loss": 0.6341, "learning_rate": 7.651358143709972e-05, "epoch": 2.3382418563141454, "percentage": 38.99, "elapsed_time": "2:12:50", "remaining_time": "3:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 1680, "loss": 0.6695, "learning_rate": 7.60717601689749e-05, "epoch": 2.356091030789826, "percentage": 39.29, "elapsed_time": "2:13:49", "remaining_time": "3:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 665, "total_steps": 1680, "loss": 0.5715, "learning_rate": 7.562712503999327e-05, "epoch": 2.3739402052655065, "percentage": 39.58, "elapsed_time": "2:14:50", "remaining_time": "3:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 1680, "loss": 0.7753, "learning_rate": 7.517972403852905e-05, "epoch": 2.391789379741187, "percentage": 39.88, "elapsed_time": "2:15:52", "remaining_time": "3:24:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 675, "total_steps": 1680, "loss": 0.5529, "learning_rate": 7.472960545147038e-05, "epoch": 2.4096385542168672, "percentage": 40.18, "elapsed_time": "2:16:50", "remaining_time": "3:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 1680, "loss": 0.5715, "learning_rate": 7.427681785900761e-05, "epoch": 2.427487728692548, "percentage": 40.48, "elapsed_time": "2:17:49", "remaining_time": "3:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 685, "total_steps": 1680, "loss": 0.6085, "learning_rate": 7.382141012939034e-05, "epoch": 2.4453369031682284, "percentage": 40.77, "elapsed_time": "2:18:49", "remaining_time": "3:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 1680, "loss": 0.627, "learning_rate": 7.33634314136531e-05, "epoch": 2.463186077643909, "percentage": 41.07, "elapsed_time": "2:19:48", "remaining_time": "3:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 695, "total_steps": 1680, "loss": 0.6403, "learning_rate": 7.290293114031061e-05, "epoch": 2.4810352521195895, "percentage": 41.37, "elapsed_time": "2:20:47", "remaining_time": "3:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 1680, "loss": 0.6342, "learning_rate": 7.243995901002312e-05, "epoch": 2.49888442659527, "percentage": 41.67, "elapsed_time": "2:21:46", "remaining_time": "3:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 1680, "eval_loss": 1.4858874082565308, "epoch": 2.49888442659527, "percentage": 41.67, "elapsed_time": "2:22:04", "remaining_time": "3:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 705, "total_steps": 1680, "loss": 0.5921, "learning_rate": 7.197456499023225e-05, "epoch": 2.5167336010709507, "percentage": 41.96, "elapsed_time": "2:23:06", "remaining_time": "3:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 1680, "loss": 0.5873, "learning_rate": 7.150679930976825e-05, "epoch": 2.534582775546631, "percentage": 42.26, "elapsed_time": "2:24:06", "remaining_time": "3:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 715, "total_steps": 1680, "loss": 0.6661, "learning_rate": 7.103671245342887e-05, "epoch": 2.5524319500223114, "percentage": 42.56, "elapsed_time": "2:25:06", "remaining_time": "3:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 1680, "loss": 0.5388, "learning_rate": 7.056435515653059e-05, "epoch": 2.570281124497992, "percentage": 42.86, "elapsed_time": "2:26:04", "remaining_time": "3:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 725, "total_steps": 1680, "loss": 0.6641, "learning_rate": 7.008977839943299e-05, "epoch": 2.5881302989736725, "percentage": 43.15, "elapsed_time": "2:27:05", "remaining_time": "3:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 1680, "loss": 0.6221, "learning_rate": 6.961303340203653e-05, "epoch": 2.605979473449353, "percentage": 43.45, "elapsed_time": "2:28:04", "remaining_time": "3:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 735, "total_steps": 1680, "loss": 0.599, "learning_rate": 6.91341716182545e-05, "epoch": 2.6238286479250332, "percentage": 43.75, "elapsed_time": "2:29:04", "remaining_time": "3:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 1680, "loss": 0.6047, "learning_rate": 6.86532447304597e-05, "epoch": 2.641677822400714, "percentage": 44.05, "elapsed_time": "2:30:05", "remaining_time": "3:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 745, "total_steps": 1680, "loss": 0.614, "learning_rate": 6.817030464390656e-05, "epoch": 2.6595269968763944, "percentage": 44.35, "elapsed_time": "2:31:02", "remaining_time": "3:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 1680, "loss": 0.6367, "learning_rate": 6.768540348112907e-05, "epoch": 2.677376171352075, "percentage": 44.64, "elapsed_time": "2:32:03", "remaining_time": "3:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 755, "total_steps": 1680, "loss": 0.5681, "learning_rate": 6.719859357631535e-05, "epoch": 2.6952253458277555, "percentage": 44.94, "elapsed_time": "2:33:01", "remaining_time": "3:07:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 1680, "loss": 0.5723, "learning_rate": 6.670992746965938e-05, "epoch": 2.713074520303436, "percentage": 45.24, "elapsed_time": "2:33:59", "remaining_time": "3:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 765, "total_steps": 1680, "loss": 0.6385, "learning_rate": 6.621945790169036e-05, "epoch": 2.7309236947791167, "percentage": 45.54, "elapsed_time": "2:35:00", "remaining_time": "3:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 1680, "loss": 0.6665, "learning_rate": 6.572723780758069e-05, "epoch": 2.748772869254797, "percentage": 45.83, "elapsed_time": "2:35:59", "remaining_time": "3:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 1680, "eval_loss": 1.5236101150512695, "epoch": 2.748772869254797, "percentage": 45.83, "elapsed_time": "2:36:16", "remaining_time": "3:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 775, "total_steps": 1680, "loss": 0.6083, "learning_rate": 6.523332031143272e-05, "epoch": 2.7666220437304774, "percentage": 46.13, "elapsed_time": "2:37:17", "remaining_time": "3:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 1680, "loss": 0.6493, "learning_rate": 6.473775872054521e-05, "epoch": 2.784471218206158, "percentage": 46.43, "elapsed_time": "2:38:17", "remaining_time": "3:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 785, "total_steps": 1680, "loss": 0.5722, "learning_rate": 6.424060651966007e-05, "epoch": 2.8023203926818385, "percentage": 46.73, "elapsed_time": "2:39:15", "remaining_time": "3:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 1680, "loss": 0.611, "learning_rate": 6.374191736518974e-05, "epoch": 2.820169567157519, "percentage": 47.02, "elapsed_time": "2:40:14", "remaining_time": "3:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 795, "total_steps": 1680, "loss": 0.6202, "learning_rate": 6.324174507942637e-05, "epoch": 2.8380187416331992, "percentage": 47.32, "elapsed_time": "2:41:14", "remaining_time": "2:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 1680, "loss": 0.5593, "learning_rate": 6.274014364473274e-05, "epoch": 2.85586791610888, "percentage": 47.62, "elapsed_time": "2:42:12", "remaining_time": "2:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 805, "total_steps": 1680, "loss": 0.7415, "learning_rate": 6.22371671977162e-05, "epoch": 2.8737170905845604, "percentage": 47.92, "elapsed_time": "2:43:14", "remaining_time": "2:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 1680, "loss": 0.6544, "learning_rate": 6.173287002338577e-05, "epoch": 2.891566265060241, "percentage": 48.21, "elapsed_time": "2:44:14", "remaining_time": "2:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 815, "total_steps": 1680, "loss": 0.6421, "learning_rate": 6.122730654929334e-05, "epoch": 2.9094154395359215, "percentage": 48.51, "elapsed_time": "2:45:12", "remaining_time": "2:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 1680, "loss": 0.6332, "learning_rate": 6.072053133965938e-05, "epoch": 2.927264614011602, "percentage": 48.81, "elapsed_time": "2:46:12", "remaining_time": "2:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 825, "total_steps": 1680, "loss": 0.6508, "learning_rate": 6.021259908948402e-05, "epoch": 2.9451137884872827, "percentage": 49.11, "elapsed_time": "2:47:11", "remaining_time": "2:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 1680, "loss": 0.621, "learning_rate": 5.970356461864391e-05, "epoch": 2.962962962962963, "percentage": 49.4, "elapsed_time": "2:48:11", "remaining_time": "2:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 835, "total_steps": 1680, "loss": 0.6347, "learning_rate": 5.919348286597569e-05, "epoch": 2.9808121374386434, "percentage": 49.7, "elapsed_time": "2:49:10", "remaining_time": "2:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 1680, "loss": 0.6101, "learning_rate": 5.868240888334653e-05, "epoch": 2.998661311914324, "percentage": 50.0, "elapsed_time": "2:50:11", "remaining_time": "2:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 1680, "eval_loss": 1.5220016241073608, "epoch": 2.998661311914324, "percentage": 50.0, "elapsed_time": "2:50:29", "remaining_time": "2:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 845, "total_steps": 1680, "loss": 0.4183, "learning_rate": 5.8170397829712485e-05, "epoch": 3.0165104863900045, "percentage": 50.3, "elapsed_time": "2:51:31", "remaining_time": "2:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 1680, "loss": 0.1667, "learning_rate": 5.765750496516547e-05, "epoch": 3.034359660865685, "percentage": 50.6, "elapsed_time": "2:52:28", "remaining_time": "2:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 855, "total_steps": 1680, "loss": 0.255, "learning_rate": 5.714378564496901e-05, "epoch": 3.0522088353413657, "percentage": 50.89, "elapsed_time": "2:53:28", "remaining_time": "2:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 1680, "loss": 0.2424, "learning_rate": 5.6629295313583974e-05, "epoch": 3.070058009817046, "percentage": 51.19, "elapsed_time": "2:54:28", "remaining_time": "2:46:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 865, "total_steps": 1680, "loss": 0.2097, "learning_rate": 5.611408949868457e-05, "epoch": 3.0879071842927264, "percentage": 51.49, "elapsed_time": "2:55:28", "remaining_time": "2:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 1680, "loss": 0.2271, "learning_rate": 5.559822380516539e-05, "epoch": 3.105756358768407, "percentage": 51.79, "elapsed_time": "2:56:27", "remaining_time": "2:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 875, "total_steps": 1680, "loss": 0.1982, "learning_rate": 5.5081753909140096e-05, "epoch": 3.1236055332440875, "percentage": 52.08, "elapsed_time": "2:57:26", "remaining_time": "2:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 1680, "loss": 0.2192, "learning_rate": 5.456473555193242e-05, "epoch": 3.141454707719768, "percentage": 52.38, "elapsed_time": "2:58:27", "remaining_time": "2:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 885, "total_steps": 1680, "loss": 0.2097, "learning_rate": 5.404722453406017e-05, "epoch": 3.1593038821954487, "percentage": 52.68, "elapsed_time": "2:59:25", "remaining_time": "2:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 1680, "loss": 0.2213, "learning_rate": 5.3529276709212816e-05, "epoch": 3.177153056671129, "percentage": 52.98, "elapsed_time": "3:00:24", "remaining_time": "2:40:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 895, "total_steps": 1680, "loss": 0.2559, "learning_rate": 5.30109479782233e-05, "epoch": 3.1950022311468094, "percentage": 53.27, "elapsed_time": "3:01:24", "remaining_time": "2:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 1680, "loss": 0.1955, "learning_rate": 5.249229428303486e-05, "epoch": 3.21285140562249, "percentage": 53.57, "elapsed_time": "3:02:22", "remaining_time": "2:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 905, "total_steps": 1680, "loss": 0.2642, "learning_rate": 5.197337160066331e-05, "epoch": 3.2307005800981705, "percentage": 53.87, "elapsed_time": "3:03:23", "remaining_time": "2:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 1680, "loss": 0.2467, "learning_rate": 5.145423593715557e-05, "epoch": 3.248549754573851, "percentage": 54.17, "elapsed_time": "3:04:23", "remaining_time": "2:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 1680, "eval_loss": 1.8390079736709595, "epoch": 3.248549754573851, "percentage": 54.17, "elapsed_time": "3:04:41", "remaining_time": "2:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 915, "total_steps": 1680, "loss": 0.2239, "learning_rate": 5.0934943321545115e-05, "epoch": 3.266398929049531, "percentage": 54.46, "elapsed_time": "3:05:43", "remaining_time": "2:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 1680, "loss": 0.1545, "learning_rate": 5.041554979980486e-05, "epoch": 3.284248103525212, "percentage": 54.76, "elapsed_time": "3:06:42", "remaining_time": "2:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 925, "total_steps": 1680, "loss": 0.2819, "learning_rate": 4.9896111428798254e-05, "epoch": 3.3020972780008924, "percentage": 55.06, "elapsed_time": "3:07:43", "remaining_time": "2:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 1680, "loss": 0.3043, "learning_rate": 4.9376684270229254e-05, "epoch": 3.319946452476573, "percentage": 55.36, "elapsed_time": "3:08:44", "remaining_time": "2:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 935, "total_steps": 1680, "loss": 0.2494, "learning_rate": 4.8857324384591653e-05, "epoch": 3.3377956269522535, "percentage": 55.65, "elapsed_time": "3:09:45", "remaining_time": "2:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 1680, "loss": 0.2271, "learning_rate": 4.8338087825118675e-05, "epoch": 3.355644801427934, "percentage": 55.95, "elapsed_time": "3:10:44", "remaining_time": "2:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 945, "total_steps": 1680, "loss": 0.242, "learning_rate": 4.781903063173321e-05, "epoch": 3.3734939759036147, "percentage": 56.25, "elapsed_time": "3:11:45", "remaining_time": "2:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 1680, "loss": 0.2244, "learning_rate": 4.730020882499964e-05, "epoch": 3.391343150379295, "percentage": 56.55, "elapsed_time": "3:12:43", "remaining_time": "2:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 955, "total_steps": 1680, "loss": 0.2552, "learning_rate": 4.678167840007767e-05, "epoch": 3.4091923248549754, "percentage": 56.85, "elapsed_time": "3:13:43", "remaining_time": "2:27:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 1680, "loss": 0.2542, "learning_rate": 4.626349532067879e-05, "epoch": 3.427041499330656, "percentage": 57.14, "elapsed_time": "3:14:43", "remaining_time": "2:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 965, "total_steps": 1680, "loss": 0.3249, "learning_rate": 4.574571551302647e-05, "epoch": 3.4448906738063365, "percentage": 57.44, "elapsed_time": "3:15:44", "remaining_time": "2:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 1680, "loss": 0.2729, "learning_rate": 4.522839485981994e-05, "epoch": 3.462739848282017, "percentage": 57.74, "elapsed_time": "3:16:45", "remaining_time": "2:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 975, "total_steps": 1680, "loss": 0.2595, "learning_rate": 4.471158919420312e-05, "epoch": 3.480589022757697, "percentage": 58.04, "elapsed_time": "3:17:45", "remaining_time": "2:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 1680, "loss": 0.2284, "learning_rate": 4.4195354293738484e-05, "epoch": 3.498438197233378, "percentage": 58.33, "elapsed_time": "3:18:43", "remaining_time": "2:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 1680, "eval_loss": 1.82525634765625, "epoch": 3.498438197233378, "percentage": 58.33, "elapsed_time": "3:19:01", "remaining_time": "2:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 985, "total_steps": 1680, "loss": 0.1947, "learning_rate": 4.367974587438733e-05, "epoch": 3.5162873717090584, "percentage": 58.63, "elapsed_time": "3:20:01", "remaining_time": "2:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 1680, "loss": 0.2352, "learning_rate": 4.316481958449634e-05, "epoch": 3.534136546184739, "percentage": 58.93, "elapsed_time": "3:21:01", "remaining_time": "2:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 995, "total_steps": 1680, "loss": 0.2047, "learning_rate": 4.2650630998791615e-05, "epoch": 3.5519857206604195, "percentage": 59.23, "elapsed_time": "3:22:00", "remaining_time": "2:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 1680, "loss": 0.2369, "learning_rate": 4.213723561238074e-05, "epoch": 3.5698348951361, "percentage": 59.52, "elapsed_time": "3:23:01", "remaining_time": "2:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1005, "total_steps": 1680, "loss": 0.2416, "learning_rate": 4.162468883476319e-05, "epoch": 3.5876840696117807, "percentage": 59.82, "elapsed_time": "3:23:59", "remaining_time": "2:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 1680, "loss": 0.2353, "learning_rate": 4.111304598385018e-05, "epoch": 3.605533244087461, "percentage": 60.12, "elapsed_time": "3:25:00", "remaining_time": "2:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1015, "total_steps": 1680, "loss": 0.2155, "learning_rate": 4.060236227999441e-05, "epoch": 3.6233824185631414, "percentage": 60.42, "elapsed_time": "3:25:59", "remaining_time": "2:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 1680, "loss": 0.2241, "learning_rate": 4.0092692840030134e-05, "epoch": 3.641231593038822, "percentage": 60.71, "elapsed_time": "3:26:59", "remaining_time": "2:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1025, "total_steps": 1680, "loss": 0.2408, "learning_rate": 3.9584092671324606e-05, "epoch": 3.6590807675145025, "percentage": 61.01, "elapsed_time": "3:27:58", "remaining_time": "2:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 1680, "loss": 0.2423, "learning_rate": 3.907661666584131e-05, "epoch": 3.676929941990183, "percentage": 61.31, "elapsed_time": "3:28:58", "remaining_time": "2:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1035, "total_steps": 1680, "loss": 0.2581, "learning_rate": 3.857031959421553e-05, "epoch": 3.694779116465863, "percentage": 61.61, "elapsed_time": "3:29:57", "remaining_time": "2:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 1680, "loss": 0.206, "learning_rate": 3.806525609984312e-05, "epoch": 3.7126282909415442, "percentage": 61.9, "elapsed_time": "3:30:57", "remaining_time": "2:09:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1045, "total_steps": 1680, "loss": 0.1956, "learning_rate": 3.7561480692983006e-05, "epoch": 3.7304774654172244, "percentage": 62.2, "elapsed_time": "3:31:55", "remaining_time": "2:08:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 1680, "loss": 0.2839, "learning_rate": 3.705904774487396e-05, "epoch": 3.748326639892905, "percentage": 62.5, "elapsed_time": "3:32:55", "remaining_time": "2:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 1680, "eval_loss": 1.8687995672225952, "epoch": 3.748326639892905, "percentage": 62.5, "elapsed_time": "3:33:12", "remaining_time": "2:07:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1055, "total_steps": 1680, "loss": 0.2433, "learning_rate": 3.655801148186655e-05, "epoch": 3.7661758143685855, "percentage": 62.8, "elapsed_time": "3:34:14", "remaining_time": "2:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 1680, "loss": 0.2085, "learning_rate": 3.6058425979570485e-05, "epoch": 3.784024988844266, "percentage": 63.1, "elapsed_time": "3:35:11", "remaining_time": "2:05:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1065, "total_steps": 1680, "loss": 0.2277, "learning_rate": 3.556034515701852e-05, "epoch": 3.8018741633199467, "percentage": 63.39, "elapsed_time": "3:36:09", "remaining_time": "2:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 1680, "loss": 0.2497, "learning_rate": 3.506382277084696e-05, "epoch": 3.819723337795627, "percentage": 63.69, "elapsed_time": "3:37:08", "remaining_time": "2:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1075, "total_steps": 1680, "loss": 0.2462, "learning_rate": 3.4568912409493945e-05, "epoch": 3.8375725122713074, "percentage": 63.99, "elapsed_time": "3:38:07", "remaining_time": "2:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 1680, "loss": 0.2004, "learning_rate": 3.4075667487415785e-05, "epoch": 3.855421686746988, "percentage": 64.29, "elapsed_time": "3:39:05", "remaining_time": "2:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1085, "total_steps": 1680, "loss": 0.226, "learning_rate": 3.358414123932195e-05, "epoch": 3.8732708612226685, "percentage": 64.58, "elapsed_time": "3:40:05", "remaining_time": "2:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 1680, "loss": 0.2114, "learning_rate": 3.3094386714429724e-05, "epoch": 3.891120035698349, "percentage": 64.88, "elapsed_time": "3:41:05", "remaining_time": "1:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1095, "total_steps": 1680, "loss": 0.2694, "learning_rate": 3.2606456770738636e-05, "epoch": 3.908969210174029, "percentage": 65.18, "elapsed_time": "3:42:05", "remaining_time": "1:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 1680, "loss": 0.1828, "learning_rate": 3.212040406932569e-05, "epoch": 3.9268183846497102, "percentage": 65.48, "elapsed_time": "3:43:04", "remaining_time": "1:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1105, "total_steps": 1680, "loss": 0.1451, "learning_rate": 3.163628106866172e-05, "epoch": 3.9446675591253904, "percentage": 65.77, "elapsed_time": "3:44:01", "remaining_time": "1:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 1680, "loss": 0.2349, "learning_rate": 3.115414001894974e-05, "epoch": 3.962516733601071, "percentage": 66.07, "elapsed_time": "3:45:02", "remaining_time": "1:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1115, "total_steps": 1680, "loss": 0.2235, "learning_rate": 3.067403295648566e-05, "epoch": 3.9803659080767515, "percentage": 66.37, "elapsed_time": "3:46:00", "remaining_time": "1:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 1680, "loss": 0.2111, "learning_rate": 3.019601169804216e-05, "epoch": 3.998215082552432, "percentage": 66.67, "elapsed_time": "3:47:00", "remaining_time": "1:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 1680, "eval_loss": 1.891045093536377, "epoch": 3.998215082552432, "percentage": 66.67, "elapsed_time": "3:47:17", "remaining_time": "1:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1125, "total_steps": 1680, "loss": 0.1074, "learning_rate": 2.9720127835276256e-05, "epoch": 4.016064257028113, "percentage": 66.96, "elapsed_time": "3:48:19", "remaining_time": "1:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 1680, "loss": 0.0628, "learning_rate": 2.9246432729161055e-05, "epoch": 4.033913431503793, "percentage": 67.26, "elapsed_time": "3:49:19", "remaining_time": "1:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1135, "total_steps": 1680, "loss": 0.0615, "learning_rate": 2.8774977504442647e-05, "epoch": 4.051762605979474, "percentage": 67.56, "elapsed_time": "3:50:19", "remaining_time": "1:50:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 1680, "loss": 0.0658, "learning_rate": 2.8305813044122097e-05, "epoch": 4.069611780455154, "percentage": 67.86, "elapsed_time": "3:51:17", "remaining_time": "1:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1145, "total_steps": 1680, "loss": 0.0458, "learning_rate": 2.7838989983964065e-05, "epoch": 4.087460954930834, "percentage": 68.15, "elapsed_time": "3:52:15", "remaining_time": "1:48:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 1680, "loss": 0.0877, "learning_rate": 2.737455870703155e-05, "epoch": 4.105310129406515, "percentage": 68.45, "elapsed_time": "3:53:14", "remaining_time": "1:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1155, "total_steps": 1680, "loss": 0.0567, "learning_rate": 2.6912569338248315e-05, "epoch": 4.123159303882195, "percentage": 68.75, "elapsed_time": "3:54:12", "remaining_time": "1:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 1680, "loss": 0.0817, "learning_rate": 2.645307173898901e-05, "epoch": 4.141008478357876, "percentage": 69.05, "elapsed_time": "3:55:13", "remaining_time": "1:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1165, "total_steps": 1680, "loss": 0.0517, "learning_rate": 2.5996115501697694e-05, "epoch": 4.158857652833556, "percentage": 69.35, "elapsed_time": "3:56:13", "remaining_time": "1:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 1680, "loss": 0.0649, "learning_rate": 2.5541749944535554e-05, "epoch": 4.176706827309237, "percentage": 69.64, "elapsed_time": "3:57:12", "remaining_time": "1:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1175, "total_steps": 1680, "loss": 0.0613, "learning_rate": 2.5090024106057962e-05, "epoch": 4.1945560017849175, "percentage": 69.94, "elapsed_time": "3:58:11", "remaining_time": "1:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 1680, "loss": 0.0763, "learning_rate": 2.464098673992205e-05, "epoch": 4.212405176260598, "percentage": 70.24, "elapsed_time": "3:59:11", "remaining_time": "1:41:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1185, "total_steps": 1680, "loss": 0.0733, "learning_rate": 2.4194686309624663e-05, "epoch": 4.230254350736279, "percentage": 70.54, "elapsed_time": "4:00:10", "remaining_time": "1:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 1680, "loss": 0.0753, "learning_rate": 2.3751170983272e-05, "epoch": 4.248103525211959, "percentage": 70.83, "elapsed_time": "4:01:10", "remaining_time": "1:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 1680, "eval_loss": 2.2224178314208984, "epoch": 4.248103525211959, "percentage": 70.83, "elapsed_time": "4:01:28", "remaining_time": "1:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1195, "total_steps": 1680, "loss": 0.0839, "learning_rate": 2.3310488628380757e-05, "epoch": 4.26595269968764, "percentage": 71.13, "elapsed_time": "4:02:29", "remaining_time": "1:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 1680, "loss": 0.0811, "learning_rate": 2.2872686806712035e-05, "epoch": 4.28380187416332, "percentage": 71.43, "elapsed_time": "4:03:27", "remaining_time": "1:37:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1205, "total_steps": 1680, "loss": 0.0783, "learning_rate": 2.243781276913811e-05, "epoch": 4.301651048639, "percentage": 71.73, "elapsed_time": "4:04:28", "remaining_time": "1:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 1680, "loss": 0.0488, "learning_rate": 2.200591345054267e-05, "epoch": 4.319500223114681, "percentage": 72.02, "elapsed_time": "4:05:27", "remaining_time": "1:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1215, "total_steps": 1680, "loss": 0.0704, "learning_rate": 2.157703546475539e-05, "epoch": 4.337349397590361, "percentage": 72.32, "elapsed_time": "4:06:26", "remaining_time": "1:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 1680, "loss": 0.0653, "learning_rate": 2.115122509952085e-05, "epoch": 4.355198572066042, "percentage": 72.62, "elapsed_time": "4:07:26", "remaining_time": "1:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1225, "total_steps": 1680, "loss": 0.0471, "learning_rate": 2.0728528311502976e-05, "epoch": 4.373047746541722, "percentage": 72.92, "elapsed_time": "4:08:24", "remaining_time": "1:32:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 1680, "loss": 0.0757, "learning_rate": 2.0308990721324927e-05, "epoch": 4.3908969210174025, "percentage": 73.21, "elapsed_time": "4:09:26", "remaining_time": "1:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1235, "total_steps": 1680, "loss": 0.0456, "learning_rate": 1.989265760864542e-05, "epoch": 4.4087460954930835, "percentage": 73.51, "elapsed_time": "4:10:25", "remaining_time": "1:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 1680, "loss": 0.0555, "learning_rate": 1.947957390727185e-05, "epoch": 4.426595269968764, "percentage": 73.81, "elapsed_time": "4:11:25", "remaining_time": "1:29:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1245, "total_steps": 1680, "loss": 0.0559, "learning_rate": 1.906978420031059e-05, "epoch": 4.444444444444445, "percentage": 74.11, "elapsed_time": "4:12:24", "remaining_time": "1:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 1680, "loss": 0.0395, "learning_rate": 1.8663332715355396e-05, "epoch": 4.462293618920125, "percentage": 74.4, "elapsed_time": "4:13:20", "remaining_time": "1:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1255, "total_steps": 1680, "loss": 0.0681, "learning_rate": 1.8260263319713844e-05, "epoch": 4.480142793395806, "percentage": 74.7, "elapsed_time": "4:14:19", "remaining_time": "1:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 1680, "loss": 0.072, "learning_rate": 1.7860619515673033e-05, "epoch": 4.497991967871486, "percentage": 75.0, "elapsed_time": "4:15:17", "remaining_time": "1:25:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 1680, "eval_loss": 2.309265613555908, "epoch": 4.497991967871486, "percentage": 75.0, "elapsed_time": "4:15:35", "remaining_time": "1:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1265, "total_steps": 1680, "loss": 0.0614, "learning_rate": 1.746444443580433e-05, "epoch": 4.515841142347167, "percentage": 75.3, "elapsed_time": "4:16:37", "remaining_time": "1:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 1680, "loss": 0.0644, "learning_rate": 1.7071780838308288e-05, "epoch": 4.533690316822847, "percentage": 75.6, "elapsed_time": "4:17:37", "remaining_time": "1:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1275, "total_steps": 1680, "loss": 0.0678, "learning_rate": 1.6682671102399805e-05, "epoch": 4.551539491298527, "percentage": 75.89, "elapsed_time": "4:18:38", "remaining_time": "1:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 1680, "loss": 0.0474, "learning_rate": 1.629715722373423e-05, "epoch": 4.569388665774208, "percentage": 76.19, "elapsed_time": "4:19:38", "remaining_time": "1:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1285, "total_steps": 1680, "loss": 0.0813, "learning_rate": 1.5915280809874932e-05, "epoch": 4.587237840249888, "percentage": 76.49, "elapsed_time": "4:20:38", "remaining_time": "1:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 1680, "loss": 0.0483, "learning_rate": 1.553708307580265e-05, "epoch": 4.605087014725569, "percentage": 76.79, "elapsed_time": "4:21:37", "remaining_time": "1:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1295, "total_steps": 1680, "loss": 0.0644, "learning_rate": 1.5162604839467265e-05, "epoch": 4.6229361892012495, "percentage": 77.08, "elapsed_time": "4:22:36", "remaining_time": "1:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 1680, "loss": 0.0581, "learning_rate": 1.4791886517382413e-05, "epoch": 4.64078536367693, "percentage": 77.38, "elapsed_time": "4:23:37", "remaining_time": "1:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1305, "total_steps": 1680, "loss": 0.0569, "learning_rate": 1.4424968120263504e-05, "epoch": 4.658634538152611, "percentage": 77.68, "elapsed_time": "4:24:37", "remaining_time": "1:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 1680, "loss": 0.0645, "learning_rate": 1.4061889248709343e-05, "epoch": 4.676483712628291, "percentage": 77.98, "elapsed_time": "4:25:36", "remaining_time": "1:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1315, "total_steps": 1680, "loss": 0.0588, "learning_rate": 1.370268908892825e-05, "epoch": 4.694332887103972, "percentage": 78.27, "elapsed_time": "4:26:35", "remaining_time": "1:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 1680, "loss": 0.078, "learning_rate": 1.3347406408508695e-05, "epoch": 4.712182061579652, "percentage": 78.57, "elapsed_time": "4:27:35", "remaining_time": "1:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1325, "total_steps": 1680, "loss": 0.0948, "learning_rate": 1.2996079552235263e-05, "epoch": 4.730031236055332, "percentage": 78.87, "elapsed_time": "4:28:33", "remaining_time": "1:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 1680, "loss": 0.0351, "learning_rate": 1.264874643795021e-05, "epoch": 4.747880410531013, "percentage": 79.17, "elapsed_time": "4:29:32", "remaining_time": "1:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 1680, "eval_loss": 2.2220773696899414, "epoch": 4.747880410531013, "percentage": 79.17, "elapsed_time": "4:29:49", "remaining_time": "1:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1335, "total_steps": 1680, "loss": 0.031, "learning_rate": 1.230544455246101e-05, "epoch": 4.765729585006693, "percentage": 79.46, "elapsed_time": "4:30:50", "remaining_time": "1:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 1680, "loss": 0.0584, "learning_rate": 1.1966210947494583e-05, "epoch": 4.783578759482374, "percentage": 79.76, "elapsed_time": "4:31:50", "remaining_time": "1:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1345, "total_steps": 1680, "loss": 0.0633, "learning_rate": 1.1631082235698316e-05, "epoch": 4.801427933958054, "percentage": 80.06, "elapsed_time": "4:32:51", "remaining_time": "1:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 1680, "loss": 0.0485, "learning_rate": 1.130009458668863e-05, "epoch": 4.8192771084337345, "percentage": 80.36, "elapsed_time": "4:33:51", "remaining_time": "1:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1355, "total_steps": 1680, "loss": 0.0271, "learning_rate": 1.097328372314721e-05, "epoch": 4.8371262829094155, "percentage": 80.65, "elapsed_time": "4:34:49", "remaining_time": "1:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 1680, "loss": 0.0559, "learning_rate": 1.0650684916965559e-05, "epoch": 4.854975457385096, "percentage": 80.95, "elapsed_time": "4:35:49", "remaining_time": "1:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1365, "total_steps": 1680, "loss": 0.0582, "learning_rate": 1.0332332985438248e-05, "epoch": 4.872824631860777, "percentage": 81.25, "elapsed_time": "4:36:49", "remaining_time": "1:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 1680, "loss": 0.0965, "learning_rate": 1.0018262287505086e-05, "epoch": 4.890673806336457, "percentage": 81.55, "elapsed_time": "4:37:50", "remaining_time": "1:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1375, "total_steps": 1680, "loss": 0.0565, "learning_rate": 9.708506720042932e-06, "epoch": 4.908522980812138, "percentage": 81.85, "elapsed_time": "4:38:49", "remaining_time": "1:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 1680, "loss": 0.0542, "learning_rate": 9.403099714207175e-06, "epoch": 4.926372155287818, "percentage": 82.14, "elapsed_time": "4:39:48", "remaining_time": "1:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1385, "total_steps": 1680, "loss": 0.0856, "learning_rate": 9.102074231823727e-06, "epoch": 4.944221329763499, "percentage": 82.44, "elapsed_time": "4:40:49", "remaining_time": "0:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 1680, "loss": 0.0524, "learning_rate": 8.805462761831418e-06, "epoch": 4.962070504239179, "percentage": 82.74, "elapsed_time": "4:41:50", "remaining_time": "0:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1395, "total_steps": 1680, "loss": 0.0641, "learning_rate": 8.513297316775625e-06, "epoch": 4.979919678714859, "percentage": 83.04, "elapsed_time": "4:42:52", "remaining_time": "0:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 1680, "loss": 0.0644, "learning_rate": 8.225609429353187e-06, "epoch": 4.99776885319054, "percentage": 83.33, "elapsed_time": "4:43:53", "remaining_time": "0:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 1680, "eval_loss": 2.2804083824157715, "epoch": 4.99776885319054, "percentage": 83.33, "elapsed_time": "4:44:11", "remaining_time": "0:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1405, "total_steps": 1680, "loss": 0.0227, "learning_rate": 7.942430149009161e-06, "epoch": 5.01561802766622, "percentage": 83.63, "elapsed_time": "4:45:13", "remaining_time": "0:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 1680, "loss": 0.0175, "learning_rate": 7.663790038585793e-06, "epoch": 5.033467202141901, "percentage": 83.93, "elapsed_time": "4:46:12", "remaining_time": "0:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1415, "total_steps": 1680, "loss": 0.0161, "learning_rate": 7.389719171023857e-06, "epoch": 5.0513163766175815, "percentage": 84.23, "elapsed_time": "4:47:11", "remaining_time": "0:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 1680, "loss": 0.0268, "learning_rate": 7.1202471261170245e-06, "epoch": 5.069165551093262, "percentage": 84.52, "elapsed_time": "4:48:11", "remaining_time": "0:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1425, "total_steps": 1680, "loss": 0.0089, "learning_rate": 6.855402987319348e-06, "epoch": 5.087014725568943, "percentage": 84.82, "elapsed_time": "4:49:10", "remaining_time": "0:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 1680, "loss": 0.0178, "learning_rate": 6.595215338606397e-06, "epoch": 5.104863900044623, "percentage": 85.12, "elapsed_time": "4:50:10", "remaining_time": "0:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1435, "total_steps": 1680, "loss": 0.0132, "learning_rate": 6.339712261390213e-06, "epoch": 5.122713074520304, "percentage": 85.42, "elapsed_time": "4:51:09", "remaining_time": "0:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 1680, "loss": 0.0173, "learning_rate": 6.088921331488568e-06, "epoch": 5.140562248995984, "percentage": 85.71, "elapsed_time": "4:52:08", "remaining_time": "0:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1445, "total_steps": 1680, "loss": 0.0064, "learning_rate": 5.8428696161488215e-06, "epoch": 5.158411423471664, "percentage": 86.01, "elapsed_time": "4:53:07", "remaining_time": "0:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 1680, "loss": 0.021, "learning_rate": 5.601583671126531e-06, "epoch": 5.176260597947345, "percentage": 86.31, "elapsed_time": "4:54:06", "remaining_time": "0:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1455, "total_steps": 1680, "loss": 0.0508, "learning_rate": 5.365089537819434e-06, "epoch": 5.194109772423025, "percentage": 86.61, "elapsed_time": "4:55:06", "remaining_time": "0:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 1680, "loss": 0.0196, "learning_rate": 5.133412740456806e-06, "epoch": 5.211958946898706, "percentage": 86.9, "elapsed_time": "4:56:06", "remaining_time": "0:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1465, "total_steps": 1680, "loss": 0.0109, "learning_rate": 4.906578283344759e-06, "epoch": 5.229808121374386, "percentage": 87.2, "elapsed_time": "4:57:06", "remaining_time": "0:43:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 1680, "loss": 0.0257, "learning_rate": 4.684610648167503e-06, "epoch": 5.247657295850067, "percentage": 87.5, "elapsed_time": "4:58:06", "remaining_time": "0:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 1680, "eval_loss": 2.559340238571167, "epoch": 5.247657295850067, "percentage": 87.5, "elapsed_time": "4:58:23", "remaining_time": "0:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1475, "total_steps": 1680, "loss": 0.0159, "learning_rate": 4.467533791345191e-06, "epoch": 5.2655064703257475, "percentage": 87.8, "elapsed_time": "4:59:24", "remaining_time": "0:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 1680, "loss": 0.0117, "learning_rate": 4.255371141448272e-06, "epoch": 5.283355644801428, "percentage": 88.1, "elapsed_time": "5:00:23", "remaining_time": "0:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1485, "total_steps": 1680, "loss": 0.0092, "learning_rate": 4.048145596668967e-06, "epoch": 5.301204819277109, "percentage": 88.39, "elapsed_time": "5:01:21", "remaining_time": "0:39:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 1680, "loss": 0.0214, "learning_rate": 3.84587952234991e-06, "epoch": 5.319053993752789, "percentage": 88.69, "elapsed_time": "5:02:22", "remaining_time": "0:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1495, "total_steps": 1680, "loss": 0.0087, "learning_rate": 3.6485947485702832e-06, "epoch": 5.33690316822847, "percentage": 88.99, "elapsed_time": "5:03:20", "remaining_time": "0:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 1680, "loss": 0.0193, "learning_rate": 3.4563125677897932e-06, "epoch": 5.35475234270415, "percentage": 89.29, "elapsed_time": "5:04:19", "remaining_time": "0:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1505, "total_steps": 1680, "loss": 0.0181, "learning_rate": 3.269053732550581e-06, "epoch": 5.37260151717983, "percentage": 89.58, "elapsed_time": "5:05:18", "remaining_time": "0:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 1680, "loss": 0.0184, "learning_rate": 3.086838453237506e-06, "epoch": 5.390450691655511, "percentage": 89.88, "elapsed_time": "5:06:18", "remaining_time": "0:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1515, "total_steps": 1680, "loss": 0.0083, "learning_rate": 2.9096863958968268e-06, "epoch": 5.408299866131191, "percentage": 90.18, "elapsed_time": "5:07:15", "remaining_time": "0:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 1680, "loss": 0.0129, "learning_rate": 2.737616680113758e-06, "epoch": 5.426149040606872, "percentage": 90.48, "elapsed_time": "5:08:14", "remaining_time": "0:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1525, "total_steps": 1680, "loss": 0.0176, "learning_rate": 2.570647876948895e-06, "epoch": 5.443998215082552, "percentage": 90.77, "elapsed_time": "5:09:12", "remaining_time": "0:31:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 1680, "loss": 0.026, "learning_rate": 2.408798006933882e-06, "epoch": 5.461847389558233, "percentage": 91.07, "elapsed_time": "5:10:12", "remaining_time": "0:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1535, "total_steps": 1680, "loss": 0.0495, "learning_rate": 2.252084538126542e-06, "epoch": 5.4796965640339135, "percentage": 91.37, "elapsed_time": "5:11:13", "remaining_time": "0:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 1680, "loss": 0.0249, "learning_rate": 2.100524384225555e-06, "epoch": 5.497545738509594, "percentage": 91.67, "elapsed_time": "5:12:12", "remaining_time": "0:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 1680, "eval_loss": 2.6220109462738037, "epoch": 5.497545738509594, "percentage": 91.67, "elapsed_time": "5:12:29", "remaining_time": "0:28:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1545, "total_steps": 1680, "loss": 0.0197, "learning_rate": 1.9541339027450256e-06, "epoch": 5.515394912985275, "percentage": 91.96, "elapsed_time": "5:13:31", "remaining_time": "0:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 1680, "loss": 0.0154, "learning_rate": 1.8129288932490274e-06, "epoch": 5.533244087460955, "percentage": 92.26, "elapsed_time": "5:14:30", "remaining_time": "0:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1555, "total_steps": 1680, "loss": 0.0192, "learning_rate": 1.6769245956464396e-06, "epoch": 5.551093261936636, "percentage": 92.56, "elapsed_time": "5:15:31", "remaining_time": "0:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 1680, "loss": 0.0271, "learning_rate": 1.5461356885461075e-06, "epoch": 5.568942436412316, "percentage": 92.86, "elapsed_time": "5:16:33", "remaining_time": "0:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1565, "total_steps": 1680, "loss": 0.0128, "learning_rate": 1.4205762876726092e-06, "epoch": 5.586791610887996, "percentage": 93.15, "elapsed_time": "5:17:31", "remaining_time": "0:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 1680, "loss": 0.0167, "learning_rate": 1.3002599443428243e-06, "epoch": 5.604640785363677, "percentage": 93.45, "elapsed_time": "5:18:30", "remaining_time": "0:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1575, "total_steps": 1680, "loss": 0.0196, "learning_rate": 1.1851996440033319e-06, "epoch": 5.622489959839357, "percentage": 93.75, "elapsed_time": "5:19:31", "remaining_time": "0:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 1680, "loss": 0.0141, "learning_rate": 1.0754078048289374e-06, "epoch": 5.640339134315038, "percentage": 94.05, "elapsed_time": "5:20:31", "remaining_time": "0:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1585, "total_steps": 1680, "loss": 0.0289, "learning_rate": 9.708962763824048e-07, "epoch": 5.658188308790718, "percentage": 94.35, "elapsed_time": "5:21:32", "remaining_time": "0:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 1680, "loss": 0.0161, "learning_rate": 8.716763383355864e-07, "epoch": 5.6760374832663985, "percentage": 94.64, "elapsed_time": "5:22:31", "remaining_time": "0:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1595, "total_steps": 1680, "loss": 0.0133, "learning_rate": 7.777586992519959e-07, "epoch": 5.6938866577420795, "percentage": 94.94, "elapsed_time": "5:23:31", "remaining_time": "0:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 1680, "loss": 0.0272, "learning_rate": 6.891534954310885e-07, "epoch": 5.71173583221776, "percentage": 95.24, "elapsed_time": "5:24:32", "remaining_time": "0:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1605, "total_steps": 1680, "loss": 0.0084, "learning_rate": 6.058702898142643e-07, "epoch": 5.729585006693441, "percentage": 95.54, "elapsed_time": "5:25:32", "remaining_time": "0:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 1680, "loss": 0.0238, "learning_rate": 5.279180709527765e-07, "epoch": 5.747434181169121, "percentage": 95.83, "elapsed_time": "5:26:32", "remaining_time": "0:14:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 1680, "eval_loss": 2.618908643722534, "epoch": 5.747434181169121, "percentage": 95.83, "elapsed_time": "5:26:49", "remaining_time": "0:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1615, "total_steps": 1680, "loss": 0.0246, "learning_rate": 4.553052520375911e-07, "epoch": 5.765283355644802, "percentage": 96.13, "elapsed_time": "5:27:52", "remaining_time": "0:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1620, "total_steps": 1680, "loss": 0.0098, "learning_rate": 3.8803966999139684e-07, "epoch": 5.783132530120482, "percentage": 96.43, "elapsed_time": "5:28:50", "remaining_time": "0:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1625, "total_steps": 1680, "loss": 0.0179, "learning_rate": 3.261285846227868e-07, "epoch": 5.800981704596163, "percentage": 96.73, "elapsed_time": "5:29:50", "remaining_time": "0:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1630, "total_steps": 1680, "loss": 0.0139, "learning_rate": 2.6957867784270787e-07, "epoch": 5.818830879071843, "percentage": 97.02, "elapsed_time": "5:30:48", "remaining_time": "0:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1635, "total_steps": 1680, "loss": 0.0117, "learning_rate": 2.1839605294330933e-07, "epoch": 5.836680053547523, "percentage": 97.32, "elapsed_time": "5:31:47", "remaining_time": "0:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1640, "total_steps": 1680, "loss": 0.0191, "learning_rate": 1.725862339392259e-07, "epoch": 5.854529228023204, "percentage": 97.62, "elapsed_time": "5:32:46", "remaining_time": "0:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1645, "total_steps": 1680, "loss": 0.0147, "learning_rate": 1.3215416497138754e-07, "epoch": 5.872378402498884, "percentage": 97.92, "elapsed_time": "5:33:44", "remaining_time": "0:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 1680, "loss": 0.014, "learning_rate": 9.710420977340762e-08, "epoch": 5.890227576974565, "percentage": 98.21, "elapsed_time": "5:34:44", "remaining_time": "0:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1655, "total_steps": 1680, "loss": 0.0146, "learning_rate": 6.744015120061509e-08, "epoch": 5.9080767514502455, "percentage": 98.51, "elapsed_time": "5:35:44", "remaining_time": "0:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1660, "total_steps": 1680, "loss": 0.0223, "learning_rate": 4.316519082179227e-08, "epoch": 5.925925925925926, "percentage": 98.81, "elapsed_time": "5:36:45", "remaining_time": "0:04:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1665, "total_steps": 1680, "loss": 0.0112, "learning_rate": 2.4281948573617874e-08, "epoch": 5.943775100401607, "percentage": 99.11, "elapsed_time": "5:37:42", "remaining_time": "0:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1670, "total_steps": 1680, "loss": 0.0273, "learning_rate": 1.0792462477909882e-08, "epoch": 5.961624274877287, "percentage": 99.4, "elapsed_time": "5:38:42", "remaining_time": "0:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1675, "total_steps": 1680, "loss": 0.0282, "learning_rate": 2.6981884216847884e-09, "epoch": 5.979473449352968, "percentage": 99.7, "elapsed_time": "5:39:42", "remaining_time": "0:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 1680, "loss": 0.0262, "learning_rate": 0.0, "epoch": 5.997322623828648, "percentage": 100.0, "elapsed_time": "5:40:42", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 1680, "eval_loss": 2.630276679992676, "epoch": 5.997322623828648, "percentage": 100.0, "elapsed_time": "5:41:00", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 1680, "epoch": 5.997322623828648, "percentage": 100.0, "elapsed_time": "5:41:04", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}