llama-3-8b-instruct-laws / trainer_log.jsonl
Sayalik45's picture
Uploading model weights
4b301fd verified
raw
history blame
No virus
135 kB
{"current_steps": 10, "total_steps": 5463, "loss": 1.7028, "learning_rate": 9.140767824497258e-07, "epoch": 0.005489227391244683, "percentage": 0.18, "elapsed_time": "0:00:16", "remaining_time": "2:33:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 20, "total_steps": 5463, "loss": 1.6575, "learning_rate": 1.8281535648994516e-06, "epoch": 0.010978454782489365, "percentage": 0.37, "elapsed_time": "0:00:33", "remaining_time": "2:31:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 30, "total_steps": 5463, "loss": 1.3904, "learning_rate": 2.7422303473491773e-06, "epoch": 0.016467682173734045, "percentage": 0.55, "elapsed_time": "0:00:49", "remaining_time": "2:30:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 40, "total_steps": 5463, "loss": 1.2568, "learning_rate": 3.6563071297989032e-06, "epoch": 0.02195690956497873, "percentage": 0.73, "elapsed_time": "0:01:06", "remaining_time": "2:30:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 50, "total_steps": 5463, "loss": 1.2404, "learning_rate": 4.570383912248629e-06, "epoch": 0.027446136956223412, "percentage": 0.92, "elapsed_time": "0:01:22", "remaining_time": "2:29:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 60, "total_steps": 5463, "loss": 1.1597, "learning_rate": 5.484460694698355e-06, "epoch": 0.03293536434746809, "percentage": 1.1, "elapsed_time": "0:01:39", "remaining_time": "2:29:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 70, "total_steps": 5463, "loss": 1.1168, "learning_rate": 6.398537477148081e-06, "epoch": 0.03842459173871278, "percentage": 1.28, "elapsed_time": "0:01:56", "remaining_time": "2:29:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 80, "total_steps": 5463, "loss": 1.0531, "learning_rate": 7.3126142595978065e-06, "epoch": 0.04391381912995746, "percentage": 1.46, "elapsed_time": "0:02:12", "remaining_time": "2:28:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 90, "total_steps": 5463, "loss": 1.0974, "learning_rate": 8.226691042047533e-06, "epoch": 0.04940304652120214, "percentage": 1.65, "elapsed_time": "0:02:29", "remaining_time": "2:28:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 100, "total_steps": 5463, "loss": 1.0468, "learning_rate": 9.140767824497258e-06, "epoch": 0.054892273912446825, "percentage": 1.83, "elapsed_time": "0:02:45", "remaining_time": "2:28:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 110, "total_steps": 5463, "loss": 1.0481, "learning_rate": 1.0054844606946984e-05, "epoch": 0.06038150130369151, "percentage": 2.01, "elapsed_time": "0:03:02", "remaining_time": "2:27:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 120, "total_steps": 5463, "loss": 1.0444, "learning_rate": 1.096892138939671e-05, "epoch": 0.06587072869493618, "percentage": 2.2, "elapsed_time": "0:03:18", "remaining_time": "2:27:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 130, "total_steps": 5463, "loss": 1.005, "learning_rate": 1.1882998171846435e-05, "epoch": 0.07135995608618087, "percentage": 2.38, "elapsed_time": "0:03:35", "remaining_time": "2:27:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 140, "total_steps": 5463, "loss": 1.0538, "learning_rate": 1.2797074954296162e-05, "epoch": 0.07684918347742556, "percentage": 2.56, "elapsed_time": "0:03:51", "remaining_time": "2:26:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 150, "total_steps": 5463, "loss": 1.0122, "learning_rate": 1.3711151736745886e-05, "epoch": 0.08233841086867023, "percentage": 2.75, "elapsed_time": "0:04:08", "remaining_time": "2:26:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 160, "total_steps": 5463, "loss": 0.9613, "learning_rate": 1.4625228519195613e-05, "epoch": 0.08782763825991492, "percentage": 2.93, "elapsed_time": "0:04:24", "remaining_time": "2:26:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 170, "total_steps": 5463, "loss": 0.9637, "learning_rate": 1.553930530164534e-05, "epoch": 0.0933168656511596, "percentage": 3.11, "elapsed_time": "0:04:41", "remaining_time": "2:25:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 180, "total_steps": 5463, "loss": 0.9984, "learning_rate": 1.6453382084095066e-05, "epoch": 0.09880609304240429, "percentage": 3.29, "elapsed_time": "0:04:57", "remaining_time": "2:25:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 190, "total_steps": 5463, "loss": 0.9984, "learning_rate": 1.7367458866544793e-05, "epoch": 0.10429532043364896, "percentage": 3.48, "elapsed_time": "0:05:14", "remaining_time": "2:25:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 200, "total_steps": 5463, "loss": 0.949, "learning_rate": 1.8281535648994517e-05, "epoch": 0.10978454782489365, "percentage": 3.66, "elapsed_time": "0:05:30", "remaining_time": "2:25:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 210, "total_steps": 5463, "loss": 1.0031, "learning_rate": 1.9195612431444244e-05, "epoch": 0.11527377521613832, "percentage": 3.84, "elapsed_time": "0:05:47", "remaining_time": "2:24:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 220, "total_steps": 5463, "loss": 0.9751, "learning_rate": 2.0109689213893968e-05, "epoch": 0.12076300260738301, "percentage": 4.03, "elapsed_time": "0:06:04", "remaining_time": "2:24:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 230, "total_steps": 5463, "loss": 0.9564, "learning_rate": 2.1023765996343695e-05, "epoch": 0.1262522299986277, "percentage": 4.21, "elapsed_time": "0:06:21", "remaining_time": "2:24:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 240, "total_steps": 5463, "loss": 0.9182, "learning_rate": 2.193784277879342e-05, "epoch": 0.13174145738987236, "percentage": 4.39, "elapsed_time": "0:06:37", "remaining_time": "2:24:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 250, "total_steps": 5463, "loss": 0.9037, "learning_rate": 2.2851919561243146e-05, "epoch": 0.13723068478111705, "percentage": 4.58, "elapsed_time": "0:06:54", "remaining_time": "2:23:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 260, "total_steps": 5463, "loss": 0.9708, "learning_rate": 2.376599634369287e-05, "epoch": 0.14271991217236174, "percentage": 4.76, "elapsed_time": "0:07:10", "remaining_time": "2:23:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 270, "total_steps": 5463, "loss": 0.9611, "learning_rate": 2.4680073126142597e-05, "epoch": 0.14820913956360643, "percentage": 4.94, "elapsed_time": "0:07:27", "remaining_time": "2:23:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 280, "total_steps": 5463, "loss": 0.9872, "learning_rate": 2.5594149908592324e-05, "epoch": 0.15369836695485112, "percentage": 5.13, "elapsed_time": "0:07:43", "remaining_time": "2:23:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 290, "total_steps": 5463, "loss": 0.9, "learning_rate": 2.6508226691042048e-05, "epoch": 0.15918759434609578, "percentage": 5.31, "elapsed_time": "0:07:59", "remaining_time": "2:22:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 300, "total_steps": 5463, "loss": 0.8798, "learning_rate": 2.742230347349177e-05, "epoch": 0.16467682173734047, "percentage": 5.49, "elapsed_time": "0:08:16", "remaining_time": "2:22:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 310, "total_steps": 5463, "loss": 0.8962, "learning_rate": 2.8336380255941502e-05, "epoch": 0.17016604912858516, "percentage": 5.67, "elapsed_time": "0:08:33", "remaining_time": "2:22:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 320, "total_steps": 5463, "loss": 0.886, "learning_rate": 2.9250457038391226e-05, "epoch": 0.17565527651982984, "percentage": 5.86, "elapsed_time": "0:08:49", "remaining_time": "2:21:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 330, "total_steps": 5463, "loss": 0.8335, "learning_rate": 3.016453382084095e-05, "epoch": 0.1811445039110745, "percentage": 6.04, "elapsed_time": "0:09:06", "remaining_time": "2:21:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 340, "total_steps": 5463, "loss": 0.8946, "learning_rate": 3.107861060329068e-05, "epoch": 0.1866337313023192, "percentage": 6.22, "elapsed_time": "0:09:24", "remaining_time": "2:21:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 350, "total_steps": 5463, "loss": 0.9274, "learning_rate": 3.1992687385740404e-05, "epoch": 0.19212295869356388, "percentage": 6.41, "elapsed_time": "0:09:40", "remaining_time": "2:21:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 360, "total_steps": 5463, "loss": 0.8001, "learning_rate": 3.290676416819013e-05, "epoch": 0.19761218608480857, "percentage": 6.59, "elapsed_time": "0:09:57", "remaining_time": "2:21:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 370, "total_steps": 5463, "loss": 0.9036, "learning_rate": 3.382084095063985e-05, "epoch": 0.20310141347605323, "percentage": 6.77, "elapsed_time": "0:10:13", "remaining_time": "2:20:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 380, "total_steps": 5463, "loss": 0.8944, "learning_rate": 3.4734917733089586e-05, "epoch": 0.20859064086729792, "percentage": 6.96, "elapsed_time": "0:10:30", "remaining_time": "2:20:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 390, "total_steps": 5463, "loss": 0.8581, "learning_rate": 3.5648994515539306e-05, "epoch": 0.2140798682585426, "percentage": 7.14, "elapsed_time": "0:10:46", "remaining_time": "2:20:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 400, "total_steps": 5463, "loss": 0.8412, "learning_rate": 3.656307129798903e-05, "epoch": 0.2195690956497873, "percentage": 7.32, "elapsed_time": "0:11:03", "remaining_time": "2:19:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 410, "total_steps": 5463, "loss": 0.9105, "learning_rate": 3.7477148080438754e-05, "epoch": 0.225058323041032, "percentage": 7.51, "elapsed_time": "0:11:19", "remaining_time": "2:19:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 420, "total_steps": 5463, "loss": 0.9217, "learning_rate": 3.839122486288849e-05, "epoch": 0.23054755043227665, "percentage": 7.69, "elapsed_time": "0:11:36", "remaining_time": "2:19:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 430, "total_steps": 5463, "loss": 0.9259, "learning_rate": 3.930530164533821e-05, "epoch": 0.23603677782352134, "percentage": 7.87, "elapsed_time": "0:11:52", "remaining_time": "2:18:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 440, "total_steps": 5463, "loss": 0.8857, "learning_rate": 4.0219378427787935e-05, "epoch": 0.24152600521476603, "percentage": 8.05, "elapsed_time": "0:12:09", "remaining_time": "2:18:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 450, "total_steps": 5463, "loss": 0.8754, "learning_rate": 4.113345521023766e-05, "epoch": 0.24701523260601072, "percentage": 8.24, "elapsed_time": "0:12:25", "remaining_time": "2:18:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 460, "total_steps": 5463, "loss": 0.8769, "learning_rate": 4.204753199268739e-05, "epoch": 0.2525044599972554, "percentage": 8.42, "elapsed_time": "0:12:42", "remaining_time": "2:18:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 470, "total_steps": 5463, "loss": 0.8992, "learning_rate": 4.296160877513711e-05, "epoch": 0.2579936873885001, "percentage": 8.6, "elapsed_time": "0:12:58", "remaining_time": "2:17:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 480, "total_steps": 5463, "loss": 0.8918, "learning_rate": 4.387568555758684e-05, "epoch": 0.2634829147797447, "percentage": 8.79, "elapsed_time": "0:13:15", "remaining_time": "2:17:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 490, "total_steps": 5463, "loss": 0.8167, "learning_rate": 4.4789762340036564e-05, "epoch": 0.2689721421709894, "percentage": 8.97, "elapsed_time": "0:13:31", "remaining_time": "2:17:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 500, "total_steps": 5463, "loss": 0.8888, "learning_rate": 4.570383912248629e-05, "epoch": 0.2744613695622341, "percentage": 9.15, "elapsed_time": "0:13:48", "remaining_time": "2:16:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 510, "total_steps": 5463, "loss": 0.8296, "learning_rate": 4.661791590493602e-05, "epoch": 0.2799505969534788, "percentage": 9.34, "elapsed_time": "0:14:04", "remaining_time": "2:16:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 520, "total_steps": 5463, "loss": 0.8703, "learning_rate": 4.753199268738574e-05, "epoch": 0.2854398243447235, "percentage": 9.52, "elapsed_time": "0:14:21", "remaining_time": "2:16:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 530, "total_steps": 5463, "loss": 0.9081, "learning_rate": 4.844606946983547e-05, "epoch": 0.29092905173596817, "percentage": 9.7, "elapsed_time": "0:14:37", "remaining_time": "2:16:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 540, "total_steps": 5463, "loss": 0.9165, "learning_rate": 4.936014625228519e-05, "epoch": 0.29641827912721286, "percentage": 9.88, "elapsed_time": "0:14:54", "remaining_time": "2:15:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 550, "total_steps": 5463, "loss": 0.8977, "learning_rate": 4.999995405604411e-05, "epoch": 0.30190750651845755, "percentage": 10.07, "elapsed_time": "0:15:10", "remaining_time": "2:15:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 560, "total_steps": 5463, "loss": 0.8527, "learning_rate": 4.999913727930364e-05, "epoch": 0.30739673390970224, "percentage": 10.25, "elapsed_time": "0:15:27", "remaining_time": "2:15:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 570, "total_steps": 5463, "loss": 0.8716, "learning_rate": 4.999729956415998e-05, "epoch": 0.31288596130094687, "percentage": 10.43, "elapsed_time": "0:15:43", "remaining_time": "2:15:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 580, "total_steps": 5463, "loss": 0.8402, "learning_rate": 4.9994440985663475e-05, "epoch": 0.31837518869219156, "percentage": 10.62, "elapsed_time": "0:16:00", "remaining_time": "2:14:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 590, "total_steps": 5463, "loss": 0.8629, "learning_rate": 4.9990561660555454e-05, "epoch": 0.32386441608343625, "percentage": 10.8, "elapsed_time": "0:16:17", "remaining_time": "2:14:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 600, "total_steps": 5463, "loss": 0.7973, "learning_rate": 4.998566174726347e-05, "epoch": 0.32935364347468093, "percentage": 10.98, "elapsed_time": "0:16:34", "remaining_time": "2:14:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 610, "total_steps": 5463, "loss": 0.8956, "learning_rate": 4.997974144589481e-05, "epoch": 0.3348428708659256, "percentage": 11.17, "elapsed_time": "0:16:50", "remaining_time": "2:14:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 620, "total_steps": 5463, "loss": 0.794, "learning_rate": 4.997280099822833e-05, "epoch": 0.3403320982571703, "percentage": 11.35, "elapsed_time": "0:17:07", "remaining_time": "2:13:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 630, "total_steps": 5463, "loss": 0.7641, "learning_rate": 4.996484068770461e-05, "epoch": 0.345821325648415, "percentage": 11.53, "elapsed_time": "0:17:24", "remaining_time": "2:13:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 640, "total_steps": 5463, "loss": 0.8582, "learning_rate": 4.9955860839414324e-05, "epoch": 0.3513105530396597, "percentage": 11.72, "elapsed_time": "0:17:40", "remaining_time": "2:13:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 650, "total_steps": 5463, "loss": 0.8087, "learning_rate": 4.994586182008501e-05, "epoch": 0.3567997804309043, "percentage": 11.9, "elapsed_time": "0:17:57", "remaining_time": "2:12:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 660, "total_steps": 5463, "loss": 0.8814, "learning_rate": 4.993484403806609e-05, "epoch": 0.362289007822149, "percentage": 12.08, "elapsed_time": "0:18:13", "remaining_time": "2:12:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 670, "total_steps": 5463, "loss": 0.8039, "learning_rate": 4.9922807943312135e-05, "epoch": 0.3677782352133937, "percentage": 12.26, "elapsed_time": "0:18:30", "remaining_time": "2:12:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 680, "total_steps": 5463, "loss": 0.8411, "learning_rate": 4.990975402736457e-05, "epoch": 0.3732674626046384, "percentage": 12.45, "elapsed_time": "0:18:46", "remaining_time": "2:12:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 690, "total_steps": 5463, "loss": 0.7838, "learning_rate": 4.9895682823331564e-05, "epoch": 0.3787566899958831, "percentage": 12.63, "elapsed_time": "0:19:03", "remaining_time": "2:11:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 700, "total_steps": 5463, "loss": 0.7802, "learning_rate": 4.988059490586624e-05, "epoch": 0.38424591738712777, "percentage": 12.81, "elapsed_time": "0:19:19", "remaining_time": "2:11:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 710, "total_steps": 5463, "loss": 0.8049, "learning_rate": 4.986449089114325e-05, "epoch": 0.38973514477837246, "percentage": 13.0, "elapsed_time": "0:19:36", "remaining_time": "2:11:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 720, "total_steps": 5463, "loss": 0.864, "learning_rate": 4.984737143683356e-05, "epoch": 0.39522437216961714, "percentage": 13.18, "elapsed_time": "0:19:53", "remaining_time": "2:10:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 730, "total_steps": 5463, "loss": 0.8222, "learning_rate": 4.982923724207764e-05, "epoch": 0.40071359956086183, "percentage": 13.36, "elapsed_time": "0:20:09", "remaining_time": "2:10:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 740, "total_steps": 5463, "loss": 0.7757, "learning_rate": 4.9810089047456873e-05, "epoch": 0.40620282695210647, "percentage": 13.55, "elapsed_time": "0:20:26", "remaining_time": "2:10:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 750, "total_steps": 5463, "loss": 0.7693, "learning_rate": 4.978992763496334e-05, "epoch": 0.41169205434335115, "percentage": 13.73, "elapsed_time": "0:20:42", "remaining_time": "2:10:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 760, "total_steps": 5463, "loss": 0.7927, "learning_rate": 4.976875382796786e-05, "epoch": 0.41718128173459584, "percentage": 13.91, "elapsed_time": "0:20:59", "remaining_time": "2:09:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 770, "total_steps": 5463, "loss": 0.7997, "learning_rate": 4.974656849118638e-05, "epoch": 0.42267050912584053, "percentage": 14.09, "elapsed_time": "0:21:15", "remaining_time": "2:09:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 780, "total_steps": 5463, "loss": 0.7719, "learning_rate": 4.972337253064466e-05, "epoch": 0.4281597365170852, "percentage": 14.28, "elapsed_time": "0:21:32", "remaining_time": "2:09:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 790, "total_steps": 5463, "loss": 0.8203, "learning_rate": 4.969916689364128e-05, "epoch": 0.4336489639083299, "percentage": 14.46, "elapsed_time": "0:21:48", "remaining_time": "2:09:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 800, "total_steps": 5463, "loss": 0.8303, "learning_rate": 4.9673952568708906e-05, "epoch": 0.4391381912995746, "percentage": 14.64, "elapsed_time": "0:22:05", "remaining_time": "2:08:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 810, "total_steps": 5463, "loss": 0.8693, "learning_rate": 4.964773058557399e-05, "epoch": 0.4446274186908193, "percentage": 14.83, "elapsed_time": "0:22:21", "remaining_time": "2:08:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 820, "total_steps": 5463, "loss": 0.7929, "learning_rate": 4.9620502015114675e-05, "epoch": 0.450116646082064, "percentage": 15.01, "elapsed_time": "0:22:38", "remaining_time": "2:08:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 830, "total_steps": 5463, "loss": 0.8393, "learning_rate": 4.959226796931706e-05, "epoch": 0.4556058734733086, "percentage": 15.19, "elapsed_time": "0:22:54", "remaining_time": "2:07:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 840, "total_steps": 5463, "loss": 0.8195, "learning_rate": 4.95630296012298e-05, "epoch": 0.4610951008645533, "percentage": 15.38, "elapsed_time": "0:23:11", "remaining_time": "2:07:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 850, "total_steps": 5463, "loss": 0.8157, "learning_rate": 4.953278810491701e-05, "epoch": 0.466584328255798, "percentage": 15.56, "elapsed_time": "0:23:27", "remaining_time": "2:07:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 860, "total_steps": 5463, "loss": 0.7932, "learning_rate": 4.950154471540951e-05, "epoch": 0.4720735556470427, "percentage": 15.74, "elapsed_time": "0:23:44", "remaining_time": "2:07:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 870, "total_steps": 5463, "loss": 0.7741, "learning_rate": 4.9469300708654385e-05, "epoch": 0.47756278303828736, "percentage": 15.93, "elapsed_time": "0:24:00", "remaining_time": "2:06:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 880, "total_steps": 5463, "loss": 0.8406, "learning_rate": 4.943605740146286e-05, "epoch": 0.48305201042953205, "percentage": 16.11, "elapsed_time": "0:24:17", "remaining_time": "2:06:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 890, "total_steps": 5463, "loss": 0.7731, "learning_rate": 4.940181615145655e-05, "epoch": 0.48854123782077674, "percentage": 16.29, "elapsed_time": "0:24:33", "remaining_time": "2:06:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 900, "total_steps": 5463, "loss": 0.7903, "learning_rate": 4.936657835701198e-05, "epoch": 0.49403046521202143, "percentage": 16.47, "elapsed_time": "0:24:50", "remaining_time": "2:05:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 910, "total_steps": 5463, "loss": 0.7601, "learning_rate": 4.933034545720354e-05, "epoch": 0.49951969260326606, "percentage": 16.66, "elapsed_time": "0:25:06", "remaining_time": "2:05:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 920, "total_steps": 5463, "loss": 0.8246, "learning_rate": 4.9293118931744624e-05, "epoch": 0.5050089199945108, "percentage": 16.84, "elapsed_time": "0:25:23", "remaining_time": "2:05:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 930, "total_steps": 5463, "loss": 0.7729, "learning_rate": 4.925490030092729e-05, "epoch": 0.5104981473857555, "percentage": 17.02, "elapsed_time": "0:25:39", "remaining_time": "2:05:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 940, "total_steps": 5463, "loss": 0.7711, "learning_rate": 4.9215691125560104e-05, "epoch": 0.5159873747770002, "percentage": 17.21, "elapsed_time": "0:25:56", "remaining_time": "2:04:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 950, "total_steps": 5463, "loss": 0.7897, "learning_rate": 4.917549300690445e-05, "epoch": 0.5214766021682449, "percentage": 17.39, "elapsed_time": "0:26:14", "remaining_time": "2:04:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 960, "total_steps": 5463, "loss": 0.7356, "learning_rate": 4.9134307586609104e-05, "epoch": 0.5269658295594895, "percentage": 17.57, "elapsed_time": "0:26:30", "remaining_time": "2:04:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 970, "total_steps": 5463, "loss": 0.7599, "learning_rate": 4.9092136546643184e-05, "epoch": 0.5324550569507341, "percentage": 17.76, "elapsed_time": "0:26:47", "remaining_time": "2:04:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 980, "total_steps": 5463, "loss": 0.7572, "learning_rate": 4.9048981609227504e-05, "epoch": 0.5379442843419788, "percentage": 17.94, "elapsed_time": "0:27:03", "remaining_time": "2:03:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 990, "total_steps": 5463, "loss": 0.7726, "learning_rate": 4.9004844536764185e-05, "epoch": 0.5434335117332235, "percentage": 18.12, "elapsed_time": "0:27:20", "remaining_time": "2:03:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1000, "total_steps": 5463, "loss": 0.7772, "learning_rate": 4.8959727131764735e-05, "epoch": 0.5489227391244682, "percentage": 18.3, "elapsed_time": "0:27:36", "remaining_time": "2:03:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1010, "total_steps": 5463, "loss": 0.7954, "learning_rate": 4.891363123677638e-05, "epoch": 0.5544119665157129, "percentage": 18.49, "elapsed_time": "0:27:55", "remaining_time": "2:03:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1020, "total_steps": 5463, "loss": 0.759, "learning_rate": 4.886655873430687e-05, "epoch": 0.5599011939069576, "percentage": 18.67, "elapsed_time": "0:28:12", "remaining_time": "2:02:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1030, "total_steps": 5463, "loss": 0.675, "learning_rate": 4.881851154674757e-05, "epoch": 0.5653904212982023, "percentage": 18.85, "elapsed_time": "0:28:28", "remaining_time": "2:02:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1040, "total_steps": 5463, "loss": 0.8194, "learning_rate": 4.876949163629494e-05, "epoch": 0.570879648689447, "percentage": 19.04, "elapsed_time": "0:28:44", "remaining_time": "2:02:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1050, "total_steps": 5463, "loss": 0.7587, "learning_rate": 4.871950100487043e-05, "epoch": 0.5763688760806917, "percentage": 19.22, "elapsed_time": "0:29:01", "remaining_time": "2:01:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1060, "total_steps": 5463, "loss": 0.6909, "learning_rate": 4.866854169403871e-05, "epoch": 0.5818581034719363, "percentage": 19.4, "elapsed_time": "0:29:17", "remaining_time": "2:01:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1070, "total_steps": 5463, "loss": 0.7907, "learning_rate": 4.861661578492429e-05, "epoch": 0.587347330863181, "percentage": 19.59, "elapsed_time": "0:29:34", "remaining_time": "2:01:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1080, "total_steps": 5463, "loss": 0.7512, "learning_rate": 4.856372539812655e-05, "epoch": 0.5928365582544257, "percentage": 19.77, "elapsed_time": "0:29:50", "remaining_time": "2:01:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1090, "total_steps": 5463, "loss": 0.7171, "learning_rate": 4.850987269363311e-05, "epoch": 0.5983257856456704, "percentage": 19.95, "elapsed_time": "0:30:06", "remaining_time": "2:00:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1100, "total_steps": 5463, "loss": 0.763, "learning_rate": 4.845505987073161e-05, "epoch": 0.6038150130369151, "percentage": 20.14, "elapsed_time": "0:30:23", "remaining_time": "2:00:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1110, "total_steps": 5463, "loss": 0.7513, "learning_rate": 4.839928916791996e-05, "epoch": 0.6093042404281598, "percentage": 20.32, "elapsed_time": "0:30:39", "remaining_time": "2:00:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1120, "total_steps": 5463, "loss": 0.6982, "learning_rate": 4.834256286281482e-05, "epoch": 0.6147934678194045, "percentage": 20.5, "elapsed_time": "0:30:56", "remaining_time": "1:59:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1130, "total_steps": 5463, "loss": 0.8051, "learning_rate": 4.82848832720587e-05, "epoch": 0.620282695210649, "percentage": 20.68, "elapsed_time": "0:31:12", "remaining_time": "1:59:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1140, "total_steps": 5463, "loss": 0.7914, "learning_rate": 4.8226252751225245e-05, "epoch": 0.6257719226018937, "percentage": 20.87, "elapsed_time": "0:31:28", "remaining_time": "1:59:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1150, "total_steps": 5463, "loss": 0.7705, "learning_rate": 4.816667369472309e-05, "epoch": 0.6312611499931384, "percentage": 21.05, "elapsed_time": "0:31:44", "remaining_time": "1:59:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1160, "total_steps": 5463, "loss": 0.7916, "learning_rate": 4.810614853569807e-05, "epoch": 0.6367503773843831, "percentage": 21.23, "elapsed_time": "0:32:01", "remaining_time": "1:58:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1170, "total_steps": 5463, "loss": 0.7628, "learning_rate": 4.804467974593387e-05, "epoch": 0.6422396047756278, "percentage": 21.42, "elapsed_time": "0:32:17", "remaining_time": "1:58:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1180, "total_steps": 5463, "loss": 0.7393, "learning_rate": 4.798226983575103e-05, "epoch": 0.6477288321668725, "percentage": 21.6, "elapsed_time": "0:32:33", "remaining_time": "1:58:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1190, "total_steps": 5463, "loss": 0.7251, "learning_rate": 4.7918921353904464e-05, "epoch": 0.6532180595581172, "percentage": 21.78, "elapsed_time": "0:32:50", "remaining_time": "1:57:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1200, "total_steps": 5463, "loss": 0.7329, "learning_rate": 4.785463688747937e-05, "epoch": 0.6587072869493619, "percentage": 21.97, "elapsed_time": "0:33:06", "remaining_time": "1:57:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1210, "total_steps": 5463, "loss": 0.6967, "learning_rate": 4.778941906178556e-05, "epoch": 0.6641965143406066, "percentage": 22.15, "elapsed_time": "0:33:22", "remaining_time": "1:57:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1220, "total_steps": 5463, "loss": 0.7221, "learning_rate": 4.772327054025027e-05, "epoch": 0.6696857417318512, "percentage": 22.33, "elapsed_time": "0:33:38", "remaining_time": "1:57:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1230, "total_steps": 5463, "loss": 0.6925, "learning_rate": 4.765619402430934e-05, "epoch": 0.6751749691230959, "percentage": 22.52, "elapsed_time": "0:33:55", "remaining_time": "1:56:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1240, "total_steps": 5463, "loss": 0.7373, "learning_rate": 4.758819225329696e-05, "epoch": 0.6806641965143406, "percentage": 22.7, "elapsed_time": "0:34:11", "remaining_time": "1:56:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1250, "total_steps": 5463, "loss": 0.7348, "learning_rate": 4.751926800433374e-05, "epoch": 0.6861534239055853, "percentage": 22.88, "elapsed_time": "0:34:28", "remaining_time": "1:56:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1260, "total_steps": 5463, "loss": 0.7121, "learning_rate": 4.744942409221333e-05, "epoch": 0.69164265129683, "percentage": 23.06, "elapsed_time": "0:34:44", "remaining_time": "1:55:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1270, "total_steps": 5463, "loss": 0.6728, "learning_rate": 4.7378663369287445e-05, "epoch": 0.6971318786880747, "percentage": 23.25, "elapsed_time": "0:35:00", "remaining_time": "1:55:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1280, "total_steps": 5463, "loss": 0.7617, "learning_rate": 4.730698872534938e-05, "epoch": 0.7026211060793194, "percentage": 23.43, "elapsed_time": "0:35:17", "remaining_time": "1:55:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1290, "total_steps": 5463, "loss": 0.6887, "learning_rate": 4.723440308751601e-05, "epoch": 0.7081103334705641, "percentage": 23.61, "elapsed_time": "0:35:33", "remaining_time": "1:55:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1300, "total_steps": 5463, "loss": 0.752, "learning_rate": 4.716090942010823e-05, "epoch": 0.7135995608618086, "percentage": 23.8, "elapsed_time": "0:35:49", "remaining_time": "1:54:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1310, "total_steps": 5463, "loss": 0.7336, "learning_rate": 4.708651072452993e-05, "epoch": 0.7190887882530533, "percentage": 23.98, "elapsed_time": "0:36:07", "remaining_time": "1:54:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1320, "total_steps": 5463, "loss": 0.7333, "learning_rate": 4.701121003914537e-05, "epoch": 0.724578015644298, "percentage": 24.16, "elapsed_time": "0:36:24", "remaining_time": "1:54:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1330, "total_steps": 5463, "loss": 0.7648, "learning_rate": 4.693501043915514e-05, "epoch": 0.7300672430355427, "percentage": 24.35, "elapsed_time": "0:36:43", "remaining_time": "1:54:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1340, "total_steps": 5463, "loss": 0.787, "learning_rate": 4.685791503647052e-05, "epoch": 0.7355564704267874, "percentage": 24.53, "elapsed_time": "0:37:02", "remaining_time": "1:53:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1350, "total_steps": 5463, "loss": 0.7212, "learning_rate": 4.6779926979586475e-05, "epoch": 0.7410456978180321, "percentage": 24.71, "elapsed_time": "0:37:21", "remaining_time": "1:53:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1360, "total_steps": 5463, "loss": 0.7175, "learning_rate": 4.6701049453453e-05, "epoch": 0.7465349252092768, "percentage": 24.89, "elapsed_time": "0:37:41", "remaining_time": "1:53:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1370, "total_steps": 5463, "loss": 0.7133, "learning_rate": 4.662128567934509e-05, "epoch": 0.7520241526005215, "percentage": 25.08, "elapsed_time": "0:38:00", "remaining_time": "1:53:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1380, "total_steps": 5463, "loss": 0.6978, "learning_rate": 4.654063891473115e-05, "epoch": 0.7575133799917662, "percentage": 25.26, "elapsed_time": "0:38:19", "remaining_time": "1:53:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1390, "total_steps": 5463, "loss": 0.7019, "learning_rate": 4.645911245314e-05, "epoch": 0.7630026073830108, "percentage": 25.44, "elapsed_time": "0:38:38", "remaining_time": "1:53:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1400, "total_steps": 5463, "loss": 0.7483, "learning_rate": 4.637670962402636e-05, "epoch": 0.7684918347742555, "percentage": 25.63, "elapsed_time": "0:38:56", "remaining_time": "1:53:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1410, "total_steps": 5463, "loss": 0.7208, "learning_rate": 4.629343379263487e-05, "epoch": 0.7739810621655002, "percentage": 25.81, "elapsed_time": "0:39:14", "remaining_time": "1:52:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1420, "total_steps": 5463, "loss": 0.7733, "learning_rate": 4.620928835986267e-05, "epoch": 0.7794702895567449, "percentage": 25.99, "elapsed_time": "0:39:30", "remaining_time": "1:52:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1430, "total_steps": 5463, "loss": 0.7111, "learning_rate": 4.6124276762120485e-05, "epoch": 0.7849595169479896, "percentage": 26.18, "elapsed_time": "0:39:47", "remaining_time": "1:52:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1440, "total_steps": 5463, "loss": 0.6663, "learning_rate": 4.603840247119233e-05, "epoch": 0.7904487443392343, "percentage": 26.36, "elapsed_time": "0:40:04", "remaining_time": "1:51:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1450, "total_steps": 5463, "loss": 0.7692, "learning_rate": 4.595166899409368e-05, "epoch": 0.795937971730479, "percentage": 26.54, "elapsed_time": "0:40:20", "remaining_time": "1:51:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1460, "total_steps": 5463, "loss": 0.7305, "learning_rate": 4.5864079872928265e-05, "epoch": 0.8014271991217237, "percentage": 26.73, "elapsed_time": "0:40:37", "remaining_time": "1:51:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1470, "total_steps": 5463, "loss": 0.6875, "learning_rate": 4.577563868474344e-05, "epoch": 0.8069164265129684, "percentage": 26.91, "elapsed_time": "0:40:53", "remaining_time": "1:51:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1480, "total_steps": 5463, "loss": 0.6849, "learning_rate": 4.5686349041384055e-05, "epoch": 0.8124056539042129, "percentage": 27.09, "elapsed_time": "0:41:10", "remaining_time": "1:50:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1490, "total_steps": 5463, "loss": 0.6506, "learning_rate": 4.559621458934498e-05, "epoch": 0.8178948812954576, "percentage": 27.27, "elapsed_time": "0:41:26", "remaining_time": "1:50:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1500, "total_steps": 5463, "loss": 0.704, "learning_rate": 4.550523900962219e-05, "epoch": 0.8233841086867023, "percentage": 27.46, "elapsed_time": "0:41:43", "remaining_time": "1:50:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1510, "total_steps": 5463, "loss": 0.6988, "learning_rate": 4.541342601756242e-05, "epoch": 0.828873336077947, "percentage": 27.64, "elapsed_time": "0:41:59", "remaining_time": "1:49:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1520, "total_steps": 5463, "loss": 0.705, "learning_rate": 4.532077936271144e-05, "epoch": 0.8343625634691917, "percentage": 27.82, "elapsed_time": "0:42:16", "remaining_time": "1:49:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1530, "total_steps": 5463, "loss": 0.6801, "learning_rate": 4.522730282866093e-05, "epoch": 0.8398517908604364, "percentage": 28.01, "elapsed_time": "0:42:32", "remaining_time": "1:49:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1540, "total_steps": 5463, "loss": 0.6308, "learning_rate": 4.513300023289397e-05, "epoch": 0.8453410182516811, "percentage": 28.19, "elapsed_time": "0:42:49", "remaining_time": "1:49:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1550, "total_steps": 5463, "loss": 0.6731, "learning_rate": 4.503787542662912e-05, "epoch": 0.8508302456429258, "percentage": 28.37, "elapsed_time": "0:43:06", "remaining_time": "1:48:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1560, "total_steps": 5463, "loss": 0.7404, "learning_rate": 4.494193229466314e-05, "epoch": 0.8563194730341704, "percentage": 28.56, "elapsed_time": "0:43:22", "remaining_time": "1:48:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1570, "total_steps": 5463, "loss": 0.6884, "learning_rate": 4.4845174755212385e-05, "epoch": 0.8618087004254151, "percentage": 28.74, "elapsed_time": "0:43:39", "remaining_time": "1:48:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1580, "total_steps": 5463, "loss": 0.6947, "learning_rate": 4.47476067597527e-05, "epoch": 0.8672979278166598, "percentage": 28.92, "elapsed_time": "0:43:55", "remaining_time": "1:47:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1590, "total_steps": 5463, "loss": 0.6982, "learning_rate": 4.464923229285816e-05, "epoch": 0.8727871552079045, "percentage": 29.1, "elapsed_time": "0:44:12", "remaining_time": "1:47:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1600, "total_steps": 5463, "loss": 0.7124, "learning_rate": 4.4550055372038225e-05, "epoch": 0.8782763825991492, "percentage": 29.29, "elapsed_time": "0:44:28", "remaining_time": "1:47:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1610, "total_steps": 5463, "loss": 0.6771, "learning_rate": 4.445008004757376e-05, "epoch": 0.8837656099903939, "percentage": 29.47, "elapsed_time": "0:44:45", "remaining_time": "1:47:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1620, "total_steps": 5463, "loss": 0.6272, "learning_rate": 4.434931040235159e-05, "epoch": 0.8892548373816386, "percentage": 29.65, "elapsed_time": "0:45:01", "remaining_time": "1:46:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1630, "total_steps": 5463, "loss": 0.6477, "learning_rate": 4.4247750551697756e-05, "epoch": 0.8947440647728833, "percentage": 29.84, "elapsed_time": "0:45:18", "remaining_time": "1:46:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1640, "total_steps": 5463, "loss": 0.7128, "learning_rate": 4.414540464320945e-05, "epoch": 0.900233292164128, "percentage": 30.02, "elapsed_time": "0:45:34", "remaining_time": "1:46:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1650, "total_steps": 5463, "loss": 0.7098, "learning_rate": 4.404227685658565e-05, "epoch": 0.9057225195553725, "percentage": 30.2, "elapsed_time": "0:45:51", "remaining_time": "1:45:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1660, "total_steps": 5463, "loss": 0.6926, "learning_rate": 4.39383714034564e-05, "epoch": 0.9112117469466172, "percentage": 30.39, "elapsed_time": "0:46:08", "remaining_time": "1:45:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1670, "total_steps": 5463, "loss": 0.6398, "learning_rate": 4.383369252721084e-05, "epoch": 0.9167009743378619, "percentage": 30.57, "elapsed_time": "0:46:25", "remaining_time": "1:45:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1680, "total_steps": 5463, "loss": 0.7087, "learning_rate": 4.372824450282388e-05, "epoch": 0.9221902017291066, "percentage": 30.75, "elapsed_time": "0:46:42", "remaining_time": "1:45:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1690, "total_steps": 5463, "loss": 0.6764, "learning_rate": 4.362203163668164e-05, "epoch": 0.9276794291203513, "percentage": 30.94, "elapsed_time": "0:46:58", "remaining_time": "1:44:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1700, "total_steps": 5463, "loss": 0.6969, "learning_rate": 4.351505826640555e-05, "epoch": 0.933168656511596, "percentage": 31.12, "elapsed_time": "0:47:15", "remaining_time": "1:44:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1710, "total_steps": 5463, "loss": 0.672, "learning_rate": 4.3407328760675245e-05, "epoch": 0.9386578839028407, "percentage": 31.3, "elapsed_time": "0:47:32", "remaining_time": "1:44:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1720, "total_steps": 5463, "loss": 0.6586, "learning_rate": 4.329884751905014e-05, "epoch": 0.9441471112940854, "percentage": 31.48, "elapsed_time": "0:47:48", "remaining_time": "1:44:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1730, "total_steps": 5463, "loss": 0.6601, "learning_rate": 4.3189618971789747e-05, "epoch": 0.94963633868533, "percentage": 31.67, "elapsed_time": "0:48:05", "remaining_time": "1:43:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1740, "total_steps": 5463, "loss": 0.7042, "learning_rate": 4.307964757967273e-05, "epoch": 0.9551255660765747, "percentage": 31.85, "elapsed_time": "0:48:21", "remaining_time": "1:43:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1750, "total_steps": 5463, "loss": 0.6573, "learning_rate": 4.2968937833814784e-05, "epoch": 0.9606147934678194, "percentage": 32.03, "elapsed_time": "0:48:38", "remaining_time": "1:43:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1760, "total_steps": 5463, "loss": 0.619, "learning_rate": 4.285749425548518e-05, "epoch": 0.9661040208590641, "percentage": 32.22, "elapsed_time": "0:48:54", "remaining_time": "1:42:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1770, "total_steps": 5463, "loss": 0.6601, "learning_rate": 4.274532139592211e-05, "epoch": 0.9715932482503088, "percentage": 32.4, "elapsed_time": "0:49:11", "remaining_time": "1:42:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1780, "total_steps": 5463, "loss": 0.6449, "learning_rate": 4.2632423836146885e-05, "epoch": 0.9770824756415535, "percentage": 32.58, "elapsed_time": "0:49:28", "remaining_time": "1:42:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1790, "total_steps": 5463, "loss": 0.6404, "learning_rate": 4.251880618677678e-05, "epoch": 0.9825717030327982, "percentage": 32.77, "elapsed_time": "0:49:45", "remaining_time": "1:42:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1800, "total_steps": 5463, "loss": 0.7124, "learning_rate": 4.240447308783679e-05, "epoch": 0.9880609304240429, "percentage": 32.95, "elapsed_time": "0:50:01", "remaining_time": "1:41:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1810, "total_steps": 5463, "loss": 0.7138, "learning_rate": 4.2289429208570094e-05, "epoch": 0.9935501578152875, "percentage": 33.13, "elapsed_time": "0:50:18", "remaining_time": "1:41:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1820, "total_steps": 5463, "loss": 0.7439, "learning_rate": 4.217367924724741e-05, "epoch": 0.9990393852065321, "percentage": 33.32, "elapsed_time": "0:50:34", "remaining_time": "1:41:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1830, "total_steps": 5463, "loss": 0.4876, "learning_rate": 4.2057227930975066e-05, "epoch": 1.0045286125977768, "percentage": 33.5, "elapsed_time": "0:50:51", "remaining_time": "1:40:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1840, "total_steps": 5463, "loss": 0.4949, "learning_rate": 4.194008001550204e-05, "epoch": 1.0100178399890216, "percentage": 33.68, "elapsed_time": "0:51:07", "remaining_time": "1:40:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1850, "total_steps": 5463, "loss": 0.5329, "learning_rate": 4.1822240285025635e-05, "epoch": 1.0155070673802662, "percentage": 33.86, "elapsed_time": "0:51:24", "remaining_time": "1:40:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1860, "total_steps": 5463, "loss": 0.5068, "learning_rate": 4.170371355199621e-05, "epoch": 1.020996294771511, "percentage": 34.05, "elapsed_time": "0:51:40", "remaining_time": "1:40:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1870, "total_steps": 5463, "loss": 0.5112, "learning_rate": 4.158450465692051e-05, "epoch": 1.0264855221627556, "percentage": 34.23, "elapsed_time": "0:51:57", "remaining_time": "1:39:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1880, "total_steps": 5463, "loss": 0.4826, "learning_rate": 4.146461846816411e-05, "epoch": 1.0319747495540004, "percentage": 34.41, "elapsed_time": "0:52:14", "remaining_time": "1:39:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1890, "total_steps": 5463, "loss": 0.4522, "learning_rate": 4.1344059881752534e-05, "epoch": 1.037463976945245, "percentage": 34.6, "elapsed_time": "0:52:30", "remaining_time": "1:39:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1900, "total_steps": 5463, "loss": 0.4726, "learning_rate": 4.1222833821171315e-05, "epoch": 1.0429532043364897, "percentage": 34.78, "elapsed_time": "0:52:47", "remaining_time": "1:38:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1910, "total_steps": 5463, "loss": 0.469, "learning_rate": 4.110094523716492e-05, "epoch": 1.0484424317277343, "percentage": 34.96, "elapsed_time": "0:53:03", "remaining_time": "1:38:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1920, "total_steps": 5463, "loss": 0.4554, "learning_rate": 4.0978399107534584e-05, "epoch": 1.053931659118979, "percentage": 35.15, "elapsed_time": "0:53:20", "remaining_time": "1:38:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1930, "total_steps": 5463, "loss": 0.4914, "learning_rate": 4.0855200436935e-05, "epoch": 1.0594208865102237, "percentage": 35.33, "elapsed_time": "0:53:37", "remaining_time": "1:38:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1940, "total_steps": 5463, "loss": 0.4609, "learning_rate": 4.073135425666997e-05, "epoch": 1.0649101139014683, "percentage": 35.51, "elapsed_time": "0:53:53", "remaining_time": "1:37:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1950, "total_steps": 5463, "loss": 0.472, "learning_rate": 4.0606865624486875e-05, "epoch": 1.070399341292713, "percentage": 35.69, "elapsed_time": "0:54:10", "remaining_time": "1:37:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1960, "total_steps": 5463, "loss": 0.5072, "learning_rate": 4.048173962437019e-05, "epoch": 1.0758885686839577, "percentage": 35.88, "elapsed_time": "0:54:26", "remaining_time": "1:37:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1970, "total_steps": 5463, "loss": 0.455, "learning_rate": 4.035598136633378e-05, "epoch": 1.0813777960752025, "percentage": 36.06, "elapsed_time": "0:54:43", "remaining_time": "1:37:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1980, "total_steps": 5463, "loss": 0.5023, "learning_rate": 4.0229595986212304e-05, "epoch": 1.086867023466447, "percentage": 36.24, "elapsed_time": "0:55:00", "remaining_time": "1:36:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 1990, "total_steps": 5463, "loss": 0.4863, "learning_rate": 4.0102588645451396e-05, "epoch": 1.0923562508576918, "percentage": 36.43, "elapsed_time": "0:55:16", "remaining_time": "1:36:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2000, "total_steps": 5463, "loss": 0.4912, "learning_rate": 3.997496453089692e-05, "epoch": 1.0978454782489364, "percentage": 36.61, "elapsed_time": "0:55:33", "remaining_time": "1:36:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2010, "total_steps": 5463, "loss": 0.4691, "learning_rate": 3.984672885458312e-05, "epoch": 1.1033347056401812, "percentage": 36.79, "elapsed_time": "0:55:53", "remaining_time": "1:36:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2020, "total_steps": 5463, "loss": 0.4965, "learning_rate": 3.971788685351978e-05, "epoch": 1.1088239330314258, "percentage": 36.98, "elapsed_time": "0:56:10", "remaining_time": "1:35:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2030, "total_steps": 5463, "loss": 0.468, "learning_rate": 3.9588443789478366e-05, "epoch": 1.1143131604226706, "percentage": 37.16, "elapsed_time": "0:56:27", "remaining_time": "1:35:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2040, "total_steps": 5463, "loss": 0.4886, "learning_rate": 3.945840494877709e-05, "epoch": 1.1198023878139152, "percentage": 37.34, "elapsed_time": "0:56:44", "remaining_time": "1:35:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2050, "total_steps": 5463, "loss": 0.4932, "learning_rate": 3.934086499185402e-05, "epoch": 1.12529161520516, "percentage": 37.53, "elapsed_time": "0:57:00", "remaining_time": "1:34:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2060, "total_steps": 5463, "loss": 0.5121, "learning_rate": 3.9209708826272075e-05, "epoch": 1.1307808425964045, "percentage": 37.71, "elapsed_time": "0:57:17", "remaining_time": "1:34:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2070, "total_steps": 5463, "loss": 0.5094, "learning_rate": 3.907797235116677e-05, "epoch": 1.1362700699876491, "percentage": 37.89, "elapsed_time": "0:57:33", "remaining_time": "1:34:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2080, "total_steps": 5463, "loss": 0.488, "learning_rate": 3.894566094651682e-05, "epoch": 1.141759297378894, "percentage": 38.07, "elapsed_time": "0:57:50", "remaining_time": "1:34:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2090, "total_steps": 5463, "loss": 0.531, "learning_rate": 3.881278001578046e-05, "epoch": 1.1472485247701387, "percentage": 38.26, "elapsed_time": "0:58:06", "remaining_time": "1:33:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2100, "total_steps": 5463, "loss": 0.5397, "learning_rate": 3.8679334985674786e-05, "epoch": 1.1527377521613833, "percentage": 38.44, "elapsed_time": "0:58:23", "remaining_time": "1:33:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2110, "total_steps": 5463, "loss": 0.4964, "learning_rate": 3.854533130595408e-05, "epoch": 1.1582269795526279, "percentage": 38.62, "elapsed_time": "0:58:39", "remaining_time": "1:33:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2120, "total_steps": 5463, "loss": 0.5011, "learning_rate": 3.8410774449187315e-05, "epoch": 1.1637162069438727, "percentage": 38.81, "elapsed_time": "0:58:56", "remaining_time": "1:32:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2130, "total_steps": 5463, "loss": 0.4922, "learning_rate": 3.827566991053461e-05, "epoch": 1.1692054343351173, "percentage": 38.99, "elapsed_time": "0:59:13", "remaining_time": "1:32:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2140, "total_steps": 5463, "loss": 0.4309, "learning_rate": 3.814002320752287e-05, "epoch": 1.174694661726362, "percentage": 39.17, "elapsed_time": "0:59:29", "remaining_time": "1:32:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2150, "total_steps": 5463, "loss": 0.4761, "learning_rate": 3.8003839879820377e-05, "epoch": 1.1801838891176066, "percentage": 39.36, "elapsed_time": "0:59:46", "remaining_time": "1:32:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2160, "total_steps": 5463, "loss": 0.4895, "learning_rate": 3.786712548901064e-05, "epoch": 1.1856731165088514, "percentage": 39.54, "elapsed_time": "1:00:03", "remaining_time": "1:31:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2170, "total_steps": 5463, "loss": 0.4894, "learning_rate": 3.772988561836517e-05, "epoch": 1.191162343900096, "percentage": 39.72, "elapsed_time": "1:00:19", "remaining_time": "1:31:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2180, "total_steps": 5463, "loss": 0.4812, "learning_rate": 3.759212587261559e-05, "epoch": 1.1966515712913408, "percentage": 39.9, "elapsed_time": "1:00:36", "remaining_time": "1:31:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2190, "total_steps": 5463, "loss": 0.4928, "learning_rate": 3.745385187772463e-05, "epoch": 1.2021407986825854, "percentage": 40.09, "elapsed_time": "1:00:53", "remaining_time": "1:30:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2200, "total_steps": 5463, "loss": 0.512, "learning_rate": 3.731506928065641e-05, "epoch": 1.2076300260738302, "percentage": 40.27, "elapsed_time": "1:01:09", "remaining_time": "1:30:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2210, "total_steps": 5463, "loss": 0.4715, "learning_rate": 3.717578374914585e-05, "epoch": 1.2131192534650748, "percentage": 40.45, "elapsed_time": "1:01:26", "remaining_time": "1:30:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2220, "total_steps": 5463, "loss": 0.4754, "learning_rate": 3.703600097146718e-05, "epoch": 1.2186084808563196, "percentage": 40.64, "elapsed_time": "1:01:42", "remaining_time": "1:30:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2230, "total_steps": 5463, "loss": 0.475, "learning_rate": 3.68957266562016e-05, "epoch": 1.2240977082475641, "percentage": 40.82, "elapsed_time": "1:01:59", "remaining_time": "1:29:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2240, "total_steps": 5463, "loss": 0.4901, "learning_rate": 3.675496653200425e-05, "epoch": 1.229586935638809, "percentage": 41.0, "elapsed_time": "1:02:15", "remaining_time": "1:29:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2250, "total_steps": 5463, "loss": 0.4694, "learning_rate": 3.661372634737013e-05, "epoch": 1.2350761630300535, "percentage": 41.19, "elapsed_time": "1:02:32", "remaining_time": "1:29:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2260, "total_steps": 5463, "loss": 0.4809, "learning_rate": 3.647201187039946e-05, "epoch": 1.240565390421298, "percentage": 41.37, "elapsed_time": "1:02:48", "remaining_time": "1:29:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2270, "total_steps": 5463, "loss": 0.4539, "learning_rate": 3.632982888856202e-05, "epoch": 1.246054617812543, "percentage": 41.55, "elapsed_time": "1:03:05", "remaining_time": "1:28:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2280, "total_steps": 5463, "loss": 0.4945, "learning_rate": 3.6187183208460844e-05, "epoch": 1.2515438452037877, "percentage": 41.74, "elapsed_time": "1:03:22", "remaining_time": "1:28:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2290, "total_steps": 5463, "loss": 0.4853, "learning_rate": 3.604408065559508e-05, "epoch": 1.2570330725950323, "percentage": 41.92, "elapsed_time": "1:03:38", "remaining_time": "1:28:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2300, "total_steps": 5463, "loss": 0.498, "learning_rate": 3.590052707412208e-05, "epoch": 1.2625222999862769, "percentage": 42.1, "elapsed_time": "1:03:55", "remaining_time": "1:27:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2310, "total_steps": 5463, "loss": 0.5287, "learning_rate": 3.575652832661872e-05, "epoch": 1.2680115273775217, "percentage": 42.28, "elapsed_time": "1:04:11", "remaining_time": "1:27:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2320, "total_steps": 5463, "loss": 0.5035, "learning_rate": 3.5612090293841994e-05, "epoch": 1.2735007547687662, "percentage": 42.47, "elapsed_time": "1:04:28", "remaining_time": "1:27:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2330, "total_steps": 5463, "loss": 0.5078, "learning_rate": 3.5467218874488837e-05, "epoch": 1.278989982160011, "percentage": 42.65, "elapsed_time": "1:04:44", "remaining_time": "1:27:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2340, "total_steps": 5463, "loss": 0.5015, "learning_rate": 3.5321919984955244e-05, "epoch": 1.2844792095512556, "percentage": 42.83, "elapsed_time": "1:05:01", "remaining_time": "1:26:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2350, "total_steps": 5463, "loss": 0.4556, "learning_rate": 3.517619955909463e-05, "epoch": 1.2899684369425004, "percentage": 43.02, "elapsed_time": "1:05:18", "remaining_time": "1:26:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2360, "total_steps": 5463, "loss": 0.4417, "learning_rate": 3.5030063547975525e-05, "epoch": 1.295457664333745, "percentage": 43.2, "elapsed_time": "1:05:34", "remaining_time": "1:26:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2370, "total_steps": 5463, "loss": 0.435, "learning_rate": 3.488351791963849e-05, "epoch": 1.3009468917249898, "percentage": 43.38, "elapsed_time": "1:05:51", "remaining_time": "1:25:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2380, "total_steps": 5463, "loss": 0.4872, "learning_rate": 3.473656865885248e-05, "epoch": 1.3064361191162344, "percentage": 43.57, "elapsed_time": "1:06:08", "remaining_time": "1:25:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2390, "total_steps": 5463, "loss": 0.479, "learning_rate": 3.4589221766870306e-05, "epoch": 1.3119253465074792, "percentage": 43.75, "elapsed_time": "1:06:25", "remaining_time": "1:25:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2400, "total_steps": 5463, "loss": 0.577, "learning_rate": 3.444148326118366e-05, "epoch": 1.3174145738987237, "percentage": 43.93, "elapsed_time": "1:06:41", "remaining_time": "1:25:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2410, "total_steps": 5463, "loss": 0.4801, "learning_rate": 3.4293359175277314e-05, "epoch": 1.3229038012899683, "percentage": 44.11, "elapsed_time": "1:06:58", "remaining_time": "1:24:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2420, "total_steps": 5463, "loss": 0.4884, "learning_rate": 3.414485555838273e-05, "epoch": 1.3283930286812131, "percentage": 44.3, "elapsed_time": "1:07:14", "remaining_time": "1:24:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2430, "total_steps": 5463, "loss": 0.4527, "learning_rate": 3.3995978475231024e-05, "epoch": 1.333882256072458, "percentage": 44.48, "elapsed_time": "1:07:31", "remaining_time": "1:24:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2440, "total_steps": 5463, "loss": 0.4831, "learning_rate": 3.3846734005805254e-05, "epoch": 1.3393714834637025, "percentage": 44.66, "elapsed_time": "1:07:47", "remaining_time": "1:23:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2450, "total_steps": 5463, "loss": 0.4994, "learning_rate": 3.369712824509217e-05, "epoch": 1.344860710854947, "percentage": 44.85, "elapsed_time": "1:08:04", "remaining_time": "1:23:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2460, "total_steps": 5463, "loss": 0.4761, "learning_rate": 3.354716730283327e-05, "epoch": 1.3503499382461919, "percentage": 45.03, "elapsed_time": "1:08:21", "remaining_time": "1:23:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2470, "total_steps": 5463, "loss": 0.4891, "learning_rate": 3.3396857303275296e-05, "epoch": 1.3558391656374364, "percentage": 45.21, "elapsed_time": "1:08:37", "remaining_time": "1:23:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2480, "total_steps": 5463, "loss": 0.4415, "learning_rate": 3.324620438492011e-05, "epoch": 1.3613283930286812, "percentage": 45.4, "elapsed_time": "1:08:54", "remaining_time": "1:22:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2490, "total_steps": 5463, "loss": 0.4733, "learning_rate": 3.309521470027403e-05, "epoch": 1.3668176204199258, "percentage": 45.58, "elapsed_time": "1:09:11", "remaining_time": "1:22:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2500, "total_steps": 5463, "loss": 0.4626, "learning_rate": 3.294389441559655e-05, "epoch": 1.3723068478111706, "percentage": 45.76, "elapsed_time": "1:09:28", "remaining_time": "1:22:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2510, "total_steps": 5463, "loss": 0.5168, "learning_rate": 3.279224971064851e-05, "epoch": 1.3777960752024152, "percentage": 45.95, "elapsed_time": "1:09:44", "remaining_time": "1:22:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2520, "total_steps": 5463, "loss": 0.4687, "learning_rate": 3.2640286778439746e-05, "epoch": 1.38328530259366, "percentage": 46.13, "elapsed_time": "1:10:01", "remaining_time": "1:21:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2530, "total_steps": 5463, "loss": 0.454, "learning_rate": 3.248801182497615e-05, "epoch": 1.3887745299849046, "percentage": 46.31, "elapsed_time": "1:10:17", "remaining_time": "1:21:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2540, "total_steps": 5463, "loss": 0.4594, "learning_rate": 3.233543106900624e-05, "epoch": 1.3942637573761494, "percentage": 46.49, "elapsed_time": "1:10:34", "remaining_time": "1:21:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2550, "total_steps": 5463, "loss": 0.4408, "learning_rate": 3.21825507417672e-05, "epoch": 1.399752984767394, "percentage": 46.68, "elapsed_time": "1:10:50", "remaining_time": "1:20:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2560, "total_steps": 5463, "loss": 0.4802, "learning_rate": 3.202937708673033e-05, "epoch": 1.4052422121586385, "percentage": 46.86, "elapsed_time": "1:11:07", "remaining_time": "1:20:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2570, "total_steps": 5463, "loss": 0.4731, "learning_rate": 3.1875916359346214e-05, "epoch": 1.4107314395498833, "percentage": 47.04, "elapsed_time": "1:11:23", "remaining_time": "1:20:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2580, "total_steps": 5463, "loss": 0.454, "learning_rate": 3.17221748267891e-05, "epoch": 1.4162206669411281, "percentage": 47.23, "elapsed_time": "1:11:40", "remaining_time": "1:20:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2590, "total_steps": 5463, "loss": 0.4229, "learning_rate": 3.156815876770105e-05, "epoch": 1.4217098943323727, "percentage": 47.41, "elapsed_time": "1:11:57", "remaining_time": "1:19:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2600, "total_steps": 5463, "loss": 0.4896, "learning_rate": 3.1413874471935496e-05, "epoch": 1.4271991217236173, "percentage": 47.59, "elapsed_time": "1:12:13", "remaining_time": "1:19:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2610, "total_steps": 5463, "loss": 0.4808, "learning_rate": 3.125932824030037e-05, "epoch": 1.432688349114862, "percentage": 47.78, "elapsed_time": "1:12:29", "remaining_time": "1:19:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2620, "total_steps": 5463, "loss": 0.4271, "learning_rate": 3.110452638430081e-05, "epoch": 1.438177576506107, "percentage": 47.96, "elapsed_time": "1:12:46", "remaining_time": "1:18:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2630, "total_steps": 5463, "loss": 0.4618, "learning_rate": 3.094947522588135e-05, "epoch": 1.4436668038973515, "percentage": 48.14, "elapsed_time": "1:13:03", "remaining_time": "1:18:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2640, "total_steps": 5463, "loss": 0.4765, "learning_rate": 3.079418109716778e-05, "epoch": 1.449156031288596, "percentage": 48.33, "elapsed_time": "1:13:19", "remaining_time": "1:18:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2650, "total_steps": 5463, "loss": 0.4596, "learning_rate": 3.063865034020857e-05, "epoch": 1.4546452586798408, "percentage": 48.51, "elapsed_time": "1:13:36", "remaining_time": "1:18:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2660, "total_steps": 5463, "loss": 0.4384, "learning_rate": 3.0482889306715813e-05, "epoch": 1.4601344860710854, "percentage": 48.69, "elapsed_time": "1:13:52", "remaining_time": "1:17:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2670, "total_steps": 5463, "loss": 0.4872, "learning_rate": 3.032690435780584e-05, "epoch": 1.4656237134623302, "percentage": 48.87, "elapsed_time": "1:14:09", "remaining_time": "1:17:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2680, "total_steps": 5463, "loss": 0.4581, "learning_rate": 3.017070186373949e-05, "epoch": 1.4711129408535748, "percentage": 49.06, "elapsed_time": "1:14:25", "remaining_time": "1:17:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2690, "total_steps": 5463, "loss": 0.49, "learning_rate": 3.001428820366187e-05, "epoch": 1.4766021682448196, "percentage": 49.24, "elapsed_time": "1:14:42", "remaining_time": "1:17:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2700, "total_steps": 5463, "loss": 0.4262, "learning_rate": 2.9857669765341928e-05, "epoch": 1.4820913956360642, "percentage": 49.42, "elapsed_time": "1:14:58", "remaining_time": "1:16:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2710, "total_steps": 5463, "loss": 0.4774, "learning_rate": 2.9700852944911512e-05, "epoch": 1.487580623027309, "percentage": 49.61, "elapsed_time": "1:15:15", "remaining_time": "1:16:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2720, "total_steps": 5463, "loss": 0.4618, "learning_rate": 2.9543844146604195e-05, "epoch": 1.4930698504185536, "percentage": 49.79, "elapsed_time": "1:15:31", "remaining_time": "1:16:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2730, "total_steps": 5463, "loss": 0.4278, "learning_rate": 2.938664978249372e-05, "epoch": 1.4985590778097984, "percentage": 49.97, "elapsed_time": "1:15:48", "remaining_time": "1:15:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2740, "total_steps": 5463, "loss": 0.4706, "learning_rate": 2.9229276272232146e-05, "epoch": 1.504048305201043, "percentage": 50.16, "elapsed_time": "1:16:06", "remaining_time": "1:15:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2750, "total_steps": 5463, "loss": 0.4308, "learning_rate": 2.907173004278768e-05, "epoch": 1.5095375325922875, "percentage": 50.34, "elapsed_time": "1:16:22", "remaining_time": "1:15:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2760, "total_steps": 5463, "loss": 0.4487, "learning_rate": 2.8914017528182185e-05, "epoch": 1.5150267599835323, "percentage": 50.52, "elapsed_time": "1:16:39", "remaining_time": "1:15:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2770, "total_steps": 5463, "loss": 0.4232, "learning_rate": 2.8756145169228432e-05, "epoch": 1.5205159873747771, "percentage": 50.7, "elapsed_time": "1:16:55", "remaining_time": "1:14:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2780, "total_steps": 5463, "loss": 0.4603, "learning_rate": 2.859811941326709e-05, "epoch": 1.5260052147660217, "percentage": 50.89, "elapsed_time": "1:17:12", "remaining_time": "1:14:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2790, "total_steps": 5463, "loss": 0.4649, "learning_rate": 2.8439946713903354e-05, "epoch": 1.5314944421572663, "percentage": 51.07, "elapsed_time": "1:17:28", "remaining_time": "1:14:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2800, "total_steps": 5463, "loss": 0.4988, "learning_rate": 2.8281633530743497e-05, "epoch": 1.536983669548511, "percentage": 51.25, "elapsed_time": "1:17:45", "remaining_time": "1:13:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2810, "total_steps": 5463, "loss": 0.4795, "learning_rate": 2.8123186329130942e-05, "epoch": 1.5424728969397559, "percentage": 51.44, "elapsed_time": "1:18:04", "remaining_time": "1:13:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2820, "total_steps": 5463, "loss": 0.427, "learning_rate": 2.7964611579882317e-05, "epoch": 1.5479621243310004, "percentage": 51.62, "elapsed_time": "1:18:22", "remaining_time": "1:13:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2830, "total_steps": 5463, "loss": 0.4982, "learning_rate": 2.7805915759023153e-05, "epoch": 1.553451351722245, "percentage": 51.8, "elapsed_time": "1:18:41", "remaining_time": "1:13:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2840, "total_steps": 5463, "loss": 0.4489, "learning_rate": 2.764710534752342e-05, "epoch": 1.5589405791134898, "percentage": 51.99, "elapsed_time": "1:19:00", "remaining_time": "1:12:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2850, "total_steps": 5463, "loss": 0.4177, "learning_rate": 2.748818683103285e-05, "epoch": 1.5644298065047346, "percentage": 52.17, "elapsed_time": "1:19:18", "remaining_time": "1:12:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2860, "total_steps": 5463, "loss": 0.4816, "learning_rate": 2.7329166699616064e-05, "epoch": 1.569919033895979, "percentage": 52.35, "elapsed_time": "1:19:34", "remaining_time": "1:12:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2870, "total_steps": 5463, "loss": 0.4392, "learning_rate": 2.7170051447487532e-05, "epoch": 1.5754082612872238, "percentage": 52.54, "elapsed_time": "1:19:51", "remaining_time": "1:12:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2880, "total_steps": 5463, "loss": 0.5002, "learning_rate": 2.7010847572746356e-05, "epoch": 1.5808974886784686, "percentage": 52.72, "elapsed_time": "1:20:07", "remaining_time": "1:11:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2890, "total_steps": 5463, "loss": 0.437, "learning_rate": 2.6851561577110874e-05, "epoch": 1.5863867160697132, "percentage": 52.9, "elapsed_time": "1:20:23", "remaining_time": "1:11:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2900, "total_steps": 5463, "loss": 0.4565, "learning_rate": 2.6692199965653185e-05, "epoch": 1.5918759434609577, "percentage": 53.08, "elapsed_time": "1:20:40", "remaining_time": "1:11:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2910, "total_steps": 5463, "loss": 0.4755, "learning_rate": 2.6532769246533435e-05, "epoch": 1.5973651708522025, "percentage": 53.27, "elapsed_time": "1:20:56", "remaining_time": "1:11:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2920, "total_steps": 5463, "loss": 0.4603, "learning_rate": 2.6373275930734075e-05, "epoch": 1.6028543982434473, "percentage": 53.45, "elapsed_time": "1:21:13", "remaining_time": "1:10:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2930, "total_steps": 5463, "loss": 0.4551, "learning_rate": 2.621372653179391e-05, "epoch": 1.608343625634692, "percentage": 53.63, "elapsed_time": "1:21:29", "remaining_time": "1:10:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2940, "total_steps": 5463, "loss": 0.5062, "learning_rate": 2.6054127565542146e-05, "epoch": 1.6138328530259365, "percentage": 53.82, "elapsed_time": "1:21:45", "remaining_time": "1:10:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2950, "total_steps": 5463, "loss": 0.5046, "learning_rate": 2.5894485549832254e-05, "epoch": 1.6193220804171813, "percentage": 54.0, "elapsed_time": "1:22:02", "remaining_time": "1:09:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2960, "total_steps": 5463, "loss": 0.4685, "learning_rate": 2.57348070042758e-05, "epoch": 1.624811307808426, "percentage": 54.18, "elapsed_time": "1:22:18", "remaining_time": "1:09:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2970, "total_steps": 5463, "loss": 0.4836, "learning_rate": 2.5575098449976204e-05, "epoch": 1.6303005351996707, "percentage": 54.37, "elapsed_time": "1:22:35", "remaining_time": "1:09:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2980, "total_steps": 5463, "loss": 0.4146, "learning_rate": 2.541536640926238e-05, "epoch": 1.6357897625909152, "percentage": 54.55, "elapsed_time": "1:22:52", "remaining_time": "1:09:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 2990, "total_steps": 5463, "loss": 0.441, "learning_rate": 2.5255617405422443e-05, "epoch": 1.64127898998216, "percentage": 54.73, "elapsed_time": "1:23:08", "remaining_time": "1:08:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3000, "total_steps": 5463, "loss": 0.4932, "learning_rate": 2.5095857962437226e-05, "epoch": 1.6467682173734048, "percentage": 54.91, "elapsed_time": "1:23:24", "remaining_time": "1:08:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3010, "total_steps": 5463, "loss": 0.4324, "learning_rate": 2.4936094604713918e-05, "epoch": 1.6522574447646494, "percentage": 55.1, "elapsed_time": "1:23:44", "remaining_time": "1:08:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3020, "total_steps": 5463, "loss": 0.4655, "learning_rate": 2.4776333856819565e-05, "epoch": 1.657746672155894, "percentage": 55.28, "elapsed_time": "1:24:00", "remaining_time": "1:07:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3030, "total_steps": 5463, "loss": 0.4631, "learning_rate": 2.4616582243214623e-05, "epoch": 1.6632358995471388, "percentage": 55.46, "elapsed_time": "1:24:18", "remaining_time": "1:07:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3040, "total_steps": 5463, "loss": 0.4492, "learning_rate": 2.4456846287986525e-05, "epoch": 1.6687251269383834, "percentage": 55.65, "elapsed_time": "1:24:35", "remaining_time": "1:07:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3050, "total_steps": 5463, "loss": 0.4326, "learning_rate": 2.429713251458323e-05, "epoch": 1.674214354329628, "percentage": 55.83, "elapsed_time": "1:24:51", "remaining_time": "1:07:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3060, "total_steps": 5463, "loss": 0.4527, "learning_rate": 2.4137447445546837e-05, "epoch": 1.6797035817208728, "percentage": 56.01, "elapsed_time": "1:25:08", "remaining_time": "1:06:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3070, "total_steps": 5463, "loss": 0.4331, "learning_rate": 2.397779760224713e-05, "epoch": 1.6851928091121176, "percentage": 56.2, "elapsed_time": "1:25:24", "remaining_time": "1:06:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3080, "total_steps": 5463, "loss": 0.4159, "learning_rate": 2.3818189504615367e-05, "epoch": 1.6906820365033621, "percentage": 56.38, "elapsed_time": "1:25:41", "remaining_time": "1:06:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3090, "total_steps": 5463, "loss": 0.4996, "learning_rate": 2.3658629670877938e-05, "epoch": 1.6961712638946067, "percentage": 56.56, "elapsed_time": "1:25:57", "remaining_time": "1:06:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3100, "total_steps": 5463, "loss": 0.4827, "learning_rate": 2.3499124617290187e-05, "epoch": 1.7016604912858515, "percentage": 56.75, "elapsed_time": "1:26:15", "remaining_time": "1:05:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3110, "total_steps": 5463, "loss": 0.5358, "learning_rate": 2.3339680857870288e-05, "epoch": 1.7071497186770963, "percentage": 56.93, "elapsed_time": "1:26:31", "remaining_time": "1:05:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3120, "total_steps": 5463, "loss": 0.4584, "learning_rate": 2.318030490413323e-05, "epoch": 1.7126389460683409, "percentage": 57.11, "elapsed_time": "1:26:48", "remaining_time": "1:05:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3130, "total_steps": 5463, "loss": 0.4366, "learning_rate": 2.30210032648249e-05, "epoch": 1.7181281734595855, "percentage": 57.29, "elapsed_time": "1:27:04", "remaining_time": "1:04:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3140, "total_steps": 5463, "loss": 0.4633, "learning_rate": 2.286178244565625e-05, "epoch": 1.7236174008508303, "percentage": 57.48, "elapsed_time": "1:27:21", "remaining_time": "1:04:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3150, "total_steps": 5463, "loss": 0.4861, "learning_rate": 2.2702648949037618e-05, "epoch": 1.729106628242075, "percentage": 57.66, "elapsed_time": "1:27:37", "remaining_time": "1:04:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3160, "total_steps": 5463, "loss": 0.4881, "learning_rate": 2.2543609273813195e-05, "epoch": 1.7345958556333196, "percentage": 57.84, "elapsed_time": "1:27:54", "remaining_time": "1:04:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3170, "total_steps": 5463, "loss": 0.418, "learning_rate": 2.2384669914995592e-05, "epoch": 1.7400850830245642, "percentage": 58.03, "elapsed_time": "1:28:10", "remaining_time": "1:03:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3180, "total_steps": 5463, "loss": 0.472, "learning_rate": 2.2225837363500636e-05, "epoch": 1.745574310415809, "percentage": 58.21, "elapsed_time": "1:28:27", "remaining_time": "1:03:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3190, "total_steps": 5463, "loss": 0.4718, "learning_rate": 2.2067118105882195e-05, "epoch": 1.7510635378070538, "percentage": 58.39, "elapsed_time": "1:28:43", "remaining_time": "1:03:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3200, "total_steps": 5463, "loss": 0.4318, "learning_rate": 2.190851862406739e-05, "epoch": 1.7565527651982984, "percentage": 58.58, "elapsed_time": "1:29:00", "remaining_time": "1:02:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3210, "total_steps": 5463, "loss": 0.4728, "learning_rate": 2.17500453950918e-05, "epoch": 1.762041992589543, "percentage": 58.76, "elapsed_time": "1:29:16", "remaining_time": "1:02:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3220, "total_steps": 5463, "loss": 0.4229, "learning_rate": 2.159170489083498e-05, "epoch": 1.7675312199807878, "percentage": 58.94, "elapsed_time": "1:29:33", "remaining_time": "1:02:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3230, "total_steps": 5463, "loss": 0.3906, "learning_rate": 2.1433503577756137e-05, "epoch": 1.7730204473720323, "percentage": 59.13, "elapsed_time": "1:29:49", "remaining_time": "1:02:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3240, "total_steps": 5463, "loss": 0.379, "learning_rate": 2.1275447916630055e-05, "epoch": 1.778509674763277, "percentage": 59.31, "elapsed_time": "1:30:06", "remaining_time": "1:01:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3250, "total_steps": 5463, "loss": 0.4173, "learning_rate": 2.1117544362283286e-05, "epoch": 1.7839989021545217, "percentage": 59.49, "elapsed_time": "1:30:22", "remaining_time": "1:01:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3260, "total_steps": 5463, "loss": 0.426, "learning_rate": 2.0959799363330425e-05, "epoch": 1.7894881295457665, "percentage": 59.67, "elapsed_time": "1:30:39", "remaining_time": "1:01:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3270, "total_steps": 5463, "loss": 0.4165, "learning_rate": 2.0802219361910908e-05, "epoch": 1.794977356937011, "percentage": 59.86, "elapsed_time": "1:30:55", "remaining_time": "1:00:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3280, "total_steps": 5463, "loss": 0.4216, "learning_rate": 2.0644810793425807e-05, "epoch": 1.8004665843282557, "percentage": 60.04, "elapsed_time": "1:31:12", "remaining_time": "1:00:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3290, "total_steps": 5463, "loss": 0.4745, "learning_rate": 2.048758008627506e-05, "epoch": 1.8059558117195005, "percentage": 60.22, "elapsed_time": "1:31:29", "remaining_time": "1:00:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3300, "total_steps": 5463, "loss": 0.4314, "learning_rate": 2.033053366159493e-05, "epoch": 1.8114450391107453, "percentage": 60.41, "elapsed_time": "1:31:45", "remaining_time": "1:00:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3310, "total_steps": 5463, "loss": 0.4882, "learning_rate": 2.0173677932995787e-05, "epoch": 1.8169342665019899, "percentage": 60.59, "elapsed_time": "1:32:02", "remaining_time": "0:59:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3320, "total_steps": 5463, "loss": 0.4346, "learning_rate": 2.0017019306300182e-05, "epoch": 1.8224234938932344, "percentage": 60.77, "elapsed_time": "1:32:18", "remaining_time": "0:59:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3330, "total_steps": 5463, "loss": 0.515, "learning_rate": 1.9860564179281217e-05, "epoch": 1.8279127212844792, "percentage": 60.96, "elapsed_time": "1:32:35", "remaining_time": "0:59:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3340, "total_steps": 5463, "loss": 0.4268, "learning_rate": 1.970431894140128e-05, "epoch": 1.833401948675724, "percentage": 61.14, "elapsed_time": "1:32:51", "remaining_time": "0:59:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3350, "total_steps": 5463, "loss": 0.4324, "learning_rate": 1.954828997355112e-05, "epoch": 1.8388911760669686, "percentage": 61.32, "elapsed_time": "1:33:08", "remaining_time": "0:58:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3360, "total_steps": 5463, "loss": 0.4542, "learning_rate": 1.939248364778924e-05, "epoch": 1.8443804034582132, "percentage": 61.5, "elapsed_time": "1:33:24", "remaining_time": "0:58:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3370, "total_steps": 5463, "loss": 0.4695, "learning_rate": 1.923690632708169e-05, "epoch": 1.849869630849458, "percentage": 61.69, "elapsed_time": "1:33:41", "remaining_time": "0:58:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3380, "total_steps": 5463, "loss": 0.4433, "learning_rate": 1.908156436504215e-05, "epoch": 1.8553588582407026, "percentage": 61.87, "elapsed_time": "1:33:57", "remaining_time": "0:57:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3390, "total_steps": 5463, "loss": 0.4257, "learning_rate": 1.892646410567255e-05, "epoch": 1.8608480856319471, "percentage": 62.05, "elapsed_time": "1:34:14", "remaining_time": "0:57:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3400, "total_steps": 5463, "loss": 0.3585, "learning_rate": 1.877161188310392e-05, "epoch": 1.866337313023192, "percentage": 62.24, "elapsed_time": "1:34:31", "remaining_time": "0:57:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3410, "total_steps": 5463, "loss": 0.4234, "learning_rate": 1.8617014021337732e-05, "epoch": 1.8718265404144367, "percentage": 62.42, "elapsed_time": "1:34:50", "remaining_time": "0:57:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3420, "total_steps": 5463, "loss": 0.4546, "learning_rate": 1.846267683398761e-05, "epoch": 1.8773157678056813, "percentage": 62.6, "elapsed_time": "1:35:09", "remaining_time": "0:56:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3430, "total_steps": 5463, "loss": 0.4505, "learning_rate": 1.830860662402153e-05, "epoch": 1.882804995196926, "percentage": 62.79, "elapsed_time": "1:35:27", "remaining_time": "0:56:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3440, "total_steps": 5463, "loss": 0.4684, "learning_rate": 1.8154809683504403e-05, "epoch": 1.8882942225881707, "percentage": 62.97, "elapsed_time": "1:35:46", "remaining_time": "0:56:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3450, "total_steps": 5463, "loss": 0.4478, "learning_rate": 1.8001292293341087e-05, "epoch": 1.8937834499794155, "percentage": 63.15, "elapsed_time": "1:36:04", "remaining_time": "0:56:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3460, "total_steps": 5463, "loss": 0.4323, "learning_rate": 1.7848060723019894e-05, "epoch": 1.89927267737066, "percentage": 63.34, "elapsed_time": "1:36:20", "remaining_time": "0:55:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3470, "total_steps": 5463, "loss": 0.4429, "learning_rate": 1.7695121230356566e-05, "epoch": 1.9047619047619047, "percentage": 63.52, "elapsed_time": "1:36:37", "remaining_time": "0:55:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3480, "total_steps": 5463, "loss": 0.4399, "learning_rate": 1.7542480061238685e-05, "epoch": 1.9102511321531495, "percentage": 63.7, "elapsed_time": "1:36:53", "remaining_time": "0:55:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3490, "total_steps": 5463, "loss": 0.4029, "learning_rate": 1.7390143449370663e-05, "epoch": 1.9157403595443943, "percentage": 63.88, "elapsed_time": "1:37:09", "remaining_time": "0:54:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3500, "total_steps": 5463, "loss": 0.4072, "learning_rate": 1.723811761601904e-05, "epoch": 1.9212295869356388, "percentage": 64.07, "elapsed_time": "1:37:26", "remaining_time": "0:54:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3510, "total_steps": 5463, "loss": 0.4502, "learning_rate": 1.708640876975855e-05, "epoch": 1.9267188143268834, "percentage": 64.25, "elapsed_time": "1:37:42", "remaining_time": "0:54:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3520, "total_steps": 5463, "loss": 0.4397, "learning_rate": 1.693502310621848e-05, "epoch": 1.9322080417181282, "percentage": 64.43, "elapsed_time": "1:37:59", "remaining_time": "0:54:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3530, "total_steps": 5463, "loss": 0.4562, "learning_rate": 1.6783966807829692e-05, "epoch": 1.937697269109373, "percentage": 64.62, "elapsed_time": "1:38:15", "remaining_time": "0:53:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3540, "total_steps": 5463, "loss": 0.4332, "learning_rate": 1.66332460435721e-05, "epoch": 1.9431864965006176, "percentage": 64.8, "elapsed_time": "1:38:32", "remaining_time": "0:53:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3550, "total_steps": 5463, "loss": 0.4392, "learning_rate": 1.648286696872277e-05, "epoch": 1.9486757238918622, "percentage": 64.98, "elapsed_time": "1:38:48", "remaining_time": "0:53:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3560, "total_steps": 5463, "loss": 0.4079, "learning_rate": 1.6332835724604556e-05, "epoch": 1.954164951283107, "percentage": 65.17, "elapsed_time": "1:39:05", "remaining_time": "0:52:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3570, "total_steps": 5463, "loss": 0.4156, "learning_rate": 1.6183158438335223e-05, "epoch": 1.9596541786743515, "percentage": 65.35, "elapsed_time": "1:39:21", "remaining_time": "0:52:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3580, "total_steps": 5463, "loss": 0.4514, "learning_rate": 1.6033841222577312e-05, "epoch": 1.9651434060655961, "percentage": 65.53, "elapsed_time": "1:39:38", "remaining_time": "0:52:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3590, "total_steps": 5463, "loss": 0.4107, "learning_rate": 1.588489017528844e-05, "epoch": 1.970632633456841, "percentage": 65.71, "elapsed_time": "1:39:54", "remaining_time": "0:52:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3600, "total_steps": 5463, "loss": 0.4247, "learning_rate": 1.573631137947232e-05, "epoch": 1.9761218608480857, "percentage": 65.9, "elapsed_time": "1:40:11", "remaining_time": "0:51:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3610, "total_steps": 5463, "loss": 0.3993, "learning_rate": 1.5588110902930252e-05, "epoch": 1.9816110882393303, "percentage": 66.08, "elapsed_time": "1:40:27", "remaining_time": "0:51:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3620, "total_steps": 5463, "loss": 0.4032, "learning_rate": 1.5440294798013445e-05, "epoch": 1.9871003156305749, "percentage": 66.26, "elapsed_time": "1:40:44", "remaining_time": "0:51:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3630, "total_steps": 5463, "loss": 0.4191, "learning_rate": 1.5292869101375718e-05, "epoch": 1.9925895430218197, "percentage": 66.45, "elapsed_time": "1:41:00", "remaining_time": "0:51:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3640, "total_steps": 5463, "loss": 0.4065, "learning_rate": 1.514583983372707e-05, "epoch": 1.9980787704130645, "percentage": 66.63, "elapsed_time": "1:41:17", "remaining_time": "0:50:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3650, "total_steps": 5463, "loss": 0.3012, "learning_rate": 1.4999212999587723e-05, "epoch": 2.003567997804309, "percentage": 66.81, "elapsed_time": "1:41:33", "remaining_time": "0:50:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3660, "total_steps": 5463, "loss": 0.2699, "learning_rate": 1.4852994587042957e-05, "epoch": 2.0090572251955536, "percentage": 67.0, "elapsed_time": "1:41:50", "remaining_time": "0:50:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3670, "total_steps": 5463, "loss": 0.256, "learning_rate": 1.4707190567498552e-05, "epoch": 2.0145464525867984, "percentage": 67.18, "elapsed_time": "1:42:06", "remaining_time": "0:49:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3680, "total_steps": 5463, "loss": 0.2306, "learning_rate": 1.4561806895436907e-05, "epoch": 2.0200356799780432, "percentage": 67.36, "elapsed_time": "1:42:23", "remaining_time": "0:49:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3690, "total_steps": 5463, "loss": 0.2363, "learning_rate": 1.4416849508173864e-05, "epoch": 2.0255249073692876, "percentage": 67.55, "elapsed_time": "1:42:39", "remaining_time": "0:49:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3700, "total_steps": 5463, "loss": 0.2407, "learning_rate": 1.4272324325616251e-05, "epoch": 2.0310141347605324, "percentage": 67.73, "elapsed_time": "1:42:56", "remaining_time": "0:49:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3710, "total_steps": 5463, "loss": 0.2525, "learning_rate": 1.4128237250020115e-05, "epoch": 2.036503362151777, "percentage": 67.91, "elapsed_time": "1:43:12", "remaining_time": "0:48:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3720, "total_steps": 5463, "loss": 0.2371, "learning_rate": 1.3984594165749676e-05, "epoch": 2.041992589543022, "percentage": 68.09, "elapsed_time": "1:43:29", "remaining_time": "0:48:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3730, "total_steps": 5463, "loss": 0.241, "learning_rate": 1.3841400939037013e-05, "epoch": 2.0474818169342663, "percentage": 68.28, "elapsed_time": "1:43:45", "remaining_time": "0:48:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3740, "total_steps": 5463, "loss": 0.2509, "learning_rate": 1.3698663417742496e-05, "epoch": 2.052971044325511, "percentage": 68.46, "elapsed_time": "1:44:02", "remaining_time": "0:47:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3750, "total_steps": 5463, "loss": 0.265, "learning_rate": 1.3556387431115969e-05, "epoch": 2.058460271716756, "percentage": 68.64, "elapsed_time": "1:44:18", "remaining_time": "0:47:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3760, "total_steps": 5463, "loss": 0.2182, "learning_rate": 1.3414578789558696e-05, "epoch": 2.0639494991080007, "percentage": 68.83, "elapsed_time": "1:44:35", "remaining_time": "0:47:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3770, "total_steps": 5463, "loss": 0.2477, "learning_rate": 1.3273243284386023e-05, "epoch": 2.069438726499245, "percentage": 69.01, "elapsed_time": "1:44:52", "remaining_time": "0:47:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3780, "total_steps": 5463, "loss": 0.2379, "learning_rate": 1.3132386687590958e-05, "epoch": 2.07492795389049, "percentage": 69.19, "elapsed_time": "1:45:08", "remaining_time": "0:46:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3790, "total_steps": 5463, "loss": 0.2319, "learning_rate": 1.2992014751608372e-05, "epoch": 2.0804171812817347, "percentage": 69.38, "elapsed_time": "1:45:25", "remaining_time": "0:46:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3800, "total_steps": 5463, "loss": 0.2416, "learning_rate": 1.2852133209080097e-05, "epoch": 2.0859064086729795, "percentage": 69.56, "elapsed_time": "1:45:42", "remaining_time": "0:46:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3810, "total_steps": 5463, "loss": 0.2629, "learning_rate": 1.2712747772620801e-05, "epoch": 2.091395636064224, "percentage": 69.74, "elapsed_time": "1:45:58", "remaining_time": "0:45:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3820, "total_steps": 5463, "loss": 0.2069, "learning_rate": 1.2573864134584718e-05, "epoch": 2.0968848634554687, "percentage": 69.92, "elapsed_time": "1:46:15", "remaining_time": "0:45:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3830, "total_steps": 5463, "loss": 0.237, "learning_rate": 1.243548796683319e-05, "epoch": 2.1023740908467135, "percentage": 70.11, "elapsed_time": "1:46:32", "remaining_time": "0:45:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3840, "total_steps": 5463, "loss": 0.2531, "learning_rate": 1.2297624920502953e-05, "epoch": 2.107863318237958, "percentage": 70.29, "elapsed_time": "1:46:49", "remaining_time": "0:45:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3850, "total_steps": 5463, "loss": 0.2464, "learning_rate": 1.2160280625775447e-05, "epoch": 2.1133525456292026, "percentage": 70.47, "elapsed_time": "1:47:05", "remaining_time": "0:44:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3860, "total_steps": 5463, "loss": 0.2344, "learning_rate": 1.2023460691646821e-05, "epoch": 2.1188417730204474, "percentage": 70.66, "elapsed_time": "1:47:22", "remaining_time": "0:44:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3870, "total_steps": 5463, "loss": 0.2191, "learning_rate": 1.1887170705698905e-05, "epoch": 2.124331000411692, "percentage": 70.84, "elapsed_time": "1:47:38", "remaining_time": "0:44:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3880, "total_steps": 5463, "loss": 0.2303, "learning_rate": 1.1751416233870999e-05, "epoch": 2.1298202278029366, "percentage": 71.02, "elapsed_time": "1:47:55", "remaining_time": "0:44:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3890, "total_steps": 5463, "loss": 0.2493, "learning_rate": 1.1616202820232567e-05, "epoch": 2.1353094551941814, "percentage": 71.21, "elapsed_time": "1:48:12", "remaining_time": "0:43:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3900, "total_steps": 5463, "loss": 0.2527, "learning_rate": 1.1481535986756828e-05, "epoch": 2.140798682585426, "percentage": 71.39, "elapsed_time": "1:48:30", "remaining_time": "0:43:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3910, "total_steps": 5463, "loss": 0.2599, "learning_rate": 1.134742123309525e-05, "epoch": 2.146287909976671, "percentage": 71.57, "elapsed_time": "1:48:48", "remaining_time": "0:43:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3920, "total_steps": 5463, "loss": 0.2457, "learning_rate": 1.1213864036352939e-05, "epoch": 2.1517771373679153, "percentage": 71.76, "elapsed_time": "1:49:06", "remaining_time": "0:42:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3930, "total_steps": 5463, "loss": 0.2532, "learning_rate": 1.1080869850864964e-05, "epoch": 2.15726636475916, "percentage": 71.94, "elapsed_time": "1:49:23", "remaining_time": "0:42:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3940, "total_steps": 5463, "loss": 0.2651, "learning_rate": 1.094844410797361e-05, "epoch": 2.162755592150405, "percentage": 72.12, "elapsed_time": "1:49:39", "remaining_time": "0:42:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3950, "total_steps": 5463, "loss": 0.2171, "learning_rate": 1.0816592215806562e-05, "epoch": 2.1682448195416497, "percentage": 72.3, "elapsed_time": "1:49:56", "remaining_time": "0:42:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3960, "total_steps": 5463, "loss": 0.2579, "learning_rate": 1.0685319559056051e-05, "epoch": 2.173734046932894, "percentage": 72.49, "elapsed_time": "1:50:12", "remaining_time": "0:41:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3970, "total_steps": 5463, "loss": 0.2541, "learning_rate": 1.0554631498758943e-05, "epoch": 2.179223274324139, "percentage": 72.67, "elapsed_time": "1:50:29", "remaining_time": "0:41:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3980, "total_steps": 5463, "loss": 0.2053, "learning_rate": 1.0424533372077803e-05, "epoch": 2.1847125017153837, "percentage": 72.85, "elapsed_time": "1:50:45", "remaining_time": "0:41:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 3990, "total_steps": 5463, "loss": 0.214, "learning_rate": 1.029503049208293e-05, "epoch": 2.1902017291066285, "percentage": 73.04, "elapsed_time": "1:51:02", "remaining_time": "0:40:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4000, "total_steps": 5463, "loss": 0.2133, "learning_rate": 1.0166128147535352e-05, "epoch": 2.195690956497873, "percentage": 73.22, "elapsed_time": "1:51:19", "remaining_time": "0:40:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4010, "total_steps": 5463, "loss": 0.2233, "learning_rate": 1.003783160267091e-05, "epoch": 2.2011801838891176, "percentage": 73.4, "elapsed_time": "1:51:38", "remaining_time": "0:40:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4020, "total_steps": 5463, "loss": 0.2389, "learning_rate": 9.91014609698519e-06, "epoch": 2.2066694112803624, "percentage": 73.59, "elapsed_time": "1:51:55", "remaining_time": "0:40:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4030, "total_steps": 5463, "loss": 0.2297, "learning_rate": 9.783076845019598e-06, "epoch": 2.212158638671607, "percentage": 73.77, "elapsed_time": "1:52:12", "remaining_time": "0:39:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4040, "total_steps": 5463, "loss": 0.2519, "learning_rate": 9.656629036148365e-06, "epoch": 2.2176478660628516, "percentage": 73.95, "elapsed_time": "1:52:28", "remaining_time": "0:39:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4050, "total_steps": 5463, "loss": 0.2416, "learning_rate": 9.530807834366658e-06, "epoch": 2.2231370934540964, "percentage": 74.14, "elapsed_time": "1:52:45", "remaining_time": "0:39:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4060, "total_steps": 5463, "loss": 0.238, "learning_rate": 9.405618378079686e-06, "epoch": 2.228626320845341, "percentage": 74.32, "elapsed_time": "1:53:01", "remaining_time": "0:39:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4070, "total_steps": 5463, "loss": 0.2165, "learning_rate": 9.281065779892826e-06, "epoch": 2.2341155482365855, "percentage": 74.5, "elapsed_time": "1:53:18", "remaining_time": "0:38:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4080, "total_steps": 5463, "loss": 0.2539, "learning_rate": 9.15715512640282e-06, "epoch": 2.2396047756278303, "percentage": 74.68, "elapsed_time": "1:53:35", "remaining_time": "0:38:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4090, "total_steps": 5463, "loss": 0.2392, "learning_rate": 9.033891477990091e-06, "epoch": 2.245094003019075, "percentage": 74.87, "elapsed_time": "1:53:51", "remaining_time": "0:38:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4100, "total_steps": 5463, "loss": 0.2507, "learning_rate": 8.923511544874787e-06, "epoch": 2.25058323041032, "percentage": 75.05, "elapsed_time": "1:54:08", "remaining_time": "0:37:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4110, "total_steps": 5463, "loss": 0.2205, "learning_rate": 8.801491052657259e-06, "epoch": 2.2560724578015643, "percentage": 75.23, "elapsed_time": "1:54:24", "remaining_time": "0:37:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4120, "total_steps": 5463, "loss": 0.2189, "learning_rate": 8.680132090462712e-06, "epoch": 2.261561685192809, "percentage": 75.42, "elapsed_time": "1:54:41", "remaining_time": "0:37:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4130, "total_steps": 5463, "loss": 0.2573, "learning_rate": 8.559439614463177e-06, "epoch": 2.267050912584054, "percentage": 75.6, "elapsed_time": "1:54:57", "remaining_time": "0:37:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4140, "total_steps": 5463, "loss": 0.2464, "learning_rate": 8.439418553612105e-06, "epoch": 2.2725401399752982, "percentage": 75.78, "elapsed_time": "1:55:14", "remaining_time": "0:36:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4150, "total_steps": 5463, "loss": 0.236, "learning_rate": 8.320073809443024e-06, "epoch": 2.278029367366543, "percentage": 75.97, "elapsed_time": "1:55:30", "remaining_time": "0:36:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4160, "total_steps": 5463, "loss": 0.2596, "learning_rate": 8.201410255869458e-06, "epoch": 2.283518594757788, "percentage": 76.15, "elapsed_time": "1:55:47", "remaining_time": "0:36:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4170, "total_steps": 5463, "loss": 0.2233, "learning_rate": 8.083432738985782e-06, "epoch": 2.2890078221490326, "percentage": 76.33, "elapsed_time": "1:56:04", "remaining_time": "0:35:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4180, "total_steps": 5463, "loss": 0.223, "learning_rate": 7.966146076869386e-06, "epoch": 2.2944970495402774, "percentage": 76.51, "elapsed_time": "1:56:21", "remaining_time": "0:35:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4190, "total_steps": 5463, "loss": 0.2236, "learning_rate": 7.849555059383839e-06, "epoch": 2.299986276931522, "percentage": 76.7, "elapsed_time": "1:56:38", "remaining_time": "0:35:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4200, "total_steps": 5463, "loss": 0.2509, "learning_rate": 7.733664447983349e-06, "epoch": 2.3054755043227666, "percentage": 76.88, "elapsed_time": "1:56:54", "remaining_time": "0:35:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4210, "total_steps": 5463, "loss": 0.2373, "learning_rate": 7.618478975518292e-06, "epoch": 2.3109647317140114, "percentage": 77.06, "elapsed_time": "1:57:11", "remaining_time": "0:34:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4220, "total_steps": 5463, "loss": 0.2404, "learning_rate": 7.504003346041871e-06, "epoch": 2.3164539591052558, "percentage": 77.25, "elapsed_time": "1:57:28", "remaining_time": "0:34:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4230, "total_steps": 5463, "loss": 0.1858, "learning_rate": 7.390242234618075e-06, "epoch": 2.3219431864965006, "percentage": 77.43, "elapsed_time": "1:57:44", "remaining_time": "0:34:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4240, "total_steps": 5463, "loss": 0.2595, "learning_rate": 7.277200287130728e-06, "epoch": 2.3274324138877454, "percentage": 77.61, "elapsed_time": "1:58:01", "remaining_time": "0:34:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4250, "total_steps": 5463, "loss": 0.2419, "learning_rate": 7.164882120093757e-06, "epoch": 2.33292164127899, "percentage": 77.8, "elapsed_time": "1:58:18", "remaining_time": "0:33:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4260, "total_steps": 5463, "loss": 0.256, "learning_rate": 7.053292320462654e-06, "epoch": 2.3384108686702345, "percentage": 77.98, "elapsed_time": "1:58:34", "remaining_time": "0:33:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4270, "total_steps": 5463, "loss": 0.2319, "learning_rate": 6.942435445447159e-06, "epoch": 2.3439000960614793, "percentage": 78.16, "elapsed_time": "1:58:51", "remaining_time": "0:33:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4280, "total_steps": 5463, "loss": 0.212, "learning_rate": 6.832316022325138e-06, "epoch": 2.349389323452724, "percentage": 78.35, "elapsed_time": "1:59:07", "remaining_time": "0:32:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4290, "total_steps": 5463, "loss": 0.2434, "learning_rate": 6.7229385482577065e-06, "epoch": 2.354878550843969, "percentage": 78.53, "elapsed_time": "1:59:24", "remaining_time": "0:32:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4300, "total_steps": 5463, "loss": 0.2644, "learning_rate": 6.614307490105557e-06, "epoch": 2.3603677782352133, "percentage": 78.71, "elapsed_time": "1:59:41", "remaining_time": "0:32:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4310, "total_steps": 5463, "loss": 0.2327, "learning_rate": 6.506427284246547e-06, "epoch": 2.365857005626458, "percentage": 78.89, "elapsed_time": "1:59:57", "remaining_time": "0:32:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4320, "total_steps": 5463, "loss": 0.2206, "learning_rate": 6.3993023363945165e-06, "epoch": 2.371346233017703, "percentage": 79.08, "elapsed_time": "2:00:14", "remaining_time": "0:31:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4330, "total_steps": 5463, "loss": 0.2736, "learning_rate": 6.2929370214193735e-06, "epoch": 2.376835460408947, "percentage": 79.26, "elapsed_time": "2:00:30", "remaining_time": "0:31:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4340, "total_steps": 5463, "loss": 0.2344, "learning_rate": 6.1873356831683884e-06, "epoch": 2.382324687800192, "percentage": 79.44, "elapsed_time": "2:00:47", "remaining_time": "0:31:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4350, "total_steps": 5463, "loss": 0.2019, "learning_rate": 6.082502634288873e-06, "epoch": 2.387813915191437, "percentage": 79.63, "elapsed_time": "2:01:04", "remaining_time": "0:30:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4360, "total_steps": 5463, "loss": 0.2289, "learning_rate": 5.978442156051986e-06, "epoch": 2.3933031425826816, "percentage": 79.81, "elapsed_time": "2:01:20", "remaining_time": "0:30:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4370, "total_steps": 5463, "loss": 0.2396, "learning_rate": 5.875158498177921e-06, "epoch": 2.3987923699739264, "percentage": 79.99, "elapsed_time": "2:01:37", "remaining_time": "0:30:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4380, "total_steps": 5463, "loss": 0.2531, "learning_rate": 5.772655878662339e-06, "epoch": 2.4042815973651708, "percentage": 80.18, "elapsed_time": "2:01:53", "remaining_time": "0:30:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4390, "total_steps": 5463, "loss": 0.2405, "learning_rate": 5.6709384836041184e-06, "epoch": 2.4097708247564156, "percentage": 80.36, "elapsed_time": "2:02:10", "remaining_time": "0:29:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4400, "total_steps": 5463, "loss": 0.2279, "learning_rate": 5.570010467034425e-06, "epoch": 2.4152600521476604, "percentage": 80.54, "elapsed_time": "2:02:27", "remaining_time": "0:29:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4410, "total_steps": 5463, "loss": 0.2081, "learning_rate": 5.469875950747016e-06, "epoch": 2.4207492795389047, "percentage": 80.72, "elapsed_time": "2:02:43", "remaining_time": "0:29:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4420, "total_steps": 5463, "loss": 0.2455, "learning_rate": 5.370539024129928e-06, "epoch": 2.4262385069301495, "percentage": 80.91, "elapsed_time": "2:03:00", "remaining_time": "0:29:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4430, "total_steps": 5463, "loss": 0.256, "learning_rate": 5.272003743998489e-06, "epoch": 2.4317277343213943, "percentage": 81.09, "elapsed_time": "2:03:16", "remaining_time": "0:28:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4440, "total_steps": 5463, "loss": 0.2481, "learning_rate": 5.1742741344296246e-06, "epoch": 2.437216961712639, "percentage": 81.27, "elapsed_time": "2:03:33", "remaining_time": "0:28:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4450, "total_steps": 5463, "loss": 0.2213, "learning_rate": 5.077354186597541e-06, "epoch": 2.4427061891038835, "percentage": 81.46, "elapsed_time": "2:03:50", "remaining_time": "0:28:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4460, "total_steps": 5463, "loss": 0.2064, "learning_rate": 4.981247858610688e-06, "epoch": 2.4481954164951283, "percentage": 81.64, "elapsed_time": "2:04:06", "remaining_time": "0:27:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4470, "total_steps": 5463, "loss": 0.2344, "learning_rate": 4.885959075350149e-06, "epoch": 2.453684643886373, "percentage": 81.82, "elapsed_time": "2:04:23", "remaining_time": "0:27:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4480, "total_steps": 5463, "loss": 0.2727, "learning_rate": 4.791491728309347e-06, "epoch": 2.459173871277618, "percentage": 82.01, "elapsed_time": "2:04:40", "remaining_time": "0:27:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4490, "total_steps": 5463, "loss": 0.2449, "learning_rate": 4.697849675435112e-06, "epoch": 2.4646630986688622, "percentage": 82.19, "elapsed_time": "2:04:56", "remaining_time": "0:27:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4500, "total_steps": 5463, "loss": 0.2228, "learning_rate": 4.605036740970134e-06, "epoch": 2.470152326060107, "percentage": 82.37, "elapsed_time": "2:05:13", "remaining_time": "0:26:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4510, "total_steps": 5463, "loss": 0.2399, "learning_rate": 4.513056715296773e-06, "epoch": 2.475641553451352, "percentage": 82.56, "elapsed_time": "2:05:31", "remaining_time": "0:26:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4520, "total_steps": 5463, "loss": 0.2133, "learning_rate": 4.4219133547822865e-06, "epoch": 2.481130780842596, "percentage": 82.74, "elapsed_time": "2:05:49", "remaining_time": "0:26:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4530, "total_steps": 5463, "loss": 0.2318, "learning_rate": 4.331610381625395e-06, "epoch": 2.486620008233841, "percentage": 82.92, "elapsed_time": "2:06:07", "remaining_time": "0:25:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4540, "total_steps": 5463, "loss": 0.2393, "learning_rate": 4.242151483704293e-06, "epoch": 2.492109235625086, "percentage": 83.1, "elapsed_time": "2:06:25", "remaining_time": "0:25:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4550, "total_steps": 5463, "loss": 0.2343, "learning_rate": 4.153540314426033e-06, "epoch": 2.4975984630163306, "percentage": 83.29, "elapsed_time": "2:06:44", "remaining_time": "0:25:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4560, "total_steps": 5463, "loss": 0.2608, "learning_rate": 4.065780492577326e-06, "epoch": 2.5030876904075754, "percentage": 83.47, "elapsed_time": "2:07:04", "remaining_time": "0:25:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4570, "total_steps": 5463, "loss": 0.2401, "learning_rate": 3.978875602176726e-06, "epoch": 2.5085769177988197, "percentage": 83.65, "elapsed_time": "2:07:21", "remaining_time": "0:24:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4580, "total_steps": 5463, "loss": 0.2381, "learning_rate": 3.892829192328337e-06, "epoch": 2.5140661451900645, "percentage": 83.84, "elapsed_time": "2:07:38", "remaining_time": "0:24:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4590, "total_steps": 5463, "loss": 0.2712, "learning_rate": 3.8076447770767796e-06, "epoch": 2.5195553725813093, "percentage": 84.02, "elapsed_time": "2:07:54", "remaining_time": "0:24:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4600, "total_steps": 5463, "loss": 0.2162, "learning_rate": 3.7233258352637553e-06, "epoch": 2.5250445999725537, "percentage": 84.2, "elapsed_time": "2:08:12", "remaining_time": "0:24:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4610, "total_steps": 5463, "loss": 0.208, "learning_rate": 3.6398758103859067e-06, "epoch": 2.5305338273637985, "percentage": 84.39, "elapsed_time": "2:08:29", "remaining_time": "0:23:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4620, "total_steps": 5463, "loss": 0.2231, "learning_rate": 3.557298110454252e-06, "epoch": 2.5360230547550433, "percentage": 84.57, "elapsed_time": "2:08:45", "remaining_time": "0:23:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4630, "total_steps": 5463, "loss": 0.2359, "learning_rate": 3.475596107854981e-06, "epoch": 2.5415122821462877, "percentage": 84.75, "elapsed_time": "2:09:02", "remaining_time": "0:23:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4640, "total_steps": 5463, "loss": 0.2268, "learning_rate": 3.3947731392117237e-06, "epoch": 2.5470015095375325, "percentage": 84.94, "elapsed_time": "2:09:18", "remaining_time": "0:22:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4650, "total_steps": 5463, "loss": 0.2382, "learning_rate": 3.3148325052492713e-06, "epoch": 2.5524907369287773, "percentage": 85.12, "elapsed_time": "2:09:35", "remaining_time": "0:22:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4660, "total_steps": 5463, "loss": 0.2364, "learning_rate": 3.2357774706588157e-06, "epoch": 2.557979964320022, "percentage": 85.3, "elapsed_time": "2:09:52", "remaining_time": "0:22:22", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4670, "total_steps": 5463, "loss": 0.2379, "learning_rate": 3.1576112639646023e-06, "epoch": 2.563469191711267, "percentage": 85.48, "elapsed_time": "2:10:08", "remaining_time": "0:22:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4680, "total_steps": 5463, "loss": 0.2012, "learning_rate": 3.08033707739209e-06, "epoch": 2.568958419102511, "percentage": 85.67, "elapsed_time": "2:10:24", "remaining_time": "0:21:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4690, "total_steps": 5463, "loss": 0.2019, "learning_rate": 3.0039580667375557e-06, "epoch": 2.574447646493756, "percentage": 85.85, "elapsed_time": "2:10:41", "remaining_time": "0:21:32", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4700, "total_steps": 5463, "loss": 0.2565, "learning_rate": 2.9284773512392475e-06, "epoch": 2.579936873885001, "percentage": 86.03, "elapsed_time": "2:10:58", "remaining_time": "0:21:15", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4710, "total_steps": 5463, "loss": 0.2254, "learning_rate": 2.8538980134499958e-06, "epoch": 2.585426101276245, "percentage": 86.22, "elapsed_time": "2:11:14", "remaining_time": "0:20:58", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4720, "total_steps": 5463, "loss": 0.2505, "learning_rate": 2.780223099111298e-06, "epoch": 2.59091532866749, "percentage": 86.4, "elapsed_time": "2:11:31", "remaining_time": "0:20:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4730, "total_steps": 5463, "loss": 0.1887, "learning_rate": 2.7074556170289674e-06, "epoch": 2.5964045560587348, "percentage": 86.58, "elapsed_time": "2:11:47", "remaining_time": "0:20:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4740, "total_steps": 5463, "loss": 0.1995, "learning_rate": 2.6355985389502293e-06, "epoch": 2.6018937834499796, "percentage": 86.77, "elapsed_time": "2:12:04", "remaining_time": "0:20:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4750, "total_steps": 5463, "loss": 0.2527, "learning_rate": 2.5646547994423784e-06, "epoch": 2.6073830108412244, "percentage": 86.95, "elapsed_time": "2:12:20", "remaining_time": "0:19:51", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4760, "total_steps": 5463, "loss": 0.2007, "learning_rate": 2.4946272957729165e-06, "epoch": 2.6128722382324687, "percentage": 87.13, "elapsed_time": "2:12:37", "remaining_time": "0:19:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4770, "total_steps": 5463, "loss": 0.2044, "learning_rate": 2.4255188877912477e-06, "epoch": 2.6183614656237135, "percentage": 87.31, "elapsed_time": "2:12:54", "remaining_time": "0:19:18", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4780, "total_steps": 5463, "loss": 0.2825, "learning_rate": 2.3573323978118705e-06, "epoch": 2.6238506930149583, "percentage": 87.5, "elapsed_time": "2:13:10", "remaining_time": "0:19:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4790, "total_steps": 5463, "loss": 0.209, "learning_rate": 2.29007061049914e-06, "epoch": 2.6293399204062027, "percentage": 87.68, "elapsed_time": "2:13:27", "remaining_time": "0:18:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4800, "total_steps": 5463, "loss": 0.2069, "learning_rate": 2.2237362727535043e-06, "epoch": 2.6348291477974475, "percentage": 87.86, "elapsed_time": "2:13:43", "remaining_time": "0:18:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4810, "total_steps": 5463, "loss": 0.2606, "learning_rate": 2.1583320935993605e-06, "epoch": 2.6403183751886923, "percentage": 88.05, "elapsed_time": "2:14:00", "remaining_time": "0:18:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4820, "total_steps": 5463, "loss": 0.2235, "learning_rate": 2.0938607440744274e-06, "epoch": 2.6458076025799366, "percentage": 88.23, "elapsed_time": "2:14:16", "remaining_time": "0:17:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4830, "total_steps": 5463, "loss": 0.2454, "learning_rate": 2.0303248571206244e-06, "epoch": 2.6512968299711814, "percentage": 88.41, "elapsed_time": "2:14:33", "remaining_time": "0:17:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4840, "total_steps": 5463, "loss": 0.1998, "learning_rate": 1.967727027476568e-06, "epoch": 2.6567860573624262, "percentage": 88.6, "elapsed_time": "2:14:51", "remaining_time": "0:17:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4850, "total_steps": 5463, "loss": 0.2377, "learning_rate": 1.9060698115716063e-06, "epoch": 2.662275284753671, "percentage": 88.78, "elapsed_time": "2:15:07", "remaining_time": "0:17:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4860, "total_steps": 5463, "loss": 0.2288, "learning_rate": 1.8453557274214162e-06, "epoch": 2.667764512144916, "percentage": 88.96, "elapsed_time": "2:15:24", "remaining_time": "0:16:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4870, "total_steps": 5463, "loss": 0.2419, "learning_rate": 1.7855872545251757e-06, "epoch": 2.67325373953616, "percentage": 89.15, "elapsed_time": "2:15:40", "remaining_time": "0:16:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4880, "total_steps": 5463, "loss": 0.222, "learning_rate": 1.7267668337642761e-06, "epoch": 2.678742966927405, "percentage": 89.33, "elapsed_time": "2:15:57", "remaining_time": "0:16:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4890, "total_steps": 5463, "loss": 0.1913, "learning_rate": 1.6688968673026773e-06, "epoch": 2.68423219431865, "percentage": 89.51, "elapsed_time": "2:16:14", "remaining_time": "0:15:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4900, "total_steps": 5463, "loss": 0.1905, "learning_rate": 1.6119797184887792e-06, "epoch": 2.689721421709894, "percentage": 89.69, "elapsed_time": "2:16:31", "remaining_time": "0:15:41", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4910, "total_steps": 5463, "loss": 0.1978, "learning_rate": 1.5560177117589197e-06, "epoch": 2.695210649101139, "percentage": 89.88, "elapsed_time": "2:16:48", "remaining_time": "0:15:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4920, "total_steps": 5463, "loss": 0.2575, "learning_rate": 1.5010131325424337e-06, "epoch": 2.7006998764923837, "percentage": 90.06, "elapsed_time": "2:17:04", "remaining_time": "0:15:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4930, "total_steps": 5463, "loss": 0.215, "learning_rate": 1.4469682271683327e-06, "epoch": 2.7061891038836285, "percentage": 90.24, "elapsed_time": "2:17:21", "remaining_time": "0:14:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4940, "total_steps": 5463, "loss": 0.2259, "learning_rate": 1.3938852027735594e-06, "epoch": 2.711678331274873, "percentage": 90.43, "elapsed_time": "2:17:37", "remaining_time": "0:14:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4950, "total_steps": 5463, "loss": 0.2514, "learning_rate": 1.3417662272128484e-06, "epoch": 2.7171675586661177, "percentage": 90.61, "elapsed_time": "2:17:54", "remaining_time": "0:14:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4960, "total_steps": 5463, "loss": 0.2342, "learning_rate": 1.2906134289701998e-06, "epoch": 2.7226567860573625, "percentage": 90.79, "elapsed_time": "2:18:11", "remaining_time": "0:14:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4970, "total_steps": 5463, "loss": 0.2273, "learning_rate": 1.240428897071949e-06, "epoch": 2.7281460134486073, "percentage": 90.98, "elapsed_time": "2:18:28", "remaining_time": "0:13:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4980, "total_steps": 5463, "loss": 0.216, "learning_rate": 1.191214681001454e-06, "epoch": 2.7336352408398517, "percentage": 91.16, "elapsed_time": "2:18:44", "remaining_time": "0:13:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 4990, "total_steps": 5463, "loss": 0.2053, "learning_rate": 1.142972790615407e-06, "epoch": 2.7391244682310965, "percentage": 91.34, "elapsed_time": "2:19:01", "remaining_time": "0:13:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5000, "total_steps": 5463, "loss": 0.2265, "learning_rate": 1.095705196061722e-06, "epoch": 2.7446136956223413, "percentage": 91.52, "elapsed_time": "2:19:17", "remaining_time": "0:12:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5010, "total_steps": 5463, "loss": 0.1784, "learning_rate": 1.0494138276991278e-06, "epoch": 2.7501029230135856, "percentage": 91.71, "elapsed_time": "2:19:37", "remaining_time": "0:12:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5020, "total_steps": 5463, "loss": 0.1953, "learning_rate": 1.0041005760182853e-06, "epoch": 2.7555921504048304, "percentage": 91.89, "elapsed_time": "2:19:54", "remaining_time": "0:12:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5030, "total_steps": 5463, "loss": 0.2076, "learning_rate": 9.597672915646116e-07, "epoch": 2.761081377796075, "percentage": 92.07, "elapsed_time": "2:20:10", "remaining_time": "0:12:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5040, "total_steps": 5463, "loss": 0.2155, "learning_rate": 9.164157848626842e-07, "epoch": 2.76657060518732, "percentage": 92.26, "elapsed_time": "2:20:27", "remaining_time": "0:11:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5050, "total_steps": 5463, "loss": 0.2072, "learning_rate": 8.740478263423197e-07, "epoch": 2.772059832578565, "percentage": 92.44, "elapsed_time": "2:20:44", "remaining_time": "0:11:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5060, "total_steps": 5463, "loss": 0.2314, "learning_rate": 8.32665146266276e-07, "epoch": 2.777549059969809, "percentage": 92.62, "elapsed_time": "2:21:01", "remaining_time": "0:11:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5070, "total_steps": 5463, "loss": 0.2297, "learning_rate": 7.922694346595511e-07, "epoch": 2.783038287361054, "percentage": 92.81, "elapsed_time": "2:21:17", "remaining_time": "0:10:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5080, "total_steps": 5463, "loss": 0.214, "learning_rate": 7.528623412404179e-07, "epoch": 2.7885275147522988, "percentage": 92.99, "elapsed_time": "2:21:34", "remaining_time": "0:10:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5090, "total_steps": 5463, "loss": 0.2173, "learning_rate": 7.144454753530067e-07, "epoch": 2.794016742143543, "percentage": 93.17, "elapsed_time": "2:21:51", "remaining_time": "0:10:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5100, "total_steps": 5463, "loss": 0.2012, "learning_rate": 6.770204059016127e-07, "epoch": 2.799505969534788, "percentage": 93.36, "elapsed_time": "2:22:07", "remaining_time": "0:10:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5110, "total_steps": 5463, "loss": 0.224, "learning_rate": 6.405886612866036e-07, "epoch": 2.8049951969260327, "percentage": 93.54, "elapsed_time": "2:22:24", "remaining_time": "0:09:50", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5120, "total_steps": 5463, "loss": 0.1893, "learning_rate": 6.051517293420101e-07, "epoch": 2.810484424317277, "percentage": 93.72, "elapsed_time": "2:22:40", "remaining_time": "0:09:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5130, "total_steps": 5463, "loss": 0.2351, "learning_rate": 5.707110572747587e-07, "epoch": 2.815973651708522, "percentage": 93.9, "elapsed_time": "2:22:59", "remaining_time": "0:09:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5140, "total_steps": 5463, "loss": 0.2541, "learning_rate": 5.3726805160558e-07, "epoch": 2.8214628790997667, "percentage": 94.09, "elapsed_time": "2:23:19", "remaining_time": "0:09:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5150, "total_steps": 5463, "loss": 0.2351, "learning_rate": 5.048240781115571e-07, "epoch": 2.8269521064910115, "percentage": 94.27, "elapsed_time": "2:23:38", "remaining_time": "0:08:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5160, "total_steps": 5463, "loss": 0.245, "learning_rate": 4.7338046177035354e-07, "epoch": 2.8324413338822563, "percentage": 94.45, "elapsed_time": "2:23:57", "remaining_time": "0:08:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5170, "total_steps": 5463, "loss": 0.2444, "learning_rate": 4.429384867061015e-07, "epoch": 2.8379305612735006, "percentage": 94.64, "elapsed_time": "2:24:15", "remaining_time": "0:08:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5180, "total_steps": 5463, "loss": 0.2354, "learning_rate": 4.1349939613695434e-07, "epoch": 2.8434197886647454, "percentage": 94.82, "elapsed_time": "2:24:33", "remaining_time": "0:07:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5190, "total_steps": 5463, "loss": 0.2086, "learning_rate": 3.85064392324333e-07, "epoch": 2.8489090160559902, "percentage": 95.0, "elapsed_time": "2:24:51", "remaining_time": "0:07:37", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5200, "total_steps": 5463, "loss": 0.2329, "learning_rate": 3.5763463652380146e-07, "epoch": 2.8543982434472346, "percentage": 95.19, "elapsed_time": "2:25:09", "remaining_time": "0:07:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5210, "total_steps": 5463, "loss": 0.1665, "learning_rate": 3.3121124893766287e-07, "epoch": 2.8598874708384794, "percentage": 95.37, "elapsed_time": "2:25:26", "remaining_time": "0:07:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5220, "total_steps": 5463, "loss": 0.2444, "learning_rate": 3.057953086692017e-07, "epoch": 2.865376698229724, "percentage": 95.55, "elapsed_time": "2:25:44", "remaining_time": "0:06:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5230, "total_steps": 5463, "loss": 0.2303, "learning_rate": 2.8138785367860796e-07, "epoch": 2.870865925620969, "percentage": 95.73, "elapsed_time": "2:26:02", "remaining_time": "0:06:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5240, "total_steps": 5463, "loss": 0.2274, "learning_rate": 2.5798988074061394e-07, "epoch": 2.876355153012214, "percentage": 95.92, "elapsed_time": "2:26:21", "remaining_time": "0:06:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5250, "total_steps": 5463, "loss": 0.1995, "learning_rate": 2.3560234540375424e-07, "epoch": 2.881844380403458, "percentage": 96.1, "elapsed_time": "2:26:37", "remaining_time": "0:05:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5260, "total_steps": 5463, "loss": 0.2002, "learning_rate": 2.1422616195136692e-07, "epoch": 2.887333607794703, "percentage": 96.28, "elapsed_time": "2:26:54", "remaining_time": "0:05:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5270, "total_steps": 5463, "loss": 0.1811, "learning_rate": 1.9386220336423678e-07, "epoch": 2.8928228351859477, "percentage": 96.47, "elapsed_time": "2:27:11", "remaining_time": "0:05:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5280, "total_steps": 5463, "loss": 0.2376, "learning_rate": 1.7451130128495753e-07, "epoch": 2.898312062577192, "percentage": 96.65, "elapsed_time": "2:27:27", "remaining_time": "0:05:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5290, "total_steps": 5463, "loss": 0.236, "learning_rate": 1.5617424598396712e-07, "epoch": 2.903801289968437, "percentage": 96.83, "elapsed_time": "2:27:44", "remaining_time": "0:04:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5300, "total_steps": 5463, "loss": 0.208, "learning_rate": 1.3885178632726536e-07, "epoch": 2.9092905173596817, "percentage": 97.02, "elapsed_time": "2:28:01", "remaining_time": "0:04:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5310, "total_steps": 5463, "loss": 0.2124, "learning_rate": 1.225446297458327e-07, "epoch": 2.914779744750926, "percentage": 97.2, "elapsed_time": "2:28:17", "remaining_time": "0:04:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5320, "total_steps": 5463, "loss": 0.1983, "learning_rate": 1.0725344220675337e-07, "epoch": 2.920268972142171, "percentage": 97.38, "elapsed_time": "2:28:34", "remaining_time": "0:03:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5330, "total_steps": 5463, "loss": 0.2173, "learning_rate": 9.297884818599556e-08, "epoch": 2.9257581995334156, "percentage": 97.57, "elapsed_time": "2:28:50", "remaining_time": "0:03:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5340, "total_steps": 5463, "loss": 0.182, "learning_rate": 7.972143064292892e-08, "epoch": 2.9312474269246604, "percentage": 97.75, "elapsed_time": "2:29:07", "remaining_time": "0:03:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5350, "total_steps": 5463, "loss": 0.1871, "learning_rate": 6.748173099650202e-08, "epoch": 2.9367366543159052, "percentage": 97.93, "elapsed_time": "2:29:23", "remaining_time": "0:03:09", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5360, "total_steps": 5463, "loss": 0.1989, "learning_rate": 5.626024910314609e-08, "epoch": 2.9422258817071496, "percentage": 98.11, "elapsed_time": "2:29:40", "remaining_time": "0:02:52", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5370, "total_steps": 5463, "loss": 0.2186, "learning_rate": 4.605744323634142e-08, "epoch": 2.9477151090983944, "percentage": 98.3, "elapsed_time": "2:29:56", "remaining_time": "0:02:35", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5380, "total_steps": 5463, "loss": 0.2124, "learning_rate": 3.687373006792394e-08, "epoch": 2.953204336489639, "percentage": 98.48, "elapsed_time": "2:30:13", "remaining_time": "0:02:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5390, "total_steps": 5463, "loss": 0.2145, "learning_rate": 2.870948465105161e-08, "epoch": 2.9586935638808836, "percentage": 98.66, "elapsed_time": "2:30:29", "remaining_time": "0:02:02", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5400, "total_steps": 5463, "loss": 0.22, "learning_rate": 2.1565040404902813e-08, "epoch": 2.9641827912721284, "percentage": 98.85, "elapsed_time": "2:30:46", "remaining_time": "0:01:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5410, "total_steps": 5463, "loss": 0.218, "learning_rate": 1.544068910104002e-08, "epoch": 2.969672018663373, "percentage": 99.03, "elapsed_time": "2:31:02", "remaining_time": "0:01:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5420, "total_steps": 5463, "loss": 0.257, "learning_rate": 1.0336680851516512e-08, "epoch": 2.975161246054618, "percentage": 99.21, "elapsed_time": "2:31:18", "remaining_time": "0:01:12", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5430, "total_steps": 5463, "loss": 0.2193, "learning_rate": 6.2532240986457044e-09, "epoch": 2.9806504734458628, "percentage": 99.4, "elapsed_time": "2:31:35", "remaining_time": "0:00:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5440, "total_steps": 5463, "loss": 0.2392, "learning_rate": 3.1904856064940424e-09, "epoch": 2.986139700837107, "percentage": 99.58, "elapsed_time": "2:31:51", "remaining_time": "0:00:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5450, "total_steps": 5463, "loss": 0.2137, "learning_rate": 1.1485904540697867e-09, "epoch": 2.991628928228352, "percentage": 99.76, "elapsed_time": "2:32:07", "remaining_time": "0:00:21", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5460, "total_steps": 5463, "loss": 0.2132, "learning_rate": 1.276220302215414e-10, "epoch": 2.9971181556195967, "percentage": 99.95, "elapsed_time": "2:32:24", "remaining_time": "0:00:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 5463, "total_steps": 5463, "epoch": 2.99876492383697, "percentage": 100.0, "elapsed_time": "2:32:29", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}