{"current_steps": 5, "total_steps": 350, "loss": 0.9693, "learning_rate": 1.4285714285714285e-05, "epoch": 0.028429282160625444, "percentage": 1.43, "elapsed_time": "0:04:05", "remaining_time": "4:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 350, "loss": 0.7795, "learning_rate": 2.857142857142857e-05, "epoch": 0.05685856432125089, "percentage": 2.86, "elapsed_time": "0:08:13", "remaining_time": "4:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 350, "loss": 0.4535, "learning_rate": 4.2857142857142856e-05, "epoch": 0.08528784648187633, "percentage": 4.29, "elapsed_time": "0:12:20", "remaining_time": "4:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 350, "loss": 0.4519, "learning_rate": 5.714285714285714e-05, "epoch": 0.11371712864250177, "percentage": 5.71, "elapsed_time": "0:16:28", "remaining_time": "4:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 350, "loss": 0.4128, "learning_rate": 7.142857142857143e-05, "epoch": 0.14214641080312723, "percentage": 7.14, "elapsed_time": "0:20:36", "remaining_time": "4:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 350, "loss": 0.3446, "learning_rate": 8.571428571428571e-05, "epoch": 0.17057569296375266, "percentage": 8.57, "elapsed_time": "0:24:45", "remaining_time": "4:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 350, "loss": 0.3253, "learning_rate": 0.0001, "epoch": 0.19900497512437812, "percentage": 10.0, "elapsed_time": "0:28:52", "remaining_time": "4:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 350, "eval_loss": 0.28751906752586365, "epoch": 0.19900497512437812, "percentage": 10.0, "elapsed_time": "0:32:52", "remaining_time": "4:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 350, "loss": 0.3065, "learning_rate": 9.993784606094612e-05, "epoch": 0.22743425728500355, "percentage": 11.43, "elapsed_time": "0:37:02", "remaining_time": "4:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 350, "loss": 0.302, "learning_rate": 9.975153876827008e-05, "epoch": 0.255863539445629, "percentage": 12.86, "elapsed_time": "0:41:10", "remaining_time": "4:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 350, "loss": 0.307, "learning_rate": 9.944154131125642e-05, "epoch": 0.28429282160625446, "percentage": 14.29, "elapsed_time": "0:45:18", "remaining_time": "4:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 350, "loss": 0.2908, "learning_rate": 9.900862439242719e-05, "epoch": 0.31272210376687987, "percentage": 15.71, "elapsed_time": "0:49:27", "remaining_time": "4:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 350, "loss": 0.3112, "learning_rate": 9.84538643114539e-05, "epoch": 0.3411513859275053, "percentage": 17.14, "elapsed_time": "0:53:36", "remaining_time": "4:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 350, "loss": 0.2596, "learning_rate": 9.777864028930705e-05, "epoch": 0.3695806680881308, "percentage": 18.57, "elapsed_time": "0:57:43", "remaining_time": "4:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 350, "loss": 0.2868, "learning_rate": 9.698463103929542e-05, "epoch": 0.39800995024875624, "percentage": 20.0, "elapsed_time": "1:01:50", "remaining_time": "4:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 350, "eval_loss": 0.2600123882293701, "epoch": 0.39800995024875624, "percentage": 20.0, "elapsed_time": "1:05:51", "remaining_time": "4:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 350, "loss": 0.2763, "learning_rate": 9.607381059352038e-05, "epoch": 0.42643923240938164, "percentage": 21.43, "elapsed_time": "1:10:00", "remaining_time": "4:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 350, "loss": 0.254, "learning_rate": 9.504844339512095e-05, "epoch": 0.4548685145700071, "percentage": 22.86, "elapsed_time": "1:14:10", "remaining_time": "4:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 350, "loss": 0.2834, "learning_rate": 9.391107866851143e-05, "epoch": 0.48329779673063256, "percentage": 24.29, "elapsed_time": "1:18:18", "remaining_time": "4:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 350, "loss": 0.2509, "learning_rate": 9.266454408160779e-05, "epoch": 0.511727078891258, "percentage": 25.71, "elapsed_time": "1:22:26", "remaining_time": "3:58:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 350, "loss": 0.266, "learning_rate": 9.131193871579975e-05, "epoch": 0.5401563610518835, "percentage": 27.14, "elapsed_time": "1:26:34", "remaining_time": "3:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 350, "loss": 0.2562, "learning_rate": 8.985662536114613e-05, "epoch": 0.5685856432125089, "percentage": 28.57, "elapsed_time": "1:30:42", "remaining_time": "3:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 350, "loss": 0.2583, "learning_rate": 8.83022221559489e-05, "epoch": 0.5970149253731343, "percentage": 30.0, "elapsed_time": "1:34:49", "remaining_time": "3:41:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 350, "eval_loss": 0.25079870223999023, "epoch": 0.5970149253731343, "percentage": 30.0, "elapsed_time": "1:38:49", "remaining_time": "3:50:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 350, "loss": 0.2529, "learning_rate": 8.665259359149132e-05, "epoch": 0.6254442075337597, "percentage": 31.43, "elapsed_time": "1:42:59", "remaining_time": "3:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 350, "loss": 0.2482, "learning_rate": 8.491184090430364e-05, "epoch": 0.6538734896943852, "percentage": 32.86, "elapsed_time": "1:47:07", "remaining_time": "3:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 350, "loss": 0.244, "learning_rate": 8.308429187984297e-05, "epoch": 0.6823027718550106, "percentage": 34.29, "elapsed_time": "1:51:16", "remaining_time": "3:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 350, "loss": 0.2453, "learning_rate": 8.117449009293668e-05, "epoch": 0.7107320540156361, "percentage": 35.71, "elapsed_time": "1:55:23", "remaining_time": "3:27:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 350, "loss": 0.2451, "learning_rate": 7.91871836117395e-05, "epoch": 0.7391613361762616, "percentage": 37.14, "elapsed_time": "1:59:33", "remaining_time": "3:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 350, "loss": 0.2749, "learning_rate": 7.712731319328798e-05, "epoch": 0.767590618336887, "percentage": 38.57, "elapsed_time": "2:03:41", "remaining_time": "3:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 350, "loss": 0.2559, "learning_rate": 7.500000000000001e-05, "epoch": 0.7960199004975125, "percentage": 40.0, "elapsed_time": "2:07:51", "remaining_time": "3:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 350, "eval_loss": 0.2278721183538437, "epoch": 0.7960199004975125, "percentage": 40.0, "elapsed_time": "2:11:50", "remaining_time": "3:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 350, "loss": 0.2483, "learning_rate": 7.281053286765815e-05, "epoch": 0.8244491826581379, "percentage": 41.43, "elapsed_time": "2:15:59", "remaining_time": "3:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 350, "loss": 0.2666, "learning_rate": 7.056435515653059e-05, "epoch": 0.8528784648187633, "percentage": 42.86, "elapsed_time": "2:20:06", "remaining_time": "3:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 350, "loss": 0.2576, "learning_rate": 6.826705121831976e-05, "epoch": 0.8813077469793887, "percentage": 44.29, "elapsed_time": "2:24:15", "remaining_time": "3:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 350, "loss": 0.2552, "learning_rate": 6.592433251258423e-05, "epoch": 0.9097370291400142, "percentage": 45.71, "elapsed_time": "2:28:22", "remaining_time": "2:56:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 350, "loss": 0.2287, "learning_rate": 6.354202340715026e-05, "epoch": 0.9381663113006397, "percentage": 47.14, "elapsed_time": "2:32:29", "remaining_time": "2:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 350, "loss": 0.2469, "learning_rate": 6.112604669781572e-05, "epoch": 0.9665955934612651, "percentage": 48.57, "elapsed_time": "2:36:37", "remaining_time": "2:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 350, "loss": 0.2516, "learning_rate": 5.868240888334653e-05, "epoch": 0.9950248756218906, "percentage": 50.0, "elapsed_time": "2:40:47", "remaining_time": "2:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 350, "eval_loss": 0.22209325432777405, "epoch": 0.9950248756218906, "percentage": 50.0, "elapsed_time": "2:44:46", "remaining_time": "2:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 350, "loss": 0.2339, "learning_rate": 5.621718523237427e-05, "epoch": 1.023454157782516, "percentage": 51.43, "elapsed_time": "2:48:50", "remaining_time": "2:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 350, "loss": 0.2192, "learning_rate": 5.373650467932122e-05, "epoch": 1.0518834399431414, "percentage": 52.86, "elapsed_time": "2:52:59", "remaining_time": "2:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 350, "loss": 0.2306, "learning_rate": 5.124653458690365e-05, "epoch": 1.080312722103767, "percentage": 54.29, "elapsed_time": "2:57:08", "remaining_time": "2:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 350, "loss": 0.213, "learning_rate": 4.875346541309637e-05, "epoch": 1.1087420042643923, "percentage": 55.71, "elapsed_time": "3:01:16", "remaining_time": "2:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 350, "loss": 0.2306, "learning_rate": 4.626349532067879e-05, "epoch": 1.1371712864250179, "percentage": 57.14, "elapsed_time": "3:05:23", "remaining_time": "2:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 350, "loss": 0.2235, "learning_rate": 4.378281476762576e-05, "epoch": 1.1656005685856432, "percentage": 58.57, "elapsed_time": "3:09:31", "remaining_time": "2:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 350, "loss": 0.2086, "learning_rate": 4.131759111665349e-05, "epoch": 1.1940298507462686, "percentage": 60.0, "elapsed_time": "3:13:39", "remaining_time": "2:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 350, "eval_loss": 0.22708775103092194, "epoch": 1.1940298507462686, "percentage": 60.0, "elapsed_time": "3:17:38", "remaining_time": "2:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 350, "loss": 0.2027, "learning_rate": 3.887395330218429e-05, "epoch": 1.2224591329068941, "percentage": 61.43, "elapsed_time": "3:21:46", "remaining_time": "2:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 350, "loss": 0.1961, "learning_rate": 3.6457976592849754e-05, "epoch": 1.2508884150675195, "percentage": 62.86, "elapsed_time": "3:25:55", "remaining_time": "2:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 350, "loss": 0.2274, "learning_rate": 3.4075667487415785e-05, "epoch": 1.279317697228145, "percentage": 64.29, "elapsed_time": "3:30:02", "remaining_time": "1:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 350, "loss": 0.215, "learning_rate": 3.173294878168025e-05, "epoch": 1.3077469793887704, "percentage": 65.71, "elapsed_time": "3:34:09", "remaining_time": "1:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 350, "loss": 0.2164, "learning_rate": 2.9435644843469436e-05, "epoch": 1.336176261549396, "percentage": 67.14, "elapsed_time": "3:38:18", "remaining_time": "1:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 350, "loss": 0.2213, "learning_rate": 2.718946713234185e-05, "epoch": 1.3646055437100213, "percentage": 68.57, "elapsed_time": "3:42:26", "remaining_time": "1:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 350, "loss": 0.238, "learning_rate": 2.500000000000001e-05, "epoch": 1.3930348258706466, "percentage": 70.0, "elapsed_time": "3:46:33", "remaining_time": "1:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 350, "eval_loss": 0.2183476835489273, "epoch": 1.3930348258706466, "percentage": 70.0, "elapsed_time": "3:50:33", "remaining_time": "1:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 350, "loss": 0.2179, "learning_rate": 2.2872686806712035e-05, "epoch": 1.4214641080312722, "percentage": 71.43, "elapsed_time": "3:54:42", "remaining_time": "1:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 350, "loss": 0.2057, "learning_rate": 2.0812816388260518e-05, "epoch": 1.4498933901918978, "percentage": 72.86, "elapsed_time": "3:58:49", "remaining_time": "1:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 350, "loss": 0.1965, "learning_rate": 1.8825509907063327e-05, "epoch": 1.4783226723525231, "percentage": 74.29, "elapsed_time": "4:02:57", "remaining_time": "1:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 350, "loss": 0.2171, "learning_rate": 1.691570812015704e-05, "epoch": 1.5067519545131485, "percentage": 75.71, "elapsed_time": "4:07:07", "remaining_time": "1:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 350, "loss": 0.2217, "learning_rate": 1.5088159095696363e-05, "epoch": 1.535181236673774, "percentage": 77.14, "elapsed_time": "4:11:15", "remaining_time": "1:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 350, "loss": 0.2035, "learning_rate": 1.3347406408508695e-05, "epoch": 1.5636105188343994, "percentage": 78.57, "elapsed_time": "4:15:22", "remaining_time": "1:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 350, "loss": 0.2176, "learning_rate": 1.1697777844051105e-05, "epoch": 1.5920398009950247, "percentage": 80.0, "elapsed_time": "4:19:29", "remaining_time": "1:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 350, "eval_loss": 0.22061596810817719, "epoch": 1.5920398009950247, "percentage": 80.0, "elapsed_time": "4:23:32", "remaining_time": "1:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 350, "loss": 0.2203, "learning_rate": 1.0143374638853891e-05, "epoch": 1.6204690831556503, "percentage": 81.43, "elapsed_time": "4:27:42", "remaining_time": "1:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 350, "loss": 0.2171, "learning_rate": 8.688061284200266e-06, "epoch": 1.6488983653162759, "percentage": 82.86, "elapsed_time": "4:31:49", "remaining_time": "0:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 350, "loss": 0.2009, "learning_rate": 7.33545591839222e-06, "epoch": 1.6773276474769012, "percentage": 84.29, "elapsed_time": "4:35:57", "remaining_time": "0:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 350, "loss": 0.2224, "learning_rate": 6.088921331488568e-06, "epoch": 1.7057569296375266, "percentage": 85.71, "elapsed_time": "4:40:06", "remaining_time": "0:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 350, "loss": 0.224, "learning_rate": 4.951556604879048e-06, "epoch": 1.7341862117981521, "percentage": 87.14, "elapsed_time": "4:44:13", "remaining_time": "0:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 350, "loss": 0.1882, "learning_rate": 3.9261894064796135e-06, "epoch": 1.7626154939587777, "percentage": 88.57, "elapsed_time": "4:48:22", "remaining_time": "0:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 350, "loss": 0.2022, "learning_rate": 3.0153689607045845e-06, "epoch": 1.7910447761194028, "percentage": 90.0, "elapsed_time": "4:52:31", "remaining_time": "0:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 350, "eval_loss": 0.22089815139770508, "epoch": 1.7910447761194028, "percentage": 90.0, "elapsed_time": "4:56:32", "remaining_time": "0:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 350, "loss": 0.1922, "learning_rate": 2.221359710692961e-06, "epoch": 1.8194740582800284, "percentage": 91.43, "elapsed_time": "5:00:41", "remaining_time": "0:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 350, "loss": 0.2081, "learning_rate": 1.5461356885461075e-06, "epoch": 1.847903340440654, "percentage": 92.86, "elapsed_time": "5:04:48", "remaining_time": "0:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 350, "loss": 0.2067, "learning_rate": 9.913756075728087e-07, "epoch": 1.8763326226012793, "percentage": 94.29, "elapsed_time": "5:08:56", "remaining_time": "0:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 350, "loss": 0.2221, "learning_rate": 5.584586887435739e-07, "epoch": 1.9047619047619047, "percentage": 95.71, "elapsed_time": "5:13:05", "remaining_time": "0:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 350, "loss": 0.2142, "learning_rate": 2.4846123172992954e-07, "epoch": 1.9331911869225302, "percentage": 97.14, "elapsed_time": "5:17:14", "remaining_time": "0:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 350, "loss": 0.2089, "learning_rate": 6.215393905388278e-08, "epoch": 1.9616204690831558, "percentage": 98.57, "elapsed_time": "5:21:22", "remaining_time": "0:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 350, "loss": 0.209, "learning_rate": 0.0, "epoch": 1.9900497512437811, "percentage": 100.0, "elapsed_time": "5:25:31", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 350, "eval_loss": 0.21909472346305847, "epoch": 1.9900497512437811, "percentage": 100.0, "elapsed_time": "5:29:32", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 350, "epoch": 1.9900497512437811, "percentage": 100.0, "elapsed_time": "5:29:33", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}