Boffl's picture
Upload trainer_log.jsonl with huggingface_hub
4d7e961 verified
raw
history blame
10.9 kB
{"current_steps": 10, "total_steps": 42, "loss": 1.7972, "learning_rate": 4.77807122597034e-05, "epoch": 0.23391812865497075, "percentage": 23.81, "elapsed_time": "0:02:04", "remaining_time": "0:06:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 20, "total_steps": 42, "loss": 1.6893, "learning_rate": 3.232056928191376e-05, "epoch": 0.4678362573099415, "percentage": 47.62, "elapsed_time": "0:04:09", "remaining_time": "0:04:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 30, "total_steps": 42, "loss": 1.6413, "learning_rate": 1.1892317911069212e-05, "epoch": 0.7017543859649122, "percentage": 71.43, "elapsed_time": "0:06:13", "remaining_time": "0:02:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 40, "total_steps": 42, "loss": 1.6134, "learning_rate": 8.066763266625282e-07, "epoch": 0.935672514619883, "percentage": 95.24, "elapsed_time": "0:08:17", "remaining_time": "0:00:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 42, "total_steps": 42, "epoch": 0.9824561403508771, "percentage": 100.0, "elapsed_time": "0:08:43", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 50, "total_steps": 126, "loss": 1.4769, "learning_rate": 3.848943205739711e-05, "epoch": 1.1871345029239766, "percentage": 39.68, "elapsed_time": "0:01:39", "remaining_time": "0:02:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 60, "total_steps": 126, "loss": 1.4539, "learning_rate": 3.219473788427984e-05, "epoch": 1.4210526315789473, "percentage": 47.62, "elapsed_time": "0:03:42", "remaining_time": "0:04:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 70, "total_steps": 126, "loss": 1.5344, "learning_rate": 2.604226177226137e-05, "epoch": 1.654970760233918, "percentage": 55.56, "elapsed_time": "0:05:45", "remaining_time": "0:04:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 80, "total_steps": 126, "loss": 1.4816, "learning_rate": 1.9146971351147655e-05, "epoch": 1.8888888888888888, "percentage": 63.49, "elapsed_time": "0:07:48", "remaining_time": "0:04:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 90, "total_steps": 126, "loss": 1.4132, "learning_rate": 1.270117540713368e-05, "epoch": 2.1228070175438596, "percentage": 71.43, "elapsed_time": "0:09:50", "remaining_time": "0:03:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 100, "total_steps": 126, "loss": 1.3255, "learning_rate": 7.1998911101617575e-06, "epoch": 2.3567251461988303, "percentage": 79.37, "elapsed_time": "0:11:53", "remaining_time": "0:03:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 110, "total_steps": 126, "loss": 1.3132, "learning_rate": 3.0656000602372558e-06, "epoch": 2.590643274853801, "percentage": 87.3, "elapsed_time": "0:13:56", "remaining_time": "0:02:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 120, "total_steps": 126, "loss": 1.3476, "learning_rate": 6.158030087068001e-07, "epoch": 2.824561403508772, "percentage": 95.24, "elapsed_time": "0:15:59", "remaining_time": "0:00:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 126, "total_steps": 126, "epoch": 2.9649122807017543, "percentage": 100.0, "elapsed_time": "0:17:15", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 130, "total_steps": 420, "loss": 1.1837, "learning_rate": 4.388136440446337e-05, "epoch": 3.0935672514619883, "percentage": 30.95, "elapsed_time": "0:00:50", "remaining_time": "0:01:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 140, "total_steps": 420, "loss": 1.3114, "learning_rate": 4.245592045215182e-05, "epoch": 3.327485380116959, "percentage": 33.33, "elapsed_time": "0:02:54", "remaining_time": "0:05:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 150, "total_steps": 420, "loss": 1.2437, "learning_rate": 4.0909970437009096e-05, "epoch": 3.56140350877193, "percentage": 35.71, "elapsed_time": "0:04:57", "remaining_time": "0:08:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 160, "total_steps": 420, "loss": 1.2936, "learning_rate": 3.925418674667405e-05, "epoch": 3.7953216374269005, "percentage": 38.1, "elapsed_time": "0:07:00", "remaining_time": "0:11:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 170, "total_steps": 420, "loss": 1.3328, "learning_rate": 3.7500000000000003e-05, "epoch": 4.029239766081871, "percentage": 40.48, "elapsed_time": "0:09:03", "remaining_time": "0:13:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 180, "total_steps": 420, "loss": 1.1235, "learning_rate": 3.565952013635635e-05, "epoch": 4.2631578947368425, "percentage": 42.86, "elapsed_time": "0:11:06", "remaining_time": "0:14:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 190, "total_steps": 420, "loss": 1.0464, "learning_rate": 3.374545281527538e-05, "epoch": 4.497076023391813, "percentage": 45.24, "elapsed_time": "0:13:09", "remaining_time": "0:15:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 200, "total_steps": 420, "loss": 1.1242, "learning_rate": 3.177101170357513e-05, "epoch": 4.730994152046784, "percentage": 47.62, "elapsed_time": "0:15:13", "remaining_time": "0:16:44", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 210, "total_steps": 420, "loss": 1.0463, "learning_rate": 2.9749827255479755e-05, "epoch": 4.964912280701754, "percentage": 50.0, "elapsed_time": "0:17:16", "remaining_time": "0:17:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 220, "total_steps": 420, "loss": 0.9407, "learning_rate": 2.769585261546897e-05, "epoch": 5.1988304093567255, "percentage": 52.38, "elapsed_time": "0:19:19", "remaining_time": "0:17:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 230, "total_steps": 420, "loss": 0.8377, "learning_rate": 2.5623267293451826e-05, "epoch": 5.432748538011696, "percentage": 54.76, "elapsed_time": "0:21:22", "remaining_time": "0:17:39", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 240, "total_steps": 420, "loss": 0.9125, "learning_rate": 2.3546379277238107e-05, "epoch": 5.666666666666667, "percentage": 57.14, "elapsed_time": "0:23:25", "remaining_time": "0:17:34", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 250, "total_steps": 420, "loss": 0.9502, "learning_rate": 2.1479526258069087e-05, "epoch": 5.900584795321637, "percentage": 59.52, "elapsed_time": "0:25:28", "remaining_time": "0:17:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 260, "total_steps": 420, "loss": 0.8194, "learning_rate": 1.9436976651092144e-05, "epoch": 6.1345029239766085, "percentage": 61.9, "elapsed_time": "0:27:31", "remaining_time": "0:16:56", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 270, "total_steps": 420, "loss": 0.7167, "learning_rate": 1.7432831094079355e-05, "epoch": 6.368421052631579, "percentage": 64.29, "elapsed_time": "0:29:34", "remaining_time": "0:16:26", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 280, "total_steps": 420, "loss": 0.7622, "learning_rate": 1.5480925104388762e-05, "epoch": 6.60233918128655, "percentage": 66.67, "elapsed_time": "0:31:38", "remaining_time": "0:15:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 290, "total_steps": 420, "loss": 0.767, "learning_rate": 1.3594733566170926e-05, "epoch": 6.83625730994152, "percentage": 69.05, "elapsed_time": "0:33:41", "remaining_time": "0:15:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 300, "total_steps": 420, "loss": 0.7493, "learning_rate": 1.1787277707188616e-05, "epoch": 7.0701754385964914, "percentage": 71.43, "elapsed_time": "0:35:44", "remaining_time": "0:14:17", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 310, "total_steps": 420, "loss": 0.6112, "learning_rate": 1.0071035207430352e-05, "epoch": 7.304093567251462, "percentage": 73.81, "elapsed_time": "0:37:47", "remaining_time": "0:13:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 320, "total_steps": 420, "loss": 0.6109, "learning_rate": 8.45785406007852e-06, "epoch": 7.538011695906433, "percentage": 76.19, "elapsed_time": "0:39:50", "remaining_time": "0:12:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 330, "total_steps": 420, "loss": 0.6453, "learning_rate": 6.958870779488447e-06, "epoch": 7.771929824561403, "percentage": 78.57, "elapsed_time": "0:41:53", "remaining_time": "0:11:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 340, "total_steps": 420, "loss": 0.6664, "learning_rate": 5.584433520825541e-06, "epoch": 8.005847953216374, "percentage": 80.95, "elapsed_time": "0:43:56", "remaining_time": "0:10:20", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 350, "total_steps": 420, "loss": 0.5755, "learning_rate": 4.344030642100133e-06, "epoch": 8.239766081871345, "percentage": 83.33, "elapsed_time": "0:45:59", "remaining_time": "0:09:11", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 360, "total_steps": 420, "loss": 0.5977, "learning_rate": 3.2462252017684797e-06, "epoch": 8.473684210526315, "percentage": 85.71, "elapsed_time": "0:48:03", "remaining_time": "0:08:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 370, "total_steps": 420, "loss": 0.5428, "learning_rate": 2.298595844092377e-06, "epoch": 8.707602339181287, "percentage": 88.1, "elapsed_time": "0:50:06", "remaining_time": "0:06:46", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 380, "total_steps": 420, "loss": 0.5528, "learning_rate": 1.5076844803522922e-06, "epoch": 8.941520467836257, "percentage": 90.48, "elapsed_time": "0:52:09", "remaining_time": "0:05:29", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 390, "total_steps": 420, "loss": 0.5825, "learning_rate": 8.78951127094127e-07, "epoch": 9.175438596491228, "percentage": 92.86, "elapsed_time": "0:54:12", "remaining_time": "0:04:10", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 400, "total_steps": 420, "loss": 0.5498, "learning_rate": 4.16736213181515e-07, "epoch": 9.409356725146198, "percentage": 95.24, "elapsed_time": "0:56:15", "remaining_time": "0:02:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 410, "total_steps": 420, "loss": 0.5318, "learning_rate": 1.2423061586496477e-07, "epoch": 9.64327485380117, "percentage": 97.62, "elapsed_time": "0:58:19", "remaining_time": "0:01:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 420, "total_steps": 420, "loss": 0.5299, "learning_rate": 3.453632722358324e-09, "epoch": 9.87719298245614, "percentage": 100.0, "elapsed_time": "1:00:22", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 420, "total_steps": 420, "epoch": 9.87719298245614, "percentage": 100.0, "elapsed_time": "1:00:24", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}