Training in progress, step 2950
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +11 -0
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 29034840
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b7a40fbb5d3ef8c199f94ef197e14510d714bce74ec2a360d2feaf74aeb1aee
|
3 |
size 29034840
|
trainer_log.jsonl
CHANGED
@@ -648,3 +648,14 @@
|
|
648 |
{"current_steps": 2895, "total_steps": 6770, "loss": 0.2312, "lr": 6.5831320462607e-05, "epoch": 0.8552437223042836, "percentage": 42.76, "elapsed_time": "6:12:49", "remaining_time": "8:19:01", "throughput": 1344.06, "total_tokens": 30066016}
|
649 |
{"current_steps": 2900, "total_steps": 6770, "loss": 0.2029, "lr": 6.571542983224223e-05, "epoch": 0.8567208271787297, "percentage": 42.84, "elapsed_time": "6:14:15", "remaining_time": "8:19:26", "throughput": 1341.23, "total_tokens": 30118072}
|
650 |
{"current_steps": 2900, "total_steps": 6770, "eval_loss": 0.39434579014778137, "epoch": 0.8567208271787297, "percentage": 42.84, "elapsed_time": "6:14:34", "remaining_time": "8:19:52", "throughput": 1340.09, "total_tokens": 30118072}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
648 |
{"current_steps": 2895, "total_steps": 6770, "loss": 0.2312, "lr": 6.5831320462607e-05, "epoch": 0.8552437223042836, "percentage": 42.76, "elapsed_time": "6:12:49", "remaining_time": "8:19:01", "throughput": 1344.06, "total_tokens": 30066016}
|
649 |
{"current_steps": 2900, "total_steps": 6770, "loss": 0.2029, "lr": 6.571542983224223e-05, "epoch": 0.8567208271787297, "percentage": 42.84, "elapsed_time": "6:14:15", "remaining_time": "8:19:26", "throughput": 1341.23, "total_tokens": 30118072}
|
650 |
{"current_steps": 2900, "total_steps": 6770, "eval_loss": 0.39434579014778137, "epoch": 0.8567208271787297, "percentage": 42.84, "elapsed_time": "6:14:34", "remaining_time": "8:19:52", "throughput": 1340.09, "total_tokens": 30118072}
|
651 |
+
{"current_steps": 2905, "total_steps": 6770, "loss": 0.2241, "lr": 6.559944544378072e-05, "epoch": 0.8581979320531757, "percentage": 42.91, "elapsed_time": "6:16:07", "remaining_time": "8:20:24", "throughput": 1336.91, "total_tokens": 30170248}
|
652 |
+
{"current_steps": 2910, "total_steps": 6770, "loss": 0.2298, "lr": 6.548336798918411e-05, "epoch": 0.8596750369276218, "percentage": 42.98, "elapsed_time": "6:17:33", "remaining_time": "8:20:49", "throughput": 1334.08, "total_tokens": 30222016}
|
653 |
+
{"current_steps": 2915, "total_steps": 6770, "loss": 0.2396, "lr": 6.536719816096935e-05, "epoch": 0.8611521418020679, "percentage": 43.06, "elapsed_time": "6:19:01", "remaining_time": "8:21:15", "throughput": 1331.18, "total_tokens": 30273312}
|
654 |
+
{"current_steps": 2920, "total_steps": 6770, "loss": 0.2324, "lr": 6.52509366522045e-05, "epoch": 0.8626292466765141, "percentage": 43.13, "elapsed_time": "6:20:29", "remaining_time": "8:21:39", "throughput": 1328.32, "total_tokens": 30324328}
|
655 |
+
{"current_steps": 2925, "total_steps": 6770, "loss": 0.2263, "lr": 6.513458415650452e-05, "epoch": 0.8641063515509602, "percentage": 43.21, "elapsed_time": "6:21:57", "remaining_time": "8:22:05", "throughput": 1325.47, "total_tokens": 30376488}
|
656 |
+
{"current_steps": 2930, "total_steps": 6770, "loss": 0.1734, "lr": 6.501814136802725e-05, "epoch": 0.8655834564254062, "percentage": 43.28, "elapsed_time": "6:23:24", "remaining_time": "8:22:28", "throughput": 1322.77, "total_tokens": 30429504}
|
657 |
+
{"current_steps": 2935, "total_steps": 6770, "loss": 0.2235, "lr": 6.490160898146918e-05, "epoch": 0.8670605612998523, "percentage": 43.35, "elapsed_time": "6:24:52", "remaining_time": "8:22:53", "throughput": 1319.93, "total_tokens": 30480400}
|
658 |
+
{"current_steps": 2940, "total_steps": 6770, "loss": 0.2297, "lr": 6.47849876920614e-05, "epoch": 0.8685376661742984, "percentage": 43.43, "elapsed_time": "6:26:19", "remaining_time": "8:23:15", "throughput": 1317.22, "total_tokens": 30531912}
|
659 |
+
{"current_steps": 2945, "total_steps": 6770, "loss": 0.1764, "lr": 6.46682781955653e-05, "epoch": 0.8700147710487445, "percentage": 43.5, "elapsed_time": "6:27:46", "remaining_time": "8:23:39", "throughput": 1314.52, "total_tokens": 30584688}
|
660 |
+
{"current_steps": 2950, "total_steps": 6770, "loss": 0.1692, "lr": 6.455148118826859e-05, "epoch": 0.8714918759231906, "percentage": 43.57, "elapsed_time": "6:29:12", "remaining_time": "8:23:59", "throughput": 1311.97, "total_tokens": 30637448}
|
661 |
+
{"current_steps": 2950, "total_steps": 6770, "eval_loss": 0.20344533026218414, "epoch": 0.8714918759231906, "percentage": 43.57, "elapsed_time": "6:29:31", "remaining_time": "8:24:23", "throughput": 1310.91, "total_tokens": 30637448}
|