Training in progress, step 1950
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +11 -0
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 29034840
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad3594bcb3ff35f3f2e878e13876be354135b355ddc08a0bafcc51fa9e238692
|
3 |
size 29034840
|
trainer_log.jsonl
CHANGED
@@ -420,3 +420,14 @@
|
|
420 |
{"current_steps": 1895, "total_steps": 3400, "loss": 0.4356, "lr": 4.466073859319781e-05, "epoch": 0.4880247231522019, "percentage": 55.74, "elapsed_time": "6:42:18", "remaining_time": "5:19:30", "throughput": 824.3, "total_tokens": 19897464}
|
421 |
{"current_steps": 1900, "total_steps": 3400, "loss": 0.2877, "lr": 4.441903570394739e-05, "epoch": 0.4893123873293845, "percentage": 55.88, "elapsed_time": "6:43:44", "remaining_time": "5:18:44", "throughput": 823.55, "total_tokens": 19950480}
|
422 |
{"current_steps": 1900, "total_steps": 3400, "eval_loss": 0.4511750042438507, "epoch": 0.4893123873293845, "percentage": 55.88, "elapsed_time": "6:44:22", "remaining_time": "5:19:14", "throughput": 822.26, "total_tokens": 19950480}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
420 |
{"current_steps": 1895, "total_steps": 3400, "loss": 0.4356, "lr": 4.466073859319781e-05, "epoch": 0.4880247231522019, "percentage": 55.74, "elapsed_time": "6:42:18", "remaining_time": "5:19:30", "throughput": 824.3, "total_tokens": 19897464}
|
421 |
{"current_steps": 1900, "total_steps": 3400, "loss": 0.2877, "lr": 4.441903570394739e-05, "epoch": 0.4893123873293845, "percentage": 55.88, "elapsed_time": "6:43:44", "remaining_time": "5:18:44", "throughput": 823.55, "total_tokens": 19950480}
|
422 |
{"current_steps": 1900, "total_steps": 3400, "eval_loss": 0.4511750042438507, "epoch": 0.4893123873293845, "percentage": 55.88, "elapsed_time": "6:44:22", "remaining_time": "5:19:14", "throughput": 822.26, "total_tokens": 19950480}
|
423 |
+
{"current_steps": 1905, "total_steps": 3400, "loss": 0.3542, "lr": 4.41774648053257e-05, "epoch": 0.4906000515065671, "percentage": 56.03, "elapsed_time": "6:45:56", "remaining_time": "5:18:34", "throughput": 821.27, "total_tokens": 20002968}
|
424 |
+
{"current_steps": 1910, "total_steps": 3400, "loss": 0.4095, "lr": 4.3936031610520124e-05, "epoch": 0.49188771568374967, "percentage": 56.18, "elapsed_time": "6:47:22", "remaining_time": "5:17:47", "throughput": 820.53, "total_tokens": 20055560}
|
425 |
+
{"current_steps": 1915, "total_steps": 3400, "loss": 0.3887, "lr": 4.3694741829461336e-05, "epoch": 0.4931753798609323, "percentage": 56.32, "elapsed_time": "6:48:49", "remaining_time": "5:17:01", "throughput": 819.74, "total_tokens": 20108016}
|
426 |
+
{"current_steps": 1920, "total_steps": 3400, "loss": 0.3485, "lr": 4.345360116868823e-05, "epoch": 0.49446304403811486, "percentage": 56.47, "elapsed_time": "6:50:16", "remaining_time": "5:16:15", "throughput": 818.97, "total_tokens": 20160480}
|
427 |
+
{"current_steps": 1925, "total_steps": 3400, "loss": 0.4348, "lr": 4.321261533121303e-05, "epoch": 0.49575070821529743, "percentage": 56.62, "elapsed_time": "6:51:43", "remaining_time": "5:15:28", "throughput": 818.22, "total_tokens": 20213312}
|
428 |
+
{"current_steps": 1930, "total_steps": 3400, "loss": 0.4073, "lr": 4.2971790016386286e-05, "epoch": 0.49703837239248005, "percentage": 56.76, "elapsed_time": "6:53:11", "remaining_time": "5:14:42", "throughput": 817.48, "total_tokens": 20266288}
|
429 |
+
{"current_steps": 1935, "total_steps": 3400, "loss": 0.3297, "lr": 4.273113091976225e-05, "epoch": 0.4983260365696626, "percentage": 56.91, "elapsed_time": "6:54:38", "remaining_time": "5:13:55", "throughput": 816.72, "total_tokens": 20318576}
|
430 |
+
{"current_steps": 1940, "total_steps": 3400, "loss": 0.3352, "lr": 4.249064373296403e-05, "epoch": 0.49961370074684525, "percentage": 57.06, "elapsed_time": "6:56:05", "remaining_time": "5:13:08", "throughput": 815.96, "total_tokens": 20370696}
|
431 |
+
{"current_steps": 1945, "total_steps": 3400, "loss": 0.3195, "lr": 4.225033414354908e-05, "epoch": 0.5009013649240278, "percentage": 57.21, "elapsed_time": "6:57:32", "remaining_time": "5:12:20", "throughput": 815.23, "total_tokens": 20423480}
|
432 |
+
{"current_steps": 1950, "total_steps": 3400, "loss": 0.365, "lr": 4.201020783487464e-05, "epoch": 0.5021890291012104, "percentage": 57.35, "elapsed_time": "6:58:59", "remaining_time": "5:11:33", "throughput": 814.49, "total_tokens": 20476176}
|
433 |
+
{"current_steps": 1950, "total_steps": 3400, "eval_loss": 0.4763557016849518, "epoch": 0.5021890291012104, "percentage": 57.35, "elapsed_time": "6:59:37", "remaining_time": "5:12:02", "throughput": 813.26, "total_tokens": 20476176}
|