sedrickkeh
commited on
Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f4b044db17fdc9a47a0d0ba1b55cb4d182f7209d4933ebdc23e55d8fa61d2fb
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:119a266c32438499af232fecfbc34def0900bc7a146e2f69840840fae81ffc1d
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72afab046ea06f1b22112f347975f3041ecca7b251ccf398d33b887128b07b74
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e9b2f558defed5bd8618ebc57e720b5938a1501b133855e3846cbef8107bc50
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -33,3 +33,20 @@
|
|
33 |
{"current_steps": 320, "total_steps": 504, "loss": 0.5533, "lr": 5e-06, "epoch": 1.899184581171238, "percentage": 63.49, "elapsed_time": "5:10:34", "remaining_time": "2:58:34"}
|
34 |
{"current_steps": 330, "total_steps": 504, "loss": 0.5487, "lr": 5e-06, "epoch": 1.9584877687175686, "percentage": 65.48, "elapsed_time": "5:20:08", "remaining_time": "2:48:48"}
|
35 |
{"current_steps": 336, "total_steps": 504, "eval_loss": 0.6003267765045166, "epoch": 1.9940696812453669, "percentage": 66.67, "elapsed_time": "5:29:31", "remaining_time": "2:44:45"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
{"current_steps": 320, "total_steps": 504, "loss": 0.5533, "lr": 5e-06, "epoch": 1.899184581171238, "percentage": 63.49, "elapsed_time": "5:10:34", "remaining_time": "2:58:34"}
|
34 |
{"current_steps": 330, "total_steps": 504, "loss": 0.5487, "lr": 5e-06, "epoch": 1.9584877687175686, "percentage": 65.48, "elapsed_time": "5:20:08", "remaining_time": "2:48:48"}
|
35 |
{"current_steps": 336, "total_steps": 504, "eval_loss": 0.6003267765045166, "epoch": 1.9940696812453669, "percentage": 66.67, "elapsed_time": "5:29:31", "remaining_time": "2:44:45"}
|
36 |
+
{"current_steps": 340, "total_steps": 504, "loss": 0.564, "lr": 5e-06, "epoch": 2.0192735359525575, "percentage": 67.46, "elapsed_time": "5:33:53", "remaining_time": "2:41:03"}
|
37 |
+
{"current_steps": 350, "total_steps": 504, "loss": 0.4911, "lr": 5e-06, "epoch": 2.078576723498888, "percentage": 69.44, "elapsed_time": "5:43:27", "remaining_time": "2:31:07"}
|
38 |
+
{"current_steps": 360, "total_steps": 504, "loss": 0.4883, "lr": 5e-06, "epoch": 2.1378799110452187, "percentage": 71.43, "elapsed_time": "5:53:01", "remaining_time": "2:21:12"}
|
39 |
+
{"current_steps": 370, "total_steps": 504, "loss": 0.488, "lr": 5e-06, "epoch": 2.1971830985915495, "percentage": 73.41, "elapsed_time": "6:02:36", "remaining_time": "2:11:19"}
|
40 |
+
{"current_steps": 380, "total_steps": 504, "loss": 0.493, "lr": 5e-06, "epoch": 2.25648628613788, "percentage": 75.4, "elapsed_time": "6:12:11", "remaining_time": "2:01:27"}
|
41 |
+
{"current_steps": 390, "total_steps": 504, "loss": 0.4814, "lr": 5e-06, "epoch": 2.3157894736842106, "percentage": 77.38, "elapsed_time": "6:21:46", "remaining_time": "1:51:35"}
|
42 |
+
{"current_steps": 400, "total_steps": 504, "loss": 0.4947, "lr": 5e-06, "epoch": 2.375092661230541, "percentage": 79.37, "elapsed_time": "6:31:20", "remaining_time": "1:41:44"}
|
43 |
+
{"current_steps": 410, "total_steps": 504, "loss": 0.4916, "lr": 5e-06, "epoch": 2.4343958487768718, "percentage": 81.35, "elapsed_time": "6:40:55", "remaining_time": "1:31:55"}
|
44 |
+
{"current_steps": 420, "total_steps": 504, "loss": 0.4956, "lr": 5e-06, "epoch": 2.4936990363232026, "percentage": 83.33, "elapsed_time": "6:50:31", "remaining_time": "1:22:06"}
|
45 |
+
{"current_steps": 430, "total_steps": 504, "loss": 0.494, "lr": 5e-06, "epoch": 2.553002223869533, "percentage": 85.32, "elapsed_time": "7:00:06", "remaining_time": "1:12:17"}
|
46 |
+
{"current_steps": 440, "total_steps": 504, "loss": 0.4973, "lr": 5e-06, "epoch": 2.6123054114158637, "percentage": 87.3, "elapsed_time": "7:09:41", "remaining_time": "1:02:30"}
|
47 |
+
{"current_steps": 450, "total_steps": 504, "loss": 0.4998, "lr": 5e-06, "epoch": 2.6716085989621945, "percentage": 89.29, "elapsed_time": "7:19:16", "remaining_time": "0:52:42"}
|
48 |
+
{"current_steps": 460, "total_steps": 504, "loss": 0.4891, "lr": 5e-06, "epoch": 2.730911786508525, "percentage": 91.27, "elapsed_time": "7:28:52", "remaining_time": "0:42:56"}
|
49 |
+
{"current_steps": 470, "total_steps": 504, "loss": 0.5005, "lr": 5e-06, "epoch": 2.790214974054855, "percentage": 93.25, "elapsed_time": "7:38:27", "remaining_time": "0:33:09"}
|
50 |
+
{"current_steps": 480, "total_steps": 504, "loss": 0.4894, "lr": 5e-06, "epoch": 2.849518161601186, "percentage": 95.24, "elapsed_time": "7:48:03", "remaining_time": "0:23:24"}
|
51 |
+
{"current_steps": 490, "total_steps": 504, "loss": 0.4939, "lr": 5e-06, "epoch": 2.9088213491475168, "percentage": 97.22, "elapsed_time": "7:57:38", "remaining_time": "0:13:38"}
|
52 |
+
{"current_steps": 500, "total_steps": 504, "loss": 0.497, "lr": 5e-06, "epoch": 2.968124536693847, "percentage": 99.21, "elapsed_time": "8:07:15", "remaining_time": "0:03:53"}
|