End of training
Browse files- all_results.json +12 -0
- eval_results.json +8 -0
- runs/Dec17_00-49-12_129-213-88-66/events.out.tfevents.1671302027.129-213-88-66.1326738.2 +3 -0
- train_20221217-004912.log +4 -0
- train_results.json +7 -0
- train_run_1.log +26 -1
- trainer_state.json +805 -0
all_results.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 1.1,
|
3 |
+
"eval_loss": 0.10796044021844864,
|
4 |
+
"eval_runtime": 2073.5744,
|
5 |
+
"eval_samples_per_second": 7.654,
|
6 |
+
"eval_steps_per_second": 0.239,
|
7 |
+
"eval_wer": 12.206885082321635,
|
8 |
+
"train_loss": 0.17721048017342886,
|
9 |
+
"train_runtime": 61737.3829,
|
10 |
+
"train_samples_per_second": 6.22,
|
11 |
+
"train_steps_per_second": 0.097
|
12 |
+
}
|
eval_results.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 1.1,
|
3 |
+
"eval_loss": 0.10796044021844864,
|
4 |
+
"eval_runtime": 2073.5744,
|
5 |
+
"eval_samples_per_second": 7.654,
|
6 |
+
"eval_steps_per_second": 0.239,
|
7 |
+
"eval_wer": 12.206885082321635
|
8 |
+
}
|
runs/Dec17_00-49-12_129-213-88-66/events.out.tfevents.1671302027.129-213-88-66.1326738.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54f58508fb05ada573f3a57972a24b5a612a0fe93a9a8935c2036990e6dc02ed
|
3 |
+
size 358
|
train_20221217-004912.log
CHANGED
@@ -138,3 +138,7 @@ remote: LFS file scan complete.
|
|
138 |
To https://huggingface.co/ales/whisper-base-belarusian
|
139 |
4074dad..52d55ef main -> main
|
140 |
|
|
|
|
|
|
|
|
|
|
138 |
To https://huggingface.co/ales/whisper-base-belarusian
|
139 |
4074dad..52d55ef main -> main
|
140 |
|
141 |
+
12/17/2022 17:59:11 - WARNING - huggingface_hub.repository - To https://huggingface.co/ales/whisper-base-belarusian
|
142 |
+
52d55ef..4aae45b main -> main
|
143 |
+
|
144 |
+
12/17/2022 17:59:14 - INFO - __main__ - *** Evaluate ***
|
train_results.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 1.1,
|
3 |
+
"train_loss": 0.17721048017342886,
|
4 |
+
"train_runtime": 61737.3829,
|
5 |
+
"train_samples_per_second": 6.22,
|
6 |
+
"train_steps_per_second": 0.097
|
7 |
+
}
|
train_run_1.log
CHANGED
@@ -36388,4 +36388,29 @@ remote: LFS file scan complete.
|
|
36388 |
To https://huggingface.co/ales/whisper-base-belarusian
|
36389 |
4074dad..52d55ef main -> main
|
36390 |
|
36391 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
36392 |
0%| | 0/496 [00:00<?, ?it/s]
|
36393 |
0%| | 2/496 [00:02<12:12, 1.48s/it]
|
36394 |
1%| | 3/496 [00:06<18:24, 2.24s/it]
|
36395 |
1%| | 4/496 [00:09<21:51, 2.67s/it]
|
36396 |
1%| | 5/496 [00:12<23:42, 2.90s/it]
|
36397 |
1%| | 6/496 [00:16<24:19, 2.98s/it]
|
36398 |
1%|▏ | 7/496 [00:20<27:04, 3.32s/it]
|
36399 |
2%|▏ | 8/496 [00:23<27:39, 3.40s/it]
|
36400 |
2%|▏ | 9/496 [00:26<25:56, 3.20s/it]
|
36401 |
2%|▏ | 10/496 [00:29<25:11, 3.11s/it]
|
36402 |
2%|▏ | 11/496 [00:32<24:23, 3.02s/it]
|
36403 |
2%|▏ | 12/496 [00:35<25:18, 3.14s/it]
|
36404 |
3%|▎ | 13/496 [00:38<25:26, 3.16s/it]
|
36405 |
3%|▎ | 14/496 [00:41<24:15, 3.02s/it]
|
36406 |
3%|▎ | 15/496 [00:45<25:47, 3.22s/it]
|
36407 |
3%|▎ | 16/496 [00:48<25:38, 3.21s/it]
|
36408 |
3%|▎ | 17/496 [00:51<25:22, 3.18s/it]
|
36409 |
4%|▎ | 18/496 [00:54<24:15, 3.05s/it]
|
36410 |
4%|▍ | 19/496 [00:57<24:07, 3.03s/it]
|
36411 |
4%|▍ | 20/496 [01:00<24:16, 3.06s/it]
|
36412 |
4%|▍ | 21/496 [01:03<24:03, 3.04s/it]
|
36413 |
4%|▍ | 22/496 [01:06<23:17, 2.95s/it]
|
36414 |
5%|▍ | 23/496 [01:09<24:46, 3.14s/it]
|
36415 |
5%|▍ | 24/496 [01:12<23:55, 3.04s/it]
|
36416 |
5%|▌ | 25/496 [01:16<25:09, 3.20s/it]
|
36417 |
5%|▌ | 26/496 [01:19<25:19, 3.23s/it]
|
36418 |
5%|▌ | 27/496 [01:22<24:26, 3.13s/it]
|
36419 |
6%|▌ | 28/496 [01:25<23:56, 3.07s/it]
|
36420 |
6%|▌ | 29/496 [01:28<24:39, 3.17s/it]
|
36421 |
6%|▌ | 30/496 [01:31<25:05, 3.23s/it]
|
36422 |
6%|▋ | 31/496 [01:34<23:58, 3.09s/it]
|
36423 |
6%|▋ | 32/496 [01:38<25:00, 3.23s/it]
|
36424 |
7%|▋ | 33/496 [01:42<27:41, 3.59s/it]
|
36425 |
7%|▋ | 34/496 [01:45<25:28, 3.31s/it]
|
36426 |
7%|▋ | 35/496 [01:48<25:38, 3.34s/it]
|
36427 |
7%|▋ | 36/496 [01:52<25:34, 3.34s/it]
|
36428 |
7%|▋ | 37/496 [01:54<24:04, 3.15s/it]
|
36429 |
8%|▊ | 38/496 [01:57<24:04, 3.16s/it]
|
36430 |
8%|▊ | 39/496 [02:01<23:59, 3.15s/it]
|
36431 |
8%|▊ | 40/496 [02:03<22:32, 2.97s/it]
|
36432 |
8%|▊ | 41/496 [02:06<22:10, 2.92s/it]
|
36433 |
8%|▊ | 42/496 [02:09<23:02, 3.05s/it]
|
36434 |
9%|▊ | 43/496 [02:13<23:49, 3.16s/it]
|
36435 |
9%|▉ | 44/496 [02:16<24:04, 3.20s/it]
|
36436 |
9%|▉ | 45/496 [02:19<22:39, 3.01s/it]
|
36437 |
9%|▉ | 46/496 [02:21<21:54, 2.92s/it]
|
36438 |
9%|▉ | 47/496 [02:24<20:50, 2.78s/it]
|
36439 |
10%|▉ | 48/496 [02:27<21:49, 2.92s/it]
|
36440 |
10%|▉ | 49/496 [02:30<21:10, 2.84s/it]
|
36441 |
10%|█ | 50/496 [02:32<20:34, 2.77s/it]
|
36442 |
10%|█ | 51/496 [02:35<21:04, 2.84s/it]
|
36443 |
10%|█ | 52/496 [02:38<21:39, 2.93s/it]
|
36444 |
11%|█ | 53/496 [02:41<20:54, 2.83s/it]
|
36445 |
11%|█ | 54/496 [02:44<20:25, 2.77s/it]
|
36446 |
11%|█ | 55/496 [02:46<20:03, 2.73s/it]
|
36447 |
11%|█▏ | 56/496 [02:49<21:03, 2.87s/it]
|
36448 |
11%|█▏ | 57/496 [02:52<21:03, 2.88s/it]
|
36449 |
12%|█▏ | 58/496 [02:55<20:26, 2.80s/it]
|
36450 |
12%|█▏ | 59/496 [02:58<20:13, 2.78s/it]
|
36451 |
12%|█▏ | 60/496 [03:01<20:47, 2.86s/it]
|
36452 |
12%|█▏ | 61/496 [03:03<20:19, 2.80s/it]
|
36453 |
12%|█▎ | 62/496 [03:06<20:46, 2.87s/it]
|
36454 |
13%|█▎ | 63/496 [03:09<20:45, 2.88s/it]
|
36455 |
13%|█▎ | 64/496 [03:12<20:54, 2.91s/it]
|
36456 |
13%|█▎ | 65/496 [03:16<21:28, 2.99s/it]
|
36457 |
13%|█▎ | 66/496 [03:19<21:31, 3.00s/it]
|
36458 |
14%|█▎ | 67/496 [03:21<20:14, 2.83s/it]
|
36459 |
14%|█▎ | 68/496 [03:23<19:18, 2.71s/it]
|
36460 |
14%|█▍ | 69/496 [03:26<19:26, 2.73s/it]
|
36461 |
14%|█▍ | 70/496 [03:29<19:42, 2.78s/it]
|
36462 |
14%|█▍ | 71/496 [03:32<20:16, 2.86s/it]
|
36463 |
15%|█▍ | 72/496 [03:35<20:12, 2.86s/it]
|
36464 |
15%|█▍ | 73/496 [03:38<20:02, 2.84s/it]
|
36465 |
15%|█▍ | 74/496 [03:40<19:41, 2.80s/it]
|
36466 |
15%|█▌ | 75/496 [03:43<19:55, 2.84s/it]
|
36467 |
15%|█▌ | 76/496 [03:47<20:28, 2.93s/it]
|
36468 |
16%|█▌ | 77/496 [03:50<21:00, 3.01s/it]
|
36469 |
16%|█▌ | 78/496 [03:53<20:37, 2.96s/it]
|
36470 |
16%|█▌ | 79/496 [03:56<21:21, 3.07s/it]
|
36471 |
16%|█▌ | 80/496 [03:59<21:38, 3.12s/it]
|
36472 |
16%|█▋ | 81/496 [04:03<22:28, 3.25s/it]
|
36473 |
17%|█▋ | 82/496 [04:06<22:22, 3.24s/it]
|
36474 |
17%|█▋ | 83/496 [04:09<21:24, 3.11s/it]
|
36475 |
17%|█▋ | 84/496 [04:12<22:08, 3.23s/it]
|
36476 |
17%|█▋ | 85/496 [04:15<22:00, 3.21s/it]
|
36477 |
17%|█▋ | 86/496 [04:19<22:39, 3.32s/it]
|
36478 |
18%|█▊ | 87/496 [04:22<22:18, 3.27s/it]
|
36479 |
18%|█▊ | 88/496 [04:25<21:10, 3.11s/it]
|
36480 |
18%|█▊ | 89/496 [04:28<20:45, 3.06s/it]
|
36481 |
18%|█▊ | 90/496 [04:31<20:32, 3.04s/it]
|
36482 |
18%|█▊ | 91/496 [04:34<21:21, 3.16s/it]
|
36483 |
19%|█▊ | 92/496 [04:37<21:17, 3.16s/it]
|
36484 |
19%|█▉ | 93/496 [04:41<21:41, 3.23s/it]
|
36485 |
19%|█▉ | 94/496 [04:44<21:48, 3.26s/it]
|
36486 |
19%|█▉ | 95/496 [04:48<21:58, 3.29s/it]
|
36487 |
19%|█▉ | 96/496 [04:50<20:33, 3.08s/it]
|
36488 |
20%|█▉ | 97/496 [04:53<20:22, 3.06s/it]
|
36489 |
20%|█▉ | 98/496 [04:56<20:15, 3.06s/it]
|
36490 |
20%|█▉ | 99/496 [04:59<20:11, 3.05s/it]
|
36491 |
20%|██ | 100/496 [05:02<19:38, 2.98s/it]
|
36492 |
20%|██ | 101/496 [05:05<19:09, 2.91s/it]
|
36493 |
21%|██ | 102/496 [05:08<18:50, 2.87s/it]
|
36494 |
21%|██ | 103/496 [05:10<18:56, 2.89s/it]
|
36495 |
21%|██ | 104/496 [05:13<18:31, 2.84s/it]
|
36496 |
21%|██ | 105/496 [05:16<19:08, 2.94s/it]
|
36497 |
21%|██▏ | 106/496 [05:19<19:21, 2.98s/it]
|
36498 |
22%|██▏ | 107/496 [05:23<19:42, 3.04s/it]
|
36499 |
22%|██▏ | 108/496 [05:25<19:19, 2.99s/it]
|
36500 |
22%|██▏ | 109/496 [05:28<19:15, 2.98s/it]
|
36501 |
22%|██▏ | 110/496 [05:31<18:53, 2.94s/it]
|
36502 |
22%|██▏ | 111/496 [05:34<18:13, 2.84s/it]
|
36503 |
23%|██▎ | 112/496 [05:37<18:49, 2.94s/it]
|
36504 |
23%|██▎ | 113/496 [05:39<17:44, 2.78s/it]
|
36505 |
23%|██▎ | 114/496 [05:42<17:41, 2.78s/it]
|
36506 |
23%|██▎ | 115/496 [05:45<17:20, 2.73s/it]
|
36507 |
23%|██▎ | 116/496 [05:48<18:26, 2.91s/it]
|
36508 |
24%|██▎ | 117/496 [05:51<18:20, 2.90s/it]
|
36509 |
24%|██▍ | 118/496 [05:54<17:44, 2.82s/it]
|
36510 |
24%|██▍ | 119/496 [05:56<17:24, 2.77s/it]
|
36511 |
24%|██▍ | 120/496 [05:59<17:57, 2.87s/it]
|
36512 |
24%|██▍ | 121/496 [06:02<17:45, 2.84s/it]
|
36513 |
25%|██▍ | 122/496 [06:05<18:00, 2.89s/it]
|
36514 |
25%|██▍ | 123/496 [06:08<18:31, 2.98s/it]
|
36515 |
25%|██▌ | 124/496 [06:11<17:33, 2.83s/it]
|
36516 |
25%|██▌ | 125/496 [06:14<17:35, 2.84s/it]
|
36517 |
25%|██▌ | 126/496 [06:17<17:50, 2.89s/it]
|
36518 |
26%|██▌ | 127/496 [06:20<18:29, 3.01s/it]
|
36519 |
26%|██▌ | 128/496 [06:23<18:19, 2.99s/it]
|
36520 |
26%|██▌ | 129/496 [06:26<17:38, 2.88s/it]
|
36521 |
26%|██▌ | 130/496 [06:29<17:56, 2.94s/it]
|
36522 |
26%|██▋ | 131/496 [06:32<17:49, 2.93s/it]
|
36523 |
27%|██▋ | 132/496 [06:34<17:03, 2.81s/it]
|
36524 |
27%|██▋ | 133/496 [06:37<16:22, 2.71s/it]
|
36525 |
27%|██▋ | 134/496 [06:40<16:39, 2.76s/it]
|
36526 |
27%|██▋ | 135/496 [06:43<17:11, 2.86s/it]
|
36527 |
27%|██▋ | 136/496 [06:46<17:18, 2.89s/it]
|
36528 |
28%|██▊ | 137/496 [06:48<16:54, 2.82s/it]
|
36529 |
28%|██▊ | 138/496 [06:51<17:06, 2.87s/it]
|
36530 |
28%|██▊ | 139/496 [06:54<17:28, 2.94s/it]
|
36531 |
28%|██▊ | 140/496 [06:58<18:10, 3.06s/it]
|
36532 |
28%|██▊ | 141/496 [07:01<17:53, 3.02s/it]
|
36533 |
29%|██▊ | 142/496 [07:04<18:21, 3.11s/it]
|
36534 |
29%|██▉ | 143/496 [07:07<17:51, 3.03s/it]
|
36535 |
29%|██▉ | 144/496 [07:09<17:06, 2.92s/it]
|
36536 |
29%|██▉ | 145/496 [07:12<17:13, 2.94s/it]
|
36537 |
29%|██▉ | 146/496 [07:16<17:28, 3.00s/it]
|
36538 |
30%|██▉ | 147/496 [07:19<18:15, 3.14s/it]
|
36539 |
30%|██▉ | 148/496 [07:22<17:54, 3.09s/it]
|
36540 |
30%|███ | 149/496 [07:25<17:31, 3.03s/it]
|
36541 |
30%|███ | 150/496 [07:28<17:50, 3.09s/it]
|
36542 |
30%|███ | 151/496 [07:31<16:52, 2.94s/it]
|
36543 |
31%|███ | 152/496 [07:35<18:21, 3.20s/it]
|
36544 |
31%|███ | 153/496 [07:38<18:37, 3.26s/it]
|
36545 |
31%|███ | 154/496 [07:40<17:17, 3.03s/it]
|
36546 |
31%|███▏ | 155/496 [07:43<16:31, 2.91s/it]
|
36547 |
31%|███▏ | 156/496 [07:46<16:33, 2.92s/it]
|
36548 |
32%|███▏ | 157/496 [07:49<16:31, 2.92s/it]
|
36549 |
32%|███▏ | 158/496 [07:51<15:11, 2.70s/it]
|
36550 |
32%|███▏ | 159/496 [07:54<14:47, 2.63s/it]
|
36551 |
32%|███▏ | 160/496 [07:56<14:20, 2.56s/it]
|
36552 |
32%|███▏ | 161/496 [07:59<14:47, 2.65s/it]
|
36553 |
33%|███▎ | 162/496 [08:02<15:13, 2.73s/it]
|
36554 |
33%|███▎ | 163/496 [08:05<15:25, 2.78s/it]
|
36555 |
33%|███▎ | 164/496 [08:08<16:01, 2.90s/it]
|
36556 |
33%|███▎ | 165/496 [08:11<16:58, 3.08s/it]
|
36557 |
33%|███▎ | 166/496 [08:15<17:12, 3.13s/it]
|
36558 |
34%|███▎ | 167/496 [08:17<16:00, 2.92s/it]
|
36559 |
34%|███▍ | 168/496 [08:20<15:34, 2.85s/it]
|
36560 |
34%|███▍ | 169/496 [08:23<15:40, 2.88s/it]
|
36561 |
34%|███▍ | 170/496 [08:25<15:37, 2.88s/it]
|
36562 |
34%|███▍ | 171/496 [08:28<15:08, 2.79s/it]
|
36563 |
35%|███▍ | 172/496 [08:31<15:44, 2.92s/it]
|
36564 |
35%|███▍ | 173/496 [08:34<15:27, 2.87s/it]
|
36565 |
35%|███▌ | 174/496 [08:37<15:02, 2.80s/it]
|
36566 |
35%|███▌ | 175/496 [08:40<15:04, 2.82s/it]
|
36567 |
35%|███▌ | 176/496 [08:43<15:36, 2.93s/it]
|
36568 |
36%|███▌ | 177/496 [08:45<15:06, 2.84s/it]
|
36569 |
36%|███▌ | 178/496 [08:49<16:49, 3.17s/it]
|
36570 |
36%|███▌ | 179/496 [08:52<16:22, 3.10s/it]
|
36571 |
36%|███▋ | 180/496 [08:55<16:15, 3.09s/it]
|
36572 |
36%|███▋ | 181/496 [08:58<16:05, 3.07s/it]
|
36573 |
37%|███▋ | 182/496 [09:01<15:18, 2.92s/it]
|
36574 |
37%|███▋ | 183/496 [09:04<15:09, 2.91s/it]
|
36575 |
37%|███▋ | 184/496 [09:07<14:51, 2.86s/it]
|
36576 |
37%|███▋ | 185/496 [09:10<15:17, 2.95s/it]
|
36577 |
38%|███▊ | 186/496 [09:13<15:29, 3.00s/it]
|
36578 |
38%|███▊ | 187/496 [09:15<14:47, 2.87s/it]
|
36579 |
38%|███▊ | 188/496 [09:19<15:58, 3.11s/it]
|
36580 |
38%|███▊ | 189/496 [09:22<15:54, 3.11s/it]
|
36581 |
38%|███▊ | 190/496 [09:25<15:57, 3.13s/it]
|
36582 |
39%|███▊ | 191/496 [09:29<16:17, 3.21s/it]
|
36583 |
39%|███▊ | 192/496 [09:32<15:37, 3.09s/it]
|
36584 |
39%|███▉ | 193/496 [09:34<15:19, 3.03s/it]
|
36585 |
39%|███▉ | 194/496 [09:37<14:05, 2.80s/it]
|
36586 |
39%|███▉ | 195/496 [09:39<13:51, 2.76s/it]
|
36587 |
40%|███▉ | 196/496 [09:42<14:08, 2.83s/it]
|
36588 |
40%|███▉ | 197/496 [09:45<14:07, 2.83s/it]
|
36589 |
40%|███▉ | 198/496 [09:48<14:31, 2.93s/it]
|
36590 |
40%|████ | 199/496 [09:51<14:41, 2.97s/it]
|
36591 |
40%|████ | 200/496 [09:54<14:37, 2.97s/it]
|
36592 |
41%|████ | 201/496 [09:57<14:49, 3.02s/it]
|
36593 |
41%|████ | 202/496 [10:01<15:28, 3.16s/it]
|
36594 |
41%|████ | 203/496 [10:03<14:24, 2.95s/it]
|
36595 |
41%|████ | 204/496 [10:06<14:04, 2.89s/it]
|
36596 |
41%|████▏ | 205/496 [10:09<13:46, 2.84s/it]
|
36597 |
42%|████▏ | 206/496 [10:12<13:34, 2.81s/it]
|
36598 |
42%|████▏ | 207/496 [10:14<13:27, 2.79s/it]
|
36599 |
42%|████▏ | 208/496 [10:17<13:22, 2.79s/it]
|
36600 |
42%|████▏ | 209/496 [10:20<14:04, 2.94s/it]
|
36601 |
42%|████▏ | 210/496 [10:23<14:05, 2.96s/it]
|
36602 |
43%|████▎ | 211/496 [10:26<14:08, 2.98s/it]
|
36603 |
43%|████▎ | 212/496 [10:30<14:26, 3.05s/it]
|
36604 |
43%|████▎ | 213/496 [10:33<14:15, 3.02s/it]
|
36605 |
43%|████▎ | 214/496 [10:36<14:18, 3.05s/it]
|
36606 |
43%|████▎ | 215/496 [10:39<14:00, 2.99s/it]
|
36607 |
44%|████▎ | 216/496 [10:42<14:33, 3.12s/it]
|
36608 |
44%|████▍ | 217/496 [10:46<15:38, 3.36s/it]
|
36609 |
44%|████▍ | 218/496 [10:49<14:29, 3.13s/it]
|
36610 |
44%|████▍ | 219/496 [10:51<13:49, 2.99s/it]
|
36611 |
44%|████▍ | 220/496 [10:54<13:28, 2.93s/it]
|
36612 |
45%|████▍ | 221/496 [10:57<13:45, 3.00s/it]
|
36613 |
45%|████▍ | 222/496 [11:00<13:46, 3.02s/it]
|
36614 |
45%|████▍ | 223/496 [11:03<13:38, 3.00s/it]
|
36615 |
45%|████▌ | 224/496 [11:07<14:38, 3.23s/it]
|
36616 |
45%|████▌ | 225/496 [11:11<15:20, 3.40s/it]
|
36617 |
46%|████▌ | 226/496 [11:14<14:45, 3.28s/it]
|
36618 |
46%|████▌ | 227/496 [11:17<14:04, 3.14s/it]
|
36619 |
46%|████▌ | 228/496 [11:20<14:05, 3.16s/it]
|
36620 |
46%|████▌ | 229/496 [11:23<13:34, 3.05s/it]
|
36621 |
46%|████▋ | 230/496 [11:26<13:29, 3.04s/it]
|
36622 |
47%|████▋ | 231/496 [11:29<13:37, 3.08s/it]
|
36623 |
47%|████▋ | 232/496 [11:32<13:34, 3.08s/it]
|
36624 |
47%|████▋ | 233/496 [11:35<13:48, 3.15s/it]
|
36625 |
47%|████▋ | 234/496 [11:38<13:23, 3.07s/it]
|
36626 |
47%|████▋ | 235/496 [11:41<13:19, 3.06s/it]
|
36627 |
48%|████▊ | 236/496 [11:44<13:16, 3.06s/it]
|
36628 |
48%|████▊ | 237/496 [11:47<12:48, 2.97s/it]
|
36629 |
48%|████▊ | 238/496 [11:50<12:54, 3.00s/it]
|
36630 |
48%|████▊ | 239/496 [11:53<13:25, 3.14s/it]
|
36631 |
48%|████▊ | 240/496 [11:56<12:47, 3.00s/it]
|
36632 |
49%|████▊ | 241/496 [11:59<12:53, 3.03s/it]
|
36633 |
49%|████▉ | 242/496 [12:02<12:46, 3.02s/it]
|
36634 |
49%|████▉ | 243/496 [12:05<12:26, 2.95s/it]
|
36635 |
49%|████▉ | 244/496 [12:08<12:30, 2.98s/it]
|
36636 |
49%|████▉ | 245/496 [12:12<13:17, 3.18s/it]
|
36637 |
50%|████▉ | 246/496 [12:15<12:56, 3.11s/it]
|
36638 |
50%|████▉ | 247/496 [12:18<12:59, 3.13s/it]
|
36639 |
50%|█████ | 248/496 [12:21<12:23, 3.00s/it]
|
36640 |
50%|█████ | 249/496 [12:23<12:17, 2.98s/it]
|
36641 |
50%|█████ | 250/496 [12:26<12:03, 2.94s/it]
|
36642 |
51%|█████ | 251/496 [12:29<11:18, 2.77s/it]
|
36643 |
51%|█████ | 252/496 [12:32<12:00, 2.95s/it]
|
36644 |
51%|█████ | 253/496 [12:35<12:21, 3.05s/it]
|
36645 |
51%|█████ | 254/496 [12:39<12:57, 3.21s/it]
|
36646 |
51%|█████▏ | 255/496 [12:41<11:52, 2.96s/it]
|
36647 |
52%|█████▏ | 256/496 [12:45<13:06, 3.28s/it]
|
36648 |
52%|█████▏ | 257/496 [12:48<12:45, 3.20s/it]
|
36649 |
52%|█████▏ | 258/496 [12:51<11:50, 2.98s/it]
|
36650 |
52%|█████▏ | 259/496 [12:54<11:58, 3.03s/it]
|
36651 |
52%|█████▏ | 260/496 [12:57<12:10, 3.09s/it]
|
36652 |
53%|█████▎ | 261/496 [13:00<11:42, 2.99s/it]
|
36653 |
53%|█████▎ | 262/496 [13:03<11:26, 2.93s/it]
|
36654 |
53%|█████▎ | 263/496 [13:06<11:14, 2.90s/it]
|
36655 |
53%|█████▎ | 264/496 [13:08<10:56, 2.83s/it]
|
36656 |
53%|█████▎ | 265/496 [13:12<11:29, 2.98s/it]
|
36657 |
54%|█████▎ | 266/496 [13:15<11:55, 3.11s/it]
|
36658 |
54%|█████▍ | 267/496 [13:19<12:29, 3.27s/it]
|
36659 |
54%|█████▍ | 268/496 [13:22<12:20, 3.25s/it]
|
36660 |
54%|█████▍ | 269/496 [13:25<12:22, 3.27s/it]
|
36661 |
54%|█████▍ | 270/496 [13:28<12:15, 3.25s/it]
|
36662 |
55%|█████▍ | 271/496 [13:31<12:00, 3.20s/it]
|
36663 |
55%|█████▍ | 272/496 [13:34<11:27, 3.07s/it]
|
36664 |
55%|█████▌ | 273/496 [13:37<11:03, 2.98s/it]
|
36665 |
55%|█████▌ | 274/496 [13:40<11:16, 3.05s/it]
|
36666 |
55%|█████▌ | 275/496 [13:44<11:45, 3.19s/it]
|
36667 |
56%|█████▌ | 276/496 [13:47<11:27, 3.12s/it]
|
36668 |
56%|█████▌ | 277/496 [13:49<11:01, 3.02s/it]
|
36669 |
56%|█████▌ | 278/496 [13:53<11:31, 3.17s/it]
|
36670 |
56%|█████▋ | 279/496 [13:56<11:23, 3.15s/it]
|
36671 |
56%|█████▋ | 280/496 [14:00<11:40, 3.24s/it]
|
36672 |
57%|█████▋ | 281/496 [14:03<11:21, 3.17s/it]
|
36673 |
57%|█████▋ | 282/496 [14:05<11:03, 3.10s/it]
|
36674 |
57%|█████▋ | 283/496 [14:11<13:06, 3.69s/it]
|
36675 |
57%|█████▋ | 284/496 [14:13<11:46, 3.33s/it]
|
36676 |
57%|█████▋ | 285/496 [14:16<10:51, 3.09s/it]
|
36677 |
58%|█████▊ | 286/496 [14:19<11:13, 3.21s/it]
|
36678 |
58%|█████▊ | 287/496 [14:22<10:49, 3.11s/it]
|
36679 |
58%|█████▊ | 288/496 [14:26<11:41, 3.37s/it]
|
36680 |
58%|█████▊ | 289/496 [14:29<11:08, 3.23s/it]
|
36681 |
58%|█████▊ | 290/496 [14:32<10:46, 3.14s/it]
|
36682 |
59%|█████▊ | 291/496 [14:35<10:25, 3.05s/it]
|
36683 |
59%|█████▉ | 292/496 [14:37<10:12, 3.00s/it]
|
36684 |
59%|█████▉ | 293/496 [14:40<09:17, 2.75s/it]
|
36685 |
59%|█████▉ | 294/496 [14:42<09:16, 2.76s/it]
|
36686 |
59%|█████▉ | 295/496 [14:46<10:04, 3.01s/it]
|
36687 |
60%|█████▉ | 296/496 [14:49<09:48, 2.94s/it]
|
36688 |
60%|█████▉ | 297/496 [14:51<09:13, 2.78s/it]
|
36689 |
60%|██████ | 298/496 [14:54<08:45, 2.65s/it]
|
36690 |
60%|██████ | 299/496 [14:56<08:37, 2.63s/it]
|
36691 |
60%|██████ | 300/496 [14:59<09:02, 2.77s/it]
|
36692 |
61%|██████ | 301/496 [15:02<08:58, 2.76s/it]
|
36693 |
61%|██████ | 302/496 [15:06<10:03, 3.11s/it]
|
36694 |
61%|██████ | 303/496 [15:09<10:05, 3.14s/it]
|
36695 |
61%|██████▏ | 304/496 [15:12<10:06, 3.16s/it]
|
36696 |
61%|██████▏ | 305/496 [15:15<09:26, 2.97s/it]
|
36697 |
62%|██████▏ | 306/496 [15:17<09:09, 2.89s/it]
|
36698 |
62%|██████▏ | 307/496 [15:20<08:48, 2.80s/it]
|
36699 |
62%|██████▏ | 308/496 [15:23<08:41, 2.77s/it]
|
36700 |
62%|██████▏ | 309/496 [15:26<08:40, 2.78s/it]
|
36701 |
62%|██████▎ | 310/496 [15:29<09:10, 2.96s/it]
|
36702 |
63%|██████▎ | 311/496 [15:32<09:38, 3.13s/it]
|
36703 |
63%|██████▎ | 312/496 [15:36<09:44, 3.18s/it]
|
36704 |
63%|██████▎ | 313/496 [15:38<08:43, 2.86s/it]
|
36705 |
63%|██████▎ | 314/496 [15:41<08:28, 2.79s/it]
|
36706 |
64%|██████▎ | 315/496 [15:44<08:42, 2.89s/it]
|
36707 |
64%|██████▎ | 316/496 [15:47<08:39, 2.88s/it]
|
36708 |
64%|██████▍ | 317/496 [15:49<08:37, 2.89s/it]
|
36709 |
64%|██████▍ | 318/496 [15:52<08:38, 2.91s/it]
|
36710 |
64%|██████▍ | 319/496 [15:56<09:25, 3.19s/it]
|
36711 |
65%|██████▍ | 320/496 [15:59<08:56, 3.05s/it]
|
36712 |
65%|██████▍ | 321/496 [16:02<08:32, 2.93s/it]
|
36713 |
65%|██████▍ | 322/496 [16:04<08:17, 2.86s/it]
|
36714 |
65%|██████▌ | 323/496 [16:08<08:36, 2.98s/it]
|
36715 |
65%|██████▌ | 324/496 [16:11<08:33, 2.99s/it]
|
36716 |
66%|██████▌ | 325/496 [16:13<08:05, 2.84s/it]
|
36717 |
66%|██████▌ | 326/496 [16:16<08:22, 2.96s/it]
|
36718 |
66%|██████▌ | 327/496 [16:19<07:59, 2.83s/it]
|
36719 |
66%|██████▌ | 328/496 [16:21<07:46, 2.77s/it]
|
36720 |
66%|██████▋ | 329/496 [16:25<08:04, 2.90s/it]
|
36721 |
67%|██████▋ | 330/496 [16:27<07:52, 2.85s/it]
|
36722 |
67%|██████▋ | 331/496 [16:31<08:08, 2.96s/it]
|
36723 |
67%|██████▋ | 332/496 [16:34<08:15, 3.02s/it]
|
36724 |
67%|██████▋ | 333/496 [16:37<08:10, 3.01s/it]
|
36725 |
67%|██████▋ | 334/496 [16:40<07:54, 2.93s/it]
|
36726 |
68%|██████▊ | 335/496 [16:43<08:04, 3.01s/it]
|
36727 |
68%|██████▊ | 336/496 [16:46<08:23, 3.15s/it]
|
36728 |
68%|██████▊ | 337/496 [16:49<08:15, 3.11s/it]
|
36729 |
68%|██████▊ | 338/496 [16:52<07:48, 2.96s/it]
|
36730 |
68%|██████▊ | 339/496 [16:54<07:26, 2.84s/it]
|
36731 |
69%|██████▊ | 340/496 [16:58<07:36, 2.93s/it]
|
36732 |
69%|██████▉ | 341/496 [17:01<07:49, 3.03s/it]
|
36733 |
69%|██████▉ | 342/496 [17:04<08:04, 3.14s/it]
|
36734 |
69%|██████▉ | 343/496 [17:07<08:00, 3.14s/it]
|
36735 |
69%|██████▉ | 344/496 [17:10<07:49, 3.09s/it]
|
36736 |
70%|██████▉ | 345/496 [17:13<07:27, 2.97s/it]
|
36737 |
70%|██████▉ | 346/496 [17:15<07:05, 2.84s/it]
|
36738 |
70%|██████▉ | 347/496 [17:19<07:14, 2.92s/it]
|
36739 |
70%|███████ | 348/496 [17:22<07:13, 2.93s/it]
|
36740 |
70%|███████ | 349/496 [17:26<08:25, 3.44s/it]
|
36741 |
71%|███████ | 350/496 [17:29<08:12, 3.38s/it]
|
36742 |
71%|███████ | 351/496 [17:32<07:51, 3.25s/it]
|
36743 |
71%|███████ | 352/496 [17:35<07:31, 3.13s/it]
|
36744 |
71%|███████ | 353/496 [17:38<07:24, 3.11s/it]
|
36745 |
71%|███████▏ | 354/496 [17:41<07:23, 3.12s/it]
|
36746 |
72%|███████▏ | 355/496 [17:45<07:33, 3.21s/it]
|
36747 |
72%|███████▏ | 356/496 [17:48<07:27, 3.20s/it]
|
36748 |
72%|███████▏ | 357/496 [17:51<07:14, 3.13s/it]
|
36749 |
72%|███████▏ | 358/496 [17:53<06:41, 2.91s/it]
|
36750 |
72%|███████▏ | 359/496 [17:57<06:47, 2.97s/it]
|
36751 |
73%|███████▎ | 360/496 [18:00<06:47, 3.00s/it]
|
36752 |
73%|███████▎ | 361/496 [18:02<06:37, 2.94s/it]
|
36753 |
73%|███████▎ | 362/496 [18:06<06:55, 3.10s/it]
|
36754 |
73%|███████▎ | 363/496 [18:09<06:44, 3.04s/it]
|
36755 |
73%|███████▎ | 364/496 [18:11<06:21, 2.89s/it]
|
36756 |
74%|███████▎ | 365/496 [18:14<06:14, 2.86s/it]
|
36757 |
74%|███████▍ | 366/496 [18:17<06:06, 2.82s/it]
|
36758 |
74%|███████▍ | 367/496 [18:19<05:56, 2.76s/it]
|
36759 |
74%|███████▍ | 368/496 [18:23<06:24, 3.00s/it]
|
36760 |
74%|███████▍ | 369/496 [18:26<06:17, 2.97s/it]
|
36761 |
75%|███████▍ | 370/496 [18:29<06:24, 3.05s/it]
|
36762 |
75%|███████▍ | 371/496 [18:32<06:29, 3.12s/it]
|
36763 |
75%|███████▌ | 372/496 [18:35<06:12, 3.01s/it]
|
36764 |
75%|███████▌ | 373/496 [18:38<06:07, 2.99s/it]
|
36765 |
75%|███████▌ | 374/496 [18:41<06:02, 2.97s/it]
|
36766 |
76%|███████▌ | 375/496 [18:44<06:11, 3.07s/it]
|
36767 |
76%|███████▌ | 376/496 [18:47<05:57, 2.98s/it]
|
36768 |
76%|███████▌ | 377/496 [18:50<05:56, 3.00s/it]
|
36769 |
76%|███████▌ | 378/496 [18:53<05:44, 2.92s/it]
|
36770 |
76%|███████▋ | 379/496 [18:55<05:22, 2.75s/it]
|
36771 |
77%|███████▋ | 380/496 [18:58<05:30, 2.85s/it]
|
36772 |
77%|███████▋ | 381/496 [19:01<05:15, 2.74s/it]
|
36773 |
77%|███████▋ | 382/496 [19:04<05:25, 2.86s/it]
|
36774 |
77%|███████▋ | 383/496 [19:07<05:37, 2.99s/it]
|
36775 |
77%|███████▋ | 384/496 [19:10<05:12, 2.79s/it]
|
36776 |
78%|███████▊ | 385/496 [19:13<05:26, 2.94s/it]
|
36777 |
78%|███████▊ | 386/496 [19:16<05:28, 2.98s/it]
|
36778 |
78%|███████▊ | 387/496 [19:19<05:29, 3.03s/it]
|
36779 |
78%|███████▊ | 388/496 [19:22<05:28, 3.04s/it]
|
36780 |
78%|███████▊ | 389/496 [19:25<05:30, 3.09s/it]
|
36781 |
79%|███████▊ | 390/496 [19:28<05:22, 3.05s/it]
|
36782 |
79%|███████▉ | 391/496 [19:31<05:18, 3.04s/it]
|
36783 |
79%|███████▉ | 392/496 [19:34<05:09, 2.98s/it]
|
36784 |
79%|███████▉ | 393/496 [19:37<04:59, 2.91s/it]
|
36785 |
79%|███████▉ | 394/496 [19:40<05:02, 2.96s/it]
|
36786 |
80%|███████▉ | 395/496 [19:42<04:42, 2.80s/it]
|
36787 |
80%|███████▉ | 396/496 [19:46<04:57, 2.98s/it]
|
36788 |
80%|████████ | 397/496 [19:49<05:02, 3.06s/it]
|
36789 |
80%|████████ | 398/496 [19:52<05:09, 3.16s/it]
|
36790 |
80%|████████ | 399/496 [19:55<04:43, 2.92s/it]
|
36791 |
81%|████████ | 400/496 [19:57<04:30, 2.81s/it]
|
36792 |
81%|████████ | 401/496 [20:01<04:50, 3.06s/it]
|
36793 |
81%|████████ | 402/496 [20:04<04:43, 3.02s/it]
|
36794 |
81%|████████▏ | 403/496 [20:08<05:19, 3.43s/it]
|
36795 |
81%|████████▏ | 404/496 [20:11<04:55, 3.21s/it]
|
36796 |
82%|████████▏ | 405/496 [20:14<04:48, 3.17s/it]
|
36797 |
82%|████████▏ | 406/496 [20:16<04:22, 2.92s/it]
|
36798 |
82%|████████▏ | 407/496 [20:19<04:15, 2.87s/it]
|
36799 |
82%|████████▏ | 408/496 [20:22<04:14, 2.89s/it]
|
36800 |
82%|████████▏ | 409/496 [20:25<04:05, 2.82s/it]
|
36801 |
83%|████████▎ | 410/496 [20:27<03:58, 2.78s/it]
|
36802 |
83%|████████▎ | 411/496 [20:31<04:08, 2.92s/it]
|
36803 |
83%|████████▎ | 412/496 [20:34<04:13, 3.01s/it]
|
36804 |
83%|████████▎ | 413/496 [20:37<04:20, 3.14s/it]
|
36805 |
83%|████████▎ | 414/496 [20:40<04:17, 3.14s/it]
|
36806 |
84%|████████▎ | 415/496 [20:44<04:27, 3.30s/it]
|
36807 |
84%|████████▍ | 416/496 [20:47<04:13, 3.17s/it]
|
36808 |
84%|████████▍ | 417/496 [20:50<04:05, 3.11s/it]
|
36809 |
84%|████████▍ | 418/496 [20:53<03:54, 3.01s/it]
|
36810 |
84%|████████▍ | 419/496 [20:55<03:40, 2.86s/it]
|
36811 |
85%|████████▍ | 420/496 [20:58<03:25, 2.70s/it]
|
36812 |
85%|████████▍ | 421/496 [21:00<03:18, 2.65s/it]
|
36813 |
85%|████████▌ | 422/496 [21:03<03:18, 2.69s/it]
|
36814 |
85%|████████▌ | 423/496 [21:05<03:08, 2.58s/it]
|
36815 |
85%|████████▌ | 424/496 [21:08<03:17, 2.74s/it]
|
36816 |
86%|████████▌ | 425/496 [21:11<03:16, 2.77s/it]
|
36817 |
86%|████████▌ | 426/496 [21:15<03:25, 2.94s/it]
|
36818 |
86%|████████▌ | 427/496 [21:17<03:22, 2.93s/it]
|
36819 |
86%|████████▋ | 428/496 [21:21<03:24, 3.01s/it]
|
36820 |
86%|████████▋ | 429/496 [21:23<03:14, 2.90s/it]
|
36821 |
87%|████████▋ | 430/496 [21:26<03:06, 2.83s/it]
|
36822 |
87%|████████▋ | 431/496 [21:29<03:09, 2.92s/it]
|
36823 |
87%|████████▋ | 432/496 [21:32<03:10, 2.98s/it]
|
36824 |
87%|████████▋ | 433/496 [21:35<02:57, 2.82s/it]
|
36825 |
88%|████████▊ | 434/496 [21:38<02:58, 2.88s/it]
|
36826 |
88%|████████▊ | 435/496 [21:41<02:55, 2.87s/it]
|
36827 |
88%|████████▊ | 436/496 [21:44<02:57, 2.95s/it]
|
36828 |
88%|████████▊ | 437/496 [21:47<03:09, 3.20s/it]
|
36829 |
88%|████████▊ | 438/496 [21:50<02:58, 3.07s/it]
|
36830 |
89%|████████▊ | 439/496 [21:53<02:57, 3.11s/it]
|
36831 |
89%|████████▊ | 440/496 [21:56<02:50, 3.04s/it]
|
36832 |
89%|████████▉ | 441/496 [22:00<02:50, 3.10s/it]
|
36833 |
89%|████████▉ | 442/496 [22:02<02:45, 3.06s/it]
|
36834 |
89%|████████▉ | 443/496 [22:06<02:51, 3.24s/it]
|
36835 |
90%|████████▉ | 444/496 [22:09<02:41, 3.11s/it]
|
36836 |
90%|████████▉ | 445/496 [22:12<02:34, 3.02s/it]
|
36837 |
90%|████████▉ | 446/496 [22:15<02:27, 2.95s/it]
|
36838 |
90%|█████████ | 447/496 [22:18<02:25, 2.97s/it]
|
36839 |
90%|█████████ | 448/496 [22:21<02:24, 3.00s/it]
|
36840 |
91%|█████████ | 449/496 [22:24<02:27, 3.14s/it]
|
36841 |
91%|█████████ | 450/496 [22:27<02:17, 2.99s/it]
|
36842 |
91%|█████████ | 451/496 [22:29<02:04, 2.76s/it]
|
36843 |
91%|█████████ | 452/496 [22:32<01:59, 2.71s/it]
|
36844 |
91%|█████████▏| 453/496 [22:35<02:06, 2.95s/it]
|
36845 |
92%|█████████▏| 454/496 [22:39<02:15, 3.22s/it]
|
36846 |
92%|█████████▏| 455/496 [22:41<02:02, 2.99s/it]
|
36847 |
92%|█████████▏| 456/496 [22:44<01:59, 2.99s/it]
|
36848 |
92%|█████████▏| 457/496 [22:48<02:03, 3.18s/it]
|
36849 |
92%|█████████▏| 458/496 [22:50<01:51, 2.94s/it]
|
36850 |
93%|█████████▎| 459/496 [22:54<01:59, 3.23s/it]
|
36851 |
93%|█████████▎| 460/496 [22:57<01:53, 3.16s/it]
|
36852 |
93%|█████████▎| 461/496 [23:00<01:47, 3.07s/it]
|
36853 |
93%|█████████▎| 462/496 [23:03<01:41, 2.98s/it]
|
36854 |
93%|█████████▎| 463/496 [23:06<01:37, 2.96s/it]
|
36855 |
94%|█████████▎| 464/496 [23:09<01:39, 3.10s/it]
|
36856 |
94%|█████████▍| 465/496 [23:12<01:32, 2.97s/it]
|
36857 |
94%|█████████▍| 466/496 [23:15<01:26, 2.87s/it]
|
36858 |
94%|█████████▍| 467/496 [23:17<01:19, 2.76s/it]
|
36859 |
94%|█████████▍| 468/496 [23:20<01:17, 2.78s/it]
|
36860 |
95%|█████████▍| 469/496 [23:23<01:17, 2.87s/it]
|
36861 |
95%|█████████▍| 470/496 [23:26<01:15, 2.89s/it]
|
36862 |
95%|█████████▍| 471/496 [23:29<01:11, 2.86s/it]
|
36863 |
95%|█████████▌| 472/496 [23:32<01:09, 2.91s/it]
|
36864 |
95%|█████████▌| 473/496 [23:34<01:04, 2.79s/it]
|
36865 |
96%|█████████▌| 474/496 [23:37<01:02, 2.85s/it]
|
36866 |
96%|█████████▌| 475/496 [23:40<00:59, 2.84s/it]
|
36867 |
96%|█████████▌| 476/496 [23:43<00:55, 2.80s/it]
|
36868 |
96%|█████████▌| 477/496 [23:46<00:53, 2.82s/it]
|
36869 |
96%|█████████▋| 478/496 [23:49<00:51, 2.86s/it]
|
36870 |
97%|█████████▋| 479/496 [23:51<00:47, 2.79s/it]
|
36871 |
97%|█████████▋| 480/496 [23:54<00:46, 2.88s/it]
|
36872 |
97%|█████████▋| 481/496 [23:57<00:44, 2.95s/it]
|
36873 |
97%|█████████▋| 482/496 [24:00<00:41, 2.95s/it]
|
36874 |
97%|█████████▋| 483/496 [24:03<00:38, 2.93s/it]
|
36875 |
98%|█████████▊| 484/496 [24:07<00:36, 3.07s/it]
|
36876 |
98%|█████████▊| 485/496 [24:09<00:33, 3.00s/it]
|
36877 |
98%|█████████▊| 486/496 [24:12<00:29, 2.94s/it]
|
36878 |
98%|█████████▊| 487/496 [24:15<00:27, 3.02s/it]
|
36879 |
98%|█████████▊| 488/496 [24:18<00:23, 3.00s/it]
|
36880 |
99%|█████████▊| 489/496 [24:21<00:20, 2.96s/it]
|
36881 |
99%|█████████▉| 490/496 [24:24<00:17, 2.91s/it]
|
36882 |
99%|█████████▉| 491/496 [24:27<00:14, 3.00s/it]
|
36883 |
99%|█████████▉| 492/496 [24:30<00:11, 2.98s/it]
|
36884 |
99%|█████████▉| 493/496 [24:33<00:09, 3.06s/it]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
36388 |
To https://huggingface.co/ales/whisper-base-belarusian
|
36389 |
4074dad..52d55ef main -> main
|
36390 |
|
36391 |
+
|
36392 |
+
To https://huggingface.co/ales/whisper-base-belarusian
|
36393 |
+
52d55ef..4aae45b main -> main
|
36394 |
+
|
36395 |
+
12/17/2022 17:59:11 - WARNING - huggingface_hub.repository - To https://huggingface.co/ales/whisper-base-belarusian
|
36396 |
+
52d55ef..4aae45b main -> main
|
36397 |
+
|
36398 |
+
***** train metrics *****
|
36399 |
+
epoch = 1.1
|
36400 |
+
train_loss = 0.1772
|
36401 |
+
train_runtime = 17:08:57.38
|
36402 |
+
train_samples_per_second = 6.22
|
36403 |
+
train_steps_per_second = 0.097
|
36404 |
+
12/17/2022 17:59:14 - INFO - __main__ - *** Evaluate ***
|
36405 |
+
[INFO|trainer.py:710] 2022-12-17 17:59:14,350 >> The following columns in the evaluation set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: sentence, labels_truncated, input_length, labels_length, audio. If sentence, labels_truncated, input_length, labels_length, audio are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.
|
36406 |
+
[INFO|trainer.py:2955] 2022-12-17 17:59:14,353 >> ***** Running Evaluation *****
|
36407 |
+
[INFO|trainer.py:2957] 2022-12-17 17:59:14,353 >> Num examples = 15872
|
36408 |
+
[INFO|trainer.py:2960] 2022-12-17 17:59:14,353 >> Batch size = 32
|
36409 |
+
|
36410 |
0%| | 0/496 [00:00<?, ?it/s]
|
36411 |
0%| | 2/496 [00:02<12:12, 1.48s/it]
|
36412 |
1%| | 3/496 [00:06<18:24, 2.24s/it]
|
36413 |
1%| | 4/496 [00:09<21:51, 2.67s/it]
|
36414 |
1%| | 5/496 [00:12<23:42, 2.90s/it]
|
36415 |
1%| | 6/496 [00:16<24:19, 2.98s/it]
|
36416 |
1%|▏ | 7/496 [00:20<27:04, 3.32s/it]
|
36417 |
2%|▏ | 8/496 [00:23<27:39, 3.40s/it]
|
36418 |
2%|▏ | 9/496 [00:26<25:56, 3.20s/it]
|
36419 |
2%|▏ | 10/496 [00:29<25:11, 3.11s/it]
|
36420 |
2%|▏ | 11/496 [00:32<24:23, 3.02s/it]
|
36421 |
2%|▏ | 12/496 [00:35<25:18, 3.14s/it]
|
36422 |
3%|▎ | 13/496 [00:38<25:26, 3.16s/it]
|
36423 |
3%|▎ | 14/496 [00:41<24:15, 3.02s/it]
|
36424 |
3%|▎ | 15/496 [00:45<25:47, 3.22s/it]
|
36425 |
3%|▎ | 16/496 [00:48<25:38, 3.21s/it]
|
36426 |
3%|▎ | 17/496 [00:51<25:22, 3.18s/it]
|
36427 |
4%|▎ | 18/496 [00:54<24:15, 3.05s/it]
|
36428 |
4%|▍ | 19/496 [00:57<24:07, 3.03s/it]
|
36429 |
4%|▍ | 20/496 [01:00<24:16, 3.06s/it]
|
36430 |
4%|▍ | 21/496 [01:03<24:03, 3.04s/it]
|
36431 |
4%|▍ | 22/496 [01:06<23:17, 2.95s/it]
|
36432 |
5%|▍ | 23/496 [01:09<24:46, 3.14s/it]
|
36433 |
5%|▍ | 24/496 [01:12<23:55, 3.04s/it]
|
36434 |
5%|▌ | 25/496 [01:16<25:09, 3.20s/it]
|
36435 |
5%|▌ | 26/496 [01:19<25:19, 3.23s/it]
|
36436 |
5%|▌ | 27/496 [01:22<24:26, 3.13s/it]
|
36437 |
6%|▌ | 28/496 [01:25<23:56, 3.07s/it]
|
36438 |
6%|▌ | 29/496 [01:28<24:39, 3.17s/it]
|
36439 |
6%|▌ | 30/496 [01:31<25:05, 3.23s/it]
|
36440 |
6%|▋ | 31/496 [01:34<23:58, 3.09s/it]
|
36441 |
6%|▋ | 32/496 [01:38<25:00, 3.23s/it]
|
36442 |
7%|▋ | 33/496 [01:42<27:41, 3.59s/it]
|
36443 |
7%|▋ | 34/496 [01:45<25:28, 3.31s/it]
|
36444 |
7%|▋ | 35/496 [01:48<25:38, 3.34s/it]
|
36445 |
7%|▋ | 36/496 [01:52<25:34, 3.34s/it]
|
36446 |
7%|▋ | 37/496 [01:54<24:04, 3.15s/it]
|
36447 |
8%|▊ | 38/496 [01:57<24:04, 3.16s/it]
|
36448 |
8%|▊ | 39/496 [02:01<23:59, 3.15s/it]
|
36449 |
8%|▊ | 40/496 [02:03<22:32, 2.97s/it]
|
36450 |
8%|▊ | 41/496 [02:06<22:10, 2.92s/it]
|
36451 |
8%|▊ | 42/496 [02:09<23:02, 3.05s/it]
|
36452 |
9%|▊ | 43/496 [02:13<23:49, 3.16s/it]
|
36453 |
9%|▉ | 44/496 [02:16<24:04, 3.20s/it]
|
36454 |
9%|▉ | 45/496 [02:19<22:39, 3.01s/it]
|
36455 |
9%|▉ | 46/496 [02:21<21:54, 2.92s/it]
|
36456 |
9%|▉ | 47/496 [02:24<20:50, 2.78s/it]
|
36457 |
10%|▉ | 48/496 [02:27<21:49, 2.92s/it]
|
36458 |
10%|▉ | 49/496 [02:30<21:10, 2.84s/it]
|
36459 |
10%|█ | 50/496 [02:32<20:34, 2.77s/it]
|
36460 |
10%|█ | 51/496 [02:35<21:04, 2.84s/it]
|
36461 |
10%|█ | 52/496 [02:38<21:39, 2.93s/it]
|
36462 |
11%|█ | 53/496 [02:41<20:54, 2.83s/it]
|
36463 |
11%|█ | 54/496 [02:44<20:25, 2.77s/it]
|
36464 |
11%|█ | 55/496 [02:46<20:03, 2.73s/it]
|
36465 |
11%|█▏ | 56/496 [02:49<21:03, 2.87s/it]
|
36466 |
11%|█▏ | 57/496 [02:52<21:03, 2.88s/it]
|
36467 |
12%|█▏ | 58/496 [02:55<20:26, 2.80s/it]
|
36468 |
12%|█▏ | 59/496 [02:58<20:13, 2.78s/it]
|
36469 |
12%|█▏ | 60/496 [03:01<20:47, 2.86s/it]
|
36470 |
12%|█▏ | 61/496 [03:03<20:19, 2.80s/it]
|
36471 |
12%|█▎ | 62/496 [03:06<20:46, 2.87s/it]
|
36472 |
13%|█▎ | 63/496 [03:09<20:45, 2.88s/it]
|
36473 |
13%|█▎ | 64/496 [03:12<20:54, 2.91s/it]
|
36474 |
13%|█▎ | 65/496 [03:16<21:28, 2.99s/it]
|
36475 |
13%|█▎ | 66/496 [03:19<21:31, 3.00s/it]
|
36476 |
14%|█▎ | 67/496 [03:21<20:14, 2.83s/it]
|
36477 |
14%|█▎ | 68/496 [03:23<19:18, 2.71s/it]
|
36478 |
14%|█▍ | 69/496 [03:26<19:26, 2.73s/it]
|
36479 |
14%|█▍ | 70/496 [03:29<19:42, 2.78s/it]
|
36480 |
14%|█▍ | 71/496 [03:32<20:16, 2.86s/it]
|
36481 |
15%|█▍ | 72/496 [03:35<20:12, 2.86s/it]
|
36482 |
15%|█▍ | 73/496 [03:38<20:02, 2.84s/it]
|
36483 |
15%|█▍ | 74/496 [03:40<19:41, 2.80s/it]
|
36484 |
15%|█▌ | 75/496 [03:43<19:55, 2.84s/it]
|
36485 |
15%|█▌ | 76/496 [03:47<20:28, 2.93s/it]
|
36486 |
16%|█▌ | 77/496 [03:50<21:00, 3.01s/it]
|
36487 |
16%|█▌ | 78/496 [03:53<20:37, 2.96s/it]
|
36488 |
16%|█▌ | 79/496 [03:56<21:21, 3.07s/it]
|
36489 |
16%|█▌ | 80/496 [03:59<21:38, 3.12s/it]
|
36490 |
16%|█▋ | 81/496 [04:03<22:28, 3.25s/it]
|
36491 |
17%|█▋ | 82/496 [04:06<22:22, 3.24s/it]
|
36492 |
17%|█▋ | 83/496 [04:09<21:24, 3.11s/it]
|
36493 |
17%|█▋ | 84/496 [04:12<22:08, 3.23s/it]
|
36494 |
17%|█▋ | 85/496 [04:15<22:00, 3.21s/it]
|
36495 |
17%|█▋ | 86/496 [04:19<22:39, 3.32s/it]
|
36496 |
18%|█▊ | 87/496 [04:22<22:18, 3.27s/it]
|
36497 |
18%|█▊ | 88/496 [04:25<21:10, 3.11s/it]
|
36498 |
18%|█▊ | 89/496 [04:28<20:45, 3.06s/it]
|
36499 |
18%|█▊ | 90/496 [04:31<20:32, 3.04s/it]
|
36500 |
18%|█▊ | 91/496 [04:34<21:21, 3.16s/it]
|
36501 |
19%|█▊ | 92/496 [04:37<21:17, 3.16s/it]
|
36502 |
19%|█▉ | 93/496 [04:41<21:41, 3.23s/it]
|
36503 |
19%|█▉ | 94/496 [04:44<21:48, 3.26s/it]
|
36504 |
19%|█▉ | 95/496 [04:48<21:58, 3.29s/it]
|
36505 |
19%|█▉ | 96/496 [04:50<20:33, 3.08s/it]
|
36506 |
20%|█▉ | 97/496 [04:53<20:22, 3.06s/it]
|
36507 |
20%|█▉ | 98/496 [04:56<20:15, 3.06s/it]
|
36508 |
20%|█▉ | 99/496 [04:59<20:11, 3.05s/it]
|
36509 |
20%|██ | 100/496 [05:02<19:38, 2.98s/it]
|
36510 |
20%|██ | 101/496 [05:05<19:09, 2.91s/it]
|
36511 |
21%|██ | 102/496 [05:08<18:50, 2.87s/it]
|
36512 |
21%|██ | 103/496 [05:10<18:56, 2.89s/it]
|
36513 |
21%|██ | 104/496 [05:13<18:31, 2.84s/it]
|
36514 |
21%|██ | 105/496 [05:16<19:08, 2.94s/it]
|
36515 |
21%|██▏ | 106/496 [05:19<19:21, 2.98s/it]
|
36516 |
22%|██▏ | 107/496 [05:23<19:42, 3.04s/it]
|
36517 |
22%|██▏ | 108/496 [05:25<19:19, 2.99s/it]
|
36518 |
22%|██▏ | 109/496 [05:28<19:15, 2.98s/it]
|
36519 |
22%|██▏ | 110/496 [05:31<18:53, 2.94s/it]
|
36520 |
22%|██▏ | 111/496 [05:34<18:13, 2.84s/it]
|
36521 |
23%|██▎ | 112/496 [05:37<18:49, 2.94s/it]
|
36522 |
23%|██▎ | 113/496 [05:39<17:44, 2.78s/it]
|
36523 |
23%|██▎ | 114/496 [05:42<17:41, 2.78s/it]
|
36524 |
23%|██▎ | 115/496 [05:45<17:20, 2.73s/it]
|
36525 |
23%|██▎ | 116/496 [05:48<18:26, 2.91s/it]
|
36526 |
24%|██▎ | 117/496 [05:51<18:20, 2.90s/it]
|
36527 |
24%|██▍ | 118/496 [05:54<17:44, 2.82s/it]
|
36528 |
24%|██▍ | 119/496 [05:56<17:24, 2.77s/it]
|
36529 |
24%|██▍ | 120/496 [05:59<17:57, 2.87s/it]
|
36530 |
24%|██▍ | 121/496 [06:02<17:45, 2.84s/it]
|
36531 |
25%|██▍ | 122/496 [06:05<18:00, 2.89s/it]
|
36532 |
25%|██▍ | 123/496 [06:08<18:31, 2.98s/it]
|
36533 |
25%|██▌ | 124/496 [06:11<17:33, 2.83s/it]
|
36534 |
25%|██▌ | 125/496 [06:14<17:35, 2.84s/it]
|
36535 |
25%|██▌ | 126/496 [06:17<17:50, 2.89s/it]
|
36536 |
26%|██▌ | 127/496 [06:20<18:29, 3.01s/it]
|
36537 |
26%|██▌ | 128/496 [06:23<18:19, 2.99s/it]
|
36538 |
26%|██▌ | 129/496 [06:26<17:38, 2.88s/it]
|
36539 |
26%|██▌ | 130/496 [06:29<17:56, 2.94s/it]
|
36540 |
26%|██▋ | 131/496 [06:32<17:49, 2.93s/it]
|
36541 |
27%|██▋ | 132/496 [06:34<17:03, 2.81s/it]
|
36542 |
27%|██▋ | 133/496 [06:37<16:22, 2.71s/it]
|
36543 |
27%|██▋ | 134/496 [06:40<16:39, 2.76s/it]
|
36544 |
27%|██▋ | 135/496 [06:43<17:11, 2.86s/it]
|
36545 |
27%|██▋ | 136/496 [06:46<17:18, 2.89s/it]
|
36546 |
28%|██▊ | 137/496 [06:48<16:54, 2.82s/it]
|
36547 |
28%|██▊ | 138/496 [06:51<17:06, 2.87s/it]
|
36548 |
28%|██▊ | 139/496 [06:54<17:28, 2.94s/it]
|
36549 |
28%|██▊ | 140/496 [06:58<18:10, 3.06s/it]
|
36550 |
28%|██▊ | 141/496 [07:01<17:53, 3.02s/it]
|
36551 |
29%|██▊ | 142/496 [07:04<18:21, 3.11s/it]
|
36552 |
29%|██▉ | 143/496 [07:07<17:51, 3.03s/it]
|
36553 |
29%|██▉ | 144/496 [07:09<17:06, 2.92s/it]
|
36554 |
29%|██▉ | 145/496 [07:12<17:13, 2.94s/it]
|
36555 |
29%|██▉ | 146/496 [07:16<17:28, 3.00s/it]
|
36556 |
30%|██▉ | 147/496 [07:19<18:15, 3.14s/it]
|
36557 |
30%|██▉ | 148/496 [07:22<17:54, 3.09s/it]
|
36558 |
30%|███ | 149/496 [07:25<17:31, 3.03s/it]
|
36559 |
30%|███ | 150/496 [07:28<17:50, 3.09s/it]
|
36560 |
30%|███ | 151/496 [07:31<16:52, 2.94s/it]
|
36561 |
31%|███ | 152/496 [07:35<18:21, 3.20s/it]
|
36562 |
31%|███ | 153/496 [07:38<18:37, 3.26s/it]
|
36563 |
31%|███ | 154/496 [07:40<17:17, 3.03s/it]
|
36564 |
31%|███▏ | 155/496 [07:43<16:31, 2.91s/it]
|
36565 |
31%|███▏ | 156/496 [07:46<16:33, 2.92s/it]
|
36566 |
32%|███▏ | 157/496 [07:49<16:31, 2.92s/it]
|
36567 |
32%|███▏ | 158/496 [07:51<15:11, 2.70s/it]
|
36568 |
32%|███▏ | 159/496 [07:54<14:47, 2.63s/it]
|
36569 |
32%|███▏ | 160/496 [07:56<14:20, 2.56s/it]
|
36570 |
32%|███▏ | 161/496 [07:59<14:47, 2.65s/it]
|
36571 |
33%|███▎ | 162/496 [08:02<15:13, 2.73s/it]
|
36572 |
33%|███▎ | 163/496 [08:05<15:25, 2.78s/it]
|
36573 |
33%|███▎ | 164/496 [08:08<16:01, 2.90s/it]
|
36574 |
33%|███▎ | 165/496 [08:11<16:58, 3.08s/it]
|
36575 |
33%|███▎ | 166/496 [08:15<17:12, 3.13s/it]
|
36576 |
34%|███▎ | 167/496 [08:17<16:00, 2.92s/it]
|
36577 |
34%|███▍ | 168/496 [08:20<15:34, 2.85s/it]
|
36578 |
34%|███▍ | 169/496 [08:23<15:40, 2.88s/it]
|
36579 |
34%|███▍ | 170/496 [08:25<15:37, 2.88s/it]
|
36580 |
34%|███▍ | 171/496 [08:28<15:08, 2.79s/it]
|
36581 |
35%|███▍ | 172/496 [08:31<15:44, 2.92s/it]
|
36582 |
35%|███▍ | 173/496 [08:34<15:27, 2.87s/it]
|
36583 |
35%|███▌ | 174/496 [08:37<15:02, 2.80s/it]
|
36584 |
35%|███▌ | 175/496 [08:40<15:04, 2.82s/it]
|
36585 |
35%|███▌ | 176/496 [08:43<15:36, 2.93s/it]
|
36586 |
36%|███▌ | 177/496 [08:45<15:06, 2.84s/it]
|
36587 |
36%|███▌ | 178/496 [08:49<16:49, 3.17s/it]
|
36588 |
36%|███▌ | 179/496 [08:52<16:22, 3.10s/it]
|
36589 |
36%|███▋ | 180/496 [08:55<16:15, 3.09s/it]
|
36590 |
36%|███▋ | 181/496 [08:58<16:05, 3.07s/it]
|
36591 |
37%|███▋ | 182/496 [09:01<15:18, 2.92s/it]
|
36592 |
37%|███▋ | 183/496 [09:04<15:09, 2.91s/it]
|
36593 |
37%|███▋ | 184/496 [09:07<14:51, 2.86s/it]
|
36594 |
37%|███▋ | 185/496 [09:10<15:17, 2.95s/it]
|
36595 |
38%|███▊ | 186/496 [09:13<15:29, 3.00s/it]
|
36596 |
38%|███▊ | 187/496 [09:15<14:47, 2.87s/it]
|
36597 |
38%|███▊ | 188/496 [09:19<15:58, 3.11s/it]
|
36598 |
38%|███▊ | 189/496 [09:22<15:54, 3.11s/it]
|
36599 |
38%|███▊ | 190/496 [09:25<15:57, 3.13s/it]
|
36600 |
39%|███▊ | 191/496 [09:29<16:17, 3.21s/it]
|
36601 |
39%|███▊ | 192/496 [09:32<15:37, 3.09s/it]
|
36602 |
39%|███▉ | 193/496 [09:34<15:19, 3.03s/it]
|
36603 |
39%|███▉ | 194/496 [09:37<14:05, 2.80s/it]
|
36604 |
39%|███▉ | 195/496 [09:39<13:51, 2.76s/it]
|
36605 |
40%|███▉ | 196/496 [09:42<14:08, 2.83s/it]
|
36606 |
40%|███▉ | 197/496 [09:45<14:07, 2.83s/it]
|
36607 |
40%|███▉ | 198/496 [09:48<14:31, 2.93s/it]
|
36608 |
40%|████ | 199/496 [09:51<14:41, 2.97s/it]
|
36609 |
40%|████ | 200/496 [09:54<14:37, 2.97s/it]
|
36610 |
41%|████ | 201/496 [09:57<14:49, 3.02s/it]
|
36611 |
41%|████ | 202/496 [10:01<15:28, 3.16s/it]
|
36612 |
41%|████ | 203/496 [10:03<14:24, 2.95s/it]
|
36613 |
41%|████ | 204/496 [10:06<14:04, 2.89s/it]
|
36614 |
41%|████▏ | 205/496 [10:09<13:46, 2.84s/it]
|
36615 |
42%|████▏ | 206/496 [10:12<13:34, 2.81s/it]
|
36616 |
42%|████▏ | 207/496 [10:14<13:27, 2.79s/it]
|
36617 |
42%|████▏ | 208/496 [10:17<13:22, 2.79s/it]
|
36618 |
42%|████▏ | 209/496 [10:20<14:04, 2.94s/it]
|
36619 |
42%|████▏ | 210/496 [10:23<14:05, 2.96s/it]
|
36620 |
43%|████▎ | 211/496 [10:26<14:08, 2.98s/it]
|
36621 |
43%|████▎ | 212/496 [10:30<14:26, 3.05s/it]
|
36622 |
43%|████▎ | 213/496 [10:33<14:15, 3.02s/it]
|
36623 |
43%|████▎ | 214/496 [10:36<14:18, 3.05s/it]
|
36624 |
43%|████▎ | 215/496 [10:39<14:00, 2.99s/it]
|
36625 |
44%|████▎ | 216/496 [10:42<14:33, 3.12s/it]
|
36626 |
44%|████▍ | 217/496 [10:46<15:38, 3.36s/it]
|
36627 |
44%|████▍ | 218/496 [10:49<14:29, 3.13s/it]
|
36628 |
44%|████▍ | 219/496 [10:51<13:49, 2.99s/it]
|
36629 |
44%|████▍ | 220/496 [10:54<13:28, 2.93s/it]
|
36630 |
45%|████▍ | 221/496 [10:57<13:45, 3.00s/it]
|
36631 |
45%|████▍ | 222/496 [11:00<13:46, 3.02s/it]
|
36632 |
45%|████▍ | 223/496 [11:03<13:38, 3.00s/it]
|
36633 |
45%|████▌ | 224/496 [11:07<14:38, 3.23s/it]
|
36634 |
45%|████▌ | 225/496 [11:11<15:20, 3.40s/it]
|
36635 |
46%|████▌ | 226/496 [11:14<14:45, 3.28s/it]
|
36636 |
46%|████▌ | 227/496 [11:17<14:04, 3.14s/it]
|
36637 |
46%|████▌ | 228/496 [11:20<14:05, 3.16s/it]
|
36638 |
46%|████▌ | 229/496 [11:23<13:34, 3.05s/it]
|
36639 |
46%|████▋ | 230/496 [11:26<13:29, 3.04s/it]
|
36640 |
47%|████▋ | 231/496 [11:29<13:37, 3.08s/it]
|
36641 |
47%|████▋ | 232/496 [11:32<13:34, 3.08s/it]
|
36642 |
47%|████▋ | 233/496 [11:35<13:48, 3.15s/it]
|
36643 |
47%|████▋ | 234/496 [11:38<13:23, 3.07s/it]
|
36644 |
47%|████▋ | 235/496 [11:41<13:19, 3.06s/it]
|
36645 |
48%|████▊ | 236/496 [11:44<13:16, 3.06s/it]
|
36646 |
48%|████▊ | 237/496 [11:47<12:48, 2.97s/it]
|
36647 |
48%|████▊ | 238/496 [11:50<12:54, 3.00s/it]
|
36648 |
48%|████▊ | 239/496 [11:53<13:25, 3.14s/it]
|
36649 |
48%|████▊ | 240/496 [11:56<12:47, 3.00s/it]
|
36650 |
49%|████▊ | 241/496 [11:59<12:53, 3.03s/it]
|
36651 |
49%|████▉ | 242/496 [12:02<12:46, 3.02s/it]
|
36652 |
49%|████▉ | 243/496 [12:05<12:26, 2.95s/it]
|
36653 |
49%|████▉ | 244/496 [12:08<12:30, 2.98s/it]
|
36654 |
49%|████▉ | 245/496 [12:12<13:17, 3.18s/it]
|
36655 |
50%|████▉ | 246/496 [12:15<12:56, 3.11s/it]
|
36656 |
50%|████▉ | 247/496 [12:18<12:59, 3.13s/it]
|
36657 |
50%|█████ | 248/496 [12:21<12:23, 3.00s/it]
|
36658 |
50%|█████ | 249/496 [12:23<12:17, 2.98s/it]
|
36659 |
50%|█████ | 250/496 [12:26<12:03, 2.94s/it]
|
36660 |
51%|█████ | 251/496 [12:29<11:18, 2.77s/it]
|
36661 |
51%|█████ | 252/496 [12:32<12:00, 2.95s/it]
|
36662 |
51%|█████ | 253/496 [12:35<12:21, 3.05s/it]
|
36663 |
51%|█████ | 254/496 [12:39<12:57, 3.21s/it]
|
36664 |
51%|█████▏ | 255/496 [12:41<11:52, 2.96s/it]
|
36665 |
52%|█████▏ | 256/496 [12:45<13:06, 3.28s/it]
|
36666 |
52%|█████▏ | 257/496 [12:48<12:45, 3.20s/it]
|
36667 |
52%|█████▏ | 258/496 [12:51<11:50, 2.98s/it]
|
36668 |
52%|█████▏ | 259/496 [12:54<11:58, 3.03s/it]
|
36669 |
52%|█████▏ | 260/496 [12:57<12:10, 3.09s/it]
|
36670 |
53%|█████▎ | 261/496 [13:00<11:42, 2.99s/it]
|
36671 |
53%|█████▎ | 262/496 [13:03<11:26, 2.93s/it]
|
36672 |
53%|█████▎ | 263/496 [13:06<11:14, 2.90s/it]
|
36673 |
53%|█████▎ | 264/496 [13:08<10:56, 2.83s/it]
|
36674 |
53%|█████▎ | 265/496 [13:12<11:29, 2.98s/it]
|
36675 |
54%|█████▎ | 266/496 [13:15<11:55, 3.11s/it]
|
36676 |
54%|█████▍ | 267/496 [13:19<12:29, 3.27s/it]
|
36677 |
54%|█████▍ | 268/496 [13:22<12:20, 3.25s/it]
|
36678 |
54%|█████▍ | 269/496 [13:25<12:22, 3.27s/it]
|
36679 |
54%|█████▍ | 270/496 [13:28<12:15, 3.25s/it]
|
36680 |
55%|█████▍ | 271/496 [13:31<12:00, 3.20s/it]
|
36681 |
55%|█████▍ | 272/496 [13:34<11:27, 3.07s/it]
|
36682 |
55%|█████▌ | 273/496 [13:37<11:03, 2.98s/it]
|
36683 |
55%|█████▌ | 274/496 [13:40<11:16, 3.05s/it]
|
36684 |
55%|█████▌ | 275/496 [13:44<11:45, 3.19s/it]
|
36685 |
56%|█████▌ | 276/496 [13:47<11:27, 3.12s/it]
|
36686 |
56%|█████▌ | 277/496 [13:49<11:01, 3.02s/it]
|
36687 |
56%|█████▌ | 278/496 [13:53<11:31, 3.17s/it]
|
36688 |
56%|█████▋ | 279/496 [13:56<11:23, 3.15s/it]
|
36689 |
56%|█████▋ | 280/496 [14:00<11:40, 3.24s/it]
|
36690 |
57%|█████▋ | 281/496 [14:03<11:21, 3.17s/it]
|
36691 |
57%|█████▋ | 282/496 [14:05<11:03, 3.10s/it]
|
36692 |
57%|█████▋ | 283/496 [14:11<13:06, 3.69s/it]
|
36693 |
57%|█████▋ | 284/496 [14:13<11:46, 3.33s/it]
|
36694 |
57%|█████▋ | 285/496 [14:16<10:51, 3.09s/it]
|
36695 |
58%|█████▊ | 286/496 [14:19<11:13, 3.21s/it]
|
36696 |
58%|█████▊ | 287/496 [14:22<10:49, 3.11s/it]
|
36697 |
58%|█████▊ | 288/496 [14:26<11:41, 3.37s/it]
|
36698 |
58%|█████▊ | 289/496 [14:29<11:08, 3.23s/it]
|
36699 |
58%|█████▊ | 290/496 [14:32<10:46, 3.14s/it]
|
36700 |
59%|█████▊ | 291/496 [14:35<10:25, 3.05s/it]
|
36701 |
59%|█████▉ | 292/496 [14:37<10:12, 3.00s/it]
|
36702 |
59%|█████▉ | 293/496 [14:40<09:17, 2.75s/it]
|
36703 |
59%|█████▉ | 294/496 [14:42<09:16, 2.76s/it]
|
36704 |
59%|█████▉ | 295/496 [14:46<10:04, 3.01s/it]
|
36705 |
60%|█████▉ | 296/496 [14:49<09:48, 2.94s/it]
|
36706 |
60%|█████▉ | 297/496 [14:51<09:13, 2.78s/it]
|
36707 |
60%|██████ | 298/496 [14:54<08:45, 2.65s/it]
|
36708 |
60%|██████ | 299/496 [14:56<08:37, 2.63s/it]
|
36709 |
60%|██████ | 300/496 [14:59<09:02, 2.77s/it]
|
36710 |
61%|██████ | 301/496 [15:02<08:58, 2.76s/it]
|
36711 |
61%|██████ | 302/496 [15:06<10:03, 3.11s/it]
|
36712 |
61%|██████ | 303/496 [15:09<10:05, 3.14s/it]
|
36713 |
61%|██████▏ | 304/496 [15:12<10:06, 3.16s/it]
|
36714 |
61%|██████▏ | 305/496 [15:15<09:26, 2.97s/it]
|
36715 |
62%|██████▏ | 306/496 [15:17<09:09, 2.89s/it]
|
36716 |
62%|██████▏ | 307/496 [15:20<08:48, 2.80s/it]
|
36717 |
62%|██████▏ | 308/496 [15:23<08:41, 2.77s/it]
|
36718 |
62%|██████▏ | 309/496 [15:26<08:40, 2.78s/it]
|
36719 |
62%|██████▎ | 310/496 [15:29<09:10, 2.96s/it]
|
36720 |
63%|██████▎ | 311/496 [15:32<09:38, 3.13s/it]
|
36721 |
63%|██████▎ | 312/496 [15:36<09:44, 3.18s/it]
|
36722 |
63%|██████▎ | 313/496 [15:38<08:43, 2.86s/it]
|
36723 |
63%|██████▎ | 314/496 [15:41<08:28, 2.79s/it]
|
36724 |
64%|██████▎ | 315/496 [15:44<08:42, 2.89s/it]
|
36725 |
64%|██████▎ | 316/496 [15:47<08:39, 2.88s/it]
|
36726 |
64%|██████▍ | 317/496 [15:49<08:37, 2.89s/it]
|
36727 |
64%|██████▍ | 318/496 [15:52<08:38, 2.91s/it]
|
36728 |
64%|██████�� | 319/496 [15:56<09:25, 3.19s/it]
|
36729 |
65%|██████▍ | 320/496 [15:59<08:56, 3.05s/it]
|
36730 |
65%|██████▍ | 321/496 [16:02<08:32, 2.93s/it]
|
36731 |
65%|██████▍ | 322/496 [16:04<08:17, 2.86s/it]
|
36732 |
65%|██████▌ | 323/496 [16:08<08:36, 2.98s/it]
|
36733 |
65%|██████▌ | 324/496 [16:11<08:33, 2.99s/it]
|
36734 |
66%|██████▌ | 325/496 [16:13<08:05, 2.84s/it]
|
36735 |
66%|██████▌ | 326/496 [16:16<08:22, 2.96s/it]
|
36736 |
66%|██████▌ | 327/496 [16:19<07:59, 2.83s/it]
|
36737 |
66%|██████▌ | 328/496 [16:21<07:46, 2.77s/it]
|
36738 |
66%|██████▋ | 329/496 [16:25<08:04, 2.90s/it]
|
36739 |
67%|██████▋ | 330/496 [16:27<07:52, 2.85s/it]
|
36740 |
67%|██████▋ | 331/496 [16:31<08:08, 2.96s/it]
|
36741 |
67%|██████▋ | 332/496 [16:34<08:15, 3.02s/it]
|
36742 |
67%|██████▋ | 333/496 [16:37<08:10, 3.01s/it]
|
36743 |
67%|██████▋ | 334/496 [16:40<07:54, 2.93s/it]
|
36744 |
68%|██████▊ | 335/496 [16:43<08:04, 3.01s/it]
|
36745 |
68%|██████▊ | 336/496 [16:46<08:23, 3.15s/it]
|
36746 |
68%|██████▊ | 337/496 [16:49<08:15, 3.11s/it]
|
36747 |
68%|██████▊ | 338/496 [16:52<07:48, 2.96s/it]
|
36748 |
68%|██████▊ | 339/496 [16:54<07:26, 2.84s/it]
|
36749 |
69%|██████▊ | 340/496 [16:58<07:36, 2.93s/it]
|
36750 |
69%|██████▉ | 341/496 [17:01<07:49, 3.03s/it]
|
36751 |
69%|██████▉ | 342/496 [17:04<08:04, 3.14s/it]
|
36752 |
69%|██████▉ | 343/496 [17:07<08:00, 3.14s/it]
|
36753 |
69%|██████▉ | 344/496 [17:10<07:49, 3.09s/it]
|
36754 |
70%|██████▉ | 345/496 [17:13<07:27, 2.97s/it]
|
36755 |
70%|██████▉ | 346/496 [17:15<07:05, 2.84s/it]
|
36756 |
70%|██████▉ | 347/496 [17:19<07:14, 2.92s/it]
|
36757 |
70%|███████ | 348/496 [17:22<07:13, 2.93s/it]
|
36758 |
70%|███████ | 349/496 [17:26<08:25, 3.44s/it]
|
36759 |
71%|███████ | 350/496 [17:29<08:12, 3.38s/it]
|
36760 |
71%|███████ | 351/496 [17:32<07:51, 3.25s/it]
|
36761 |
71%|███████ | 352/496 [17:35<07:31, 3.13s/it]
|
36762 |
71%|███████ | 353/496 [17:38<07:24, 3.11s/it]
|
36763 |
71%|███████▏ | 354/496 [17:41<07:23, 3.12s/it]
|
36764 |
72%|███████▏ | 355/496 [17:45<07:33, 3.21s/it]
|
36765 |
72%|███████▏ | 356/496 [17:48<07:27, 3.20s/it]
|
36766 |
72%|███████▏ | 357/496 [17:51<07:14, 3.13s/it]
|
36767 |
72%|███████▏ | 358/496 [17:53<06:41, 2.91s/it]
|
36768 |
72%|███████▏ | 359/496 [17:57<06:47, 2.97s/it]
|
36769 |
73%|███████▎ | 360/496 [18:00<06:47, 3.00s/it]
|
36770 |
73%|███████▎ | 361/496 [18:02<06:37, 2.94s/it]
|
36771 |
73%|███████▎ | 362/496 [18:06<06:55, 3.10s/it]
|
36772 |
73%|███████▎ | 363/496 [18:09<06:44, 3.04s/it]
|
36773 |
73%|███████▎ | 364/496 [18:11<06:21, 2.89s/it]
|
36774 |
74%|███████▎ | 365/496 [18:14<06:14, 2.86s/it]
|
36775 |
74%|███████▍ | 366/496 [18:17<06:06, 2.82s/it]
|
36776 |
74%|███████▍ | 367/496 [18:19<05:56, 2.76s/it]
|
36777 |
74%|███████▍ | 368/496 [18:23<06:24, 3.00s/it]
|
36778 |
74%|███████▍ | 369/496 [18:26<06:17, 2.97s/it]
|
36779 |
75%|███████▍ | 370/496 [18:29<06:24, 3.05s/it]
|
36780 |
75%|███████▍ | 371/496 [18:32<06:29, 3.12s/it]
|
36781 |
75%|███████▌ | 372/496 [18:35<06:12, 3.01s/it]
|
36782 |
75%|███████▌ | 373/496 [18:38<06:07, 2.99s/it]
|
36783 |
75%|███████▌ | 374/496 [18:41<06:02, 2.97s/it]
|
36784 |
76%|███████▌ | 375/496 [18:44<06:11, 3.07s/it]
|
36785 |
76%|███████▌ | 376/496 [18:47<05:57, 2.98s/it]
|
36786 |
76%|███████▌ | 377/496 [18:50<05:56, 3.00s/it]
|
36787 |
76%|███████▌ | 378/496 [18:53<05:44, 2.92s/it]
|
36788 |
76%|███████▋ | 379/496 [18:55<05:22, 2.75s/it]
|
36789 |
77%|███████▋ | 380/496 [18:58<05:30, 2.85s/it]
|
36790 |
77%|███████▋ | 381/496 [19:01<05:15, 2.74s/it]
|
36791 |
77%|███████▋ | 382/496 [19:04<05:25, 2.86s/it]
|
36792 |
77%|███████▋ | 383/496 [19:07<05:37, 2.99s/it]
|
36793 |
77%|███████▋ | 384/496 [19:10<05:12, 2.79s/it]
|
36794 |
78%|███████▊ | 385/496 [19:13<05:26, 2.94s/it]
|
36795 |
78%|███████▊ | 386/496 [19:16<05:28, 2.98s/it]
|
36796 |
78%|███████▊ | 387/496 [19:19<05:29, 3.03s/it]
|
36797 |
78%|███████▊ | 388/496 [19:22<05:28, 3.04s/it]
|
36798 |
78%|███████▊ | 389/496 [19:25<05:30, 3.09s/it]
|
36799 |
79%|███████▊ | 390/496 [19:28<05:22, 3.05s/it]
|
36800 |
79%|███████▉ | 391/496 [19:31<05:18, 3.04s/it]
|
36801 |
79%|███████▉ | 392/496 [19:34<05:09, 2.98s/it]
|
36802 |
79%|███████▉ | 393/496 [19:37<04:59, 2.91s/it]
|
36803 |
79%|███████▉ | 394/496 [19:40<05:02, 2.96s/it]
|
36804 |
80%|███████▉ | 395/496 [19:42<04:42, 2.80s/it]
|
36805 |
80%|███████▉ | 396/496 [19:46<04:57, 2.98s/it]
|
36806 |
80%|████████ | 397/496 [19:49<05:02, 3.06s/it]
|
36807 |
80%|████████ | 398/496 [19:52<05:09, 3.16s/it]
|
36808 |
80%|████████ | 399/496 [19:55<04:43, 2.92s/it]
|
36809 |
81%|████████ | 400/496 [19:57<04:30, 2.81s/it]
|
36810 |
81%|████████ | 401/496 [20:01<04:50, 3.06s/it]
|
36811 |
81%|████████ | 402/496 [20:04<04:43, 3.02s/it]
|
36812 |
81%|████████▏ | 403/496 [20:08<05:19, 3.43s/it]
|
36813 |
81%|████████▏ | 404/496 [20:11<04:55, 3.21s/it]
|
36814 |
82%|████████▏ | 405/496 [20:14<04:48, 3.17s/it]
|
36815 |
82%|████████▏ | 406/496 [20:16<04:22, 2.92s/it]
|
36816 |
82%|████████▏ | 407/496 [20:19<04:15, 2.87s/it]
|
36817 |
82%|████████▏ | 408/496 [20:22<04:14, 2.89s/it]
|
36818 |
82%|████████▏ | 409/496 [20:25<04:05, 2.82s/it]
|
36819 |
83%|████████▎ | 410/496 [20:27<03:58, 2.78s/it]
|
36820 |
83%|████████▎ | 411/496 [20:31<04:08, 2.92s/it]
|
36821 |
83%|████████▎ | 412/496 [20:34<04:13, 3.01s/it]
|
36822 |
83%|████████▎ | 413/496 [20:37<04:20, 3.14s/it]
|
36823 |
83%|████████▎ | 414/496 [20:40<04:17, 3.14s/it]
|
36824 |
84%|████████▎ | 415/496 [20:44<04:27, 3.30s/it]
|
36825 |
84%|████████▍ | 416/496 [20:47<04:13, 3.17s/it]
|
36826 |
84%|████████▍ | 417/496 [20:50<04:05, 3.11s/it]
|
36827 |
84%|████████▍ | 418/496 [20:53<03:54, 3.01s/it]
|
36828 |
84%|████████▍ | 419/496 [20:55<03:40, 2.86s/it]
|
36829 |
85%|████████▍ | 420/496 [20:58<03:25, 2.70s/it]
|
36830 |
85%|████████▍ | 421/496 [21:00<03:18, 2.65s/it]
|
36831 |
85%|████████▌ | 422/496 [21:03<03:18, 2.69s/it]
|
36832 |
85%|████████▌ | 423/496 [21:05<03:08, 2.58s/it]
|
36833 |
85%|████████▌ | 424/496 [21:08<03:17, 2.74s/it]
|
36834 |
86%|████████▌ | 425/496 [21:11<03:16, 2.77s/it]
|
36835 |
86%|████████▌ | 426/496 [21:15<03:25, 2.94s/it]
|
36836 |
86%|████████▌ | 427/496 [21:17<03:22, 2.93s/it]
|
36837 |
86%|████████▋ | 428/496 [21:21<03:24, 3.01s/it]
|
36838 |
86%|████████▋ | 429/496 [21:23<03:14, 2.90s/it]
|
36839 |
87%|████████▋ | 430/496 [21:26<03:06, 2.83s/it]
|
36840 |
87%|████████▋ | 431/496 [21:29<03:09, 2.92s/it]
|
36841 |
87%|████████▋ | 432/496 [21:32<03:10, 2.98s/it]
|
36842 |
87%|████████▋ | 433/496 [21:35<02:57, 2.82s/it]
|
36843 |
88%|████████▊ | 434/496 [21:38<02:58, 2.88s/it]
|
36844 |
88%|████████▊ | 435/496 [21:41<02:55, 2.87s/it]
|
36845 |
88%|████████▊ | 436/496 [21:44<02:57, 2.95s/it]
|
36846 |
88%|████████▊ | 437/496 [21:47<03:09, 3.20s/it]
|
36847 |
88%|████████▊ | 438/496 [21:50<02:58, 3.07s/it]
|
36848 |
89%|████████▊ | 439/496 [21:53<02:57, 3.11s/it]
|
36849 |
89%|████████▊ | 440/496 [21:56<02:50, 3.04s/it]
|
36850 |
89%|████████▉ | 441/496 [22:00<02:50, 3.10s/it]
|
36851 |
89%|████████▉ | 442/496 [22:02<02:45, 3.06s/it]
|
36852 |
89%|████████▉ | 443/496 [22:06<02:51, 3.24s/it]
|
36853 |
90%|████████▉ | 444/496 [22:09<02:41, 3.11s/it]
|
36854 |
90%|████████▉ | 445/496 [22:12<02:34, 3.02s/it]
|
36855 |
90%|████████▉ | 446/496 [22:15<02:27, 2.95s/it]
|
36856 |
90%|█████████ | 447/496 [22:18<02:25, 2.97s/it]
|
36857 |
90%|█████████ | 448/496 [22:21<02:24, 3.00s/it]
|
36858 |
91%|█████████ | 449/496 [22:24<02:27, 3.14s/it]
|
36859 |
91%|█████████ | 450/496 [22:27<02:17, 2.99s/it]
|
36860 |
91%|█████████ | 451/496 [22:29<02:04, 2.76s/it]
|
36861 |
91%|█████████ | 452/496 [22:32<01:59, 2.71s/it]
|
36862 |
91%|█████████▏| 453/496 [22:35<02:06, 2.95s/it]
|
36863 |
92%|█████████▏| 454/496 [22:39<02:15, 3.22s/it]
|
36864 |
92%|█████████▏| 455/496 [22:41<02:02, 2.99s/it]
|
36865 |
92%|█████████▏| 456/496 [22:44<01:59, 2.99s/it]
|
36866 |
92%|█████████▏| 457/496 [22:48<02:03, 3.18s/it]
|
36867 |
92%|█████████▏| 458/496 [22:50<01:51, 2.94s/it]
|
36868 |
93%|█████████▎| 459/496 [22:54<01:59, 3.23s/it]
|
36869 |
93%|█████████▎| 460/496 [22:57<01:53, 3.16s/it]
|
36870 |
93%|█████████▎| 461/496 [23:00<01:47, 3.07s/it]
|
36871 |
93%|█████████▎| 462/496 [23:03<01:41, 2.98s/it]
|
36872 |
93%|█████████▎| 463/496 [23:06<01:37, 2.96s/it]
|
36873 |
94%|█████████▎| 464/496 [23:09<01:39, 3.10s/it]
|
36874 |
94%|█████████▍| 465/496 [23:12<01:32, 2.97s/it]
|
36875 |
94%|█████████▍| 466/496 [23:15<01:26, 2.87s/it]
|
36876 |
94%|█████████▍| 467/496 [23:17<01:19, 2.76s/it]
|
36877 |
94%|█████████▍| 468/496 [23:20<01:17, 2.78s/it]
|
36878 |
95%|█████████▍| 469/496 [23:23<01:17, 2.87s/it]
|
36879 |
95%|█████████▍| 470/496 [23:26<01:15, 2.89s/it]
|
36880 |
95%|█████████▍| 471/496 [23:29<01:11, 2.86s/it]
|
36881 |
95%|█████████▌| 472/496 [23:32<01:09, 2.91s/it]
|
36882 |
95%|█████████▌| 473/496 [23:34<01:04, 2.79s/it]
|
36883 |
96%|█████████▌| 474/496 [23:37<01:02, 2.85s/it]
|
36884 |
96%|█████████▌| 475/496 [23:40<00:59, 2.84s/it]
|
36885 |
96%|█████████▌| 476/496 [23:43<00:55, 2.80s/it]
|
36886 |
96%|█████████▌| 477/496 [23:46<00:53, 2.82s/it]
|
36887 |
96%|█████████▋| 478/496 [23:49<00:51, 2.86s/it]
|
36888 |
97%|█████████▋| 479/496 [23:51<00:47, 2.79s/it]
|
36889 |
97%|█████████▋| 480/496 [23:54<00:46, 2.88s/it]
|
36890 |
97%|█████████▋| 481/496 [23:57<00:44, 2.95s/it]
|
36891 |
97%|█████████▋| 482/496 [24:00<00:41, 2.95s/it]
|
36892 |
97%|█████████▋| 483/496 [24:03<00:38, 2.93s/it]
|
36893 |
98%|█████████▊| 484/496 [24:07<00:36, 3.07s/it]
|
36894 |
98%|█████████▊| 485/496 [24:09<00:33, 3.00s/it]
|
36895 |
98%|█████████▊| 486/496 [24:12<00:29, 2.94s/it]
|
36896 |
98%|█████████▊| 487/496 [24:15<00:27, 3.02s/it]
|
36897 |
98%|█████████▊| 488/496 [24:18<00:23, 3.00s/it]
|
36898 |
99%|█████████▊| 489/496 [24:21<00:20, 2.96s/it]
|
36899 |
99%|█████████▉| 490/496 [24:24<00:17, 2.91s/it]
|
36900 |
99%|█████████▉| 491/496 [24:27<00:14, 3.00s/it]
|
36901 |
99%|█████████▉| 492/496 [24:30<00:11, 2.98s/it]
|
36902 |
99%|█████████▉| 493/496 [24:33<00:09, 3.06s/it]
|
36903 |
+
[INFO|trainer.py:2700] 2022-12-17 18:33:47,930 >> Saving model checkpoint to ./
|
36904 |
+
[INFO|configuration_utils.py:447] 2022-12-17 18:33:47,931 >> Configuration saved in ./config.json
|
36905 |
+
[INFO|modeling_utils.py:1680] 2022-12-17 18:33:48,292 >> Model weights saved in ./pytorch_model.bin
|
36906 |
+
[INFO|feature_extraction_utils.py:368] 2022-12-17 18:33:48,308 >> Feature extractor saved in ./preprocessor_config.json
|
36907 |
+
[INFO|tokenization_utils_base.py:2157] 2022-12-17 18:33:48,308 >> tokenizer config file saved in ./tokenizer_config.json
|
36908 |
+
[INFO|tokenization_utils_base.py:2164] 2022-12-17 18:33:48,309 >> Special tokens file saved in ./special_tokens_map.json
|
36909 |
+
[INFO|tokenization_utils_base.py:2210] 2022-12-17 18:33:48,309 >> added tokens file saved in ./added_tokens.json
|
trainer_state.json
ADDED
@@ -0,0 +1,805 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": 12.206885082321635,
|
3 |
+
"best_model_checkpoint": "./checkpoint-6000",
|
4 |
+
"epoch": 1.0958333333333334,
|
5 |
+
"global_step": 6000,
|
6 |
+
"is_hyper_param_search": false,
|
7 |
+
"is_local_process_zero": true,
|
8 |
+
"is_world_process_zero": true,
|
9 |
+
"log_history": [
|
10 |
+
{
|
11 |
+
"epoch": 0.0,
|
12 |
+
"learning_rate": 0.0,
|
13 |
+
"loss": 2.996,
|
14 |
+
"step": 1
|
15 |
+
},
|
16 |
+
{
|
17 |
+
"epoch": 0.01,
|
18 |
+
"learning_rate": 9.4e-06,
|
19 |
+
"loss": 1.9547,
|
20 |
+
"step": 50
|
21 |
+
},
|
22 |
+
{
|
23 |
+
"epoch": 0.02,
|
24 |
+
"learning_rate": 1.94e-05,
|
25 |
+
"loss": 0.7554,
|
26 |
+
"step": 100
|
27 |
+
},
|
28 |
+
{
|
29 |
+
"epoch": 0.03,
|
30 |
+
"learning_rate": 2.94e-05,
|
31 |
+
"loss": 0.5206,
|
32 |
+
"step": 150
|
33 |
+
},
|
34 |
+
{
|
35 |
+
"epoch": 0.03,
|
36 |
+
"learning_rate": 3.94e-05,
|
37 |
+
"loss": 0.4737,
|
38 |
+
"step": 200
|
39 |
+
},
|
40 |
+
{
|
41 |
+
"epoch": 0.04,
|
42 |
+
"learning_rate": 4.94e-05,
|
43 |
+
"loss": 0.3952,
|
44 |
+
"step": 250
|
45 |
+
},
|
46 |
+
{
|
47 |
+
"epoch": 0.05,
|
48 |
+
"learning_rate": 5.94e-05,
|
49 |
+
"loss": 0.3662,
|
50 |
+
"step": 300
|
51 |
+
},
|
52 |
+
{
|
53 |
+
"epoch": 0.06,
|
54 |
+
"learning_rate": 6.939999999999999e-05,
|
55 |
+
"loss": 0.3557,
|
56 |
+
"step": 350
|
57 |
+
},
|
58 |
+
{
|
59 |
+
"epoch": 0.07,
|
60 |
+
"learning_rate": 7.94e-05,
|
61 |
+
"loss": 0.3687,
|
62 |
+
"step": 400
|
63 |
+
},
|
64 |
+
{
|
65 |
+
"epoch": 0.07,
|
66 |
+
"learning_rate": 8.94e-05,
|
67 |
+
"loss": 0.3288,
|
68 |
+
"step": 450
|
69 |
+
},
|
70 |
+
{
|
71 |
+
"epoch": 0.08,
|
72 |
+
"learning_rate": 9.94e-05,
|
73 |
+
"loss": 0.2986,
|
74 |
+
"step": 500
|
75 |
+
},
|
76 |
+
{
|
77 |
+
"epoch": 0.09,
|
78 |
+
"learning_rate": 9.914545454545455e-05,
|
79 |
+
"loss": 0.3076,
|
80 |
+
"step": 550
|
81 |
+
},
|
82 |
+
{
|
83 |
+
"epoch": 0.1,
|
84 |
+
"learning_rate": 9.823636363636364e-05,
|
85 |
+
"loss": 0.2977,
|
86 |
+
"step": 600
|
87 |
+
},
|
88 |
+
{
|
89 |
+
"epoch": 0.11,
|
90 |
+
"learning_rate": 9.732727272727273e-05,
|
91 |
+
"loss": 0.3167,
|
92 |
+
"step": 650
|
93 |
+
},
|
94 |
+
{
|
95 |
+
"epoch": 0.12,
|
96 |
+
"learning_rate": 9.641818181818182e-05,
|
97 |
+
"loss": 0.2799,
|
98 |
+
"step": 700
|
99 |
+
},
|
100 |
+
{
|
101 |
+
"epoch": 0.12,
|
102 |
+
"learning_rate": 9.550909090909092e-05,
|
103 |
+
"loss": 0.2079,
|
104 |
+
"step": 750
|
105 |
+
},
|
106 |
+
{
|
107 |
+
"epoch": 0.13,
|
108 |
+
"learning_rate": 9.46e-05,
|
109 |
+
"loss": 0.2246,
|
110 |
+
"step": 800
|
111 |
+
},
|
112 |
+
{
|
113 |
+
"epoch": 0.14,
|
114 |
+
"learning_rate": 9.36909090909091e-05,
|
115 |
+
"loss": 0.2568,
|
116 |
+
"step": 850
|
117 |
+
},
|
118 |
+
{
|
119 |
+
"epoch": 0.15,
|
120 |
+
"learning_rate": 9.278181818181819e-05,
|
121 |
+
"loss": 0.2734,
|
122 |
+
"step": 900
|
123 |
+
},
|
124 |
+
{
|
125 |
+
"epoch": 0.16,
|
126 |
+
"learning_rate": 9.187272727272727e-05,
|
127 |
+
"loss": 0.183,
|
128 |
+
"step": 950
|
129 |
+
},
|
130 |
+
{
|
131 |
+
"epoch": 0.17,
|
132 |
+
"learning_rate": 9.096363636363638e-05,
|
133 |
+
"loss": 0.2445,
|
134 |
+
"step": 1000
|
135 |
+
},
|
136 |
+
{
|
137 |
+
"epoch": 0.17,
|
138 |
+
"eval_loss": 0.3058685064315796,
|
139 |
+
"eval_runtime": 2133.1044,
|
140 |
+
"eval_samples_per_second": 7.441,
|
141 |
+
"eval_steps_per_second": 0.233,
|
142 |
+
"eval_wer": 32.41627267903669,
|
143 |
+
"step": 1000
|
144 |
+
},
|
145 |
+
{
|
146 |
+
"epoch": 0.17,
|
147 |
+
"learning_rate": 9.005454545454545e-05,
|
148 |
+
"loss": 0.1608,
|
149 |
+
"step": 1050
|
150 |
+
},
|
151 |
+
{
|
152 |
+
"epoch": 0.18,
|
153 |
+
"learning_rate": 8.914545454545455e-05,
|
154 |
+
"loss": 0.1718,
|
155 |
+
"step": 1100
|
156 |
+
},
|
157 |
+
{
|
158 |
+
"epoch": 0.19,
|
159 |
+
"learning_rate": 8.823636363636364e-05,
|
160 |
+
"loss": 0.1721,
|
161 |
+
"step": 1150
|
162 |
+
},
|
163 |
+
{
|
164 |
+
"epoch": 0.2,
|
165 |
+
"learning_rate": 8.732727272727273e-05,
|
166 |
+
"loss": 0.1762,
|
167 |
+
"step": 1200
|
168 |
+
},
|
169 |
+
{
|
170 |
+
"epoch": 0.21,
|
171 |
+
"learning_rate": 8.641818181818182e-05,
|
172 |
+
"loss": 0.1587,
|
173 |
+
"step": 1250
|
174 |
+
},
|
175 |
+
{
|
176 |
+
"epoch": 0.22,
|
177 |
+
"learning_rate": 8.550909090909092e-05,
|
178 |
+
"loss": 0.2133,
|
179 |
+
"step": 1300
|
180 |
+
},
|
181 |
+
{
|
182 |
+
"epoch": 0.23,
|
183 |
+
"learning_rate": 8.46e-05,
|
184 |
+
"loss": 0.2291,
|
185 |
+
"step": 1350
|
186 |
+
},
|
187 |
+
{
|
188 |
+
"epoch": 0.23,
|
189 |
+
"learning_rate": 8.36909090909091e-05,
|
190 |
+
"loss": 0.1172,
|
191 |
+
"step": 1400
|
192 |
+
},
|
193 |
+
{
|
194 |
+
"epoch": 0.24,
|
195 |
+
"learning_rate": 8.278181818181819e-05,
|
196 |
+
"loss": 0.1034,
|
197 |
+
"step": 1450
|
198 |
+
},
|
199 |
+
{
|
200 |
+
"epoch": 0.25,
|
201 |
+
"learning_rate": 8.187272727272728e-05,
|
202 |
+
"loss": 0.1746,
|
203 |
+
"step": 1500
|
204 |
+
},
|
205 |
+
{
|
206 |
+
"epoch": 0.26,
|
207 |
+
"learning_rate": 8.096363636363636e-05,
|
208 |
+
"loss": 0.1649,
|
209 |
+
"step": 1550
|
210 |
+
},
|
211 |
+
{
|
212 |
+
"epoch": 0.27,
|
213 |
+
"learning_rate": 8.005454545454547e-05,
|
214 |
+
"loss": 0.1153,
|
215 |
+
"step": 1600
|
216 |
+
},
|
217 |
+
{
|
218 |
+
"epoch": 0.28,
|
219 |
+
"learning_rate": 7.914545454545454e-05,
|
220 |
+
"loss": 0.1521,
|
221 |
+
"step": 1650
|
222 |
+
},
|
223 |
+
{
|
224 |
+
"epoch": 0.28,
|
225 |
+
"learning_rate": 7.823636363636364e-05,
|
226 |
+
"loss": 0.1684,
|
227 |
+
"step": 1700
|
228 |
+
},
|
229 |
+
{
|
230 |
+
"epoch": 0.29,
|
231 |
+
"learning_rate": 7.732727272727273e-05,
|
232 |
+
"loss": 0.2243,
|
233 |
+
"step": 1750
|
234 |
+
},
|
235 |
+
{
|
236 |
+
"epoch": 0.3,
|
237 |
+
"learning_rate": 7.641818181818182e-05,
|
238 |
+
"loss": 0.2149,
|
239 |
+
"step": 1800
|
240 |
+
},
|
241 |
+
{
|
242 |
+
"epoch": 0.31,
|
243 |
+
"learning_rate": 7.550909090909092e-05,
|
244 |
+
"loss": 0.1927,
|
245 |
+
"step": 1850
|
246 |
+
},
|
247 |
+
{
|
248 |
+
"epoch": 0.32,
|
249 |
+
"learning_rate": 7.46e-05,
|
250 |
+
"loss": 0.2019,
|
251 |
+
"step": 1900
|
252 |
+
},
|
253 |
+
{
|
254 |
+
"epoch": 0.33,
|
255 |
+
"learning_rate": 7.36909090909091e-05,
|
256 |
+
"loss": 0.2003,
|
257 |
+
"step": 1950
|
258 |
+
},
|
259 |
+
{
|
260 |
+
"epoch": 0.33,
|
261 |
+
"learning_rate": 7.278181818181819e-05,
|
262 |
+
"loss": 0.1823,
|
263 |
+
"step": 2000
|
264 |
+
},
|
265 |
+
{
|
266 |
+
"epoch": 0.33,
|
267 |
+
"eval_loss": 0.20035691559314728,
|
268 |
+
"eval_runtime": 2105.4622,
|
269 |
+
"eval_samples_per_second": 7.538,
|
270 |
+
"eval_steps_per_second": 0.236,
|
271 |
+
"eval_wer": 22.12587013850942,
|
272 |
+
"step": 2000
|
273 |
+
},
|
274 |
+
{
|
275 |
+
"epoch": 0.34,
|
276 |
+
"learning_rate": 7.187272727272728e-05,
|
277 |
+
"loss": 0.1707,
|
278 |
+
"step": 2050
|
279 |
+
},
|
280 |
+
{
|
281 |
+
"epoch": 0.35,
|
282 |
+
"learning_rate": 7.096363636363636e-05,
|
283 |
+
"loss": 0.1659,
|
284 |
+
"step": 2100
|
285 |
+
},
|
286 |
+
{
|
287 |
+
"epoch": 0.36,
|
288 |
+
"learning_rate": 7.005454545454547e-05,
|
289 |
+
"loss": 0.193,
|
290 |
+
"step": 2150
|
291 |
+
},
|
292 |
+
{
|
293 |
+
"epoch": 0.37,
|
294 |
+
"learning_rate": 6.914545454545454e-05,
|
295 |
+
"loss": 0.1882,
|
296 |
+
"step": 2200
|
297 |
+
},
|
298 |
+
{
|
299 |
+
"epoch": 0.38,
|
300 |
+
"learning_rate": 6.823636363636364e-05,
|
301 |
+
"loss": 0.163,
|
302 |
+
"step": 2250
|
303 |
+
},
|
304 |
+
{
|
305 |
+
"epoch": 0.38,
|
306 |
+
"learning_rate": 6.732727272727273e-05,
|
307 |
+
"loss": 0.1689,
|
308 |
+
"step": 2300
|
309 |
+
},
|
310 |
+
{
|
311 |
+
"epoch": 0.39,
|
312 |
+
"learning_rate": 6.641818181818182e-05,
|
313 |
+
"loss": 0.1585,
|
314 |
+
"step": 2350
|
315 |
+
},
|
316 |
+
{
|
317 |
+
"epoch": 0.4,
|
318 |
+
"learning_rate": 6.550909090909091e-05,
|
319 |
+
"loss": 0.1643,
|
320 |
+
"step": 2400
|
321 |
+
},
|
322 |
+
{
|
323 |
+
"epoch": 0.41,
|
324 |
+
"learning_rate": 6.460000000000001e-05,
|
325 |
+
"loss": 0.1634,
|
326 |
+
"step": 2450
|
327 |
+
},
|
328 |
+
{
|
329 |
+
"epoch": 0.42,
|
330 |
+
"learning_rate": 6.369090909090909e-05,
|
331 |
+
"loss": 0.1362,
|
332 |
+
"step": 2500
|
333 |
+
},
|
334 |
+
{
|
335 |
+
"epoch": 0.42,
|
336 |
+
"learning_rate": 6.278181818181819e-05,
|
337 |
+
"loss": 0.1446,
|
338 |
+
"step": 2550
|
339 |
+
},
|
340 |
+
{
|
341 |
+
"epoch": 0.43,
|
342 |
+
"learning_rate": 6.187272727272728e-05,
|
343 |
+
"loss": 0.1439,
|
344 |
+
"step": 2600
|
345 |
+
},
|
346 |
+
{
|
347 |
+
"epoch": 0.44,
|
348 |
+
"learning_rate": 6.0963636363636366e-05,
|
349 |
+
"loss": 0.1534,
|
350 |
+
"step": 2650
|
351 |
+
},
|
352 |
+
{
|
353 |
+
"epoch": 0.45,
|
354 |
+
"learning_rate": 6.0054545454545454e-05,
|
355 |
+
"loss": 0.1264,
|
356 |
+
"step": 2700
|
357 |
+
},
|
358 |
+
{
|
359 |
+
"epoch": 0.46,
|
360 |
+
"learning_rate": 5.914545454545455e-05,
|
361 |
+
"loss": 0.1373,
|
362 |
+
"step": 2750
|
363 |
+
},
|
364 |
+
{
|
365 |
+
"epoch": 0.47,
|
366 |
+
"learning_rate": 5.8236363636363645e-05,
|
367 |
+
"loss": 0.1406,
|
368 |
+
"step": 2800
|
369 |
+
},
|
370 |
+
{
|
371 |
+
"epoch": 0.47,
|
372 |
+
"learning_rate": 5.732727272727273e-05,
|
373 |
+
"loss": 0.1393,
|
374 |
+
"step": 2850
|
375 |
+
},
|
376 |
+
{
|
377 |
+
"epoch": 0.48,
|
378 |
+
"learning_rate": 5.641818181818183e-05,
|
379 |
+
"loss": 0.1377,
|
380 |
+
"step": 2900
|
381 |
+
},
|
382 |
+
{
|
383 |
+
"epoch": 0.49,
|
384 |
+
"learning_rate": 5.550909090909091e-05,
|
385 |
+
"loss": 0.1467,
|
386 |
+
"step": 2950
|
387 |
+
},
|
388 |
+
{
|
389 |
+
"epoch": 0.5,
|
390 |
+
"learning_rate": 5.4600000000000006e-05,
|
391 |
+
"loss": 0.1412,
|
392 |
+
"step": 3000
|
393 |
+
},
|
394 |
+
{
|
395 |
+
"epoch": 0.5,
|
396 |
+
"eval_loss": 0.17524316906929016,
|
397 |
+
"eval_runtime": 2121.3824,
|
398 |
+
"eval_samples_per_second": 7.482,
|
399 |
+
"eval_steps_per_second": 0.234,
|
400 |
+
"eval_wer": 20.070007048220916,
|
401 |
+
"step": 3000
|
402 |
+
},
|
403 |
+
{
|
404 |
+
"epoch": 0.51,
|
405 |
+
"learning_rate": 5.3690909090909094e-05,
|
406 |
+
"loss": 0.1186,
|
407 |
+
"step": 3050
|
408 |
+
},
|
409 |
+
{
|
410 |
+
"epoch": 0.52,
|
411 |
+
"learning_rate": 5.278181818181819e-05,
|
412 |
+
"loss": 0.1437,
|
413 |
+
"step": 3100
|
414 |
+
},
|
415 |
+
{
|
416 |
+
"epoch": 0.53,
|
417 |
+
"learning_rate": 5.187272727272727e-05,
|
418 |
+
"loss": 0.1287,
|
419 |
+
"step": 3150
|
420 |
+
},
|
421 |
+
{
|
422 |
+
"epoch": 0.53,
|
423 |
+
"learning_rate": 5.096363636363637e-05,
|
424 |
+
"loss": 0.1242,
|
425 |
+
"step": 3200
|
426 |
+
},
|
427 |
+
{
|
428 |
+
"epoch": 0.54,
|
429 |
+
"learning_rate": 5.0054545454545455e-05,
|
430 |
+
"loss": 0.1431,
|
431 |
+
"step": 3250
|
432 |
+
},
|
433 |
+
{
|
434 |
+
"epoch": 0.55,
|
435 |
+
"learning_rate": 4.914545454545455e-05,
|
436 |
+
"loss": 0.1316,
|
437 |
+
"step": 3300
|
438 |
+
},
|
439 |
+
{
|
440 |
+
"epoch": 0.56,
|
441 |
+
"learning_rate": 4.823636363636364e-05,
|
442 |
+
"loss": 0.1119,
|
443 |
+
"step": 3350
|
444 |
+
},
|
445 |
+
{
|
446 |
+
"epoch": 0.57,
|
447 |
+
"learning_rate": 4.7327272727272734e-05,
|
448 |
+
"loss": 0.1286,
|
449 |
+
"step": 3400
|
450 |
+
},
|
451 |
+
{
|
452 |
+
"epoch": 0.57,
|
453 |
+
"learning_rate": 4.641818181818182e-05,
|
454 |
+
"loss": 0.1479,
|
455 |
+
"step": 3450
|
456 |
+
},
|
457 |
+
{
|
458 |
+
"epoch": 0.58,
|
459 |
+
"learning_rate": 4.550909090909091e-05,
|
460 |
+
"loss": 0.1144,
|
461 |
+
"step": 3500
|
462 |
+
},
|
463 |
+
{
|
464 |
+
"epoch": 0.59,
|
465 |
+
"learning_rate": 4.46e-05,
|
466 |
+
"loss": 0.1071,
|
467 |
+
"step": 3550
|
468 |
+
},
|
469 |
+
{
|
470 |
+
"epoch": 0.6,
|
471 |
+
"learning_rate": 4.3690909090909095e-05,
|
472 |
+
"loss": 0.1525,
|
473 |
+
"step": 3600
|
474 |
+
},
|
475 |
+
{
|
476 |
+
"epoch": 0.61,
|
477 |
+
"learning_rate": 4.2781818181818184e-05,
|
478 |
+
"loss": 0.1158,
|
479 |
+
"step": 3650
|
480 |
+
},
|
481 |
+
{
|
482 |
+
"epoch": 0.62,
|
483 |
+
"learning_rate": 4.187272727272727e-05,
|
484 |
+
"loss": 0.1111,
|
485 |
+
"step": 3700
|
486 |
+
},
|
487 |
+
{
|
488 |
+
"epoch": 0.62,
|
489 |
+
"learning_rate": 4.096363636363637e-05,
|
490 |
+
"loss": 0.1237,
|
491 |
+
"step": 3750
|
492 |
+
},
|
493 |
+
{
|
494 |
+
"epoch": 0.63,
|
495 |
+
"learning_rate": 4.0054545454545456e-05,
|
496 |
+
"loss": 0.154,
|
497 |
+
"step": 3800
|
498 |
+
},
|
499 |
+
{
|
500 |
+
"epoch": 0.64,
|
501 |
+
"learning_rate": 3.9145454545454545e-05,
|
502 |
+
"loss": 0.1298,
|
503 |
+
"step": 3850
|
504 |
+
},
|
505 |
+
{
|
506 |
+
"epoch": 0.65,
|
507 |
+
"learning_rate": 3.823636363636364e-05,
|
508 |
+
"loss": 0.1273,
|
509 |
+
"step": 3900
|
510 |
+
},
|
511 |
+
{
|
512 |
+
"epoch": 0.66,
|
513 |
+
"learning_rate": 3.732727272727273e-05,
|
514 |
+
"loss": 0.121,
|
515 |
+
"step": 3950
|
516 |
+
},
|
517 |
+
{
|
518 |
+
"epoch": 0.67,
|
519 |
+
"learning_rate": 3.641818181818182e-05,
|
520 |
+
"loss": 0.1093,
|
521 |
+
"step": 4000
|
522 |
+
},
|
523 |
+
{
|
524 |
+
"epoch": 0.67,
|
525 |
+
"eval_loss": 0.14134088158607483,
|
526 |
+
"eval_runtime": 2102.7704,
|
527 |
+
"eval_samples_per_second": 7.548,
|
528 |
+
"eval_steps_per_second": 0.236,
|
529 |
+
"eval_wer": 16.053313059799006,
|
530 |
+
"step": 4000
|
531 |
+
},
|
532 |
+
{
|
533 |
+
"epoch": 0.68,
|
534 |
+
"learning_rate": 3.5509090909090905e-05,
|
535 |
+
"loss": 0.1054,
|
536 |
+
"step": 4050
|
537 |
+
},
|
538 |
+
{
|
539 |
+
"epoch": 0.68,
|
540 |
+
"learning_rate": 3.46e-05,
|
541 |
+
"loss": 0.1305,
|
542 |
+
"step": 4100
|
543 |
+
},
|
544 |
+
{
|
545 |
+
"epoch": 0.69,
|
546 |
+
"learning_rate": 3.3690909090909096e-05,
|
547 |
+
"loss": 0.1138,
|
548 |
+
"step": 4150
|
549 |
+
},
|
550 |
+
{
|
551 |
+
"epoch": 0.7,
|
552 |
+
"learning_rate": 3.2781818181818185e-05,
|
553 |
+
"loss": 0.1275,
|
554 |
+
"step": 4200
|
555 |
+
},
|
556 |
+
{
|
557 |
+
"epoch": 0.71,
|
558 |
+
"learning_rate": 3.187272727272727e-05,
|
559 |
+
"loss": 0.0885,
|
560 |
+
"step": 4250
|
561 |
+
},
|
562 |
+
{
|
563 |
+
"epoch": 0.72,
|
564 |
+
"learning_rate": 3.096363636363637e-05,
|
565 |
+
"loss": 0.1089,
|
566 |
+
"step": 4300
|
567 |
+
},
|
568 |
+
{
|
569 |
+
"epoch": 0.72,
|
570 |
+
"learning_rate": 3.0054545454545457e-05,
|
571 |
+
"loss": 0.0838,
|
572 |
+
"step": 4350
|
573 |
+
},
|
574 |
+
{
|
575 |
+
"epoch": 0.73,
|
576 |
+
"learning_rate": 2.914545454545455e-05,
|
577 |
+
"loss": 0.0833,
|
578 |
+
"step": 4400
|
579 |
+
},
|
580 |
+
{
|
581 |
+
"epoch": 0.74,
|
582 |
+
"learning_rate": 2.8236363636363637e-05,
|
583 |
+
"loss": 0.0968,
|
584 |
+
"step": 4450
|
585 |
+
},
|
586 |
+
{
|
587 |
+
"epoch": 0.75,
|
588 |
+
"learning_rate": 2.732727272727273e-05,
|
589 |
+
"loss": 0.0962,
|
590 |
+
"step": 4500
|
591 |
+
},
|
592 |
+
{
|
593 |
+
"epoch": 0.76,
|
594 |
+
"learning_rate": 2.641818181818182e-05,
|
595 |
+
"loss": 0.0779,
|
596 |
+
"step": 4550
|
597 |
+
},
|
598 |
+
{
|
599 |
+
"epoch": 0.77,
|
600 |
+
"learning_rate": 2.550909090909091e-05,
|
601 |
+
"loss": 0.1033,
|
602 |
+
"step": 4600
|
603 |
+
},
|
604 |
+
{
|
605 |
+
"epoch": 0.78,
|
606 |
+
"learning_rate": 2.46e-05,
|
607 |
+
"loss": 0.0762,
|
608 |
+
"step": 4650
|
609 |
+
},
|
610 |
+
{
|
611 |
+
"epoch": 0.78,
|
612 |
+
"learning_rate": 2.369090909090909e-05,
|
613 |
+
"loss": 0.1111,
|
614 |
+
"step": 4700
|
615 |
+
},
|
616 |
+
{
|
617 |
+
"epoch": 0.79,
|
618 |
+
"learning_rate": 2.2781818181818182e-05,
|
619 |
+
"loss": 0.0875,
|
620 |
+
"step": 4750
|
621 |
+
},
|
622 |
+
{
|
623 |
+
"epoch": 0.8,
|
624 |
+
"learning_rate": 2.1872727272727274e-05,
|
625 |
+
"loss": 0.1337,
|
626 |
+
"step": 4800
|
627 |
+
},
|
628 |
+
{
|
629 |
+
"epoch": 0.81,
|
630 |
+
"learning_rate": 2.0963636363636366e-05,
|
631 |
+
"loss": 0.1232,
|
632 |
+
"step": 4850
|
633 |
+
},
|
634 |
+
{
|
635 |
+
"epoch": 0.82,
|
636 |
+
"learning_rate": 2.0054545454545458e-05,
|
637 |
+
"loss": 0.1153,
|
638 |
+
"step": 4900
|
639 |
+
},
|
640 |
+
{
|
641 |
+
"epoch": 0.82,
|
642 |
+
"learning_rate": 1.9145454545454546e-05,
|
643 |
+
"loss": 0.1189,
|
644 |
+
"step": 4950
|
645 |
+
},
|
646 |
+
{
|
647 |
+
"epoch": 0.83,
|
648 |
+
"learning_rate": 1.8236363636363638e-05,
|
649 |
+
"loss": 0.1137,
|
650 |
+
"step": 5000
|
651 |
+
},
|
652 |
+
{
|
653 |
+
"epoch": 0.83,
|
654 |
+
"eval_loss": 0.11552777886390686,
|
655 |
+
"eval_runtime": 2104.6449,
|
656 |
+
"eval_samples_per_second": 7.541,
|
657 |
+
"eval_steps_per_second": 0.236,
|
658 |
+
"eval_wer": 13.31084238118996,
|
659 |
+
"step": 5000
|
660 |
+
},
|
661 |
+
{
|
662 |
+
"epoch": 0.84,
|
663 |
+
"learning_rate": 1.7327272727272727e-05,
|
664 |
+
"loss": 0.1159,
|
665 |
+
"step": 5050
|
666 |
+
},
|
667 |
+
{
|
668 |
+
"epoch": 0.85,
|
669 |
+
"learning_rate": 1.641818181818182e-05,
|
670 |
+
"loss": 0.1152,
|
671 |
+
"step": 5100
|
672 |
+
},
|
673 |
+
{
|
674 |
+
"epoch": 0.86,
|
675 |
+
"learning_rate": 1.550909090909091e-05,
|
676 |
+
"loss": 0.1051,
|
677 |
+
"step": 5150
|
678 |
+
},
|
679 |
+
{
|
680 |
+
"epoch": 0.87,
|
681 |
+
"learning_rate": 1.4599999999999999e-05,
|
682 |
+
"loss": 0.1196,
|
683 |
+
"step": 5200
|
684 |
+
},
|
685 |
+
{
|
686 |
+
"epoch": 0.88,
|
687 |
+
"learning_rate": 1.3690909090909091e-05,
|
688 |
+
"loss": 0.117,
|
689 |
+
"step": 5250
|
690 |
+
},
|
691 |
+
{
|
692 |
+
"epoch": 0.88,
|
693 |
+
"learning_rate": 1.2781818181818183e-05,
|
694 |
+
"loss": 0.0972,
|
695 |
+
"step": 5300
|
696 |
+
},
|
697 |
+
{
|
698 |
+
"epoch": 0.89,
|
699 |
+
"learning_rate": 1.1872727272727273e-05,
|
700 |
+
"loss": 0.0965,
|
701 |
+
"step": 5350
|
702 |
+
},
|
703 |
+
{
|
704 |
+
"epoch": 0.9,
|
705 |
+
"learning_rate": 1.0963636363636365e-05,
|
706 |
+
"loss": 0.1008,
|
707 |
+
"step": 5400
|
708 |
+
},
|
709 |
+
{
|
710 |
+
"epoch": 1.0,
|
711 |
+
"learning_rate": 1.0054545454545455e-05,
|
712 |
+
"loss": 0.0843,
|
713 |
+
"step": 5450
|
714 |
+
},
|
715 |
+
{
|
716 |
+
"epoch": 1.01,
|
717 |
+
"learning_rate": 9.145454545454546e-06,
|
718 |
+
"loss": 0.0583,
|
719 |
+
"step": 5500
|
720 |
+
},
|
721 |
+
{
|
722 |
+
"epoch": 1.02,
|
723 |
+
"learning_rate": 8.236363636363636e-06,
|
724 |
+
"loss": 0.06,
|
725 |
+
"step": 5550
|
726 |
+
},
|
727 |
+
{
|
728 |
+
"epoch": 1.03,
|
729 |
+
"learning_rate": 7.327272727272727e-06,
|
730 |
+
"loss": 0.0601,
|
731 |
+
"step": 5600
|
732 |
+
},
|
733 |
+
{
|
734 |
+
"epoch": 1.04,
|
735 |
+
"learning_rate": 6.418181818181819e-06,
|
736 |
+
"loss": 0.0591,
|
737 |
+
"step": 5650
|
738 |
+
},
|
739 |
+
{
|
740 |
+
"epoch": 1.05,
|
741 |
+
"learning_rate": 5.50909090909091e-06,
|
742 |
+
"loss": 0.0608,
|
743 |
+
"step": 5700
|
744 |
+
},
|
745 |
+
{
|
746 |
+
"epoch": 1.05,
|
747 |
+
"learning_rate": 4.6e-06,
|
748 |
+
"loss": 0.0628,
|
749 |
+
"step": 5750
|
750 |
+
},
|
751 |
+
{
|
752 |
+
"epoch": 1.06,
|
753 |
+
"learning_rate": 3.6909090909090915e-06,
|
754 |
+
"loss": 0.0636,
|
755 |
+
"step": 5800
|
756 |
+
},
|
757 |
+
{
|
758 |
+
"epoch": 1.07,
|
759 |
+
"learning_rate": 2.781818181818182e-06,
|
760 |
+
"loss": 0.0654,
|
761 |
+
"step": 5850
|
762 |
+
},
|
763 |
+
{
|
764 |
+
"epoch": 1.08,
|
765 |
+
"learning_rate": 1.8727272727272728e-06,
|
766 |
+
"loss": 0.061,
|
767 |
+
"step": 5900
|
768 |
+
},
|
769 |
+
{
|
770 |
+
"epoch": 1.09,
|
771 |
+
"learning_rate": 9.636363636363636e-07,
|
772 |
+
"loss": 0.0559,
|
773 |
+
"step": 5950
|
774 |
+
},
|
775 |
+
{
|
776 |
+
"epoch": 1.1,
|
777 |
+
"learning_rate": 5.454545454545455e-08,
|
778 |
+
"loss": 0.0585,
|
779 |
+
"step": 6000
|
780 |
+
},
|
781 |
+
{
|
782 |
+
"epoch": 1.1,
|
783 |
+
"eval_loss": 0.10796044021844864,
|
784 |
+
"eval_runtime": 2137.698,
|
785 |
+
"eval_samples_per_second": 7.425,
|
786 |
+
"eval_steps_per_second": 0.232,
|
787 |
+
"eval_wer": 12.206885082321635,
|
788 |
+
"step": 6000
|
789 |
+
},
|
790 |
+
{
|
791 |
+
"epoch": 1.1,
|
792 |
+
"step": 6000,
|
793 |
+
"total_flos": 2.490351440560128e+19,
|
794 |
+
"train_loss": 0.17721048017342886,
|
795 |
+
"train_runtime": 61737.3829,
|
796 |
+
"train_samples_per_second": 6.22,
|
797 |
+
"train_steps_per_second": 0.097
|
798 |
+
}
|
799 |
+
],
|
800 |
+
"max_steps": 6000,
|
801 |
+
"num_train_epochs": 9223372036854775807,
|
802 |
+
"total_flos": 2.490351440560128e+19,
|
803 |
+
"trial_name": null,
|
804 |
+
"trial_params": null
|
805 |
+
}
|