Dmitry Chaplinsky
committed on
Commit
·
0d6fc75
1
Parent(s):
3cfa162
Updated model: 655 splits, 23.39 epochs, min_loss: 1.0425, min_ppl: 2.8364
Browse files
- best-lm.pt +1 -1
- loss.txt +11 -0
best-lm.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 22791455
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7df0bbeffbb8943d939a0dde1486d555a05c93359999bda14dc4370ab23c0424
|
3 |
size 22791455
|
loss.txt
CHANGED
@@ -642,3 +642,14 @@ TEST: valid loss 1.0437 | valid ppl 2.8396
|
|
642 |
| end of split 137 / 28 | epoch 19 | time: 3774.11s | valid loss 1.0428 | valid ppl 2.8371 | learning rate 5.0000
|
643 |
| end of split 138 / 28 | epoch 19 | time: 3776.83s | valid loss 1.0427 | valid ppl 2.8369 | learning rate 5.0000
|
644 |
| end of split 139 / 28 | epoch 19 | time: 3775.57s | valid loss 1.0426 | valid ppl 2.8367 | learning rate 5.0000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
642 |
| end of split 137 / 28 | epoch 19 | time: 3774.11s | valid loss 1.0428 | valid ppl 2.8371 | learning rate 5.0000
|
643 |
| end of split 138 / 28 | epoch 19 | time: 3776.83s | valid loss 1.0427 | valid ppl 2.8369 | learning rate 5.0000
|
644 |
| end of split 139 / 28 | epoch 19 | time: 3775.57s | valid loss 1.0426 | valid ppl 2.8367 | learning rate 5.0000
|
645 |
+
| end of split 140 / 28 | epoch 19 | time: 3774.84s | valid loss 1.0426 | valid ppl 2.8367 | learning rate 5.0000
|
646 |
+
| end of split 141 / 28 | epoch 19 | time: 1089.42s | valid loss 1.0429 | valid ppl 2.8373 | learning rate 5.0000
|
647 |
+
| end of split 142 / 28 | epoch 19 | time: 3781.20s | valid loss 1.0427 | valid ppl 2.8369 | learning rate 5.0000
|
648 |
+
| end of split 143 / 28 | epoch 19 | time: 3774.42s | valid loss 1.0426 | valid ppl 2.8367 | learning rate 5.0000
|
649 |
+
| end of split 144 / 28 | epoch 19 | time: 3771.17s | valid loss 1.0426 | valid ppl 2.8366 | learning rate 5.0000
|
650 |
+
| end of split 145 / 28 | epoch 19 | time: 3774.23s | valid loss 1.0425 | valid ppl 2.8364 | learning rate 5.0000
|
651 |
+
| end of split 118 / 28 | epoch 20 | time: 3768.43s | valid loss 1.0426 | valid ppl 2.8366 | learning rate 5.0000
|
652 |
+
| end of split 119 / 28 | epoch 20 | time: 3769.09s | valid loss 1.0425 | valid ppl 2.8362 | learning rate 5.0000
|
653 |
+
| end of split 120 / 28 | epoch 20 | time: 3773.51s | valid loss 1.0425 | valid ppl 2.8363 | learning rate 5.0000
|
654 |
+
| end of split 121 / 28 | epoch 20 | time: 3773.63s | valid loss 1.0426 | valid ppl 2.8365 | learning rate 5.0000
|
655 |
+
| end of split 122 / 28 | epoch 20 | time: 3772.94s | valid loss 1.0427 | valid ppl 2.8369 | learning rate 5.0000
|