bayartsogt
committed on
Commit
•
2587880
1
Parent(s):
f8da4c9
init
Browse files
- README.md +17 -0
- config.yaml +24 -0
- gcmvn_stats.npz +0 -0
- pytorch_model.pt +3 -0
- speakers.txt +1 -0
- spm_char.model +3 -0
- spm_char.txt +40 -0
- spm_char.vocab +44 -0
README.md
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: fairseq
|
3 |
+
task: text-to-speech
|
4 |
+
tags:
|
5 |
+
- fairseq
|
6 |
+
- audio
|
7 |
+
- text-to-speech
|
8 |
+
language: mn
|
9 |
+
datasets:
|
10 |
+
- mbspeech
|
11 |
+
---
|
12 |
+
# tts_transformer-mn-mbspeech
|
13 |
+
[Transformer](https://arxiv.org/abs/1809.08895) text-to-speech model from fairseq S^2 ([paper](https://arxiv.org/abs/2109.06912)/[code](https://github.com/pytorch/fairseq/tree/main/examples/speech_synthesis)):
|
14 |
+
- Mongolian
|
15 |
+
- Single-speaker male voice
|
16 |
+
- Trained on [MBSpeech](https://github.com/tugstugi/mongolian-nlp/blob/master/datasets/MBSpeech-1.0-csv.zip)
|
17 |
+
|
config.yaml
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
bpe_tokenizer:
|
2 |
+
bpe: sentencepiece
|
3 |
+
sentencepiece_model: spm_char.model
|
4 |
+
features:
|
5 |
+
eps: 1.0e-05
|
6 |
+
f_max: 8000
|
7 |
+
f_min: 20
|
8 |
+
hop_len_t: 0.011609977324263039
|
9 |
+
hop_length: 256
|
10 |
+
n_fft: 1024
|
11 |
+
n_mels: 80
|
12 |
+
n_stft: 513
|
13 |
+
sample_rate: 22050
|
14 |
+
type: spectrogram+melscale+log
|
15 |
+
win_len_t: 0.046439909297052155
|
16 |
+
win_length: 1024
|
17 |
+
window_fn: hann
|
18 |
+
global_cmvn:
|
19 |
+
stats_npz_path: gcmvn_stats.npz
|
20 |
+
sample_rate: 22050
|
21 |
+
transforms:
|
22 |
+
'*':
|
23 |
+
- global_cmvn
|
24 |
+
vocab_filename: spm_char.txt
|
gcmvn_stats.npz
ADDED
Binary file (1.14 kB). View file
|
|
pytorch_model.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb65454af66ec96eef3825fab2a9fd66ed604282eba7c0c4b34e7306ce0b8730
|
3 |
+
size 652966179
|
speakers.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
mbspeech
|
spm_char.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c3ac7e7fcce150657c687f1bb3d5980bd7ce97d632540b4c1334064426d4e47
|
3 |
+
size 238217
|
spm_char.txt
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
▁ 1
|
2 |
+
а 1
|
3 |
+
н 1
|
4 |
+
э 1
|
5 |
+
г 1
|
6 |
+
р 1
|
7 |
+
и 1
|
8 |
+
д 1
|
9 |
+
х 1
|
10 |
+
л 1
|
11 |
+
ү 1
|
12 |
+
т 1
|
13 |
+
о 1
|
14 |
+
й 1
|
15 |
+
у 1
|
16 |
+
ө 1
|
17 |
+
с 1
|
18 |
+
б 1
|
19 |
+
м 1
|
20 |
+
в 1
|
21 |
+
. 1
|
22 |
+
ч 1
|
23 |
+
з 1
|
24 |
+
ж 1
|
25 |
+
ы 1
|
26 |
+
е 1
|
27 |
+
, 1
|
28 |
+
ь 1
|
29 |
+
ш 1
|
30 |
+
ц 1
|
31 |
+
я 1
|
32 |
+
ю 1
|
33 |
+
ё 1
|
34 |
+
к 1
|
35 |
+
ф 1
|
36 |
+
п 1
|
37 |
+
! 1
|
38 |
+
? 1
|
39 |
+
ъ 1
|
40 |
+
щ 1
|
spm_char.vocab
ADDED
@@ -0,0 +1,44 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
<s> 0
|
2 |
+
<pad> 0
|
3 |
+
</s> 0
|
4 |
+
<unk> 0
|
5 |
+
▁ -1.87835
|
6 |
+
а -2.3376
|
7 |
+
н -2.66474
|
8 |
+
э -2.67631
|
9 |
+
г -3.00228
|
10 |
+
р -3.081
|
11 |
+
и -3.1159
|
12 |
+
д -3.1658
|
13 |
+
х -3.2745
|
14 |
+
л -3.31839
|
15 |
+
ү -3.36249
|
16 |
+
т -3.43907
|
17 |
+
о -3.4786
|
18 |
+
й -3.4863
|
19 |
+
у -3.49546
|
20 |
+
ө -3.78138
|
21 |
+
с -3.79323
|
22 |
+
б -3.79863
|
23 |
+
м -4.01439
|
24 |
+
в -4.19775
|
25 |
+
. -4.37665
|
26 |
+
ч -4.46334
|
27 |
+
з -4.52161
|
28 |
+
ж -4.64295
|
29 |
+
ы -4.76725
|
30 |
+
е -4.81287
|
31 |
+
, -4.81325
|
32 |
+
ь -4.84147
|
33 |
+
ш -5.19829
|
34 |
+
ц -5.46254
|
35 |
+
я -5.75058
|
36 |
+
ю -6.61326
|
37 |
+
ё -6.61552
|
38 |
+
к -6.68832
|
39 |
+
ф -6.75376
|
40 |
+
п -7.32121
|
41 |
+
! -8.05174
|
42 |
+
? -8.05174
|
43 |
+
ъ -9.32131
|
44 |
+
щ -13.3988
|