Initial Upload
Browse files- config.yaml +25 -0
- gcmvn_stats.npz +3 -0
- hifigan.bin +3 -0
- hifigan.json +37 -0
- transcript_a.pt +3 -0
- vocab.txt +77 -0
config.yaml
ADDED
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
features:
|
2 |
+
eps: 1.0e-05
|
3 |
+
f_max: 8000
|
4 |
+
f_min: 20
|
5 |
+
hop_len_t: 0.011609977324263039
|
6 |
+
hop_length: 256
|
7 |
+
n_fft: 1024
|
8 |
+
n_mels: 80
|
9 |
+
n_stft: 513
|
10 |
+
sample_rate: 22050
|
11 |
+
type: spectrogram+melscale+log
|
12 |
+
win_len_t: 0.046439909297052155
|
13 |
+
win_length: 1024
|
14 |
+
window_fn: hann
|
15 |
+
global_cmvn:
|
16 |
+
stats_npz_path: gcmvn_stats.npz
|
17 |
+
sample_rate: 22050
|
18 |
+
transforms:
|
19 |
+
'*':
|
20 |
+
- global_cmvn
|
21 |
+
vocab_filename: vocab.txt
|
22 |
+
vocoder:
|
23 |
+
type: hifigan
|
24 |
+
config: hifigan.json
|
25 |
+
checkpoint: hifigan.bin
|
gcmvn_stats.npz
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae721fd82149867ffd979be2f24eac27e0e6449de91ea85046e866487afca6b2
|
3 |
+
size 1140
|
hifigan.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2ee4ed2333b84fa3b5c93d31e9f5981c60d9e747a7ea393c62e83687d054940
|
3 |
+
size 55818654
|
hifigan.json
ADDED
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"resblock": "1",
|
3 |
+
"num_gpus": 0,
|
4 |
+
"batch_size": 16,
|
5 |
+
"learning_rate": 0.0002,
|
6 |
+
"adam_b1": 0.8,
|
7 |
+
"adam_b2": 0.99,
|
8 |
+
"lr_decay": 0.999,
|
9 |
+
"seed": 1234,
|
10 |
+
|
11 |
+
"upsample_rates": [8,8,2,2],
|
12 |
+
"upsample_kernel_sizes": [16,16,4,4],
|
13 |
+
"upsample_initial_channel": 512,
|
14 |
+
"resblock_kernel_sizes": [3,7,11],
|
15 |
+
"resblock_dilation_sizes": [[1,3,5], [1,3,5], [1,3,5]],
|
16 |
+
|
17 |
+
"segment_size": 8192,
|
18 |
+
"num_mels": 80,
|
19 |
+
"num_freq": 1025,
|
20 |
+
"n_fft": 1024,
|
21 |
+
"hop_size": 256,
|
22 |
+
"win_size": 1024,
|
23 |
+
|
24 |
+
"sampling_rate": 22050,
|
25 |
+
|
26 |
+
"fmin": 0,
|
27 |
+
"fmax": 8000,
|
28 |
+
"fmax_for_loss": null,
|
29 |
+
|
30 |
+
"num_workers": 4,
|
31 |
+
|
32 |
+
"dist_config": {
|
33 |
+
"dist_backend": "nccl",
|
34 |
+
"dist_url": "tcp://localhost:54321",
|
35 |
+
"world_size": 1
|
36 |
+
}
|
37 |
+
}
|
transcript_a.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df6e70b7ef51e2667cfb4c56a3652751482700d344b503891595665ec75117c0
|
3 |
+
size 653182043
|
vocab.txt
ADDED
@@ -0,0 +1,77 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
| 121629
|
2 |
+
T 26543
|
3 |
+
N 21566
|
4 |
+
AH0 19303
|
5 |
+
, 16607
|
6 |
+
S 14270
|
7 |
+
D 13421
|
8 |
+
R 12691
|
9 |
+
AH1 11712
|
10 |
+
L 11443
|
11 |
+
IH1 11117
|
12 |
+
DH 10829
|
13 |
+
AY1 9874
|
14 |
+
K 9382
|
15 |
+
AE1 9136
|
16 |
+
EH1 8980
|
17 |
+
W 8744
|
18 |
+
M 8619
|
19 |
+
UW1 8343
|
20 |
+
Z 7827
|
21 |
+
IH0 6512
|
22 |
+
. 6354
|
23 |
+
OW1 6247
|
24 |
+
IY1 6221
|
25 |
+
V 6107
|
26 |
+
B 5939
|
27 |
+
AA1 5670
|
28 |
+
Y 5232
|
29 |
+
P 4952
|
30 |
+
IY0 4683
|
31 |
+
AO1 4650
|
32 |
+
F 4477
|
33 |
+
EY1 4445
|
34 |
+
HH 4356
|
35 |
+
ER0 4115
|
36 |
+
NG 4029
|
37 |
+
G 3538
|
38 |
+
TH 2209
|
39 |
+
AW1 2172
|
40 |
+
JH 1740
|
41 |
+
UH1 1659
|
42 |
+
SH 1346
|
43 |
+
CH 1242
|
44 |
+
ER1 1204
|
45 |
+
- 504
|
46 |
+
? 470
|
47 |
+
EY2 423
|
48 |
+
IH2 348
|
49 |
+
EH2 309
|
50 |
+
OW0 286
|
51 |
+
OW2 255
|
52 |
+
AA2 244
|
53 |
+
OY1 234
|
54 |
+
AY2 217
|
55 |
+
AH2 188
|
56 |
+
EH0 182
|
57 |
+
AE2 165
|
58 |
+
ZH 146
|
59 |
+
AO2 137
|
60 |
+
UW0 116
|
61 |
+
IY2 95
|
62 |
+
UW2 81
|
63 |
+
AE0 78
|
64 |
+
AY0 63
|
65 |
+
AO0 47
|
66 |
+
AA0 43
|
67 |
+
AW2 40
|
68 |
+
EY0 36
|
69 |
+
UH2 33
|
70 |
+
ER2 22
|
71 |
+
OY2 22
|
72 |
+
AW0 11
|
73 |
+
' 9
|
74 |
+
UH0 9
|
75 |
+
.. 4
|
76 |
+
OY0 1
|
77 |
+
! 1
|