{
  "data": {
    "text_cleaners": [
      "cjke_cleaners2"
    ],
    "sampling_rate": 22050,
    "filter_length": 1024,
    "hop_length": 256,
    "win_length": 1024,
    "n_mel_channels": 80,
    "add_blank": true,
    "cleaned_text": true,
    "n_speakers": 10
  },
  "model": {
    "inter_channels": 192,
    "hidden_channels": 192,
    "filter_channels": 768,
    "n_heads": 2,
    "n_layers": 6,
    "n_layers_trans_flow": 3,
    "kernel_size": 3,
    "p_dropout": 0.1,
    "resblock": "1",
    "resblock_kernel_sizes": [
      3,
      7,
      11
    ],
    "resblock_dilation_sizes": [
      [
        1,
        3,
        5
      ],
      [
        1,
        3,
        5
      ],
      [
        1,
        3,
        5
      ]
    ],
    "upsample_rates": [
      8,
      8,
      2,
      2
    ],
    "upsample_initial_channel": 512,
    "upsample_kernel_sizes": [
      16,
      16,
      4,
      4
    ],
    "n_layers_q": 3,
    "use_spectral_norm": false,
    "gin_channels": 256
  },
  "symbols": [
    "_",
    ",",
    ".",
    "!",
    "?",
    "-",
    "~",
    "\u2026",
    "N",
    "Q",
    "a",
    "b",
    "d",
    "e",
    "f",
    "g",
    "h",
    "i",
    "j",
    "k",
    "l",
    "m",
    "n",
    "o",
    "p",
    "s",
    "t",
    "u",
    "v",
    "w",
    "x",
    "y",
    "z",
    "\u0251",
    "\u00e6",
    "\u0283",
    "\u0291",
    "\u00e7",
    "\u026f",
    "\u026a",
    "\u0254",
    "\u025b",
    "\u0279",
    "\u00f0",
    "\u0259",
    "\u026b",
    "\u0265",
    "\u0278",
    "\u028a",
    "\u027e",
    "\u0292",
    "\u03b8",
    "\u03b2",
    "\u014b",
    "\u0266",
    "\u207c",
    "\u02b0",
    "`",
    "^",
    "#",
    "*",
    "=",
    "\u02c8",
    "\u02cc",
    "\u2192",
    "\u2193",
    "\u2191",
    " "
  ],
  "speakers": {
    "default": 0
  }
}