hans00 committed on
Commit
2a5c81c
1 Parent(s): 9709628

Upload folder using huggingface_hub

Browse files
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<unk>": 177
3
+ }
config.json ADDED
@@ -0,0 +1,82 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "kakao-enterprise/vits-ljs",
3
+ "activation_dropout": 0.1,
4
+ "architectures": [
5
+ "VitsModel"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "depth_separable_channels": 2,
9
+ "depth_separable_num_layers": 3,
10
+ "duration_predictor_dropout": 0.5,
11
+ "duration_predictor_filter_channels": 256,
12
+ "duration_predictor_flow_bins": 10,
13
+ "duration_predictor_kernel_size": 3,
14
+ "duration_predictor_num_flows": 4,
15
+ "duration_predictor_tail_bound": 5.0,
16
+ "ffn_dim": 768,
17
+ "ffn_kernel_size": 3,
18
+ "flow_size": 192,
19
+ "hidden_act": "relu",
20
+ "hidden_dropout": 0.1,
21
+ "hidden_size": 192,
22
+ "initializer_range": 0.02,
23
+ "layer_norm_eps": 1e-05,
24
+ "layerdrop": 0.1,
25
+ "leaky_relu_slope": 0.1,
26
+ "model_type": "vits",
27
+ "noise_scale": 0.667,
28
+ "noise_scale_duration": 0.8,
29
+ "num_attention_heads": 2,
30
+ "num_hidden_layers": 6,
31
+ "num_speakers": 1,
32
+ "posterior_encoder_num_wavenet_layers": 16,
33
+ "prior_encoder_num_flows": 4,
34
+ "prior_encoder_num_wavenet_layers": 4,
35
+ "resblock_dilation_sizes": [
36
+ [
37
+ 1,
38
+ 3,
39
+ 5
40
+ ],
41
+ [
42
+ 1,
43
+ 3,
44
+ 5
45
+ ],
46
+ [
47
+ 1,
48
+ 3,
49
+ 5
50
+ ]
51
+ ],
52
+ "resblock_kernel_sizes": [
53
+ 3,
54
+ 7,
55
+ 11
56
+ ],
57
+ "sampling_rate": 22050,
58
+ "speaker_embedding_size": 0,
59
+ "speaking_rate": 1.0,
60
+ "spectrogram_bins": 513,
61
+ "transformers_version": "4.36.2",
62
+ "upsample_initial_channel": 512,
63
+ "upsample_kernel_sizes": [
64
+ 16,
65
+ 16,
66
+ 4,
67
+ 4
68
+ ],
69
+ "upsample_rates": [
70
+ 8,
71
+ 8,
72
+ 2,
73
+ 2
74
+ ],
75
+ "use_bias": true,
76
+ "use_stochastic_duration_prediction": true,
77
+ "vocab_size": 178,
78
+ "wavenet_dilation_rate": 1,
79
+ "wavenet_dropout": 0.0,
80
+ "wavenet_kernel_size": 5,
81
+ "window_size": 4
82
+ }
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c619e834e92c03fe281ed6c738e5b2acc6251f25a014c23e6a69780de0266aba
3
+ size 114392346
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01ee43468408cc825b926548e3a713b0bdcbbe86aa55964ef50329c138ccbded
3
+ size 38471858
quantize_config.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Sqrt",
8
+ "Split",
9
+ "LessOrEqual",
10
+ "ReduceMean",
11
+ "LeakyRelu",
12
+ "Equal",
13
+ "Not",
14
+ "Add",
15
+ "CumSum",
16
+ "GatherElements",
17
+ "Sigmoid",
18
+ "Less",
19
+ "Where",
20
+ "Ceil",
21
+ "Concat",
22
+ "Transpose",
23
+ "Expand",
24
+ "Mul",
25
+ "Gather",
26
+ "Pow",
27
+ "RandomNormalLike",
28
+ "Softmax",
29
+ "Shape",
30
+ "NonZero",
31
+ "Tanh",
32
+ "Sub",
33
+ "Slice",
34
+ "Exp",
35
+ "Div",
36
+ "MatMul",
37
+ "GreaterOrEqual",
38
+ "ReduceSum",
39
+ "Cast",
40
+ "Unsqueeze",
41
+ "Softplus",
42
+ "ScatterND",
43
+ "GatherND",
44
+ "Pad",
45
+ "Clip",
46
+ "ReduceMax",
47
+ "ConvTranspose",
48
+ "Neg",
49
+ "Squeeze",
50
+ "Erf",
51
+ "Range",
52
+ "Conv",
53
+ "ConstantOfShape",
54
+ "Relu",
55
+ "Reshape",
56
+ "Constant",
57
+ "And"
58
+ ],
59
+ "weight_type": "QUInt8"
60
+ }
61
+ }
62
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "pad_token": "_",
3
+ "unk_token": "<unk>"
4
+ }
tokenizer.json ADDED
@@ -0,0 +1,235 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 177,
8
+ "content": "<unk>",
9
+ "single_word": false,
10
+ "lstrip": false,
11
+ "rstrip": false,
12
+ "normalized": false,
13
+ "special": true
14
+ }
15
+ ],
16
+ "normalizer": {
17
+ "type": "Sequence",
18
+ "normalizers": [
19
+ {
20
+ "type": "Lowercase"
21
+ },
22
+ {
23
+ "type": "Replace",
24
+ "pattern": {
25
+ "Regex": "[^_;:,.!?\u00a1\u00bf\u2014\u2026\"\u00ab\u00bb\u201c\u201d ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz\u0251\u0250\u0252\u00e6\u0253\u0299\u03b2\u0254\u0255\u00e7\u0257\u0256\u00f0\u02a4\u0259\u0258\u025a\u025b\u025c\u025d\u025e\u025f\u0284\u0261\u0260\u0262\u029b\u0266\u0267\u0127\u0265\u029c\u0268\u026a\u029d\u026d\u026c\u026b\u026e\u029f\u0271\u026f\u0270\u014b\u0273\u0272\u0274\u00f8\u0275\u0278\u03b8\u0153\u0276\u0298\u0279\u027a\u027e\u027b\u0280\u0281\u027d\u0282\u0283\u0288\u02a7\u0289\u028a\u028b\u2c71\u028c\u0263\u0264\u028d\u03c7\u028e\u028f\u0291\u0290\u0292\u0294\u02a1\u0295\u02a2\u01c0\u01c1\u01c2\u01c3\u02c8\u02cc\u02d0\u02d1\u02bc\u02b4\u02b0\u02b1\u02b2\u02b7\u02e0\u02e4\u02de\u2193\u2191\u2192\u2197\u2198\u0329']"
26
+ },
27
+ "content": ""
28
+ },
29
+ {
30
+ "type": "Strip",
31
+ "strip_left": true,
32
+ "strip_right": true
33
+ },
34
+ {
35
+ "type": "Replace",
36
+ "pattern": {
37
+ "Regex": "(?=.)|(?<!^)$"
38
+ },
39
+ "content": "_"
40
+ }
41
+ ]
42
+ },
43
+ "pre_tokenizer": {
44
+ "type": "Split",
45
+ "pattern": {
46
+ "Regex": ""
47
+ },
48
+ "behavior": "Isolated",
49
+ "invert": false
50
+ },
51
+ "post_processor": null,
52
+ "decoder": null,
53
+ "model": {
54
+ "vocab": {
55
+ "_": 0,
56
+ ";": 1,
57
+ ":": 2,
58
+ ",": 3,
59
+ ".": 4,
60
+ "!": 5,
61
+ "?": 6,
62
+ "\u00a1": 7,
63
+ "\u00bf": 8,
64
+ "\u2014": 9,
65
+ "\u2026": 10,
66
+ "\"": 11,
67
+ "\u00ab": 12,
68
+ "\u00bb": 13,
69
+ "\u201c": 14,
70
+ "\u201d": 15,
71
+ " ": 16,
72
+ "A": 17,
73
+ "B": 18,
74
+ "C": 19,
75
+ "D": 20,
76
+ "E": 21,
77
+ "F": 22,
78
+ "G": 23,
79
+ "H": 24,
80
+ "I": 25,
81
+ "J": 26,
82
+ "K": 27,
83
+ "L": 28,
84
+ "M": 29,
85
+ "N": 30,
86
+ "O": 31,
87
+ "P": 32,
88
+ "Q": 33,
89
+ "R": 34,
90
+ "S": 35,
91
+ "T": 36,
92
+ "U": 37,
93
+ "V": 38,
94
+ "W": 39,
95
+ "X": 40,
96
+ "Y": 41,
97
+ "Z": 42,
98
+ "a": 43,
99
+ "b": 44,
100
+ "c": 45,
101
+ "d": 46,
102
+ "e": 47,
103
+ "f": 48,
104
+ "g": 49,
105
+ "h": 50,
106
+ "i": 51,
107
+ "j": 52,
108
+ "k": 53,
109
+ "l": 54,
110
+ "m": 55,
111
+ "n": 56,
112
+ "o": 57,
113
+ "p": 58,
114
+ "q": 59,
115
+ "r": 60,
116
+ "s": 61,
117
+ "t": 62,
118
+ "u": 63,
119
+ "v": 64,
120
+ "w": 65,
121
+ "x": 66,
122
+ "y": 67,
123
+ "z": 68,
124
+ "\u0251": 69,
125
+ "\u0250": 70,
126
+ "\u0252": 71,
127
+ "\u00e6": 72,
128
+ "\u0253": 73,
129
+ "\u0299": 74,
130
+ "\u03b2": 75,
131
+ "\u0254": 76,
132
+ "\u0255": 77,
133
+ "\u00e7": 78,
134
+ "\u0257": 79,
135
+ "\u0256": 80,
136
+ "\u00f0": 81,
137
+ "\u02a4": 82,
138
+ "\u0259": 83,
139
+ "\u0258": 84,
140
+ "\u025a": 85,
141
+ "\u025b": 86,
142
+ "\u025c": 87,
143
+ "\u025d": 88,
144
+ "\u025e": 89,
145
+ "\u025f": 90,
146
+ "\u0284": 91,
147
+ "\u0261": 92,
148
+ "\u0260": 93,
149
+ "\u0262": 94,
150
+ "\u029b": 95,
151
+ "\u0266": 96,
152
+ "\u0267": 97,
153
+ "\u0127": 98,
154
+ "\u0265": 99,
155
+ "\u029c": 100,
156
+ "\u0268": 101,
157
+ "\u026a": 102,
158
+ "\u029d": 103,
159
+ "\u026d": 104,
160
+ "\u026c": 105,
161
+ "\u026b": 106,
162
+ "\u026e": 107,
163
+ "\u029f": 108,
164
+ "\u0271": 109,
165
+ "\u026f": 110,
166
+ "\u0270": 111,
167
+ "\u014b": 112,
168
+ "\u0273": 113,
169
+ "\u0272": 114,
170
+ "\u0274": 115,
171
+ "\u00f8": 116,
172
+ "\u0275": 117,
173
+ "\u0278": 118,
174
+ "\u03b8": 119,
175
+ "\u0153": 120,
176
+ "\u0276": 121,
177
+ "\u0298": 122,
178
+ "\u0279": 123,
179
+ "\u027a": 124,
180
+ "\u027e": 125,
181
+ "\u027b": 126,
182
+ "\u0280": 127,
183
+ "\u0281": 128,
184
+ "\u027d": 129,
185
+ "\u0282": 130,
186
+ "\u0283": 131,
187
+ "\u0288": 132,
188
+ "\u02a7": 133,
189
+ "\u0289": 134,
190
+ "\u028a": 135,
191
+ "\u028b": 136,
192
+ "\u2c71": 137,
193
+ "\u028c": 138,
194
+ "\u0263": 139,
195
+ "\u0264": 140,
196
+ "\u028d": 141,
197
+ "\u03c7": 142,
198
+ "\u028e": 143,
199
+ "\u028f": 144,
200
+ "\u0291": 145,
201
+ "\u0290": 146,
202
+ "\u0292": 147,
203
+ "\u0294": 148,
204
+ "\u02a1": 149,
205
+ "\u0295": 150,
206
+ "\u02a2": 151,
207
+ "\u01c0": 152,
208
+ "\u01c1": 153,
209
+ "\u01c2": 154,
210
+ "\u01c3": 155,
211
+ "\u02c8": 156,
212
+ "\u02cc": 157,
213
+ "\u02d0": 158,
214
+ "\u02d1": 159,
215
+ "\u02bc": 160,
216
+ "\u02b4": 161,
217
+ "\u02b0": 162,
218
+ "\u02b1": 163,
219
+ "\u02b2": 164,
220
+ "\u02b7": 165,
221
+ "\u02e0": 166,
222
+ "\u02e4": 167,
223
+ "\u02de": 168,
224
+ "\u2193": 169,
225
+ "\u2191": 170,
226
+ "\u2192": 171,
227
+ "\u2197": 172,
228
+ "\u2198": 173,
229
+ "null": 174,
230
+ "\u0329": 175,
231
+ "'": 176,
232
+ "<unk>": 177
233
+ }
234
+ }
235
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_blank": true,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "_",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "177": {
13
+ "content": "<unk>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ }
20
+ },
21
+ "clean_up_tokenization_spaces": true,
22
+ "is_uroman": false,
23
+ "language": null,
24
+ "model_max_length": 1000000000000000019884624838656,
25
+ "normalize": true,
26
+ "pad_token": "_",
27
+ "phonemize": true,
28
+ "tokenizer_class": "VitsTokenizer",
29
+ "unk_token": "<unk>"
30
+ }
vocab.json ADDED
@@ -0,0 +1,179 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ " ": 16,
3
+ "!": 5,
4
+ "\"": 11,
5
+ "'": 176,
6
+ ",": 3,
7
+ ".": 4,
8
+ ":": 2,
9
+ ";": 1,
10
+ "?": 6,
11
+ "A": 17,
12
+ "B": 18,
13
+ "C": 19,
14
+ "D": 20,
15
+ "E": 21,
16
+ "F": 22,
17
+ "G": 23,
18
+ "H": 24,
19
+ "I": 25,
20
+ "J": 26,
21
+ "K": 27,
22
+ "L": 28,
23
+ "M": 29,
24
+ "N": 30,
25
+ "O": 31,
26
+ "P": 32,
27
+ "Q": 33,
28
+ "R": 34,
29
+ "S": 35,
30
+ "T": 36,
31
+ "U": 37,
32
+ "V": 38,
33
+ "W": 39,
34
+ "X": 40,
35
+ "Y": 41,
36
+ "Z": 42,
37
+ "_": 0,
38
+ "a": 43,
39
+ "b": 44,
40
+ "c": 45,
41
+ "d": 46,
42
+ "e": 47,
43
+ "f": 48,
44
+ "g": 49,
45
+ "h": 50,
46
+ "i": 51,
47
+ "j": 52,
48
+ "k": 53,
49
+ "l": 54,
50
+ "m": 55,
51
+ "n": 56,
52
+ "o": 57,
53
+ "p": 58,
54
+ "q": 59,
55
+ "r": 60,
56
+ "s": 61,
57
+ "t": 62,
58
+ "u": 63,
59
+ "v": 64,
60
+ "w": 65,
61
+ "x": 66,
62
+ "y": 67,
63
+ "z": 68,
64
+ "¡": 7,
65
+ "«": 12,
66
+ "»": 13,
67
+ "¿": 8,
68
+ "æ": 72,
69
+ "ç": 78,
70
+ "ð": 81,
71
+ "ø": 116,
72
+ "ħ": 98,
73
+ "ŋ": 112,
74
+ "œ": 120,
75
+ "ǀ": 152,
76
+ "ǁ": 153,
77
+ "ǂ": 154,
78
+ "ǃ": 155,
79
+ "ɐ": 70,
80
+ "ɑ": 69,
81
+ "ɒ": 71,
82
+ "ɓ": 73,
83
+ "ɔ": 76,
84
+ "ɕ": 77,
85
+ "ɖ": 80,
86
+ "ɗ": 79,
87
+ "ɘ": 84,
88
+ "ə": 83,
89
+ "ɚ": 85,
90
+ "ɛ": 86,
91
+ "ɜ": 87,
92
+ "ɝ": 88,
93
+ "ɞ": 89,
94
+ "ɟ": 90,
95
+ "ɠ": 93,
96
+ "ɡ": 92,
97
+ "ɢ": 94,
98
+ "ɣ": 139,
99
+ "ɤ": 140,
100
+ "ɥ": 99,
101
+ "ɦ": 96,
102
+ "ɧ": 97,
103
+ "ɨ": 101,
104
+ "ɪ": 102,
105
+ "ɫ": 106,
106
+ "ɬ": 105,
107
+ "ɭ": 104,
108
+ "ɮ": 107,
109
+ "ɯ": 110,
110
+ "ɰ": 111,
111
+ "ɱ": 109,
112
+ "ɲ": 114,
113
+ "ɳ": 113,
114
+ "ɴ": 115,
115
+ "ɵ": 117,
116
+ "ɶ": 121,
117
+ "ɸ": 118,
118
+ "ɹ": 123,
119
+ "ɺ": 124,
120
+ "ɻ": 126,
121
+ "ɽ": 129,
122
+ "ɾ": 125,
123
+ "ʀ": 127,
124
+ "ʁ": 128,
125
+ "ʂ": 130,
126
+ "ʃ": 131,
127
+ "ʄ": 91,
128
+ "ʈ": 132,
129
+ "ʉ": 134,
130
+ "ʊ": 135,
131
+ "ʋ": 136,
132
+ "ʌ": 138,
133
+ "ʍ": 141,
134
+ "ʎ": 143,
135
+ "ʏ": 144,
136
+ "ʐ": 146,
137
+ "ʑ": 145,
138
+ "ʒ": 147,
139
+ "ʔ": 148,
140
+ "ʕ": 150,
141
+ "ʘ": 122,
142
+ "ʙ": 74,
143
+ "ʛ": 95,
144
+ "ʜ": 100,
145
+ "ʝ": 103,
146
+ "ʟ": 108,
147
+ "ʡ": 149,
148
+ "ʢ": 151,
149
+ "ʤ": 82,
150
+ "ʧ": 133,
151
+ "ʰ": 162,
152
+ "ʱ": 163,
153
+ "ʲ": 164,
154
+ "ʴ": 161,
155
+ "ʷ": 165,
156
+ "ʼ": 160,
157
+ "ˈ": 156,
158
+ "ˌ": 157,
159
+ "ː": 158,
160
+ "ˑ": 159,
161
+ "˞": 168,
162
+ "ˠ": 166,
163
+ "ˤ": 167,
164
+ "̩": 175,
165
+ "β": 75,
166
+ "θ": 119,
167
+ "χ": 142,
168
+ "ᵻ": 177,
169
+ "—": 9,
170
+ "“": 14,
171
+ "”": 15,
172
+ "…": 10,
173
+ "↑": 170,
174
+ "→": 171,
175
+ "↓": 169,
176
+ "↗": 172,
177
+ "↘": 173,
178
+ "ⱱ": 137
179
+ }