mychen76 committed on
Commit
510e0f5
1 Parent(s): ce9abc9
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. ar/ar_JO/kareem/low/MODEL_CARD +15 -0
  2. ar/ar_JO/kareem/low/ar_JO-kareem-low.onnx +3 -0
  3. ar/ar_JO/kareem/low/ar_JO-kareem-low.onnx.json +508 -0
  4. ar/ar_JO/kareem/low/samples/speaker_0.mp3 +0 -0
  5. ar/ar_JO/kareem/medium/MODEL_CARD +15 -0
  6. ar/ar_JO/kareem/medium/ar_JO-kareem-medium.onnx +3 -0
  7. ar/ar_JO/kareem/medium/ar_JO-kareem-medium.onnx.json +508 -0
  8. ar/ar_JO/kareem/medium/samples/speaker_0.mp3 +0 -0
  9. ca/ca_ES/upc_ona/medium/MODEL_CARD +15 -0
  10. ca/ca_ES/upc_ona/medium/ca_ES-upc_ona-medium.onnx +3 -0
  11. ca/ca_ES/upc_ona/medium/ca_ES-upc_ona-medium.onnx.json +493 -0
  12. ca/ca_ES/upc_ona/medium/samples/speaker_0.mp3 +0 -0
  13. ca/ca_ES/upc_ona/x_low/ALIASES +1 -0
  14. ca/ca_ES/upc_ona/x_low/MODEL_CARD +15 -0
  15. ca/ca_ES/upc_ona/x_low/ca_ES-upc_ona-x_low.onnx +3 -0
  16. ca/ca_ES/upc_ona/x_low/ca_ES-upc_ona-x_low.onnx.json +420 -0
  17. ca/ca_ES/upc_ona/x_low/samples/speaker_0.mp3 +0 -0
  18. ca/ca_ES/upc_pau/x_low/ALIASES +1 -0
  19. ca/ca_ES/upc_pau/x_low/MODEL_CARD +15 -0
  20. ca/ca_ES/upc_pau/x_low/ca_ES-upc_pau-x_low.onnx +3 -0
  21. ca/ca_ES/upc_pau/x_low/ca_ES-upc_pau-x_low.onnx.json +420 -0
  22. ca/ca_ES/upc_pau/x_low/samples/speaker_0.mp3 +0 -0
  23. cs/cs_CZ/jirka/low/MODEL_CARD +15 -0
  24. cs/cs_CZ/jirka/low/cs_CZ-jirka-low.onnx +3 -0
  25. cs/cs_CZ/jirka/low/cs_CZ-jirka-low.onnx.json +508 -0
  26. cs/cs_CZ/jirka/low/samples/speaker_0.mp3 +0 -0
  27. cs/cs_CZ/jirka/medium/MODEL_CARD +15 -0
  28. cs/cs_CZ/jirka/medium/cs_CZ-jirka-medium.onnx +3 -0
  29. cs/cs_CZ/jirka/medium/cs_CZ-jirka-medium.onnx.json +508 -0
  30. cs/cs_CZ/jirka/medium/samples/speaker_0.mp3 +0 -0
  31. da/da_DK/talesyntese/medium/ALIASES +1 -0
  32. da/da_DK/talesyntese/medium/MODEL_CARD +15 -0
  33. da/da_DK/talesyntese/medium/da_DK-talesyntese-medium.onnx +3 -0
  34. da/da_DK/talesyntese/medium/da_DK-talesyntese-medium.onnx.json +493 -0
  35. da/da_DK/talesyntese/medium/samples/speaker_0.mp3 +0 -0
  36. de/de_DE/eva_k/x_low/ALIASES +1 -0
  37. de/de_DE/eva_k/x_low/MODEL_CARD +15 -0
  38. de/de_DE/eva_k/x_low/de_DE-eva_k-x_low.onnx +3 -0
  39. de/de_DE/eva_k/x_low/de_DE-eva_k-x_low.onnx.json +420 -0
  40. de/de_DE/eva_k/x_low/samples/speaker_0.mp3 +0 -0
  41. de/de_DE/karlsson/low/ALIASES +1 -0
  42. de/de_DE/karlsson/low/MODEL_CARD +15 -0
  43. de/de_DE/karlsson/low/de_DE-karlsson-low.onnx +3 -0
  44. de/de_DE/karlsson/low/de_DE-karlsson-low.onnx.json +420 -0
  45. de/de_DE/karlsson/low/samples/speaker_0.mp3 +0 -0
  46. de/de_DE/kerstin/low/ALIASES +1 -0
  47. de/de_DE/kerstin/low/MODEL_CARD +15 -0
  48. de/de_DE/kerstin/low/de_DE-kerstin-low.onnx +3 -0
  49. de/de_DE/kerstin/low/de_DE-kerstin-low.onnx.json +420 -0
  50. de/de_DE/kerstin/low/samples/speaker_0.mp3 +0 -0
ar/ar_JO/kareem/low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for kareem (low)
2
+
3
+ * Language: ar_JO (Arabic, Jordan)
4
+ * Speakers: 1
5
+ * Quality: low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/AliMokhammad/arabicttstrain/
11
+ * License: See URL
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (low quality).
ar/ar_JO/kareem/low/ar_JO-kareem-low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2887e9d68b125965c747e1371fa21e1cef19555ea98d0795a0d5d71188b13890
3
+ size 63201294
ar/ar_JO/kareem/low/ar_JO-kareem-low.onnx.json ADDED
@@ -0,0 +1,508 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset": "kareem",
3
+ "audio": {
4
+ "sample_rate": 16000,
5
+ "quality": "low"
6
+ },
7
+ "espeak": {
8
+ "voice": "ar"
9
+ },
10
+ "language": {
11
+ "code": "ar_JO",
12
+ "family": "ar",
13
+ "region": "JO",
14
+ "name_native": "العربية",
15
+ "name_english": "Arabic",
16
+ "country_english": "Jordan"
17
+ },
18
+ "inference": {
19
+ "noise_scale": 0.667,
20
+ "length_scale": 1,
21
+ "noise_w": 0.8
22
+ },
23
+ "phoneme_type": "espeak",
24
+ "phoneme_map": {},
25
+ "phoneme_id_map": {
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "\"": [
33
+ 150
34
+ ],
35
+ "#": [
36
+ 149
37
+ ],
38
+ "$": [
39
+ 2
40
+ ],
41
+ "'": [
42
+ 5
43
+ ],
44
+ "(": [
45
+ 6
46
+ ],
47
+ ")": [
48
+ 7
49
+ ],
50
+ ",": [
51
+ 8
52
+ ],
53
+ "-": [
54
+ 9
55
+ ],
56
+ ".": [
57
+ 10
58
+ ],
59
+ "0": [
60
+ 130
61
+ ],
62
+ "1": [
63
+ 131
64
+ ],
65
+ "2": [
66
+ 132
67
+ ],
68
+ "3": [
69
+ 133
70
+ ],
71
+ "4": [
72
+ 134
73
+ ],
74
+ "5": [
75
+ 135
76
+ ],
77
+ "6": [
78
+ 136
79
+ ],
80
+ "7": [
81
+ 137
82
+ ],
83
+ "8": [
84
+ 138
85
+ ],
86
+ "9": [
87
+ 139
88
+ ],
89
+ ":": [
90
+ 11
91
+ ],
92
+ ";": [
93
+ 12
94
+ ],
95
+ "?": [
96
+ 13
97
+ ],
98
+ "X": [
99
+ 156
100
+ ],
101
+ "^": [
102
+ 1
103
+ ],
104
+ "_": [
105
+ 0
106
+ ],
107
+ "a": [
108
+ 14
109
+ ],
110
+ "b": [
111
+ 15
112
+ ],
113
+ "c": [
114
+ 16
115
+ ],
116
+ "d": [
117
+ 17
118
+ ],
119
+ "e": [
120
+ 18
121
+ ],
122
+ "f": [
123
+ 19
124
+ ],
125
+ "g": [
126
+ 154
127
+ ],
128
+ "h": [
129
+ 20
130
+ ],
131
+ "i": [
132
+ 21
133
+ ],
134
+ "j": [
135
+ 22
136
+ ],
137
+ "k": [
138
+ 23
139
+ ],
140
+ "l": [
141
+ 24
142
+ ],
143
+ "m": [
144
+ 25
145
+ ],
146
+ "n": [
147
+ 26
148
+ ],
149
+ "o": [
150
+ 27
151
+ ],
152
+ "p": [
153
+ 28
154
+ ],
155
+ "q": [
156
+ 29
157
+ ],
158
+ "r": [
159
+ 30
160
+ ],
161
+ "s": [
162
+ 31
163
+ ],
164
+ "t": [
165
+ 32
166
+ ],
167
+ "u": [
168
+ 33
169
+ ],
170
+ "v": [
171
+ 34
172
+ ],
173
+ "w": [
174
+ 35
175
+ ],
176
+ "x": [
177
+ 36
178
+ ],
179
+ "y": [
180
+ 37
181
+ ],
182
+ "z": [
183
+ 38
184
+ ],
185
+ "æ": [
186
+ 39
187
+ ],
188
+ "ç": [
189
+ 40
190
+ ],
191
+ "ð": [
192
+ 41
193
+ ],
194
+ "ø": [
195
+ 42
196
+ ],
197
+ "ħ": [
198
+ 43
199
+ ],
200
+ "ŋ": [
201
+ 44
202
+ ],
203
+ "œ": [
204
+ 45
205
+ ],
206
+ "ǀ": [
207
+ 46
208
+ ],
209
+ "ǁ": [
210
+ 47
211
+ ],
212
+ "ǂ": [
213
+ 48
214
+ ],
215
+ "ǃ": [
216
+ 49
217
+ ],
218
+ "ɐ": [
219
+ 50
220
+ ],
221
+ "ɑ": [
222
+ 51
223
+ ],
224
+ "ɒ": [
225
+ 52
226
+ ],
227
+ "ɓ": [
228
+ 53
229
+ ],
230
+ "ɔ": [
231
+ 54
232
+ ],
233
+ "ɕ": [
234
+ 55
235
+ ],
236
+ "ɖ": [
237
+ 56
238
+ ],
239
+ "ɗ": [
240
+ 57
241
+ ],
242
+ "ɘ": [
243
+ 58
244
+ ],
245
+ "ə": [
246
+ 59
247
+ ],
248
+ "ɚ": [
249
+ 60
250
+ ],
251
+ "ɛ": [
252
+ 61
253
+ ],
254
+ "ɜ": [
255
+ 62
256
+ ],
257
+ "ɞ": [
258
+ 63
259
+ ],
260
+ "ɟ": [
261
+ 64
262
+ ],
263
+ "ɠ": [
264
+ 65
265
+ ],
266
+ "ɡ": [
267
+ 66
268
+ ],
269
+ "ɢ": [
270
+ 67
271
+ ],
272
+ "ɣ": [
273
+ 68
274
+ ],
275
+ "ɤ": [
276
+ 69
277
+ ],
278
+ "ɥ": [
279
+ 70
280
+ ],
281
+ "ɦ": [
282
+ 71
283
+ ],
284
+ "ɧ": [
285
+ 72
286
+ ],
287
+ "ɨ": [
288
+ 73
289
+ ],
290
+ "ɪ": [
291
+ 74
292
+ ],
293
+ "ɫ": [
294
+ 75
295
+ ],
296
+ "ɬ": [
297
+ 76
298
+ ],
299
+ "ɭ": [
300
+ 77
301
+ ],
302
+ "ɮ": [
303
+ 78
304
+ ],
305
+ "ɯ": [
306
+ 79
307
+ ],
308
+ "ɰ": [
309
+ 80
310
+ ],
311
+ "ɱ": [
312
+ 81
313
+ ],
314
+ "ɲ": [
315
+ 82
316
+ ],
317
+ "ɳ": [
318
+ 83
319
+ ],
320
+ "ɴ": [
321
+ 84
322
+ ],
323
+ "ɵ": [
324
+ 85
325
+ ],
326
+ "ɶ": [
327
+ 86
328
+ ],
329
+ "ɸ": [
330
+ 87
331
+ ],
332
+ "ɹ": [
333
+ 88
334
+ ],
335
+ "ɺ": [
336
+ 89
337
+ ],
338
+ "ɻ": [
339
+ 90
340
+ ],
341
+ "ɽ": [
342
+ 91
343
+ ],
344
+ "ɾ": [
345
+ 92
346
+ ],
347
+ "ʀ": [
348
+ 93
349
+ ],
350
+ "ʁ": [
351
+ 94
352
+ ],
353
+ "ʂ": [
354
+ 95
355
+ ],
356
+ "ʃ": [
357
+ 96
358
+ ],
359
+ "ʄ": [
360
+ 97
361
+ ],
362
+ "ʈ": [
363
+ 98
364
+ ],
365
+ "ʉ": [
366
+ 99
367
+ ],
368
+ "ʊ": [
369
+ 100
370
+ ],
371
+ "ʋ": [
372
+ 101
373
+ ],
374
+ "ʌ": [
375
+ 102
376
+ ],
377
+ "ʍ": [
378
+ 103
379
+ ],
380
+ "ʎ": [
381
+ 104
382
+ ],
383
+ "ʏ": [
384
+ 105
385
+ ],
386
+ "ʐ": [
387
+ 106
388
+ ],
389
+ "ʑ": [
390
+ 107
391
+ ],
392
+ "ʒ": [
393
+ 108
394
+ ],
395
+ "ʔ": [
396
+ 109
397
+ ],
398
+ "ʕ": [
399
+ 110
400
+ ],
401
+ "ʘ": [
402
+ 111
403
+ ],
404
+ "ʙ": [
405
+ 112
406
+ ],
407
+ "ʛ": [
408
+ 113
409
+ ],
410
+ "ʜ": [
411
+ 114
412
+ ],
413
+ "ʝ": [
414
+ 115
415
+ ],
416
+ "ʟ": [
417
+ 116
418
+ ],
419
+ "ʡ": [
420
+ 117
421
+ ],
422
+ "ʢ": [
423
+ 118
424
+ ],
425
+ "ʦ": [
426
+ 155
427
+ ],
428
+ "ʰ": [
429
+ 145
430
+ ],
431
+ "ʲ": [
432
+ 119
433
+ ],
434
+ "ˈ": [
435
+ 120
436
+ ],
437
+ "ˌ": [
438
+ 121
439
+ ],
440
+ "ː": [
441
+ 122
442
+ ],
443
+ "ˑ": [
444
+ 123
445
+ ],
446
+ "˞": [
447
+ 124
448
+ ],
449
+ "ˤ": [
450
+ 146
451
+ ],
452
+ "̃": [
453
+ 141
454
+ ],
455
+ "̊": [
456
+ 158
457
+ ],
458
+ "̝": [
459
+ 157
460
+ ],
461
+ "̧": [
462
+ 140
463
+ ],
464
+ "̩": [
465
+ 144
466
+ ],
467
+ "̪": [
468
+ 142
469
+ ],
470
+ "̯": [
471
+ 143
472
+ ],
473
+ "̺": [
474
+ 152
475
+ ],
476
+ "̻": [
477
+ 153
478
+ ],
479
+ "β": [
480
+ 125
481
+ ],
482
+ "ε": [
483
+ 147
484
+ ],
485
+ "θ": [
486
+ 126
487
+ ],
488
+ "χ": [
489
+ 127
490
+ ],
491
+ "ᵻ": [
492
+ 128
493
+ ],
494
+ "↑": [
495
+ 151
496
+ ],
497
+ "↓": [
498
+ 148
499
+ ],
500
+ "ⱱ": [
501
+ 129
502
+ ]
503
+ },
504
+ "num_symbols": 256,
505
+ "num_speakers": 1,
506
+ "speaker_id_map": {},
507
+ "piper_version": "1.0.0"
508
+ }
ar/ar_JO/kareem/low/samples/speaker_0.mp3 ADDED
Binary file (107 kB). View file
 
ar/ar_JO/kareem/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for kareem (medium)
2
+
3
+ * Language: ar_JO (Arabic, Jordan)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/AliMokhammad/arabicttstrain/
11
+ * License: See URL
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
ar/ar_JO/kareem/medium/ar_JO-kareem-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e95cab07b679da603bba17c4dec7ab3111320571964ee95c0379603c086491e
3
+ size 63201294
ar/ar_JO/kareem/medium/ar_JO-kareem-medium.onnx.json ADDED
@@ -0,0 +1,508 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset": "kareem",
3
+ "audio": {
4
+ "sample_rate": 22050,
5
+ "quality": "medium"
6
+ },
7
+ "espeak": {
8
+ "voice": "ar"
9
+ },
10
+ "language": {
11
+ "code": "ar_JO",
12
+ "family": "ar",
13
+ "region": "JO",
14
+ "name_native": "العربية",
15
+ "name_english": "Arabic",
16
+ "country_english": "Jordan"
17
+ },
18
+ "inference": {
19
+ "noise_scale": 0.667,
20
+ "length_scale": 1,
21
+ "noise_w": 0.8
22
+ },
23
+ "phoneme_type": "espeak",
24
+ "phoneme_map": {},
25
+ "phoneme_id_map": {
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "\"": [
33
+ 150
34
+ ],
35
+ "#": [
36
+ 149
37
+ ],
38
+ "$": [
39
+ 2
40
+ ],
41
+ "'": [
42
+ 5
43
+ ],
44
+ "(": [
45
+ 6
46
+ ],
47
+ ")": [
48
+ 7
49
+ ],
50
+ ",": [
51
+ 8
52
+ ],
53
+ "-": [
54
+ 9
55
+ ],
56
+ ".": [
57
+ 10
58
+ ],
59
+ "0": [
60
+ 130
61
+ ],
62
+ "1": [
63
+ 131
64
+ ],
65
+ "2": [
66
+ 132
67
+ ],
68
+ "3": [
69
+ 133
70
+ ],
71
+ "4": [
72
+ 134
73
+ ],
74
+ "5": [
75
+ 135
76
+ ],
77
+ "6": [
78
+ 136
79
+ ],
80
+ "7": [
81
+ 137
82
+ ],
83
+ "8": [
84
+ 138
85
+ ],
86
+ "9": [
87
+ 139
88
+ ],
89
+ ":": [
90
+ 11
91
+ ],
92
+ ";": [
93
+ 12
94
+ ],
95
+ "?": [
96
+ 13
97
+ ],
98
+ "X": [
99
+ 156
100
+ ],
101
+ "^": [
102
+ 1
103
+ ],
104
+ "_": [
105
+ 0
106
+ ],
107
+ "a": [
108
+ 14
109
+ ],
110
+ "b": [
111
+ 15
112
+ ],
113
+ "c": [
114
+ 16
115
+ ],
116
+ "d": [
117
+ 17
118
+ ],
119
+ "e": [
120
+ 18
121
+ ],
122
+ "f": [
123
+ 19
124
+ ],
125
+ "g": [
126
+ 154
127
+ ],
128
+ "h": [
129
+ 20
130
+ ],
131
+ "i": [
132
+ 21
133
+ ],
134
+ "j": [
135
+ 22
136
+ ],
137
+ "k": [
138
+ 23
139
+ ],
140
+ "l": [
141
+ 24
142
+ ],
143
+ "m": [
144
+ 25
145
+ ],
146
+ "n": [
147
+ 26
148
+ ],
149
+ "o": [
150
+ 27
151
+ ],
152
+ "p": [
153
+ 28
154
+ ],
155
+ "q": [
156
+ 29
157
+ ],
158
+ "r": [
159
+ 30
160
+ ],
161
+ "s": [
162
+ 31
163
+ ],
164
+ "t": [
165
+ 32
166
+ ],
167
+ "u": [
168
+ 33
169
+ ],
170
+ "v": [
171
+ 34
172
+ ],
173
+ "w": [
174
+ 35
175
+ ],
176
+ "x": [
177
+ 36
178
+ ],
179
+ "y": [
180
+ 37
181
+ ],
182
+ "z": [
183
+ 38
184
+ ],
185
+ "æ": [
186
+ 39
187
+ ],
188
+ "ç": [
189
+ 40
190
+ ],
191
+ "ð": [
192
+ 41
193
+ ],
194
+ "ø": [
195
+ 42
196
+ ],
197
+ "ħ": [
198
+ 43
199
+ ],
200
+ "ŋ": [
201
+ 44
202
+ ],
203
+ "œ": [
204
+ 45
205
+ ],
206
+ "ǀ": [
207
+ 46
208
+ ],
209
+ "ǁ": [
210
+ 47
211
+ ],
212
+ "ǂ": [
213
+ 48
214
+ ],
215
+ "ǃ": [
216
+ 49
217
+ ],
218
+ "ɐ": [
219
+ 50
220
+ ],
221
+ "ɑ": [
222
+ 51
223
+ ],
224
+ "ɒ": [
225
+ 52
226
+ ],
227
+ "ɓ": [
228
+ 53
229
+ ],
230
+ "ɔ": [
231
+ 54
232
+ ],
233
+ "ɕ": [
234
+ 55
235
+ ],
236
+ "ɖ": [
237
+ 56
238
+ ],
239
+ "ɗ": [
240
+ 57
241
+ ],
242
+ "ɘ": [
243
+ 58
244
+ ],
245
+ "ə": [
246
+ 59
247
+ ],
248
+ "ɚ": [
249
+ 60
250
+ ],
251
+ "ɛ": [
252
+ 61
253
+ ],
254
+ "ɜ": [
255
+ 62
256
+ ],
257
+ "ɞ": [
258
+ 63
259
+ ],
260
+ "ɟ": [
261
+ 64
262
+ ],
263
+ "ɠ": [
264
+ 65
265
+ ],
266
+ "ɡ": [
267
+ 66
268
+ ],
269
+ "ɢ": [
270
+ 67
271
+ ],
272
+ "ɣ": [
273
+ 68
274
+ ],
275
+ "ɤ": [
276
+ 69
277
+ ],
278
+ "ɥ": [
279
+ 70
280
+ ],
281
+ "ɦ": [
282
+ 71
283
+ ],
284
+ "ɧ": [
285
+ 72
286
+ ],
287
+ "ɨ": [
288
+ 73
289
+ ],
290
+ "ɪ": [
291
+ 74
292
+ ],
293
+ "ɫ": [
294
+ 75
295
+ ],
296
+ "ɬ": [
297
+ 76
298
+ ],
299
+ "ɭ": [
300
+ 77
301
+ ],
302
+ "ɮ": [
303
+ 78
304
+ ],
305
+ "ɯ": [
306
+ 79
307
+ ],
308
+ "ɰ": [
309
+ 80
310
+ ],
311
+ "ɱ": [
312
+ 81
313
+ ],
314
+ "ɲ": [
315
+ 82
316
+ ],
317
+ "ɳ": [
318
+ 83
319
+ ],
320
+ "ɴ": [
321
+ 84
322
+ ],
323
+ "ɵ": [
324
+ 85
325
+ ],
326
+ "ɶ": [
327
+ 86
328
+ ],
329
+ "ɸ": [
330
+ 87
331
+ ],
332
+ "ɹ": [
333
+ 88
334
+ ],
335
+ "ɺ": [
336
+ 89
337
+ ],
338
+ "ɻ": [
339
+ 90
340
+ ],
341
+ "ɽ": [
342
+ 91
343
+ ],
344
+ "ɾ": [
345
+ 92
346
+ ],
347
+ "ʀ": [
348
+ 93
349
+ ],
350
+ "ʁ": [
351
+ 94
352
+ ],
353
+ "ʂ": [
354
+ 95
355
+ ],
356
+ "ʃ": [
357
+ 96
358
+ ],
359
+ "ʄ": [
360
+ 97
361
+ ],
362
+ "ʈ": [
363
+ 98
364
+ ],
365
+ "ʉ": [
366
+ 99
367
+ ],
368
+ "ʊ": [
369
+ 100
370
+ ],
371
+ "ʋ": [
372
+ 101
373
+ ],
374
+ "ʌ": [
375
+ 102
376
+ ],
377
+ "ʍ": [
378
+ 103
379
+ ],
380
+ "ʎ": [
381
+ 104
382
+ ],
383
+ "ʏ": [
384
+ 105
385
+ ],
386
+ "ʐ": [
387
+ 106
388
+ ],
389
+ "ʑ": [
390
+ 107
391
+ ],
392
+ "ʒ": [
393
+ 108
394
+ ],
395
+ "ʔ": [
396
+ 109
397
+ ],
398
+ "ʕ": [
399
+ 110
400
+ ],
401
+ "ʘ": [
402
+ 111
403
+ ],
404
+ "ʙ": [
405
+ 112
406
+ ],
407
+ "ʛ": [
408
+ 113
409
+ ],
410
+ "ʜ": [
411
+ 114
412
+ ],
413
+ "ʝ": [
414
+ 115
415
+ ],
416
+ "ʟ": [
417
+ 116
418
+ ],
419
+ "ʡ": [
420
+ 117
421
+ ],
422
+ "ʢ": [
423
+ 118
424
+ ],
425
+ "ʦ": [
426
+ 155
427
+ ],
428
+ "ʰ": [
429
+ 145
430
+ ],
431
+ "ʲ": [
432
+ 119
433
+ ],
434
+ "ˈ": [
435
+ 120
436
+ ],
437
+ "ˌ": [
438
+ 121
439
+ ],
440
+ "ː": [
441
+ 122
442
+ ],
443
+ "ˑ": [
444
+ 123
445
+ ],
446
+ "˞": [
447
+ 124
448
+ ],
449
+ "ˤ": [
450
+ 146
451
+ ],
452
+ "̃": [
453
+ 141
454
+ ],
455
+ "̊": [
456
+ 158
457
+ ],
458
+ "̝": [
459
+ 157
460
+ ],
461
+ "̧": [
462
+ 140
463
+ ],
464
+ "̩": [
465
+ 144
466
+ ],
467
+ "̪": [
468
+ 142
469
+ ],
470
+ "̯": [
471
+ 143
472
+ ],
473
+ "̺": [
474
+ 152
475
+ ],
476
+ "̻": [
477
+ 153
478
+ ],
479
+ "β": [
480
+ 125
481
+ ],
482
+ "ε": [
483
+ 147
484
+ ],
485
+ "θ": [
486
+ 126
487
+ ],
488
+ "χ": [
489
+ 127
490
+ ],
491
+ "ᵻ": [
492
+ 128
493
+ ],
494
+ "↑": [
495
+ 151
496
+ ],
497
+ "↓": [
498
+ 148
499
+ ],
500
+ "ⱱ": [
501
+ 129
502
+ ]
503
+ },
504
+ "num_symbols": 256,
505
+ "num_speakers": 1,
506
+ "speaker_id_map": {},
507
+ "piper_version": "1.0.0"
508
+ }
ar/ar_JO/kareem/medium/samples/speaker_0.mp3 ADDED
Binary file (147 kB). View file
 
ca/ca_ES/upc_ona/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for upc_ona (medium)
2
+
3
+ * Language: ca_ES (Catalan, Spain)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://collectivat.cat/asr#upc-festcat-tts-corpora
11
+ * License: CC BY-SA 3.0 ES
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
ca/ca_ES/upc_ona/medium/ca_ES-upc_ona-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdb652db8c11a4475527346cf3241cb064d1ba393cf370f3f2ec09a872d118fd
3
+ size 63201294
ca/ca_ES/upc_ona/medium/ca_ES-upc_ona-medium.onnx.json ADDED
@@ -0,0 +1,493 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "ca"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ "_": [
18
+ 0
19
+ ],
20
+ "^": [
21
+ 1
22
+ ],
23
+ "$": [
24
+ 2
25
+ ],
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ ":": [
51
+ 11
52
+ ],
53
+ ";": [
54
+ 12
55
+ ],
56
+ "?": [
57
+ 13
58
+ ],
59
+ "a": [
60
+ 14
61
+ ],
62
+ "b": [
63
+ 15
64
+ ],
65
+ "c": [
66
+ 16
67
+ ],
68
+ "d": [
69
+ 17
70
+ ],
71
+ "e": [
72
+ 18
73
+ ],
74
+ "f": [
75
+ 19
76
+ ],
77
+ "h": [
78
+ 20
79
+ ],
80
+ "i": [
81
+ 21
82
+ ],
83
+ "j": [
84
+ 22
85
+ ],
86
+ "k": [
87
+ 23
88
+ ],
89
+ "l": [
90
+ 24
91
+ ],
92
+ "m": [
93
+ 25
94
+ ],
95
+ "n": [
96
+ 26
97
+ ],
98
+ "o": [
99
+ 27
100
+ ],
101
+ "p": [
102
+ 28
103
+ ],
104
+ "q": [
105
+ 29
106
+ ],
107
+ "r": [
108
+ 30
109
+ ],
110
+ "s": [
111
+ 31
112
+ ],
113
+ "t": [
114
+ 32
115
+ ],
116
+ "u": [
117
+ 33
118
+ ],
119
+ "v": [
120
+ 34
121
+ ],
122
+ "w": [
123
+ 35
124
+ ],
125
+ "x": [
126
+ 36
127
+ ],
128
+ "y": [
129
+ 37
130
+ ],
131
+ "z": [
132
+ 38
133
+ ],
134
+ "æ": [
135
+ 39
136
+ ],
137
+ "ç": [
138
+ 40
139
+ ],
140
+ "ð": [
141
+ 41
142
+ ],
143
+ "ø": [
144
+ 42
145
+ ],
146
+ "ħ": [
147
+ 43
148
+ ],
149
+ "ŋ": [
150
+ 44
151
+ ],
152
+ "œ": [
153
+ 45
154
+ ],
155
+ "ǀ": [
156
+ 46
157
+ ],
158
+ "ǁ": [
159
+ 47
160
+ ],
161
+ "ǂ": [
162
+ 48
163
+ ],
164
+ "ǃ": [
165
+ 49
166
+ ],
167
+ "ɐ": [
168
+ 50
169
+ ],
170
+ "ɑ": [
171
+ 51
172
+ ],
173
+ "ɒ": [
174
+ 52
175
+ ],
176
+ "ɓ": [
177
+ 53
178
+ ],
179
+ "ɔ": [
180
+ 54
181
+ ],
182
+ "ɕ": [
183
+ 55
184
+ ],
185
+ "ɖ": [
186
+ 56
187
+ ],
188
+ "ɗ": [
189
+ 57
190
+ ],
191
+ "ɘ": [
192
+ 58
193
+ ],
194
+ "ə": [
195
+ 59
196
+ ],
197
+ "ɚ": [
198
+ 60
199
+ ],
200
+ "ɛ": [
201
+ 61
202
+ ],
203
+ "ɜ": [
204
+ 62
205
+ ],
206
+ "ɞ": [
207
+ 63
208
+ ],
209
+ "ɟ": [
210
+ 64
211
+ ],
212
+ "ɠ": [
213
+ 65
214
+ ],
215
+ "ɡ": [
216
+ 66
217
+ ],
218
+ "ɢ": [
219
+ 67
220
+ ],
221
+ "ɣ": [
222
+ 68
223
+ ],
224
+ "ɤ": [
225
+ 69
226
+ ],
227
+ "ɥ": [
228
+ 70
229
+ ],
230
+ "ɦ": [
231
+ 71
232
+ ],
233
+ "ɧ": [
234
+ 72
235
+ ],
236
+ "ɨ": [
237
+ 73
238
+ ],
239
+ "ɪ": [
240
+ 74
241
+ ],
242
+ "ɫ": [
243
+ 75
244
+ ],
245
+ "ɬ": [
246
+ 76
247
+ ],
248
+ "ɭ": [
249
+ 77
250
+ ],
251
+ "ɮ": [
252
+ 78
253
+ ],
254
+ "ɯ": [
255
+ 79
256
+ ],
257
+ "ɰ": [
258
+ 80
259
+ ],
260
+ "ɱ": [
261
+ 81
262
+ ],
263
+ "ɲ": [
264
+ 82
265
+ ],
266
+ "ɳ": [
267
+ 83
268
+ ],
269
+ "ɴ": [
270
+ 84
271
+ ],
272
+ "ɵ": [
273
+ 85
274
+ ],
275
+ "ɶ": [
276
+ 86
277
+ ],
278
+ "ɸ": [
279
+ 87
280
+ ],
281
+ "ɹ": [
282
+ 88
283
+ ],
284
+ "ɺ": [
285
+ 89
286
+ ],
287
+ "ɻ": [
288
+ 90
289
+ ],
290
+ "ɽ": [
291
+ 91
292
+ ],
293
+ "ɾ": [
294
+ 92
295
+ ],
296
+ "ʀ": [
297
+ 93
298
+ ],
299
+ "ʁ": [
300
+ 94
301
+ ],
302
+ "ʂ": [
303
+ 95
304
+ ],
305
+ "ʃ": [
306
+ 96
307
+ ],
308
+ "ʄ": [
309
+ 97
310
+ ],
311
+ "ʈ": [
312
+ 98
313
+ ],
314
+ "ʉ": [
315
+ 99
316
+ ],
317
+ "ʊ": [
318
+ 100
319
+ ],
320
+ "ʋ": [
321
+ 101
322
+ ],
323
+ "ʌ": [
324
+ 102
325
+ ],
326
+ "ʍ": [
327
+ 103
328
+ ],
329
+ "ʎ": [
330
+ 104
331
+ ],
332
+ "ʏ": [
333
+ 105
334
+ ],
335
+ "ʐ": [
336
+ 106
337
+ ],
338
+ "ʑ": [
339
+ 107
340
+ ],
341
+ "ʒ": [
342
+ 108
343
+ ],
344
+ "ʔ": [
345
+ 109
346
+ ],
347
+ "ʕ": [
348
+ 110
349
+ ],
350
+ "ʘ": [
351
+ 111
352
+ ],
353
+ "ʙ": [
354
+ 112
355
+ ],
356
+ "ʛ": [
357
+ 113
358
+ ],
359
+ "ʜ": [
360
+ 114
361
+ ],
362
+ "ʝ": [
363
+ 115
364
+ ],
365
+ "ʟ": [
366
+ 116
367
+ ],
368
+ "ʡ": [
369
+ 117
370
+ ],
371
+ "ʢ": [
372
+ 118
373
+ ],
374
+ "ʲ": [
375
+ 119
376
+ ],
377
+ "ˈ": [
378
+ 120
379
+ ],
380
+ "ˌ": [
381
+ 121
382
+ ],
383
+ "ː": [
384
+ 122
385
+ ],
386
+ "ˑ": [
387
+ 123
388
+ ],
389
+ "˞": [
390
+ 124
391
+ ],
392
+ "β": [
393
+ 125
394
+ ],
395
+ "θ": [
396
+ 126
397
+ ],
398
+ "χ": [
399
+ 127
400
+ ],
401
+ "ᵻ": [
402
+ 128
403
+ ],
404
+ "ⱱ": [
405
+ 129
406
+ ],
407
+ "0": [
408
+ 130
409
+ ],
410
+ "1": [
411
+ 131
412
+ ],
413
+ "2": [
414
+ 132
415
+ ],
416
+ "3": [
417
+ 133
418
+ ],
419
+ "4": [
420
+ 134
421
+ ],
422
+ "5": [
423
+ 135
424
+ ],
425
+ "6": [
426
+ 136
427
+ ],
428
+ "7": [
429
+ 137
430
+ ],
431
+ "8": [
432
+ 138
433
+ ],
434
+ "9": [
435
+ 139
436
+ ],
437
+ "̧": [
438
+ 140
439
+ ],
440
+ "̃": [
441
+ 141
442
+ ],
443
+ "̪": [
444
+ 142
445
+ ],
446
+ "̯": [
447
+ 143
448
+ ],
449
+ "̩": [
450
+ 144
451
+ ],
452
+ "ʰ": [
453
+ 145
454
+ ],
455
+ "ˤ": [
456
+ 146
457
+ ],
458
+ "ε": [
459
+ 147
460
+ ],
461
+ "↓": [
462
+ 148
463
+ ],
464
+ "#": [
465
+ 149
466
+ ],
467
+ "\"": [
468
+ 150
469
+ ],
470
+ "↑": [
471
+ 151
472
+ ],
473
+ "̺": [
474
+ 152
475
+ ],
476
+ "̻": [
477
+ 153
478
+ ]
479
+ },
480
+ "num_symbols": 256,
481
+ "num_speakers": 1,
482
+ "speaker_id_map": {},
483
+ "piper_version": "1.0.0",
484
+ "language": {
485
+ "code": "ca_ES",
486
+ "family": "ca",
487
+ "region": "ES",
488
+ "name_native": "Català",
489
+ "name_english": "Catalan",
490
+ "country_english": "Spain"
491
+ },
492
+ "dataset": "upc_ona"
493
+ }
ca/ca_ES/upc_ona/medium/samples/speaker_0.mp3 ADDED
Binary file (173 kB). View file
 
ca/ca_ES/upc_ona/x_low/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ ca-upc_ona-x-low
ca/ca_ES/upc_ona/x_low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for upc_ona (x_low)
2
+
3
+ * Language: ca_ES (Catalan, Spain)
4
+ * Speakers: 1
5
+ * Quality: x_low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://collectivat.cat/asr#upc-festcat-tts-corpora
11
+ * License: CC BY-SA 3.0 ES
12
+
13
+ ## Training
14
+
15
+ Trained from scratch.
ca/ca_ES/upc_ona/x_low/ca_ES-upc_ona-x_low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13661d26423e0c791823823a5971f4e1aaf644a62e65e0e94d299c0e70560e14
3
+ size 20628813
ca/ca_ES/upc_ona/x_low/ca_ES-upc_ona-x_low.onnx.json ADDED
@@ -0,0 +1,420 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 16000,
4
+ "quality": "x_low"
5
+ },
6
+ "espeak": {
7
+ "voice": "ca"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_map": {},
15
+ "phoneme_id_map": {
16
+ "_": [
17
+ 0
18
+ ],
19
+ "^": [
20
+ 1
21
+ ],
22
+ "$": [
23
+ 2
24
+ ],
25
+ " ": [
26
+ 3
27
+ ],
28
+ "!": [
29
+ 4
30
+ ],
31
+ "'": [
32
+ 5
33
+ ],
34
+ "(": [
35
+ 6
36
+ ],
37
+ ")": [
38
+ 7
39
+ ],
40
+ ",": [
41
+ 8
42
+ ],
43
+ "-": [
44
+ 9
45
+ ],
46
+ ".": [
47
+ 10
48
+ ],
49
+ ":": [
50
+ 11
51
+ ],
52
+ ";": [
53
+ 12
54
+ ],
55
+ "?": [
56
+ 13
57
+ ],
58
+ "a": [
59
+ 14
60
+ ],
61
+ "b": [
62
+ 15
63
+ ],
64
+ "c": [
65
+ 16
66
+ ],
67
+ "d": [
68
+ 17
69
+ ],
70
+ "e": [
71
+ 18
72
+ ],
73
+ "f": [
74
+ 19
75
+ ],
76
+ "h": [
77
+ 20
78
+ ],
79
+ "i": [
80
+ 21
81
+ ],
82
+ "j": [
83
+ 22
84
+ ],
85
+ "k": [
86
+ 23
87
+ ],
88
+ "l": [
89
+ 24
90
+ ],
91
+ "m": [
92
+ 25
93
+ ],
94
+ "n": [
95
+ 26
96
+ ],
97
+ "o": [
98
+ 27
99
+ ],
100
+ "p": [
101
+ 28
102
+ ],
103
+ "q": [
104
+ 29
105
+ ],
106
+ "r": [
107
+ 30
108
+ ],
109
+ "s": [
110
+ 31
111
+ ],
112
+ "t": [
113
+ 32
114
+ ],
115
+ "u": [
116
+ 33
117
+ ],
118
+ "v": [
119
+ 34
120
+ ],
121
+ "w": [
122
+ 35
123
+ ],
124
+ "x": [
125
+ 36
126
+ ],
127
+ "y": [
128
+ 37
129
+ ],
130
+ "z": [
131
+ 38
132
+ ],
133
+ "æ": [
134
+ 39
135
+ ],
136
+ "ç": [
137
+ 40
138
+ ],
139
+ "ð": [
140
+ 41
141
+ ],
142
+ "ø": [
143
+ 42
144
+ ],
145
+ "ħ": [
146
+ 43
147
+ ],
148
+ "ŋ": [
149
+ 44
150
+ ],
151
+ "œ": [
152
+ 45
153
+ ],
154
+ "ǀ": [
155
+ 46
156
+ ],
157
+ "ǁ": [
158
+ 47
159
+ ],
160
+ "ǂ": [
161
+ 48
162
+ ],
163
+ "ǃ": [
164
+ 49
165
+ ],
166
+ "ɐ": [
167
+ 50
168
+ ],
169
+ "ɑ": [
170
+ 51
171
+ ],
172
+ "ɒ": [
173
+ 52
174
+ ],
175
+ "ɓ": [
176
+ 53
177
+ ],
178
+ "ɔ": [
179
+ 54
180
+ ],
181
+ "ɕ": [
182
+ 55
183
+ ],
184
+ "ɖ": [
185
+ 56
186
+ ],
187
+ "ɗ": [
188
+ 57
189
+ ],
190
+ "ɘ": [
191
+ 58
192
+ ],
193
+ "ə": [
194
+ 59
195
+ ],
196
+ "ɚ": [
197
+ 60
198
+ ],
199
+ "ɛ": [
200
+ 61
201
+ ],
202
+ "ɜ": [
203
+ 62
204
+ ],
205
+ "ɞ": [
206
+ 63
207
+ ],
208
+ "ɟ": [
209
+ 64
210
+ ],
211
+ "ɠ": [
212
+ 65
213
+ ],
214
+ "ɡ": [
215
+ 66
216
+ ],
217
+ "ɢ": [
218
+ 67
219
+ ],
220
+ "ɣ": [
221
+ 68
222
+ ],
223
+ "ɤ": [
224
+ 69
225
+ ],
226
+ "ɥ": [
227
+ 70
228
+ ],
229
+ "ɦ": [
230
+ 71
231
+ ],
232
+ "ɧ": [
233
+ 72
234
+ ],
235
+ "ɨ": [
236
+ 73
237
+ ],
238
+ "ɪ": [
239
+ 74
240
+ ],
241
+ "ɫ": [
242
+ 75
243
+ ],
244
+ "ɬ": [
245
+ 76
246
+ ],
247
+ "ɭ": [
248
+ 77
249
+ ],
250
+ "ɮ": [
251
+ 78
252
+ ],
253
+ "ɯ": [
254
+ 79
255
+ ],
256
+ "ɰ": [
257
+ 80
258
+ ],
259
+ "ɱ": [
260
+ 81
261
+ ],
262
+ "ɲ": [
263
+ 82
264
+ ],
265
+ "ɳ": [
266
+ 83
267
+ ],
268
+ "ɴ": [
269
+ 84
270
+ ],
271
+ "ɵ": [
272
+ 85
273
+ ],
274
+ "ɶ": [
275
+ 86
276
+ ],
277
+ "ɸ": [
278
+ 87
279
+ ],
280
+ "ɹ": [
281
+ 88
282
+ ],
283
+ "ɺ": [
284
+ 89
285
+ ],
286
+ "ɻ": [
287
+ 90
288
+ ],
289
+ "ɽ": [
290
+ 91
291
+ ],
292
+ "ɾ": [
293
+ 92
294
+ ],
295
+ "ʀ": [
296
+ 93
297
+ ],
298
+ "ʁ": [
299
+ 94
300
+ ],
301
+ "ʂ": [
302
+ 95
303
+ ],
304
+ "ʃ": [
305
+ 96
306
+ ],
307
+ "ʄ": [
308
+ 97
309
+ ],
310
+ "ʈ": [
311
+ 98
312
+ ],
313
+ "ʉ": [
314
+ 99
315
+ ],
316
+ "ʊ": [
317
+ 100
318
+ ],
319
+ "ʋ": [
320
+ 101
321
+ ],
322
+ "ʌ": [
323
+ 102
324
+ ],
325
+ "ʍ": [
326
+ 103
327
+ ],
328
+ "ʎ": [
329
+ 104
330
+ ],
331
+ "ʏ": [
332
+ 105
333
+ ],
334
+ "ʐ": [
335
+ 106
336
+ ],
337
+ "ʑ": [
338
+ 107
339
+ ],
340
+ "ʒ": [
341
+ 108
342
+ ],
343
+ "ʔ": [
344
+ 109
345
+ ],
346
+ "ʕ": [
347
+ 110
348
+ ],
349
+ "ʘ": [
350
+ 111
351
+ ],
352
+ "ʙ": [
353
+ 112
354
+ ],
355
+ "ʛ": [
356
+ 113
357
+ ],
358
+ "ʜ": [
359
+ 114
360
+ ],
361
+ "ʝ": [
362
+ 115
363
+ ],
364
+ "ʟ": [
365
+ 116
366
+ ],
367
+ "ʡ": [
368
+ 117
369
+ ],
370
+ "ʢ": [
371
+ 118
372
+ ],
373
+ "ʲ": [
374
+ 119
375
+ ],
376
+ "ˈ": [
377
+ 120
378
+ ],
379
+ "ˌ": [
380
+ 121
381
+ ],
382
+ "ː": [
383
+ 122
384
+ ],
385
+ "ˑ": [
386
+ 123
387
+ ],
388
+ "˞": [
389
+ 124
390
+ ],
391
+ "β": [
392
+ 125
393
+ ],
394
+ "θ": [
395
+ 126
396
+ ],
397
+ "χ": [
398
+ 127
399
+ ],
400
+ "ᵻ": [
401
+ 128
402
+ ],
403
+ "ⱱ": [
404
+ 129
405
+ ]
406
+ },
407
+ "num_symbols": 130,
408
+ "num_speakers": 1,
409
+ "speaker_id_map": {},
410
+ "piper_version": "0.2.0",
411
+ "language": {
412
+ "code": "ca_ES",
413
+ "family": "ca",
414
+ "region": "ES",
415
+ "name_native": "Català",
416
+ "name_english": "Catalan",
417
+ "country_english": "Spain"
418
+ },
419
+ "dataset": "upc_ona"
420
+ }
ca/ca_ES/upc_ona/x_low/samples/speaker_0.mp3 ADDED
Binary file (139 kB). View file
 
ca/ca_ES/upc_pau/x_low/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ ca-upc_pau-x-low
ca/ca_ES/upc_pau/x_low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for upc_pau (x_low)
2
+
3
+ * Language: ca_ES (Catalan, Spain)
4
+ * Speakers: 1
5
+ * Quality: x_low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://collectivat.cat/asr#upc-festcat-tts-corpora
11
+ * License: CC BY-SA 3.0 ES
12
+
13
+ ## Training
14
+
15
+ Trained from scratch.
ca/ca_ES/upc_pau/x_low/ca_ES-upc_pau-x_low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c936a1a78b0a795af3c2422a0f2edb26303c389ff961616902ba12e26b489071
3
+ size 28130791
ca/ca_ES/upc_pau/x_low/ca_ES-upc_pau-x_low.onnx.json ADDED
@@ -0,0 +1,420 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 16000,
4
+ "quality": "x_low"
5
+ },
6
+ "espeak": {
7
+ "voice": "ca"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_map": {},
15
+ "phoneme_id_map": {
16
+ "_": [
17
+ 0
18
+ ],
19
+ "^": [
20
+ 1
21
+ ],
22
+ "$": [
23
+ 2
24
+ ],
25
+ " ": [
26
+ 3
27
+ ],
28
+ "!": [
29
+ 4
30
+ ],
31
+ "'": [
32
+ 5
33
+ ],
34
+ "(": [
35
+ 6
36
+ ],
37
+ ")": [
38
+ 7
39
+ ],
40
+ ",": [
41
+ 8
42
+ ],
43
+ "-": [
44
+ 9
45
+ ],
46
+ ".": [
47
+ 10
48
+ ],
49
+ ":": [
50
+ 11
51
+ ],
52
+ ";": [
53
+ 12
54
+ ],
55
+ "?": [
56
+ 13
57
+ ],
58
+ "a": [
59
+ 14
60
+ ],
61
+ "b": [
62
+ 15
63
+ ],
64
+ "c": [
65
+ 16
66
+ ],
67
+ "d": [
68
+ 17
69
+ ],
70
+ "e": [
71
+ 18
72
+ ],
73
+ "f": [
74
+ 19
75
+ ],
76
+ "h": [
77
+ 20
78
+ ],
79
+ "i": [
80
+ 21
81
+ ],
82
+ "j": [
83
+ 22
84
+ ],
85
+ "k": [
86
+ 23
87
+ ],
88
+ "l": [
89
+ 24
90
+ ],
91
+ "m": [
92
+ 25
93
+ ],
94
+ "n": [
95
+ 26
96
+ ],
97
+ "o": [
98
+ 27
99
+ ],
100
+ "p": [
101
+ 28
102
+ ],
103
+ "q": [
104
+ 29
105
+ ],
106
+ "r": [
107
+ 30
108
+ ],
109
+ "s": [
110
+ 31
111
+ ],
112
+ "t": [
113
+ 32
114
+ ],
115
+ "u": [
116
+ 33
117
+ ],
118
+ "v": [
119
+ 34
120
+ ],
121
+ "w": [
122
+ 35
123
+ ],
124
+ "x": [
125
+ 36
126
+ ],
127
+ "y": [
128
+ 37
129
+ ],
130
+ "z": [
131
+ 38
132
+ ],
133
+ "æ": [
134
+ 39
135
+ ],
136
+ "ç": [
137
+ 40
138
+ ],
139
+ "ð": [
140
+ 41
141
+ ],
142
+ "ø": [
143
+ 42
144
+ ],
145
+ "ħ": [
146
+ 43
147
+ ],
148
+ "ŋ": [
149
+ 44
150
+ ],
151
+ "œ": [
152
+ 45
153
+ ],
154
+ "ǀ": [
155
+ 46
156
+ ],
157
+ "ǁ": [
158
+ 47
159
+ ],
160
+ "ǂ": [
161
+ 48
162
+ ],
163
+ "ǃ": [
164
+ 49
165
+ ],
166
+ "ɐ": [
167
+ 50
168
+ ],
169
+ "ɑ": [
170
+ 51
171
+ ],
172
+ "ɒ": [
173
+ 52
174
+ ],
175
+ "ɓ": [
176
+ 53
177
+ ],
178
+ "ɔ": [
179
+ 54
180
+ ],
181
+ "ɕ": [
182
+ 55
183
+ ],
184
+ "ɖ": [
185
+ 56
186
+ ],
187
+ "ɗ": [
188
+ 57
189
+ ],
190
+ "ɘ": [
191
+ 58
192
+ ],
193
+ "ə": [
194
+ 59
195
+ ],
196
+ "ɚ": [
197
+ 60
198
+ ],
199
+ "ɛ": [
200
+ 61
201
+ ],
202
+ "ɜ": [
203
+ 62
204
+ ],
205
+ "ɞ": [
206
+ 63
207
+ ],
208
+ "ɟ": [
209
+ 64
210
+ ],
211
+ "ɠ": [
212
+ 65
213
+ ],
214
+ "ɡ": [
215
+ 66
216
+ ],
217
+ "ɢ": [
218
+ 67
219
+ ],
220
+ "ɣ": [
221
+ 68
222
+ ],
223
+ "ɤ": [
224
+ 69
225
+ ],
226
+ "ɥ": [
227
+ 70
228
+ ],
229
+ "ɦ": [
230
+ 71
231
+ ],
232
+ "ɧ": [
233
+ 72
234
+ ],
235
+ "ɨ": [
236
+ 73
237
+ ],
238
+ "ɪ": [
239
+ 74
240
+ ],
241
+ "ɫ": [
242
+ 75
243
+ ],
244
+ "ɬ": [
245
+ 76
246
+ ],
247
+ "ɭ": [
248
+ 77
249
+ ],
250
+ "ɮ": [
251
+ 78
252
+ ],
253
+ "ɯ": [
254
+ 79
255
+ ],
256
+ "ɰ": [
257
+ 80
258
+ ],
259
+ "ɱ": [
260
+ 81
261
+ ],
262
+ "ɲ": [
263
+ 82
264
+ ],
265
+ "ɳ": [
266
+ 83
267
+ ],
268
+ "ɴ": [
269
+ 84
270
+ ],
271
+ "ɵ": [
272
+ 85
273
+ ],
274
+ "ɶ": [
275
+ 86
276
+ ],
277
+ "ɸ": [
278
+ 87
279
+ ],
280
+ "ɹ": [
281
+ 88
282
+ ],
283
+ "ɺ": [
284
+ 89
285
+ ],
286
+ "ɻ": [
287
+ 90
288
+ ],
289
+ "ɽ": [
290
+ 91
291
+ ],
292
+ "ɾ": [
293
+ 92
294
+ ],
295
+ "ʀ": [
296
+ 93
297
+ ],
298
+ "ʁ": [
299
+ 94
300
+ ],
301
+ "ʂ": [
302
+ 95
303
+ ],
304
+ "ʃ": [
305
+ 96
306
+ ],
307
+ "ʄ": [
308
+ 97
309
+ ],
310
+ "ʈ": [
311
+ 98
312
+ ],
313
+ "ʉ": [
314
+ 99
315
+ ],
316
+ "ʊ": [
317
+ 100
318
+ ],
319
+ "ʋ": [
320
+ 101
321
+ ],
322
+ "ʌ": [
323
+ 102
324
+ ],
325
+ "ʍ": [
326
+ 103
327
+ ],
328
+ "ʎ": [
329
+ 104
330
+ ],
331
+ "ʏ": [
332
+ 105
333
+ ],
334
+ "ʐ": [
335
+ 106
336
+ ],
337
+ "ʑ": [
338
+ 107
339
+ ],
340
+ "ʒ": [
341
+ 108
342
+ ],
343
+ "ʔ": [
344
+ 109
345
+ ],
346
+ "ʕ": [
347
+ 110
348
+ ],
349
+ "ʘ": [
350
+ 111
351
+ ],
352
+ "ʙ": [
353
+ 112
354
+ ],
355
+ "ʛ": [
356
+ 113
357
+ ],
358
+ "ʜ": [
359
+ 114
360
+ ],
361
+ "ʝ": [
362
+ 115
363
+ ],
364
+ "ʟ": [
365
+ 116
366
+ ],
367
+ "ʡ": [
368
+ 117
369
+ ],
370
+ "ʢ": [
371
+ 118
372
+ ],
373
+ "ʲ": [
374
+ 119
375
+ ],
376
+ "ˈ": [
377
+ 120
378
+ ],
379
+ "ˌ": [
380
+ 121
381
+ ],
382
+ "ː": [
383
+ 122
384
+ ],
385
+ "ˑ": [
386
+ 123
387
+ ],
388
+ "˞": [
389
+ 124
390
+ ],
391
+ "β": [
392
+ 125
393
+ ],
394
+ "θ": [
395
+ 126
396
+ ],
397
+ "χ": [
398
+ 127
399
+ ],
400
+ "ᵻ": [
401
+ 128
402
+ ],
403
+ "ⱱ": [
404
+ 129
405
+ ]
406
+ },
407
+ "num_symbols": 130,
408
+ "num_speakers": 1,
409
+ "speaker_id_map": {},
410
+ "piper_version": "0.2.0",
411
+ "language": {
412
+ "code": "ca_ES",
413
+ "family": "ca",
414
+ "region": "ES",
415
+ "name_native": "Català",
416
+ "name_english": "Catalan",
417
+ "country_english": "Spain"
418
+ },
419
+ "dataset": "upc_pau"
420
+ }
ca/ca_ES/upc_pau/x_low/samples/speaker_0.mp3 ADDED
Binary file (151 kB). View file
 
cs/cs_CZ/jirka/low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for jirka (low)
2
+
3
+ * Language: cs_CZ (Czech, Czech Republic)
4
+ * Speakers: 1
5
+ * Quality: low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/NabuCasa/voice-datasets
11
+ * License: CC0
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (low quality).
cs/cs_CZ/jirka/low/cs_CZ-jirka-low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72e73fb306a165b41927d2c9d882f71e9f1c86ac5edf37c5441370a6e4e6ef7d
3
+ size 63201294
cs/cs_CZ/jirka/low/cs_CZ-jirka-low.onnx.json ADDED
@@ -0,0 +1,508 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 16000,
4
+ "quality": "low"
5
+ },
6
+ "espeak": {
7
+ "voice": "cs"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ " ": [
18
+ 3
19
+ ],
20
+ "!": [
21
+ 4
22
+ ],
23
+ "\"": [
24
+ 150
25
+ ],
26
+ "#": [
27
+ 149
28
+ ],
29
+ "$": [
30
+ 2
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ "0": [
51
+ 130
52
+ ],
53
+ "1": [
54
+ 131
55
+ ],
56
+ "2": [
57
+ 132
58
+ ],
59
+ "3": [
60
+ 133
61
+ ],
62
+ "4": [
63
+ 134
64
+ ],
65
+ "5": [
66
+ 135
67
+ ],
68
+ "6": [
69
+ 136
70
+ ],
71
+ "7": [
72
+ 137
73
+ ],
74
+ "8": [
75
+ 138
76
+ ],
77
+ "9": [
78
+ 139
79
+ ],
80
+ ":": [
81
+ 11
82
+ ],
83
+ ";": [
84
+ 12
85
+ ],
86
+ "?": [
87
+ 13
88
+ ],
89
+ "X": [
90
+ 156
91
+ ],
92
+ "^": [
93
+ 1
94
+ ],
95
+ "_": [
96
+ 0
97
+ ],
98
+ "a": [
99
+ 14
100
+ ],
101
+ "b": [
102
+ 15
103
+ ],
104
+ "c": [
105
+ 16
106
+ ],
107
+ "d": [
108
+ 17
109
+ ],
110
+ "e": [
111
+ 18
112
+ ],
113
+ "f": [
114
+ 19
115
+ ],
116
+ "g": [
117
+ 154
118
+ ],
119
+ "h": [
120
+ 20
121
+ ],
122
+ "i": [
123
+ 21
124
+ ],
125
+ "j": [
126
+ 22
127
+ ],
128
+ "k": [
129
+ 23
130
+ ],
131
+ "l": [
132
+ 24
133
+ ],
134
+ "m": [
135
+ 25
136
+ ],
137
+ "n": [
138
+ 26
139
+ ],
140
+ "o": [
141
+ 27
142
+ ],
143
+ "p": [
144
+ 28
145
+ ],
146
+ "q": [
147
+ 29
148
+ ],
149
+ "r": [
150
+ 30
151
+ ],
152
+ "s": [
153
+ 31
154
+ ],
155
+ "t": [
156
+ 32
157
+ ],
158
+ "u": [
159
+ 33
160
+ ],
161
+ "v": [
162
+ 34
163
+ ],
164
+ "w": [
165
+ 35
166
+ ],
167
+ "x": [
168
+ 36
169
+ ],
170
+ "y": [
171
+ 37
172
+ ],
173
+ "z": [
174
+ 38
175
+ ],
176
+ "æ": [
177
+ 39
178
+ ],
179
+ "ç": [
180
+ 40
181
+ ],
182
+ "ð": [
183
+ 41
184
+ ],
185
+ "ø": [
186
+ 42
187
+ ],
188
+ "ħ": [
189
+ 43
190
+ ],
191
+ "ŋ": [
192
+ 44
193
+ ],
194
+ "œ": [
195
+ 45
196
+ ],
197
+ "ǀ": [
198
+ 46
199
+ ],
200
+ "ǁ": [
201
+ 47
202
+ ],
203
+ "ǂ": [
204
+ 48
205
+ ],
206
+ "ǃ": [
207
+ 49
208
+ ],
209
+ "ɐ": [
210
+ 50
211
+ ],
212
+ "ɑ": [
213
+ 51
214
+ ],
215
+ "ɒ": [
216
+ 52
217
+ ],
218
+ "ɓ": [
219
+ 53
220
+ ],
221
+ "ɔ": [
222
+ 54
223
+ ],
224
+ "ɕ": [
225
+ 55
226
+ ],
227
+ "ɖ": [
228
+ 56
229
+ ],
230
+ "ɗ": [
231
+ 57
232
+ ],
233
+ "ɘ": [
234
+ 58
235
+ ],
236
+ "ə": [
237
+ 59
238
+ ],
239
+ "ɚ": [
240
+ 60
241
+ ],
242
+ "ɛ": [
243
+ 61
244
+ ],
245
+ "ɜ": [
246
+ 62
247
+ ],
248
+ "ɞ": [
249
+ 63
250
+ ],
251
+ "ɟ": [
252
+ 64
253
+ ],
254
+ "ɠ": [
255
+ 65
256
+ ],
257
+ "ɡ": [
258
+ 66
259
+ ],
260
+ "ɢ": [
261
+ 67
262
+ ],
263
+ "ɣ": [
264
+ 68
265
+ ],
266
+ "ɤ": [
267
+ 69
268
+ ],
269
+ "ɥ": [
270
+ 70
271
+ ],
272
+ "ɦ": [
273
+ 71
274
+ ],
275
+ "ɧ": [
276
+ 72
277
+ ],
278
+ "ɨ": [
279
+ 73
280
+ ],
281
+ "ɪ": [
282
+ 74
283
+ ],
284
+ "ɫ": [
285
+ 75
286
+ ],
287
+ "ɬ": [
288
+ 76
289
+ ],
290
+ "ɭ": [
291
+ 77
292
+ ],
293
+ "ɮ": [
294
+ 78
295
+ ],
296
+ "ɯ": [
297
+ 79
298
+ ],
299
+ "ɰ": [
300
+ 80
301
+ ],
302
+ "ɱ": [
303
+ 81
304
+ ],
305
+ "ɲ": [
306
+ 82
307
+ ],
308
+ "ɳ": [
309
+ 83
310
+ ],
311
+ "ɴ": [
312
+ 84
313
+ ],
314
+ "ɵ": [
315
+ 85
316
+ ],
317
+ "ɶ": [
318
+ 86
319
+ ],
320
+ "ɸ": [
321
+ 87
322
+ ],
323
+ "ɹ": [
324
+ 88
325
+ ],
326
+ "ɺ": [
327
+ 89
328
+ ],
329
+ "ɻ": [
330
+ 90
331
+ ],
332
+ "ɽ": [
333
+ 91
334
+ ],
335
+ "ɾ": [
336
+ 92
337
+ ],
338
+ "ʀ": [
339
+ 93
340
+ ],
341
+ "ʁ": [
342
+ 94
343
+ ],
344
+ "ʂ": [
345
+ 95
346
+ ],
347
+ "ʃ": [
348
+ 96
349
+ ],
350
+ "ʄ": [
351
+ 97
352
+ ],
353
+ "ʈ": [
354
+ 98
355
+ ],
356
+ "ʉ": [
357
+ 99
358
+ ],
359
+ "ʊ": [
360
+ 100
361
+ ],
362
+ "ʋ": [
363
+ 101
364
+ ],
365
+ "ʌ": [
366
+ 102
367
+ ],
368
+ "ʍ": [
369
+ 103
370
+ ],
371
+ "ʎ": [
372
+ 104
373
+ ],
374
+ "ʏ": [
375
+ 105
376
+ ],
377
+ "ʐ": [
378
+ 106
379
+ ],
380
+ "ʑ": [
381
+ 107
382
+ ],
383
+ "ʒ": [
384
+ 108
385
+ ],
386
+ "ʔ": [
387
+ 109
388
+ ],
389
+ "ʕ": [
390
+ 110
391
+ ],
392
+ "ʘ": [
393
+ 111
394
+ ],
395
+ "ʙ": [
396
+ 112
397
+ ],
398
+ "ʛ": [
399
+ 113
400
+ ],
401
+ "ʜ": [
402
+ 114
403
+ ],
404
+ "ʝ": [
405
+ 115
406
+ ],
407
+ "ʟ": [
408
+ 116
409
+ ],
410
+ "ʡ": [
411
+ 117
412
+ ],
413
+ "ʢ": [
414
+ 118
415
+ ],
416
+ "ʦ": [
417
+ 155
418
+ ],
419
+ "ʰ": [
420
+ 145
421
+ ],
422
+ "ʲ": [
423
+ 119
424
+ ],
425
+ "ˈ": [
426
+ 120
427
+ ],
428
+ "ˌ": [
429
+ 121
430
+ ],
431
+ "ː": [
432
+ 122
433
+ ],
434
+ "ˑ": [
435
+ 123
436
+ ],
437
+ "˞": [
438
+ 124
439
+ ],
440
+ "ˤ": [
441
+ 146
442
+ ],
443
+ "̃": [
444
+ 141
445
+ ],
446
+ "̊": [
447
+ 158
448
+ ],
449
+ "̝": [
450
+ 157
451
+ ],
452
+ "̧": [
453
+ 140
454
+ ],
455
+ "̩": [
456
+ 144
457
+ ],
458
+ "̪": [
459
+ 142
460
+ ],
461
+ "̯": [
462
+ 143
463
+ ],
464
+ "̺": [
465
+ 152
466
+ ],
467
+ "̻": [
468
+ 153
469
+ ],
470
+ "β": [
471
+ 125
472
+ ],
473
+ "ε": [
474
+ 147
475
+ ],
476
+ "θ": [
477
+ 126
478
+ ],
479
+ "χ": [
480
+ 127
481
+ ],
482
+ "ᵻ": [
483
+ 128
484
+ ],
485
+ "↑": [
486
+ 151
487
+ ],
488
+ "↓": [
489
+ 148
490
+ ],
491
+ "ⱱ": [
492
+ 129
493
+ ]
494
+ },
495
+ "num_symbols": 256,
496
+ "num_speakers": 1,
497
+ "speaker_id_map": {},
498
+ "piper_version": "1.0.0",
499
+ "language": {
500
+ "code": "cs_CZ",
501
+ "family": "cs",
502
+ "region": "CZ",
503
+ "name_native": "Čeština",
504
+ "name_english": "Czech",
505
+ "country_english": "Czech Republic"
506
+ },
507
+ "dataset": "jirka"
508
+ }
cs/cs_CZ/jirka/low/samples/speaker_0.mp3 ADDED
Binary file (96.1 kB). View file
 
cs/cs_CZ/jirka/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for jirka (medium)
2
+
3
+ * Language: cs_CZ (Czech, Czech Republic)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/NabuCasa/voice-datasets
11
+ * License: CC0
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
cs/cs_CZ/jirka/medium/cs_CZ-jirka-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbd5c900acacc8e8cbecd64347abb8de39c00a9d3104bed06fee92e4f319efc8
3
+ size 63201294
cs/cs_CZ/jirka/medium/cs_CZ-jirka-medium.onnx.json ADDED
@@ -0,0 +1,508 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "cs"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ " ": [
18
+ 3
19
+ ],
20
+ "!": [
21
+ 4
22
+ ],
23
+ "\"": [
24
+ 150
25
+ ],
26
+ "#": [
27
+ 149
28
+ ],
29
+ "$": [
30
+ 2
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ "0": [
51
+ 130
52
+ ],
53
+ "1": [
54
+ 131
55
+ ],
56
+ "2": [
57
+ 132
58
+ ],
59
+ "3": [
60
+ 133
61
+ ],
62
+ "4": [
63
+ 134
64
+ ],
65
+ "5": [
66
+ 135
67
+ ],
68
+ "6": [
69
+ 136
70
+ ],
71
+ "7": [
72
+ 137
73
+ ],
74
+ "8": [
75
+ 138
76
+ ],
77
+ "9": [
78
+ 139
79
+ ],
80
+ ":": [
81
+ 11
82
+ ],
83
+ ";": [
84
+ 12
85
+ ],
86
+ "?": [
87
+ 13
88
+ ],
89
+ "X": [
90
+ 156
91
+ ],
92
+ "^": [
93
+ 1
94
+ ],
95
+ "_": [
96
+ 0
97
+ ],
98
+ "a": [
99
+ 14
100
+ ],
101
+ "b": [
102
+ 15
103
+ ],
104
+ "c": [
105
+ 16
106
+ ],
107
+ "d": [
108
+ 17
109
+ ],
110
+ "e": [
111
+ 18
112
+ ],
113
+ "f": [
114
+ 19
115
+ ],
116
+ "g": [
117
+ 154
118
+ ],
119
+ "h": [
120
+ 20
121
+ ],
122
+ "i": [
123
+ 21
124
+ ],
125
+ "j": [
126
+ 22
127
+ ],
128
+ "k": [
129
+ 23
130
+ ],
131
+ "l": [
132
+ 24
133
+ ],
134
+ "m": [
135
+ 25
136
+ ],
137
+ "n": [
138
+ 26
139
+ ],
140
+ "o": [
141
+ 27
142
+ ],
143
+ "p": [
144
+ 28
145
+ ],
146
+ "q": [
147
+ 29
148
+ ],
149
+ "r": [
150
+ 30
151
+ ],
152
+ "s": [
153
+ 31
154
+ ],
155
+ "t": [
156
+ 32
157
+ ],
158
+ "u": [
159
+ 33
160
+ ],
161
+ "v": [
162
+ 34
163
+ ],
164
+ "w": [
165
+ 35
166
+ ],
167
+ "x": [
168
+ 36
169
+ ],
170
+ "y": [
171
+ 37
172
+ ],
173
+ "z": [
174
+ 38
175
+ ],
176
+ "æ": [
177
+ 39
178
+ ],
179
+ "ç": [
180
+ 40
181
+ ],
182
+ "ð": [
183
+ 41
184
+ ],
185
+ "ø": [
186
+ 42
187
+ ],
188
+ "ħ": [
189
+ 43
190
+ ],
191
+ "ŋ": [
192
+ 44
193
+ ],
194
+ "œ": [
195
+ 45
196
+ ],
197
+ "ǀ": [
198
+ 46
199
+ ],
200
+ "ǁ": [
201
+ 47
202
+ ],
203
+ "ǂ": [
204
+ 48
205
+ ],
206
+ "ǃ": [
207
+ 49
208
+ ],
209
+ "ɐ": [
210
+ 50
211
+ ],
212
+ "ɑ": [
213
+ 51
214
+ ],
215
+ "ɒ": [
216
+ 52
217
+ ],
218
+ "ɓ": [
219
+ 53
220
+ ],
221
+ "ɔ": [
222
+ 54
223
+ ],
224
+ "ɕ": [
225
+ 55
226
+ ],
227
+ "ɖ": [
228
+ 56
229
+ ],
230
+ "ɗ": [
231
+ 57
232
+ ],
233
+ "ɘ": [
234
+ 58
235
+ ],
236
+ "ə": [
237
+ 59
238
+ ],
239
+ "ɚ": [
240
+ 60
241
+ ],
242
+ "ɛ": [
243
+ 61
244
+ ],
245
+ "ɜ": [
246
+ 62
247
+ ],
248
+ "ɞ": [
249
+ 63
250
+ ],
251
+ "ɟ": [
252
+ 64
253
+ ],
254
+ "ɠ": [
255
+ 65
256
+ ],
257
+ "ɡ": [
258
+ 66
259
+ ],
260
+ "ɢ": [
261
+ 67
262
+ ],
263
+ "ɣ": [
264
+ 68
265
+ ],
266
+ "ɤ": [
267
+ 69
268
+ ],
269
+ "ɥ": [
270
+ 70
271
+ ],
272
+ "ɦ": [
273
+ 71
274
+ ],
275
+ "ɧ": [
276
+ 72
277
+ ],
278
+ "ɨ": [
279
+ 73
280
+ ],
281
+ "ɪ": [
282
+ 74
283
+ ],
284
+ "ɫ": [
285
+ 75
286
+ ],
287
+ "ɬ": [
288
+ 76
289
+ ],
290
+ "ɭ": [
291
+ 77
292
+ ],
293
+ "ɮ": [
294
+ 78
295
+ ],
296
+ "ɯ": [
297
+ 79
298
+ ],
299
+ "ɰ": [
300
+ 80
301
+ ],
302
+ "ɱ": [
303
+ 81
304
+ ],
305
+ "ɲ": [
306
+ 82
307
+ ],
308
+ "ɳ": [
309
+ 83
310
+ ],
311
+ "ɴ": [
312
+ 84
313
+ ],
314
+ "ɵ": [
315
+ 85
316
+ ],
317
+ "ɶ": [
318
+ 86
319
+ ],
320
+ "ɸ": [
321
+ 87
322
+ ],
323
+ "ɹ": [
324
+ 88
325
+ ],
326
+ "ɺ": [
327
+ 89
328
+ ],
329
+ "ɻ": [
330
+ 90
331
+ ],
332
+ "ɽ": [
333
+ 91
334
+ ],
335
+ "ɾ": [
336
+ 92
337
+ ],
338
+ "ʀ": [
339
+ 93
340
+ ],
341
+ "ʁ": [
342
+ 94
343
+ ],
344
+ "ʂ": [
345
+ 95
346
+ ],
347
+ "ʃ": [
348
+ 96
349
+ ],
350
+ "ʄ": [
351
+ 97
352
+ ],
353
+ "ʈ": [
354
+ 98
355
+ ],
356
+ "ʉ": [
357
+ 99
358
+ ],
359
+ "ʊ": [
360
+ 100
361
+ ],
362
+ "ʋ": [
363
+ 101
364
+ ],
365
+ "ʌ": [
366
+ 102
367
+ ],
368
+ "ʍ": [
369
+ 103
370
+ ],
371
+ "ʎ": [
372
+ 104
373
+ ],
374
+ "ʏ": [
375
+ 105
376
+ ],
377
+ "ʐ": [
378
+ 106
379
+ ],
380
+ "ʑ": [
381
+ 107
382
+ ],
383
+ "ʒ": [
384
+ 108
385
+ ],
386
+ "ʔ": [
387
+ 109
388
+ ],
389
+ "ʕ": [
390
+ 110
391
+ ],
392
+ "ʘ": [
393
+ 111
394
+ ],
395
+ "ʙ": [
396
+ 112
397
+ ],
398
+ "ʛ": [
399
+ 113
400
+ ],
401
+ "ʜ": [
402
+ 114
403
+ ],
404
+ "ʝ": [
405
+ 115
406
+ ],
407
+ "ʟ": [
408
+ 116
409
+ ],
410
+ "ʡ": [
411
+ 117
412
+ ],
413
+ "ʢ": [
414
+ 118
415
+ ],
416
+ "ʦ": [
417
+ 155
418
+ ],
419
+ "ʰ": [
420
+ 145
421
+ ],
422
+ "ʲ": [
423
+ 119
424
+ ],
425
+ "ˈ": [
426
+ 120
427
+ ],
428
+ "ˌ": [
429
+ 121
430
+ ],
431
+ "ː": [
432
+ 122
433
+ ],
434
+ "ˑ": [
435
+ 123
436
+ ],
437
+ "˞": [
438
+ 124
439
+ ],
440
+ "ˤ": [
441
+ 146
442
+ ],
443
+ "̃": [
444
+ 141
445
+ ],
446
+ "̊": [
447
+ 158
448
+ ],
449
+ "̝": [
450
+ 157
451
+ ],
452
+ "̧": [
453
+ 140
454
+ ],
455
+ "̩": [
456
+ 144
457
+ ],
458
+ "̪": [
459
+ 142
460
+ ],
461
+ "̯": [
462
+ 143
463
+ ],
464
+ "̺": [
465
+ 152
466
+ ],
467
+ "̻": [
468
+ 153
469
+ ],
470
+ "β": [
471
+ 125
472
+ ],
473
+ "ε": [
474
+ 147
475
+ ],
476
+ "θ": [
477
+ 126
478
+ ],
479
+ "χ": [
480
+ 127
481
+ ],
482
+ "ᵻ": [
483
+ 128
484
+ ],
485
+ "↑": [
486
+ 151
487
+ ],
488
+ "↓": [
489
+ 148
490
+ ],
491
+ "ⱱ": [
492
+ 129
493
+ ]
494
+ },
495
+ "num_symbols": 256,
496
+ "num_speakers": 1,
497
+ "speaker_id_map": {},
498
+ "piper_version": "1.0.0",
499
+ "language": {
500
+ "code": "cs_CZ",
501
+ "family": "cs",
502
+ "region": "CZ",
503
+ "name_native": "Čeština",
504
+ "name_english": "Czech",
505
+ "country_english": "Czech Republic"
506
+ },
507
+ "dataset": "jirka"
508
+ }
cs/cs_CZ/jirka/medium/samples/speaker_0.mp3 ADDED
Binary file (132 kB). View file
 
da/da_DK/talesyntese/medium/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ da-nst_talesyntese-medium
da/da_DK/talesyntese/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for talesyntese (medium)
2
+
3
+ * Language: da_DK (Danish, Denmark)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://www.nb.no/sprakbanken/en/resource-catalogue/oai-nb-no-sbr-21/
11
+ * License: CC0
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
da/da_DK/talesyntese/medium/da_DK-talesyntese-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9271efd25f7b8494bbd28d48dd675c8c119daa284f3ee488008935f515f1241
3
+ size 63201294
da/da_DK/talesyntese/medium/da_DK-talesyntese-medium.onnx.json ADDED
@@ -0,0 +1,493 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "da"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ "_": [
18
+ 0
19
+ ],
20
+ "^": [
21
+ 1
22
+ ],
23
+ "$": [
24
+ 2
25
+ ],
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ ":": [
51
+ 11
52
+ ],
53
+ ";": [
54
+ 12
55
+ ],
56
+ "?": [
57
+ 13
58
+ ],
59
+ "a": [
60
+ 14
61
+ ],
62
+ "b": [
63
+ 15
64
+ ],
65
+ "c": [
66
+ 16
67
+ ],
68
+ "d": [
69
+ 17
70
+ ],
71
+ "e": [
72
+ 18
73
+ ],
74
+ "f": [
75
+ 19
76
+ ],
77
+ "h": [
78
+ 20
79
+ ],
80
+ "i": [
81
+ 21
82
+ ],
83
+ "j": [
84
+ 22
85
+ ],
86
+ "k": [
87
+ 23
88
+ ],
89
+ "l": [
90
+ 24
91
+ ],
92
+ "m": [
93
+ 25
94
+ ],
95
+ "n": [
96
+ 26
97
+ ],
98
+ "o": [
99
+ 27
100
+ ],
101
+ "p": [
102
+ 28
103
+ ],
104
+ "q": [
105
+ 29
106
+ ],
107
+ "r": [
108
+ 30
109
+ ],
110
+ "s": [
111
+ 31
112
+ ],
113
+ "t": [
114
+ 32
115
+ ],
116
+ "u": [
117
+ 33
118
+ ],
119
+ "v": [
120
+ 34
121
+ ],
122
+ "w": [
123
+ 35
124
+ ],
125
+ "x": [
126
+ 36
127
+ ],
128
+ "y": [
129
+ 37
130
+ ],
131
+ "z": [
132
+ 38
133
+ ],
134
+ "æ": [
135
+ 39
136
+ ],
137
+ "ç": [
138
+ 40
139
+ ],
140
+ "ð": [
141
+ 41
142
+ ],
143
+ "ø": [
144
+ 42
145
+ ],
146
+ "ħ": [
147
+ 43
148
+ ],
149
+ "ŋ": [
150
+ 44
151
+ ],
152
+ "œ": [
153
+ 45
154
+ ],
155
+ "ǀ": [
156
+ 46
157
+ ],
158
+ "ǁ": [
159
+ 47
160
+ ],
161
+ "ǂ": [
162
+ 48
163
+ ],
164
+ "ǃ": [
165
+ 49
166
+ ],
167
+ "ɐ": [
168
+ 50
169
+ ],
170
+ "ɑ": [
171
+ 51
172
+ ],
173
+ "ɒ": [
174
+ 52
175
+ ],
176
+ "ɓ": [
177
+ 53
178
+ ],
179
+ "ɔ": [
180
+ 54
181
+ ],
182
+ "ɕ": [
183
+ 55
184
+ ],
185
+ "ɖ": [
186
+ 56
187
+ ],
188
+ "ɗ": [
189
+ 57
190
+ ],
191
+ "ɘ": [
192
+ 58
193
+ ],
194
+ "ə": [
195
+ 59
196
+ ],
197
+ "ɚ": [
198
+ 60
199
+ ],
200
+ "ɛ": [
201
+ 61
202
+ ],
203
+ "ɜ": [
204
+ 62
205
+ ],
206
+ "ɞ": [
207
+ 63
208
+ ],
209
+ "ɟ": [
210
+ 64
211
+ ],
212
+ "ɠ": [
213
+ 65
214
+ ],
215
+ "ɡ": [
216
+ 66
217
+ ],
218
+ "ɢ": [
219
+ 67
220
+ ],
221
+ "ɣ": [
222
+ 68
223
+ ],
224
+ "ɤ": [
225
+ 69
226
+ ],
227
+ "ɥ": [
228
+ 70
229
+ ],
230
+ "ɦ": [
231
+ 71
232
+ ],
233
+ "ɧ": [
234
+ 72
235
+ ],
236
+ "ɨ": [
237
+ 73
238
+ ],
239
+ "ɪ": [
240
+ 74
241
+ ],
242
+ "ɫ": [
243
+ 75
244
+ ],
245
+ "ɬ": [
246
+ 76
247
+ ],
248
+ "ɭ": [
249
+ 77
250
+ ],
251
+ "ɮ": [
252
+ 78
253
+ ],
254
+ "ɯ": [
255
+ 79
256
+ ],
257
+ "ɰ": [
258
+ 80
259
+ ],
260
+ "ɱ": [
261
+ 81
262
+ ],
263
+ "ɲ": [
264
+ 82
265
+ ],
266
+ "ɳ": [
267
+ 83
268
+ ],
269
+ "ɴ": [
270
+ 84
271
+ ],
272
+ "ɵ": [
273
+ 85
274
+ ],
275
+ "ɶ": [
276
+ 86
277
+ ],
278
+ "ɸ": [
279
+ 87
280
+ ],
281
+ "ɹ": [
282
+ 88
283
+ ],
284
+ "ɺ": [
285
+ 89
286
+ ],
287
+ "ɻ": [
288
+ 90
289
+ ],
290
+ "ɽ": [
291
+ 91
292
+ ],
293
+ "ɾ": [
294
+ 92
295
+ ],
296
+ "ʀ": [
297
+ 93
298
+ ],
299
+ "ʁ": [
300
+ 94
301
+ ],
302
+ "ʂ": [
303
+ 95
304
+ ],
305
+ "ʃ": [
306
+ 96
307
+ ],
308
+ "ʄ": [
309
+ 97
310
+ ],
311
+ "ʈ": [
312
+ 98
313
+ ],
314
+ "ʉ": [
315
+ 99
316
+ ],
317
+ "ʊ": [
318
+ 100
319
+ ],
320
+ "ʋ": [
321
+ 101
322
+ ],
323
+ "ʌ": [
324
+ 102
325
+ ],
326
+ "ʍ": [
327
+ 103
328
+ ],
329
+ "ʎ": [
330
+ 104
331
+ ],
332
+ "ʏ": [
333
+ 105
334
+ ],
335
+ "ʐ": [
336
+ 106
337
+ ],
338
+ "ʑ": [
339
+ 107
340
+ ],
341
+ "ʒ": [
342
+ 108
343
+ ],
344
+ "ʔ": [
345
+ 109
346
+ ],
347
+ "ʕ": [
348
+ 110
349
+ ],
350
+ "ʘ": [
351
+ 111
352
+ ],
353
+ "ʙ": [
354
+ 112
355
+ ],
356
+ "ʛ": [
357
+ 113
358
+ ],
359
+ "ʜ": [
360
+ 114
361
+ ],
362
+ "ʝ": [
363
+ 115
364
+ ],
365
+ "ʟ": [
366
+ 116
367
+ ],
368
+ "ʡ": [
369
+ 117
370
+ ],
371
+ "ʢ": [
372
+ 118
373
+ ],
374
+ "ʲ": [
375
+ 119
376
+ ],
377
+ "ˈ": [
378
+ 120
379
+ ],
380
+ "ˌ": [
381
+ 121
382
+ ],
383
+ "ː": [
384
+ 122
385
+ ],
386
+ "ˑ": [
387
+ 123
388
+ ],
389
+ "˞": [
390
+ 124
391
+ ],
392
+ "β": [
393
+ 125
394
+ ],
395
+ "θ": [
396
+ 126
397
+ ],
398
+ "χ": [
399
+ 127
400
+ ],
401
+ "ᵻ": [
402
+ 128
403
+ ],
404
+ "ⱱ": [
405
+ 129
406
+ ],
407
+ "0": [
408
+ 130
409
+ ],
410
+ "1": [
411
+ 131
412
+ ],
413
+ "2": [
414
+ 132
415
+ ],
416
+ "3": [
417
+ 133
418
+ ],
419
+ "4": [
420
+ 134
421
+ ],
422
+ "5": [
423
+ 135
424
+ ],
425
+ "6": [
426
+ 136
427
+ ],
428
+ "7": [
429
+ 137
430
+ ],
431
+ "8": [
432
+ 138
433
+ ],
434
+ "9": [
435
+ 139
436
+ ],
437
+ "̧": [
438
+ 140
439
+ ],
440
+ "̃": [
441
+ 141
442
+ ],
443
+ "̪": [
444
+ 142
445
+ ],
446
+ "̯": [
447
+ 143
448
+ ],
449
+ "̩": [
450
+ 144
451
+ ],
452
+ "ʰ": [
453
+ 145
454
+ ],
455
+ "ˤ": [
456
+ 146
457
+ ],
458
+ "ε": [
459
+ 147
460
+ ],
461
+ "↓": [
462
+ 148
463
+ ],
464
+ "#": [
465
+ 149
466
+ ],
467
+ "\"": [
468
+ 150
469
+ ],
470
+ "↑": [
471
+ 151
472
+ ],
473
+ "̺": [
474
+ 152
475
+ ],
476
+ "̻": [
477
+ 153
478
+ ]
479
+ },
480
+ "num_symbols": 256,
481
+ "num_speakers": 1,
482
+ "speaker_id_map": {},
483
+ "piper_version": "0.2.0",
484
+ "language": {
485
+ "code": "da_DK",
486
+ "family": "da",
487
+ "region": "DK",
488
+ "name_native": "Dansk",
489
+ "name_english": "Danish",
490
+ "country_english": "Denmark"
491
+ },
492
+ "dataset": "talesyntese"
493
+ }
da/da_DK/talesyntese/medium/samples/speaker_0.mp3 ADDED
Binary file (72.7 kB). View file
 
de/de_DE/eva_k/x_low/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ de-eva_k-x-low
de/de_DE/eva_k/x_low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for eva_k (x_low)
2
+
3
+ * Language: de_DE (German, Germany)
4
+ * Speakers: 1
5
+ * Quality: x_low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://www.caito.de/2019/01/03/the-m-ailabs-speech-dataset/
11
+ * License: See URL
12
+
13
+ ## Training
14
+
15
+ Trained from scratch.
de/de_DE/eva_k/x_low/de_DE-eva_k-x_low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e88cf290fbfb768bf111330d2e8a46e376b0d85e3423a28bfebbc863a260dad8
3
+ size 20628813
de/de_DE/eva_k/x_low/de_DE-eva_k-x_low.onnx.json ADDED
@@ -0,0 +1,420 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 16000,
4
+ "quality": "x_low"
5
+ },
6
+ "espeak": {
7
+ "voice": "de"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_map": {},
15
+ "phoneme_id_map": {
16
+ "_": [
17
+ 0
18
+ ],
19
+ "^": [
20
+ 1
21
+ ],
22
+ "$": [
23
+ 2
24
+ ],
25
+ " ": [
26
+ 3
27
+ ],
28
+ "!": [
29
+ 4
30
+ ],
31
+ "'": [
32
+ 5
33
+ ],
34
+ "(": [
35
+ 6
36
+ ],
37
+ ")": [
38
+ 7
39
+ ],
40
+ ",": [
41
+ 8
42
+ ],
43
+ "-": [
44
+ 9
45
+ ],
46
+ ".": [
47
+ 10
48
+ ],
49
+ ":": [
50
+ 11
51
+ ],
52
+ ";": [
53
+ 12
54
+ ],
55
+ "?": [
56
+ 13
57
+ ],
58
+ "a": [
59
+ 14
60
+ ],
61
+ "b": [
62
+ 15
63
+ ],
64
+ "c": [
65
+ 16
66
+ ],
67
+ "d": [
68
+ 17
69
+ ],
70
+ "e": [
71
+ 18
72
+ ],
73
+ "f": [
74
+ 19
75
+ ],
76
+ "h": [
77
+ 20
78
+ ],
79
+ "i": [
80
+ 21
81
+ ],
82
+ "j": [
83
+ 22
84
+ ],
85
+ "k": [
86
+ 23
87
+ ],
88
+ "l": [
89
+ 24
90
+ ],
91
+ "m": [
92
+ 25
93
+ ],
94
+ "n": [
95
+ 26
96
+ ],
97
+ "o": [
98
+ 27
99
+ ],
100
+ "p": [
101
+ 28
102
+ ],
103
+ "q": [
104
+ 29
105
+ ],
106
+ "r": [
107
+ 30
108
+ ],
109
+ "s": [
110
+ 31
111
+ ],
112
+ "t": [
113
+ 32
114
+ ],
115
+ "u": [
116
+ 33
117
+ ],
118
+ "v": [
119
+ 34
120
+ ],
121
+ "w": [
122
+ 35
123
+ ],
124
+ "x": [
125
+ 36
126
+ ],
127
+ "y": [
128
+ 37
129
+ ],
130
+ "z": [
131
+ 38
132
+ ],
133
+ "æ": [
134
+ 39
135
+ ],
136
+ "ç": [
137
+ 40
138
+ ],
139
+ "ð": [
140
+ 41
141
+ ],
142
+ "ø": [
143
+ 42
144
+ ],
145
+ "ħ": [
146
+ 43
147
+ ],
148
+ "ŋ": [
149
+ 44
150
+ ],
151
+ "œ": [
152
+ 45
153
+ ],
154
+ "ǀ": [
155
+ 46
156
+ ],
157
+ "ǁ": [
158
+ 47
159
+ ],
160
+ "ǂ": [
161
+ 48
162
+ ],
163
+ "ǃ": [
164
+ 49
165
+ ],
166
+ "ɐ": [
167
+ 50
168
+ ],
169
+ "ɑ": [
170
+ 51
171
+ ],
172
+ "ɒ": [
173
+ 52
174
+ ],
175
+ "ɓ": [
176
+ 53
177
+ ],
178
+ "ɔ": [
179
+ 54
180
+ ],
181
+ "ɕ": [
182
+ 55
183
+ ],
184
+ "ɖ": [
185
+ 56
186
+ ],
187
+ "ɗ": [
188
+ 57
189
+ ],
190
+ "ɘ": [
191
+ 58
192
+ ],
193
+ "ə": [
194
+ 59
195
+ ],
196
+ "ɚ": [
197
+ 60
198
+ ],
199
+ "ɛ": [
200
+ 61
201
+ ],
202
+ "ɜ": [
203
+ 62
204
+ ],
205
+ "ɞ": [
206
+ 63
207
+ ],
208
+ "ɟ": [
209
+ 64
210
+ ],
211
+ "ɠ": [
212
+ 65
213
+ ],
214
+ "ɡ": [
215
+ 66
216
+ ],
217
+ "ɢ": [
218
+ 67
219
+ ],
220
+ "ɣ": [
221
+ 68
222
+ ],
223
+ "ɤ": [
224
+ 69
225
+ ],
226
+ "ɥ": [
227
+ 70
228
+ ],
229
+ "ɦ": [
230
+ 71
231
+ ],
232
+ "ɧ": [
233
+ 72
234
+ ],
235
+ "ɨ": [
236
+ 73
237
+ ],
238
+ "ɪ": [
239
+ 74
240
+ ],
241
+ "ɫ": [
242
+ 75
243
+ ],
244
+ "ɬ": [
245
+ 76
246
+ ],
247
+ "ɭ": [
248
+ 77
249
+ ],
250
+ "ɮ": [
251
+ 78
252
+ ],
253
+ "ɯ": [
254
+ 79
255
+ ],
256
+ "ɰ": [
257
+ 80
258
+ ],
259
+ "ɱ": [
260
+ 81
261
+ ],
262
+ "ɲ": [
263
+ 82
264
+ ],
265
+ "ɳ": [
266
+ 83
267
+ ],
268
+ "ɴ": [
269
+ 84
270
+ ],
271
+ "ɵ": [
272
+ 85
273
+ ],
274
+ "ɶ": [
275
+ 86
276
+ ],
277
+ "ɸ": [
278
+ 87
279
+ ],
280
+ "ɹ": [
281
+ 88
282
+ ],
283
+ "ɺ": [
284
+ 89
285
+ ],
286
+ "ɻ": [
287
+ 90
288
+ ],
289
+ "ɽ": [
290
+ 91
291
+ ],
292
+ "ɾ": [
293
+ 92
294
+ ],
295
+ "ʀ": [
296
+ 93
297
+ ],
298
+ "ʁ": [
299
+ 94
300
+ ],
301
+ "ʂ": [
302
+ 95
303
+ ],
304
+ "ʃ": [
305
+ 96
306
+ ],
307
+ "ʄ": [
308
+ 97
309
+ ],
310
+ "ʈ": [
311
+ 98
312
+ ],
313
+ "ʉ": [
314
+ 99
315
+ ],
316
+ "ʊ": [
317
+ 100
318
+ ],
319
+ "ʋ": [
320
+ 101
321
+ ],
322
+ "ʌ": [
323
+ 102
324
+ ],
325
+ "ʍ": [
326
+ 103
327
+ ],
328
+ "ʎ": [
329
+ 104
330
+ ],
331
+ "ʏ": [
332
+ 105
333
+ ],
334
+ "ʐ": [
335
+ 106
336
+ ],
337
+ "ʑ": [
338
+ 107
339
+ ],
340
+ "ʒ": [
341
+ 108
342
+ ],
343
+ "ʔ": [
344
+ 109
345
+ ],
346
+ "ʕ": [
347
+ 110
348
+ ],
349
+ "ʘ": [
350
+ 111
351
+ ],
352
+ "ʙ": [
353
+ 112
354
+ ],
355
+ "ʛ": [
356
+ 113
357
+ ],
358
+ "ʜ": [
359
+ 114
360
+ ],
361
+ "ʝ": [
362
+ 115
363
+ ],
364
+ "ʟ": [
365
+ 116
366
+ ],
367
+ "ʡ": [
368
+ 117
369
+ ],
370
+ "ʢ": [
371
+ 118
372
+ ],
373
+ "ʲ": [
374
+ 119
375
+ ],
376
+ "ˈ": [
377
+ 120
378
+ ],
379
+ "ˌ": [
380
+ 121
381
+ ],
382
+ "ː": [
383
+ 122
384
+ ],
385
+ "ˑ": [
386
+ 123
387
+ ],
388
+ "˞": [
389
+ 124
390
+ ],
391
+ "β": [
392
+ 125
393
+ ],
394
+ "θ": [
395
+ 126
396
+ ],
397
+ "χ": [
398
+ 127
399
+ ],
400
+ "ᵻ": [
401
+ 128
402
+ ],
403
+ "ⱱ": [
404
+ 129
405
+ ]
406
+ },
407
+ "num_symbols": 130,
408
+ "num_speakers": 1,
409
+ "speaker_id_map": {},
410
+ "piper_version": "0.2.0",
411
+ "language": {
412
+ "code": "de_DE",
413
+ "family": "de",
414
+ "region": "DE",
415
+ "name_native": "Deutsch",
416
+ "name_english": "German",
417
+ "country_english": "Germany"
418
+ },
419
+ "dataset": "eva_k"
420
+ }
de/de_DE/eva_k/x_low/samples/speaker_0.mp3 ADDED
Binary file (73.6 kB). View file
 
de/de_DE/karlsson/low/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ de-karlsson-low
de/de_DE/karlsson/low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for karlsson (low)
2
+
3
+ * Language: de_DE (German, Germany)
4
+ * Speakers: 1
5
+ * Quality: low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://www.caito.de/2019/01/03/the-m-ailabs-speech-dataset/
11
+ * License: See URL
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English Ryan voice (low quality).
de/de_DE/karlsson/low/de_DE-karlsson-low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9793bf7e461a472b3916cf260774bfc9812e9eb72601b147ed649d01064e8fe
3
+ size 63104526
de/de_DE/karlsson/low/de_DE-karlsson-low.onnx.json ADDED
@@ -0,0 +1,420 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 16000,
4
+ "quality": "low"
5
+ },
6
+ "espeak": {
7
+ "voice": "de"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_map": {},
15
+ "phoneme_id_map": {
16
+ "_": [
17
+ 0
18
+ ],
19
+ "^": [
20
+ 1
21
+ ],
22
+ "$": [
23
+ 2
24
+ ],
25
+ " ": [
26
+ 3
27
+ ],
28
+ "!": [
29
+ 4
30
+ ],
31
+ "'": [
32
+ 5
33
+ ],
34
+ "(": [
35
+ 6
36
+ ],
37
+ ")": [
38
+ 7
39
+ ],
40
+ ",": [
41
+ 8
42
+ ],
43
+ "-": [
44
+ 9
45
+ ],
46
+ ".": [
47
+ 10
48
+ ],
49
+ ":": [
50
+ 11
51
+ ],
52
+ ";": [
53
+ 12
54
+ ],
55
+ "?": [
56
+ 13
57
+ ],
58
+ "a": [
59
+ 14
60
+ ],
61
+ "b": [
62
+ 15
63
+ ],
64
+ "c": [
65
+ 16
66
+ ],
67
+ "d": [
68
+ 17
69
+ ],
70
+ "e": [
71
+ 18
72
+ ],
73
+ "f": [
74
+ 19
75
+ ],
76
+ "h": [
77
+ 20
78
+ ],
79
+ "i": [
80
+ 21
81
+ ],
82
+ "j": [
83
+ 22
84
+ ],
85
+ "k": [
86
+ 23
87
+ ],
88
+ "l": [
89
+ 24
90
+ ],
91
+ "m": [
92
+ 25
93
+ ],
94
+ "n": [
95
+ 26
96
+ ],
97
+ "o": [
98
+ 27
99
+ ],
100
+ "p": [
101
+ 28
102
+ ],
103
+ "q": [
104
+ 29
105
+ ],
106
+ "r": [
107
+ 30
108
+ ],
109
+ "s": [
110
+ 31
111
+ ],
112
+ "t": [
113
+ 32
114
+ ],
115
+ "u": [
116
+ 33
117
+ ],
118
+ "v": [
119
+ 34
120
+ ],
121
+ "w": [
122
+ 35
123
+ ],
124
+ "x": [
125
+ 36
126
+ ],
127
+ "y": [
128
+ 37
129
+ ],
130
+ "z": [
131
+ 38
132
+ ],
133
+ "æ": [
134
+ 39
135
+ ],
136
+ "ç": [
137
+ 40
138
+ ],
139
+ "ð": [
140
+ 41
141
+ ],
142
+ "ø": [
143
+ 42
144
+ ],
145
+ "ħ": [
146
+ 43
147
+ ],
148
+ "ŋ": [
149
+ 44
150
+ ],
151
+ "œ": [
152
+ 45
153
+ ],
154
+ "ǀ": [
155
+ 46
156
+ ],
157
+ "ǁ": [
158
+ 47
159
+ ],
160
+ "ǂ": [
161
+ 48
162
+ ],
163
+ "ǃ": [
164
+ 49
165
+ ],
166
+ "ɐ": [
167
+ 50
168
+ ],
169
+ "ɑ": [
170
+ 51
171
+ ],
172
+ "ɒ": [
173
+ 52
174
+ ],
175
+ "ɓ": [
176
+ 53
177
+ ],
178
+ "ɔ": [
179
+ 54
180
+ ],
181
+ "ɕ": [
182
+ 55
183
+ ],
184
+ "ɖ": [
185
+ 56
186
+ ],
187
+ "ɗ": [
188
+ 57
189
+ ],
190
+ "ɘ": [
191
+ 58
192
+ ],
193
+ "ə": [
194
+ 59
195
+ ],
196
+ "ɚ": [
197
+ 60
198
+ ],
199
+ "ɛ": [
200
+ 61
201
+ ],
202
+ "ɜ": [
203
+ 62
204
+ ],
205
+ "ɞ": [
206
+ 63
207
+ ],
208
+ "ɟ": [
209
+ 64
210
+ ],
211
+ "ɠ": [
212
+ 65
213
+ ],
214
+ "ɡ": [
215
+ 66
216
+ ],
217
+ "ɢ": [
218
+ 67
219
+ ],
220
+ "ɣ": [
221
+ 68
222
+ ],
223
+ "ɤ": [
224
+ 69
225
+ ],
226
+ "ɥ": [
227
+ 70
228
+ ],
229
+ "ɦ": [
230
+ 71
231
+ ],
232
+ "ɧ": [
233
+ 72
234
+ ],
235
+ "ɨ": [
236
+ 73
237
+ ],
238
+ "ɪ": [
239
+ 74
240
+ ],
241
+ "ɫ": [
242
+ 75
243
+ ],
244
+ "ɬ": [
245
+ 76
246
+ ],
247
+ "ɭ": [
248
+ 77
249
+ ],
250
+ "ɮ": [
251
+ 78
252
+ ],
253
+ "ɯ": [
254
+ 79
255
+ ],
256
+ "ɰ": [
257
+ 80
258
+ ],
259
+ "ɱ": [
260
+ 81
261
+ ],
262
+ "ɲ": [
263
+ 82
264
+ ],
265
+ "ɳ": [
266
+ 83
267
+ ],
268
+ "ɴ": [
269
+ 84
270
+ ],
271
+ "ɵ": [
272
+ 85
273
+ ],
274
+ "ɶ": [
275
+ 86
276
+ ],
277
+ "ɸ": [
278
+ 87
279
+ ],
280
+ "ɹ": [
281
+ 88
282
+ ],
283
+ "ɺ": [
284
+ 89
285
+ ],
286
+ "ɻ": [
287
+ 90
288
+ ],
289
+ "ɽ": [
290
+ 91
291
+ ],
292
+ "ɾ": [
293
+ 92
294
+ ],
295
+ "ʀ": [
296
+ 93
297
+ ],
298
+ "ʁ": [
299
+ 94
300
+ ],
301
+ "ʂ": [
302
+ 95
303
+ ],
304
+ "ʃ": [
305
+ 96
306
+ ],
307
+ "ʄ": [
308
+ 97
309
+ ],
310
+ "ʈ": [
311
+ 98
312
+ ],
313
+ "ʉ": [
314
+ 99
315
+ ],
316
+ "ʊ": [
317
+ 100
318
+ ],
319
+ "ʋ": [
320
+ 101
321
+ ],
322
+ "ʌ": [
323
+ 102
324
+ ],
325
+ "ʍ": [
326
+ 103
327
+ ],
328
+ "ʎ": [
329
+ 104
330
+ ],
331
+ "ʏ": [
332
+ 105
333
+ ],
334
+ "ʐ": [
335
+ 106
336
+ ],
337
+ "ʑ": [
338
+ 107
339
+ ],
340
+ "ʒ": [
341
+ 108
342
+ ],
343
+ "ʔ": [
344
+ 109
345
+ ],
346
+ "ʕ": [
347
+ 110
348
+ ],
349
+ "ʘ": [
350
+ 111
351
+ ],
352
+ "ʙ": [
353
+ 112
354
+ ],
355
+ "ʛ": [
356
+ 113
357
+ ],
358
+ "ʜ": [
359
+ 114
360
+ ],
361
+ "ʝ": [
362
+ 115
363
+ ],
364
+ "ʟ": [
365
+ 116
366
+ ],
367
+ "ʡ": [
368
+ 117
369
+ ],
370
+ "ʢ": [
371
+ 118
372
+ ],
373
+ "ʲ": [
374
+ 119
375
+ ],
376
+ "ˈ": [
377
+ 120
378
+ ],
379
+ "ˌ": [
380
+ 121
381
+ ],
382
+ "ː": [
383
+ 122
384
+ ],
385
+ "ˑ": [
386
+ 123
387
+ ],
388
+ "˞": [
389
+ 124
390
+ ],
391
+ "β": [
392
+ 125
393
+ ],
394
+ "θ": [
395
+ 126
396
+ ],
397
+ "χ": [
398
+ 127
399
+ ],
400
+ "ᵻ": [
401
+ 128
402
+ ],
403
+ "ⱱ": [
404
+ 129
405
+ ]
406
+ },
407
+ "num_symbols": 130,
408
+ "num_speakers": 1,
409
+ "speaker_id_map": {},
410
+ "piper_version": "0.2.0",
411
+ "language": {
412
+ "code": "de_DE",
413
+ "family": "de",
414
+ "region": "DE",
415
+ "name_native": "Deutsch",
416
+ "name_english": "German",
417
+ "country_english": "Germany"
418
+ },
419
+ "dataset": "karlsson"
420
+ }
de/de_DE/karlsson/low/samples/speaker_0.mp3 ADDED
Binary file (68.2 kB). View file
 
de/de_DE/kerstin/low/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ de-kerstin-low
de/de_DE/kerstin/low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for kerstin (low)
2
+
3
+ * Language: de_DE (German, Germany)
4
+ * Speakers: 1
5
+ * Quality: low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/rhasspy/dataset-voice-kerstin
11
+ * License: CC0
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English Ryan voice (low quality).
de/de_DE/kerstin/low/de_DE-kerstin-low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d352a7641892cebf2903859af94e9ba81a141110215fe3943bcda7f7da401b7a
3
+ size 63104526
de/de_DE/kerstin/low/de_DE-kerstin-low.onnx.json ADDED
@@ -0,0 +1,420 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 16000,
4
+ "quality": "low"
5
+ },
6
+ "espeak": {
7
+ "voice": "de"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_map": {},
15
+ "phoneme_id_map": {
16
+ "_": [
17
+ 0
18
+ ],
19
+ "^": [
20
+ 1
21
+ ],
22
+ "$": [
23
+ 2
24
+ ],
25
+ " ": [
26
+ 3
27
+ ],
28
+ "!": [
29
+ 4
30
+ ],
31
+ "'": [
32
+ 5
33
+ ],
34
+ "(": [
35
+ 6
36
+ ],
37
+ ")": [
38
+ 7
39
+ ],
40
+ ",": [
41
+ 8
42
+ ],
43
+ "-": [
44
+ 9
45
+ ],
46
+ ".": [
47
+ 10
48
+ ],
49
+ ":": [
50
+ 11
51
+ ],
52
+ ";": [
53
+ 12
54
+ ],
55
+ "?": [
56
+ 13
57
+ ],
58
+ "a": [
59
+ 14
60
+ ],
61
+ "b": [
62
+ 15
63
+ ],
64
+ "c": [
65
+ 16
66
+ ],
67
+ "d": [
68
+ 17
69
+ ],
70
+ "e": [
71
+ 18
72
+ ],
73
+ "f": [
74
+ 19
75
+ ],
76
+ "h": [
77
+ 20
78
+ ],
79
+ "i": [
80
+ 21
81
+ ],
82
+ "j": [
83
+ 22
84
+ ],
85
+ "k": [
86
+ 23
87
+ ],
88
+ "l": [
89
+ 24
90
+ ],
91
+ "m": [
92
+ 25
93
+ ],
94
+ "n": [
95
+ 26
96
+ ],
97
+ "o": [
98
+ 27
99
+ ],
100
+ "p": [
101
+ 28
102
+ ],
103
+ "q": [
104
+ 29
105
+ ],
106
+ "r": [
107
+ 30
108
+ ],
109
+ "s": [
110
+ 31
111
+ ],
112
+ "t": [
113
+ 32
114
+ ],
115
+ "u": [
116
+ 33
117
+ ],
118
+ "v": [
119
+ 34
120
+ ],
121
+ "w": [
122
+ 35
123
+ ],
124
+ "x": [
125
+ 36
126
+ ],
127
+ "y": [
128
+ 37
129
+ ],
130
+ "z": [
131
+ 38
132
+ ],
133
+ "æ": [
134
+ 39
135
+ ],
136
+ "ç": [
137
+ 40
138
+ ],
139
+ "ð": [
140
+ 41
141
+ ],
142
+ "ø": [
143
+ 42
144
+ ],
145
+ "ħ": [
146
+ 43
147
+ ],
148
+ "ŋ": [
149
+ 44
150
+ ],
151
+ "œ": [
152
+ 45
153
+ ],
154
+ "ǀ": [
155
+ 46
156
+ ],
157
+ "ǁ": [
158
+ 47
159
+ ],
160
+ "ǂ": [
161
+ 48
162
+ ],
163
+ "ǃ": [
164
+ 49
165
+ ],
166
+ "ɐ": [
167
+ 50
168
+ ],
169
+ "ɑ": [
170
+ 51
171
+ ],
172
+ "ɒ": [
173
+ 52
174
+ ],
175
+ "ɓ": [
176
+ 53
177
+ ],
178
+ "ɔ": [
179
+ 54
180
+ ],
181
+ "ɕ": [
182
+ 55
183
+ ],
184
+ "ɖ": [
185
+ 56
186
+ ],
187
+ "ɗ": [
188
+ 57
189
+ ],
190
+ "ɘ": [
191
+ 58
192
+ ],
193
+ "ə": [
194
+ 59
195
+ ],
196
+ "ɚ": [
197
+ 60
198
+ ],
199
+ "ɛ": [
200
+ 61
201
+ ],
202
+ "ɜ": [
203
+ 62
204
+ ],
205
+ "ɞ": [
206
+ 63
207
+ ],
208
+ "ɟ": [
209
+ 64
210
+ ],
211
+ "ɠ": [
212
+ 65
213
+ ],
214
+ "ɡ": [
215
+ 66
216
+ ],
217
+ "ɢ": [
218
+ 67
219
+ ],
220
+ "ɣ": [
221
+ 68
222
+ ],
223
+ "ɤ": [
224
+ 69
225
+ ],
226
+ "ɥ": [
227
+ 70
228
+ ],
229
+ "ɦ": [
230
+ 71
231
+ ],
232
+ "ɧ": [
233
+ 72
234
+ ],
235
+ "ɨ": [
236
+ 73
237
+ ],
238
+ "ɪ": [
239
+ 74
240
+ ],
241
+ "ɫ": [
242
+ 75
243
+ ],
244
+ "ɬ": [
245
+ 76
246
+ ],
247
+ "ɭ": [
248
+ 77
249
+ ],
250
+ "ɮ": [
251
+ 78
252
+ ],
253
+ "ɯ": [
254
+ 79
255
+ ],
256
+ "ɰ": [
257
+ 80
258
+ ],
259
+ "ɱ": [
260
+ 81
261
+ ],
262
+ "ɲ": [
263
+ 82
264
+ ],
265
+ "ɳ": [
266
+ 83
267
+ ],
268
+ "ɴ": [
269
+ 84
270
+ ],
271
+ "ɵ": [
272
+ 85
273
+ ],
274
+ "ɶ": [
275
+ 86
276
+ ],
277
+ "ɸ": [
278
+ 87
279
+ ],
280
+ "ɹ": [
281
+ 88
282
+ ],
283
+ "ɺ": [
284
+ 89
285
+ ],
286
+ "ɻ": [
287
+ 90
288
+ ],
289
+ "ɽ": [
290
+ 91
291
+ ],
292
+ "ɾ": [
293
+ 92
294
+ ],
295
+ "ʀ": [
296
+ 93
297
+ ],
298
+ "ʁ": [
299
+ 94
300
+ ],
301
+ "ʂ": [
302
+ 95
303
+ ],
304
+ "ʃ": [
305
+ 96
306
+ ],
307
+ "ʄ": [
308
+ 97
309
+ ],
310
+ "ʈ": [
311
+ 98
312
+ ],
313
+ "ʉ": [
314
+ 99
315
+ ],
316
+ "ʊ": [
317
+ 100
318
+ ],
319
+ "ʋ": [
320
+ 101
321
+ ],
322
+ "ʌ": [
323
+ 102
324
+ ],
325
+ "ʍ": [
326
+ 103
327
+ ],
328
+ "ʎ": [
329
+ 104
330
+ ],
331
+ "ʏ": [
332
+ 105
333
+ ],
334
+ "ʐ": [
335
+ 106
336
+ ],
337
+ "ʑ": [
338
+ 107
339
+ ],
340
+ "ʒ": [
341
+ 108
342
+ ],
343
+ "ʔ": [
344
+ 109
345
+ ],
346
+ "ʕ": [
347
+ 110
348
+ ],
349
+ "ʘ": [
350
+ 111
351
+ ],
352
+ "ʙ": [
353
+ 112
354
+ ],
355
+ "ʛ": [
356
+ 113
357
+ ],
358
+ "ʜ": [
359
+ 114
360
+ ],
361
+ "ʝ": [
362
+ 115
363
+ ],
364
+ "ʟ": [
365
+ 116
366
+ ],
367
+ "ʡ": [
368
+ 117
369
+ ],
370
+ "ʢ": [
371
+ 118
372
+ ],
373
+ "ʲ": [
374
+ 119
375
+ ],
376
+ "ˈ": [
377
+ 120
378
+ ],
379
+ "ˌ": [
380
+ 121
381
+ ],
382
+ "ː": [
383
+ 122
384
+ ],
385
+ "ˑ": [
386
+ 123
387
+ ],
388
+ "˞": [
389
+ 124
390
+ ],
391
+ "β": [
392
+ 125
393
+ ],
394
+ "θ": [
395
+ 126
396
+ ],
397
+ "χ": [
398
+ 127
399
+ ],
400
+ "ᵻ": [
401
+ 128
402
+ ],
403
+ "ⱱ": [
404
+ 129
405
+ ]
406
+ },
407
+ "num_symbols": 130,
408
+ "num_speakers": 1,
409
+ "speaker_id_map": {},
410
+ "piper_version": "0.2.0",
411
+ "language": {
412
+ "code": "de_DE",
413
+ "family": "de",
414
+ "region": "DE",
415
+ "name_native": "Deutsch",
416
+ "name_english": "German",
417
+ "country_english": "Germany"
418
+ },
419
+ "dataset": "kerstin"
420
+ }
de/de_DE/kerstin/low/samples/speaker_0.mp3 ADDED
Binary file (75.3 kB). View file