mychen76 commited on
Commit
06c56bb
1 Parent(s): 87fa777
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. ru/ru_RU/denis/medium/MODEL_CARD +15 -0
  2. ru/ru_RU/denis/medium/ru_RU-denis-medium.onnx +3 -0
  3. ru/ru_RU/denis/medium/ru_RU-denis-medium.onnx.json +487 -0
  4. ru/ru_RU/denis/medium/samples/speaker_0.mp3 +0 -0
  5. ru/ru_RU/dmitri/medium/MODEL_CARD +15 -0
  6. ru/ru_RU/dmitri/medium/ru_RU-dmitri-medium.onnx +3 -0
  7. ru/ru_RU/dmitri/medium/ru_RU-dmitri-medium.onnx.json +487 -0
  8. ru/ru_RU/dmitri/medium/samples/speaker_0.mp3 +0 -0
  9. ru/ru_RU/irina/medium/ALIASES +1 -0
  10. ru/ru_RU/irina/medium/MODEL_CARD +15 -0
  11. ru/ru_RU/irina/medium/ru_RU-irina-medium.onnx +3 -0
  12. ru/ru_RU/irina/medium/ru_RU-irina-medium.onnx.json +483 -0
  13. ru/ru_RU/irina/medium/samples/speaker_0.mp3 +0 -0
  14. ru/ru_RU/ruslan/medium/MODEL_CARD +15 -0
  15. ru/ru_RU/ruslan/medium/ru_RU-ruslan-medium.onnx +3 -0
  16. ru/ru_RU/ruslan/medium/ru_RU-ruslan-medium.onnx.json +493 -0
  17. ru/ru_RU/ruslan/medium/samples/speaker_0.mp3 +0 -0
  18. sk/sk_SK/lili/medium/MODEL_CARD +15 -0
  19. sk/sk_SK/lili/medium/samples/speaker_0.mp3 +0 -0
  20. sk/sk_SK/lili/medium/sk_SK-lili-medium.onnx +3 -0
  21. sk/sk_SK/lili/medium/sk_SK-lili-medium.onnx.json +502 -0
  22. sr/sr_RS/serbski_institut/medium/MODEL_CARD +15 -0
  23. sr/sr_RS/serbski_institut/medium/samples/speaker_0.mp3 +0 -0
  24. sr/sr_RS/serbski_institut/medium/samples/speaker_1.mp3 +0 -0
  25. sr/sr_RS/serbski_institut/medium/sr_RS-serbski_institut-medium.onnx +3 -0
  26. sr/sr_RS/serbski_institut/medium/sr_RS-serbski_institut-medium.onnx.json +505 -0
  27. sv/sv_SE/nst/medium/MODEL_CARD +15 -0
  28. sv/sv_SE/nst/medium/samples/speaker_0.mp3 +0 -0
  29. sv/sv_SE/nst/medium/sv_SE-nst-medium.onnx +3 -0
  30. sv/sv_SE/nst/medium/sv_SE-nst-medium.onnx.json +420 -0
  31. sw/sw_CD/lanfrica/medium/MODEL_CARD +15 -0
  32. sw/sw_CD/lanfrica/medium/samples/speaker_0.mp3 +0 -0
  33. sw/sw_CD/lanfrica/medium/sw_CD-lanfrica-medium.onnx +3 -0
  34. sw/sw_CD/lanfrica/medium/sw_CD-lanfrica-medium.onnx.json +493 -0
  35. tr/tr_TR/dfki/medium/MODEL_CARD +15 -0
  36. tr/tr_TR/dfki/medium/samples/speaker_0.mp3 +0 -0
  37. tr/tr_TR/dfki/medium/tr_TR-dfki-medium.onnx +3 -0
  38. tr/tr_TR/dfki/medium/tr_TR-dfki-medium.onnx.json +498 -0
  39. tr/tr_TR/fahrettin/medium/MODEL_CARD +15 -0
  40. tr/tr_TR/fahrettin/medium/samples/speaker_0.mp3 +0 -0
  41. tr/tr_TR/fahrettin/medium/tr_TR-fahrettin-medium.onnx +3 -0
  42. tr/tr_TR/fahrettin/medium/tr_TR-fahrettin-medium.onnx.json +508 -0
  43. uk/uk_UA/lada/x_low/ALIASES +1 -0
  44. uk/uk_UA/lada/x_low/MODEL_CARD +15 -0
  45. uk/uk_UA/lada/x_low/samples/speaker_0.mp3 +0 -0
  46. uk/uk_UA/lada/x_low/uk_UA-lada-x_low.onnx +3 -0
  47. uk/uk_UA/lada/x_low/uk_UA-lada-x_low.onnx.json +420 -0
  48. uk/uk_UA/ukrainian_tts/medium/MODEL_CARD +16 -0
  49. uk/uk_UA/ukrainian_tts/medium/samples/speaker_0.mp3 +0 -0
  50. uk/uk_UA/ukrainian_tts/medium/samples/speaker_1.mp3 +0 -0
ru/ru_RU/denis/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for denis (medium)
2
+
3
+ * Language: ru_RU (Russian, Russia)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/NabuCasa/voice-datasets
11
+ * License: CC0
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
ru/ru_RU/denis/medium/ru_RU-denis-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15fab56e11a097858ee115545d0f697fc2a316c41a291a5362349fb870411b0a
3
+ size 63201294
ru/ru_RU/denis/medium/ru_RU-denis-medium.onnx.json ADDED
@@ -0,0 +1,487 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "ru"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ "_": [
18
+ 0
19
+ ],
20
+ "^": [
21
+ 1
22
+ ],
23
+ "$": [
24
+ 2
25
+ ],
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ ":": [
51
+ 11
52
+ ],
53
+ ";": [
54
+ 12
55
+ ],
56
+ "?": [
57
+ 13
58
+ ],
59
+ "a": [
60
+ 14
61
+ ],
62
+ "b": [
63
+ 15
64
+ ],
65
+ "c": [
66
+ 16
67
+ ],
68
+ "d": [
69
+ 17
70
+ ],
71
+ "e": [
72
+ 18
73
+ ],
74
+ "f": [
75
+ 19
76
+ ],
77
+ "h": [
78
+ 20
79
+ ],
80
+ "i": [
81
+ 21
82
+ ],
83
+ "j": [
84
+ 22
85
+ ],
86
+ "k": [
87
+ 23
88
+ ],
89
+ "l": [
90
+ 24
91
+ ],
92
+ "m": [
93
+ 25
94
+ ],
95
+ "n": [
96
+ 26
97
+ ],
98
+ "o": [
99
+ 27
100
+ ],
101
+ "p": [
102
+ 28
103
+ ],
104
+ "q": [
105
+ 29
106
+ ],
107
+ "r": [
108
+ 30
109
+ ],
110
+ "s": [
111
+ 31
112
+ ],
113
+ "t": [
114
+ 32
115
+ ],
116
+ "u": [
117
+ 33
118
+ ],
119
+ "v": [
120
+ 34
121
+ ],
122
+ "w": [
123
+ 35
124
+ ],
125
+ "x": [
126
+ 36
127
+ ],
128
+ "y": [
129
+ 37
130
+ ],
131
+ "z": [
132
+ 38
133
+ ],
134
+ "æ": [
135
+ 39
136
+ ],
137
+ "ç": [
138
+ 40
139
+ ],
140
+ "ð": [
141
+ 41
142
+ ],
143
+ "ø": [
144
+ 42
145
+ ],
146
+ "ħ": [
147
+ 43
148
+ ],
149
+ "ŋ": [
150
+ 44
151
+ ],
152
+ "œ": [
153
+ 45
154
+ ],
155
+ "ǀ": [
156
+ 46
157
+ ],
158
+ "ǁ": [
159
+ 47
160
+ ],
161
+ "ǂ": [
162
+ 48
163
+ ],
164
+ "ǃ": [
165
+ 49
166
+ ],
167
+ "ɐ": [
168
+ 50
169
+ ],
170
+ "ɑ": [
171
+ 51
172
+ ],
173
+ "ɒ": [
174
+ 52
175
+ ],
176
+ "ɓ": [
177
+ 53
178
+ ],
179
+ "ɔ": [
180
+ 54
181
+ ],
182
+ "ɕ": [
183
+ 55
184
+ ],
185
+ "ɖ": [
186
+ 56
187
+ ],
188
+ "ɗ": [
189
+ 57
190
+ ],
191
+ "ɘ": [
192
+ 58
193
+ ],
194
+ "ə": [
195
+ 59
196
+ ],
197
+ "ɚ": [
198
+ 60
199
+ ],
200
+ "ɛ": [
201
+ 61
202
+ ],
203
+ "ɜ": [
204
+ 62
205
+ ],
206
+ "ɞ": [
207
+ 63
208
+ ],
209
+ "ɟ": [
210
+ 64
211
+ ],
212
+ "ɠ": [
213
+ 65
214
+ ],
215
+ "ɡ": [
216
+ 66
217
+ ],
218
+ "ɢ": [
219
+ 67
220
+ ],
221
+ "ɣ": [
222
+ 68
223
+ ],
224
+ "ɤ": [
225
+ 69
226
+ ],
227
+ "ɥ": [
228
+ 70
229
+ ],
230
+ "ɦ": [
231
+ 71
232
+ ],
233
+ "ɧ": [
234
+ 72
235
+ ],
236
+ "ɨ": [
237
+ 73
238
+ ],
239
+ "ɪ": [
240
+ 74
241
+ ],
242
+ "ɫ": [
243
+ 75
244
+ ],
245
+ "ɬ": [
246
+ 76
247
+ ],
248
+ "ɭ": [
249
+ 77
250
+ ],
251
+ "ɮ": [
252
+ 78
253
+ ],
254
+ "ɯ": [
255
+ 79
256
+ ],
257
+ "ɰ": [
258
+ 80
259
+ ],
260
+ "ɱ": [
261
+ 81
262
+ ],
263
+ "ɲ": [
264
+ 82
265
+ ],
266
+ "ɳ": [
267
+ 83
268
+ ],
269
+ "ɴ": [
270
+ 84
271
+ ],
272
+ "ɵ": [
273
+ 85
274
+ ],
275
+ "ɶ": [
276
+ 86
277
+ ],
278
+ "ɸ": [
279
+ 87
280
+ ],
281
+ "ɹ": [
282
+ 88
283
+ ],
284
+ "ɺ": [
285
+ 89
286
+ ],
287
+ "ɻ": [
288
+ 90
289
+ ],
290
+ "ɽ": [
291
+ 91
292
+ ],
293
+ "ɾ": [
294
+ 92
295
+ ],
296
+ "ʀ": [
297
+ 93
298
+ ],
299
+ "ʁ": [
300
+ 94
301
+ ],
302
+ "ʂ": [
303
+ 95
304
+ ],
305
+ "ʃ": [
306
+ 96
307
+ ],
308
+ "ʄ": [
309
+ 97
310
+ ],
311
+ "ʈ": [
312
+ 98
313
+ ],
314
+ "ʉ": [
315
+ 99
316
+ ],
317
+ "ʊ": [
318
+ 100
319
+ ],
320
+ "ʋ": [
321
+ 101
322
+ ],
323
+ "ʌ": [
324
+ 102
325
+ ],
326
+ "ʍ": [
327
+ 103
328
+ ],
329
+ "ʎ": [
330
+ 104
331
+ ],
332
+ "ʏ": [
333
+ 105
334
+ ],
335
+ "ʐ": [
336
+ 106
337
+ ],
338
+ "ʑ": [
339
+ 107
340
+ ],
341
+ "ʒ": [
342
+ 108
343
+ ],
344
+ "ʔ": [
345
+ 109
346
+ ],
347
+ "ʕ": [
348
+ 110
349
+ ],
350
+ "ʘ": [
351
+ 111
352
+ ],
353
+ "ʙ": [
354
+ 112
355
+ ],
356
+ "ʛ": [
357
+ 113
358
+ ],
359
+ "ʜ": [
360
+ 114
361
+ ],
362
+ "ʝ": [
363
+ 115
364
+ ],
365
+ "ʟ": [
366
+ 116
367
+ ],
368
+ "ʡ": [
369
+ 117
370
+ ],
371
+ "ʢ": [
372
+ 118
373
+ ],
374
+ "ʲ": [
375
+ 119
376
+ ],
377
+ "ˈ": [
378
+ 120
379
+ ],
380
+ "ˌ": [
381
+ 121
382
+ ],
383
+ "ː": [
384
+ 122
385
+ ],
386
+ "ˑ": [
387
+ 123
388
+ ],
389
+ "˞": [
390
+ 124
391
+ ],
392
+ "β": [
393
+ 125
394
+ ],
395
+ "θ": [
396
+ 126
397
+ ],
398
+ "χ": [
399
+ 127
400
+ ],
401
+ "ᵻ": [
402
+ 128
403
+ ],
404
+ "ⱱ": [
405
+ 129
406
+ ],
407
+ "0": [
408
+ 130
409
+ ],
410
+ "1": [
411
+ 131
412
+ ],
413
+ "2": [
414
+ 132
415
+ ],
416
+ "3": [
417
+ 133
418
+ ],
419
+ "4": [
420
+ 134
421
+ ],
422
+ "5": [
423
+ 135
424
+ ],
425
+ "6": [
426
+ 136
427
+ ],
428
+ "7": [
429
+ 137
430
+ ],
431
+ "8": [
432
+ 138
433
+ ],
434
+ "9": [
435
+ 139
436
+ ],
437
+ "̧": [
438
+ 140
439
+ ],
440
+ "̃": [
441
+ 141
442
+ ],
443
+ "̪": [
444
+ 142
445
+ ],
446
+ "̯": [
447
+ 143
448
+ ],
449
+ "̩": [
450
+ 144
451
+ ],
452
+ "ʰ": [
453
+ 145
454
+ ],
455
+ "ˤ": [
456
+ 146
457
+ ],
458
+ "ε": [
459
+ 147
460
+ ],
461
+ "↓": [
462
+ 148
463
+ ],
464
+ "#": [
465
+ 149
466
+ ],
467
+ "\"": [
468
+ 150
469
+ ],
470
+ "↑": [
471
+ 151
472
+ ]
473
+ },
474
+ "num_symbols": 256,
475
+ "num_speakers": 1,
476
+ "speaker_id_map": {},
477
+ "piper_version": "1.0.0",
478
+ "language": {
479
+ "code": "ru_RU",
480
+ "family": "ru",
481
+ "region": "RU",
482
+ "name_native": "Русский",
483
+ "name_english": "Russian",
484
+ "country_english": "Russia"
485
+ },
486
+ "dataset": "denis"
487
+ }
ru/ru_RU/denis/medium/samples/speaker_0.mp3 ADDED
Binary file (73.6 kB). View file
 
ru/ru_RU/dmitri/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for dmitri (medium)
2
+
3
+ * Language: ru_RU (Russian, Russia)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/NabuCasa/voice-datasets
11
+ * License: CC0
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
ru/ru_RU/dmitri/medium/ru_RU-dmitri-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f073356ebc4bd0f80c5af58df2953a5988bd5bdab1eb38635ce960b071fbefcb
3
+ size 63201294
ru/ru_RU/dmitri/medium/ru_RU-dmitri-medium.onnx.json ADDED
@@ -0,0 +1,487 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "ru"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ "_": [
18
+ 0
19
+ ],
20
+ "^": [
21
+ 1
22
+ ],
23
+ "$": [
24
+ 2
25
+ ],
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ ":": [
51
+ 11
52
+ ],
53
+ ";": [
54
+ 12
55
+ ],
56
+ "?": [
57
+ 13
58
+ ],
59
+ "a": [
60
+ 14
61
+ ],
62
+ "b": [
63
+ 15
64
+ ],
65
+ "c": [
66
+ 16
67
+ ],
68
+ "d": [
69
+ 17
70
+ ],
71
+ "e": [
72
+ 18
73
+ ],
74
+ "f": [
75
+ 19
76
+ ],
77
+ "h": [
78
+ 20
79
+ ],
80
+ "i": [
81
+ 21
82
+ ],
83
+ "j": [
84
+ 22
85
+ ],
86
+ "k": [
87
+ 23
88
+ ],
89
+ "l": [
90
+ 24
91
+ ],
92
+ "m": [
93
+ 25
94
+ ],
95
+ "n": [
96
+ 26
97
+ ],
98
+ "o": [
99
+ 27
100
+ ],
101
+ "p": [
102
+ 28
103
+ ],
104
+ "q": [
105
+ 29
106
+ ],
107
+ "r": [
108
+ 30
109
+ ],
110
+ "s": [
111
+ 31
112
+ ],
113
+ "t": [
114
+ 32
115
+ ],
116
+ "u": [
117
+ 33
118
+ ],
119
+ "v": [
120
+ 34
121
+ ],
122
+ "w": [
123
+ 35
124
+ ],
125
+ "x": [
126
+ 36
127
+ ],
128
+ "y": [
129
+ 37
130
+ ],
131
+ "z": [
132
+ 38
133
+ ],
134
+ "æ": [
135
+ 39
136
+ ],
137
+ "ç": [
138
+ 40
139
+ ],
140
+ "ð": [
141
+ 41
142
+ ],
143
+ "ø": [
144
+ 42
145
+ ],
146
+ "ħ": [
147
+ 43
148
+ ],
149
+ "ŋ": [
150
+ 44
151
+ ],
152
+ "œ": [
153
+ 45
154
+ ],
155
+ "ǀ": [
156
+ 46
157
+ ],
158
+ "ǁ": [
159
+ 47
160
+ ],
161
+ "ǂ": [
162
+ 48
163
+ ],
164
+ "ǃ": [
165
+ 49
166
+ ],
167
+ "ɐ": [
168
+ 50
169
+ ],
170
+ "ɑ": [
171
+ 51
172
+ ],
173
+ "ɒ": [
174
+ 52
175
+ ],
176
+ "ɓ": [
177
+ 53
178
+ ],
179
+ "ɔ": [
180
+ 54
181
+ ],
182
+ "ɕ": [
183
+ 55
184
+ ],
185
+ "ɖ": [
186
+ 56
187
+ ],
188
+ "ɗ": [
189
+ 57
190
+ ],
191
+ "ɘ": [
192
+ 58
193
+ ],
194
+ "ə": [
195
+ 59
196
+ ],
197
+ "ɚ": [
198
+ 60
199
+ ],
200
+ "ɛ": [
201
+ 61
202
+ ],
203
+ "ɜ": [
204
+ 62
205
+ ],
206
+ "ɞ": [
207
+ 63
208
+ ],
209
+ "ɟ": [
210
+ 64
211
+ ],
212
+ "ɠ": [
213
+ 65
214
+ ],
215
+ "ɡ": [
216
+ 66
217
+ ],
218
+ "ɢ": [
219
+ 67
220
+ ],
221
+ "ɣ": [
222
+ 68
223
+ ],
224
+ "ɤ": [
225
+ 69
226
+ ],
227
+ "ɥ": [
228
+ 70
229
+ ],
230
+ "ɦ": [
231
+ 71
232
+ ],
233
+ "ɧ": [
234
+ 72
235
+ ],
236
+ "ɨ": [
237
+ 73
238
+ ],
239
+ "ɪ": [
240
+ 74
241
+ ],
242
+ "ɫ": [
243
+ 75
244
+ ],
245
+ "ɬ": [
246
+ 76
247
+ ],
248
+ "ɭ": [
249
+ 77
250
+ ],
251
+ "ɮ": [
252
+ 78
253
+ ],
254
+ "ɯ": [
255
+ 79
256
+ ],
257
+ "ɰ": [
258
+ 80
259
+ ],
260
+ "ɱ": [
261
+ 81
262
+ ],
263
+ "ɲ": [
264
+ 82
265
+ ],
266
+ "ɳ": [
267
+ 83
268
+ ],
269
+ "ɴ": [
270
+ 84
271
+ ],
272
+ "ɵ": [
273
+ 85
274
+ ],
275
+ "ɶ": [
276
+ 86
277
+ ],
278
+ "ɸ": [
279
+ 87
280
+ ],
281
+ "ɹ": [
282
+ 88
283
+ ],
284
+ "ɺ": [
285
+ 89
286
+ ],
287
+ "ɻ": [
288
+ 90
289
+ ],
290
+ "ɽ": [
291
+ 91
292
+ ],
293
+ "ɾ": [
294
+ 92
295
+ ],
296
+ "ʀ": [
297
+ 93
298
+ ],
299
+ "ʁ": [
300
+ 94
301
+ ],
302
+ "ʂ": [
303
+ 95
304
+ ],
305
+ "ʃ": [
306
+ 96
307
+ ],
308
+ "ʄ": [
309
+ 97
310
+ ],
311
+ "ʈ": [
312
+ 98
313
+ ],
314
+ "ʉ": [
315
+ 99
316
+ ],
317
+ "ʊ": [
318
+ 100
319
+ ],
320
+ "ʋ": [
321
+ 101
322
+ ],
323
+ "ʌ": [
324
+ 102
325
+ ],
326
+ "ʍ": [
327
+ 103
328
+ ],
329
+ "ʎ": [
330
+ 104
331
+ ],
332
+ "ʏ": [
333
+ 105
334
+ ],
335
+ "ʐ": [
336
+ 106
337
+ ],
338
+ "ʑ": [
339
+ 107
340
+ ],
341
+ "ʒ": [
342
+ 108
343
+ ],
344
+ "ʔ": [
345
+ 109
346
+ ],
347
+ "ʕ": [
348
+ 110
349
+ ],
350
+ "ʘ": [
351
+ 111
352
+ ],
353
+ "ʙ": [
354
+ 112
355
+ ],
356
+ "ʛ": [
357
+ 113
358
+ ],
359
+ "ʜ": [
360
+ 114
361
+ ],
362
+ "ʝ": [
363
+ 115
364
+ ],
365
+ "ʟ": [
366
+ 116
367
+ ],
368
+ "ʡ": [
369
+ 117
370
+ ],
371
+ "ʢ": [
372
+ 118
373
+ ],
374
+ "ʲ": [
375
+ 119
376
+ ],
377
+ "ˈ": [
378
+ 120
379
+ ],
380
+ "ˌ": [
381
+ 121
382
+ ],
383
+ "ː": [
384
+ 122
385
+ ],
386
+ "ˑ": [
387
+ 123
388
+ ],
389
+ "˞": [
390
+ 124
391
+ ],
392
+ "β": [
393
+ 125
394
+ ],
395
+ "θ": [
396
+ 126
397
+ ],
398
+ "χ": [
399
+ 127
400
+ ],
401
+ "ᵻ": [
402
+ 128
403
+ ],
404
+ "ⱱ": [
405
+ 129
406
+ ],
407
+ "0": [
408
+ 130
409
+ ],
410
+ "1": [
411
+ 131
412
+ ],
413
+ "2": [
414
+ 132
415
+ ],
416
+ "3": [
417
+ 133
418
+ ],
419
+ "4": [
420
+ 134
421
+ ],
422
+ "5": [
423
+ 135
424
+ ],
425
+ "6": [
426
+ 136
427
+ ],
428
+ "7": [
429
+ 137
430
+ ],
431
+ "8": [
432
+ 138
433
+ ],
434
+ "9": [
435
+ 139
436
+ ],
437
+ "̧": [
438
+ 140
439
+ ],
440
+ "̃": [
441
+ 141
442
+ ],
443
+ "̪": [
444
+ 142
445
+ ],
446
+ "̯": [
447
+ 143
448
+ ],
449
+ "̩": [
450
+ 144
451
+ ],
452
+ "ʰ": [
453
+ 145
454
+ ],
455
+ "ˤ": [
456
+ 146
457
+ ],
458
+ "ε": [
459
+ 147
460
+ ],
461
+ "↓": [
462
+ 148
463
+ ],
464
+ "#": [
465
+ 149
466
+ ],
467
+ "\"": [
468
+ 150
469
+ ],
470
+ "↑": [
471
+ 151
472
+ ]
473
+ },
474
+ "num_symbols": 256,
475
+ "num_speakers": 1,
476
+ "speaker_id_map": {},
477
+ "piper_version": "1.0.0",
478
+ "language": {
479
+ "code": "ru_RU",
480
+ "family": "ru",
481
+ "region": "RU",
482
+ "name_native": "Русский",
483
+ "name_english": "Russian",
484
+ "country_english": "Russia"
485
+ },
486
+ "dataset": "dmitri"
487
+ }
ru/ru_RU/dmitri/medium/samples/speaker_0.mp3 ADDED
Binary file (68.5 kB). View file
 
ru/ru_RU/irina/medium/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ ru-irinia-medium
ru/ru_RU/irina/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for irina (medium)
2
+
3
+ * Language: ru_RU (Russian, Russia)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/RHVoice/RHVoice
11
+ * License: Unknown
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
ru/ru_RU/irina/medium/ru_RU-irina-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ff38212d23da300bbe3705c645e6e5b9475f0bfde01558eb17813e22acaaaaa
3
+ size 63201294
ru/ru_RU/irina/medium/ru_RU-irina-medium.onnx.json ADDED
@@ -0,0 +1,483 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "ru"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_map": {},
15
+ "phoneme_id_map": {
16
+ "_": [
17
+ 0
18
+ ],
19
+ "^": [
20
+ 1
21
+ ],
22
+ "$": [
23
+ 2
24
+ ],
25
+ " ": [
26
+ 3
27
+ ],
28
+ "!": [
29
+ 4
30
+ ],
31
+ "'": [
32
+ 5
33
+ ],
34
+ "(": [
35
+ 6
36
+ ],
37
+ ")": [
38
+ 7
39
+ ],
40
+ ",": [
41
+ 8
42
+ ],
43
+ "-": [
44
+ 9
45
+ ],
46
+ ".": [
47
+ 10
48
+ ],
49
+ ":": [
50
+ 11
51
+ ],
52
+ ";": [
53
+ 12
54
+ ],
55
+ "?": [
56
+ 13
57
+ ],
58
+ "a": [
59
+ 14
60
+ ],
61
+ "b": [
62
+ 15
63
+ ],
64
+ "c": [
65
+ 16
66
+ ],
67
+ "d": [
68
+ 17
69
+ ],
70
+ "e": [
71
+ 18
72
+ ],
73
+ "f": [
74
+ 19
75
+ ],
76
+ "h": [
77
+ 20
78
+ ],
79
+ "i": [
80
+ 21
81
+ ],
82
+ "j": [
83
+ 22
84
+ ],
85
+ "k": [
86
+ 23
87
+ ],
88
+ "l": [
89
+ 24
90
+ ],
91
+ "m": [
92
+ 25
93
+ ],
94
+ "n": [
95
+ 26
96
+ ],
97
+ "o": [
98
+ 27
99
+ ],
100
+ "p": [
101
+ 28
102
+ ],
103
+ "q": [
104
+ 29
105
+ ],
106
+ "r": [
107
+ 30
108
+ ],
109
+ "s": [
110
+ 31
111
+ ],
112
+ "t": [
113
+ 32
114
+ ],
115
+ "u": [
116
+ 33
117
+ ],
118
+ "v": [
119
+ 34
120
+ ],
121
+ "w": [
122
+ 35
123
+ ],
124
+ "x": [
125
+ 36
126
+ ],
127
+ "y": [
128
+ 37
129
+ ],
130
+ "z": [
131
+ 38
132
+ ],
133
+ "æ": [
134
+ 39
135
+ ],
136
+ "ç": [
137
+ 40
138
+ ],
139
+ "ð": [
140
+ 41
141
+ ],
142
+ "ø": [
143
+ 42
144
+ ],
145
+ "ħ": [
146
+ 43
147
+ ],
148
+ "ŋ": [
149
+ 44
150
+ ],
151
+ "œ": [
152
+ 45
153
+ ],
154
+ "ǀ": [
155
+ 46
156
+ ],
157
+ "ǁ": [
158
+ 47
159
+ ],
160
+ "ǂ": [
161
+ 48
162
+ ],
163
+ "ǃ": [
164
+ 49
165
+ ],
166
+ "ɐ": [
167
+ 50
168
+ ],
169
+ "ɑ": [
170
+ 51
171
+ ],
172
+ "ɒ": [
173
+ 52
174
+ ],
175
+ "ɓ": [
176
+ 53
177
+ ],
178
+ "ɔ": [
179
+ 54
180
+ ],
181
+ "ɕ": [
182
+ 55
183
+ ],
184
+ "ɖ": [
185
+ 56
186
+ ],
187
+ "ɗ": [
188
+ 57
189
+ ],
190
+ "ɘ": [
191
+ 58
192
+ ],
193
+ "ə": [
194
+ 59
195
+ ],
196
+ "ɚ": [
197
+ 60
198
+ ],
199
+ "ɛ": [
200
+ 61
201
+ ],
202
+ "ɜ": [
203
+ 62
204
+ ],
205
+ "ɞ": [
206
+ 63
207
+ ],
208
+ "ɟ": [
209
+ 64
210
+ ],
211
+ "ɠ": [
212
+ 65
213
+ ],
214
+ "ɡ": [
215
+ 66
216
+ ],
217
+ "ɢ": [
218
+ 67
219
+ ],
220
+ "ɣ": [
221
+ 68
222
+ ],
223
+ "ɤ": [
224
+ 69
225
+ ],
226
+ "ɥ": [
227
+ 70
228
+ ],
229
+ "ɦ": [
230
+ 71
231
+ ],
232
+ "ɧ": [
233
+ 72
234
+ ],
235
+ "ɨ": [
236
+ 73
237
+ ],
238
+ "ɪ": [
239
+ 74
240
+ ],
241
+ "ɫ": [
242
+ 75
243
+ ],
244
+ "ɬ": [
245
+ 76
246
+ ],
247
+ "ɭ": [
248
+ 77
249
+ ],
250
+ "ɮ": [
251
+ 78
252
+ ],
253
+ "ɯ": [
254
+ 79
255
+ ],
256
+ "ɰ": [
257
+ 80
258
+ ],
259
+ "ɱ": [
260
+ 81
261
+ ],
262
+ "ɲ": [
263
+ 82
264
+ ],
265
+ "ɳ": [
266
+ 83
267
+ ],
268
+ "ɴ": [
269
+ 84
270
+ ],
271
+ "ɵ": [
272
+ 85
273
+ ],
274
+ "ɶ": [
275
+ 86
276
+ ],
277
+ "ɸ": [
278
+ 87
279
+ ],
280
+ "ɹ": [
281
+ 88
282
+ ],
283
+ "ɺ": [
284
+ 89
285
+ ],
286
+ "ɻ": [
287
+ 90
288
+ ],
289
+ "ɽ": [
290
+ 91
291
+ ],
292
+ "ɾ": [
293
+ 92
294
+ ],
295
+ "ʀ": [
296
+ 93
297
+ ],
298
+ "ʁ": [
299
+ 94
300
+ ],
301
+ "ʂ": [
302
+ 95
303
+ ],
304
+ "ʃ": [
305
+ 96
306
+ ],
307
+ "ʄ": [
308
+ 97
309
+ ],
310
+ "ʈ": [
311
+ 98
312
+ ],
313
+ "ʉ": [
314
+ 99
315
+ ],
316
+ "ʊ": [
317
+ 100
318
+ ],
319
+ "ʋ": [
320
+ 101
321
+ ],
322
+ "ʌ": [
323
+ 102
324
+ ],
325
+ "ʍ": [
326
+ 103
327
+ ],
328
+ "ʎ": [
329
+ 104
330
+ ],
331
+ "ʏ": [
332
+ 105
333
+ ],
334
+ "ʐ": [
335
+ 106
336
+ ],
337
+ "ʑ": [
338
+ 107
339
+ ],
340
+ "ʒ": [
341
+ 108
342
+ ],
343
+ "ʔ": [
344
+ 109
345
+ ],
346
+ "ʕ": [
347
+ 110
348
+ ],
349
+ "ʘ": [
350
+ 111
351
+ ],
352
+ "ʙ": [
353
+ 112
354
+ ],
355
+ "ʛ": [
356
+ 113
357
+ ],
358
+ "ʜ": [
359
+ 114
360
+ ],
361
+ "ʝ": [
362
+ 115
363
+ ],
364
+ "ʟ": [
365
+ 116
366
+ ],
367
+ "ʡ": [
368
+ 117
369
+ ],
370
+ "ʢ": [
371
+ 118
372
+ ],
373
+ "ʲ": [
374
+ 119
375
+ ],
376
+ "ˈ": [
377
+ 120
378
+ ],
379
+ "ˌ": [
380
+ 121
381
+ ],
382
+ "ː": [
383
+ 122
384
+ ],
385
+ "ˑ": [
386
+ 123
387
+ ],
388
+ "˞": [
389
+ 124
390
+ ],
391
+ "β": [
392
+ 125
393
+ ],
394
+ "θ": [
395
+ 126
396
+ ],
397
+ "χ": [
398
+ 127
399
+ ],
400
+ "ᵻ": [
401
+ 128
402
+ ],
403
+ "ⱱ": [
404
+ 129
405
+ ],
406
+ "0": [
407
+ 130
408
+ ],
409
+ "1": [
410
+ 131
411
+ ],
412
+ "2": [
413
+ 132
414
+ ],
415
+ "3": [
416
+ 133
417
+ ],
418
+ "4": [
419
+ 134
420
+ ],
421
+ "5": [
422
+ 135
423
+ ],
424
+ "6": [
425
+ 136
426
+ ],
427
+ "7": [
428
+ 137
429
+ ],
430
+ "8": [
431
+ 138
432
+ ],
433
+ "9": [
434
+ 139
435
+ ],
436
+ "̧": [
437
+ 140
438
+ ],
439
+ "̃": [
440
+ 141
441
+ ],
442
+ "̪": [
443
+ 142
444
+ ],
445
+ "̯": [
446
+ 143
447
+ ],
448
+ "̩": [
449
+ 144
450
+ ],
451
+ "ʰ": [
452
+ 145
453
+ ],
454
+ "ˤ": [
455
+ 146
456
+ ],
457
+ "ε": [
458
+ 147
459
+ ],
460
+ "↓": [
461
+ 148
462
+ ],
463
+ "#": [
464
+ 149
465
+ ],
466
+ "\"": [
467
+ 150
468
+ ]
469
+ },
470
+ "num_symbols": 256,
471
+ "num_speakers": 1,
472
+ "speaker_id_map": {},
473
+ "piper_version": "1.0.0",
474
+ "language": {
475
+ "code": "ru_RU",
476
+ "family": "ru",
477
+ "region": "RU",
478
+ "name_native": "Русский",
479
+ "name_english": "Russian",
480
+ "country_english": "Russia"
481
+ },
482
+ "dataset": "irina"
483
+ }
ru/ru_RU/irina/medium/samples/speaker_0.mp3 ADDED
Binary file (85.5 kB). View file
 
ru/ru_RU/ruslan/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for ruslan (medium)
2
+
3
+ * Language: ru_RU (Russian, Russia)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://ruslan-corpus.github.io/
11
+ * License: https://creativecommons.org/licenses/by-nc-sa/4.0/
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
ru/ru_RU/ruslan/medium/ru_RU-ruslan-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72a5f88e0b20928064eb45d88e1daa21f8af62d18613580d32cbb4aed48dcf7f
3
+ size 63201294
ru/ru_RU/ruslan/medium/ru_RU-ruslan-medium.onnx.json ADDED
@@ -0,0 +1,493 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "ru"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ "_": [
18
+ 0
19
+ ],
20
+ "^": [
21
+ 1
22
+ ],
23
+ "$": [
24
+ 2
25
+ ],
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ ":": [
51
+ 11
52
+ ],
53
+ ";": [
54
+ 12
55
+ ],
56
+ "?": [
57
+ 13
58
+ ],
59
+ "a": [
60
+ 14
61
+ ],
62
+ "b": [
63
+ 15
64
+ ],
65
+ "c": [
66
+ 16
67
+ ],
68
+ "d": [
69
+ 17
70
+ ],
71
+ "e": [
72
+ 18
73
+ ],
74
+ "f": [
75
+ 19
76
+ ],
77
+ "h": [
78
+ 20
79
+ ],
80
+ "i": [
81
+ 21
82
+ ],
83
+ "j": [
84
+ 22
85
+ ],
86
+ "k": [
87
+ 23
88
+ ],
89
+ "l": [
90
+ 24
91
+ ],
92
+ "m": [
93
+ 25
94
+ ],
95
+ "n": [
96
+ 26
97
+ ],
98
+ "o": [
99
+ 27
100
+ ],
101
+ "p": [
102
+ 28
103
+ ],
104
+ "q": [
105
+ 29
106
+ ],
107
+ "r": [
108
+ 30
109
+ ],
110
+ "s": [
111
+ 31
112
+ ],
113
+ "t": [
114
+ 32
115
+ ],
116
+ "u": [
117
+ 33
118
+ ],
119
+ "v": [
120
+ 34
121
+ ],
122
+ "w": [
123
+ 35
124
+ ],
125
+ "x": [
126
+ 36
127
+ ],
128
+ "y": [
129
+ 37
130
+ ],
131
+ "z": [
132
+ 38
133
+ ],
134
+ "æ": [
135
+ 39
136
+ ],
137
+ "ç": [
138
+ 40
139
+ ],
140
+ "ð": [
141
+ 41
142
+ ],
143
+ "ø": [
144
+ 42
145
+ ],
146
+ "ħ": [
147
+ 43
148
+ ],
149
+ "ŋ": [
150
+ 44
151
+ ],
152
+ "œ": [
153
+ 45
154
+ ],
155
+ "ǀ": [
156
+ 46
157
+ ],
158
+ "ǁ": [
159
+ 47
160
+ ],
161
+ "ǂ": [
162
+ 48
163
+ ],
164
+ "ǃ": [
165
+ 49
166
+ ],
167
+ "ɐ": [
168
+ 50
169
+ ],
170
+ "ɑ": [
171
+ 51
172
+ ],
173
+ "ɒ": [
174
+ 52
175
+ ],
176
+ "ɓ": [
177
+ 53
178
+ ],
179
+ "ɔ": [
180
+ 54
181
+ ],
182
+ "ɕ": [
183
+ 55
184
+ ],
185
+ "ɖ": [
186
+ 56
187
+ ],
188
+ "ɗ": [
189
+ 57
190
+ ],
191
+ "ɘ": [
192
+ 58
193
+ ],
194
+ "ə": [
195
+ 59
196
+ ],
197
+ "ɚ": [
198
+ 60
199
+ ],
200
+ "ɛ": [
201
+ 61
202
+ ],
203
+ "ɜ": [
204
+ 62
205
+ ],
206
+ "ɞ": [
207
+ 63
208
+ ],
209
+ "ɟ": [
210
+ 64
211
+ ],
212
+ "ɠ": [
213
+ 65
214
+ ],
215
+ "ɡ": [
216
+ 66
217
+ ],
218
+ "ɢ": [
219
+ 67
220
+ ],
221
+ "ɣ": [
222
+ 68
223
+ ],
224
+ "ɤ": [
225
+ 69
226
+ ],
227
+ "ɥ": [
228
+ 70
229
+ ],
230
+ "ɦ": [
231
+ 71
232
+ ],
233
+ "ɧ": [
234
+ 72
235
+ ],
236
+ "ɨ": [
237
+ 73
238
+ ],
239
+ "ɪ": [
240
+ 74
241
+ ],
242
+ "ɫ": [
243
+ 75
244
+ ],
245
+ "ɬ": [
246
+ 76
247
+ ],
248
+ "ɭ": [
249
+ 77
250
+ ],
251
+ "ɮ": [
252
+ 78
253
+ ],
254
+ "ɯ": [
255
+ 79
256
+ ],
257
+ "ɰ": [
258
+ 80
259
+ ],
260
+ "ɱ": [
261
+ 81
262
+ ],
263
+ "ɲ": [
264
+ 82
265
+ ],
266
+ "ɳ": [
267
+ 83
268
+ ],
269
+ "ɴ": [
270
+ 84
271
+ ],
272
+ "ɵ": [
273
+ 85
274
+ ],
275
+ "ɶ": [
276
+ 86
277
+ ],
278
+ "ɸ": [
279
+ 87
280
+ ],
281
+ "ɹ": [
282
+ 88
283
+ ],
284
+ "ɺ": [
285
+ 89
286
+ ],
287
+ "ɻ": [
288
+ 90
289
+ ],
290
+ "ɽ": [
291
+ 91
292
+ ],
293
+ "ɾ": [
294
+ 92
295
+ ],
296
+ "ʀ": [
297
+ 93
298
+ ],
299
+ "ʁ": [
300
+ 94
301
+ ],
302
+ "ʂ": [
303
+ 95
304
+ ],
305
+ "ʃ": [
306
+ 96
307
+ ],
308
+ "ʄ": [
309
+ 97
310
+ ],
311
+ "ʈ": [
312
+ 98
313
+ ],
314
+ "ʉ": [
315
+ 99
316
+ ],
317
+ "ʊ": [
318
+ 100
319
+ ],
320
+ "ʋ": [
321
+ 101
322
+ ],
323
+ "ʌ": [
324
+ 102
325
+ ],
326
+ "ʍ": [
327
+ 103
328
+ ],
329
+ "ʎ": [
330
+ 104
331
+ ],
332
+ "ʏ": [
333
+ 105
334
+ ],
335
+ "ʐ": [
336
+ 106
337
+ ],
338
+ "ʑ": [
339
+ 107
340
+ ],
341
+ "ʒ": [
342
+ 108
343
+ ],
344
+ "ʔ": [
345
+ 109
346
+ ],
347
+ "ʕ": [
348
+ 110
349
+ ],
350
+ "ʘ": [
351
+ 111
352
+ ],
353
+ "ʙ": [
354
+ 112
355
+ ],
356
+ "ʛ": [
357
+ 113
358
+ ],
359
+ "ʜ": [
360
+ 114
361
+ ],
362
+ "ʝ": [
363
+ 115
364
+ ],
365
+ "ʟ": [
366
+ 116
367
+ ],
368
+ "ʡ": [
369
+ 117
370
+ ],
371
+ "ʢ": [
372
+ 118
373
+ ],
374
+ "ʲ": [
375
+ 119
376
+ ],
377
+ "ˈ": [
378
+ 120
379
+ ],
380
+ "ˌ": [
381
+ 121
382
+ ],
383
+ "ː": [
384
+ 122
385
+ ],
386
+ "ˑ": [
387
+ 123
388
+ ],
389
+ "˞": [
390
+ 124
391
+ ],
392
+ "β": [
393
+ 125
394
+ ],
395
+ "θ": [
396
+ 126
397
+ ],
398
+ "χ": [
399
+ 127
400
+ ],
401
+ "ᵻ": [
402
+ 128
403
+ ],
404
+ "ⱱ": [
405
+ 129
406
+ ],
407
+ "0": [
408
+ 130
409
+ ],
410
+ "1": [
411
+ 131
412
+ ],
413
+ "2": [
414
+ 132
415
+ ],
416
+ "3": [
417
+ 133
418
+ ],
419
+ "4": [
420
+ 134
421
+ ],
422
+ "5": [
423
+ 135
424
+ ],
425
+ "6": [
426
+ 136
427
+ ],
428
+ "7": [
429
+ 137
430
+ ],
431
+ "8": [
432
+ 138
433
+ ],
434
+ "9": [
435
+ 139
436
+ ],
437
+ "̧": [
438
+ 140
439
+ ],
440
+ "̃": [
441
+ 141
442
+ ],
443
+ "̪": [
444
+ 142
445
+ ],
446
+ "̯": [
447
+ 143
448
+ ],
449
+ "̩": [
450
+ 144
451
+ ],
452
+ "ʰ": [
453
+ 145
454
+ ],
455
+ "ˤ": [
456
+ 146
457
+ ],
458
+ "ε": [
459
+ 147
460
+ ],
461
+ "↓": [
462
+ 148
463
+ ],
464
+ "#": [
465
+ 149
466
+ ],
467
+ "\"": [
468
+ 150
469
+ ],
470
+ "↑": [
471
+ 151
472
+ ],
473
+ "̺": [
474
+ 152
475
+ ],
476
+ "̻": [
477
+ 153
478
+ ]
479
+ },
480
+ "num_symbols": 256,
481
+ "num_speakers": 1,
482
+ "speaker_id_map": {},
483
+ "piper_version": "1.0.0",
484
+ "language": {
485
+ "code": "ru_RU",
486
+ "family": "ru",
487
+ "region": "RU",
488
+ "name_native": "Русский",
489
+ "name_english": "Russian",
490
+ "country_english": "Russia"
491
+ },
492
+ "dataset": "ruslan"
493
+ }
ru/ru_RU/ruslan/medium/samples/speaker_0.mp3 ADDED
Binary file (79 kB). View file
 
sk/sk_SK/lili/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for lili (medium)
2
+
3
+ * Language: sk_SK (Slovak, Slovakia)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/NabuCasa/voice-datasets
11
+ * License: CC0
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
sk/sk_SK/lili/medium/samples/speaker_0.mp3 ADDED
Binary file (31.1 kB). View file
 
sk/sk_SK/lili/medium/sk_SK-lili-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8e21603e0165252849efe0bcb3fbffd1b3193c36bd1f556e1106911e8015526
3
+ size 63201294
sk/sk_SK/lili/medium/sk_SK-lili-medium.onnx.json ADDED
@@ -0,0 +1,502 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "sk"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ " ": [
18
+ 3
19
+ ],
20
+ "!": [
21
+ 4
22
+ ],
23
+ "\"": [
24
+ 150
25
+ ],
26
+ "#": [
27
+ 149
28
+ ],
29
+ "$": [
30
+ 2
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ "0": [
51
+ 130
52
+ ],
53
+ "1": [
54
+ 131
55
+ ],
56
+ "2": [
57
+ 132
58
+ ],
59
+ "3": [
60
+ 133
61
+ ],
62
+ "4": [
63
+ 134
64
+ ],
65
+ "5": [
66
+ 135
67
+ ],
68
+ "6": [
69
+ 136
70
+ ],
71
+ "7": [
72
+ 137
73
+ ],
74
+ "8": [
75
+ 138
76
+ ],
77
+ "9": [
78
+ 139
79
+ ],
80
+ ":": [
81
+ 11
82
+ ],
83
+ ";": [
84
+ 12
85
+ ],
86
+ "?": [
87
+ 13
88
+ ],
89
+ "X": [
90
+ 156
91
+ ],
92
+ "^": [
93
+ 1
94
+ ],
95
+ "_": [
96
+ 0
97
+ ],
98
+ "a": [
99
+ 14
100
+ ],
101
+ "b": [
102
+ 15
103
+ ],
104
+ "c": [
105
+ 16
106
+ ],
107
+ "d": [
108
+ 17
109
+ ],
110
+ "e": [
111
+ 18
112
+ ],
113
+ "f": [
114
+ 19
115
+ ],
116
+ "g": [
117
+ 154
118
+ ],
119
+ "h": [
120
+ 20
121
+ ],
122
+ "i": [
123
+ 21
124
+ ],
125
+ "j": [
126
+ 22
127
+ ],
128
+ "k": [
129
+ 23
130
+ ],
131
+ "l": [
132
+ 24
133
+ ],
134
+ "m": [
135
+ 25
136
+ ],
137
+ "n": [
138
+ 26
139
+ ],
140
+ "o": [
141
+ 27
142
+ ],
143
+ "p": [
144
+ 28
145
+ ],
146
+ "q": [
147
+ 29
148
+ ],
149
+ "r": [
150
+ 30
151
+ ],
152
+ "s": [
153
+ 31
154
+ ],
155
+ "t": [
156
+ 32
157
+ ],
158
+ "u": [
159
+ 33
160
+ ],
161
+ "v": [
162
+ 34
163
+ ],
164
+ "w": [
165
+ 35
166
+ ],
167
+ "x": [
168
+ 36
169
+ ],
170
+ "y": [
171
+ 37
172
+ ],
173
+ "z": [
174
+ 38
175
+ ],
176
+ "æ": [
177
+ 39
178
+ ],
179
+ "ç": [
180
+ 40
181
+ ],
182
+ "ð": [
183
+ 41
184
+ ],
185
+ "ø": [
186
+ 42
187
+ ],
188
+ "ħ": [
189
+ 43
190
+ ],
191
+ "ŋ": [
192
+ 44
193
+ ],
194
+ "œ": [
195
+ 45
196
+ ],
197
+ "ǀ": [
198
+ 46
199
+ ],
200
+ "ǁ": [
201
+ 47
202
+ ],
203
+ "ǂ": [
204
+ 48
205
+ ],
206
+ "ǃ": [
207
+ 49
208
+ ],
209
+ "ɐ": [
210
+ 50
211
+ ],
212
+ "ɑ": [
213
+ 51
214
+ ],
215
+ "ɒ": [
216
+ 52
217
+ ],
218
+ "ɓ": [
219
+ 53
220
+ ],
221
+ "ɔ": [
222
+ 54
223
+ ],
224
+ "ɕ": [
225
+ 55
226
+ ],
227
+ "ɖ": [
228
+ 56
229
+ ],
230
+ "ɗ": [
231
+ 57
232
+ ],
233
+ "ɘ": [
234
+ 58
235
+ ],
236
+ "ə": [
237
+ 59
238
+ ],
239
+ "ɚ": [
240
+ 60
241
+ ],
242
+ "ɛ": [
243
+ 61
244
+ ],
245
+ "ɜ": [
246
+ 62
247
+ ],
248
+ "ɞ": [
249
+ 63
250
+ ],
251
+ "ɟ": [
252
+ 64
253
+ ],
254
+ "ɠ": [
255
+ 65
256
+ ],
257
+ "ɡ": [
258
+ 66
259
+ ],
260
+ "ɢ": [
261
+ 67
262
+ ],
263
+ "ɣ": [
264
+ 68
265
+ ],
266
+ "ɤ": [
267
+ 69
268
+ ],
269
+ "ɥ": [
270
+ 70
271
+ ],
272
+ "ɦ": [
273
+ 71
274
+ ],
275
+ "ɧ": [
276
+ 72
277
+ ],
278
+ "ɨ": [
279
+ 73
280
+ ],
281
+ "ɪ": [
282
+ 74
283
+ ],
284
+ "ɫ": [
285
+ 75
286
+ ],
287
+ "ɬ": [
288
+ 76
289
+ ],
290
+ "ɭ": [
291
+ 77
292
+ ],
293
+ "ɮ": [
294
+ 78
295
+ ],
296
+ "ɯ": [
297
+ 79
298
+ ],
299
+ "ɰ": [
300
+ 80
301
+ ],
302
+ "ɱ": [
303
+ 81
304
+ ],
305
+ "ɲ": [
306
+ 82
307
+ ],
308
+ "ɳ": [
309
+ 83
310
+ ],
311
+ "ɴ": [
312
+ 84
313
+ ],
314
+ "ɵ": [
315
+ 85
316
+ ],
317
+ "ɶ": [
318
+ 86
319
+ ],
320
+ "ɸ": [
321
+ 87
322
+ ],
323
+ "ɹ": [
324
+ 88
325
+ ],
326
+ "ɺ": [
327
+ 89
328
+ ],
329
+ "ɻ": [
330
+ 90
331
+ ],
332
+ "ɽ": [
333
+ 91
334
+ ],
335
+ "ɾ": [
336
+ 92
337
+ ],
338
+ "ʀ": [
339
+ 93
340
+ ],
341
+ "ʁ": [
342
+ 94
343
+ ],
344
+ "ʂ": [
345
+ 95
346
+ ],
347
+ "ʃ": [
348
+ 96
349
+ ],
350
+ "ʄ": [
351
+ 97
352
+ ],
353
+ "ʈ": [
354
+ 98
355
+ ],
356
+ "ʉ": [
357
+ 99
358
+ ],
359
+ "ʊ": [
360
+ 100
361
+ ],
362
+ "ʋ": [
363
+ 101
364
+ ],
365
+ "ʌ": [
366
+ 102
367
+ ],
368
+ "ʍ": [
369
+ 103
370
+ ],
371
+ "ʎ": [
372
+ 104
373
+ ],
374
+ "ʏ": [
375
+ 105
376
+ ],
377
+ "ʐ": [
378
+ 106
379
+ ],
380
+ "ʑ": [
381
+ 107
382
+ ],
383
+ "ʒ": [
384
+ 108
385
+ ],
386
+ "ʔ": [
387
+ 109
388
+ ],
389
+ "ʕ": [
390
+ 110
391
+ ],
392
+ "ʘ": [
393
+ 111
394
+ ],
395
+ "ʙ": [
396
+ 112
397
+ ],
398
+ "ʛ": [
399
+ 113
400
+ ],
401
+ "ʜ": [
402
+ 114
403
+ ],
404
+ "ʝ": [
405
+ 115
406
+ ],
407
+ "ʟ": [
408
+ 116
409
+ ],
410
+ "ʡ": [
411
+ 117
412
+ ],
413
+ "ʢ": [
414
+ 118
415
+ ],
416
+ "ʦ": [
417
+ 155
418
+ ],
419
+ "ʰ": [
420
+ 145
421
+ ],
422
+ "ʲ": [
423
+ 119
424
+ ],
425
+ "ˈ": [
426
+ 120
427
+ ],
428
+ "ˌ": [
429
+ 121
430
+ ],
431
+ "ː": [
432
+ 122
433
+ ],
434
+ "ˑ": [
435
+ 123
436
+ ],
437
+ "˞": [
438
+ 124
439
+ ],
440
+ "ˤ": [
441
+ 146
442
+ ],
443
+ "̃": [
444
+ 141
445
+ ],
446
+ "̧": [
447
+ 140
448
+ ],
449
+ "̩": [
450
+ 144
451
+ ],
452
+ "̪": [
453
+ 142
454
+ ],
455
+ "̯": [
456
+ 143
457
+ ],
458
+ "̺": [
459
+ 152
460
+ ],
461
+ "̻": [
462
+ 153
463
+ ],
464
+ "β": [
465
+ 125
466
+ ],
467
+ "ε": [
468
+ 147
469
+ ],
470
+ "θ": [
471
+ 126
472
+ ],
473
+ "χ": [
474
+ 127
475
+ ],
476
+ "ᵻ": [
477
+ 128
478
+ ],
479
+ "↑": [
480
+ 151
481
+ ],
482
+ "↓": [
483
+ 148
484
+ ],
485
+ "ⱱ": [
486
+ 129
487
+ ]
488
+ },
489
+ "num_symbols": 256,
490
+ "num_speakers": 1,
491
+ "speaker_id_map": {},
492
+ "piper_version": "1.0.0",
493
+ "language": {
494
+ "code": "sk_SK",
495
+ "family": "sk",
496
+ "region": "SK",
497
+ "name_native": "Slovenčina",
498
+ "name_english": "Slovak",
499
+ "country_english": "Slovakia"
500
+ },
501
+ "dataset": "lili"
502
+ }
sr/sr_RS/serbski_institut/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for serbski_institut (medium)
2
+
3
+ * Language: sr_RS (Serbian, Serbia)
4
+ * Speakers: 2
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/marytts/serbski-institut-dsb-data
11
+ * License: https://creativecommons.org/licenses/by-nc-sa/4.0/
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
sr/sr_RS/serbski_institut/medium/samples/speaker_0.mp3 ADDED
Binary file (112 kB). View file
 
sr/sr_RS/serbski_institut/medium/samples/speaker_1.mp3 ADDED
Binary file (127 kB). View file
 
sr/sr_RS/serbski_institut/medium/sr_RS-serbski_institut-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7003890cf596e653f660a4fd97fd17f57f1eceb6d9727abad9cd76d2fda0d80
3
+ size 76733615
sr/sr_RS/serbski_institut/medium/sr_RS-serbski_institut-medium.onnx.json ADDED
@@ -0,0 +1,505 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "piper_version": "1.0.0",
3
+ "audio": {
4
+ "sample_rate": 22050,
5
+ "quality": "medium"
6
+ },
7
+ "espeak": {
8
+ "voice": "sr"
9
+ },
10
+ "inference": {
11
+ "noise_scale": 0.667,
12
+ "length_scale": 1,
13
+ "noise_w": 0.8
14
+ },
15
+ "phoneme_type": "espeak",
16
+ "phoneme_map": {},
17
+ "phoneme_id_map": {
18
+ " ": [
19
+ 3
20
+ ],
21
+ "!": [
22
+ 4
23
+ ],
24
+ "\"": [
25
+ 150
26
+ ],
27
+ "#": [
28
+ 149
29
+ ],
30
+ "$": [
31
+ 2
32
+ ],
33
+ "'": [
34
+ 5
35
+ ],
36
+ "(": [
37
+ 6
38
+ ],
39
+ ")": [
40
+ 7
41
+ ],
42
+ ",": [
43
+ 8
44
+ ],
45
+ "-": [
46
+ 9
47
+ ],
48
+ ".": [
49
+ 10
50
+ ],
51
+ "0": [
52
+ 130
53
+ ],
54
+ "1": [
55
+ 131
56
+ ],
57
+ "2": [
58
+ 132
59
+ ],
60
+ "3": [
61
+ 133
62
+ ],
63
+ "4": [
64
+ 134
65
+ ],
66
+ "5": [
67
+ 135
68
+ ],
69
+ "6": [
70
+ 136
71
+ ],
72
+ "7": [
73
+ 137
74
+ ],
75
+ "8": [
76
+ 138
77
+ ],
78
+ "9": [
79
+ 139
80
+ ],
81
+ ":": [
82
+ 11
83
+ ],
84
+ ";": [
85
+ 12
86
+ ],
87
+ "?": [
88
+ 13
89
+ ],
90
+ "X": [
91
+ 156
92
+ ],
93
+ "^": [
94
+ 1
95
+ ],
96
+ "_": [
97
+ 0
98
+ ],
99
+ "a": [
100
+ 14
101
+ ],
102
+ "b": [
103
+ 15
104
+ ],
105
+ "c": [
106
+ 16
107
+ ],
108
+ "d": [
109
+ 17
110
+ ],
111
+ "e": [
112
+ 18
113
+ ],
114
+ "f": [
115
+ 19
116
+ ],
117
+ "g": [
118
+ 154
119
+ ],
120
+ "h": [
121
+ 20
122
+ ],
123
+ "i": [
124
+ 21
125
+ ],
126
+ "j": [
127
+ 22
128
+ ],
129
+ "k": [
130
+ 23
131
+ ],
132
+ "l": [
133
+ 24
134
+ ],
135
+ "m": [
136
+ 25
137
+ ],
138
+ "n": [
139
+ 26
140
+ ],
141
+ "o": [
142
+ 27
143
+ ],
144
+ "p": [
145
+ 28
146
+ ],
147
+ "q": [
148
+ 29
149
+ ],
150
+ "r": [
151
+ 30
152
+ ],
153
+ "s": [
154
+ 31
155
+ ],
156
+ "t": [
157
+ 32
158
+ ],
159
+ "u": [
160
+ 33
161
+ ],
162
+ "v": [
163
+ 34
164
+ ],
165
+ "w": [
166
+ 35
167
+ ],
168
+ "x": [
169
+ 36
170
+ ],
171
+ "y": [
172
+ 37
173
+ ],
174
+ "z": [
175
+ 38
176
+ ],
177
+ "æ": [
178
+ 39
179
+ ],
180
+ "ç": [
181
+ 40
182
+ ],
183
+ "ð": [
184
+ 41
185
+ ],
186
+ "ø": [
187
+ 42
188
+ ],
189
+ "ħ": [
190
+ 43
191
+ ],
192
+ "ŋ": [
193
+ 44
194
+ ],
195
+ "œ": [
196
+ 45
197
+ ],
198
+ "ǀ": [
199
+ 46
200
+ ],
201
+ "ǁ": [
202
+ 47
203
+ ],
204
+ "ǂ": [
205
+ 48
206
+ ],
207
+ "ǃ": [
208
+ 49
209
+ ],
210
+ "ɐ": [
211
+ 50
212
+ ],
213
+ "ɑ": [
214
+ 51
215
+ ],
216
+ "ɒ": [
217
+ 52
218
+ ],
219
+ "ɓ": [
220
+ 53
221
+ ],
222
+ "ɔ": [
223
+ 54
224
+ ],
225
+ "ɕ": [
226
+ 55
227
+ ],
228
+ "ɖ": [
229
+ 56
230
+ ],
231
+ "ɗ": [
232
+ 57
233
+ ],
234
+ "ɘ": [
235
+ 58
236
+ ],
237
+ "ə": [
238
+ 59
239
+ ],
240
+ "ɚ": [
241
+ 60
242
+ ],
243
+ "ɛ": [
244
+ 61
245
+ ],
246
+ "ɜ": [
247
+ 62
248
+ ],
249
+ "ɞ": [
250
+ 63
251
+ ],
252
+ "ɟ": [
253
+ 64
254
+ ],
255
+ "ɠ": [
256
+ 65
257
+ ],
258
+ "ɡ": [
259
+ 66
260
+ ],
261
+ "ɢ": [
262
+ 67
263
+ ],
264
+ "ɣ": [
265
+ 68
266
+ ],
267
+ "ɤ": [
268
+ 69
269
+ ],
270
+ "ɥ": [
271
+ 70
272
+ ],
273
+ "ɦ": [
274
+ 71
275
+ ],
276
+ "ɧ": [
277
+ 72
278
+ ],
279
+ "ɨ": [
280
+ 73
281
+ ],
282
+ "ɪ": [
283
+ 74
284
+ ],
285
+ "ɫ": [
286
+ 75
287
+ ],
288
+ "ɬ": [
289
+ 76
290
+ ],
291
+ "ɭ": [
292
+ 77
293
+ ],
294
+ "ɮ": [
295
+ 78
296
+ ],
297
+ "ɯ": [
298
+ 79
299
+ ],
300
+ "ɰ": [
301
+ 80
302
+ ],
303
+ "ɱ": [
304
+ 81
305
+ ],
306
+ "ɲ": [
307
+ 82
308
+ ],
309
+ "ɳ": [
310
+ 83
311
+ ],
312
+ "ɴ": [
313
+ 84
314
+ ],
315
+ "ɵ": [
316
+ 85
317
+ ],
318
+ "ɶ": [
319
+ 86
320
+ ],
321
+ "ɸ": [
322
+ 87
323
+ ],
324
+ "ɹ": [
325
+ 88
326
+ ],
327
+ "ɺ": [
328
+ 89
329
+ ],
330
+ "ɻ": [
331
+ 90
332
+ ],
333
+ "ɽ": [
334
+ 91
335
+ ],
336
+ "ɾ": [
337
+ 92
338
+ ],
339
+ "ʀ": [
340
+ 93
341
+ ],
342
+ "ʁ": [
343
+ 94
344
+ ],
345
+ "ʂ": [
346
+ 95
347
+ ],
348
+ "ʃ": [
349
+ 96
350
+ ],
351
+ "ʄ": [
352
+ 97
353
+ ],
354
+ "ʈ": [
355
+ 98
356
+ ],
357
+ "ʉ": [
358
+ 99
359
+ ],
360
+ "ʊ": [
361
+ 100
362
+ ],
363
+ "ʋ": [
364
+ 101
365
+ ],
366
+ "ʌ": [
367
+ 102
368
+ ],
369
+ "ʍ": [
370
+ 103
371
+ ],
372
+ "ʎ": [
373
+ 104
374
+ ],
375
+ "ʏ": [
376
+ 105
377
+ ],
378
+ "ʐ": [
379
+ 106
380
+ ],
381
+ "ʑ": [
382
+ 107
383
+ ],
384
+ "ʒ": [
385
+ 108
386
+ ],
387
+ "ʔ": [
388
+ 109
389
+ ],
390
+ "ʕ": [
391
+ 110
392
+ ],
393
+ "ʘ": [
394
+ 111
395
+ ],
396
+ "ʙ": [
397
+ 112
398
+ ],
399
+ "ʛ": [
400
+ 113
401
+ ],
402
+ "ʜ": [
403
+ 114
404
+ ],
405
+ "ʝ": [
406
+ 115
407
+ ],
408
+ "ʟ": [
409
+ 116
410
+ ],
411
+ "ʡ": [
412
+ 117
413
+ ],
414
+ "ʢ": [
415
+ 118
416
+ ],
417
+ "ʦ": [
418
+ 155
419
+ ],
420
+ "ʰ": [
421
+ 145
422
+ ],
423
+ "ʲ": [
424
+ 119
425
+ ],
426
+ "ˈ": [
427
+ 120
428
+ ],
429
+ "ˌ": [
430
+ 121
431
+ ],
432
+ "ː": [
433
+ 122
434
+ ],
435
+ "ˑ": [
436
+ 123
437
+ ],
438
+ "˞": [
439
+ 124
440
+ ],
441
+ "ˤ": [
442
+ 146
443
+ ],
444
+ "̃": [
445
+ 141
446
+ ],
447
+ "̧": [
448
+ 140
449
+ ],
450
+ "̩": [
451
+ 144
452
+ ],
453
+ "̪": [
454
+ 142
455
+ ],
456
+ "̯": [
457
+ 143
458
+ ],
459
+ "̺": [
460
+ 152
461
+ ],
462
+ "̻": [
463
+ 153
464
+ ],
465
+ "β": [
466
+ 125
467
+ ],
468
+ "ε": [
469
+ 147
470
+ ],
471
+ "θ": [
472
+ 126
473
+ ],
474
+ "χ": [
475
+ 127
476
+ ],
477
+ "ᵻ": [
478
+ 128
479
+ ],
480
+ "↑": [
481
+ 151
482
+ ],
483
+ "↓": [
484
+ 148
485
+ ],
486
+ "ⱱ": [
487
+ 129
488
+ ]
489
+ },
490
+ "num_symbols": 256,
491
+ "num_speakers": 2,
492
+ "speaker_id_map": {
493
+ "dsb": 0,
494
+ "hsb": 1
495
+ },
496
+ "language": {
497
+ "code": "sr_RS",
498
+ "family": "sr",
499
+ "region": "RS",
500
+ "name_native": "srpski",
501
+ "name_english": "Serbian",
502
+ "country_english": "Serbia"
503
+ },
504
+ "dataset": "serbski_institut"
505
+ }
sv/sv_SE/nst/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for nst (medium)
2
+
3
+ * Language: sv_SE (Swedish, Sweden)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://www.nb.no/sprakbanken/en/resource-catalogue/oai-nb-no-sbr-17/
11
+ * License: CC0
12
+
13
+ ## Training
14
+
15
+ Trained from scratch by KBLab at The National Library of Sweden.
sv/sv_SE/nst/medium/samples/speaker_0.mp3 ADDED
Binary file (117 kB). View file
 
sv/sv_SE/nst/medium/sv_SE-nst-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df011f56825a59dd1efc080c38a65a1ef70407e60f63050e9246f43a3d7e471e
3
+ size 63104526
sv/sv_SE/nst/medium/sv_SE-nst-medium.onnx.json ADDED
@@ -0,0 +1,420 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "sv"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_map": {},
15
+ "phoneme_id_map": {
16
+ "_": [
17
+ 0
18
+ ],
19
+ "^": [
20
+ 1
21
+ ],
22
+ "$": [
23
+ 2
24
+ ],
25
+ " ": [
26
+ 3
27
+ ],
28
+ "!": [
29
+ 4
30
+ ],
31
+ "'": [
32
+ 5
33
+ ],
34
+ "(": [
35
+ 6
36
+ ],
37
+ ")": [
38
+ 7
39
+ ],
40
+ ",": [
41
+ 8
42
+ ],
43
+ "-": [
44
+ 9
45
+ ],
46
+ ".": [
47
+ 10
48
+ ],
49
+ ":": [
50
+ 11
51
+ ],
52
+ ";": [
53
+ 12
54
+ ],
55
+ "?": [
56
+ 13
57
+ ],
58
+ "a": [
59
+ 14
60
+ ],
61
+ "b": [
62
+ 15
63
+ ],
64
+ "c": [
65
+ 16
66
+ ],
67
+ "d": [
68
+ 17
69
+ ],
70
+ "e": [
71
+ 18
72
+ ],
73
+ "f": [
74
+ 19
75
+ ],
76
+ "h": [
77
+ 20
78
+ ],
79
+ "i": [
80
+ 21
81
+ ],
82
+ "j": [
83
+ 22
84
+ ],
85
+ "k": [
86
+ 23
87
+ ],
88
+ "l": [
89
+ 24
90
+ ],
91
+ "m": [
92
+ 25
93
+ ],
94
+ "n": [
95
+ 26
96
+ ],
97
+ "o": [
98
+ 27
99
+ ],
100
+ "p": [
101
+ 28
102
+ ],
103
+ "q": [
104
+ 29
105
+ ],
106
+ "r": [
107
+ 30
108
+ ],
109
+ "s": [
110
+ 31
111
+ ],
112
+ "t": [
113
+ 32
114
+ ],
115
+ "u": [
116
+ 33
117
+ ],
118
+ "v": [
119
+ 34
120
+ ],
121
+ "w": [
122
+ 35
123
+ ],
124
+ "x": [
125
+ 36
126
+ ],
127
+ "y": [
128
+ 37
129
+ ],
130
+ "z": [
131
+ 38
132
+ ],
133
+ "æ": [
134
+ 39
135
+ ],
136
+ "ç": [
137
+ 40
138
+ ],
139
+ "ð": [
140
+ 41
141
+ ],
142
+ "ø": [
143
+ 42
144
+ ],
145
+ "ħ": [
146
+ 43
147
+ ],
148
+ "ŋ": [
149
+ 44
150
+ ],
151
+ "œ": [
152
+ 45
153
+ ],
154
+ "ǀ": [
155
+ 46
156
+ ],
157
+ "ǁ": [
158
+ 47
159
+ ],
160
+ "ǂ": [
161
+ 48
162
+ ],
163
+ "ǃ": [
164
+ 49
165
+ ],
166
+ "ɐ": [
167
+ 50
168
+ ],
169
+ "ɑ": [
170
+ 51
171
+ ],
172
+ "ɒ": [
173
+ 52
174
+ ],
175
+ "ɓ": [
176
+ 53
177
+ ],
178
+ "ɔ": [
179
+ 54
180
+ ],
181
+ "ɕ": [
182
+ 55
183
+ ],
184
+ "ɖ": [
185
+ 56
186
+ ],
187
+ "ɗ": [
188
+ 57
189
+ ],
190
+ "ɘ": [
191
+ 58
192
+ ],
193
+ "ə": [
194
+ 59
195
+ ],
196
+ "ɚ": [
197
+ 60
198
+ ],
199
+ "ɛ": [
200
+ 61
201
+ ],
202
+ "ɜ": [
203
+ 62
204
+ ],
205
+ "ɞ": [
206
+ 63
207
+ ],
208
+ "ɟ": [
209
+ 64
210
+ ],
211
+ "ɠ": [
212
+ 65
213
+ ],
214
+ "ɡ": [
215
+ 66
216
+ ],
217
+ "ɢ": [
218
+ 67
219
+ ],
220
+ "ɣ": [
221
+ 68
222
+ ],
223
+ "ɤ": [
224
+ 69
225
+ ],
226
+ "ɥ": [
227
+ 70
228
+ ],
229
+ "ɦ": [
230
+ 71
231
+ ],
232
+ "ɧ": [
233
+ 72
234
+ ],
235
+ "ɨ": [
236
+ 73
237
+ ],
238
+ "ɪ": [
239
+ 74
240
+ ],
241
+ "ɫ": [
242
+ 75
243
+ ],
244
+ "ɬ": [
245
+ 76
246
+ ],
247
+ "ɭ": [
248
+ 77
249
+ ],
250
+ "ɮ": [
251
+ 78
252
+ ],
253
+ "ɯ": [
254
+ 79
255
+ ],
256
+ "ɰ": [
257
+ 80
258
+ ],
259
+ "ɱ": [
260
+ 81
261
+ ],
262
+ "ɲ": [
263
+ 82
264
+ ],
265
+ "ɳ": [
266
+ 83
267
+ ],
268
+ "ɴ": [
269
+ 84
270
+ ],
271
+ "ɵ": [
272
+ 85
273
+ ],
274
+ "ɶ": [
275
+ 86
276
+ ],
277
+ "ɸ": [
278
+ 87
279
+ ],
280
+ "ɹ": [
281
+ 88
282
+ ],
283
+ "ɺ": [
284
+ 89
285
+ ],
286
+ "ɻ": [
287
+ 90
288
+ ],
289
+ "ɽ": [
290
+ 91
291
+ ],
292
+ "ɾ": [
293
+ 92
294
+ ],
295
+ "ʀ": [
296
+ 93
297
+ ],
298
+ "ʁ": [
299
+ 94
300
+ ],
301
+ "ʂ": [
302
+ 95
303
+ ],
304
+ "ʃ": [
305
+ 96
306
+ ],
307
+ "ʄ": [
308
+ 97
309
+ ],
310
+ "ʈ": [
311
+ 98
312
+ ],
313
+ "ʉ": [
314
+ 99
315
+ ],
316
+ "ʊ": [
317
+ 100
318
+ ],
319
+ "ʋ": [
320
+ 101
321
+ ],
322
+ "ʌ": [
323
+ 102
324
+ ],
325
+ "ʍ": [
326
+ 103
327
+ ],
328
+ "ʎ": [
329
+ 104
330
+ ],
331
+ "ʏ": [
332
+ 105
333
+ ],
334
+ "ʐ": [
335
+ 106
336
+ ],
337
+ "ʑ": [
338
+ 107
339
+ ],
340
+ "ʒ": [
341
+ 108
342
+ ],
343
+ "ʔ": [
344
+ 109
345
+ ],
346
+ "ʕ": [
347
+ 110
348
+ ],
349
+ "ʘ": [
350
+ 111
351
+ ],
352
+ "ʙ": [
353
+ 112
354
+ ],
355
+ "ʛ": [
356
+ 113
357
+ ],
358
+ "ʜ": [
359
+ 114
360
+ ],
361
+ "ʝ": [
362
+ 115
363
+ ],
364
+ "ʟ": [
365
+ 116
366
+ ],
367
+ "ʡ": [
368
+ 117
369
+ ],
370
+ "ʢ": [
371
+ 118
372
+ ],
373
+ "ʲ": [
374
+ 119
375
+ ],
376
+ "ˈ": [
377
+ 120
378
+ ],
379
+ "ˌ": [
380
+ 121
381
+ ],
382
+ "ː": [
383
+ 122
384
+ ],
385
+ "ˑ": [
386
+ 123
387
+ ],
388
+ "˞": [
389
+ 124
390
+ ],
391
+ "β": [
392
+ 125
393
+ ],
394
+ "θ": [
395
+ 126
396
+ ],
397
+ "χ": [
398
+ 127
399
+ ],
400
+ "ᵻ": [
401
+ 128
402
+ ],
403
+ "ⱱ": [
404
+ 129
405
+ ]
406
+ },
407
+ "num_symbols": 130,
408
+ "num_speakers": 1,
409
+ "speaker_id_map": {},
410
+ "piper_version": "0.2.0",
411
+ "language": {
412
+ "code": "sv_SE",
413
+ "family": "sv",
414
+ "region": "SE",
415
+ "name_native": "Svenska",
416
+ "name_english": "Swedish",
417
+ "country_english": "Sweden"
418
+ },
419
+ "dataset": "nst"
420
+ }
sw/sw_CD/lanfrica/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for lanfrica (medium)
2
+
3
+ * Language: sw_CD (Swahili, Democratic Republic of the Congo)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://lanfrica.com/record/kiswahili-tts-dataset
11
+ * License: See URL
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
sw/sw_CD/lanfrica/medium/samples/speaker_0.mp3 ADDED
Binary file (78 kB). View file
 
sw/sw_CD/lanfrica/medium/sw_CD-lanfrica-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f195ed12ca5e7875114618e5f00207af364602e21ca78c8a6d3d7674f9259fa
3
+ size 63201294
sw/sw_CD/lanfrica/medium/sw_CD-lanfrica-medium.onnx.json ADDED
@@ -0,0 +1,493 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "sw"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ "_": [
18
+ 0
19
+ ],
20
+ "^": [
21
+ 1
22
+ ],
23
+ "$": [
24
+ 2
25
+ ],
26
+ " ": [
27
+ 3
28
+ ],
29
+ "!": [
30
+ 4
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ ":": [
51
+ 11
52
+ ],
53
+ ";": [
54
+ 12
55
+ ],
56
+ "?": [
57
+ 13
58
+ ],
59
+ "a": [
60
+ 14
61
+ ],
62
+ "b": [
63
+ 15
64
+ ],
65
+ "c": [
66
+ 16
67
+ ],
68
+ "d": [
69
+ 17
70
+ ],
71
+ "e": [
72
+ 18
73
+ ],
74
+ "f": [
75
+ 19
76
+ ],
77
+ "h": [
78
+ 20
79
+ ],
80
+ "i": [
81
+ 21
82
+ ],
83
+ "j": [
84
+ 22
85
+ ],
86
+ "k": [
87
+ 23
88
+ ],
89
+ "l": [
90
+ 24
91
+ ],
92
+ "m": [
93
+ 25
94
+ ],
95
+ "n": [
96
+ 26
97
+ ],
98
+ "o": [
99
+ 27
100
+ ],
101
+ "p": [
102
+ 28
103
+ ],
104
+ "q": [
105
+ 29
106
+ ],
107
+ "r": [
108
+ 30
109
+ ],
110
+ "s": [
111
+ 31
112
+ ],
113
+ "t": [
114
+ 32
115
+ ],
116
+ "u": [
117
+ 33
118
+ ],
119
+ "v": [
120
+ 34
121
+ ],
122
+ "w": [
123
+ 35
124
+ ],
125
+ "x": [
126
+ 36
127
+ ],
128
+ "y": [
129
+ 37
130
+ ],
131
+ "z": [
132
+ 38
133
+ ],
134
+ "æ": [
135
+ 39
136
+ ],
137
+ "ç": [
138
+ 40
139
+ ],
140
+ "ð": [
141
+ 41
142
+ ],
143
+ "ø": [
144
+ 42
145
+ ],
146
+ "ħ": [
147
+ 43
148
+ ],
149
+ "ŋ": [
150
+ 44
151
+ ],
152
+ "œ": [
153
+ 45
154
+ ],
155
+ "ǀ": [
156
+ 46
157
+ ],
158
+ "ǁ": [
159
+ 47
160
+ ],
161
+ "ǂ": [
162
+ 48
163
+ ],
164
+ "ǃ": [
165
+ 49
166
+ ],
167
+ "ɐ": [
168
+ 50
169
+ ],
170
+ "ɑ": [
171
+ 51
172
+ ],
173
+ "ɒ": [
174
+ 52
175
+ ],
176
+ "ɓ": [
177
+ 53
178
+ ],
179
+ "ɔ": [
180
+ 54
181
+ ],
182
+ "ɕ": [
183
+ 55
184
+ ],
185
+ "ɖ": [
186
+ 56
187
+ ],
188
+ "ɗ": [
189
+ 57
190
+ ],
191
+ "ɘ": [
192
+ 58
193
+ ],
194
+ "ə": [
195
+ 59
196
+ ],
197
+ "ɚ": [
198
+ 60
199
+ ],
200
+ "ɛ": [
201
+ 61
202
+ ],
203
+ "ɜ": [
204
+ 62
205
+ ],
206
+ "ɞ": [
207
+ 63
208
+ ],
209
+ "ɟ": [
210
+ 64
211
+ ],
212
+ "ɠ": [
213
+ 65
214
+ ],
215
+ "ɡ": [
216
+ 66
217
+ ],
218
+ "ɢ": [
219
+ 67
220
+ ],
221
+ "ɣ": [
222
+ 68
223
+ ],
224
+ "ɤ": [
225
+ 69
226
+ ],
227
+ "ɥ": [
228
+ 70
229
+ ],
230
+ "ɦ": [
231
+ 71
232
+ ],
233
+ "ɧ": [
234
+ 72
235
+ ],
236
+ "ɨ": [
237
+ 73
238
+ ],
239
+ "ɪ": [
240
+ 74
241
+ ],
242
+ "ɫ": [
243
+ 75
244
+ ],
245
+ "ɬ": [
246
+ 76
247
+ ],
248
+ "ɭ": [
249
+ 77
250
+ ],
251
+ "ɮ": [
252
+ 78
253
+ ],
254
+ "ɯ": [
255
+ 79
256
+ ],
257
+ "ɰ": [
258
+ 80
259
+ ],
260
+ "ɱ": [
261
+ 81
262
+ ],
263
+ "ɲ": [
264
+ 82
265
+ ],
266
+ "ɳ": [
267
+ 83
268
+ ],
269
+ "ɴ": [
270
+ 84
271
+ ],
272
+ "ɵ": [
273
+ 85
274
+ ],
275
+ "ɶ": [
276
+ 86
277
+ ],
278
+ "ɸ": [
279
+ 87
280
+ ],
281
+ "ɹ": [
282
+ 88
283
+ ],
284
+ "ɺ": [
285
+ 89
286
+ ],
287
+ "ɻ": [
288
+ 90
289
+ ],
290
+ "ɽ": [
291
+ 91
292
+ ],
293
+ "ɾ": [
294
+ 92
295
+ ],
296
+ "ʀ": [
297
+ 93
298
+ ],
299
+ "ʁ": [
300
+ 94
301
+ ],
302
+ "ʂ": [
303
+ 95
304
+ ],
305
+ "ʃ": [
306
+ 96
307
+ ],
308
+ "ʄ": [
309
+ 97
310
+ ],
311
+ "ʈ": [
312
+ 98
313
+ ],
314
+ "ʉ": [
315
+ 99
316
+ ],
317
+ "ʊ": [
318
+ 100
319
+ ],
320
+ "ʋ": [
321
+ 101
322
+ ],
323
+ "ʌ": [
324
+ 102
325
+ ],
326
+ "ʍ": [
327
+ 103
328
+ ],
329
+ "ʎ": [
330
+ 104
331
+ ],
332
+ "ʏ": [
333
+ 105
334
+ ],
335
+ "ʐ": [
336
+ 106
337
+ ],
338
+ "ʑ": [
339
+ 107
340
+ ],
341
+ "ʒ": [
342
+ 108
343
+ ],
344
+ "ʔ": [
345
+ 109
346
+ ],
347
+ "ʕ": [
348
+ 110
349
+ ],
350
+ "ʘ": [
351
+ 111
352
+ ],
353
+ "ʙ": [
354
+ 112
355
+ ],
356
+ "ʛ": [
357
+ 113
358
+ ],
359
+ "ʜ": [
360
+ 114
361
+ ],
362
+ "ʝ": [
363
+ 115
364
+ ],
365
+ "ʟ": [
366
+ 116
367
+ ],
368
+ "ʡ": [
369
+ 117
370
+ ],
371
+ "ʢ": [
372
+ 118
373
+ ],
374
+ "ʲ": [
375
+ 119
376
+ ],
377
+ "ˈ": [
378
+ 120
379
+ ],
380
+ "ˌ": [
381
+ 121
382
+ ],
383
+ "ː": [
384
+ 122
385
+ ],
386
+ "ˑ": [
387
+ 123
388
+ ],
389
+ "˞": [
390
+ 124
391
+ ],
392
+ "β": [
393
+ 125
394
+ ],
395
+ "θ": [
396
+ 126
397
+ ],
398
+ "χ": [
399
+ 127
400
+ ],
401
+ "ᵻ": [
402
+ 128
403
+ ],
404
+ "ⱱ": [
405
+ 129
406
+ ],
407
+ "0": [
408
+ 130
409
+ ],
410
+ "1": [
411
+ 131
412
+ ],
413
+ "2": [
414
+ 132
415
+ ],
416
+ "3": [
417
+ 133
418
+ ],
419
+ "4": [
420
+ 134
421
+ ],
422
+ "5": [
423
+ 135
424
+ ],
425
+ "6": [
426
+ 136
427
+ ],
428
+ "7": [
429
+ 137
430
+ ],
431
+ "8": [
432
+ 138
433
+ ],
434
+ "9": [
435
+ 139
436
+ ],
437
+ "̧": [
438
+ 140
439
+ ],
440
+ "̃": [
441
+ 141
442
+ ],
443
+ "̪": [
444
+ 142
445
+ ],
446
+ "̯": [
447
+ 143
448
+ ],
449
+ "̩": [
450
+ 144
451
+ ],
452
+ "ʰ": [
453
+ 145
454
+ ],
455
+ "ˤ": [
456
+ 146
457
+ ],
458
+ "ε": [
459
+ 147
460
+ ],
461
+ "↓": [
462
+ 148
463
+ ],
464
+ "#": [
465
+ 149
466
+ ],
467
+ "\"": [
468
+ 150
469
+ ],
470
+ "↑": [
471
+ 151
472
+ ],
473
+ "̺": [
474
+ 152
475
+ ],
476
+ "̻": [
477
+ 153
478
+ ]
479
+ },
480
+ "num_symbols": 256,
481
+ "num_speakers": 1,
482
+ "speaker_id_map": {},
483
+ "piper_version": "1.0.0",
484
+ "language": {
485
+ "code": "sw_CD",
486
+ "family": "sw",
487
+ "region": "CD",
488
+ "name_native": "Kiswahili",
489
+ "name_english": "Swahili",
490
+ "country_english": "Democratic Republic of the Congo"
491
+ },
492
+ "dataset": "lanfrica"
493
+ }
tr/tr_TR/dfki/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for dfki (medium)
2
+
3
+ * Language: tr_TR (Turkish, Turkey)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/marytts/dfki-ot-data/
11
+ * License: https://creativecommons.org/licenses/by-nc-sa/4.0/
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
tr/tr_TR/dfki/medium/samples/speaker_0.mp3 ADDED
Binary file (107 kB). View file
 
tr/tr_TR/dfki/medium/tr_TR-dfki-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2844717f524ab965d3fe86e60562cbb601d3e456836efcc2196cc3a14112a8fb
3
+ size 63201294
tr/tr_TR/dfki/medium/tr_TR-dfki-medium.onnx.json ADDED
@@ -0,0 +1,498 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "piper_version": "1.2.0",
3
+ "audio": {
4
+ "sample_rate": 22050,
5
+ "quality": "medium"
6
+ },
7
+ "espeak": {
8
+ "voice": "tr"
9
+ },
10
+ "inference": {
11
+ "noise_scale": 0.667,
12
+ "length_scale": 1,
13
+ "noise_w": 0.8,
14
+ "phoneme_silence": {
15
+ ",": 0.1,
16
+ ":": 0.1,
17
+ ";": 0.1
18
+ }
19
+ },
20
+ "phoneme_type": "espeak",
21
+ "phoneme_map": {},
22
+ "phoneme_id_map": {
23
+ "_": [
24
+ 0
25
+ ],
26
+ "^": [
27
+ 1
28
+ ],
29
+ "$": [
30
+ 2
31
+ ],
32
+ " ": [
33
+ 3
34
+ ],
35
+ "!": [
36
+ 4
37
+ ],
38
+ "'": [
39
+ 5
40
+ ],
41
+ "(": [
42
+ 6
43
+ ],
44
+ ")": [
45
+ 7
46
+ ],
47
+ ",": [
48
+ 8
49
+ ],
50
+ "-": [
51
+ 9
52
+ ],
53
+ ".": [
54
+ 10
55
+ ],
56
+ ":": [
57
+ 11
58
+ ],
59
+ ";": [
60
+ 12
61
+ ],
62
+ "?": [
63
+ 13
64
+ ],
65
+ "a": [
66
+ 14
67
+ ],
68
+ "b": [
69
+ 15
70
+ ],
71
+ "c": [
72
+ 16
73
+ ],
74
+ "d": [
75
+ 17
76
+ ],
77
+ "e": [
78
+ 18
79
+ ],
80
+ "f": [
81
+ 19
82
+ ],
83
+ "h": [
84
+ 20
85
+ ],
86
+ "i": [
87
+ 21
88
+ ],
89
+ "j": [
90
+ 22
91
+ ],
92
+ "k": [
93
+ 23
94
+ ],
95
+ "l": [
96
+ 24
97
+ ],
98
+ "m": [
99
+ 25
100
+ ],
101
+ "n": [
102
+ 26
103
+ ],
104
+ "o": [
105
+ 27
106
+ ],
107
+ "p": [
108
+ 28
109
+ ],
110
+ "q": [
111
+ 29
112
+ ],
113
+ "r": [
114
+ 30
115
+ ],
116
+ "s": [
117
+ 31
118
+ ],
119
+ "t": [
120
+ 32
121
+ ],
122
+ "u": [
123
+ 33
124
+ ],
125
+ "v": [
126
+ 34
127
+ ],
128
+ "w": [
129
+ 35
130
+ ],
131
+ "x": [
132
+ 36
133
+ ],
134
+ "y": [
135
+ 37
136
+ ],
137
+ "z": [
138
+ 38
139
+ ],
140
+ "æ": [
141
+ 39
142
+ ],
143
+ "ç": [
144
+ 40
145
+ ],
146
+ "ð": [
147
+ 41
148
+ ],
149
+ "ø": [
150
+ 42
151
+ ],
152
+ "ħ": [
153
+ 43
154
+ ],
155
+ "ŋ": [
156
+ 44
157
+ ],
158
+ "œ": [
159
+ 45
160
+ ],
161
+ "ǀ": [
162
+ 46
163
+ ],
164
+ "ǁ": [
165
+ 47
166
+ ],
167
+ "ǂ": [
168
+ 48
169
+ ],
170
+ "ǃ": [
171
+ 49
172
+ ],
173
+ "ɐ": [
174
+ 50
175
+ ],
176
+ "ɑ": [
177
+ 51
178
+ ],
179
+ "ɒ": [
180
+ 52
181
+ ],
182
+ "ɓ": [
183
+ 53
184
+ ],
185
+ "ɔ": [
186
+ 54
187
+ ],
188
+ "ɕ": [
189
+ 55
190
+ ],
191
+ "ɖ": [
192
+ 56
193
+ ],
194
+ "ɗ": [
195
+ 57
196
+ ],
197
+ "ɘ": [
198
+ 58
199
+ ],
200
+ "ə": [
201
+ 59
202
+ ],
203
+ "ɚ": [
204
+ 60
205
+ ],
206
+ "ɛ": [
207
+ 61
208
+ ],
209
+ "ɜ": [
210
+ 62
211
+ ],
212
+ "ɞ": [
213
+ 63
214
+ ],
215
+ "ɟ": [
216
+ 64
217
+ ],
218
+ "ɠ": [
219
+ 65
220
+ ],
221
+ "ɡ": [
222
+ 66
223
+ ],
224
+ "ɢ": [
225
+ 67
226
+ ],
227
+ "ɣ": [
228
+ 68
229
+ ],
230
+ "ɤ": [
231
+ 69
232
+ ],
233
+ "ɥ": [
234
+ 70
235
+ ],
236
+ "ɦ": [
237
+ 71
238
+ ],
239
+ "ɧ": [
240
+ 72
241
+ ],
242
+ "ɨ": [
243
+ 73
244
+ ],
245
+ "ɪ": [
246
+ 74
247
+ ],
248
+ "ɫ": [
249
+ 75
250
+ ],
251
+ "ɬ": [
252
+ 76
253
+ ],
254
+ "ɭ": [
255
+ 77
256
+ ],
257
+ "ɮ": [
258
+ 78
259
+ ],
260
+ "ɯ": [
261
+ 79
262
+ ],
263
+ "ɰ": [
264
+ 80
265
+ ],
266
+ "ɱ": [
267
+ 81
268
+ ],
269
+ "ɲ": [
270
+ 82
271
+ ],
272
+ "ɳ": [
273
+ 83
274
+ ],
275
+ "ɴ": [
276
+ 84
277
+ ],
278
+ "ɵ": [
279
+ 85
280
+ ],
281
+ "ɶ": [
282
+ 86
283
+ ],
284
+ "ɸ": [
285
+ 87
286
+ ],
287
+ "ɹ": [
288
+ 88
289
+ ],
290
+ "ɺ": [
291
+ 89
292
+ ],
293
+ "ɻ": [
294
+ 90
295
+ ],
296
+ "ɽ": [
297
+ 91
298
+ ],
299
+ "ɾ": [
300
+ 92
301
+ ],
302
+ "ʀ": [
303
+ 93
304
+ ],
305
+ "ʁ": [
306
+ 94
307
+ ],
308
+ "ʂ": [
309
+ 95
310
+ ],
311
+ "ʃ": [
312
+ 96
313
+ ],
314
+ "ʄ": [
315
+ 97
316
+ ],
317
+ "ʈ": [
318
+ 98
319
+ ],
320
+ "ʉ": [
321
+ 99
322
+ ],
323
+ "ʊ": [
324
+ 100
325
+ ],
326
+ "ʋ": [
327
+ 101
328
+ ],
329
+ "ʌ": [
330
+ 102
331
+ ],
332
+ "ʍ": [
333
+ 103
334
+ ],
335
+ "ʎ": [
336
+ 104
337
+ ],
338
+ "ʏ": [
339
+ 105
340
+ ],
341
+ "ʐ": [
342
+ 106
343
+ ],
344
+ "ʑ": [
345
+ 107
346
+ ],
347
+ "ʒ": [
348
+ 108
349
+ ],
350
+ "ʔ": [
351
+ 109
352
+ ],
353
+ "ʕ": [
354
+ 110
355
+ ],
356
+ "ʘ": [
357
+ 111
358
+ ],
359
+ "ʙ": [
360
+ 112
361
+ ],
362
+ "ʛ": [
363
+ 113
364
+ ],
365
+ "ʜ": [
366
+ 114
367
+ ],
368
+ "ʝ": [
369
+ 115
370
+ ],
371
+ "ʟ": [
372
+ 116
373
+ ],
374
+ "ʡ": [
375
+ 117
376
+ ],
377
+ "ʢ": [
378
+ 118
379
+ ],
380
+ "ʲ": [
381
+ 119
382
+ ],
383
+ "ˈ": [
384
+ 120
385
+ ],
386
+ "ˌ": [
387
+ 121
388
+ ],
389
+ "ː": [
390
+ 122
391
+ ],
392
+ "ˑ": [
393
+ 123
394
+ ],
395
+ "˞": [
396
+ 124
397
+ ],
398
+ "β": [
399
+ 125
400
+ ],
401
+ "θ": [
402
+ 126
403
+ ],
404
+ "χ": [
405
+ 127
406
+ ],
407
+ "ᵻ": [
408
+ 128
409
+ ],
410
+ "ⱱ": [
411
+ 129
412
+ ],
413
+ "0": [
414
+ 130
415
+ ],
416
+ "1": [
417
+ 131
418
+ ],
419
+ "2": [
420
+ 132
421
+ ],
422
+ "3": [
423
+ 133
424
+ ],
425
+ "4": [
426
+ 134
427
+ ],
428
+ "5": [
429
+ 135
430
+ ],
431
+ "6": [
432
+ 136
433
+ ],
434
+ "7": [
435
+ 137
436
+ ],
437
+ "8": [
438
+ 138
439
+ ],
440
+ "9": [
441
+ 139
442
+ ],
443
+ "̧": [
444
+ 140
445
+ ],
446
+ "̃": [
447
+ 141
448
+ ],
449
+ "̪": [
450
+ 142
451
+ ],
452
+ "̯": [
453
+ 143
454
+ ],
455
+ "̩": [
456
+ 144
457
+ ],
458
+ "ʰ": [
459
+ 145
460
+ ],
461
+ "ˤ": [
462
+ 146
463
+ ],
464
+ "ε": [
465
+ 147
466
+ ],
467
+ "↓": [
468
+ 148
469
+ ],
470
+ "#": [
471
+ 149
472
+ ],
473
+ "\"": [
474
+ 150
475
+ ],
476
+ "↑": [
477
+ 151
478
+ ],
479
+ "̺": [
480
+ 152
481
+ ],
482
+ "̻": [
483
+ 153
484
+ ]
485
+ },
486
+ "num_symbols": 256,
487
+ "num_speakers": 1,
488
+ "speaker_id_map": {},
489
+ "language": {
490
+ "code": "tr_TR",
491
+ "family": "tr",
492
+ "region": "TR",
493
+ "name_native": "Türkçe",
494
+ "name_english": "Turkish",
495
+ "country_english": "Turkey"
496
+ },
497
+ "dataset": "dfki"
498
+ }
tr/tr_TR/fahrettin/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for fahrettin (medium)
2
+
3
+ * Language: tr_TR (Turkish, Turkey)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/NabuCasa/voice-datasets
11
+ * License: CC0
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
tr/tr_TR/fahrettin/medium/samples/speaker_0.mp3 ADDED
Binary file (82.9 kB). View file
 
tr/tr_TR/fahrettin/medium/tr_TR-fahrettin-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39081c47270180e8a0dfac69b07bf329fb6d039fcc1279dbe26c2daf2848b190
3
+ size 63201294
tr/tr_TR/fahrettin/medium/tr_TR-fahrettin-medium.onnx.json ADDED
@@ -0,0 +1,508 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "tr"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_type": "espeak",
15
+ "phoneme_map": {},
16
+ "phoneme_id_map": {
17
+ " ": [
18
+ 3
19
+ ],
20
+ "!": [
21
+ 4
22
+ ],
23
+ "\"": [
24
+ 150
25
+ ],
26
+ "#": [
27
+ 149
28
+ ],
29
+ "$": [
30
+ 2
31
+ ],
32
+ "'": [
33
+ 5
34
+ ],
35
+ "(": [
36
+ 6
37
+ ],
38
+ ")": [
39
+ 7
40
+ ],
41
+ ",": [
42
+ 8
43
+ ],
44
+ "-": [
45
+ 9
46
+ ],
47
+ ".": [
48
+ 10
49
+ ],
50
+ "0": [
51
+ 130
52
+ ],
53
+ "1": [
54
+ 131
55
+ ],
56
+ "2": [
57
+ 132
58
+ ],
59
+ "3": [
60
+ 133
61
+ ],
62
+ "4": [
63
+ 134
64
+ ],
65
+ "5": [
66
+ 135
67
+ ],
68
+ "6": [
69
+ 136
70
+ ],
71
+ "7": [
72
+ 137
73
+ ],
74
+ "8": [
75
+ 138
76
+ ],
77
+ "9": [
78
+ 139
79
+ ],
80
+ ":": [
81
+ 11
82
+ ],
83
+ ";": [
84
+ 12
85
+ ],
86
+ "?": [
87
+ 13
88
+ ],
89
+ "X": [
90
+ 156
91
+ ],
92
+ "^": [
93
+ 1
94
+ ],
95
+ "_": [
96
+ 0
97
+ ],
98
+ "a": [
99
+ 14
100
+ ],
101
+ "b": [
102
+ 15
103
+ ],
104
+ "c": [
105
+ 16
106
+ ],
107
+ "d": [
108
+ 17
109
+ ],
110
+ "e": [
111
+ 18
112
+ ],
113
+ "f": [
114
+ 19
115
+ ],
116
+ "g": [
117
+ 154
118
+ ],
119
+ "h": [
120
+ 20
121
+ ],
122
+ "i": [
123
+ 21
124
+ ],
125
+ "j": [
126
+ 22
127
+ ],
128
+ "k": [
129
+ 23
130
+ ],
131
+ "l": [
132
+ 24
133
+ ],
134
+ "m": [
135
+ 25
136
+ ],
137
+ "n": [
138
+ 26
139
+ ],
140
+ "o": [
141
+ 27
142
+ ],
143
+ "p": [
144
+ 28
145
+ ],
146
+ "q": [
147
+ 29
148
+ ],
149
+ "r": [
150
+ 30
151
+ ],
152
+ "s": [
153
+ 31
154
+ ],
155
+ "t": [
156
+ 32
157
+ ],
158
+ "u": [
159
+ 33
160
+ ],
161
+ "v": [
162
+ 34
163
+ ],
164
+ "w": [
165
+ 35
166
+ ],
167
+ "x": [
168
+ 36
169
+ ],
170
+ "y": [
171
+ 37
172
+ ],
173
+ "z": [
174
+ 38
175
+ ],
176
+ "æ": [
177
+ 39
178
+ ],
179
+ "ç": [
180
+ 40
181
+ ],
182
+ "ð": [
183
+ 41
184
+ ],
185
+ "ø": [
186
+ 42
187
+ ],
188
+ "ħ": [
189
+ 43
190
+ ],
191
+ "ŋ": [
192
+ 44
193
+ ],
194
+ "œ": [
195
+ 45
196
+ ],
197
+ "ǀ": [
198
+ 46
199
+ ],
200
+ "ǁ": [
201
+ 47
202
+ ],
203
+ "ǂ": [
204
+ 48
205
+ ],
206
+ "ǃ": [
207
+ 49
208
+ ],
209
+ "ɐ": [
210
+ 50
211
+ ],
212
+ "ɑ": [
213
+ 51
214
+ ],
215
+ "ɒ": [
216
+ 52
217
+ ],
218
+ "ɓ": [
219
+ 53
220
+ ],
221
+ "ɔ": [
222
+ 54
223
+ ],
224
+ "ɕ": [
225
+ 55
226
+ ],
227
+ "ɖ": [
228
+ 56
229
+ ],
230
+ "ɗ": [
231
+ 57
232
+ ],
233
+ "ɘ": [
234
+ 58
235
+ ],
236
+ "ə": [
237
+ 59
238
+ ],
239
+ "ɚ": [
240
+ 60
241
+ ],
242
+ "ɛ": [
243
+ 61
244
+ ],
245
+ "ɜ": [
246
+ 62
247
+ ],
248
+ "ɞ": [
249
+ 63
250
+ ],
251
+ "ɟ": [
252
+ 64
253
+ ],
254
+ "ɠ": [
255
+ 65
256
+ ],
257
+ "ɡ": [
258
+ 66
259
+ ],
260
+ "ɢ": [
261
+ 67
262
+ ],
263
+ "ɣ": [
264
+ 68
265
+ ],
266
+ "ɤ": [
267
+ 69
268
+ ],
269
+ "ɥ": [
270
+ 70
271
+ ],
272
+ "ɦ": [
273
+ 71
274
+ ],
275
+ "ɧ": [
276
+ 72
277
+ ],
278
+ "ɨ": [
279
+ 73
280
+ ],
281
+ "ɪ": [
282
+ 74
283
+ ],
284
+ "ɫ": [
285
+ 75
286
+ ],
287
+ "ɬ": [
288
+ 76
289
+ ],
290
+ "ɭ": [
291
+ 77
292
+ ],
293
+ "ɮ": [
294
+ 78
295
+ ],
296
+ "ɯ": [
297
+ 79
298
+ ],
299
+ "ɰ": [
300
+ 80
301
+ ],
302
+ "ɱ": [
303
+ 81
304
+ ],
305
+ "ɲ": [
306
+ 82
307
+ ],
308
+ "ɳ": [
309
+ 83
310
+ ],
311
+ "ɴ": [
312
+ 84
313
+ ],
314
+ "ɵ": [
315
+ 85
316
+ ],
317
+ "ɶ": [
318
+ 86
319
+ ],
320
+ "ɸ": [
321
+ 87
322
+ ],
323
+ "ɹ": [
324
+ 88
325
+ ],
326
+ "ɺ": [
327
+ 89
328
+ ],
329
+ "ɻ": [
330
+ 90
331
+ ],
332
+ "ɽ": [
333
+ 91
334
+ ],
335
+ "ɾ": [
336
+ 92
337
+ ],
338
+ "ʀ": [
339
+ 93
340
+ ],
341
+ "ʁ": [
342
+ 94
343
+ ],
344
+ "ʂ": [
345
+ 95
346
+ ],
347
+ "ʃ": [
348
+ 96
349
+ ],
350
+ "ʄ": [
351
+ 97
352
+ ],
353
+ "ʈ": [
354
+ 98
355
+ ],
356
+ "ʉ": [
357
+ 99
358
+ ],
359
+ "ʊ": [
360
+ 100
361
+ ],
362
+ "ʋ": [
363
+ 101
364
+ ],
365
+ "ʌ": [
366
+ 102
367
+ ],
368
+ "ʍ": [
369
+ 103
370
+ ],
371
+ "ʎ": [
372
+ 104
373
+ ],
374
+ "ʏ": [
375
+ 105
376
+ ],
377
+ "ʐ": [
378
+ 106
379
+ ],
380
+ "ʑ": [
381
+ 107
382
+ ],
383
+ "ʒ": [
384
+ 108
385
+ ],
386
+ "ʔ": [
387
+ 109
388
+ ],
389
+ "ʕ": [
390
+ 110
391
+ ],
392
+ "ʘ": [
393
+ 111
394
+ ],
395
+ "ʙ": [
396
+ 112
397
+ ],
398
+ "ʛ": [
399
+ 113
400
+ ],
401
+ "ʜ": [
402
+ 114
403
+ ],
404
+ "ʝ": [
405
+ 115
406
+ ],
407
+ "ʟ": [
408
+ 116
409
+ ],
410
+ "ʡ": [
411
+ 117
412
+ ],
413
+ "ʢ": [
414
+ 118
415
+ ],
416
+ "ʦ": [
417
+ 155
418
+ ],
419
+ "ʰ": [
420
+ 145
421
+ ],
422
+ "ʲ": [
423
+ 119
424
+ ],
425
+ "ˈ": [
426
+ 120
427
+ ],
428
+ "ˌ": [
429
+ 121
430
+ ],
431
+ "ː": [
432
+ 122
433
+ ],
434
+ "ˑ": [
435
+ 123
436
+ ],
437
+ "˞": [
438
+ 124
439
+ ],
440
+ "ˤ": [
441
+ 146
442
+ ],
443
+ "̃": [
444
+ 141
445
+ ],
446
+ "̊": [
447
+ 158
448
+ ],
449
+ "̝": [
450
+ 157
451
+ ],
452
+ "̧": [
453
+ 140
454
+ ],
455
+ "̩": [
456
+ 144
457
+ ],
458
+ "̪": [
459
+ 142
460
+ ],
461
+ "̯": [
462
+ 143
463
+ ],
464
+ "̺": [
465
+ 152
466
+ ],
467
+ "̻": [
468
+ 153
469
+ ],
470
+ "β": [
471
+ 125
472
+ ],
473
+ "ε": [
474
+ 147
475
+ ],
476
+ "θ": [
477
+ 126
478
+ ],
479
+ "χ": [
480
+ 127
481
+ ],
482
+ "ᵻ": [
483
+ 128
484
+ ],
485
+ "↑": [
486
+ 151
487
+ ],
488
+ "↓": [
489
+ 148
490
+ ],
491
+ "ⱱ": [
492
+ 129
493
+ ]
494
+ },
495
+ "num_symbols": 256,
496
+ "num_speakers": 1,
497
+ "speaker_id_map": {},
498
+ "piper_version": "1.0.0",
499
+ "language": {
500
+ "code": "tr_TR",
501
+ "family": "tr",
502
+ "region": "TR",
503
+ "name_native": "Türkçe",
504
+ "name_english": "Turkish",
505
+ "country_english": "Turkey"
506
+ },
507
+ "dataset": "fahrettin"
508
+ }
uk/uk_UA/lada/x_low/ALIASES ADDED
@@ -0,0 +1 @@
 
 
1
+ uk-lada-x-low
uk/uk_UA/lada/x_low/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for lada (x_low)
2
+
3
+ * Language: uk_UA (Ukrainian, Ukraine)
4
+ * Speakers: 1
5
+ * Quality: x_low
6
+ * Samplerate: 16,000Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://github.com/egorsmkv/ukrainian-tts-datasets/tree/main/lada
11
+ * License: Apache 2.0
12
+
13
+ ## Training
14
+
15
+ Trained from scratch.
uk/uk_UA/lada/x_low/samples/speaker_0.mp3 ADDED
Binary file (97.6 kB). View file
 
uk/uk_UA/lada/x_low/uk_UA-lada-x_low.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8d015d3fc19ea6bd8ac3ca1fd0c0fbac5054c609599ee73799235fd2cf5c786
3
+ size 20628813
uk/uk_UA/lada/x_low/uk_UA-lada-x_low.onnx.json ADDED
@@ -0,0 +1,420 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 16000,
4
+ "quality": "x_low"
5
+ },
6
+ "espeak": {
7
+ "voice": "uk"
8
+ },
9
+ "inference": {
10
+ "noise_scale": 0.667,
11
+ "length_scale": 1,
12
+ "noise_w": 0.8
13
+ },
14
+ "phoneme_map": {},
15
+ "phoneme_id_map": {
16
+ "_": [
17
+ 0
18
+ ],
19
+ "^": [
20
+ 1
21
+ ],
22
+ "$": [
23
+ 2
24
+ ],
25
+ " ": [
26
+ 3
27
+ ],
28
+ "!": [
29
+ 4
30
+ ],
31
+ "'": [
32
+ 5
33
+ ],
34
+ "(": [
35
+ 6
36
+ ],
37
+ ")": [
38
+ 7
39
+ ],
40
+ ",": [
41
+ 8
42
+ ],
43
+ "-": [
44
+ 9
45
+ ],
46
+ ".": [
47
+ 10
48
+ ],
49
+ ":": [
50
+ 11
51
+ ],
52
+ ";": [
53
+ 12
54
+ ],
55
+ "?": [
56
+ 13
57
+ ],
58
+ "a": [
59
+ 14
60
+ ],
61
+ "b": [
62
+ 15
63
+ ],
64
+ "c": [
65
+ 16
66
+ ],
67
+ "d": [
68
+ 17
69
+ ],
70
+ "e": [
71
+ 18
72
+ ],
73
+ "f": [
74
+ 19
75
+ ],
76
+ "h": [
77
+ 20
78
+ ],
79
+ "i": [
80
+ 21
81
+ ],
82
+ "j": [
83
+ 22
84
+ ],
85
+ "k": [
86
+ 23
87
+ ],
88
+ "l": [
89
+ 24
90
+ ],
91
+ "m": [
92
+ 25
93
+ ],
94
+ "n": [
95
+ 26
96
+ ],
97
+ "o": [
98
+ 27
99
+ ],
100
+ "p": [
101
+ 28
102
+ ],
103
+ "q": [
104
+ 29
105
+ ],
106
+ "r": [
107
+ 30
108
+ ],
109
+ "s": [
110
+ 31
111
+ ],
112
+ "t": [
113
+ 32
114
+ ],
115
+ "u": [
116
+ 33
117
+ ],
118
+ "v": [
119
+ 34
120
+ ],
121
+ "w": [
122
+ 35
123
+ ],
124
+ "x": [
125
+ 36
126
+ ],
127
+ "y": [
128
+ 37
129
+ ],
130
+ "z": [
131
+ 38
132
+ ],
133
+ "æ": [
134
+ 39
135
+ ],
136
+ "ç": [
137
+ 40
138
+ ],
139
+ "ð": [
140
+ 41
141
+ ],
142
+ "ø": [
143
+ 42
144
+ ],
145
+ "ħ": [
146
+ 43
147
+ ],
148
+ "ŋ": [
149
+ 44
150
+ ],
151
+ "œ": [
152
+ 45
153
+ ],
154
+ "ǀ": [
155
+ 46
156
+ ],
157
+ "ǁ": [
158
+ 47
159
+ ],
160
+ "ǂ": [
161
+ 48
162
+ ],
163
+ "ǃ": [
164
+ 49
165
+ ],
166
+ "ɐ": [
167
+ 50
168
+ ],
169
+ "ɑ": [
170
+ 51
171
+ ],
172
+ "ɒ": [
173
+ 52
174
+ ],
175
+ "ɓ": [
176
+ 53
177
+ ],
178
+ "ɔ": [
179
+ 54
180
+ ],
181
+ "ɕ": [
182
+ 55
183
+ ],
184
+ "ɖ": [
185
+ 56
186
+ ],
187
+ "ɗ": [
188
+ 57
189
+ ],
190
+ "ɘ": [
191
+ 58
192
+ ],
193
+ "ə": [
194
+ 59
195
+ ],
196
+ "ɚ": [
197
+ 60
198
+ ],
199
+ "ɛ": [
200
+ 61
201
+ ],
202
+ "ɜ": [
203
+ 62
204
+ ],
205
+ "ɞ": [
206
+ 63
207
+ ],
208
+ "ɟ": [
209
+ 64
210
+ ],
211
+ "ɠ": [
212
+ 65
213
+ ],
214
+ "ɡ": [
215
+ 66
216
+ ],
217
+ "ɢ": [
218
+ 67
219
+ ],
220
+ "ɣ": [
221
+ 68
222
+ ],
223
+ "ɤ": [
224
+ 69
225
+ ],
226
+ "ɥ": [
227
+ 70
228
+ ],
229
+ "ɦ": [
230
+ 71
231
+ ],
232
+ "ɧ": [
233
+ 72
234
+ ],
235
+ "ɨ": [
236
+ 73
237
+ ],
238
+ "ɪ": [
239
+ 74
240
+ ],
241
+ "ɫ": [
242
+ 75
243
+ ],
244
+ "ɬ": [
245
+ 76
246
+ ],
247
+ "ɭ": [
248
+ 77
249
+ ],
250
+ "ɮ": [
251
+ 78
252
+ ],
253
+ "ɯ": [
254
+ 79
255
+ ],
256
+ "ɰ": [
257
+ 80
258
+ ],
259
+ "ɱ": [
260
+ 81
261
+ ],
262
+ "ɲ": [
263
+ 82
264
+ ],
265
+ "ɳ": [
266
+ 83
267
+ ],
268
+ "ɴ": [
269
+ 84
270
+ ],
271
+ "ɵ": [
272
+ 85
273
+ ],
274
+ "ɶ": [
275
+ 86
276
+ ],
277
+ "ɸ": [
278
+ 87
279
+ ],
280
+ "ɹ": [
281
+ 88
282
+ ],
283
+ "ɺ": [
284
+ 89
285
+ ],
286
+ "ɻ": [
287
+ 90
288
+ ],
289
+ "ɽ": [
290
+ 91
291
+ ],
292
+ "ɾ": [
293
+ 92
294
+ ],
295
+ "ʀ": [
296
+ 93
297
+ ],
298
+ "ʁ": [
299
+ 94
300
+ ],
301
+ "ʂ": [
302
+ 95
303
+ ],
304
+ "ʃ": [
305
+ 96
306
+ ],
307
+ "ʄ": [
308
+ 97
309
+ ],
310
+ "ʈ": [
311
+ 98
312
+ ],
313
+ "ʉ": [
314
+ 99
315
+ ],
316
+ "ʊ": [
317
+ 100
318
+ ],
319
+ "ʋ": [
320
+ 101
321
+ ],
322
+ "ʌ": [
323
+ 102
324
+ ],
325
+ "ʍ": [
326
+ 103
327
+ ],
328
+ "ʎ": [
329
+ 104
330
+ ],
331
+ "ʏ": [
332
+ 105
333
+ ],
334
+ "ʐ": [
335
+ 106
336
+ ],
337
+ "ʑ": [
338
+ 107
339
+ ],
340
+ "ʒ": [
341
+ 108
342
+ ],
343
+ "ʔ": [
344
+ 109
345
+ ],
346
+ "ʕ": [
347
+ 110
348
+ ],
349
+ "ʘ": [
350
+ 111
351
+ ],
352
+ "ʙ": [
353
+ 112
354
+ ],
355
+ "ʛ": [
356
+ 113
357
+ ],
358
+ "ʜ": [
359
+ 114
360
+ ],
361
+ "ʝ": [
362
+ 115
363
+ ],
364
+ "ʟ": [
365
+ 116
366
+ ],
367
+ "ʡ": [
368
+ 117
369
+ ],
370
+ "ʢ": [
371
+ 118
372
+ ],
373
+ "ʲ": [
374
+ 119
375
+ ],
376
+ "ˈ": [
377
+ 120
378
+ ],
379
+ "ˌ": [
380
+ 121
381
+ ],
382
+ "ː": [
383
+ 122
384
+ ],
385
+ "ˑ": [
386
+ 123
387
+ ],
388
+ "˞": [
389
+ 124
390
+ ],
391
+ "β": [
392
+ 125
393
+ ],
394
+ "θ": [
395
+ 126
396
+ ],
397
+ "χ": [
398
+ 127
399
+ ],
400
+ "ᵻ": [
401
+ 128
402
+ ],
403
+ "ⱱ": [
404
+ 129
405
+ ]
406
+ },
407
+ "num_symbols": 130,
408
+ "num_speakers": 1,
409
+ "speaker_id_map": {},
410
+ "piper_version": "0.2.0",
411
+ "language": {
412
+ "code": "uk_UA",
413
+ "family": "uk",
414
+ "region": "UA",
415
+ "name_native": "украї́нська мо́ва",
416
+ "name_english": "Ukrainian",
417
+ "country_english": "Ukraine"
418
+ },
419
+ "dataset": "lada"
420
+ }
uk/uk_UA/ukrainian_tts/medium/MODEL_CARD ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for ukrainian_tts (medium)
2
+
3
+ * Language: uk_UA (Ukrainian, Ukraine)
4
+ * Speakers: 3
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+ * Phonemes: text
8
+
9
+ ## Dataset
10
+
11
+ * URL: https://github.com/NabuCasa/voice-datasets
12
+ * License: CC0
13
+
14
+ ## Training
15
+
16
+ Trained from scratch.
uk/uk_UA/ukrainian_tts/medium/samples/speaker_0.mp3 ADDED
Binary file (115 kB). View file
 
uk/uk_UA/ukrainian_tts/medium/samples/speaker_1.mp3 ADDED
Binary file (143 kB). View file