ONNX
Michael Hansen committed on
Commit
aae8b0c
·
1 Parent(s): 3b9e4ab

Add arjun (ml_IN)

Browse files
_script/voicefest.py CHANGED
@@ -43,6 +43,7 @@ _LANGUAGES = {
43
  "nl_BE": Language("Nederlands", "Dutch", "Belgium"),
44
  "nl_NL": Language("Nederlands", "Dutch", "Netherlands"),
45
  "no_NO": Language("Norsk", "Norwegian", "Norway"),
 
46
  "pl_PL": Language("Polski", "Polish", "Poland"),
47
  "pt_BR": Language("Português", "Portuguese", "Brazil"),
48
  "pt_PT": Language("Português", "Portuguese", "Portugal"),
 
43
  "nl_BE": Language("Nederlands", "Dutch", "Belgium"),
44
  "nl_NL": Language("Nederlands", "Dutch", "Netherlands"),
45
  "no_NO": Language("Norsk", "Norwegian", "Norway"),
46
+ "ml_IN": Language("മലയാളം", "Malayalam", "India"),
47
  "pl_PL": Language("Polski", "Polish", "Poland"),
48
  "pt_BR": Language("Português", "Portuguese", "Brazil"),
49
  "pt_PT": Language("Português", "Portuguese", "Portugal"),
ml/ml_IN/arjun/medium/MODEL_CARD ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Model card for arjun (medium)
2
+
3
+ * Language: ml_IN (Malayalam, India)
4
+ * Speakers: 1
5
+ * Quality: medium
6
+ * Samplerate: 22,050Hz
7
+
8
+ ## Dataset
9
+
10
+ * URL: https://www.kaggle.com/code/mpwolke/indic-tts-malayalam-speech-corpus
11
+ * License: See URL
12
+
13
+ ## Training
14
+
15
+ Finetuned from U.S. English lessac voice (medium quality).
ml/ml_IN/arjun/medium/ml_IN-arjun-medium.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e881130516a874306972a07dcf262e6900140430c5658131121744a80ef3f11b
3
+ size 62950044
ml/ml_IN/arjun/medium/ml_IN-arjun-medium.onnx.json ADDED
@@ -0,0 +1,512 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
+ },
6
+ "espeak": {
7
+ "voice": "ml"
8
+ },
9
+ "phoneme_type": "espeak",
10
+ "piper_version": "1.3.0",
11
+ "num_symbols": 256,
12
+ "num_speakers": 1,
13
+ "inference": {
14
+ "noise_scale": 0.667,
15
+ "length_scale": 1.0,
16
+ "noise_w": 0.8
17
+ },
18
+ "phoneme_id_map": {
19
+ "_": [
20
+ 0
21
+ ],
22
+ "^": [
23
+ 1
24
+ ],
25
+ "$": [
26
+ 2
27
+ ],
28
+ " ": [
29
+ 3
30
+ ],
31
+ "!": [
32
+ 4
33
+ ],
34
+ "'": [
35
+ 5
36
+ ],
37
+ "(": [
38
+ 6
39
+ ],
40
+ ")": [
41
+ 7
42
+ ],
43
+ ",": [
44
+ 8
45
+ ],
46
+ "-": [
47
+ 9
48
+ ],
49
+ ".": [
50
+ 10
51
+ ],
52
+ ":": [
53
+ 11
54
+ ],
55
+ ";": [
56
+ 12
57
+ ],
58
+ "?": [
59
+ 13
60
+ ],
61
+ "a": [
62
+ 14
63
+ ],
64
+ "b": [
65
+ 15
66
+ ],
67
+ "c": [
68
+ 16
69
+ ],
70
+ "d": [
71
+ 17
72
+ ],
73
+ "e": [
74
+ 18
75
+ ],
76
+ "f": [
77
+ 19
78
+ ],
79
+ "h": [
80
+ 20
81
+ ],
82
+ "i": [
83
+ 21
84
+ ],
85
+ "j": [
86
+ 22
87
+ ],
88
+ "k": [
89
+ 23
90
+ ],
91
+ "l": [
92
+ 24
93
+ ],
94
+ "m": [
95
+ 25
96
+ ],
97
+ "n": [
98
+ 26
99
+ ],
100
+ "o": [
101
+ 27
102
+ ],
103
+ "p": [
104
+ 28
105
+ ],
106
+ "q": [
107
+ 29
108
+ ],
109
+ "r": [
110
+ 30
111
+ ],
112
+ "s": [
113
+ 31
114
+ ],
115
+ "t": [
116
+ 32
117
+ ],
118
+ "u": [
119
+ 33
120
+ ],
121
+ "v": [
122
+ 34
123
+ ],
124
+ "w": [
125
+ 35
126
+ ],
127
+ "x": [
128
+ 36
129
+ ],
130
+ "y": [
131
+ 37
132
+ ],
133
+ "z": [
134
+ 38
135
+ ],
136
+ "æ": [
137
+ 39
138
+ ],
139
+ "ç": [
140
+ 40
141
+ ],
142
+ "ð": [
143
+ 41
144
+ ],
145
+ "ø": [
146
+ 42
147
+ ],
148
+ "ħ": [
149
+ 43
150
+ ],
151
+ "ŋ": [
152
+ 44
153
+ ],
154
+ "œ": [
155
+ 45
156
+ ],
157
+ "ǀ": [
158
+ 46
159
+ ],
160
+ "ǁ": [
161
+ 47
162
+ ],
163
+ "ǂ": [
164
+ 48
165
+ ],
166
+ "ǃ": [
167
+ 49
168
+ ],
169
+ "ɐ": [
170
+ 50
171
+ ],
172
+ "ɑ": [
173
+ 51
174
+ ],
175
+ "ɒ": [
176
+ 52
177
+ ],
178
+ "ɓ": [
179
+ 53
180
+ ],
181
+ "ɔ": [
182
+ 54
183
+ ],
184
+ "ɕ": [
185
+ 55
186
+ ],
187
+ "ɖ": [
188
+ 56
189
+ ],
190
+ "ɗ": [
191
+ 57
192
+ ],
193
+ "ɘ": [
194
+ 58
195
+ ],
196
+ "ə": [
197
+ 59
198
+ ],
199
+ "ɚ": [
200
+ 60
201
+ ],
202
+ "ɛ": [
203
+ 61
204
+ ],
205
+ "ɜ": [
206
+ 62
207
+ ],
208
+ "ɞ": [
209
+ 63
210
+ ],
211
+ "ɟ": [
212
+ 64
213
+ ],
214
+ "ɠ": [
215
+ 65
216
+ ],
217
+ "ɡ": [
218
+ 66
219
+ ],
220
+ "ɢ": [
221
+ 67
222
+ ],
223
+ "ɣ": [
224
+ 68
225
+ ],
226
+ "ɤ": [
227
+ 69
228
+ ],
229
+ "ɥ": [
230
+ 70
231
+ ],
232
+ "ɦ": [
233
+ 71
234
+ ],
235
+ "ɧ": [
236
+ 72
237
+ ],
238
+ "ɨ": [
239
+ 73
240
+ ],
241
+ "ɪ": [
242
+ 74
243
+ ],
244
+ "ɫ": [
245
+ 75
246
+ ],
247
+ "ɬ": [
248
+ 76
249
+ ],
250
+ "ɭ": [
251
+ 77
252
+ ],
253
+ "ɮ": [
254
+ 78
255
+ ],
256
+ "ɯ": [
257
+ 79
258
+ ],
259
+ "ɰ": [
260
+ 80
261
+ ],
262
+ "ɱ": [
263
+ 81
264
+ ],
265
+ "ɲ": [
266
+ 82
267
+ ],
268
+ "ɳ": [
269
+ 83
270
+ ],
271
+ "ɴ": [
272
+ 84
273
+ ],
274
+ "ɵ": [
275
+ 85
276
+ ],
277
+ "ɶ": [
278
+ 86
279
+ ],
280
+ "ɸ": [
281
+ 87
282
+ ],
283
+ "ɹ": [
284
+ 88
285
+ ],
286
+ "ɺ": [
287
+ 89
288
+ ],
289
+ "ɻ": [
290
+ 90
291
+ ],
292
+ "ɽ": [
293
+ 91
294
+ ],
295
+ "ɾ": [
296
+ 92
297
+ ],
298
+ "ʀ": [
299
+ 93
300
+ ],
301
+ "ʁ": [
302
+ 94
303
+ ],
304
+ "ʂ": [
305
+ 95
306
+ ],
307
+ "ʃ": [
308
+ 96
309
+ ],
310
+ "ʄ": [
311
+ 97
312
+ ],
313
+ "ʈ": [
314
+ 98
315
+ ],
316
+ "ʉ": [
317
+ 99
318
+ ],
319
+ "ʊ": [
320
+ 100
321
+ ],
322
+ "ʋ": [
323
+ 101
324
+ ],
325
+ "ʌ": [
326
+ 102
327
+ ],
328
+ "ʍ": [
329
+ 103
330
+ ],
331
+ "ʎ": [
332
+ 104
333
+ ],
334
+ "ʏ": [
335
+ 105
336
+ ],
337
+ "ʐ": [
338
+ 106
339
+ ],
340
+ "ʑ": [
341
+ 107
342
+ ],
343
+ "ʒ": [
344
+ 108
345
+ ],
346
+ "ʔ": [
347
+ 109
348
+ ],
349
+ "ʕ": [
350
+ 110
351
+ ],
352
+ "ʘ": [
353
+ 111
354
+ ],
355
+ "ʙ": [
356
+ 112
357
+ ],
358
+ "ʛ": [
359
+ 113
360
+ ],
361
+ "ʜ": [
362
+ 114
363
+ ],
364
+ "ʝ": [
365
+ 115
366
+ ],
367
+ "ʟ": [
368
+ 116
369
+ ],
370
+ "ʡ": [
371
+ 117
372
+ ],
373
+ "ʢ": [
374
+ 118
375
+ ],
376
+ "ʲ": [
377
+ 119
378
+ ],
379
+ "ˈ": [
380
+ 120
381
+ ],
382
+ "ˌ": [
383
+ 121
384
+ ],
385
+ "ː": [
386
+ 122
387
+ ],
388
+ "ˑ": [
389
+ 123
390
+ ],
391
+ "˞": [
392
+ 124
393
+ ],
394
+ "β": [
395
+ 125
396
+ ],
397
+ "θ": [
398
+ 126
399
+ ],
400
+ "χ": [
401
+ 127
402
+ ],
403
+ "ᵻ": [
404
+ 128
405
+ ],
406
+ "ⱱ": [
407
+ 129
408
+ ],
409
+ "0": [
410
+ 130
411
+ ],
412
+ "1": [
413
+ 131
414
+ ],
415
+ "2": [
416
+ 132
417
+ ],
418
+ "3": [
419
+ 133
420
+ ],
421
+ "4": [
422
+ 134
423
+ ],
424
+ "5": [
425
+ 135
426
+ ],
427
+ "6": [
428
+ 136
429
+ ],
430
+ "7": [
431
+ 137
432
+ ],
433
+ "8": [
434
+ 138
435
+ ],
436
+ "9": [
437
+ 139
438
+ ],
439
+ "̧": [
440
+ 140
441
+ ],
442
+ "̃": [
443
+ 141
444
+ ],
445
+ "̪": [
446
+ 142
447
+ ],
448
+ "̯": [
449
+ 143
450
+ ],
451
+ "̩": [
452
+ 144
453
+ ],
454
+ "ʰ": [
455
+ 145
456
+ ],
457
+ "ˤ": [
458
+ 146
459
+ ],
460
+ "ε": [
461
+ 147
462
+ ],
463
+ "↓": [
464
+ 148
465
+ ],
466
+ "#": [
467
+ 149
468
+ ],
469
+ "\"": [
470
+ 150
471
+ ],
472
+ "↑": [
473
+ 151
474
+ ],
475
+ "̺": [
476
+ 152
477
+ ],
478
+ "̻": [
479
+ 153
480
+ ],
481
+ "g": [
482
+ 154
483
+ ],
484
+ "ʦ": [
485
+ 155
486
+ ],
487
+ "X": [
488
+ 156
489
+ ],
490
+ "̝": [
491
+ 157
492
+ ],
493
+ "̊": [
494
+ 158
495
+ ],
496
+ "ɝ": [
497
+ 159
498
+ ],
499
+ "ʷ": [
500
+ 160
501
+ ]
502
+ },
503
+ "language": {
504
+ "code": "ml_IN",
505
+ "family": "ml",
506
+ "region": "IN",
507
+ "name_native": "മലയാളം",
508
+ "name_english": "Malayalam",
509
+ "country_english": "India"
510
+ },
511
+ "dataset": "arjun"
512
+ }
ml/ml_IN/meera/medium/ml_IN-meera-medium.onnx.json CHANGED
@@ -1,11 +1,13 @@
1
  {
2
  "audio": {
3
- "sample_rate": 22050
 
4
  },
5
  "espeak": {
6
  "voice": "ml"
7
  },
8
  "phoneme_type": "espeak",
 
9
  "num_symbols": 256,
10
  "num_speakers": 1,
11
  "inference": {
@@ -497,5 +499,14 @@
497
  "ʷ": [
498
  160
499
  ]
500
- }
501
- }
 
 
 
 
 
 
 
 
 
 
1
  {
2
  "audio": {
3
+ "sample_rate": 22050,
4
+ "quality": "medium"
5
  },
6
  "espeak": {
7
  "voice": "ml"
8
  },
9
  "phoneme_type": "espeak",
10
+ "piper_version": "1.3.0",
11
  "num_symbols": 256,
12
  "num_speakers": 1,
13
  "inference": {
 
499
  "ʷ": [
500
  160
501
  ]
502
+ },
503
+ "language": {
504
+ "code": "ml_IN",
505
+ "family": "ml",
506
+ "region": "IN",
507
+ "name_native": "മലയാളം",
508
+ "name_english": "Malayalam",
509
+ "country_english": "India"
510
+ },
511
+ "dataset": "meera"
512
+ }
voices.json CHANGED
@@ -5264,6 +5264,66 @@
5264
  },
5265
  "aliases": []
5266
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5267
  "ne_NP-google-medium": {
5268
  "key": "ne_NP-google-medium",
5269
  "name": "google",
 
5264
  },
5265
  "aliases": []
5266
  },
5267
+ "ml_IN-arjun-medium": {
5268
+ "key": "ml_IN-arjun-medium",
5269
+ "name": "arjun",
5270
+ "language": {
5271
+ "code": "ml_IN",
5272
+ "family": "ml",
5273
+ "region": "IN",
5274
+ "name_native": "മലയാളം",
5275
+ "name_english": "Malayalam",
5276
+ "country_english": "India"
5277
+ },
5278
+ "quality": "medium",
5279
+ "num_speakers": 1,
5280
+ "speaker_id_map": {},
5281
+ "files": {
5282
+ "ml/ml_IN/arjun/medium/ml_IN-arjun-medium.onnx": {
5283
+ "size_bytes": 62950044,
5284
+ "md5_digest": "4f20109c108aa80f46df85ab9cda5daa"
5285
+ },
5286
+ "ml/ml_IN/arjun/medium/ml_IN-arjun-medium.onnx.json": {
5287
+ "size_bytes": 5044,
5288
+ "md5_digest": "18454efcad5bb889ee4cb1cb035993f5"
5289
+ },
5290
+ "ml/ml_IN/arjun/medium/MODEL_CARD": {
5291
+ "size_bytes": 308,
5292
+ "md5_digest": "eb0037396b93f38ffbc093dba42cf8be"
5293
+ }
5294
+ },
5295
+ "aliases": []
5296
+ },
5297
+ "ml_IN-meera-medium": {
5298
+ "key": "ml_IN-meera-medium",
5299
+ "name": "meera",
5300
+ "language": {
5301
+ "code": "ml_IN",
5302
+ "family": "ml",
5303
+ "region": "IN",
5304
+ "name_native": "മലയാളം",
5305
+ "name_english": "Malayalam",
5306
+ "country_english": "India"
5307
+ },
5308
+ "quality": "medium",
5309
+ "num_speakers": 1,
5310
+ "speaker_id_map": {},
5311
+ "files": {
5312
+ "ml/ml_IN/meera/medium/ml_IN-meera-medium.onnx": {
5313
+ "size_bytes": 62950044,
5314
+ "md5_digest": "3eb7b05d25c1551f7a7cec1e1c153b1f"
5315
+ },
5316
+ "ml/ml_IN/meera/medium/ml_IN-meera-medium.onnx.json": {
5317
+ "size_bytes": 5045,
5318
+ "md5_digest": "64c2eee28c62e3a072ccc2ea3d812748"
5319
+ },
5320
+ "ml/ml_IN/meera/medium/MODEL_CARD": {
5321
+ "size_bytes": 308,
5322
+ "md5_digest": "626a0c1d744d0ce6ffca95665c526939"
5323
+ }
5324
+ },
5325
+ "aliases": []
5326
+ },
5327
  "ne_NP-google-medium": {
5328
  "key": "ne_NP-google-medium",
5329
  "name": "google",