Skip to content

Commit a34f2bf

Browse files
authored
add audio to audio translation to SeamlessM4T (rsxdalv#284)
* add audio to audio translation to SeamlessM4T * readme
1 parent d04bafe commit a34f2bf

File tree

3 files changed

+203
-164
lines changed

3 files changed

+203
-164
lines changed

README.md

+1
Original file line numberDiff line numberDiff line change
@@ -43,6 +43,7 @@ https://github.com/rsxdalv/tts-generation-webui/discussions/186#discussioncommen
4343
## Changelog
4444
Mar 10:
4545
* Add Batching to React UI Magnet (#283)
46+
* Add audio-to-audio translation to SeamlessM4T (#284)
4647

4748
Mar 5:
4849
* Add Batching to React UI MusicGen (#281), thanks to https://github.com/Aamir3d for requesting this and providing feedback
+127
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,127 @@
1+
# Maps each language code (three lowercase letters, plus the "cmn_Hant"
# variant) to its English display name.
#
# Every code appears exactly once: a repeated key in a dict literal silently
# overrides the earlier entry, so duplicates only hide future typos.
language_code_to_name = {
    "afr": "Afrikaans",
    "amh": "Amharic",
    "arb": "Modern Standard Arabic",
    "ary": "Moroccan Arabic",
    "arz": "Egyptian Arabic",
    "asm": "Assamese",
    "ast": "Asturian",
    "azj": "North Azerbaijani",
    "bel": "Belarusian",
    "ben": "Bengali",
    "bos": "Bosnian",
    "bul": "Bulgarian",
    "cat": "Catalan",
    "ceb": "Cebuano",
    "ces": "Czech",
    "ckb": "Central Kurdish",
    "cmn": "Mandarin Chinese",
    "cmn_Hant": "Traditional Mandarin Chinese",
    "cym": "Welsh",
    "dan": "Danish",
    "deu": "German",
    "ell": "Greek",
    "eng": "English",
    "est": "Estonian",
    "eus": "Basque",
    "fin": "Finnish",
    "fra": "French",
    "gaz": "West Central Oromo",
    "gle": "Irish",
    "glg": "Galician",
    "guj": "Gujarati",
    "heb": "Hebrew",
    "hin": "Hindi",
    "hrv": "Croatian",
    "hun": "Hungarian",
    "hye": "Armenian",
    "ibo": "Igbo",
    "ind": "Indonesian",
    "isl": "Icelandic",
    "ita": "Italian",
    "jav": "Javanese",
    "jpn": "Japanese",
    "kam": "Kamba",
    "kan": "Kannada",
    "kat": "Georgian",
    "kaz": "Kazakh",
    "kea": "Kabuverdianu",
    "khk": "Halh Mongolian",
    "khm": "Khmer",
    "kir": "Kyrgyz",
    "kor": "Korean",
    "lao": "Lao",
    "lit": "Lithuanian",
    "ltz": "Luxembourgish",
    "lug": "Ganda",
    "luo": "Luo",
    "lvs": "Standard Latvian",
    "mai": "Maithili",
    "mal": "Malayalam",
    "mar": "Marathi",
    "mkd": "Macedonian",
    "mlt": "Maltese",
    "mni": "Meitei",
    "mya": "Burmese",
    "nld": "Dutch",
    "nno": "Norwegian Nynorsk",
    "nob": "Norwegian Bokm\u00e5l",
    "npi": "Nepali",
    "nya": "Nyanja",
    "oci": "Occitan",
    "ory": "Odia",
    "pan": "Punjabi",
    "pbt": "Southern Pashto",
    "pes": "Western Persian",
    "pol": "Polish",
    "por": "Portuguese",
    "ron": "Romanian",
    "rus": "Russian",
    "slk": "Slovak",
    "slv": "Slovenian",
    "sna": "Shona",
    "snd": "Sindhi",
    "som": "Somali",
    "spa": "Spanish",
    "srp": "Serbian",
    "swe": "Swedish",
    "swh": "Swahili",
    "tam": "Tamil",
    "tel": "Telugu",
    "tgk": "Tajik",
    "tgl": "Tagalog",
    "tha": "Thai",
    "tur": "Turkish",
    "ukr": "Ukrainian",
    "urd": "Urdu",
    "uzn": "Northern Uzbek",
    "vie": "Vietnamese",
    "xho": "Xhosa",
    "yor": "Yoruba",
    "yue": "Cantonese",
    "zlm": "Colloquial Malay",
    "zsm": "Standard Malay",
    "zul": "Zulu",

    # Entries kept after the alphabetical run so iteration order is unchanged.
    "fuv": "Nigerian Fulfulde",
    "sat": "Santali",
}
114+
115+
116+
def get_language_name(language_code):
    """Return the display name stored for ``language_code``.

    The lookup goes straight to ``language_code_to_name``.

    Raises:
        KeyError: if ``language_code`` is not a key of that mapping.
    """
    name = language_code_to_name[language_code]
    return name
118+
119+
# Language-code lists, one per modality and direction. Each list is in
# ascending code order; rows are grouped by initial letter so adding or
# removing a code touches a single short line.
# NOTE(review): presumably these mirror the languages the model supports for
# each input/output kind — confirm against the model's documentation.
text_source_codes = [
    "afr", "amh", "arb", "ary", "arz", "asm", "azj",
    "bel", "ben", "bos", "bul",
    "cat", "ceb", "ces", "ckb", "cmn", "cmn_Hant", "cym",
    "dan", "deu",
    "ell", "eng", "est", "eus",
    "fin", "fra", "fuv",
    "gaz", "gle", "glg", "guj",
    "heb", "hin", "hrv", "hun", "hye",
    "ibo", "ind", "isl", "ita",
    "jav", "jpn",
    "kan", "kat", "kaz", "khk", "khm", "kir", "kor",
    "lao", "lit", "lug", "luo", "lvs",
    "mai", "mal", "mar", "mkd", "mlt", "mni", "mya",
    "nld", "nno", "nob", "npi", "nya",
    "ory",
    "pan", "pbt", "pes", "pol", "por",
    "ron", "rus",
    "slk", "slv", "sna", "snd", "som", "spa", "srp", "swe", "swh",
    "tam", "tel", "tgk", "tgl", "tha", "tur",
    "ukr", "urd", "uzn",
    "vie",
    "yor", "yue",
    "zsm", "zul",
]

# Holds the same codes as text_source_codes, but is a separate list object.
text_target_codes = [
    "afr", "amh", "arb", "ary", "arz", "asm", "azj",
    "bel", "ben", "bos", "bul",
    "cat", "ceb", "ces", "ckb", "cmn", "cmn_Hant", "cym",
    "dan", "deu",
    "ell", "eng", "est", "eus",
    "fin", "fra", "fuv",
    "gaz", "gle", "glg", "guj",
    "heb", "hin", "hrv", "hun", "hye",
    "ibo", "ind", "isl", "ita",
    "jav", "jpn",
    "kan", "kat", "kaz", "khk", "khm", "kir", "kor",
    "lao", "lit", "lug", "luo", "lvs",
    "mai", "mal", "mar", "mkd", "mlt", "mni", "mya",
    "nld", "nno", "nob", "npi", "nya",
    "ory",
    "pan", "pbt", "pes", "pol", "por",
    "ron", "rus",
    "slk", "slv", "sna", "snd", "som", "spa", "srp", "swe", "swh",
    "tam", "tel", "tgk", "tgl", "tha", "tur",
    "ukr", "urd", "uzn",
    "vie",
    "yor", "yue",
    "zsm", "zul",
]

# Differs from the text lists: adds ast, kam, kea, ltz, oci, xho and zlm,
# and does not contain zsm.
speech_source_codes = [
    "afr", "amh", "arb", "ary", "arz", "asm", "ast", "azj",
    "bel", "ben", "bos", "bul",
    "cat", "ceb", "ces", "ckb", "cmn", "cmn_Hant", "cym",
    "dan", "deu",
    "ell", "eng", "est", "eus",
    "fin", "fra", "fuv",
    "gaz", "gle", "glg", "guj",
    "heb", "hin", "hrv", "hun", "hye",
    "ibo", "ind", "isl", "ita",
    "jav", "jpn",
    "kam", "kan", "kat", "kaz", "kea", "khk", "khm", "kir", "kor",
    "lao", "lit", "ltz", "lug", "luo", "lvs",
    "mai", "mal", "mar", "mkd", "mlt", "mni", "mya",
    "nld", "nno", "nob", "npi", "nya",
    "oci", "ory",
    "pan", "pbt", "pes", "pol", "por",
    "ron", "rus",
    "slk", "slv", "sna", "snd", "som", "spa", "srp", "swe", "swh",
    "tam", "tel", "tgk", "tgl", "tha", "tur",
    "ukr", "urd", "uzn",
    "vie",
    "xho",
    "yor", "yue",
    "zlm", "zul",
]

speech_target_codes = [
    "arb", "ben", "cat", "ces", "cmn", "cmn_Hant", "cym", "dan", "deu",
    "eng", "est", "fin", "fra", "hin", "ind", "ita", "jpn", "kor",
    "mlt", "nld", "pes", "pol", "por", "ron", "rus", "slk", "spa",
    "swe", "swh", "tel", "tgl", "tha", "tur", "ukr", "urd", "uzn", "vie",
]
123+
124+
# Display-name lists, built by passing every code of the matching *_codes
# list through get_language_name, in the same order.
text_source_languages = list(map(get_language_name, text_source_codes))
text_target_languages = list(map(get_language_name, text_target_codes))
speech_source_languages = list(map(get_language_name, speech_source_codes))
speech_target_languages = list(map(get_language_name, speech_target_codes))

0 commit comments

Comments
 (0)