|
244 | 244 | } # fmt: skip
|
245 | 245 |
|
246 | 246 | SUNBIRD_SUPPORTED_LANGUAGES = {
|
247 |
| - "eng", "swa", "ach", "lgg", "lug", "nyn", |
248 |
| - "teo", "xog", "ttj", "kin", "myx", |
| 247 | + "ach": "<|su|>", "eng": "<|en|>", "kin": "<|as|>", "lgg": "<|jw|>", "lug": "<|ba|>", "myx": "<|mg|>", |
| 248 | + "nyn": "<|ha|>", "swa": "<|sw|>", "teo": "<|ln|>", "ttj": "<|tt|>", "xog": "<|haw|>" |
249 | 249 | } # fmt: skip
|
250 | 250 |
|
| 251 | + |
251 | 252 | # https://translation.ghananlp.org/api-details#api=ghananlp-translation-webservice-api
|
252 | 253 | GHANA_NLP_SUPPORTED = {'en': 'English', 'tw': 'Twi', 'gaa': 'Ga', 'ee': 'Ewe', 'fat': 'Fante', 'dag': 'Dagbani',
|
253 | 254 | 'gur': 'Gurene', 'yo': 'Yoruba', 'ki': 'Kikuyu', 'luo': 'Luo', 'mer': 'Kimeru'} # fmt: skip
|
@@ -1301,6 +1302,8 @@ def run_asr(
|
1301 | 1302 | # don't pass language or task
|
1302 | 1303 | kwargs.pop("task", None)
|
1303 | 1304 | kwargs["max_length"] = 448
|
| 1305 | + elif selected_model == AsrModels.whisper_sunbird_large_v3: |
| 1306 | + kwargs["language"] = SUNBIRD_SUPPORTED_LANGUAGES[language.strip()] |
1304 | 1307 | elif "whisper" in selected_model.name:
|
1305 | 1308 | forced_lang = forced_asr_languages.get(selected_model)
|
1306 | 1309 | if forced_lang:
|
|
0 commit comments