From 3db0dec08aa1f55e6762684d7f6acf890e2e8d94 Mon Sep 17 00:00:00 2001 From: David Martin Rius Date: Wed, 28 Feb 2024 20:23:53 +0100 Subject: [PATCH] Add 2 functions to verify any spacy language can be instantiated. By now, the only one that needs special packages is Korean. So, all languages works well but Korean --- TTS/tts/layers/xtts/tokenizer.py | 18 +++++++++++++++++- 1 file changed, 17 insertions(+), 1 deletion(-) diff --git a/TTS/tts/layers/xtts/tokenizer.py b/TTS/tts/layers/xtts/tokenizer.py index fb941d7033..5d580a55ef 100644 --- a/TTS/tts/layers/xtts/tokenizer.py +++ b/TTS/tts/layers/xtts/tokenizer.py @@ -15,11 +15,27 @@ from TTS.tts.layers.xtts.zh_num2words import TextNorm as zh_num2words +import spacy + +# These 2 functions are to verify that any language can be instantiated +def get_spacy_available_langs(): + from pathlib import Path + spacy_path = Path(spacy.__file__.replace('__init__.py','')) + spacy_langs = spacy_path / 'lang' + SPACY_LANGS = [str(x).split('/')[-1] for x in spacy_langs.iterdir() if x.is_dir() and str(x).split('/')[-1] != '__pycache__'] + print("Available languages in Spacy:", SPACY_LANGS) + return SPACY_LANGS +def get_all_spacy_langs(): + SPACY_LANGS = get_spacy_available_langs() + spacy_lang_instances = [] + for lang in SPACY_LANGS: + spacy_lang_instances.append(get_spacy_lang(lang)) def get_spacy_lang(lang): try: lang_model = get_lang_class(lang)() - except ImportError: + except ImportError as e: + print("Error", e) # Fallback to English if the language model is not available lang_model = English() return lang_model