from text.symbols import *

# Reverse lookup table: symbol -> its index in ``symbols``.
# NOTE(review): ``symbols``, ``language_tone_start_map`` and
# ``language_id_map`` are presumably provided by the star import above --
# confirm against text/symbols.py.
_symbol_to_id = {s: i for i, s in enumerate(symbols)}


def cleaned_text_to_sequence(cleaned_text, tones, language):
    """Convert cleaned symbols and tones into model-ready ID sequences.

    Args:
        cleaned_text: iterable of symbols; each one must be a key of
            ``_symbol_to_id``.
        tones: iterable of tone values; each is shifted by the tone start
            offset looked up for ``language``.
        language: key used to look up both ``language_tone_start_map`` and
            ``language_id_map``.

    Returns:
        A tuple ``(phones, tones, lang_ids)`` of three lists:
        ``phones`` holds the symbol IDs, ``tones`` holds the offset tone
        values, and ``lang_ids`` repeats the language ID once per phone.

    Raises:
        KeyError: if a symbol is missing from ``_symbol_to_id``. A language
            missing from the language maps fails the same way, assuming
            those maps are plain dicts.
    """
    phones = [_symbol_to_id[symbol] for symbol in cleaned_text]

    tone_start = language_tone_start_map[language]
    tones = [tone + tone_start for tone in tones]

    # One language ID per phone, so lang_ids always has len(phones) entries.
    lang_id = language_id_map[language]
    lang_ids = [lang_id] * len(phones)

    return phones, tones, lang_ids


def get_bert(
    text,
    word2ph,
    language,
    device,
    assist_text=None,
    assist_text_weight=0.7,
    ignore_unknown=False,
):
    """Dispatch to the language-specific ``get_bert_feature`` backend.

    The backend module is imported inside the matching branch, so only the
    module for the requested language is imported on a given call.

    Args:
        text: forwarded unchanged to the backend.
        word2ph: forwarded unchanged to the backend.
        language: one of ``"ZH"``, ``"EN"`` or ``"JP"``.
        device: forwarded unchanged to the backend.
        assist_text: forwarded unchanged to the backend (default ``None``).
        assist_text_weight: forwarded unchanged to the backend
            (default ``0.7``).
        ignore_unknown: forwarded to the ``"JP"`` backend only; the
            ``"ZH"`` and ``"EN"`` backends are called without it.

    Returns:
        Whatever the selected backend's ``get_bert_feature`` returns.

    Raises:
        ValueError: if ``language`` is not one of the supported codes.
    """
    if language == "ZH":
        from .chinese_bert import get_bert_feature as zh_bert

        return zh_bert(text, word2ph, device, assist_text, assist_text_weight)
    elif language == "EN":
        from .english_bert_mock import get_bert_feature as en_bert

        return en_bert(text, word2ph, device, assist_text, assist_text_weight)
    elif language == "JP":
        from .japanese_bert import get_bert_feature as jp_bert

        return jp_bert(
            text, word2ph, device, assist_text, assist_text_weight, ignore_unknown
        )
    else:
        raise ValueError(f"Language {language} not supported")