"""Text cleaners that normalize Japanese and Korean input strings."""

import re

from src.text.korean import (
    latin_to_hangul,
    number_to_hangul,
    divide_hangul,
    korean_to_lazy_ipa,
    korean_to_ipa,
)

# Single-character clean-up applied at the end of japanese_cleaners2:
# brackets, parentheses and braces are dropped, '*' becomes a space.
_JAPANESE_SYMBOL_TABLE = str.maketrans({
    '(': None,
    ')': None,
    '[': None,
    ']': None,
    '{': None,
    '}': None,
    '*': ' ',
})


def japanese_cleaners(text: str) -> str:
    """Romanize ``text`` and make sure it ends with a terminator.

    The text is passed through ``japanese_to_romaji_with_accent``. If the
    result is empty or its last character is an ASCII letter, a ``'.'`` is
    appended.

    Args:
        text: Input string to clean.

    Returns:
        The romanized string, possibly with a trailing ``'.'`` added.
    """
    # Imported lazily, inside the function, as in the original code.
    # NOTE(review): this path is `text.japanese` while the Korean helpers come
    # from `src.text.korean` - confirm both resolve in the target environment.
    from text.japanese import japanese_to_romaji_with_accent

    text = japanese_to_romaji_with_accent(text)
    if not text or re.match('[A-Za-z]', text[-1]):
        text += '.'
    return text


def japanese_cleaners2(text: str) -> str:
    """Variant of :func:`japanese_cleaners` with extra symbol normalization.

    Before romanization, ``'・・・'`` becomes ``'…'`` and any remaining ``'・'``
    becomes a space. After romanization, ``'ts'`` becomes ``'ʦ'``, ``'...'``
    becomes ``'…'``, the characters ``( ) [ ] { }`` are removed and ``'*'``
    is replaced by a space.

    Args:
        text: Input string to clean.

    Returns:
        The cleaned string.
    """
    text = text.replace('・・・', '…').replace('・', ' ')
    # Multi-character substitutions must run before the single-character pass
    # so the result matches the original chained-replace ordering.
    text = japanese_cleaners(text).replace('ts', 'ʦ').replace('...', '…')
    return text.translate(_JAPANESE_SYMBOL_TABLE)


def korean_cleaners(text: str):
    """Run the Korean cleaning pipeline and convert the result with
    ``korean_to_ipa``.

    The text goes through ``latin_to_hangul`` and ``number_to_hangul``. If
    the result is non-empty and its last character lies in U+3131-U+3163, a
    ``'.'`` is appended. The string is then handed to ``korean_to_ipa``.

    Args:
        text: Input string to clean. Empty input is accepted.

    Returns:
        Whatever ``korean_to_ipa`` returns for the prepared text.
    """
    text = latin_to_hangul(text)
    text = number_to_hangul(text)
    # text = divide_hangul(text)
    # NOTE(review): with divide_hangul disabled, the jamo check below
    # presumably only fires when the input already ends in a bare
    # compatibility jamo - confirm this is intended.
    # Guard against empty text: indexing text[-1] would raise IndexError.
    if text and re.match('[\u3131-\u3163]', text[-1]):
        text += '.'
    text = korean_to_ipa(text)
    return text