Use combined characters available in TTS phonemes (like ç)

pull/506/head
Michael Hansen 2021-06-11 10:43:52 -04:00 committed by Eren Gölge
parent da6f6a4a01
commit 618b509204
1 changed file with 5 additions and 0 deletions

View File

@@ -53,6 +53,11 @@ def clean_gruut_phonemes(ph_list):
cleaned_phonemes = []
for phoneme_text in ph_list:
phoneme_text = unicodedata.normalize("NFC", phoneme_text)
if phoneme_text in phonemes:
cleaned_phonemes.append(phoneme_text)
continue
# Decompose into codepoints (ã -> ["a", "\u0303"])
phoneme_text = unicodedata.normalize("NFD", phoneme_text)
for codepoint in phoneme_text.translate(GRUUT_TRANS_TABLE):