File size: 756 Bytes
c0c84cf
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
from .symbols import *


_symbol_to_id = {s: i for i, s in enumerate(symbols)}


def phonemes_to_ids(cleaned_text, tones, language, symbol_to_id=None):
    """Converts a list of phoneme symbols to a sequence of integer IDs."""
    symbol_to_id_map = symbol_to_id if symbol_to_id else _symbol_to_id
    unk_id = symbol_to_id_map.get("UNK")
    if unk_id is None:
        phones = [symbol_to_id_map[symbol] for symbol in cleaned_text]
    else:
        phones = [symbol_to_id_map.get(symbol, unk_id) for symbol in cleaned_text]
    tone_start = language_tone_start_map[language]
    tones = [i + tone_start for i in tones]
    lang_id = language_id_map[language]
    lang_ids = [lang_id for _ in phones]
    return phones, tones, lang_ids