# Symbol tables shared by the Chinese, Japanese and English front ends:
# punctuation/special markers, per-language symbol inventories, tone counts,
# and the lookup tables derived from them.

# Punctuation marks plus the two special markers "SP" and "UNK".
punctuation = ["!", "?", "…", ",", ".", "'", "-"]
pu_symbols = punctuation + ["SP", "UNK"]
# Padding symbol; it is always placed at index 0 of the symbol tables below.
pad = "_"

# chinese
zh_symbols = [
    "E", "En", "a", "ai", "an", "ang", "ao", "b", "c", "ch",
    "d", "e", "ei", "en", "eng", "er", "f", "g", "h", "i",
    "i0", "ia", "ian", "iang", "iao", "ie", "in", "ing", "iong", "ir",
    "iu", "j", "k", "l", "m", "n", "o", "ong", "ou", "p",
    "q", "r", "s", "sh", "t", "u", "ua", "uai", "uan", "uang",
    "ui", "un", "uo", "v", "van", "ve", "vn", "w", "x", "y",
    "z", "zh", "AA", "EE", "OO",
]
num_zh_tones = 6

# japanese
# NOTE(review): the legacy list carries an uppercase "V" (zh_symbols uses
# lowercase "v"). Presumably kept on purpose so existing symbol indices stay
# stable -- confirm before "fixing" the case.
ja_symbols_legacy = [
    "I", "N", "U", "a", "b", "by", "ch", "cl", "d", "dy",
    "e", "f", "g", "gy", "h", "hy", "i", "j", "k", "ky",
    "m", "my", "n", "ny", "o", "p", "py", "r", "ry", "s",
    "sh", "t", "ts", "u", "V", "w", "y", "z",
]
ja_symbols = [
    "N", "a", "a:", "b", "by", "ch", "d", "dy", "e", "e:",
    "f", "g", "gy", "h", "hy", "i", "i:", "j", "k", "ky",
    "m", "my", "n", "ny", "o", "o:", "p", "py", "q", "r",
    "ry", "s", "sh", "t", "ts", "ty", "u", "u:", "w", "y",
    "z", "zy",
]
num_ja_tones_v111 = 1
num_ja_tones = 2

# English
# NOTE(review): "V" is uppercase here as well; see the note on
# ja_symbols_legacy above the Japanese lists.
en_symbols = [
    "aa", "ae", "ah", "ao", "aw", "ay", "b", "ch", "d", "dh",
    "eh", "er", "ey", "f", "g", "hh", "ih", "iy", "jh", "k",
    "l", "m", "n", "ng", "ow", "oy", "p", "r", "s", "sh",
    "t", "th", "uh", "uw", "V", "w", "y", "z", "zh",
]
num_en_tones = 4

# Combined table: pad first, then the de-duplicated, sorted union of all
# language symbols, then punctuation/special markers at the tail.
normal_symbols = sorted(set(zh_symbols + ja_symbols + en_symbols))
symbols = [pad] + normal_symbols + pu_symbols
# Indices (into `symbols`) of every punctuation/special marker.
sil_phonemes_ids = [symbols.index(i) for i in pu_symbols]

# legacy
# Same construction as above, but built from ja_symbols_legacy.
normal_symbols_legacy = sorted(set(zh_symbols + ja_symbols_legacy + en_symbols))
symbols_legacy = [pad] + normal_symbols_legacy + pu_symbols
sil_phonemes_ids_legacy = [symbols_legacy.index(i) for i in pu_symbols]

# combine all tones
num_tones_v111 = num_zh_tones + num_ja_tones_v111 + num_en_tones
num_tones = num_zh_tones + num_ja_tones + num_en_tones

# language maps
language_id_map = {"zh": 0, "ja": 1, "en": 2}
num_languages = len(language_id_map)

# Offset at which each language's tones start inside the combined tone range
# (zh first, then ja, then en). The v111 variant uses num_ja_tones_v111.
language_tone_start_map_v111 = {
    "zh": 0,
    "ja": num_zh_tones,
    "en": num_zh_tones + num_ja_tones_v111,
}
language_tone_start_map = {
    "zh": 0,
    "ja": num_zh_tones,
    "en": num_zh_tones + num_ja_tones,
}

if __name__ == "__main__":
    # Quick inspection: dump each language's symbol set, then the symbols
    # that Chinese and English have in common.
    zh = set(zh_symbols)
    en = set(en_symbols)
    ja = set(ja_symbols)
    print(zh)
    print(en)
    print(ja)
    print(sorted(zh & en))