File size: 774 Bytes
2f6b10b |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 |
import os
import hangul_jamo
root_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
dictionary_dir = os.path.join(root_dir, 'dictionary')
staging_dir = os.path.join(dictionary_dir, 'training')
jamo_dict = os.path.join(staging_dir, 'korean_jamo_mfa.dict')
hangul_dict= os.path.join(staging_dir, 'korean_mfa.dict')
phone_set = set()
with open(jamo_dict, 'r', encoding='utf8') as jamo_f, \
open(hangul_dict, 'w', encoding='utf8') as hangul_f:
for line in jamo_f:
line = line.strip()
line = line.split()
word = line.pop(0)
pronunciation = ' '.join(line)
phone_set.update(line)
hangul_word = hangul_jamo.compose(word)
hangul_f.write(f'{hangul_word}\t{pronunciation}\n')
print(sorted(phone_set))
|