# Read the whole corpus file into memory as one string, decoding it as UTF-8.
# The context manager closes the file handle as soon as the read completes.
with open("corpus.txt", encoding="utf-8") as f:
    corpus = f.read()