English
AgGPT10m / corpus.py
AGofficial's picture
Upload 8 files
de00bef verified
raw
history blame contribute delete
241 Bytes
import json
from encoder import TextEncoder
# Build the text encoder from "vocab.json" (path is resolved relative to the
# current working directory).
# NOTE(review): by_char=False presumably selects a non-character-level
# vocabulary -- confirm against encoder.TextEncoder.
encoder = TextEncoder(vocab_path="vocab.json", by_char=False)

# The .agmodel file is parsed as JSON. JSON text is UTF-8, so the encoding is
# pinned explicitly instead of falling back to the platform's locale default,
# which differs between operating systems.
with open("AgGPT10m.agmodel", "r", encoding="utf-8") as f:
    encoded = json.load(f)

# Decode the loaded payload back into text and expose it under the module-level
# name `corpus`. `decoded_text` is kept as a separate name so that any existing
# reference to it continues to work.
# NOTE(review): the exact structure of `encoded` (e.g. a list of token ids) is
# not visible from here -- it is whatever TextEncoder.decode accepts.
decoded_text = encoder.decode(encoded)
corpus = decoded_text