Spaces:
Sleeping
Sleeping
| import torch | |
| from .tokenizer import CharacterLevelTokenizer | |
| from dataclasses import dataclass | |
| with open('data/harry_potter_data', 'r', encoding='utf-8') as f: | |
| data = f.read() | |
| class Config: | |
| tokenizer = CharacterLevelTokenizer(data) | |
| block_size = 256 # context-length | |
| batch_size = 64 # mini-batch size | |
| vocab_size = tokenizer.VOCAB_SIZE | |
| n_embed = 256 | |
| n_heads = 8 | |
| head_size =n_embed //n_heads # computes to 384/6=64 or 128/4=32 or 256/8 | |
| n_layers = 3 | |
| train_iters = 10_000 | |
| val_iters = 1000 | |
| lr = 3e-4 | |
| attn_dropout = 0.1 | |
| block_dropout = 0.1 | |
| device = 'cuda' if torch.cuda.is_available() else 'cpu' | |