Spaces:
Sleeping
Sleeping
File size: 565 Bytes
79078fe | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 | from dataclasses import dataclass
from pathlib import Path
@dataclass
class SmallGPTConfig:
block_size: int = 48
batch_size: int = 20
d_model: int = 96
n_heads: int = 4
n_layers: int = 3
dropout: float = 0.1
learning_rate: float = 2.5e-3
bootstrap_steps: int = 80
cpu_threads: int = 4
seed: int = 42
@property
def root_dir(self) -> Path:
return Path(__file__).resolve().parents[1]
@property
def checkpoint_path(self) -> Path:
return self.root_dir / "artifacts" / "small_gpt_checkpoint.pt"
|