File size: 510 Bytes
feba2ad
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
"""
Shared constants: basic training settings and the directory/file names used
for storing run artifacts. Imported throughout the codebase.
"""

# Core training settings shared across the codebase.
# NOTE(review): units are not visible from this file (e.g. whether BATCH_SIZE
# counts sequences and whether it is measured before or after gradient
# accumulation) -- confirm against the training loop.
VOCAB_SIZE: int = 50_304
MAX_SEQ_LEN: int = 2_048
BATCH_SIZE: int = 1_024
GRADIENT_ACCUMULATION_STEPS: int = 128

# Names of the directories (plus one checkpoint filename) used when storing
# training runs, checkpoints, logs, and evaluation results.
# NOTE(review): how these names nest on disk is decided by the code that joins
# them and is not visible here -- confirm before relying on a layout.
RUNS_DIR: str = "runs"
CHECKPOINTS_DIR: str = "checkpoints"
LOGS_DIR: str = "logs"
FABRIC_CHECKPOINT_DIR: str = "fabric_state"
FABRIC_CHECKPOINT_FILENAME: str = "checkpoint.pt"
LEARNING_DYNAMICS_DIR: str = "learning_dynamics"
EVAL_RESULTS_DIR: str = "eval_results"