ThomasTheMaker's picture
Upload folder using huggingface_hub
feba2ad verified
raw
history blame
510 Bytes
"""
Constants used throughout the codebase
"""
# Core training constants shared across the codebase.
VOCAB_SIZE: int = 50_304
MAX_SEQ_LEN: int = 2_048
BATCH_SIZE: int = 1_024
GRADIENT_ACCUMULATION_STEPS: int = 128

# Names used when storing training runs, checkpoints, logs, and evaluation
# results. Every entry is a directory name except FABRIC_CHECKPOINT_FILENAME,
# which names a file.
RUNS_DIR: str = "runs"
CHECKPOINTS_DIR: str = "checkpoints"
LOGS_DIR: str = "logs"
FABRIC_CHECKPOINT_DIR: str = "fabric_state"
FABRIC_CHECKPOINT_FILENAME: str = "checkpoint.pt"
LEARNING_DYNAMICS_DIR: str = "learning_dynamics"
EVAL_RESULTS_DIR: str = "eval_results"