AgGPT-13Mini / config /train_aggpt_char.py
AGofficial's picture
Upload 13 files
39bdf0e verified
# Training configuration for AgGPT.
#
# This file only binds plain module-level values. The script that reads them
# is not visible here, so the section notes below reflect what the setting
# names suggest -- confirm against the consuming training script.

# --- run output, evaluation and logging cadence ---
out_dir = "out-aggpt"
always_save_checkpoint = False
eval_interval, eval_iters = 250, 200
log_interval = 10

# --- wandb settings (logging is switched off via wandb_log) ---
wandb_log = False
wandb_project = "train_aggpt_char"
wandb_run_name = "mini-gpt"

# --- dataset and batching ---
dataset = "chats"
batch_size = 64
block_size = 256
gradient_accumulation_steps = 1

# --- model shape and dropout ---
n_layer = n_head = 6
n_embd = 384  # 384 / 6 heads = 64 per head
dropout = 0.2

# --- optimiser and learning-rate schedule ---
learning_rate = 1e-3
min_lr = 1e-4  # one tenth of learning_rate
beta2 = 0.99
warmup_iters = 100
max_iters = 5000
lr_decay_iters = max_iters  # kept equal to max_iters, as in the original values