# reFlow / config / train_reflow_1.py
# Hugging Face listing: uploaded by reuAC, commit message
# "Upload folder using huggingface_hub" (commit 672259a, verified).
# Training configuration for the 'reflow-1' run.
# Plain module-level assignments only; presumably read by the training
# script as overrides of its defaults (loader not shown here -- confirm).

# --- run identity and initialisation ---
model_config = 'reflow'
init_from = 'scratch'
eval_only = False

# --- output, checkpoints, logging ---
out_dir = 'out/reflow-1'
log_file = 'logs/reflow-1.log'
log_interval = 1
always_save_checkpoint = False

# --- evaluation cadence ---
eval_interval = 500
eval_iters = 500

# --- wandb reporting (wandb_log is off for this run) ---
wandb_log = False
wandb_project = 'reflow-1'
wandb_run_name = 'reflow-1'

# --- data and batching ---
dataset = 'openwebtext'
block_size = 1024
batch_size = 1
# 64 accumulation steps x batch_size 1; assumes the trainer accumulates
# gradients across micro-batches in the usual way -- TODO confirm.
gradient_accumulation_steps = 64

# --- model shape ---
vocab_size = 50_304
n_layer = 32
n_head = 16
n_embd = 1024
# NOTE(review): n_signals looks specific to the 'reflow' model; its meaning
# is defined by the model code, not by this file.
n_signals = 1024
bias = False
dropout = 0.0

# --- optimiser ---
learning_rate = 1.5e-4
weight_decay = 0.1
beta1 = 0.9
beta2 = 0.95
grad_clip = 1.0
max_iters = 50_000

# --- learning-rate schedule ---
# NOTE(review): decay_lr is False, so the three values below may be ignored
# by the trainer. Also lr_decay_iters (600000) is larger than max_iters
# (50000). Confirm both are intentional.
decay_lr = False
warmup_iters = 2_000
lr_decay_iters = 600_000
min_lr = 6e-5

# --- runtime ---
device = 'cuda'
backend = 'nccl'
dtype = 'float16'
# The name shadows the builtin `compile`; kept because it is the config key.
compile = True