AbstractPhil's picture
Add training checkpoints (safetensors)
895d705 verified
raw
history blame contribute delete
517 Bytes
{
"d_model": 1024,
"max_text_len": 32,
"batch_size": 256,
"eval_batch_size": 512,
"train_num_workers": 4,
"eval_num_workers": 2,
"epochs": 3,
"lr": 0.0003,
"weight_decay": 0.01,
"min_lr": 1e-06,
"grad_clip": 1.0,
"align_samples": 5000,
"whiten_procrustes": true,
"enforce_rotation_only": false,
"pw": 0.1,
"aw": 0.05,
"checkpoint_dir": "/home/claude/bertenstein_checkpoints",
"tensorboard_dir": "/home/claude/bertenstein_tb",
"save_every_epoch": true,
"log_every_n_steps": 10
}