{
  "bayesian_train": true,
  "loss_weights": "log",
  "tokenized_ds_dir": "data/goemotions_v1_seq512",
  "encoder_lr": 0.00001,
  "head_lr": 0.0005,
  "lr_warmup": 0.05,
  "weight_decay": 0.01,
  "batch_size": 32,
  "gradient_accumulation_steps": 8,
  "num_epochs": 10
}