{
  "output_dir": "./results",
  "num_train_epochs": 10,
  "per_device_train_batch_size": 16,
  "gradient_accumulation_steps": 1,
  "learning_rate": 0.0001,
  "weight_decay": 0.01,
  "logging_steps": 100,
  "save_steps": 1000,
  "eval_steps": 500,
  "warmup_steps": 500,
  "max_grad_norm": 1.0,
  "fp16": false,
  "dataloader_num_workers": 4,
  "load_best_model_at_end": true,
  "metric_for_best_model": "loss",
  "greater_is_better": false,
  "report_to": [],
  "seed": 42
}