{
  "output_dir": "./output",
  "overwrite_output_dir": true,
  "num_train_epochs": 50,
  "per_device_train_batch_size": 8,
  "gradient_accumulation_steps": 1,
  "learning_rate": 5e-5,
  "weight_decay": 0.01,
  "warmup_steps": 0,
  "fp16": true,
  "seed": 42,
  "per_device_eval_batch_size": 8,
  "eval_strategy": "epoch",
  "metric_for_best_model": "eval_loss",
  "greater_is_better": false,
  "eval_steps": null,
  "load_best_model_at_end": true,
  "save_strategy": "epoch",
  "save_steps": null,
  "save_total_limit": 2,
  "logging_dir": "./output/logs",
  "logging_steps": 100,
  "report_to": "wandb",
  "run_name": "Se124M100K",
  "push_to_hub": true,
  "hub_model_id": "augustocsc/Se124M100K",
  "hub_token": null
}