{
  "train_data": "datasets/processed/final/train.jsonl",
  "val_data": "datasets/processed/final/val.jsonl",
  "model_name_or_path": "microsoft/DialoGPT-small",
  "output_dir": "models/bilingual-lm/",
  "max_length": 128,
  "batch_size": 8,
  "num_epochs": 3,
  "learning_rate": 5e-05,
  "weight_decay": 0.01,
  "warmup_steps": 500,
  "gradient_accumulation_steps": 1,
  "max_grad_norm": 1.0,
  "seed": 42,
  "max_train_samples": null,
  "max_val_samples": null,
  "fp16": false
}