{
  "train_data": "datasets/processed/final/train.jsonl",
  "val_data": "datasets/processed/final/val.jsonl",
  "model_name_or_path": "microsoft/DialoGPT-small",
  "output_dir": "models/bilingual-lm/",
  "max_length": 128,
  "batch_size": 8,
  "num_epochs": 3,
  "learning_rate": 5e-05,
  "weight_decay": 0.01,
  "warmup_steps": 500,
  "gradient_accumulation_steps": 1,
  "max_grad_norm": 1.0,
  "seed": 42,
  "max_train_samples": null,
  "max_val_samples": null,
  "fp16": false
}