{
  "train_data": "datasets/processed/final/train.jsonl",
  "val_data": "datasets/processed/final/val.jsonl",
  "model_name_or_path": "microsoft/DialoGPT-small",
  "output_dir": "models/bilingual-lm/",
  "max_length": 128,
  "batch_size": 8,
  "num_epochs": 3,
  "learning_rate": 5e-05,
  "weight_decay": 0.01,
  "warmup_steps": 500,
  "gradient_accumulation_steps": 1,
  "max_grad_norm": 1.0,
  "seed": 42,
  "max_train_samples": null,
  "max_val_samples": null,
  "fp16": false
}