bilingual-lm / training_args.json
khulnasoft's picture
Upload folder using huggingface_hub
8eed7ac verified
raw
history blame contribute delete
481 Bytes
{
"train_data": "datasets/processed/final/train.jsonl",
"val_data": "datasets/processed/final/val.jsonl",
"model_name_or_path": "microsoft/DialoGPT-small",
"output_dir": "models/bilingual-lm/",
"max_length": 128,
"batch_size": 8,
"num_epochs": 3,
"learning_rate": 5e-05,
"weight_decay": 0.01,
"warmup_steps": 500,
"gradient_accumulation_steps": 1,
"max_grad_norm": 1.0,
"seed": 42,
"max_train_samples": null,
"max_val_samples": null,
"fp16": false
}