{
  "model_type": "gpt2",
  "model_checkpoint": "gpt2",
  "device": "cuda:0",
  "use_amp": true,
  "train_batch_size": 3,
  "valid_batch_size": 3,
  "gradient_accumulation_steps": 10,
  "lr": 6.25e-05,
  "max_norm": 1.0,
  "n_epochs": 3,
  "eval_before_start": false,
  "dataset_cache_dir": "/home/ubuntu/question-generation/caches/datasets",
  "dataset_dir": "datasets/SQuAD/qg",
  "local_rank": 0,
  "output_dir": "/home/ubuntu/question-generation/outputs/train",
  "save_interval_epoch": 1,
  "iterations_before_checking": 0,
  "n_saved_epoch": 3,
  "distributed": true
}