{
"model_type": "gpt2",
"model_checkpoint": "gpt2",
"device": "cuda:0",
"use_amp": true,
"train_batch_size": 3,
"valid_batch_size": 3,
"gradient_accumulation_steps": 10,
"lr": 6.25e-05,
"max_norm": 1.0,
"n_epochs": 3,
"eval_before_start": false,
"dataset_cache_dir": "/home/ubuntu/question-generation/caches/datasets",
"dataset_dir": "datasets/SQuAD/qg",
"local_rank": 0,
"output_dir": "/home/ubuntu/question-generation/outputs/train",
"save_interval_epoch": 1,
"iterations_before_checking": 0,
"n_saved_epoch": 3,
"distributed": true
}