| _n_gpu: 1
|
| adafactor: false
|
| adam_beta1: 0.9
|
| adam_beta2: 0.999
|
| adam_epsilon: 1.0e-08
|
| cache_dir: null
|
| compute_metric_task_list:
|
| - question-generation
|
| - question-answering
|
| dataloader_drop_last: false
|
| dataloader_num_workers: 0
|
| dataloader_pin_memory: true
|
| ddp_find_unused_parameters: null
|
| debug: []
|
| deepspeed: null
|
| disable_tqdm: false
|
| do_eval: true
|
| do_predict: false
|
| do_train: true
|
| eval_accumulation_steps: 1
|
| eval_steps: 2000
|
| evaluation_strategy: &id001 !!python/object/apply:transformers.trainer_utils.IntervalStrategy
|
| - steps
|
| fp16: false
|
| fp16_backend: auto
|
| fp16_full_eval: false
|
| fp16_opt_level: O1
|
| freeze_embeddings: false
|
| gradient_accumulation_steps: 1
|
| greater_is_better: null
|
| group_by_length: false
|
| ignore_data_skip: false
|
| label_names: null
|
| label_smoothing: 0
|
| label_smoothing_factor: 0.0
|
| learning_rate: 0.0001
|
| length_column_name: length
|
| load_best_model_at_end: false
|
| local_rank: -1
|
| log_level: -1
|
| log_level_replica: -1
|
| log_on_each_node: true
|
| logging_dir: runs/exp10\runs\Jul10_02-34-34_DESKTOP-65UI233
|
| logging_first_step: false
|
| logging_steps: 500
|
| logging_strategy: *id001
|
| lr_scheduler_type: !!python/object/apply:transformers.trainer_utils.SchedulerType
|
| - linear
|
| max_grad_norm: 1.0
|
| max_source_length: 512
|
| max_steps: -1
|
| max_target_length: 64
|
| metric_for_best_model: null
|
| model_name_or_path: google/mt5-small
|
| mp_parameters: ''
|
| neptune_api_token: null
|
| neptune_project: null
|
| no_cuda: false
|
| num_train_epochs: 15
|
| output_dir: runs/exp10
|
| overwrite_output_dir: false
|
| past_index: -1
|
| per_device_eval_batch_size: 4
|
| per_device_train_batch_size: 4
|
| per_gpu_eval_batch_size: null
|
| per_gpu_train_batch_size: null
|
| prediction_loss_only: false
|
| prepare_data: true
|
| push_to_hub: false
|
| push_to_hub_model_id: exp10
|
| push_to_hub_organization: null
|
| push_to_hub_token: null
|
| remove_unused_columns: false
|
| report_to:
|
| - wandb
|
| - neptune
|
| resume_from_checkpoint: null
|
| run_name: exp10
|
| save_steps: 500
|
| save_strategy: *id001
|
| save_total_limit: 1
|
| seed: 42
|
| sharded_ddp: []
|
| skip_memory_metrics: true
|
| tokenizer_path: mt5_small_tokenizer
|
| tpu_metrics_debug: false
|
| tpu_num_cores: null
|
| train_dataset_list:
|
| - tquad-train
|
| - tquad-valid
|
| - xquad.tr
|
| train_file_path: data/train_data_multitask_mt5.pt
|
| use_legacy_prediction_loop: false
|
| valid_dataset_list:
|
| - tquad-valid
|
| valid_file_path: data/valid_data_multitask_mt5.pt
|
| wandb_project: turkish-qa-qg
|
| warmup_ratio: 0.0
|
| warmup_steps: 0
|
| weight_decay: 0.0
|
|
|