{
  "_CHeeSEArguments": "CHeeSEArguments",
  "model_name_or_path": "LennartKeller/nystromformer-gottbert-base-8192",
  "dataset_path": "./dataset.py",
  "metric_path": "./metric.py",
  "task": "stance_detection",
  "first_sentence_inputs": [
    "question"
  ],
  "second_sentence_inputs": [
    "title",
    "snippet",
    "paragraphs"
  ],
  "labels_to_predict": [
    "stance"
  ],
  "_CHeeSETrainingArguments": "CHeeSETrainingArguments",
  "do_train": true,
  "do_eval": true,
  "do_predict": true,
  "do_cross_validation": false,
  "output_dir": "/netscratch/schnitzler/nystromformer-8",
  "logging_dir": "/netscratch/schnitzler/nystromformer-8",
  "save_total_limit": 3,
  "log_to_file": true,
  "logging_strategy": "steps",
  "logging_steps": 50,
  "cross_validation_folds": 5,
  "save_steps": 1000,
  "evaluation_strategy": "steps",
  "eval_steps": 500,
  "seed": 121,
  "num_train_epochs": 4,
  "per_device_train_batch_size": 8,
  "per_device_eval_batch_size": 8,
  "learning_rate": 3e-05,
  "prediction_csv_kwargs": {
    "index": false
  },
  "prediction_columns_to_include": [
    "title",
    "snippet",
    "paragraphs",
    "question",
    "labels",
    "stance"
  ],
  "overwrite_output_dir": true
}