| cutoff_len: 4096 | |
| dataset_dir: data | |
| do_predict: true | |
| eval_dataset: test_hal_detection | |
| finetuning_type: full | |
| flash_attn: auto | |
| max_new_tokens: 512 | |
| max_samples: 100000 | |
| model_name_or_path: saves/Llama-3-8B/full/train_2024-11-22-23-46-34 | |
| output_dir: saves/Llama-3-8B/full/ragtruth_eval_2024-11-23 | |
| per_device_eval_batch_size: 2 | |
| predict_with_generate: true | |
| preprocessing_num_workers: 16 | |
| quantization_method: bitsandbytes | |
| stage: sft | |
| temperature: 0.95 | |
| template: default | |
| top_p: 0.7 | |