| { |
| "custom_generation_config": null, |
| "model_params": { |
| "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct", |
| "generation_config": { |
| "bos_token_id": 128000, |
| "do_sample": true, |
| "eos_token_id": [ |
| 128001, |
| 128009, |
| 198, |
| 271 |
| ], |
| "max_length": 8192, |
| "max_new_tokens": 64, |
| "pad_token_id": 128001, |
| "stop_strings": [ |
| "\n", |
| "\n\n" |
| ], |
| "temperature": 0.1, |
| "top_k": 40, |
| "top_p": 0.9, |
| "transformers_version": "4.38.2", |
| "trust_remote_code": [ |
| false |
| ] |
| }, |
| "conversation_template": { |
| "system_prompt": "", |
| "system_message_template": "", |
| "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>", |
| "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>", |
| "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}", |
| "user_role": "user", |
| "bot_role": "assistant", |
| "system_role": "system", |
| "global_prefix": "<|begin_of_text|>", |
| "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n", |
| "add_special_tokens": false, |
| "eos_token": "<|eot_id|>" |
| }, |
| "load_in_8bit": false, |
| "torch_dtype": "auto", |
| "use_flash_attention_2": true, |
| "device_map": "cuda:0", |
| "use_fast_tokenizer": true, |
| "leading_space": false, |
| "space_token": null, |
| "trust_remote_code": [ |
| false |
| ], |
| "max_model_len": 8192 |
| }, |
| "task_params": { |
| "max_len": 4000, |
| "few_shot_count": 5, |
| "batch_size": 1, |
| "max_sample_per_dataset": 10000000000000, |
| "method": "calculate_tokens_proba" |
| } |
| } |
|
|