RefalMachine committed on Jul 12, 2024

Commit

427b863

verified ·

1 Parent(s): e5efdd8

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +20 -0
llmtf_eval_k0/daru_treewayabstractive.jsonl +0 -0
llmtf_eval_k0/daru_treewayabstractive_params.jsonl +62 -0
llmtf_eval_k0/daru_treewayabstractive_total.jsonl +8 -0
llmtf_eval_k0/daru_treewayextractive.jsonl +3 -0
llmtf_eval_k0/daru_treewayextractive_params.jsonl +57 -0
llmtf_eval_k0/daru_treewayextractive_total.jsonl +7 -0
llmtf_eval_k0/darumeru_MultiQ.jsonl +0 -0
llmtf_eval_k0/darumeru_MultiQ_params.jsonl +62 -0
llmtf_eval_k0/darumeru_MultiQ_total.jsonl +8 -0
llmtf_eval_k0/darumeru_PARus.jsonl +0 -0
llmtf_eval_k0/darumeru_PARus_params.jsonl +62 -0
llmtf_eval_k0/darumeru_PARus_total.jsonl +7 -0
llmtf_eval_k0/darumeru_RCB.jsonl +0 -0
llmtf_eval_k0/darumeru_RCB_params.jsonl +62 -0
llmtf_eval_k0/darumeru_RCB_total.jsonl +8 -0
llmtf_eval_k0/darumeru_RWSD.jsonl +0 -0
llmtf_eval_k0/darumeru_RWSD_params.jsonl +62 -0
llmtf_eval_k0/darumeru_RWSD_total.jsonl +7 -0
llmtf_eval_k0/darumeru_USE.jsonl +0 -0
llmtf_eval_k0/darumeru_USE_params.jsonl +62 -0
llmtf_eval_k0/darumeru_USE_total.jsonl +7 -0
llmtf_eval_k0/darumeru_cp_para_en.jsonl +0 -0
llmtf_eval_k0/darumeru_cp_para_en_params.jsonl +62 -0
llmtf_eval_k0/darumeru_cp_para_en_total.jsonl +9 -0
llmtf_eval_k0/darumeru_cp_para_ru.jsonl +0 -0
llmtf_eval_k0/darumeru_cp_para_ru_params.jsonl +62 -0
llmtf_eval_k0/darumeru_cp_para_ru_total.jsonl +9 -0
llmtf_eval_k0/darumeru_cp_sent_en.jsonl +0 -0
llmtf_eval_k0/darumeru_cp_sent_en_params.jsonl +62 -0
llmtf_eval_k0/darumeru_cp_sent_en_total.jsonl +9 -0
llmtf_eval_k0/darumeru_cp_sent_ru.jsonl +0 -0
llmtf_eval_k0/darumeru_cp_sent_ru_params.jsonl +62 -0
llmtf_eval_k0/darumeru_cp_sent_ru_total.jsonl +9 -0
llmtf_eval_k0/darumeru_ruMMLU.jsonl +3 -0
llmtf_eval_k0/darumeru_ruMMLU_params.jsonl +62 -0
llmtf_eval_k0/darumeru_ruMMLU_total.jsonl +7 -0
llmtf_eval_k0/darumeru_ruOpenBookQA.jsonl +0 -0
llmtf_eval_k0/darumeru_ruOpenBookQA_params.jsonl +62 -0
llmtf_eval_k0/darumeru_ruOpenBookQA_total.jsonl +8 -0
llmtf_eval_k0/darumeru_ruTiE.jsonl +3 -0
llmtf_eval_k0/darumeru_ruTiE_params.jsonl +62 -0
llmtf_eval_k0/darumeru_ruTiE_total.jsonl +7 -0
llmtf_eval_k0/darumeru_ruWorldTree.jsonl +0 -0
llmtf_eval_k0/darumeru_ruWorldTree_params.jsonl +62 -0
llmtf_eval_k0/darumeru_ruWorldTree_total.jsonl +8 -0
llmtf_eval_k0/evaluation_log.txt +273 -0
llmtf_eval_k0/evaluation_results.txt +2 -0
llmtf_eval_k0/nlpcoreteam_enMMLU.jsonl +3 -0
llmtf_eval_k0/nlpcoreteam_enMMLU_params.jsonl +57 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,23 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k0/daru_treewayextractive.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k0/darumeru_ruMMLU.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k0/darumeru_ruTiE.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k0/nlpcoreteam_enMMLU.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k0/nlpcoreteam_ruMMLU.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k1/daru_treewayextractive.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k1/darumeru_ruMMLU.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k1/darumeru_ruTiE.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k1/nlpcoreteam_enMMLU.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k1/nlpcoreteam_ruMMLU.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k5/daru_treewayabstractive.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k5/daru_treewayextractive.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k5/darumeru_MultiQ.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k5/darumeru_USE.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k5/darumeru_ruMMLU.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k5/darumeru_ruOpenBookQA.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k5/darumeru_ruTiE.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k5/nlpcoreteam_enMMLU.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k5/nlpcoreteam_ruMMLU.jsonl filter=lfs diff=lfs merge=lfs -text
+llmtf_eval_k5/russiannlp_rucola_custom.jsonl filter=lfs diff=lfs merge=lfs -text

llmtf_eval_k0/daru_treewayabstractive.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

llmtf_eval_k0/daru_treewayabstractive_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 512,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 500,
+        "method": "generate"
+    }
+}

llmtf_eval_k0/daru_treewayabstractive_total.jsonl ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "task_name": "daru/treewayabstractive",
+    "results": {
+        "rouge1": 0.35401411318813847,
+        "rouge2": 0.12752218193565362
+    },
+    "leaderboard_result": 0.24076814756189605
+}

llmtf_eval_k0/daru_treewayextractive.jsonl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:817a79eb937233b0782b5c9419bcf8fb9fa8a48faf6f412c6781323a7530d54c
+size 1985804644

llmtf_eval_k0/daru_treewayextractive_params.jsonl ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 1,
+            "pad_token_id": 128001,
+            "stop_strings": [],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 500,
+        "method": "calculate_logsoftmax"
+    }
+}

llmtf_eval_k0/daru_treewayextractive_total.jsonl ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+    "task_name": "daru/treewayextractive",
+    "results": {
+        "r-prec": 0.3960751082251082
+    },
+    "leaderboard_result": 0.3960751082251082
+}

llmtf_eval_k0/darumeru_MultiQ.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

llmtf_eval_k0/darumeru_MultiQ_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 64,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "generate"
+    }
+}

llmtf_eval_k0/darumeru_MultiQ_total.jsonl ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "task_name": "darumeru/MultiQ",
+    "results": {
+        "f1": 0.34566216745831274,
+        "em": 0.21510516252390058
+    },
+    "leaderboard_result": 0.2803836649911067
+}

llmtf_eval_k0/darumeru_PARus.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

llmtf_eval_k0/darumeru_PARus_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 64,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "calculate_tokens_proba"
+    }
+}

llmtf_eval_k0/darumeru_PARus_total.jsonl ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+    "task_name": "darumeru/PARus",
+    "results": {
+        "acc": 0.66
+    },
+    "leaderboard_result": 0.66
+}

llmtf_eval_k0/darumeru_RCB.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

llmtf_eval_k0/darumeru_RCB_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 64,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "calculate_tokens_proba"
+    }
+}

llmtf_eval_k0/darumeru_RCB_total.jsonl ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "task_name": "darumeru/RCB",
+    "results": {
+        "acc": 0.5,
+        "f1_macro": 0.43018975381906
+    },
+    "leaderboard_result": 0.46509487690953
+}

llmtf_eval_k0/darumeru_RWSD.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

llmtf_eval_k0/darumeru_RWSD_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 64,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "calculate_tokens_proba"
+    }
+}

llmtf_eval_k0/darumeru_RWSD_total.jsonl ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+    "task_name": "darumeru/RWSD",
+    "results": {
+        "acc": 0.5441176470588235
+    },
+    "leaderboard_result": 0.5441176470588235
+}

llmtf_eval_k0/darumeru_USE.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

llmtf_eval_k0/darumeru_USE_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 64,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "generate"
+    }
+}

llmtf_eval_k0/darumeru_USE_total.jsonl ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+    "task_name": "darumeru/USE",
+    "results": {
+        "grade_norm": 0.14411764705882352
+    },
+    "leaderboard_result": 0.14411764705882352
+}

llmtf_eval_k0/darumeru_cp_para_en.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

llmtf_eval_k0/darumeru_cp_para_en_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 1024,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "generate"
+    }
+}

llmtf_eval_k0/darumeru_cp_para_en_total.jsonl ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "task_name": "darumeru/cp_para_en",
+    "results": {
+        "symbol_per_token": 4.482081117192222,
+        "len": 0.9950333263716172,
+        "lcs": 0.9677363847232712
+    },
+    "leaderboard_result": 0.9677363847232712
+}

llmtf_eval_k0/darumeru_cp_para_ru.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

llmtf_eval_k0/darumeru_cp_para_ru_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 1024,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "generate"
+    }
+}

llmtf_eval_k0/darumeru_cp_para_ru_total.jsonl ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "task_name": "darumeru/cp_para_ru",
+    "results": {
+        "symbol_per_token": 2.968769203133834,
+        "len": 0.9946084786539394,
+        "lcs": 0.9078334163780103
+    },
+    "leaderboard_result": 0.9078334163780103
+}

llmtf_eval_k0/darumeru_cp_sent_en.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

llmtf_eval_k0/darumeru_cp_sent_en_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 128,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "generate"
+    }
+}

llmtf_eval_k0/darumeru_cp_sent_en_total.jsonl ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "task_name": "darumeru/cp_sent_en",
+    "results": {
+        "symbol_per_token": 4.424738337449315,
+        "len": 0.9996416196590585,
+        "lcs": 0.9958136839407484
+    },
+    "leaderboard_result": 0.9996416196590585
+}

llmtf_eval_k0/darumeru_cp_sent_ru.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

llmtf_eval_k0/darumeru_cp_sent_ru_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 128,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "generate"
+    }
+}

llmtf_eval_k0/darumeru_cp_sent_ru_total.jsonl ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "task_name": "darumeru/cp_sent_ru",
+    "results": {
+        "symbol_per_token": 2.8277022347634286,
+        "len": 0.9903323908366956,
+        "lcs": 0.9539355441644095
+    },
+    "leaderboard_result": 0.9903323908366956
+}

llmtf_eval_k0/darumeru_ruMMLU.jsonl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:454e30175faf86134597baf9cad35c4c5a62bdc849eee8d85a27c472c0d729cb
+size 32909111

llmtf_eval_k0/darumeru_ruMMLU_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 64,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "calculate_tokens_proba"
+    }
+}

llmtf_eval_k0/darumeru_ruMMLU_total.jsonl ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+    "task_name": "darumeru/ruMMLU",
+    "results": {
+        "acc": 0.5046393295420533
+    },
+    "leaderboard_result": 0.5046393295420533
+}

llmtf_eval_k0/darumeru_ruOpenBookQA.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

llmtf_eval_k0/darumeru_ruOpenBookQA_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 64,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "calculate_tokens_proba"
+    }
+}

llmtf_eval_k0/darumeru_ruOpenBookQA_total.jsonl ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "task_name": "darumeru/ruOpenBookQA",
+    "results": {
+        "acc": 0.6924398625429553,
+        "f1_macro": 0.6928205333186971
+    },
+    "leaderboard_result": 0.6926301979308263
+}

llmtf_eval_k0/darumeru_ruTiE.jsonl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:52057ed1300597156320b34738e0b48e92b4112bbd55d3c9b283972df4eb6e15
+size 12832579

llmtf_eval_k0/darumeru_ruTiE_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 64,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "calculate_tokens_proba"
+    }
+}

llmtf_eval_k0/darumeru_ruTiE_total.jsonl ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+    "task_name": "darumeru/ruTiE",
+    "results": {
+        "acc": 0.3511627906976744
+    },
+    "leaderboard_result": 0.3511627906976744
+}

llmtf_eval_k0/darumeru_ruWorldTree.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

llmtf_eval_k0/darumeru_ruWorldTree_params.jsonl ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009,
+                198,
+                271
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 64,
+            "pad_token_id": 128001,
+            "stop_strings": [
+                "\n",
+                "\n\n"
+            ],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "calculate_tokens_proba"
+    }
+}

llmtf_eval_k0/darumeru_ruWorldTree_total.jsonl ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "task_name": "darumeru/ruWorldTree",
+    "results": {
+        "acc": 0.8476190476190476,
+        "f1_macro": 0.8445201637796824
+    },
+    "leaderboard_result": 0.8460696056993651
+}

llmtf_eval_k0/evaluation_log.txt ADDED Viewed

	@@ -0,0 +1,273 @@

+INFO: 2024-07-12 11:07:49,951: llmtf.base.evaluator: Starting eval on ['darumeru/multiq', 'darumeru/parus', 'darumeru/rcb', 'darumeru/ruopenbookqa', 'darumeru/rutie', 'darumeru/ruworldtree', 'darumeru/rwsd', 'darumeru/use', 'russiannlp/rucola_custom']
+INFO: 2024-07-12 11:07:49,953: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:07:49,953: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:07:51,044: llmtf.base.evaluator: Starting eval on ['darumeru/rummlu']
+INFO: 2024-07-12 11:07:51,045: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:07:51,045: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:07:53,196: llmtf.base.evaluator: Starting eval on ['nlpcoreteam/rummlu']
+INFO: 2024-07-12 11:07:53,197: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009]
+INFO: 2024-07-12 11:07:53,197: llmtf.base.hfmodel: Updated generation_config.stop_strings: []
+INFO: 2024-07-12 11:07:53,614: llmtf.base.darumeru/MultiQ: Loading Dataset: 3.66s
+INFO: 2024-07-12 11:07:54,515: llmtf.base.evaluator: Starting eval on ['nlpcoreteam/enmmlu']
+INFO: 2024-07-12 11:07:54,515: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009]
+INFO: 2024-07-12 11:07:54,515: llmtf.base.hfmodel: Updated generation_config.stop_strings: []
+INFO: 2024-07-12 11:07:57,115: llmtf.base.evaluator: Starting eval on ['daru/treewayabstractive']
+INFO: 2024-07-12 11:07:57,116: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:07:57,116: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:07:58,519: llmtf.base.evaluator: Starting eval on ['daru/treewayextractive']
+INFO: 2024-07-12 11:07:58,520: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009]
+INFO: 2024-07-12 11:07:58,520: llmtf.base.hfmodel: Updated generation_config.stop_strings: []
+INFO: 2024-07-12 11:07:59,295: llmtf.base.darumeru/ruMMLU: Loading Dataset: 8.25s
+INFO: 2024-07-12 11:08:00,328: llmtf.base.evaluator: Starting eval on ['darumeru/cp_sent_ru', 'darumeru/cp_sent_en', 'darumeru/cp_para_ru', 'darumeru/cp_para_en']
+INFO: 2024-07-12 11:08:00,328: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:08:00,328: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:08:01,857: llmtf.base.daru/treewayabstractive: Loading Dataset: 4.74s
+INFO: 2024-07-12 11:08:04,251: llmtf.base.darumeru/cp_sent_ru: Loading Dataset: 3.92s
+INFO: 2024-07-12 11:08:10,121: llmtf.base.daru/treewayextractive: Loading Dataset: 11.60s
+INFO: 2024-07-12 11:10:06,434: llmtf.base.nlpcoreteam/enMMLU: Loading Dataset: 131.92s
+INFO: 2024-07-12 11:10:07,629: llmtf.base.nlpcoreteam/ruMMLU: Loading Dataset: 134.43s
+INFO: 2024-07-12 11:14:10,567: llmtf.base.darumeru/ruMMLU: Processing Dataset: 371.27s
+INFO: 2024-07-12 11:14:10,571: llmtf.base.darumeru/ruMMLU: Results for darumeru/ruMMLU:
+INFO: 2024-07-12 11:14:10,592: llmtf.base.darumeru/ruMMLU: {'acc': 0.5046393295420533}
+INFO: 2024-07-12 11:14:10,628: llmtf.base.evaluator: Ended eval
+INFO: 2024-07-12 11:14:10,633: llmtf.base.evaluator:
+mean	darumeru/ruMMLU
+0.505	0.505
+INFO: 2024-07-12 11:17:48,926: llmtf.base.darumeru/cp_sent_ru: Processing Dataset: 584.67s
+INFO: 2024-07-12 11:17:48,928: llmtf.base.darumeru/cp_sent_ru: Results for darumeru/cp_sent_ru:
+INFO: 2024-07-12 11:17:48,948: llmtf.base.darumeru/cp_sent_ru: {'symbol_per_token': 2.8277022347634286, 'len': 0.9903323908366956, 'lcs': 0.9539355441644095}
+INFO: 2024-07-12 11:17:48,949: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:17:48,949: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:17:53,551: llmtf.base.darumeru/cp_sent_en: Loading Dataset: 4.60s
+INFO: 2024-07-12 11:18:10,281: llmtf.base.nlpcoreteam/enMMLU: Processing Dataset: 483.84s
+INFO: 2024-07-12 11:18:10,299: llmtf.base.nlpcoreteam/enMMLU: Results for nlpcoreteam/enMMLU:
+INFO: 2024-07-12 11:18:10,342: llmtf.base.nlpcoreteam/enMMLU:                                        metric
+subject
+abstract_algebra                     0.340000
+anatomy                              0.718519
+astronomy                            0.736842
+business_ethics                      0.720000
+clinical_knowledge                   0.735849
+college_biology                      0.791667
+college_chemistry                    0.470000
+college_computer_science             0.590000
+college_mathematics                  0.300000
+college_medicine                     0.653179
+college_physics                      0.480392
+computer_security                    0.760000
+conceptual_physics                   0.565957
+econometrics                         0.517544
+electrical_engineering               0.600000
+elementary_mathematics               0.481481
+formal_logic                         0.523810
+global_facts                         0.410000
+high_school_biology                  0.800000
+high_school_chemistry                0.551724
+high_school_computer_science         0.730000
+high_school_european_history         0.751515
+high_school_geography                0.828283
+high_school_government_and_politics  0.865285
+high_school_macroeconomics           0.633333
+high_school_mathematics              0.366667
+high_school_microeconomics           0.747899
+high_school_physics                  0.423841
+high_school_psychology               0.853211
+high_school_statistics               0.532407
+high_school_us_history               0.828431
+high_school_world_history            0.835443
+human_aging                          0.721973
+human_sexuality                      0.778626
+international_law                    0.760331
+jurisprudence                        0.796296
+logical_fallacies                    0.779141
+machine_learning                     0.455357
+management                           0.805825
+marketing                            0.893162
+medical_genetics                     0.780000
+miscellaneous                        0.837803
+moral_disputes                       0.690751
+moral_scenarios                      0.289385
+nutrition                            0.764706
+philosophy                           0.720257
+prehistory                           0.709877
+professional_accounting              0.531915
+professional_law                     0.479140
+professional_medicine                0.731618
+professional_psychology              0.674837
+public_relations                     0.654545
+security_studies                     0.714286
+sociology                            0.825871
+us_foreign_policy                    0.890000
+virology                             0.487952
+world_religions                      0.824561
+INFO: 2024-07-12 11:18:10,350: llmtf.base.nlpcoreteam/enMMLU:                                    metric
+subject
+STEM                             0.554241
+humanities                       0.691457
+other (business, health, misc.)  0.699464
+social sciences                  0.748643
+INFO: 2024-07-12 11:18:10,374: llmtf.base.nlpcoreteam/enMMLU: {'acc': 0.6734513449759852}
+INFO: 2024-07-12 11:18:10,406: llmtf.base.evaluator: Ended eval
+INFO: 2024-07-12 11:18:10,411: llmtf.base.evaluator:
+mean	darumeru/cp_sent_ru	darumeru/ruMMLU	nlpcoreteam/enMMLU
+0.723	0.990	0.505	0.673
+INFO: 2024-07-12 11:18:50,749: llmtf.base.nlpcoreteam/ruMMLU: Processing Dataset: 523.12s
+INFO: 2024-07-12 11:18:50,751: llmtf.base.nlpcoreteam/ruMMLU: Results for nlpcoreteam/ruMMLU:
+INFO: 2024-07-12 11:18:50,790: llmtf.base.nlpcoreteam/ruMMLU:                                        metric
+subject
+abstract_algebra                     0.290000
+anatomy                              0.459259
+astronomy                            0.657895
+business_ethics                      0.600000
+clinical_knowledge                   0.562264
+college_biology                      0.548611
+college_chemistry                    0.400000
+college_computer_science             0.470000
+college_mathematics                  0.330000
+college_medicine                     0.497110
+college_physics                      0.333333
+computer_security                    0.570000
+conceptual_physics                   0.493617
+econometrics                         0.342105
+electrical_engineering               0.531034
+elementary_mathematics               0.412698
+formal_logic                         0.380952
+global_facts                         0.350000
+high_school_biology                  0.635484
+high_school_chemistry                0.428571
+high_school_computer_science         0.620000
+high_school_european_history         0.715152
+high_school_geography                0.656566
+high_school_government_and_politics  0.595855
+high_school_macroeconomics           0.517949
+high_school_mathematics              0.348148
+high_school_microeconomics           0.495798
+high_school_physics                  0.350993
+high_school_psychology               0.667890
+high_school_statistics               0.458333
+high_school_us_history               0.661765
+high_school_world_history            0.708861
+human_aging                          0.556054
+human_sexuality                      0.664122
+international_law                    0.702479
+jurisprudence                        0.592593
+logical_fallacies                    0.527607
+machine_learning                     0.339286
+management                           0.669903
+marketing                            0.700855
+medical_genetics                     0.570000
+miscellaneous                        0.646232
+moral_disputes                       0.554913
+moral_scenarios                      0.248045
+nutrition                            0.594771
+philosophy                           0.565916
+prehistory                           0.558642
+professional_accounting              0.386525
+professional_law                     0.362451
+professional_medicine                0.522059
+professional_psychology              0.480392
+public_relations                     0.563636
+security_studies                     0.620408
+sociology                            0.696517
+us_foreign_policy                    0.770000
+virology                             0.415663
+world_religions                      0.690058
+INFO: 2024-07-12 11:18:50,798: llmtf.base.nlpcoreteam/ruMMLU:                                    metric
+subject
+STEM                             0.456556
+humanities                       0.559187
+other (business, health, misc.)  0.537907
+social sciences                  0.589270
+INFO: 2024-07-12 11:18:50,819: llmtf.base.nlpcoreteam/ruMMLU: {'acc': 0.5357299468552112}
+INFO: 2024-07-12 11:18:50,850: llmtf.base.evaluator: Ended eval
+INFO: 2024-07-12 11:18:50,856: llmtf.base.evaluator:
+mean	darumeru/cp_sent_ru	darumeru/ruMMLU	nlpcoreteam/enMMLU	nlpcoreteam/ruMMLU
+0.676	0.990	0.505	0.673	0.536
+INFO: 2024-07-12 11:19:25,952: llmtf.base.darumeru/MultiQ: Processing Dataset: 692.34s
+INFO: 2024-07-12 11:19:25,955: llmtf.base.darumeru/MultiQ: Results for darumeru/MultiQ:
+INFO: 2024-07-12 11:19:25,975: llmtf.base.darumeru/MultiQ: {'f1': 0.34566216745831274, 'em': 0.21510516252390058}
+INFO: 2024-07-12 11:19:25,980: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:19:25,980: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:19:27,975: llmtf.base.darumeru/PARus: Loading Dataset: 1.99s
+INFO: 2024-07-12 11:19:34,512: llmtf.base.darumeru/PARus: Processing Dataset: 6.54s
+INFO: 2024-07-12 11:19:34,513: llmtf.base.darumeru/PARus: Results for darumeru/PARus:
+INFO: 2024-07-12 11:19:34,540: llmtf.base.darumeru/PARus: {'acc': 0.66}
+INFO: 2024-07-12 11:19:34,542: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:19:34,542: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:19:36,333: llmtf.base.darumeru/RCB: Loading Dataset: 1.79s
+INFO: 2024-07-12 11:19:44,027: llmtf.base.darumeru/RCB: Processing Dataset: 7.69s
+INFO: 2024-07-12 11:19:44,028: llmtf.base.darumeru/RCB: Results for darumeru/RCB:
+INFO: 2024-07-12 11:19:44,035: llmtf.base.darumeru/RCB: {'acc': 0.5, 'f1_macro': 0.43018975381906}
+INFO: 2024-07-12 11:19:44,036: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:19:44,036: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:19:46,672: llmtf.base.darumeru/ruOpenBookQA: Loading Dataset: 2.63s
+INFO: 2024-07-12 11:21:04,051: llmtf.base.darumeru/ruOpenBookQA: Processing Dataset: 77.38s
+INFO: 2024-07-12 11:21:04,067: llmtf.base.darumeru/ruOpenBookQA: Results for darumeru/ruOpenBookQA:
+INFO: 2024-07-12 11:21:04,081: llmtf.base.darumeru/ruOpenBookQA: {'acc': 0.6924398625429553, 'f1_macro': 0.6928205333186971}
+INFO: 2024-07-12 11:21:04,089: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:21:04,089: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:21:11,537: llmtf.base.darumeru/ruTiE: Loading Dataset: 7.45s
+INFO: 2024-07-12 11:25:40,282: llmtf.base.darumeru/ruTiE: Processing Dataset: 268.74s
+INFO: 2024-07-12 11:25:40,283: llmtf.base.darumeru/ruTiE: Results for darumeru/ruTiE:
+INFO: 2024-07-12 11:25:40,361: llmtf.base.darumeru/ruTiE: {'acc': 0.3511627906976744}
+INFO: 2024-07-12 11:25:40,365: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:25:40,365: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:25:42,670: llmtf.base.darumeru/ruWorldTree: Loading Dataset: 2.30s
+INFO: 2024-07-12 11:25:46,171: llmtf.base.darumeru/ruWorldTree: Processing Dataset: 3.50s
+INFO: 2024-07-12 11:25:46,173: llmtf.base.darumeru/ruWorldTree: Results for darumeru/ruWorldTree:
+INFO: 2024-07-12 11:25:46,178: llmtf.base.darumeru/ruWorldTree: {'acc': 0.8476190476190476, 'f1_macro': 0.8445201637796824}
+INFO: 2024-07-12 11:25:46,179: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:25:46,179: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:25:48,322: llmtf.base.darumeru/RWSD: Loading Dataset: 2.14s
+INFO: 2024-07-12 11:25:53,464: llmtf.base.darumeru/cp_sent_en: Processing Dataset: 479.91s
+INFO: 2024-07-12 11:25:53,466: llmtf.base.darumeru/cp_sent_en: Results for darumeru/cp_sent_en:
+INFO: 2024-07-12 11:25:53,470: llmtf.base.darumeru/cp_sent_en: {'symbol_per_token': 4.424738337449315, 'len': 0.9996416196590585, 'lcs': 0.9958136839407484}
+INFO: 2024-07-12 11:25:53,471: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:25:53,471: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:25:55,479: llmtf.base.darumeru/RWSD: Processing Dataset: 7.16s
+INFO: 2024-07-12 11:25:55,481: llmtf.base.darumeru/RWSD: Results for darumeru/RWSD:
+INFO: 2024-07-12 11:25:55,485: llmtf.base.darumeru/RWSD: {'acc': 0.5441176470588235}
+INFO: 2024-07-12 11:25:55,486: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:25:55,486: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:25:57,669: llmtf.base.darumeru/cp_para_ru: Loading Dataset: 4.20s
+INFO: 2024-07-12 11:25:58,310: llmtf.base.darumeru/USE: Loading Dataset: 2.82s
+INFO: 2024-07-12 11:29:53,584: llmtf.base.daru/treewayextractive: Processing Dataset: 1303.46s
+INFO: 2024-07-12 11:29:53,601: llmtf.base.daru/treewayextractive: Results for daru/treewayextractive:
+INFO: 2024-07-12 11:29:53,850: llmtf.base.daru/treewayextractive: {'r-prec': 0.3960751082251082}
+INFO: 2024-07-12 11:29:54,328: llmtf.base.evaluator: Ended eval
+INFO: 2024-07-12 11:29:54,338: llmtf.base.evaluator:
+mean	daru/treewayextractive	darumeru/MultiQ	darumeru/PARus	darumeru/RCB	darumeru/RWSD	darumeru/cp_sent_en	darumeru/cp_sent_ru	darumeru/ruMMLU	darumeru/ruOpenBookQA	darumeru/ruTiE	darumeru/ruWorldTree	nlpcoreteam/enMMLU	nlpcoreteam/ruMMLU
+0.611	0.396	0.280	0.660	0.465	0.544	1.000	0.990	0.505	0.693	0.351	0.846	0.673	0.536
+INFO: 2024-07-12 11:30:30,009: llmtf.base.darumeru/USE: Processing Dataset: 271.70s
+INFO: 2024-07-12 11:30:30,010: llmtf.base.darumeru/USE: Results for darumeru/USE:
+INFO: 2024-07-12 11:30:30,016: llmtf.base.darumeru/USE: {'grade_norm': 0.14411764705882352}
+INFO: 2024-07-12 11:30:30,019: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009]
+INFO: 2024-07-12 11:30:30,019: llmtf.base.hfmodel: Updated generation_config.stop_strings: []
+INFO: 2024-07-12 11:30:34,123: llmtf.base.russiannlp/rucola_custom: Loading Dataset: 4.10s
+INFO: 2024-07-12 11:32:06,029: llmtf.base.russiannlp/rucola_custom: Processing Dataset: 91.90s
+INFO: 2024-07-12 11:32:06,034: llmtf.base.russiannlp/rucola_custom: Results for russiannlp/rucola_custom:
+INFO: 2024-07-12 11:32:06,045: llmtf.base.russiannlp/rucola_custom: {'acc': 0.7068532472192322, 'mcc': 0.2623100586905413}
+INFO: 2024-07-12 11:32:06,049: llmtf.base.evaluator: Ended eval
+INFO: 2024-07-12 11:32:06,089: llmtf.base.evaluator:
+mean	daru/treewayextractive	darumeru/MultiQ	darumeru/PARus	darumeru/RCB	darumeru/RWSD	darumeru/USE	darumeru/cp_sent_en	darumeru/cp_sent_ru	darumeru/ruMMLU	darumeru/ruOpenBookQA	darumeru/ruTiE	darumeru/ruWorldTree	nlpcoreteam/enMMLU	nlpcoreteam/ruMMLU	russiannlp/rucola_custom
+0.571	0.396	0.280	0.660	0.465	0.544	0.144	1.000	0.990	0.505	0.693	0.351	0.846	0.673	0.536	0.485
+INFO: 2024-07-12 11:38:34,822: llmtf.base.daru/treewayabstractive: Processing Dataset: 1832.96s
+INFO: 2024-07-12 11:38:34,826: llmtf.base.daru/treewayabstractive: Results for daru/treewayabstractive:
+INFO: 2024-07-12 11:38:34,829: llmtf.base.daru/treewayabstractive: {'rouge1': 0.35401411318813847, 'rouge2': 0.12752218193565362}
+INFO: 2024-07-12 11:38:34,832: llmtf.base.evaluator: Ended eval
+INFO: 2024-07-12 11:38:34,856: llmtf.base.evaluator:
+mean	daru/treewayabstractive	daru/treewayextractive	darumeru/MultiQ	darumeru/PARus	darumeru/RCB	darumeru/RWSD	darumeru/USE	darumeru/cp_sent_en	darumeru/cp_sent_ru	darumeru/ruMMLU	darumeru/ruOpenBookQA	darumeru/ruTiE	darumeru/ruWorldTree	nlpcoreteam/enMMLU	nlpcoreteam/ruMMLU	russiannlp/rucola_custom
+0.551	0.241	0.396	0.280	0.660	0.465	0.544	0.144	1.000	0.990	0.505	0.693	0.351	0.846	0.673	0.536	0.485
+INFO: 2024-07-12 11:38:48,843: llmtf.base.darumeru/cp_para_ru: Processing Dataset: 771.17s
+INFO: 2024-07-12 11:38:48,845: llmtf.base.darumeru/cp_para_ru: Results for darumeru/cp_para_ru:
+INFO: 2024-07-12 11:38:48,849: llmtf.base.darumeru/cp_para_ru: {'symbol_per_token': 2.968769203133834, 'len': 0.9946084786539394, 'lcs': 0.9078334163780103}
+INFO: 2024-07-12 11:38:48,850: llmtf.base.hfmodel: Updated generation_config.eos_token_id: [128001, 128009, 198, 271]
+INFO: 2024-07-12 11:38:48,850: llmtf.base.hfmodel: Updated generation_config.stop_strings: ['\n', '\n\n']
+INFO: 2024-07-12 11:38:53,153: llmtf.base.darumeru/cp_para_en: Loading Dataset: 4.30s
+INFO: 2024-07-12 11:49:13,434: llmtf.base.darumeru/cp_para_en: Processing Dataset: 620.28s
+INFO: 2024-07-12 11:49:13,451: llmtf.base.darumeru/cp_para_en: Results for darumeru/cp_para_en:
+INFO: 2024-07-12 11:49:13,455: llmtf.base.darumeru/cp_para_en: {'symbol_per_token': 4.482081117192222, 'len': 0.9950333263716172, 'lcs': 0.9677363847232712}
+INFO: 2024-07-12 11:49:13,455: llmtf.base.evaluator: Ended eval
+INFO: 2024-07-12 11:49:13,483: llmtf.base.evaluator:
+mean	daru/treewayabstractive	daru/treewayextractive	darumeru/MultiQ	darumeru/PARus	darumeru/RCB	darumeru/RWSD	darumeru/USE	darumeru/cp_para_en	darumeru/cp_para_ru	darumeru/cp_sent_en	darumeru/cp_sent_ru	darumeru/ruMMLU	darumeru/ruOpenBookQA	darumeru/ruTiE	darumeru/ruWorldTree	nlpcoreteam/enMMLU	nlpcoreteam/ruMMLU	russiannlp/rucola_custom
+0.594	0.241	0.396	0.280	0.660	0.465	0.544	0.144	0.968	0.908	1.000	0.990	0.505	0.693	0.351	0.846	0.673	0.536	0.485

llmtf_eval_k0/evaluation_results.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ mean daru/treewayabstractive daru/treewayextractive darumeru/MultiQ darumeru/PARus darumeru/RCB darumeru/RWSD darumeru/USE darumeru/cp_para_en darumeru/cp_para_ru darumeru/cp_sent_en darumeru/cp_sent_ru darumeru/ruMMLU darumeru/ruOpenBookQA darumeru/ruTiE darumeru/ruWorldTree nlpcoreteam/enMMLU nlpcoreteam/ruMMLU russiannlp/rucola_custom
2	+ 0.594 0.241 0.396 0.280 0.660 0.465 0.544 0.144 0.968 0.908 1.000 0.990 0.505 0.693 0.351 0.846 0.673 0.536 0.485

llmtf_eval_k0/nlpcoreteam_enMMLU.jsonl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7a3488fe16dd4c6cc5496a219929273e2746e659cceba1baa45750cf002c05f5
+size 38085342

llmtf_eval_k0/nlpcoreteam_enMMLU_params.jsonl ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+    "custom_generation_config": null,
+    "model_params": {
+        "model_name_or_path": "NousResearch/Meta-Llama-3-8B-Instruct",
+        "generation_config": {
+            "bos_token_id": 128000,
+            "do_sample": true,
+            "eos_token_id": [
+                128001,
+                128009
+            ],
+            "max_length": 8192,
+            "max_new_tokens": 64,
+            "pad_token_id": 128001,
+            "stop_strings": [],
+            "temperature": 0.1,
+            "top_k": 40,
+            "top_p": 0.9,
+            "transformers_version": "4.38.2",
+            "trust_remote_code": [
+                false
+            ]
+        },
+        "conversation_template": {
+            "system_prompt": "",
+            "system_message_template": "",
+            "user_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}<|eot_id|>",
+            "bot_message_template_incomplete": "<|start_header_id|>{role}<|end_header_id|>\n\n{content}",
+            "user_role": "user",
+            "bot_role": "assistant",
+            "system_role": "system",
+            "global_prefix": "<|begin_of_text|>",
+            "suffix": "<|start_header_id|>assistant<|end_header_id|>\n\n",
+            "add_special_tokens": false,
+            "eos_token": "<|eot_id|>"
+        },
+        "load_in_8bit": false,
+        "torch_dtype": "auto",
+        "use_flash_attention_2": true,
+        "device_map": "cuda:0",
+        "use_fast_tokenizer": true,
+        "leading_space": false,
+        "space_token": null,
+        "trust_remote_code": [
+            false
+        ],
+        "max_model_len": 8192
+    },
+    "task_params": {
+        "max_len": 4000,
+        "few_shot_count": 0,
+        "batch_size": 1,
+        "max_sample_per_dataset": 10000000000000,
+        "method": "calculate_tokens_proba"
+    }
+}