Spaces:

orbtailwaves23
/

open_dutch_llm_leaderboard

Sleeping

App Files Files Community

Bram Vanroy committed on Dec 13, 2023

Commit

351f9fe

1 Parent(s): b1e6575

add correct evals:

Browse files

Files changed (1) hide show

evals/models.json +53 -45

evals/models.json CHANGED Viewed

@@ -1,122 +1,130 @@
 {
     "gpt-neo-1.3b-dutch": {
         "compute_dtype": "bfloat16",
         "model_name": "yhavinga/gpt-neo-1.3B-dutch",
-        "num_parameters": 1315575808,
-        "quantization": "8-bit",
         "model_type": "pretrained",
-        "dutch_coverage": "pretrained"
     },
     "gpt-neo-125m-dutch": {
         "compute_dtype": "bfloat16",
         "model_name": "yhavinga/gpt-neo-125M-dutch",
-        "num_parameters": 125198592,
-        "quantization": "8-bit",
         "model_type": "pretrained",
-        "dutch_coverage": "pretrained"
     },
     "gpt2-large-dutch": {
         "compute_dtype": "bfloat16",
         "model_name": "yhavinga/gpt2-large-dutch",
-        "num_parameters": 774030080,
-        "quantization": "8-bit",
         "model_type": "pretrained",
-        "dutch_coverage": "pretrained"
     },
     "gpt2-medium-dutch": {
         "compute_dtype": "bfloat16",
         "model_name": "yhavinga/gpt2-medium-dutch",
-        "num_parameters": 354823168,
-        "quantization": "8-bit",
         "model_type": "pretrained",
-        "dutch_coverage": "pretrained"
     },
     "llama-2-13b-chat-dutch": {
         "compute_dtype": "bfloat16",
         "model_name": "BramVanroy/Llama-2-13b-chat-dutch",
-        "num_parameters": 13015864320,
-        "quantization": "8-bit",
         "model_type": "instruction-tuned",
-        "dutch_coverage": "fine-tuned"
     },
     "llama-2-13b-chat-hf": {
         "compute_dtype": "bfloat16",
         "model_name": "meta-llama/Llama-2-13b-chat-hf",
-        "num_parameters": 13015864320,
-        "quantization": "8-bit",
         "model_type": "instruction-tuned",
-        "dutch_coverage": "none"
     },
     "llama-2-13b-hf": {
         "compute_dtype": "bfloat16",
         "model_name": "meta-llama/Llama-2-13b-hf",
-        "num_parameters": 13015864320,
-        "quantization": "8-bit",
         "model_type": "pretrained",
-        "dutch_coverage": "none"
     },
     "llama-2-7b-chat-hf": {
         "compute_dtype": "bfloat16",
         "model_name": "meta-llama/Llama-2-7b-chat-hf",
-        "num_parameters": 6738415616,
-        "quantization": "8-bit",
         "model_type": "instruction-tuned",
-        "dutch_coverage": "none"
     },
     "llama-2-7b-hf": {
         "compute_dtype": "bfloat16",
         "model_name": "meta-llama/Llama-2-7b-hf",
-        "num_parameters": 6738415616,
-        "quantization": "8-bit",
         "model_type": "pretrained",
-        "dutch_coverage": "none"
     },
     "llama2-13b-ft-mc4_nl_cleaned_tiny": {
         "compute_dtype": "bfloat16",
         "model_name": "BramVanroy/llama2-13b-ft-mc4_nl_cleaned_tiny",
-        "num_parameters": 13015864320,
-        "quantization": "8-bit",
         "model_type": "fine-tuned",
-        "dutch_coverage": "fine-tuned"
     },
     "mistral-7b-v0.1": {
         "compute_dtype": "bfloat16",
         "model_name": "mistralai/Mistral-7B-v0.1",
-        "num_parameters": 7241732096,
-        "quantization": "8-bit",
         "model_type": "pretrained",
-        "dutch_coverage": "none"
     },
     "neural-chat-7b-v3-1": {
         "compute_dtype": "bfloat16",
         "model_name": "Intel/neural-chat-7b-v3-1",
-        "num_parameters": 7241732096,
-        "quantization": "8-bit",
         "model_type": "RL-tuned",
-        "dutch_coverage": "none"
     },
     "orca-2-13b": {
         "compute_dtype": "bfloat16",
         "model_name": "microsoft/Orca-2-13b",
-        "num_parameters": 13015895040,
-        "quantization": "8-bit",
         "model_type": "fine-tuned",
-        "dutch_coverage": "none"
     },
     "orca-2-7b": {
         "compute_dtype": "bfloat16",
         "model_name": "microsoft/Orca-2-7b",
-        "num_parameters": 6738440192,
-        "quantization": "8-bit",
         "model_type": "fine-tuned",
-        "dutch_coverage": "none"
     },
     "zephyr-7b-beta": {
         "compute_dtype": "bfloat16",
         "model_name": "HuggingFaceH4/zephyr-7b-beta",
-        "num_parameters": 7241732096,
-        "quantization": "8-bit",
         "model_type": "RL-tuned",
-        "dutch_coverage": "none"
     }
 }

 {
     "gpt-neo-1.3b-dutch": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "pretrained",
         "model_name": "yhavinga/gpt-neo-1.3B-dutch",
         "model_type": "pretrained",
+        "num_parameters": 1315575808,
+        "quantization": "8-bit"
     },
     "gpt-neo-125m-dutch": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "pretrained",
         "model_name": "yhavinga/gpt-neo-125M-dutch",
         "model_type": "pretrained",
+        "num_parameters": 125198592,
+        "quantization": "8-bit"
     },
     "gpt2-large-dutch": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "pretrained",
         "model_name": "yhavinga/gpt2-large-dutch",
         "model_type": "pretrained",
+        "num_parameters": 774030080,
+        "quantization": "8-bit"
     },
     "gpt2-medium-dutch": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "pretrained",
         "model_name": "yhavinga/gpt2-medium-dutch",
         "model_type": "pretrained",
+        "num_parameters": 354823168,
+        "quantization": "8-bit"
     },
     "llama-2-13b-chat-dutch": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "fine-tuned",
         "model_name": "BramVanroy/Llama-2-13b-chat-dutch",
         "model_type": "instruction-tuned",
+        "num_parameters": 13015864320,
+        "quantization": "8-bit"
     },
     "llama-2-13b-chat-hf": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "none",
         "model_name": "meta-llama/Llama-2-13b-chat-hf",
         "model_type": "instruction-tuned",
+        "num_parameters": 13015864320,
+        "quantization": "8-bit"
     },
     "llama-2-13b-hf": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "none",
         "model_name": "meta-llama/Llama-2-13b-hf",
         "model_type": "pretrained",
+        "num_parameters": 13015864320,
+        "quantization": "8-bit"
     },
     "llama-2-7b-chat-hf": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "none",
         "model_name": "meta-llama/Llama-2-7b-chat-hf",
         "model_type": "instruction-tuned",
+        "num_parameters": 6738415616,
+        "quantization": "8-bit"
     },
     "llama-2-7b-hf": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "none",
         "model_name": "meta-llama/Llama-2-7b-hf",
         "model_type": "pretrained",
+        "num_parameters": 6738415616,
+        "quantization": "8-bit"
     },
     "llama2-13b-ft-mc4_nl_cleaned_tiny": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "fine-tuned",
         "model_name": "BramVanroy/llama2-13b-ft-mc4_nl_cleaned_tiny",
         "model_type": "fine-tuned",
+        "num_parameters": 13015864320,
+        "quantization": "8-bit"
     },
     "mistral-7b-v0.1": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "none",
         "model_name": "mistralai/Mistral-7B-v0.1",
         "model_type": "pretrained",
+        "num_parameters": 7241732096,
+        "quantization": "8-bit"
+    },
+    "mixtral-8x7b-v0.1": {
+        "compute_dtype": "auto",
+        "dutch_coverage": "not-given",
+        "model_name": "mistralai/Mixtral-8x7B-v0.1",
+        "model_type": "not-given",
+        "num_parameters": 46702792704,
+        "quantization": null
     },
     "neural-chat-7b-v3-1": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "none",
         "model_name": "Intel/neural-chat-7b-v3-1",
         "model_type": "RL-tuned",
+        "num_parameters": 7241732096,
+        "quantization": "8-bit"
     },
     "orca-2-13b": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "none",
         "model_name": "microsoft/Orca-2-13b",
         "model_type": "fine-tuned",
+        "num_parameters": 13015895040,
+        "quantization": "8-bit"
     },
     "orca-2-7b": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "none",
         "model_name": "microsoft/Orca-2-7b",
         "model_type": "fine-tuned",
+        "num_parameters": 6738440192,
+        "quantization": "8-bit"
     },
     "zephyr-7b-beta": {
         "compute_dtype": "bfloat16",
+        "dutch_coverage": "none",
         "model_name": "HuggingFaceH4/zephyr-7b-beta",
         "model_type": "RL-tuned",
+        "num_parameters": 7241732096,
+        "quantization": "8-bit"
     }
 }