Spaces:
Paused
Paused
config(hchat): move Qwen 2.5 72B first (#1580)
Browse files
- chart/env/prod.yaml +29 -29
chart/env/prod.yaml
CHANGED
|
@@ -48,6 +48,35 @@ envVars:
|
|
| 48 |
METRICS_ENABLED: "true"
|
| 49 |
MODELS: >
|
| 50 |
[
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 51 |
{
|
| 52 |
"name": "meta-llama/Meta-Llama-3.1-70B-Instruct",
|
| 53 |
"id": "meta-llama/Meta-Llama-3.1-70B-Instruct",
|
|
@@ -108,35 +137,6 @@ envVars:
|
|
| 108 |
}
|
| 109 |
]
|
| 110 |
},
|
| 111 |
-
{
|
| 112 |
-
"name": "Qwen/Qwen2.5-72B-Instruct",
|
| 113 |
-
"tokenizer": "Qwen/Qwen2.5-72B-Instruct",
|
| 114 |
-
"description": "The latest Qwen open model with improved role-playing, long text generation and structured data understanding.",
|
| 115 |
-
"modelUrl": "https://huggingface.co/Qwen/Qwen2.5-72B-Instruct",
|
| 116 |
-
"websiteUrl": "https://qwenlm.github.io/blog/qwen2.5/",
|
| 117 |
-
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/qwen-logo.png",
|
| 118 |
-
"preprompt": "You are Qwen, created by Alibaba Cloud. You are a helpful assistant.",
|
| 119 |
-
"parameters": {
|
| 120 |
-
"stop": ["<|endoftext|>", "<|im_end|>"],
|
| 121 |
-
"temperature": 0.6,
|
| 122 |
-
"truncate": 28672,
|
| 123 |
-
"max_new_tokens": 3072
|
| 124 |
-
},
|
| 125 |
-
"promptExamples": [
|
| 126 |
-
{
|
| 127 |
-
"title": "Write an email from bullet list",
|
| 128 |
-
"prompt": "As a restaurant owner, write a professional email to the supplier to get these products every week: \n\n- Wine (x10)\n- Eggs (x24)\n- Bread (x12)"
|
| 129 |
-
},
|
| 130 |
-
{
|
| 131 |
-
"title": "Code a snake game",
|
| 132 |
-
"prompt": "Code a basic snake game in python, give explanations for each step."
|
| 133 |
-
},
|
| 134 |
-
{
|
| 135 |
-
"title": "Assist in a task",
|
| 136 |
-
"prompt": "How do I make a delicious lemon cheesecake?"
|
| 137 |
-
}
|
| 138 |
-
]
|
| 139 |
-
},
|
| 140 |
{
|
| 141 |
"name": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF",
|
| 142 |
"tokenizer": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF",
|
|
|
|
| 48 |
METRICS_ENABLED: "true"
|
| 49 |
MODELS: >
|
| 50 |
[
|
| 51 |
+
{
|
| 52 |
+
"name": "Qwen/Qwen2.5-72B-Instruct",
|
| 53 |
+
"tokenizer": "Qwen/Qwen2.5-72B-Instruct",
|
| 54 |
+
"description": "The latest Qwen open model with improved role-playing, long text generation and structured data understanding.",
|
| 55 |
+
"modelUrl": "https://huggingface.co/Qwen/Qwen2.5-72B-Instruct",
|
| 56 |
+
"websiteUrl": "https://qwenlm.github.io/blog/qwen2.5/",
|
| 57 |
+
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/qwen-logo.png",
|
| 58 |
+
"preprompt": "You are Qwen, created by Alibaba Cloud. You are a helpful assistant.",
|
| 59 |
+
"parameters": {
|
| 60 |
+
"stop": ["<|endoftext|>", "<|im_end|>"],
|
| 61 |
+
"temperature": 0.6,
|
| 62 |
+
"truncate": 28672,
|
| 63 |
+
"max_new_tokens": 3072
|
| 64 |
+
},
|
| 65 |
+
"promptExamples": [
|
| 66 |
+
{
|
| 67 |
+
"title": "Write an email from bullet list",
|
| 68 |
+
"prompt": "As a restaurant owner, write a professional email to the supplier to get these products every week: \n\n- Wine (x10)\n- Eggs (x24)\n- Bread (x12)"
|
| 69 |
+
},
|
| 70 |
+
{
|
| 71 |
+
"title": "Code a snake game",
|
| 72 |
+
"prompt": "Code a basic snake game in python, give explanations for each step."
|
| 73 |
+
},
|
| 74 |
+
{
|
| 75 |
+
"title": "Assist in a task",
|
| 76 |
+
"prompt": "How do I make a delicious lemon cheesecake?"
|
| 77 |
+
}
|
| 78 |
+
]
|
| 79 |
+
},
|
| 80 |
{
|
| 81 |
"name": "meta-llama/Meta-Llama-3.1-70B-Instruct",
|
| 82 |
"id": "meta-llama/Meta-Llama-3.1-70B-Instruct",
|
|
|
|
| 137 |
}
|
| 138 |
]
|
| 139 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 140 |
{
|
| 141 |
"name": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF",
|
| 142 |
"tokenizer": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF",
|