Spaces:
Sleeping
Sleeping
feat: add Mistral-Small-3.1-24B-Instruct-2503 model and Phi-4 (#1806)
Browse files- chart/env/prod.yaml +51 -36
chart/env/prod.yaml
CHANGED
|
@@ -300,6 +300,36 @@ envVars:
|
|
| 300 |
}
|
| 301 |
]
|
| 302 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 303 |
{
|
| 304 |
"name": "meta-llama/Llama-3.2-11B-Vision-Instruct",
|
| 305 |
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/meta-logo.png",
|
|
@@ -370,40 +400,11 @@ envVars:
|
|
| 370 |
}
|
| 371 |
},
|
| 372 |
{
|
| 373 |
-
"name": "mistralai/Mistral-Nemo-Instruct-2407",
|
| 374 |
-
"
|
| 375 |
-
"description": "A small model with good capabilities in language understanding and commonsense reasoning.",
|
| 376 |
-
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/mistral-logo.png",
|
| 377 |
-
"websiteUrl": "https://mistral.ai/news/mistral-nemo/",
|
| 378 |
-
"modelUrl": "https://huggingface.co/mistralai/Mistral-Nemo-Instruct-2407",
|
| 379 |
-
"preprompt": "",
|
| 380 |
-
"parameters": {
|
| 381 |
-
"stop": ["</s>"],
|
| 382 |
-
"temperature": 0.6,
|
| 383 |
-
"truncate": 14336,
|
| 384 |
-
"max_new_tokens": 1536
|
| 385 |
-
},
|
| 386 |
-
"promptExamples": [
|
| 387 |
-
{
|
| 388 |
-
"title": "Write an email",
|
| 389 |
-
"prompt": "As a restaurant owner, write a professional email to the supplier to get these products every week: \n\n- Wine (x10)\n- Eggs (x24)\n- Bread (x12)"
|
| 390 |
-
},
|
| 391 |
-
{
|
| 392 |
-
"title": "Code a game",
|
| 393 |
-
"prompt": "Code a basic snake game in python, give explanations for each step."
|
| 394 |
-
},
|
| 395 |
-
{
|
| 396 |
-
"title": "Recipe help",
|
| 397 |
-
"prompt": "How do I make a delicious lemon cheesecake?"
|
| 398 |
-
}
|
| 399 |
-
]
|
| 400 |
-
},
|
| 401 |
-
{
|
| 402 |
-
"name": "microsoft/Phi-3.5-mini-instruct",
|
| 403 |
-
"description": "One of the best small models (3.8B parameters), super fast for simple tasks.",
|
| 404 |
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/microsoft-logo.png",
|
| 405 |
-
"modelUrl": "https://huggingface.co/microsoft/Phi-3.5-mini-instruct",
|
| 406 |
-
"websiteUrl": "https://techcommunity.microsoft.com/
|
| 407 |
"preprompt": "",
|
| 408 |
"parameters": {
|
| 409 |
"stop": ["<|end|>", "<|endoftext|>", "<|assistant|>"],
|
|
@@ -424,6 +425,12 @@ envVars:
|
|
| 424 |
"title": "Recipe help",
|
| 425 |
"prompt": "How do I make a delicious lemon cheesecake?"
|
| 426 |
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 427 |
]
|
| 428 |
},
|
| 429 |
{
|
|
@@ -471,7 +478,7 @@ envVars:
|
|
| 471 |
},
|
| 472 |
{
|
| 473 |
"name": "mistralai/Mixtral-8x7B-Instruct-v0.1",
|
| 474 |
-
"transferTo": "mistralai/Mistral-Nemo-Instruct-2407"
|
| 475 |
},
|
| 476 |
{
|
| 477 |
"name": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
|
|
@@ -479,11 +486,11 @@ envVars:
|
|
| 479 |
},
|
| 480 |
{
|
| 481 |
"name": "mistralai/Mistral-7B-Instruct-v0.3",
|
| 482 |
-
"transferTo": "mistralai/Mistral-Nemo-Instruct-2407"
|
| 483 |
},
|
| 484 |
{
|
| 485 |
"name": "microsoft/Phi-3-mini-4k-instruct",
|
| 486 |
-
"transferTo": "microsoft/Phi-3.5-mini-instruct"
|
| 487 |
},
|
| 488 |
{
|
| 489 |
"name": "meta-llama/Meta-Llama-3.1-70B-Instruct",
|
|
@@ -492,6 +499,14 @@ envVars:
|
|
| 492 |
{
|
| 493 |
"name": "Qwen/QwQ-32B-Preview",
|
| 494 |
"transferTo": "Qwen/QwQ-32B"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 495 |
}
|
| 496 |
]
|
| 497 |
PUBLIC_ORIGIN: "https://huggingface.co"
|
|
|
|
| 300 |
}
|
| 301 |
]
|
| 302 |
},
|
| 303 |
+
{
|
| 304 |
+
"name": "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
|
| 305 |
+
"displayName": "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
|
| 306 |
+
"description": "A small model with good capabilities in language understanding and commonsense reasoning.",
|
| 307 |
+
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/mistral-logo.png",
|
| 308 |
+
"websiteUrl": "https://mistral.ai/news/mistral-small-3-1",
|
| 309 |
+
"modelUrl": "https://huggingface.co/mistralai/Mistral-Small-3.1-24B-Instruct-2503",
|
| 310 |
+
"preprompt": "",
|
| 311 |
+
"promptExamples": [
|
| 312 |
+
{
|
| 313 |
+
"title": "Write an email",
|
| 314 |
+
"prompt": "As a restaurant owner, write a professional email to the supplier to get these products every week: \n\n- Wine (x10)\n- Eggs (x24)\n- Bread (x12)"
|
| 315 |
+
},
|
| 316 |
+
{
|
| 317 |
+
"title": "Code a game",
|
| 318 |
+
"prompt": "Code a basic snake game in python, give explanations for each step."
|
| 319 |
+
},
|
| 320 |
+
{
|
| 321 |
+
"title": "Recipe help",
|
| 322 |
+
"prompt": "How do I make a delicious lemon cheesecake?"
|
| 323 |
+
}
|
| 324 |
+
],
|
| 325 |
+
|
| 326 |
+
"endpoints": [
|
| 327 |
+
{
|
| 328 |
+
"type": "openai",
|
| 329 |
+
"baseURL": "https://hkjfqcryevvq9cie.us-east-1.aws.endpoints.huggingface.cloud/v1"
|
| 330 |
+
}
|
| 331 |
+
]
|
| 332 |
+
},
|
| 333 |
{
|
| 334 |
"name": "meta-llama/Llama-3.2-11B-Vision-Instruct",
|
| 335 |
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/meta-logo.png",
|
|
|
|
| 400 |
}
|
| 401 |
},
|
| 402 |
{
|
| 403 |
+
"name": "microsoft/Phi-4",
|
| 404 |
+
"description": "One of the best small models, super fast for simple tasks.",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 405 |
"logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/microsoft-logo.png",
|
| 406 |
+
"modelUrl": "https://huggingface.co/microsoft/Phi-4",
|
| 407 |
+
"websiteUrl": "https://techcommunity.microsoft.com/blog/aiplatformblog/introducing-phi-4-microsoft%E2%80%99s-newest-small-language-model-specializing-in-comple/4357090",
|
| 408 |
"preprompt": "",
|
| 409 |
"parameters": {
|
| 410 |
"stop": ["<|end|>", "<|endoftext|>", "<|assistant|>"],
|
|
|
|
| 425 |
"title": "Recipe help",
|
| 426 |
"prompt": "How do I make a delicious lemon cheesecake?"
|
| 427 |
}
|
| 428 |
+
],
|
| 429 |
+
"endpoints": [
|
| 430 |
+
{
|
| 431 |
+
"type": "openai",
|
| 432 |
+
"baseURL": "https://up5ijetg6a2e9zlb.us-east-1.aws.endpoints.huggingface.cloud/v1"
|
| 433 |
+
}
|
| 434 |
]
|
| 435 |
},
|
| 436 |
{
|
|
|
|
| 478 |
},
|
| 479 |
{
|
| 480 |
"name": "mistralai/Mixtral-8x7B-Instruct-v0.1",
|
| 481 |
+
"transferTo": "mistralai/Mistral-Small-3.1-24B-Instruct-2503"
|
| 482 |
},
|
| 483 |
{
|
| 484 |
"name": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
|
|
|
|
| 486 |
},
|
| 487 |
{
|
| 488 |
"name": "mistralai/Mistral-7B-Instruct-v0.3",
|
| 489 |
+
"transferTo": "mistralai/Mistral-Small-3.1-24B-Instruct-2503"
|
| 490 |
},
|
| 491 |
{
|
| 492 |
"name": "microsoft/Phi-3-mini-4k-instruct",
|
| 493 |
+
"transferTo": "microsoft/Phi-4"
|
| 494 |
},
|
| 495 |
{
|
| 496 |
"name": "meta-llama/Meta-Llama-3.1-70B-Instruct",
|
|
|
|
| 499 |
{
|
| 500 |
"name": "Qwen/QwQ-32B-Preview",
|
| 501 |
"transferTo": "Qwen/QwQ-32B"
|
| 502 |
+
},
|
| 503 |
+
{
|
| 504 |
+
"name": "mistralai/Mistral-Nemo-Instruct-2407",
|
| 505 |
+
"transferTo": "mistralai/Mistral-Small-3.1-24B-Instruct-2503"
|
| 506 |
+
},
|
| 507 |
+
{
|
| 508 |
+
"name": "microsoft/Phi-3.5-mini-instruct",
|
| 509 |
+
"transferTo": "microsoft/Phi-4"
|
| 510 |
}
|
| 511 |
]
|
| 512 |
PUBLIC_ORIGIN: "https://huggingface.co"
|