nsarrazin committed on
Commit
9111ea7
·
unverified ·
1 Parent(s): 7ba01e9

feat: add Mistral-Small-3.1-24B-Instruct-2503 model and Phi-4 (#1806)

Browse files
Files changed (1) hide show
  1. chart/env/prod.yaml +51 -36
chart/env/prod.yaml CHANGED
@@ -300,6 +300,36 @@ envVars:
300
  }
301
  ]
302
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
303
  {
304
  "name": "meta-llama/Llama-3.2-11B-Vision-Instruct",
305
  "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/meta-logo.png",
@@ -370,40 +400,11 @@ envVars:
370
  }
371
  },
372
  {
373
- "name": "mistralai/Mistral-Nemo-Instruct-2407",
374
- "displayName": "mistralai/Mistral-Nemo-Instruct-2407",
375
- "description": "A small model with good capabilities in language understanding and commonsense reasoning.",
376
- "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/mistral-logo.png",
377
- "websiteUrl": "https://mistral.ai/news/mistral-nemo/",
378
- "modelUrl": "https://huggingface.co/mistralai/Mistral-Nemo-Instruct-2407",
379
- "preprompt": "",
380
- "parameters": {
381
- "stop": ["</s>"],
382
- "temperature": 0.6,
383
- "truncate": 14336,
384
- "max_new_tokens": 1536
385
- },
386
- "promptExamples": [
387
- {
388
- "title": "Write an email",
389
- "prompt": "As a restaurant owner, write a professional email to the supplier to get these products every week: \n\n- Wine (x10)\n- Eggs (x24)\n- Bread (x12)"
390
- },
391
- {
392
- "title": "Code a game",
393
- "prompt": "Code a basic snake game in python, give explanations for each step."
394
- },
395
- {
396
- "title": "Recipe help",
397
- "prompt": "How do I make a delicious lemon cheesecake?"
398
- }
399
- ]
400
- },
401
- {
402
- "name": "microsoft/Phi-3.5-mini-instruct",
403
- "description": "One of the best small models (3.8B parameters), super fast for simple tasks.",
404
  "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/microsoft-logo.png",
405
- "modelUrl": "https://huggingface.co/microsoft/Phi-3.5-mini-instruct",
406
- "websiteUrl": "https://techcommunity.microsoft.com/t5/ai-azure-ai-services-blog/discover-the-new-multi-lingual-high-quality-phi-3-5-slms/ba-p/4225280/",
407
  "preprompt": "",
408
  "parameters": {
409
  "stop": ["<|end|>", "<|endoftext|>", "<|assistant|>"],
@@ -424,6 +425,12 @@ envVars:
424
  "title": "Recipe help",
425
  "prompt": "How do I make a delicious lemon cheesecake?"
426
  }
 
 
 
 
 
 
427
  ]
428
  },
429
  {
@@ -471,7 +478,7 @@ envVars:
471
  },
472
  {
473
  "name": "mistralai/Mixtral-8x7B-Instruct-v0.1",
474
- "transferTo": "mistralai/Mistral-Nemo-Instruct-2407"
475
  },
476
  {
477
  "name": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
@@ -479,11 +486,11 @@ envVars:
479
  },
480
  {
481
  "name": "mistralai/Mistral-7B-Instruct-v0.3",
482
- "transferTo": "mistralai/Mistral-Nemo-Instruct-2407"
483
  },
484
  {
485
  "name": "microsoft/Phi-3-mini-4k-instruct",
486
- "transferTo": "microsoft/Phi-3.5-mini-instruct"
487
  },
488
  {
489
  "name": "meta-llama/Meta-Llama-3.1-70B-Instruct",
@@ -492,6 +499,14 @@ envVars:
492
  {
493
  "name": "Qwen/QwQ-32B-Preview",
494
  "transferTo": "Qwen/QwQ-32B"
 
 
 
 
 
 
 
 
495
  }
496
  ]
497
  PUBLIC_ORIGIN: "https://huggingface.co"
 
300
  }
301
  ]
302
  },
303
+ {
304
+ "name": "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
305
+ "displayName": "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
306
+ "description": "A small model with good capabilities in language understanding and commonsense reasoning.",
307
+ "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/mistral-logo.png",
308
+ "websiteUrl": "https://mistral.ai/news/mistral-small-3-1",
309
+ "modelUrl": "https://huggingface.co/mistralai/Mistral-Small-3.1-24B-Instruct-2503",
310
+ "preprompt": "",
311
+ "promptExamples": [
312
+ {
313
+ "title": "Write an email",
314
+ "prompt": "As a restaurant owner, write a professional email to the supplier to get these products every week: \n\n- Wine (x10)\n- Eggs (x24)\n- Bread (x12)"
315
+ },
316
+ {
317
+ "title": "Code a game",
318
+ "prompt": "Code a basic snake game in python, give explanations for each step."
319
+ },
320
+ {
321
+ "title": "Recipe help",
322
+ "prompt": "How do I make a delicious lemon cheesecake?"
323
+ }
324
+ ],
325
+
326
+ "endpoints": [
327
+ {
328
+ "type": "openai",
329
+ "baseURL": "https://hkjfqcryevvq9cie.us-east-1.aws.endpoints.huggingface.cloud/v1"
330
+ }
331
+ ]
332
+ },
333
  {
334
  "name": "meta-llama/Llama-3.2-11B-Vision-Instruct",
335
  "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/meta-logo.png",
 
400
  }
401
  },
402
  {
403
+ "name": "microsoft/Phi-4",
404
+ "description": "One of the best small models, super fast for simple tasks.",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
405
  "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/microsoft-logo.png",
406
+ "modelUrl": "https://huggingface.co/microsoft/Phi-4",
407
+ "websiteUrl": "https://techcommunity.microsoft.com/blog/aiplatformblog/introducing-phi-4-microsoft%E2%80%99s-newest-small-language-model-specializing-in-comple/4357090",
408
  "preprompt": "",
409
  "parameters": {
410
  "stop": ["<|end|>", "<|endoftext|>", "<|assistant|>"],
 
425
  "title": "Recipe help",
426
  "prompt": "How do I make a delicious lemon cheesecake?"
427
  }
428
+ ],
429
+ "endpoints": [
430
+ {
431
+ "type": "openai",
432
+ "baseURL": "https://up5ijetg6a2e9zlb.us-east-1.aws.endpoints.huggingface.cloud/v1"
433
+ }
434
  ]
435
  },
436
  {
 
478
  },
479
  {
480
  "name": "mistralai/Mixtral-8x7B-Instruct-v0.1",
481
+ "transferTo": "mistralai/Mistral-Small-3.1-24B-Instruct-2503"
482
  },
483
  {
484
  "name": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
 
486
  },
487
  {
488
  "name": "mistralai/Mistral-7B-Instruct-v0.3",
489
+ "transferTo": "mistralai/Mistral-Small-3.1-24B-Instruct-2503"
490
  },
491
  {
492
  "name": "microsoft/Phi-3-mini-4k-instruct",
493
+ "transferTo": "microsoft/Phi-4"
494
  },
495
  {
496
  "name": "meta-llama/Meta-Llama-3.1-70B-Instruct",
 
499
  {
500
  "name": "Qwen/QwQ-32B-Preview",
501
  "transferTo": "Qwen/QwQ-32B"
502
+ },
503
+ {
504
+ "name": "mistralai/Mistral-Nemo-Instruct-2407",
505
+ "transferTo": "mistralai/Mistral-Small-3.1-24B-Instruct-2503"
506
+ },
507
+ {
508
+ "name": "microsoft/Phi-3.5-mini-instruct",
509
+ "transferTo": "microsoft/Phi-4"
510
  }
511
  ]
512
  PUBLIC_ORIGIN: "https://huggingface.co"