nsarrazin committed on
Commit
e390fd0
·
unverified ·
1 Parent(s): 0f74344

feat: new model 29-04-25 (#1808)

Browse files
Files changed (1) hide show
  1. chart/env/prod.yaml +37 -0
chart/env/prod.yaml CHANGED
@@ -75,6 +75,43 @@ envVars:
75
  }
76
  ]
77
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
78
  {
79
  "name": "Qwen/Qwen2.5-72B-Instruct",
80
  "description": "The latest Qwen open model with improved role-playing, long text generation and structured data understanding.",
 
75
  }
76
  ]
77
  },
78
+ {
79
+ "name": "Qwen/Qwen3-235B-A22B",
80
+ "description": "Qwen's flagship model featuring optional reasoning. Exceptional performance with benchmarks rivaling R1 and o1.",
81
+ "modelUrl": "https://huggingface.co/Qwen/Qwen3-235B-A22B",
82
+ "websiteUrl": "https://qwenlm.github.io/blog/qwen3/",
83
+ "logoUrl": "https://huggingface.co/datasets/huggingchat/models-logo/resolve/main/qwen-logo.png",
84
+ "preprompt": "You are Qwen, created by Alibaba Cloud. You are a helpful assistant.",
85
+ "reasoning": {
86
+ "type": "tokens",
87
+ "beginToken": "<think>",
88
+ "endToken": "</think>"
89
+ },
90
+ "parameters": {
91
+ "stop": ["<|endoftext|>", "<|im_end|>"],
92
+ "temperature": 0.6,
93
+ },
94
+ "promptExamples": [
95
+ {
96
+ "title": "Write an email",
97
+ "prompt": "As a restaurant owner, write a professional email to the supplier to get these products every week: \n\n- Wine (x10)\n- Eggs (x24)\n- Bread (x12) /no_think"
98
+ },
99
+ {
100
+ "title": "Build a website",
101
+ "prompt": "Generate a snazzy static landing page for a local coffee shop using HTML and CSS. You can use tailwind using <script src='https://cdn.tailwindcss.com'></script>."
102
+ },
103
+ {
104
+ "title": "Larger number",
105
+ "prompt": "9.11 or 9.9 which number is larger?"
106
+ },
107
+ ],
108
+ "endpoints": [
109
+ {
110
+ "type": "openai",
111
+ "baseURL": "https://internal.api-inference.huggingface.co/models/Qwen/Qwen3-235B-A22B/v1"
112
+ }
113
+ ]
114
+ },
115
  {
116
  "name": "Qwen/Qwen2.5-72B-Instruct",
117
  "description": "The latest Qwen open model with improved role-playing, long text generation and structured data understanding.",