Spaces:
Running
Running
Add high-rate-limit Silicon Flow models for free tier usage
Browse files- api/routes.py +13 -1
api/routes.py
CHANGED
|
@@ -45,13 +45,25 @@ REQUESTED_PROVIDER_MODELS = [
|
|
| 45 |
# qwen-3-235b-a22b-instruct-2507 exists but is rate-limited
|
| 46 |
# zai-glm-4.7 and gpt-oss-120b are not accessible with current key
|
| 47 |
"cerebras/llama3.1-8b",
|
| 48 |
-
# Silicon Flow models (
|
|
|
|
| 49 |
"silicon/Qwen/Qwen3.6-35B-A3B",
|
| 50 |
"silicon/Qwen/Qwen3.6-27B",
|
|
|
|
| 51 |
"silicon/Qwen/Qwen3.5-35B-A3B",
|
| 52 |
"silicon/Qwen/Qwen3.5-27B",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 53 |
"silicon/google/gemma-4-26B-A4B-it",
|
| 54 |
"silicon/google/gemma-4-31B-it",
|
|
|
|
| 55 |
# Groq models (ultra fast inference)
|
| 56 |
"groq/llama-3.3-70b-versatile",
|
| 57 |
"groq/llama-3.1-8b-instant",
|
|
|
|
| 45 |
# qwen-3-235b-a22b-instruct-2507 exists but is rate-limited
|
| 46 |
# zai-glm-4.7 and gpt-oss-120b are not accessible with current key
|
| 47 |
"cerebras/llama3.1-8b",
|
| 48 |
+
# Silicon Flow models (high rate limits, free tier)
|
| 49 |
+
# Qwen3.6 series - high speed multimodal
|
| 50 |
"silicon/Qwen/Qwen3.6-35B-A3B",
|
| 51 |
"silicon/Qwen/Qwen3.6-27B",
|
| 52 |
+
# Qwen3.5 and Qwen2.5 series - high throughput
|
| 53 |
"silicon/Qwen/Qwen3.5-35B-A3B",
|
| 54 |
"silicon/Qwen/Qwen3.5-27B",
|
| 55 |
+
"silicon/Qwen/Qwen2.5-7B-Instruct",
|
| 56 |
+
"silicon/Qwen/Qwen2.5-72B-Instruct",
|
| 57 |
+
# Qwen3 Coder - best for coding
|
| 58 |
+
"silicon/Qwen/Qwen3-Coder-32B-A3B-Instruct",
|
| 59 |
+
"silicon/Qwen/Qwen3-Coder-480B-A35B-Instruct",
|
| 60 |
+
# DeepSeek - extremely high throughput MoE
|
| 61 |
+
"silicon/deepseek-ai/DeepSeek-V4-Flash",
|
| 62 |
+
"silicon/deepseek-ai/DeepSeek-V3",
|
| 63 |
+
# Google Gemma - fast and capable
|
| 64 |
"silicon/google/gemma-4-26B-A4B-it",
|
| 65 |
"silicon/google/gemma-4-31B-it",
|
| 66 |
+
"silicon/google/gemma-3-27B-it",
|
| 67 |
# Groq models (ultra fast inference)
|
| 68 |
"groq/llama-3.3-70b-versatile",
|
| 69 |
"groq/llama-3.1-8b-instant",
|