Yash030 committed on
Commit
5bba595
·
1 Parent(s): c9c8b95

Keep only 5 best Silicon Flow models for free tier

Browse files
Files changed (1) hide show
  1. api/routes.py +9 -17
api/routes.py CHANGED
@@ -45,25 +45,17 @@ REQUESTED_PROVIDER_MODELS = [
45
  # qwen-3-235b-a22b-instruct-2507 exists but is rate-limited
46
  # zai-glm-4.7 and gpt-oss-120b are not accessible with current key
47
  "cerebras/llama3.1-8b",
48
- # Silicon Flow models (high rate limits, free tier)
49
- # Qwen3.6 series - high speed multimodal
 
 
 
 
50
  "silicon/Qwen/Qwen3.6-35B-A3B",
51
- "silicon/Qwen/Qwen3.6-27B",
52
- # Qwen3.5 series - high throughput
53
- "silicon/Qwen/Qwen3.5-35B-A3B",
54
- "silicon/Qwen/Qwen3.5-27B",
55
- "silicon/Qwen/Qwen2.5-7B-Instruct",
56
  "silicon/Qwen/Qwen2.5-72B-Instruct",
57
- # Qwen3 Coder - best for coding
58
- "silicon/Qwen/Qwen3-Coder-32B-A3B-Instruct",
59
- "silicon/Qwen/Qwen3-Coder-480B-A35B-Instruct",
60
- # DeepSeek - extremely high throughput MoE
61
- "silicon/deepseek-ai/DeepSeek-V4-Flash",
62
- "silicon/deepseek-ai/DeepSeek-V3",
63
- # Google Gemma - fast and capable
64
- "silicon/google/gemma-4-26B-A4B-it",
65
- "silicon/google/gemma-4-31B-it",
66
- "silicon/google/gemma-3-27B-it",
67
  # Groq models (ultra fast inference)
68
  "groq/llama-3.3-70b-versatile",
69
  "groq/llama-3.1-8b-instant",
 
45
  # qwen-3-235b-a22b-instruct-2507 exists but is rate-limited
46
  # zai-glm-4.7 and gpt-oss-120b are not accessible with current key
47
  "cerebras/llama3.1-8b",
48
+ # Silicon Flow models (top 5 for free tier)
49
+ # DeepSeek-V4-Flash - best overall coding, 1M context, MoE
50
+ "silicon/deepseek-ai/DeepSeek-V4-Flash",
51
+ # Qwen3-Coder-480B - repository-scale coding, 256K+ context
52
+ "silicon/Qwen/Qwen3-Coder-480B-A35B-Instruct",
53
+ # Qwen3.6-35B-A3B - multimodal, 262K context
54
  "silicon/Qwen/Qwen3.6-35B-A3B",
55
+ # Qwen2.5-72B - strong general purpose, 128K context
 
 
 
 
56
  "silicon/Qwen/Qwen2.5-72B-Instruct",
57
+ # QwQ-32B - best reasoning model
58
+ "silicon/Qwen/QwQ-32B",
 
 
 
 
 
 
 
 
59
  # Groq models (ultra fast inference)
60
  "groq/llama-3.3-70b-versatile",
61
  "groq/llama-3.1-8b-instant",