Yash030 committed on
Commit
c9c8b95
·
1 Parent(s): c66ebaa

Add high-rate-limit Silicon Flow models for free tier usage

Browse files
Files changed (1) hide show
  1. api/routes.py +13 -1
api/routes.py CHANGED
@@ -45,13 +45,25 @@ REQUESTED_PROVIDER_MODELS = [
45
  # qwen-3-235b-a22b-instruct-2507 exists but is rate-limited
46
  # zai-glm-4.7 and gpt-oss-120b are not accessible with current key
47
  "cerebras/llama3.1-8b",
48
- # Silicon Flow models (uses bare model IDs on the API)
 
49
  "silicon/Qwen/Qwen3.6-35B-A3B",
50
  "silicon/Qwen/Qwen3.6-27B",
 
51
  "silicon/Qwen/Qwen3.5-35B-A3B",
52
  "silicon/Qwen/Qwen3.5-27B",
 
 
 
 
 
 
 
 
 
53
  "silicon/google/gemma-4-26B-A4B-it",
54
  "silicon/google/gemma-4-31B-it",
 
55
  # Groq models (ultra fast inference)
56
  "groq/llama-3.3-70b-versatile",
57
  "groq/llama-3.1-8b-instant",
 
45
  # qwen-3-235b-a22b-instruct-2507 exists but is rate-limited
46
  # zai-glm-4.7 and gpt-oss-120b are not accessible with current key
47
  "cerebras/llama3.1-8b",
48
+ # Silicon Flow models (high rate limits, free tier)
49
+ # Qwen3.6 series - high speed multimodal
50
  "silicon/Qwen/Qwen3.6-35B-A3B",
51
  "silicon/Qwen/Qwen3.6-27B",
52
+ # Qwen3.5 and Qwen2.5 series - high throughput
53
  "silicon/Qwen/Qwen3.5-35B-A3B",
54
  "silicon/Qwen/Qwen3.5-27B",
55
+ "silicon/Qwen/Qwen2.5-7B-Instruct",
56
+ "silicon/Qwen/Qwen2.5-72B-Instruct",
57
+ # Qwen3 Coder - best for coding
58
+ "silicon/Qwen/Qwen3-Coder-32B-A3B-Instruct",
59
+ "silicon/Qwen/Qwen3-Coder-480B-A35B-Instruct",
60
+ # DeepSeek - extremely high throughput MoE
61
+ "silicon/deepseek-ai/DeepSeek-V4-Flash",
62
+ "silicon/deepseek-ai/DeepSeek-V3",
63
+ # Google Gemma - fast and capable
64
  "silicon/google/gemma-4-26B-A4B-it",
65
  "silicon/google/gemma-4-31B-it",
66
+ "silicon/google/gemma-3-27B-it",
67
  # Groq models (ultra fast inference)
68
  "groq/llama-3.3-70b-versatile",
69
  "groq/llama-3.1-8b-instant",