Spaces:

Yash030
/

claude-code-proxy

Running

Yash030 committed 4 days ago

Commit

c9c8b95

1 Parent(s): c66ebaa

Add high-rate-limit Silicon Flow models for free tier usage

Files changed (1) hide show

api/routes.py CHANGED Viewed

@@ -45,13 +45,25 @@ REQUESTED_PROVIDER_MODELS = [
     # qwen-3-235b-a22b-instruct-2507 exists but is rate-limited
     # zai-glm-4.7 and gpt-oss-120b are not accessible with current key
     "cerebras/llama3.1-8b",
-    # Silicon Flow models (uses bare model IDs on the API)
     "silicon/Qwen/Qwen3.6-35B-A3B",
     "silicon/Qwen/Qwen3.6-27B",
     "silicon/Qwen/Qwen3.5-35B-A3B",
     "silicon/Qwen/Qwen3.5-27B",
     "silicon/google/gemma-4-26B-A4B-it",
     "silicon/google/gemma-4-31B-it",
     # Groq models (ultra fast inference)
     "groq/llama-3.3-70b-versatile",
     "groq/llama-3.1-8b-instant",

     # qwen-3-235b-a22b-instruct-2507 exists but is rate-limited
     # zai-glm-4.7 and gpt-oss-120b are not accessible with current key
     "cerebras/llama3.1-8b",
+    # Silicon Flow models (high rate limits, free tier)
+    # Qwen3.6 series - high speed multimodal
     "silicon/Qwen/Qwen3.6-35B-A3B",
     "silicon/Qwen/Qwen3.6-27B",
+    # Qwen3.5 series - high throughput
     "silicon/Qwen/Qwen3.5-35B-A3B",
     "silicon/Qwen/Qwen3.5-27B",
+    "silicon/Qwen/Qwen2.5-7B-Instruct",
+    "silicon/Qwen/Qwen2.5-72B-Instruct",
+    # Qwen3 Coder - best for coding
+    "silicon/Qwen/Qwen3-Coder-32B-A3B-Instruct",
+    "silicon/Qwen/Qwen3-Coder-480B-A35B-Instruct",
+    # DeepSeek - extremely high throughput MoE
+    "silicon/deepseek-ai/DeepSeek-V4-Flash",
+    "silicon/deepseek-ai/DeepSeek-V3",
+    # Google Gemma - fast and capable
     "silicon/google/gemma-4-26B-A4B-it",
     "silicon/google/gemma-4-31B-it",
+    "silicon/google/gemma-3-27B-it",
     # Groq models (ultra fast inference)
     "groq/llama-3.3-70b-versatile",
     "groq/llama-3.1-8b-instant",