Gaston895 committed on
Commit
e404c5a
·
verified ·
1 Parent(s): 5017f1d

Fix: Use only HuggingFace Inference API (no external API keys needed)

Browse files
Files changed (1) hide show
  1. app.py +7 -8
app.py CHANGED
@@ -37,11 +37,10 @@ GLOBAL_REGIONS = [
37
  # HuggingFace Token for all providers
38
  HF_TOKEN = os.getenv('HF_TOKEN', '')
39
 
40
- # Multiple API Providers for automatic failover when quotas are exhausted
41
- # All using HuggingFace Inference API with different model endpoints
42
  API_PROVIDERS = [
43
  {
44
- "name": "deepseek-primary",
45
  "base_url": "https://api-inference.huggingface.co/models/deepseek-ai/DeepSeek-V3.2-Exp",
46
  "headers": {
47
  "Authorization": f"Bearer {HF_TOKEN}",
@@ -51,14 +50,14 @@ API_PROVIDERS = [
51
  "model": "deepseek-ai/DeepSeek-V3.2-Exp"
52
  },
53
  {
54
- "name": "deepseek-secondary",
55
- "base_url": "https://api-inference.huggingface.co/models/deepseek-ai/deepseek-v3-base",
56
  "headers": {
57
  "Authorization": f"Bearer {HF_TOKEN}",
58
  "Content-Type": "application/json"
59
  },
60
  "provider": "hf_inference",
61
- "model": "deepseek-ai/deepseek-v3-base"
62
  },
63
  {
64
  "name": "deepseek-fallback",
@@ -136,8 +135,8 @@ def call_deepseek_api(messages: List[Dict], provider: Dict, max_retries: int = 3
136
  logger.warning(f"💸 Rate limit reached for {provider['name']}, switching to next provider...")
137
  return None
138
  elif response.status_code == 503:
139
- logger.warning(f"⏳ Model loading for {provider['name']}, retrying...")
140
- time.sleep(5)
141
  return None
142
  else:
143
  logger.warning(f"⚠️ API error from {provider['name']}: {response.status_code} - {response.text}")
 
37
  # HuggingFace Token for all providers
38
  HF_TOKEN = os.getenv('HF_TOKEN', '')
39
 
40
+ # HuggingFace Inference API using linked DeepSeek models
 
41
  API_PROVIDERS = [
42
  {
43
+ "name": "deepseek-v3.2-exp",
44
  "base_url": "https://api-inference.huggingface.co/models/deepseek-ai/DeepSeek-V3.2-Exp",
45
  "headers": {
46
  "Authorization": f"Bearer {HF_TOKEN}",
 
50
  "model": "deepseek-ai/DeepSeek-V3.2-Exp"
51
  },
52
  {
53
+ "name": "deepseek-v3-base",
54
+ "base_url": "https://api-inference.huggingface.co/models/deepseek-ai/DeepSeek-V3-Base",
55
  "headers": {
56
  "Authorization": f"Bearer {HF_TOKEN}",
57
  "Content-Type": "application/json"
58
  },
59
  "provider": "hf_inference",
60
+ "model": "deepseek-ai/DeepSeek-V3-Base"
61
  },
62
  {
63
  "name": "deepseek-fallback",
 
135
  logger.warning(f"💸 Rate limit reached for {provider['name']}, switching to next provider...")
136
  return None
137
  elif response.status_code == 503:
138
+ logger.warning(f"⏳ Model loading for {provider['name']}, waiting 15 seconds...")
139
+ time.sleep(15) # Wait longer for model to load
140
  return None
141
  else:
142
  logger.warning(f"⚠️ API error from {provider['name']}: {response.status_code} - {response.text}")