Subhadip007 committed on
Commit
f7e2e5e
·
1 Parent(s): 2798de4

fix: switch HF endpoint to universal router URL (auto-selects provider)

Browse files
Files changed (2) hide show
  1. Dockerfile +1 -1
  2. src/rag/llm_client.py +1 -1
Dockerfile CHANGED
@@ -15,7 +15,7 @@ RUN pip install --no-cache-dir -r requirements.txt
15
 
16
  # Cache-bust: forces Docker to re-copy source code on every build
17
  # This ensures HuggingFace always gets the latest code from git
18
- ARG CACHEBUST=20260414_3
19
 
20
  # Copy source code
21
  COPY src/ ./src/
 
15
 
16
  # Cache-bust: forces Docker to re-copy source code on every build
17
  # This ensures HuggingFace always gets the latest code from git
18
+ ARG CACHEBUST=20260414_4
19
 
20
  # Copy source code
21
  COPY src/ ./src/
src/rag/llm_client.py CHANGED
@@ -55,7 +55,7 @@ class MultiModelClient:
55
  if not self.hf_api_key:
56
  raise ValueError("HF_API_KEY not configured")
57
 
58
- url = f"https://router.huggingface.co/hf-inference/models/{model_id}/v1/chat/completions"
59
  headers = {
60
  "Authorization": f"Bearer {self.hf_api_key}",
61
  "Content-Type": "application/json"
 
55
  if not self.hf_api_key:
56
  raise ValueError("HF_API_KEY not configured")
57
 
58
+ url = "https://router.huggingface.co/v1/chat/completions"
59
  headers = {
60
  "Authorization": f"Bearer {self.hf_api_key}",
61
  "Content-Type": "application/json"