anycoder

Paused

AbuAlone09 committed 18 days ago

Commit

5a5470f

verified ·

1 Parent(s): 0b02baa

Update backend_models.py

Files changed (1) hide show

backend_models.py CHANGED Viewed

@@ -3,26 +3,21 @@ from openai import OpenAI
 def get_inference_client(model_id: str, provider: str = "auto"):
     """
-    Tự động phân biệt giữa model miễn phí và model trả phí.
     """
-    # Danh sách model miễn phí của Hugging Face
-    free_models = [
-        "meta-llama/Llama-3.1-8B-Instruct",
-        "google/gemma-2-9b-it",
-        "Qwen/Qwen2.5-7B-Instruct",
-        "mistralai/Mistral-7B-Instruct-v0.3"
-    ]
-    if model_id in free_models:
-        # Dùng endpoint miễn phí
-        return OpenAI(
-            base_url="https://api-inference.huggingface.co/v1/",
-            api_key=os.getenv("HF_TOKEN")
-        )
-    else:
-        # Nếu dùng model trả phí mà đã hết quota, ta trả về client rỗng hoặc báo lỗi
-        # để hệ thống không bị crash đột ngột
-        raise Exception(f"Model {model_id} yêu cầu trả phí (Out of credits). Hãy chọn các model Llama hoặc Gemma trong menu.")
 def get_real_model_id(model_id: str) -> str:
-    return model_id

 def get_inference_client(model_id: str, provider: str = "auto"):
     """
+    Ép hệ thống sử dụng endpoint miễn phí của Hugging Face
+    cho tất cả các model trong danh sách.
     """
+    # Xóa bỏ hoàn toàn header X-HF-Bill-To để tránh lỗi 402
+    return OpenAI(
+        base_url="https://api-inference.huggingface.co/v1/",
+        api_key=os.getenv("HF_TOKEN")
+    )
 def get_real_model_id(model_id: str) -> str:
+    # Trả về ID sạch, không có hậu tố :novita hay :cerebras
+    return model_id.split(":")[0]
+def is_native_sdk_model(model_id: str) -> bool:
+    return False
+def is_mistral_model(model_id: str) -> bool:
+    return "mistral" in model_id.lower()