anycoder

Paused

AbuAlone09 committed on 18 days ago

Commit

0b02baa

verified ·

1 Parent(s): af9599c

Update backend_models.py

Files changed (1) hide show

backend_models.py CHANGED Viewed

@@ -1,31 +1,28 @@
-"""
-Standalone model inference - Optimized for Free Tier (Serverless Inference API)
-"""
 import os
 from openai import OpenAI
 def get_inference_client(model_id: str, provider: str = "auto"):
     """
-    Sử dụng Serverless Inference API miễn phí của Hugging Face.
-    Không còn tham số trả phí (X-HF-Bill-To).
     """
-    # Sử dụng base_url mặc định của Hugging Face Inference API cho các model phổ biến
-    return OpenAI(
-        base_url="https://api-inference.huggingface.co/v1/",
-        api_key=os.getenv("HF_TOKEN")
-    )
 def get_real_model_id(model_id: str) -> str:
-    """
-    Trả về ID model gốc, bỏ qua các hậu tố trả phí (novita, cerebras).
-    """
-    # Loại bỏ hậu tố provider nếu có (ví dụ: model:provider -> model)
-    if ":" in model_id:
-        return model_id.split(":")[0]
     return model_id
-def is_native_sdk_model(model_id: str) -> bool:
-    return False
-def is_mistral_model(model_id: str) -> bool:
-    return "mistral" in model_id.lower()

 import os
 from openai import OpenAI
 def get_inference_client(model_id: str, provider: str = "auto"):
     """
+    Tự động phân biệt giữa model miễn phí và model trả phí.
     """
+    # Danh sách model miễn phí của Hugging Face
+    free_models = [
+        "meta-llama/Llama-3.1-8B-Instruct",
+        "google/gemma-2-9b-it",
+        "Qwen/Qwen2.5-7B-Instruct",
+        "mistralai/Mistral-7B-Instruct-v0.3"
+    ]
+    if model_id in free_models:
+        # Dùng endpoint miễn phí
+        return OpenAI(
+            base_url="https://api-inference.huggingface.co/v1/",
+            api_key=os.getenv("HF_TOKEN")
+        )
+    else:
+        # Nếu dùng model trả phí mà đã hết quota, ta trả về client rỗng hoặc báo lỗi
+        # để hệ thống không bị crash đột ngột
+        raise Exception(f"Model {model_id} yêu cầu trả phí (Out of credits). Hãy chọn các model Llama hoặc Gemma trong menu.")
 def get_real_model_id(model_id: str) -> str:
     return model_id