Spaces:
Running
Running
github-actions[bot] committed on
Commit ·
c062993
1
Parent(s): 174b574
🚀 Auto-deploy backend from GitHub (a19161d)
Browse files
services/inference_client.py
CHANGED
|
@@ -177,7 +177,7 @@ def _resolve_key(key: str) -> str:
|
|
| 177 |
|
| 178 |
def get_model_for_task(task_type: str) -> str:
|
| 179 |
task = (task_type or "default").strip().lower()
|
| 180 |
-
enforce_lock = os.getenv("INFERENCE_ENFORCE_LOCK_MODEL", "
|
| 181 |
if enforce_lock:
|
| 182 |
override = (
|
| 183 |
_RUNTIME_OVERRIDES.get("INFERENCE_LOCK_MODEL_ID")
|
|
@@ -281,7 +281,7 @@ class InferenceClient:
|
|
| 281 |
)
|
| 282 |
self.local_generate_path = os.getenv("INFERENCE_LOCAL_SPACE_GENERATE_PATH", "/gradio_api/call/generate")
|
| 283 |
|
| 284 |
-
self.enforce_lock_model = os.getenv("INFERENCE_ENFORCE_LOCK_MODEL", "
|
| 285 |
self.lock_model_id = os.getenv("INFERENCE_LOCK_MODEL_ID", CHAT_MODEL).strip() or CHAT_MODEL
|
| 286 |
|
| 287 |
default_model_fallback = str(primary.get("id") or CHAT_MODEL)
|
|
|
|
| 177 |
|
| 178 |
def get_model_for_task(task_type: str) -> str:
|
| 179 |
task = (task_type or "default").strip().lower()
|
| 180 |
+
enforce_lock = os.getenv("INFERENCE_ENFORCE_LOCK_MODEL", "false").strip().lower() in {"1", "true", "yes", "on"}
|
| 181 |
if enforce_lock:
|
| 182 |
override = (
|
| 183 |
_RUNTIME_OVERRIDES.get("INFERENCE_LOCK_MODEL_ID")
|
|
|
|
| 281 |
)
|
| 282 |
self.local_generate_path = os.getenv("INFERENCE_LOCAL_SPACE_GENERATE_PATH", "/gradio_api/call/generate")
|
| 283 |
|
| 284 |
+
self.enforce_lock_model = os.getenv("INFERENCE_ENFORCE_LOCK_MODEL", "false").strip().lower() in {"1", "true", "yes", "on"}
|
| 285 |
self.lock_model_id = os.getenv("INFERENCE_LOCK_MODEL_ID", CHAT_MODEL).strip() or CHAT_MODEL
|
| 286 |
|
| 287 |
default_model_fallback = str(primary.get("id") or CHAT_MODEL)
|