Spaces:
Sleeping
Sleeping
Upload folder using huggingface_hub
Browse files
- inference.py +3 -3
- server/inference.py +1 -1
inference.py
CHANGED
|
@@ -43,7 +43,7 @@ from openai import OpenAI
|
|
| 43 |
|
| 44 |
IMAGE_NAME = os.getenv("IMAGE_NAME")
|
| 45 |
API_KEY = (
|
| 46 |
-
os.getenv("HF_TOKEN") or
|
| 47 |
os.getenv("OPENAI_API_KEY")
|
| 48 |
or os.getenv("API_KEY")
|
| 49 |
)
|
|
@@ -159,7 +159,7 @@ def start_container(image_name: str, port: int = 8000) -> Optional[str]:
|
|
| 159 |
try:
|
| 160 |
result = subprocess.run(
|
| 161 |
["docker", "run", "-d", "--rm", "-p", f"{port}:{port}", image_name],
|
| 162 |
-
capture_output=True, text=True, timeout=…
|
| 163 |
)
|
| 164 |
if result.returncode == 0:
|
| 165 |
cid = result.stdout.strip()
|
|
@@ -340,7 +340,7 @@ def main() -> None:
|
|
| 340 |
print("[DEBUG] Could not start container — assuming server already running.", flush=True)
|
| 341 |
|
| 342 |
# Wait for server to be ready
|
| 343 |
-
if not wait_for_server(BASE_URL, retries=…
|
| 344 |
print("ERROR: Server never became ready.", file=sys.stderr)
|
| 345 |
if container_id:
|
| 346 |
stop_container(container_id)
|
|
|
|
| 43 |
|
| 44 |
IMAGE_NAME = os.getenv("IMAGE_NAME")
|
| 45 |
API_KEY = (
|
| 46 |
+
# os.getenv("HF_TOKEN") or
|
| 47 |
os.getenv("OPENAI_API_KEY")
|
| 48 |
or os.getenv("API_KEY")
|
| 49 |
)
|
|
|
|
| 159 |
try:
|
| 160 |
result = subprocess.run(
|
| 161 |
["docker", "run", "-d", "--rm", "-p", f"{port}:{port}", image_name],
|
| 162 |
+
capture_output=True, text=True, timeout=120,
|
| 163 |
)
|
| 164 |
if result.returncode == 0:
|
| 165 |
cid = result.stdout.strip()
|
|
|
|
| 340 |
print("[DEBUG] Could not start container — assuming server already running.", flush=True)
|
| 341 |
|
| 342 |
# Wait for server to be ready
|
| 343 |
+
if not wait_for_server(BASE_URL, retries=40, delay=3.0):
|
| 344 |
print("ERROR: Server never became ready.", file=sys.stderr)
|
| 345 |
if container_id:
|
| 346 |
stop_container(container_id)
|
server/inference.py
CHANGED
|
@@ -22,7 +22,7 @@ except ImportError:
|
|
| 22 |
# ---------------------------------------------------------------------------
|
| 23 |
|
| 24 |
IMAGE_NAME = os.getenv("IMAGE_NAME")
|
| 25 |
-
API_KEY = …
|
| 26 |
API_BASE_URL = os.getenv("API_BASE_URL", "https://router.huggingface.co/v1")
|
| 27 |
MODEL_NAME = os.getenv("MODEL_NAME", "Qwen/Qwen2.5-72B-Instruct")
|
| 28 |
BASE_URL = os.getenv("ENV_BASE_URL", "http://localhost:8000")
|
|
|
|
| 22 |
# ---------------------------------------------------------------------------
|
| 23 |
|
| 24 |
IMAGE_NAME = os.getenv("IMAGE_NAME")
|
| 25 |
+
API_KEY = os.getenv("HF_TOKEN") or os.getenv("OPENAI_API_KEY")
|
| 26 |
API_BASE_URL = os.getenv("API_BASE_URL", "https://router.huggingface.co/v1")
|
| 27 |
MODEL_NAME = os.getenv("MODEL_NAME", "Qwen/Qwen2.5-72B-Instruct")
|
| 28 |
BASE_URL = os.getenv("ENV_BASE_URL", "http://localhost:8000")
|