Revanth-ml committed on
Commit
3be06e2
·
verified ·
1 Parent(s): d0bdb29

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. inference.py +3 -3
  2. server/inference.py +1 -1
inference.py CHANGED
@@ -43,7 +43,7 @@ from openai import OpenAI
43
 
44
  IMAGE_NAME = os.getenv("IMAGE_NAME")
45
  API_KEY = (
46
- os.getenv("HF_TOKEN") or
47
  os.getenv("OPENAI_API_KEY")
48
  or os.getenv("API_KEY")
49
  )
@@ -159,7 +159,7 @@ def start_container(image_name: str, port: int = 8000) -> Optional[str]:
159
  try:
160
  result = subprocess.run(
161
  ["docker", "run", "-d", "--rm", "-p", f"{port}:{port}", image_name],
162
- capture_output=True, text=True, timeout=30,
163
  )
164
  if result.returncode == 0:
165
  cid = result.stdout.strip()
@@ -340,7 +340,7 @@ def main() -> None:
340
  print("[DEBUG] Could not start container — assuming server already running.", flush=True)
341
 
342
  # Wait for server to be ready
343
- if not wait_for_server(BASE_URL, retries=20, delay=3.0):
344
  print("ERROR: Server never became ready.", file=sys.stderr)
345
  if container_id:
346
  stop_container(container_id)
 
43
 
44
  IMAGE_NAME = os.getenv("IMAGE_NAME")
45
  API_KEY = (
46
+ # os.getenv("HF_TOKEN") or
47
  os.getenv("OPENAI_API_KEY")
48
  or os.getenv("API_KEY")
49
  )
 
159
  try:
160
  result = subprocess.run(
161
  ["docker", "run", "-d", "--rm", "-p", f"{port}:{port}", image_name],
162
+ capture_output=True, text=True, timeout=120,
163
  )
164
  if result.returncode == 0:
165
  cid = result.stdout.strip()
 
340
  print("[DEBUG] Could not start container — assuming server already running.", flush=True)
341
 
342
  # Wait for server to be ready
343
+ if not wait_for_server(BASE_URL, retries=40, delay=3.0):
344
  print("ERROR: Server never became ready.", file=sys.stderr)
345
  if container_id:
346
  stop_container(container_id)
server/inference.py CHANGED
@@ -22,7 +22,7 @@ except ImportError:
22
  # ---------------------------------------------------------------------------
23
 
24
  IMAGE_NAME = os.getenv("IMAGE_NAME")
25
- API_KEY = os.getenv("OPENAI_API_KEY")
26
  API_BASE_URL = os.getenv("API_BASE_URL", "https://router.huggingface.co/v1")
27
  MODEL_NAME = os.getenv("MODEL_NAME", "Qwen/Qwen2.5-72B-Instruct")
28
  BASE_URL = os.getenv("ENV_BASE_URL", "http://localhost:8000")
 
22
  # ---------------------------------------------------------------------------
23
 
24
  IMAGE_NAME = os.getenv("IMAGE_NAME")
25
+ API_KEY = os.getenv("HF_TOKEN") or os.getenv("OPENAI_API_KEY")
26
  API_BASE_URL = os.getenv("API_BASE_URL", "https://router.huggingface.co/v1")
27
  MODEL_NAME = os.getenv("MODEL_NAME", "Qwen/Qwen2.5-72B-Instruct")
28
  BASE_URL = os.getenv("ENV_BASE_URL", "http://localhost:8000")