havinashpatil committed
Commit a8bc575 · 1 Parent(s): 434afdf

Fix TGI endpoint plumbing and use full TGI runtime image in Dockerfile

Files changed (2)
  1. Dockerfile +4 -14
  2. server/ai_fixer.py +7 -7
Dockerfile CHANGED
@@ -9,19 +9,8 @@ RUN npm install
 COPY frontend/ ./
 RUN npm run build
 
-# TGI stage for LLM serving
-FROM ghcr.io/huggingface/text-generation-inference:3.0.2 AS tgi-builder
-
-# Main stage: Python app with TGI
-FROM python:3.10-slim
-
-# Install TGI runtime dependencies
-RUN apt-get update && apt-get install -y --no-install-recommends \
-    ca-certificates \
-    && rm -rf /var/lib/apt/lists/*
-
-# Copy TGI binary from builder
-COPY --from=tgi-builder /usr/local/bin/text-generation-inference /usr/local/bin/
+# Main stage: Python app with TGI runtime
+FROM ghcr.io/huggingface/text-generation-inference:3.0.2
 
 WORKDIR /app
 
@@ -39,8 +28,9 @@ RUN mkdir -p /data && chmod 777 /data
 RUN mkdir -p /.cache && chmod 777 /.cache
 RUN mkdir -p /.triton && chmod 777 /.triton
 
-# Required for HF Spaces: Expose default port 7860 for FastAPI
+# Required for HF Spaces: Expose default ports for FastAPI and TGI
 EXPOSE 7860
+EXPOSE 8080
 
 # Start both FastAPI server and TGI in background
 CMD ["sh", "-c", "text-generation-inference --model-id TinyLlama/TinyLlama-1.1B-Chat-v1.0 --port 8080 --hostname 0.0.0.0 & uvicorn server.app:app --host 0.0.0.0 --port 7860"]
server/ai_fixer.py CHANGED
@@ -23,20 +23,20 @@ from server.memory import store_success, retrieve_memory, log_complexity_reward
 TGI_BASE_URL = os.environ.get("TGI_BASE_URL", "http://localhost:8080")
 TGI_AVAILABLE = False
 
-def check_tgi_availability():
+def check_tgi_availability(tgi_url: str = TGI_BASE_URL) -> bool:
     """Check if TGI server is available."""
     global TGI_AVAILABLE
     try:
-        response = httpx.get(f"{TGI_BASE_URL}/health", timeout=5.0)
+        response = httpx.get(f"{tgi_url}/health", timeout=5.0)
         TGI_AVAILABLE = response.status_code == 200
-    except:
+    except Exception:
         TGI_AVAILABLE = False
     return TGI_AVAILABLE
 
 
-def fix_with_tgi(code: str) -> Optional[str]:
+def fix_with_tgi(code: str, tgi_url: str = TGI_BASE_URL) -> Optional[str]:
     """Use TGI for advanced code fixing."""
-    if not TGI_AVAILABLE and not check_tgi_availability():
+    if not TGI_AVAILABLE and not check_tgi_availability(tgi_url):
         return None
 
     prompt = f"""You are an expert competitive programmer.
@@ -54,7 +54,7 @@ Return ONLY the corrected code without any explanation:
 
     try:
         response = httpx.post(
-            f"{TGI_BASE_URL}/v1/chat/completions",
+            f"{tgi_url}/v1/chat/completions",
             json={
                 "model": "tgi",
                 "messages": [{"role": "user", "content": prompt}],
@@ -479,7 +479,7 @@ def generate_fix(
     Returns: { fixed_code, method, success, explanation }
     """
     if use_tgi:
-        fixed_code = fix_with_tgi(code)
+        fixed_code = fix_with_tgi(code, tgi_url=tgi_url)
         if fixed_code:
             # Log complexity vs reward for research tracking
             complexity = detect_complexity(fixed_code)
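With `tgi_url` now threaded from `generate_fix` down to the HTTP calls, callers and tests can target a non-default TGI endpoint without mutating the `TGI_BASE_URL` environment variable. A minimal usage sketch, assuming the imports shown (the remote host name and sample snippet are placeholders):

```python
from server.ai_fixer import check_tgi_availability, fix_with_tgi

# Placeholder endpoint; swap in a real TGI host. Not part of this commit.
remote = "http://remote-tgi:8080"

buggy = "def div(a, b):\n    return a / b  # crashes when b == 0"

if check_tgi_availability(remote):
    fixed = fix_with_tgi(buggy, tgi_url=remote)
    print(fixed if fixed else "TGI returned no fix")
else:
    print("TGI unreachable; relying on heuristic fixes")
```

The switch from a bare `except:` to `except Exception:` in the availability check is also meaningful: the bare form would swallow `KeyboardInterrupt` and `SystemExit`, while the new form only catches ordinary errors such as connection failures.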