Spaces:

Vishinka
/

Code_LLM

Sleeping

AnatoliiG committed on Jan 18

Commit

5c8b266

1 Parent(s): e5ebe08

fix docker + add check in app

Files changed (2) hide show

Dockerfile CHANGED Viewed

@@ -3,9 +3,8 @@ FROM python:3.10-slim-bookworm
 RUN apt-get update && apt-get install -y --no-install-recommends \
     build-essential \
     cmake \
-    libopenblas0 \
     libgomp1 \
-    git \
     curl \
     && rm -rf /var/lib/apt/lists/*
@@ -19,8 +18,8 @@ WORKDIR /app
 RUN pip install --no-cache-dir --upgrade pip
-RUN pip install --no-cache-dir \
-    https://github.com/abetlen/llama-cpp-python/releases/download/v0.2.90/llama_cpp_python-0.2.90-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
 COPY --chown=user requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt

 RUN apt-get update && apt-get install -y --no-install-recommends \
     build-essential \
     cmake \
+    libopenblas-dev \
     libgomp1 \
     curl \
     && rm -rf /var/lib/apt/lists/*
 RUN pip install --no-cache-dir --upgrade pip
+RUN pip install llama-cpp-python \
+    --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cpu
 COPY --chown=user requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt

app.py CHANGED Viewed

@@ -42,6 +42,9 @@ async def chat_completions(request: Request):
     temperature = data.get("temperature", 0.2)
     max_tokens = data.get("max_tokens", 2048)
     output = llm.create_chat_completion(
         messages=messages, max_tokens=max_tokens, temperature=temperature, stream=stream
     )

     temperature = data.get("temperature", 0.2)
     max_tokens = data.get("max_tokens", 2048)
+    if not messages:
+        return JSONResponse(content={"error": "No messages provided"}, status_code=400)
     output = llm.create_chat_completion(
         messages=messages, max_tokens=max_tokens, temperature=temperature, stream=stream
     )