SeaWolf-AI committed on
Commit
7255ef6
·
verified ·
1 Parent(s): e4bf98e

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +7 -14
Dockerfile CHANGED
@@ -1,28 +1,21 @@
# Previous revision of the Dockerfile (the "-" side of commit 7255ef6),
# with the pip requirement specifiers quoted.
FROM nvidia/cuda:12.4.1-runtime-ubuntu22.04

ENV DEBIAN_FRONTEND=noninteractive
ENV PYTHONUNBUFFERED=1

# System deps: Python 3.11 plus pip and curl; python3/python are re-pointed
# at python3.11, and the apt lists are removed in the same layer.
RUN apt-get update && apt-get install -y --no-install-recommends \
        curl \
        python3-pip \
        python3.11 \
        python3.11-venv && \
    ln -sf /usr/bin/python3.11 /usr/bin/python3 && \
    ln -sf /usr/bin/python3.11 /usr/bin/python && \
    apt-get clean && rm -rf /var/lib/apt/lists/*

# Python packages — vLLM + TriAttention + FastAPI
# Requirements with a version specifier or an extras marker are quoted:
# unquoted, the shell treats `>=0.15.0` as an output redirection to a file
# named `=0.15.0` (so pip never sees the constraint) and `[vllm]` as a glob.
RUN pip install --no-cache-dir --upgrade pip && \
    pip install --no-cache-dir \
        "vllm>=0.15.0" \
        "aither-kvcache[vllm]>=2.0.0" \
        "gradio>=5.0" \
        fastapi \
        uvicorn \
        openai \
        httpx \
        requests \
        PyMuPDF \
        huggingface_hub

WORKDIR /app
COPY . /app
 
# Updated revision of the Dockerfile (the "+" side of commit 7255ef6).

# Tag of the vllm/vllm-openai base image. Defaults to the moving `latest`
# tag used by the commit; pass `--build-arg VLLM_IMAGE_TAG=<release>` to pin
# a specific release for reproducible builds.
ARG VLLM_IMAGE_TAG=latest
FROM vllm/vllm-openai:${VLLM_IMAGE_TAG}

ENV DEBIAN_FRONTEND=noninteractive
ENV PYTHONUNBUFFERED=1

# Gemma 4 requires transformers 5.5.0+
# Every requirement that carries a version specifier is quoted: unquoted,
# the shell parses `>=5.0` as an output redirection to a file named `=5.0`
# and pip never sees the constraint.
RUN pip install --no-cache-dir --upgrade pip && \
    pip install --no-cache-dir \
        fastapi \
        "gradio>=5.0" \
        httpx \
        PyMuPDF \
        requests \
        "transformers>=5.5.0" \
        uvicorn

# TriAttention (optional): the build continues if the package cannot be
# installed, but the failure is reported on stderr instead of being hidden.
RUN pip install --no-cache-dir aither-kvcache || \
    echo "WARNING: aither-kvcache could not be installed; continuing without it" >&2

WORKDIR /app
COPY . /app