chipling committed on
Commit
ca228a3
·
verified ·
1 Parent(s): 14de79a

Create Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +29 -0
Dockerfile ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Base image: the slim variant of the Python 3.10 image, chosen to keep the image lightweight
2
+ FROM python:3.10-slim
3
+
4
+ # Work from /app; the relative paths used by the later COPY, RUN and CMD steps resolve against it
5
+ WORKDIR /app
6
+
7
+ # Install the C/C++ build toolchain, git and the OpenBLAS headers (presumably needed to compile the Python requirements - confirm); skip recommended extras and remove the apt lists in the same layer so neither ends up in the image
8
+ RUN apt-get update && apt-get install -y --no-install-recommends \
9
+ gcc g++ make cmake git libopenblas-dev \
10
+ && rm -rf /var/lib/apt/lists/*
11
+
12
+ # Copy only the dependency list first so the install layer below is rebuilt only when requirements.txt changes; --no-cache-dir keeps pip's download cache out of the image
13
+ COPY requirements.txt .
14
+ RUN pip install --no-cache-dir -r requirements.txt
15
+
16
+ # Download the GGUF model during the build so the Space starts faster; local_dir='.' places it in the working directory under the same file name that CMD passes to --model (assumes requirements.txt installs huggingface_hub - confirm)
17
+ RUN python3 -c "from huggingface_hub import hf_hub_download; hf_hub_download(repo_id='HauhauCS/Qwen3.5-4B-Uncensored-HauhauCS-Aggressive', filename='Qwen3.5-4B-Uncensored-HauhauCS-Aggressive-Q4_K_M.gguf', local_dir='.')"
18
+
19
+ # Document the standard HF Space port; EXPOSE is metadata only, the server is told to listen on it via --port in CMD
20
+ EXPOSE 7860
21
+
22
+ # Run the OpenAI-compatible llama_cpp server on the model file downloaded during the build (exec form, so no shell wrapper)
23
+ # Listen on host 0.0.0.0 and port 7860 for HF compatibility, matching the EXPOSE above; n_threads and n_ctx are fixed at 2 and 2048
24
+ CMD ["python3", "-m", "llama_cpp.server", \
25
+ "--model", "Qwen3.5-4B-Uncensored-HauhauCS-Aggressive-Q4_K_M.gguf", \
26
+ "--host", "0.0.0.0", \
27
+ "--port", "7860", \
28
+ "--n_threads", "2", \
29
+ "--n_ctx", "2048"]