File size: 740 Bytes
b8efa34
 
ca228a3
b8efa34
 
 
 
 
2b1604a
b8efa34
eb12c5f
 
ca228a3
b8efa34
 
8d4f925
b8efa34
ca228a3
 
b8efa34
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
# Serve a GGUF model with the llama.cpp HTTP server from a compact pre-built image.
# The image tag is a build argument so a build can be pinned to a specific
# release for reproducibility, e.g. `--build-arg LLAMA_SERVER_TAG=<tag>`.
# It defaults to "latest", which keeps the previous behaviour but means the
# base image may change between builds.
ARG LLAMA_SERVER_TAG=latest
FROM samueltallet/alpine-llama-cpp-server:${LLAMA_SERVER_TAG}

# Hugging Face free-tier settings: listen on all interfaces on port 7860,
# with 2 threads and a context size of 4096.
ENV LLAMA_ARG_HOST=0.0.0.0 \
    LLAMA_ARG_PORT=7860 \
    LLAMA_ARG_THREADS=2 \
    LLAMA_ARG_CTX_SIZE=4096

# Qwen 3.5 model to download and run: the Hugging Face repository and the
# GGUF file inside it.
ENV LLAMA_ARG_HF_REPO=amkkk/Qwen3.5-0.8B-quantized_uncensored_finetuned \
    LLAMA_ARG_HF_FILE=qwen3.5-0.8b-finetuned-ablated-e2-ablation020.Q4_K_M.gguf

# Optional: require an API key for requests to the server by setting
# LLAMA_API_KEY. Do not hard-code the key in this file: values set with ENV
# are stored in the image and visible to anyone who can pull or inspect it.
# Provide it at runtime instead (for example as a Space secret, or with
# `docker run -e LLAMA_API_KEY=...`).

# Document the port the server listens on; keep it in sync with LLAMA_ARG_PORT.
# EXPOSE does not publish the port by itself.
EXPOSE 7860

# No CMD or ENTRYPOINT here: this file relies on the base image's own
# entrypoint to download the model and start the server.