Spaces:

Bleak
/

Qwen3-API

Runtime error

App Files Files Community

Bleak committed on Nov 2, 2025

Commit

9df9f40

verified ·

1 Parent(s): a5a3a6c

Update Dockerfile

Browse files

Files changed (1) hide show

Dockerfile +56 -56

Dockerfile CHANGED Viewed

@@ -1,57 +1,57 @@
-#Ollama-API By BleakPrestiger
-# Builder stage
-FROM ubuntu:latest
-WORKDIR /app
-COPY ..
-# In your Dockerfile
-RUN pip install huggingface_hub
-# Download the model during the build process
-RUN python -c "from huggingface_hub import hf_hub_download; hf_hub_download(repo_id='Qwen/Qwen3-1.7B-GGUF', filename='Qwen3-1.7B-Q8_0.gguf', local_dir='./')"
-# Update packages and install curl and gnupg
-RUN apt-get update && apt-get upgrade -y && apt-get install -y \
-    curl \
-    wget \
-    gnupg
-RUN cd llama-b6795-bin-ubuntu-x64/build/bin && chmod +x ./llama-server && ./llama-server --model Qwen3-1.7B-Q8_0.gguf --ctx-size-draft 32767 --ctx-size 32767 --temp 1.0 --top-k 64 --top-k 0.95 --min-p 0.0 --log-file llama.log &
-# Copy the entry point script
-#COPY entrypoint.sh /entrypoint.sh
-RUN chmod +x /entrypoint.sh
-# Set the entry point script as the default command
-ENTRYPOINT ["/entrypoint.sh"]
-#CMD ["ollama", "serve"]
-# Expose the server port
-EXPOSE 7860
-# Add NVIDIA package repositories
-#RUN curl -fsSL https://nvidia.github.io/libnvidia-container/gpgkey | gpg --dearmor -o /usr/share/keyrings/nvidia-container-toolkit-keyring.gpg \
-    #&& echo "deb [signed-by=/usr/share/keyrings/nvidia-container-toolkit-keyring.gpg] https://nvidia.github.io/libnvidia-container/stable/deb/ $(. /etc/os-release; echo $UBUNTU_CODENAME) main" > /etc/apt/sources.list.d/nvidia-container-toolkit.list
-# Install NVIDIA container toolkit (Check for any updated methods or URLs for Ubuntu jammy)
-#RUN apt-get update && apt-get install -y nvidia-container-toolkit || true
-# Install application
-#RUN curl https://ollama.ai/install.sh | sh
-# Below is to fix embedding bug as per
-# RUN curl -fsSL https://ollama.com/install.sh | sed 's#https://ollama.com/download#https://github.com/jmorganca/ollama/releases/download/v0.1.29#' | sh
-# Create the directory and give appropriate permissions
-#RUN mkdir -p /.ollama && chmod 777 /.ollama
-#WORKDIR /.ollama
-# Set the entry point script as the default command
-#ENTRYPOINT ["/entrypoint.sh"]
-#CMD ["ollama", "serve"]
-# Set the model as an environment variable (this can be overridden)
 #ENV model=${model}

+#Ollama-API By BleakPrestiger
+# Single-stage image: serves the Qwen3-1.7B GGUF model with llama.cpp's llama-server on port 7860.
+# Pinned release instead of :latest so rebuilds are reproducible.
+FROM ubuntu:24.04
+# OS packages come first: Python must exist before any pip/python step can run.
+# libgomp1 is presumably required by the prebuilt llama.cpp binaries (OpenMP) - TODO confirm with ldd.
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    ca-certificates \
+    curl \
+    gnupg \
+    libgomp1 \
+    python3 \
+    python3-venv \
+    wget \
+    && rm -rf /var/lib/apt/lists/*
+# Install huggingface_hub into a virtualenv; recent Ubuntu releases reject system-wide pip installs (PEP 668).
+RUN python3 -m venv /opt/venv && /opt/venv/bin/pip install --no-cache-dir huggingface_hub
+WORKDIR /app
+# Download the model during the build, before the sources are copied, so source edits do not re-download it.
+RUN /opt/venv/bin/python -c "from huggingface_hub import hf_hub_download; hf_hub_download(repo_id='Qwen/Qwen3-1.7B-GGUF', filename='Qwen3-1.7B-Q8_0.gguf', local_dir='./')"
+# Copy the build context into /app; it is expected to contain llama-b6795-bin-ubuntu-x64/.
+COPY . .
+RUN chmod +x /app/llama-b6795-bin-ubuntu-x64/build/bin/llama-server
+# Expose the server port
+EXPOSE 7860
+# Run unprivileged; UID 1000 is the UID Hugging Face Spaces documents for Docker Spaces containers.
+USER 1000
+# Start the server when the container starts: a process backgrounded in a RUN step only lives for that build step.
+ENTRYPOINT ["/app/llama-b6795-bin-ubuntu-x64/build/bin/llama-server"]
+# Default arguments (override at `docker run`):
+#  - the model path is absolute because the model is downloaded into /app, not the bin directory
+#  - --top-p 0.95 replaces the duplicated "--top-k 0.95"
+#  - --host/--port bind the server to the exposed port
+#  - the log goes to /tmp because /app is root-owned and the process runs as UID 1000
+CMD ["--model", "/app/Qwen3-1.7B-Q8_0.gguf", "--ctx-size-draft", "32767", "--ctx-size", "32767", "--temp", "1.0", "--top-k", "64", "--top-p", "0.95", "--min-p", "0.0", "--log-file", "/tmp/llama.log", "--host", "0.0.0.0", "--port", "7860"]
+# Add NVIDIA package repositories
+#RUN curl -fsSL https://nvidia.github.io/libnvidia-container/gpgkey | gpg --dearmor -o /usr/share/keyrings/nvidia-container-toolkit-keyring.gpg \
+    #&& echo "deb [signed-by=/usr/share/keyrings/nvidia-container-toolkit-keyring.gpg] https://nvidia.github.io/libnvidia-container/stable/deb/ $(. /etc/os-release; echo $UBUNTU_CODENAME) main" > /etc/apt/sources.list.d/nvidia-container-toolkit.list
+# Install NVIDIA container toolkit (Check for any updated methods or URLs for Ubuntu jammy)
+#RUN apt-get update && apt-get install -y nvidia-container-toolkit || true
+# Install application
+#RUN curl https://ollama.ai/install.sh | sh
+# Below is a workaround for an embedding bug: it rewrites the installer's download URL to the v0.1.29 GitHub release
+# RUN curl -fsSL https://ollama.com/install.sh | sed 's#https://ollama.com/download#https://github.com/jmorganca/ollama/releases/download/v0.1.29#' | sh
+# Create the directory and give appropriate permissions
+#RUN mkdir -p /.ollama && chmod 777 /.ollama
+#WORKDIR /.ollama
+# Set the entry point script as the default command
+#ENTRYPOINT ["/entrypoint.sh"]
+#CMD ["ollama", "serve"]
+# Set the model as an environment variable (this can be overridden)
 #ENV model=${model}