Spaces:
Sleeping
Sleeping
Emmanuel Durand committed on
Commit ·
94116e7
1
Parent(s): 15ed30c
Test now with llama.cpp
Browse files
- .gitignore +1 -0
- Dockerfile +5 -6
- README.md +1 -0
.gitignore
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
*.swp
|
Dockerfile
CHANGED
|
@@ -1,13 +1,12 @@
|
|
| 1 |
FROM nvidia/cuda:12.9.0-cudnn-devel-ubuntu24.04
|
| 2 |
|
| 3 |
RUN DEBIAN_FRONTED=noninteractive apt update && apt upgrade -y
|
| 4 |
-
RUN DEBIAN_FRONTED=noninteractive apt install -y git git-lfs build-essential cmake ninja-build curl
|
| 5 |
|
| 6 |
-
RUN git clone https://github.com/ggml-org/whisper.cpp.git
|
| 7 |
-
WORKDIR whisper.cpp
|
| 8 |
-
RUN sh ./models/download-ggml-model.sh base.en
|
| 9 |
ENV LD_LIBRARY_PATH="/usr/local/cuda/compat:$LD_LIBRARY_PATH"
|
| 10 |
-
RUN cmake -B build -GNinja -DGGML_CUDA=1
|
| 11 |
cmake --build build --config Release
|
| 12 |
|
| 13 |
-
CMD ./build/bin/
|
|
|
|
| 1 |
FROM nvidia/cuda:12.9.0-cudnn-devel-ubuntu24.04
|
| 2 |
|
| 3 |
RUN DEBIAN_FRONTED=noninteractive apt update && apt upgrade -y
|
| 4 |
+
RUN DEBIAN_FRONTED=noninteractive apt install -y git git-lfs build-essential cmake ninja-build curl libcurl4-openssl-dev
|
| 5 |
|
| 6 |
+
RUN git clone https://github.com/ggml-org/llama.cpp.git
|
| 7 |
+
WORKDIR llama.cpp
|
|
|
|
| 8 |
ENV LD_LIBRARY_PATH="/usr/local/cuda/compat:$LD_LIBRARY_PATH"
|
| 9 |
+
RUN cmake -B build -GNinja -DGGML_CUDA=1 && \
|
| 10 |
cmake --build build --config Release
|
| 11 |
|
| 12 |
+
CMD ./build/bin/llama-server --host 0.0.0.0 -hf ggml-org/SmolVLM-256M-Instruct-GGUF
|
README.md
CHANGED
|
@@ -5,6 +5,7 @@ colorFrom: red
|
|
| 5 |
colorTo: yellow
|
| 6 |
sdk: docker
|
| 7 |
pinned: false
|
|
|
|
| 8 |
---
|
| 9 |
|
| 10 |
Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
|
|
|
|
| 5 |
colorTo: yellow
|
| 6 |
sdk: docker
|
| 7 |
pinned: false
|
| 8 |
+
app_port: 8080
|
| 9 |
---
|
| 10 |
|
| 11 |
Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
|