Upload 2 files
Browse files- Dockerfile +21 -0
- script.sh +8 -0
Dockerfile
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Image that bundles two GGUF models, the llama.cpp server binary from the
# base image, and the trivia web app; script.sh starts all of them.

# Base image is pinned to a specific llama.cpp commit tag for reproducible builds.
FROM ghcr.io/ggerganov/llama.cpp:server-cuda-7c27a19b2eb91bb0f43c7f7aec0386cec2dddc33

# Build-time tools: wget (model downloads), git (app checkout), python3 + pip
# (app dependencies). The apt package lists are deleted in the same layer so
# they do not end up in the image.
RUN apt-get update \
    && apt-get install -y \
        git \
        python3 \
        python3-pip \
        wget \
    && rm -rf /var/lib/apt/lists/*

# Run CMD through a shell.
# NOTE(review): presumably this replaces an entrypoint inherited from the base
# image -- confirm against the base image definition.
ENTRYPOINT ["/bin/sh", "-c"]

# Absolute path so the location does not depend on the base image's working
# directory. script.sh calls ../llama-server, so the server binary is expected
# in the parent of this directory.
# NOTE(review): assumes the base image's working directory is / (which is what
# the previous relative path resolved against) -- re-check if the base tag changes.
WORKDIR /llama.cpp

# Model weights are fetched in separate layers so each download is cached independently.
RUN wget -q https://huggingface.co/Mihaiii/shieldgemma-2b-Q5_K_M-GGUF/resolve/main/shieldgemma-2b-q5_k_m-imat.gguf
RUN wget -q https://huggingface.co/bartowski/gemma-2-2b-it-GGUF/resolve/main/gemma-2-2b-it-Q5_K_M.gguf

COPY script.sh .

# Make the launcher executable and the working directory world-writable.
# NOTE(review): the 777 mode is presumably needed because the container runs
# under a non-root UID at runtime -- confirm, and tighten if possible.
RUN chmod +x ./script.sh \
    && chmod 777 .

# Fetch the web app. Only the working tree is needed, so skip the history.
# NOTE(review): the clone is not pinned to a commit, so rebuilds may pick up
# a different app revision.
RUN git clone --depth 1 https://github.com/Mihaiii/trivia.git

# --no-cache-dir keeps pip's download cache out of the image layer.
RUN cd trivia && pip install --no-cache-dir -r requirements.txt

# NOTE(review): world-writable for the same presumed reason as the working directory above.
RUN chmod 777 ./trivia

# Port the web app listens on (uvicorn --port 7860 in script.sh). Documentation only.
EXPOSE 7860

CMD ["./script.sh"]
|
script.sh
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#!/bin/bash
# Container launcher: starts two llama-server instances in the background
# (one per model), then runs the trivia web app in the foreground.

# ShieldGemma model server, bound to loopback only (127.0.0.1:8000).
../llama-server -m ./shieldgemma-2b-q5_k_m-imat.gguf -c 8192 -t 4 --port 8000 --host 127.0.0.1 --parallel 2 -cb &

# Gemma 2 2B IT model server, bound to loopback only (127.0.0.1:7888).
# -t needs an explicit thread count; without one, `--port` lands in the
# position of its value. Uses 4, the same as the first server.
../llama-server -m ./gemma-2-2b-it-Q5_K_M.gguf -c 8192 -t 4 --port 7888 --host 127.0.0.1 --parallel 2 -cb &

# Fixed head start for the two servers; this is a delay, not a readiness check.
sleep 5

# Stop here if the app directory is missing rather than launching uvicorn
# from the wrong location.
cd trivia || exit 1

# exec replaces this shell with uvicorn so it receives stop signals directly.
exec uvicorn app:app --port 7860 --host 0.0.0.0
|