Rename app.py to start.sh
Browse files
app.py
DELETED
|
@@ -1,23 +0,0 @@
|
|
| 1 |
-
"""Minimal Flask service that runs llama.cpp once per request."""

from flask import Flask, request, jsonify
import subprocess

app = Flask(__name__)
MODEL_PATH = "/llama.cpp/models/llama3.gguf"

# Upper bound for one llama.cpp run so a stuck process cannot block a
# worker indefinitely.
GENERATION_TIMEOUT_SECONDS = 300


@app.route("/generate", methods=["POST"])
def generate():
    """Run llama.cpp on the posted prompt and return its stdout as JSON.

    Expects a JSON object body with an optional string ``"prompt"`` field
    (defaults to the empty string).

    Returns:
        ``{"response": <stdout>}`` on success.
        A 400 response when the body is not a JSON object or ``prompt`` is
        not a string, 504 when the run exceeds the timeout, and 500 when
        llama.cpp cannot be started or exits with a non-zero status.
    """
    # silent=True yields None instead of raising on a missing or invalid body.
    payload = request.get_json(silent=True)
    if not isinstance(payload, dict):
        return jsonify({"error": "request body must be a JSON object"}), 400

    prompt = payload.get("prompt", "")
    if not isinstance(prompt, str):
        return jsonify({"error": "'prompt' must be a string"}), 400

    # The argument list is passed without a shell, so the prompt is handed to
    # llama.cpp verbatim as the value of -p and is never shell-interpreted.
    cmd = [
        "/llama.cpp/main",
        "-m", MODEL_PATH,
        "-p", prompt,
        "--n-predict", "128",
        "--ctx-size", "2048",
        "--temp", "0.7",
    ]

    try:
        result = subprocess.run(
            cmd,
            capture_output=True,
            text=True,
            timeout=GENERATION_TIMEOUT_SECONDS,
        )
    except subprocess.TimeoutExpired:
        return jsonify({"error": "generation timed out"}), 504
    except OSError as exc:
        # Binary missing or not executable.
        app.logger.error("failed to start llama.cpp: %s", exc)
        return jsonify({"error": "failed to start llama.cpp"}), 500

    if result.returncode != 0:
        # Keep stderr in the server log rather than exposing it to clients.
        app.logger.error(
            "llama.cpp exited with %d: %s", result.returncode, result.stderr
        )
        return jsonify({"error": "llama.cpp exited with an error"}), 500

    return jsonify({"response": result.stdout})


if __name__ == "__main__":
    # Only start the development server when executed as a script, so that
    # importing this module (e.g. from a WSGI server) has no side effects.
    app.run(host="0.0.0.0", port=7860)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
start.sh
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#!/bin/bash
#
# Container entrypoint: start the Ollama server, pull the llama3 model once
# the server responds, then stay in the foreground for as long as the server
# process is running.

# Maximum number of one-second readiness checks before giving up waiting.
READY_ATTEMPTS=60

# Start Ollama server in the background and remember its PID
ollama serve &
server_pid=$!

# Wait until the server answers instead of sleeping for a fixed time.
# `ollama list` talks to the server, so it only succeeds once the API is up.
ready=0
for ((attempt = 0; attempt < READY_ATTEMPTS; attempt++)); do
    if ollama list >/dev/null 2>&1; then
        ready=1
        break
    fi
    # Stop waiting early if the server process has already exited.
    if ! kill -0 "$server_pid" 2>/dev/null; then
        break
    fi
    sleep 1
done

if [ "$ready" -ne 1 ]; then
    echo "warning: ollama server did not become ready in time" >&2
fi

# Pull LLaMA 3 (8B); a failed pull is reported but does not stop the server
if ! ollama pull llama3; then
    echo "warning: 'ollama pull llama3' failed" >&2
fi

# Keep container alive while the server runs, and exit with the server's
# status if it stops, so a dead server does not leave an idle container.
wait "$server_pid"
|