mindcraft-vllm

Sleeping

App Files Files Community

yousuff.s committed on Dec 24, 2025

Commit

c38633f

1 Parent(s): bdf1636

add Flask app and entrypoint script for Ollama service

Browse files

Files changed (3) hide show

Dockerfile +3 -69
app.py +74 -0
entrypoint.sh +20 -0

Dockerfile CHANGED Viewed

@@ -2,80 +2,14 @@ FROM ollama/ollama:latest
 WORKDIR /app
-# Install dependencies
 RUN apt-get update && apt-get install -y curl python3 python3-pip && \
     rm -rf /var/lib/apt/lists/*
-# Install Flask
 RUN pip3 install flask requests --break-system-packages
-# Create Flask app
-RUN printf '%s\n' \
-'from flask import Flask, request, jsonify, Response' \
-'import requests' \
-'' \
-'app = Flask(__name__)' \
-'OLLAMA_URL = "http://localhost:11434"' \
-'' \
-'@app.route("/")' \
-'def home():' \
-'    return """<!DOCTYPE html>' \
-'<html><head><title>Ollama API</title></head>' \
-'<body style="font-family:Arial;padding:50px;text-align:center;">' \
-'<h1>🦙 Ollama API Running!</h1>' \
-'<p>Model: llama3.2:3b</p>' \
-'<h3>Test with:</h3>' \
-'<pre style="background:#f4f4f4;padding:20px;text-align:left;">curl -X POST https://YOUR-SPACE.hf.space/api/generate \\' \
-'  -H "Content-Type: application/json" \\' \
-'  -d '"'"'{"model":"llama3.2:3b","prompt":"Hello!","stream":false}'"'"'</pre>' \
-'</body></html>"""' \
-'' \
-'@app.route("/api/generate", methods=["POST"])' \
-'def generate():' \
-'    try:' \
-'        data = request.json' \
-'        resp = requests.post(f"{OLLAMA_URL}/api/generate", json=data, stream=data.get("stream", False))' \
-'        if data.get("stream", False):' \
-'            def gen():' \
-'                for line in resp.iter_lines():' \
-'                    if line: yield line + b"\\n"' \
-'            return Response(gen(), content_type="application/x-ndjson")' \
-'        return jsonify(resp.json())' \
-'    except Exception as e:' \
-'        return jsonify({"error": str(e)}), 500' \
-'' \
-'@app.route("/api/chat", methods=["POST"])' \
-'def chat():' \
-'    try:' \
-'        data = request.json' \
-'        resp = requests.post(f"{OLLAMA_URL}/api/chat", json=data, stream=data.get("stream", False))' \
-'        if data.get("stream", False):' \
-'            def gen():' \
-'                for line in resp.iter_lines():' \
-'                    if line: yield line + b"\\n"' \
-'            return Response(gen(), content_type="application/x-ndjson")' \
-'        return jsonify(resp.json())' \
-'    except Exception as e:' \
-'        return jsonify({"error": str(e)}), 500' \
-'' \
-'if __name__ == "__main__":' \
-'    app.run(host="0.0.0.0", port=7860)' \
-> /app/app.py
-# Create startup script
-RUN printf '%s\n' \
-'#!/bin/bash' \
-'set -e' \
-'echo "Starting Ollama..."' \
-'ollama serve &' \
-'sleep 10' \
-'echo "Pulling model..."' \
-'ollama pull llama3.2:3b' \
-'echo "Starting Flask..."' \
-'python3 /app/app.py &' \
-'echo "Ready!"' \
-'wait' \
-> /entrypoint.sh && chmod +x /entrypoint.sh
 EXPOSE 7860 11434

 WORKDIR /app
 RUN apt-get update && apt-get install -y curl python3 python3-pip && \
     rm -rf /var/lib/apt/lists/*
 RUN pip3 install flask requests --break-system-packages
+COPY app.py /app/app.py
+COPY entrypoint.sh /entrypoint.sh
+RUN chmod +x /entrypoint.sh
 EXPOSE 7860 11434

app.py ADDED Viewed

	@@ -0,0 +1,74 @@

+from flask import Flask, request, jsonify, Response
+import requests
+app = Flask(__name__)
+OLLAMA_URL = "http://localhost:11434"
+@app.route('/')
+def home():
+    return '''<!DOCTYPE html>
+<html><head><title>Ollama API</title></head>
+<body style="font-family:Arial;padding:50px;text-align:center;">
+<h1>🦙 Ollama API Running!</h1>
+<p>Model: llama3.2:3b</p>
+<h3>Test with:</h3>
+<pre style="background:#f4f4f4;padding:20px;text-align:left;max-width:700px;margin:20px auto;">
+curl -X POST https://my-ollama.hf.space/api/generate \\
+  -H "Content-Type: application/json" \\
+  -d '{"model":"llama3.2:3b","prompt":"Hello!","stream":false}'
+</pre>
+</body></html>'''
+@app.route('/api/generate', methods=['POST'])
+def generate():
+    print("Received request to /api/generate")
+    try:
+        data = request.get_json()
+        print(f"Request data: {data}")
+        resp = requests.post(
+            f"{OLLAMA_URL}/api/generate",
+            json=data,
+            stream=data.get('stream', False),
+            timeout=120
+        )
+        if data.get('stream', False):
+            def gen():
+                for line in resp.iter_lines():
+                    if line:
+                        yield line + b'\n'
+            return Response(gen(), content_type='application/x-ndjson')
+        else:
+            return jsonify(resp.json())
+    except Exception as e:
+        print(f"Error: {e}")
+        return jsonify({"error": str(e)}), 500
+@app.route('/api/chat', methods=['POST'])
+def chat():
+    print("Received request to /api/chat")
+    try:
+        data = request.get_json()
+        resp = requests.post(
+            f"{OLLAMA_URL}/api/chat",
+            json=data,
+            stream=data.get('stream', False),
+            timeout=120
+        )
+        if data.get('stream', False):
+            def gen():
+                for line in resp.iter_lines():
+                    if line:
+                        yield line + b'\n'
+            return Response(gen(), content_type='application/x-ndjson')
+        else:
+            return jsonify(resp.json())
+    except Exception as e:
+        print(f"Error: {e}")
+        return jsonify({"error": str(e)}), 500
+if __name__ == '__main__':
+    print("Starting Flask on port 7860...")
+    app.run(host='0.0.0.0', port=7860, debug=False)

entrypoint.sh ADDED Viewed

	@@ -0,0 +1,20 @@

+#!/bin/bash
+set -e
+echo "Starting Ollama..."
+ollama serve &
+OLLAMA_PID=$!
+echo "Waiting for Ollama to be ready..."
+sleep 10
+echo "Pulling model..."
+ollama pull llama3.2:3b
+echo "Starting Flask..."
+python3 /app/app.py &
+FLASK_PID=$!
+echo "Ready!"
+wait $OLLAMA_PID $FLASK_PID