QJMKWB committed on
Commit
3bb3fbd
·
verified ·
1 Parent(s): 086d105

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +32 -0
app.py ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
"""Hugging Face Space entry point.

Downloads a GGUF model from the Hugging Face Hub into the current directory,
then launches ``llama_cpp.server`` on port 7860 and forwards every line the
server writes (stdout and stderr) to this process's stdout so it shows up in
the Space logs. The script exits with the server's exit code.
"""
import os
import subprocess
import sys

from huggingface_hub import hf_hub_download

print("--- START: Inicializacia Space ---", flush=True)

# 1. Download the model (download progress is visible in the logs).
repo_id = "bartowski/Qwen2.5-Coder-7B-Instruct-GGUF"
filename = "Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf"

print(f"--- Stahujem model {filename} z {repo_id} ---", flush=True)
model_path = hf_hub_download(repo_id=repo_id, filename=filename, local_dir=".")
print(f"--- Model je pripraveny v: {model_path} ---", flush=True)

# 2. Start the llama-cpp server.
command = [
    # Use the interpreter running this script so the server is started from
    # the same environment in which llama_cpp is installed.
    sys.executable, "-m", "llama_cpp.server",
    # Pass the path returned by the download rather than the bare file name,
    # so the server always opens the file that was actually fetched.
    "--model", model_path,
    "--host", "0.0.0.0",
    "--port", "7860",
    "--chat_format", "chatml",
    "--verbose", "True",
]

print(f"--- Spustam server: {' '.join(command)} ---", flush=True)

# The child's stdout is a pipe, so Python would block-buffer it by default;
# PYTHONUNBUFFERED makes the server emit each line as soon as it is written.
child_env = {**os.environ, "PYTHONUNBUFFERED": "1"}

# Run the server and relay its output to the console. stderr is merged into
# stdout (subprocess.STDOUT) so a single pipe carries all of the server logs.
with subprocess.Popen(
    command,
    stdout=subprocess.PIPE,
    stderr=subprocess.STDOUT,
    text=True,
    bufsize=1,  # line-buffered reads on our side of the pipe
    env=child_env,
) as process:
    # Forward each server line immediately so it appears in the logs in
    # real time instead of sitting in our own stdout buffer.
    for line in process.stdout:
        print(line, end="", flush=True)

# Leaving the ``with`` block waits for the server to terminate; propagate its
# exit status so a crashed server is not reported as a successful run.
sys.exit(process.returncode)