File size: 676 Bytes
3bb3fbd
 
26bc55c
d7ee138
26bc55c
 
3bb3fbd
26bc55c
 
e932502
26bc55c
 
 
e932502
3bb3fbd
26bc55c
 
 
 
e932502
 
d7ee138
26bc55c
3bb3fbd
e932502
26bc55c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
import importlib.util
import os
import subprocess

# Fast downloads: huggingface_hub reads HF_HUB_ENABLE_HF_TRANSFER once, when it
# is imported, so the flag must be set BEFORE the import below to have any
# effect. It is only enabled when the optional `hf_transfer` package is
# installed, because turning it on without that package makes downloads fail.
if importlib.util.find_spec("hf_transfer") is not None:
    os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "1"

from huggingface_hub import hf_hub_download  # noqa: E402  (must follow env setup)

def run():
    """Download the GGUF model and serve it with ``llama_cpp.server``.

    The model file is fetched from the Hugging Face Hub into the current
    directory, then the llama-cpp-python server module is started as a child
    process listening on 0.0.0.0:7860 with a context size of 4096. The call
    blocks until the server process exits.

    Raises:
        subprocess.CalledProcessError: If the server process exits with a
            non-zero status.
    """
    # Local import: only needed here, to locate the running interpreter.
    import sys

    # Download the model (the original note says llama-cpp is already
    # installed on the system).
    model_path = hf_hub_download(
        repo_id="bartowski/Qwen2.5-Coder-7B-Instruct-GGUF",
        filename="Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf",
        local_dir=".",
    )

    # Start the server. Use the path returned by the download rather than a
    # hard-coded relative filename, and the current interpreter rather than
    # whatever "python3" resolves to on PATH, so the server runs in the same
    # environment this script runs in.
    subprocess.run(
        [
            sys.executable, "-m", "llama_cpp.server",
            "--model", model_path,
            "--host", "0.0.0.0",
            "--port", "7860",
            "--n_ctx", "4096",
        ],
        check=True,  # surface a failed server start instead of exiting silently
    )

# Script entry point: download the model and start the server only when this
# file is executed directly, not when it is imported as a module.
if __name__ == "__main__":
    run()