hugh007 committed on
Commit
82ad52b
·
verified ·
1 Parent(s): 0745c6f

fix: upgrade to Q6_K (600MB) for better quality

Browse files
Files changed (2) hide show
  1. Dockerfile +2 -2
  2. app.py +1 -1
Dockerfile CHANGED
@@ -10,8 +10,8 @@ RUN pip install --no-cache-dir --timeout 300 llama-cpp-python==0.3.23 \
10
  RUN apt-get update && apt-get install -y --no-install-recommends curl \
11
  && rm -rf /var/lib/apt/lists/*
12
  RUN mkdir -p /app/models && \
13
- curl -sL -o /app/models/MiniCPM-V-4_6-Thinking-Q4_K_M.gguf \
14
- "https://huggingface.co/openbmb/MiniCPM-V-4.6-Thinking-gguf/resolve/main/MiniCPM-V-4_6-Thinking-Q4_K_M.gguf" && \
15
  curl -sL -o /app/models/mmproj-model-f16.gguf \
16
  "https://huggingface.co/openbmb/MiniCPM-V-4.6-Thinking-gguf/resolve/main/mmproj-model-f16.gguf"
17
 
 
10
  RUN apt-get update && apt-get install -y --no-install-recommends curl \
11
  && rm -rf /var/lib/apt/lists/*
12
  RUN mkdir -p /app/models && \
13
+ curl -sL -o /app/models/MiniCPM-V-4_6-Thinking-Q6_K.gguf \
14
+ "https://huggingface.co/openbmb/MiniCPM-V-4.6-Thinking-gguf/resolve/main/MiniCPM-V-4_6-Thinking-Q6_K.gguf" && \
15
  curl -sL -o /app/models/mmproj-model-f16.gguf \
16
  "https://huggingface.co/openbmb/MiniCPM-V-4.6-Thinking-gguf/resolve/main/mmproj-model-f16.gguf"
17
 
app.py CHANGED
@@ -11,7 +11,7 @@ _ready = False
11
  _llm = None
12
  _llm_lock = threading.Lock()
13
  _tasks = {}
14
- MODEL_PATH = "/app/models/MiniCPM-V-4_6-Thinking-Q4_K_M.gguf"
15
  MMPROJ_PATH = "/app/models/mmproj-model-f16.gguf"
16
 
17
 
 
11
  _llm = None
12
  _llm_lock = threading.Lock()
13
  _tasks = {}
14
+ MODEL_PATH = "/app/models/MiniCPM-V-4_6-Thinking-Q6_K.gguf"
15
  MMPROJ_PATH = "/app/models/mmproj-model-f16.gguf"
16
 
17