AIencoder committed on
Commit
1ee8232
·
verified ·
1 Parent(s): ed77a98

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +18 -4
app.py CHANGED
@@ -1,4 +1,4 @@
1
- import os
2
  import gradio as gr
3
  import json
4
  import time
@@ -13,11 +13,25 @@ MODELS_DIR = "/data/models"
13
  MAX_TOKENS = 2048
14
  CONTEXT_SIZE = 4096
15
 
16
- # Map models to their likely GGUF repositories (Falling back to Qwen for the 3B)
17
  MODEL_REPOS = {
 
 
 
 
18
  "qwen2.5-coder-3b-instruct-q4_k_m.gguf": "Qwen/Qwen2.5-Coder-3B-Instruct-GGUF",
19
- "qwen2.5-coder-7b-instruct-q4_k_m.gguf": "Qwen/Qwen2.5-Coder-7B-Instruct-GGUF",
20
- # You can add others here
 
 
 
 
 
 
 
 
 
 
 
21
  }
22
 
23
  MODELS = {
 
1
+ import os
2
  import gradio as gr
3
  import json
4
  import time
 
13
  MAX_TOKENS = 2048
14
  CONTEXT_SIZE = 4096
15
 
 
16
  MODEL_REPOS = {
17
+ # 30B: Unsloth is the most reliable source for Qwen3 GGUFs currently
18
+ "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M.gguf": "unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF",
19
+
20
+ # 3B: Qwen publishes an official GGUF repo (used here); bartowski is a safe fallback
21
  "qwen2.5-coder-3b-instruct-q4_k_m.gguf": "Qwen/Qwen2.5-Coder-3B-Instruct-GGUF",
22
+
23
+ # 7B: Official Qwen GGUF is often missing/broken. Bartowski is the go-to here.
24
+ "qwen2.5-coder-7b-instruct-q4_k_m.gguf": "bartowski/Qwen2.5-Coder-7B-Instruct-GGUF",
25
+
26
+ # 14B: Bartowski is recommended for consistency
27
+ "qwen2.5-coder-14b-instruct-q4_k_m.gguf": "bartowski/Qwen2.5-Coder-14B-Instruct-GGUF",
28
+
29
+ # DeepSeek: Definitely needs community repo
30
+ "DeepSeek-Coder-V2-Lite-Instruct-Q4_K_M.gguf": "bartowski/DeepSeek-Coder-V2-Lite-Instruct-GGUF",
31
+
32
+ # Tiny models
33
+ "qwen2.5-coder-1.5b-instruct-q4_k_m.gguf": "Qwen/Qwen2.5-Coder-1.5B-Instruct-GGUF",
34
+ "qwen2.5-coder-0.5b-instruct-q4_k_m.gguf": "Qwen/Qwen2.5-Coder-0.5B-Instruct-GGUF",
35
  }
36
 
37
  MODELS = {