Jodaro committed on
Commit
863eb49
·
verified ·
1 Parent(s): 5db6945

Switch to Llama 3.2 3B Instruct Q4_K_M

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -1,13 +1,13 @@
1
  import gradio as gr
2
  from ctransformers import AutoModelForCausalLM
3
 
4
- MODEL_REPO = "Qwen/Qwen2.5-3B-Instruct-GGUF"
5
- MODEL_FILE = "qwen2.5-3b-instruct-q4_k_m.gguf"
6
 
7
  llm = AutoModelForCausalLM.from_pretrained(
8
  MODEL_REPO,
9
  model_file=MODEL_FILE,
10
- model_type="qwen",
11
  gpu_layers=0,
12
  context_length=8192,
13
  )
 
1
  import gradio as gr
2
  from ctransformers import AutoModelForCausalLM
3
 
4
+ MODEL_REPO = "hugging-quants/Llama-3.2-3B-Instruct-Q4_K_M-GGUF"
5
+ MODEL_FILE = "llama-3.2-3b-instruct-q4_k_m.gguf"
6
 
7
  llm = AutoModelForCausalLM.from_pretrained(
8
  MODEL_REPO,
9
  model_file=MODEL_FILE,
10
+ model_type="llama",
11
  gpu_layers=0,
12
  context_length=8192,
13
  )