hermes3-llama-cpp

Running

Jodaro committed about 23 hours ago

Commit

863eb49

verified ·

1 Parent(s): 5db6945

Switch to Llama 3.2 3B Instruct Q4_K_M

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,13 +1,13 @@
 import gradio as gr
 from ctransformers import AutoModelForCausalLM
-MODEL_REPO = "Qwen/Qwen2.5-3B-Instruct-GGUF"
-MODEL_FILE = "qwen2.5-3b-instruct-q4_k_m.gguf"
 llm = AutoModelForCausalLM.from_pretrained(
     MODEL_REPO,
     model_file=MODEL_FILE,
-    model_type="qwen",
     gpu_layers=0,
     context_length=8192,
 )

 import gradio as gr
 from ctransformers import AutoModelForCausalLM
+MODEL_REPO = "hugging-quants/Llama-3.2-3B-Instruct-Q4_K_M-GGUF"
+MODEL_FILE = "llama-3.2-3b-instruct-q4_k_m.gguf"
 llm = AutoModelForCausalLM.from_pretrained(
     MODEL_REPO,
     model_file=MODEL_FILE,
+    model_type="llama",
     gpu_layers=0,
     context_length=8192,
 )