Spaces:
Running
Switch to Llama 3.2 3B Instruct Q4_K_M
Browse files
app.py
CHANGED
|
@@ -1,13 +1,13 @@
|
|
| 1 |
import gradio as gr
|
| 2 |
from ctransformers import AutoModelForCausalLM
|
| 3 |
|
| 4 |
-
MODEL_REPO = "
|
| 5 |
-
MODEL_FILE = "
|
| 6 |
|
| 7 |
llm = AutoModelForCausalLM.from_pretrained(
|
| 8 |
MODEL_REPO,
|
| 9 |
model_file=MODEL_FILE,
|
| 10 |
-
model_type="
|
| 11 |
gpu_layers=0,
|
| 12 |
context_length=8192,
|
| 13 |
)
|
|
|
|
| 1 |
import gradio as gr
|
| 2 |
from ctransformers import AutoModelForCausalLM
|
| 3 |
|
| 4 |
+
MODEL_REPO = "hugging-quants/Llama-3.2-3B-Instruct-Q4_K_M-GGUF"
|
| 5 |
+
MODEL_FILE = "llama-3.2-3b-instruct-q4_k_m.gguf"
|
| 6 |
|
| 7 |
llm = AutoModelForCausalLM.from_pretrained(
|
| 8 |
MODEL_REPO,
|
| 9 |
model_file=MODEL_FILE,
|
| 10 |
+
model_type="llama",
|
| 11 |
gpu_layers=0,
|
| 12 |
context_length=8192,
|
| 13 |
)
|