Update README.md
Browse files
README.md
CHANGED
|
@@ -55,7 +55,7 @@ from llama_cpp import Llama
|
|
| 55 |
|
| 56 |
model_path = hf_hub_download(
|
| 57 |
repo_id="MoxoffSpA/VolareQuantized",
|
| 58 |
-
filename="Volare-Q4_K_M.gguf"
|
| 59 |
)
|
| 60 |
|
| 61 |
# Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.
|
|
|
|
| 55 |
|
| 56 |
model_path = hf_hub_download(
|
| 57 |
repo_id="MoxoffSpA/VolareQuantized",
|
| 58 |
+
filename="Volare-ggml-Q4_K_M.gguf"
|
| 59 |
)
|
| 60 |
|
| 61 |
# Set gpu_layers to the number of layers to offload to GPU. Set to 0 if no GPU acceleration is available on your system.
|