Spaces:
Build error
Build error
Update app.py
Browse files
app.py
CHANGED
|
@@ -7,8 +7,9 @@ from huggingface_hub import hf_hub_download
|
|
| 7 |
|
| 8 |
llm = Llama(
|
| 9 |
model_path=hf_hub_download(
|
| 10 |
-
repo_id=os.environ.get("REPO_ID", "
|
| 11 |
-
|
|
|
|
| 12 |
),
|
| 13 |
n_ctx=2048,
|
| 14 |
n_gpu_layers=50, # change n_gpu_layers if you have more or less VRAM
|
|
|
|
| 7 |
|
| 8 |
llm = Llama(
|
| 9 |
model_path=hf_hub_download(
|
| 10 |
+
repo_id=os.environ.get("REPO_ID", "unsloth/NVIDIA-Nemotron-3-Nano-4B-GGUF:Q4_K_M"),  # NOTE(review): "repo:quant" looks like llama.cpp -hf syntax; hf_hub_download expects a bare "owner/name" repo_id — confirm
|
| 11 |
+
|
| 12 |
+
filename=os.environ.get("MODEL_FILE", "NVIDIA-Nemotron-3-Nano-4B-GGUF:Q4_K_M"),
|
| 13 |
),
|
| 14 |
n_ctx=2048,
|
| 15 |
n_gpu_layers=50, # change n_gpu_layers if you have more or less VRAM
|