Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -12,7 +12,7 @@ llm = Llama(
|
|
| 12 |
filename="llama-2-7b-chat.ggmlv3.q5_0.bin",
|
| 13 |
),
|
| 14 |
n_ctx=2048,
|
| 15 |
-
n_gpu_layers=
|
| 16 |
)
|
| 17 |
|
| 18 |
history = []
|
|
@@ -61,6 +61,8 @@ demo = gr.ChatInterface(
|
|
| 61 |
generate_text,
|
| 62 |
title="llama-cpp-python on GPU",
|
| 63 |
description="Running LLM with https://github.com/abetlen/llama-cpp-python",
|
|
|
|
|
|
|
| 64 |
retry_btn=None,
|
| 65 |
undo_btn="Delete Previous",
|
| 66 |
clear_btn="Clear",
|
|
|
|
| 12 |
filename="llama-2-7b-chat.ggmlv3.q5_0.bin",
|
| 13 |
),
|
| 14 |
n_ctx=2048,
|
| 15 |
+
n_gpu_layers=5000, # change n_gpu_layers if you have more or less VRAM
|
| 16 |
)
|
| 17 |
|
| 18 |
history = []
|
|
|
|
| 61 |
generate_text,
|
| 62 |
title="llama-cpp-python on GPU",
|
| 63 |
description="Running LLM with https://github.com/abetlen/llama-cpp-python",
|
| 64 |
+
examples=["tell me everything about llamas"],
|
| 65 |
+
cache_examples=True,
|
| 66 |
retry_btn=None,
|
| 67 |
undo_btn="Delete Previous",
|
| 68 |
clear_btn="Clear",
|