Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -65,11 +65,18 @@ ddg = DuckDuckGoSearchTool()
|
|
| 65 |
# custom_role_conversions=None,
|
| 66 |
# )
|
| 67 |
|
| 68 |
-
model = LiteLLMModel(
|
| 69 |
-
|
| 70 |
-
|
| 71 |
-
|
| 72 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 73 |
)
|
| 74 |
|
| 75 |
# Import tool from Hub
|
|
|
|
| 65 |
# custom_role_conversions=None,
|
| 66 |
# )
|
| 67 |
|
| 68 |
+
# model = LiteLLMModel(
|
| 69 |
+
# model_id="ollama_chat/qwen2.5:7b", # Ollama model identifier
|
| 70 |
+
# api_base="http://127.0.0.1:11434", # default Ollama HTTP port
|
| 71 |
+
# num_ctx=8192,
|
| 72 |
+
# temperature=0.5
|
| 73 |
+
# )
|
| 74 |
+
|
| 75 |
+
model = LocalModel(
|
| 76 |
+
model_id="TheBloke/vicuna-7B-1.1-HF",
|
| 77 |
+
trust_remote_code=True, # needed if the repo defines its own model classes
|
| 78 |
+
device="cuda", # or "cpu" if no GPU
|
| 79 |
+
quantize="4bit" # optional: drastically reduce VRAM usage
|
| 80 |
)
|
| 81 |
|
| 82 |
# Import tool from Hub
|