MichaelP719 committed on
Commit
5f3c471
·
verified ·
1 Parent(s): 99be101

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -5
app.py CHANGED
@@ -65,11 +65,18 @@ ddg = DuckDuckGoSearchTool()
65
  # custom_role_conversions=None,
66
  # )
67
 
68
- model = LiteLLMModel(
69
- model_id="ollama_chat/qwen2.5:7b", # Ollama model identifier
70
- api_base="http://127.0.0.1:11434", # default Ollama HTTP port
71
- num_ctx=8192,
72
- temperature=0.5
 
 
 
 
 
 
 
73
  )
74
 
75
  # Import tool from Hub
 
65
  # custom_role_conversions=None,
66
  # )
67
 
68
+ # model = LiteLLMModel(
69
+ # model_id="ollama_chat/qwen2.5:7b", # Ollama model identifier
70
+ # api_base="http://127.0.0.1:11434", # default Ollama HTTP port
71
+ # num_ctx=8192,
72
+ # temperature=0.5
73
+ # )
74
+
75
+ model = LocalModel(
76
+ model_id="TheBloke/vicuna-7B-1.1-HF",
77
+ trust_remote_code=True, # needed if the repo defines its own model classes
78
+ device="cuda", # or "cpu" if no GPU
79
+ quantize="4bit" # optional: drastically reduce VRAM usage
80
  )
81
 
82
  # Import tool from Hub