Spaces:

QuixiAI
/

chat

Running on Zero

pabloce committed on May 25, 2024

Commit

2cd2fd0

verified ·

1 Parent(s): 155c9c7

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,12 +1,15 @@
 import spaces
 import json
 import subprocess
 import gradio as gr
 from huggingface_hub import hf_hub_download
-subprocess.run('pip install llama-cpp-python==0.2.75 --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cu124', shell=True)
-subprocess.run('pip install llama-cpp-agent==0.2.10', shell=True)
 hf_hub_download(repo_id="bartowski/dolphin-2.9.1-yi-1.5-34b-GGUF", filename="dolphin-2.9.1-yi-1.5-34b-Q6_K.gguf",  local_dir = "./models")
 hf_hub_download(repo_id="crusoeai/dolphin-2.9.1-llama-3-70b-GGUF", filename="dolphin-2.9.1-llama-3-70b.Q3_K_M.gguf",  local_dir = "./models")
 # hf_hub_download(repo_id="bartowski/dolphin-2.9.1-yi-1.5-9b-GGUF", filename="dolphin-2.9.1-yi-1.5-9b-f32.gguf",  local_dir = "./models")
@@ -66,16 +69,7 @@ def respond(
     top_k,
     repeat_penalty,
     model,
-):
-    from llama_cpp import Llama
-    from llama_cpp_agent import LlamaCppAgent
-    from llama_cpp_agent import MessagesFormatterType
-    from llama_cpp_agent.providers import LlamaCppPythonProvider
-    from llama_cpp_agent.chat_history import BasicChatHistory
-    from llama_cpp_agent.chat_history.messages import Roles
-    print(message)
-    print(history)
     llm = Llama(
         model_path=f"models/{model}",
         flash_attn=True,

 import spaces
 import json
 import subprocess
+from llama_cpp import Llama
+from llama_cpp_agent import LlamaCppAgent
+from llama_cpp_agent import MessagesFormatterType
+from llama_cpp_agent.providers import LlamaCppPythonProvider
+from llama_cpp_agent.chat_history import BasicChatHistory
+from llama_cpp_agent.chat_history.messages import Roles
 import gradio as gr
 from huggingface_hub import hf_hub_download
 hf_hub_download(repo_id="bartowski/dolphin-2.9.1-yi-1.5-34b-GGUF", filename="dolphin-2.9.1-yi-1.5-34b-Q6_K.gguf",  local_dir = "./models")
 hf_hub_download(repo_id="crusoeai/dolphin-2.9.1-llama-3-70b-GGUF", filename="dolphin-2.9.1-llama-3-70b.Q3_K_M.gguf",  local_dir = "./models")
 # hf_hub_download(repo_id="bartowski/dolphin-2.9.1-yi-1.5-9b-GGUF", filename="dolphin-2.9.1-yi-1.5-9b-f32.gguf",  local_dir = "./models")
     top_k,
     repeat_penalty,
     model,
+):
     llm = Llama(
         model_path=f"models/{model}",
         flash_attn=True,