Neodranzer committed on
Commit
9a8cd2a
·
1 Parent(s): 5ff5c8e
__pycache__/llm_func.cpython-310.pyc ADDED
Binary file (908 Bytes). View file
 
__pycache__/main.cpython-310.pyc ADDED
Binary file (869 Bytes). View file
 
llm_func.py CHANGED
@@ -4,10 +4,9 @@ model = Llama.from_pretrained(repo_id="tensorblock/SmolLM-135M-Instruct-GGUF",fi
4
 
5
 
6
  def mdl(input):
7
- print(query)
8
- start = time.time()
9
- output = model(
10
- prompt=f"""<|im_start|>system
11
  You are a helpful chatbot.<|im_end|>
12
  <|im_start|>user
13
  {input}<|im_end|>""",
@@ -17,6 +16,6 @@ def mdl(input):
17
  echo=False,
18
  stop=["#"])
19
  end = time.time()
20
- total_time = end - start
21
- print(f"Execution time: {total_time:.2f} seconds")
22
  return output["choices"][0]["text"].replace('\nassistant\n','')
 
4
 
5
 
6
  def mdl(input):
7
+ print(input)
8
+ start = time.time()
9
+ output = model(prompt=f"""<|im_start|>system
 
10
  You are a helpful chatbot.<|im_end|>
11
  <|im_start|>user
12
  {input}<|im_end|>""",
 
16
  echo=False,
17
  stop=["#"])
18
  end = time.time()
19
+ total_time = end - start
20
+ print(f"Execution time: {total_time:.2f} seconds")
21
  return output["choices"][0]["text"].replace('\nassistant\n','')
requirements.txt CHANGED
@@ -1,4 +1,5 @@
1
  fastapi
2
  uvicorn
3
  llama-cpp-python==0.3.6 --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cpu
4
- huggingface
 
 
1
  fastapi
2
  uvicorn
3
  llama-cpp-python==0.3.6 --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cpu
4
+ huggingface
5
+ huggingface-hub