Spaces:

MarionHalgrain
/

phi2_appli

Sleeping

marion Halgrain committed on Mar 15, 2024

Commit

337deff

verified ·

1 Parent(s): 0334d57

Update main.py

Files changed (1) hide show

main.py CHANGED Viewed

@@ -1,22 +1,24 @@
-from llama_cpp import LlamaModel
 from fastapi import FastAPI
 from pydantic import BaseModel
-# Charger le modèle LLaMA
-llm = LlamaModel(model_path="phi-2.Q5_K_M.gguf")
-# Pydantic object
-class Validation(BaseModel):
-    prompt: str
-# Fast API
 app = FastAPI()
 @app.post("/llm_on_cpu")
-async def stream(item: Validation):
     system_prompt = 'Below is an instruction that describes a task. Write a response that appropriately completes the request.'
     E_INST = "</s>"
     user, assistant = "<|user|>", "<|assistant|>"
     prompt = f"{system_prompt}{E_INST}\n{user}\n{item.prompt}{E_INST}\n{assistant}\n"
-    response = llm.generate(prompt, max_new_tokens=1096, num_threads=3)
-    return response

+from ctransformers import AutoModelForCausalLM
 from fastapi import FastAPI
 from pydantic import BaseModel
+llm = AutoModelForCausalLM.from_pretrained("zephyr-7b-beta.Q4_K_S.gguf",
+model_type='mistral',
+max_new_tokens = 1096,
+threads = 3,
+)
+#Pydantic object
+class validation(BaseModel):
+    prompt: str
+#Fast API
 app = FastAPI()
 @app.post("/llm_on_cpu")
+async def stream(item: validation):
     system_prompt = 'Below is an instruction that describes a task. Write a response that appropriately completes the request.'
     E_INST = "</s>"
     user, assistant = "<|user|>", "<|assistant|>"
     prompt = f"{system_prompt}{E_INST}\n{user}\n{item.prompt}{E_INST}\n{assistant}\n"
+    return llm(prompt)