Spaces:

ar08
/

Phi-3-api

Paused

ar08 committed on Aug 20, 2024

Commit

cbc595a

verified ·

1 Parent(s): 1491ed2

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,6 +4,7 @@ from pydantic import BaseModel
 from llama_cpp import Llama
 import time
 import io
 # Initialize FastAPI app
 app = FastAPI()
@@ -29,15 +30,21 @@ class RequestModel(BaseModel):
     logprobs: int = None
     stop: list = None
-# Response model
 class ResponseModel(BaseModel):
     id: str
     object: str
     created: int
     model: str
-    choices: list
-@app.post("/v1/completions")
 async def create_completion(request: RequestModel):
     try:
         if request.stream:
@@ -79,12 +86,12 @@ async def create_completion(request: RequestModel):
                 created=int(time.time()),
                 model=request.model,
                 choices=[
-                    {
-                        "text": generated_text,
-                        "index": 0,
-                        "logprobs": None,
-                        "finish_reason": "stop"
-                    }
                 ]
             )
@@ -93,5 +100,4 @@ async def create_completion(request: RequestModel):
 if __name__ == "__main__":
     import uvicorn
-    import asyncio
     uvicorn.run(app, host="0.0.0.0", port=8000)

 from llama_cpp import Llama
 import time
 import io
+import asyncio
 # Initialize FastAPI app
 app = FastAPI()
     logprobs: int = None
     stop: list = None
+# Response model based on OpenAI API structure
+class Choice(BaseModel):
+    text: str
+    index: int
+    logprobs: int = None
+    finish_reason: str
 class ResponseModel(BaseModel):
     id: str
     object: str
     created: int
     model: str
+    choices: list[Choice]
+@app.post("/v1/completions", response_model=ResponseModel)
 async def create_completion(request: RequestModel):
     try:
         if request.stream:
                 created=int(time.time()),
                 model=request.model,
                 choices=[
+                    Choice(
+                        text=generated_text,
+                        index=0,
+                        logprobs=None,
+                        finish_reason="stop"
+                    )
                 ]
             )
 if __name__ == "__main__":
     import uvicorn
     uvicorn.run(app, host="0.0.0.0", port=8000)