Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -22,12 +22,14 @@ class MessageModel(BaseModel):
|
|
| 22 |
role: str
|
| 23 |
content: Any
|
| 24 |
|
| 25 |
-
class ChatPayload(BaseModel):
|
| 26 |
messages: List[MessageModel]
|
| 27 |
max_tokens: Optional[int] = 16384
|
| 28 |
temperature: Optional[float] = 1.00
|
| 29 |
top_p: Optional[float] = 0.95
|
| 30 |
-
|
|
|
|
|
|
|
| 31 |
|
| 32 |
def verify_token(api_key: str = Security(api_key_header)):
|
| 33 |
if not api_key or api_key.replace("Bearer ", "") != CLIENT_AUTH_TOKEN:
|
|
@@ -38,8 +40,9 @@ def verify_token(api_key: str = Security(api_key_header)):
|
|
| 38 |
def home():
|
| 39 |
return {"status": "online", "model": "Vedika AI (stepfun-ai/step-3.7-flash)"}
|
| 40 |
|
|
|
|
| 41 |
@app.post("/v1/chat/completions")
|
| 42 |
-
def process_chat(payload: ChatPayload, token: str = Security(verify_token)):
|
| 43 |
if not NVIDIA_API_KEY:
|
| 44 |
raise HTTPException(status_code=500, detail="Server Error: NVIDIA_API_KEY is missing")
|
| 45 |
|
|
@@ -48,14 +51,14 @@ def process_chat(payload: ChatPayload, token: str = Security(verify_token)):
|
|
| 48 |
"Accept": "application/json"
|
| 49 |
}
|
| 50 |
|
| 51 |
-
formatted_messages = [VEDIKA_SYSTEM_PROMPT] + [msg.model_dump() for msg in payload.messages]
|
| 52 |
|
| 53 |
nvidia_payload = {
|
| 54 |
"model": MODEL_NAME,
|
| 55 |
"messages": formatted_messages,
|
| 56 |
-
"max_tokens": payload.max_tokens,
|
| 57 |
-
"temperature": payload.temperature,
|
| 58 |
-
"top_p": payload.top_p,
|
| 59 |
"stream": False
|
| 60 |
}
|
| 61 |
|
|
|
|
| 22 |
role: str
|
| 23 |
content: Any
|
| 24 |
|
| 25 |
+
class RunPodInput(BaseModel):
|
| 26 |
messages: List[MessageModel]
|
| 27 |
max_tokens: Optional[int] = 16384
|
| 28 |
temperature: Optional[float] = 1.00
|
| 29 |
top_p: Optional[float] = 0.95
|
| 30 |
+
|
| 31 |
+
class RunPodPayload(BaseModel):
|
| 32 |
+
input: RunPodInput
|
| 33 |
|
| 34 |
def verify_token(api_key: str = Security(api_key_header)):
|
| 35 |
if not api_key or api_key.replace("Bearer ", "") != CLIENT_AUTH_TOKEN:
|
|
|
|
| 40 |
def home():
|
| 41 |
return {"status": "online", "model": "Vedika AI (stepfun-ai/step-3.7-flash)"}
|
| 42 |
|
| 43 |
+
@app.post("/run")
|
| 44 |
@app.post("/v1/chat/completions")
|
| 45 |
+
def process_chat(payload: RunPodPayload, token: str = Security(verify_token)):
|
| 46 |
if not NVIDIA_API_KEY:
|
| 47 |
raise HTTPException(status_code=500, detail="Server Error: NVIDIA_API_KEY is missing")
|
| 48 |
|
|
|
|
| 51 |
"Accept": "application/json"
|
| 52 |
}
|
| 53 |
|
| 54 |
+
formatted_messages = [VEDIKA_SYSTEM_PROMPT] + [msg.model_dump() for msg in payload.input.messages]
|
| 55 |
|
| 56 |
nvidia_payload = {
|
| 57 |
"model": MODEL_NAME,
|
| 58 |
"messages": formatted_messages,
|
| 59 |
+
"max_tokens": payload.input.max_tokens,
|
| 60 |
+
"temperature": payload.input.temperature,
|
| 61 |
+
"top_p": payload.input.top_p,
|
| 62 |
"stream": False
|
| 63 |
}
|
| 64 |
|