Vedika-advanced-AI committed on
Commit
cbc80cd
·
verified ·
1 Parent(s): c5fafa4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -7
app.py CHANGED
@@ -22,12 +22,14 @@ class MessageModel(BaseModel):
22
  role: str
23
  content: Any
24
 
25
- class ChatPayload(BaseModel):
26
  messages: List[MessageModel]
27
  max_tokens: Optional[int] = 16384
28
  temperature: Optional[float] = 1.00
29
  top_p: Optional[float] = 0.95
30
- stream: Optional[bool] = False
 
 
31
 
32
  def verify_token(api_key: str = Security(api_key_header)):
33
  if not api_key or api_key.replace("Bearer ", "") != CLIENT_AUTH_TOKEN:
@@ -38,8 +40,9 @@ def verify_token(api_key: str = Security(api_key_header)):
38
  def home():
39
  return {"status": "online", "model": "Vedika AI (stepfun-ai/step-3.7-flash)"}
40
 
 
41
  @app.post("/v1/chat/completions")
42
- def process_chat(payload: ChatPayload, token: str = Security(verify_token)):
43
  if not NVIDIA_API_KEY:
44
  raise HTTPException(status_code=500, detail="Server Error: NVIDIA_API_KEY is missing")
45
 
@@ -48,14 +51,14 @@ def process_chat(payload: ChatPayload, token: str = Security(verify_token)):
48
  "Accept": "application/json"
49
  }
50
 
51
- formatted_messages = [VEDIKA_SYSTEM_PROMPT] + [msg.model_dump() for msg in payload.messages]
52
 
53
  nvidia_payload = {
54
  "model": MODEL_NAME,
55
  "messages": formatted_messages,
56
- "max_tokens": payload.max_tokens,
57
- "temperature": payload.temperature,
58
- "top_p": payload.top_p,
59
  "stream": False
60
  }
61
 
 
22
  role: str
23
  content: Any
24
 
25
+ class RunPodInput(BaseModel):
26
  messages: List[MessageModel]
27
  max_tokens: Optional[int] = 16384
28
  temperature: Optional[float] = 1.00
29
  top_p: Optional[float] = 0.95
30
+
31
+ class RunPodPayload(BaseModel):
32
+ input: RunPodInput
33
 
34
  def verify_token(api_key: str = Security(api_key_header)):
35
  if not api_key or api_key.replace("Bearer ", "") != CLIENT_AUTH_TOKEN:
 
40
  def home():
41
  return {"status": "online", "model": "Vedika AI (stepfun-ai/step-3.7-flash)"}
42
 
43
+ @app.post("/run")
44
  @app.post("/v1/chat/completions")
45
+ def process_chat(payload: RunPodPayload, token: str = Security(verify_token)):
46
  if not NVIDIA_API_KEY:
47
  raise HTTPException(status_code=500, detail="Server Error: NVIDIA_API_KEY is missing")
48
 
 
51
  "Accept": "application/json"
52
  }
53
 
54
+ formatted_messages = [VEDIKA_SYSTEM_PROMPT] + [msg.model_dump() for msg in payload.input.messages]
55
 
56
  nvidia_payload = {
57
  "model": MODEL_NAME,
58
  "messages": formatted_messages,
59
+ "max_tokens": payload.input.max_tokens,
60
+ "temperature": payload.input.temperature,
61
+ "top_p": payload.input.top_p,
62
  "stream": False
63
  }
64