Alvin3y1 committed on
Commit
e35e970
·
verified ·
1 Parent(s): 081423f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +23 -23
app.py CHANGED
@@ -4,24 +4,14 @@ import uvicorn
4
  from fastapi import FastAPI, WebSocket
5
  from fastapi.responses import PlainTextResponse
6
 
7
- API_URL = "https://api.deepinfra.com/v1/openai/chat/completions"
 
8
  HEADERS = {
9
- "User-Agent": "Mozilla/5.0 (X11; Linux x86_64; rv:146.0) Gecko/20100101 Firefox/146.0",
10
- "Accept": "text/event-stream",
11
- "Accept-Language": "en-US,en;q=0.5",
12
- "Accept-Encoding": "gzip, deflate, br, zstd",
13
- "Referer": "https://deepinfra.com/",
14
- "Content-Type": "application/json",
15
- "X-Deepinfra-Source": "model-embed",
16
- "Origin": "https://deepinfra.com",
17
- "Sec-GPC": "1",
18
- "Connection": "keep-alive",
19
- "Sec-Fetch-Dest": "empty",
20
- "Sec-Fetch-Mode": "cors",
21
- "Sec-Fetch-Site": "same-site",
22
- "Priority": "u=0",
23
  }
24
- MODEL = "Qwen/Qwen3-Coder-480B-A35B-Instruct"
25
 
26
  app = FastAPI()
27
 
@@ -50,11 +40,7 @@ async def websocket_endpoint(websocket: WebSocket):
50
  payload = {
51
  "model": MODEL,
52
  "messages": chat_history,
53
- "stream": True,
54
- "stream_options": {
55
- "include_usage": True,
56
- "continuous_usage_stats": True
57
- }
58
  }
59
 
60
  full_response = ""
@@ -69,11 +55,25 @@ async def websocket_endpoint(websocket: WebSocket):
69
  break
70
  try:
71
  data = json.loads(line_content)
72
- delta = data.get("choices", [{}])[0].get("delta", {})
73
- text_chunk = delta.get("content", "")
 
 
 
 
 
 
 
 
 
 
 
 
 
74
  if text_chunk:
75
  await websocket.send_text(text_chunk)
76
  full_response += text_chunk
 
77
  except Exception:
78
  continue
79
  except Exception:
 
4
  from fastapi import FastAPI, WebSocket
5
  from fastapi.responses import PlainTextResponse
6
 
7
+ # Updated API Configuration
8
+ API_URL = "https://theoldllm.vercel.app/api/proxy?provider=p7"
9
  HEADERS = {
10
+ "accept": "*/*",
11
+ "content-type": "application/json",
12
+ "origin": "https://theoldllm.vercel.app",
 
 
 
 
 
 
 
 
 
 
 
13
  }
14
+ MODEL = "gemini-3-pro-preview"
15
 
16
  app = FastAPI()
17
 
 
40
  payload = {
41
  "model": MODEL,
42
  "messages": chat_history,
43
+ "stream": True
 
 
 
 
44
  }
45
 
46
  full_response = ""
 
55
  break
56
  try:
57
  data = json.loads(line_content)
58
+ choices = data.get("choices", [{}])
59
+ if not choices:
60
+ continue
61
+
62
+ delta = choices[0].get("delta", {})
63
+
64
+ # Handle "Reasoning" (Thinking process) if present
65
+ reasoning_chunk = delta.get("reasoning_content")
66
+ if reasoning_chunk:
67
+ await websocket.send_text(reasoning_chunk)
68
+ full_response += reasoning_chunk
69
+
70
+ # Handle actual content
71
+ # We use (delta.get("content") or "") to handle cases where content is null
72
+ text_chunk = delta.get("content")
73
  if text_chunk:
74
  await websocket.send_text(text_chunk)
75
  full_response += text_chunk
76
+
77
  except Exception:
78
  continue
79
  except Exception: