hello_server

Running

App Files Files Community

Techbitforge commited on Jan 31

Commit

0af3440

verified ·

1 Parent(s): a9425db

Update app.py

Browse files

Files changed (1) hide show

app.py +125 -5

app.py CHANGED Viewed

@@ -12,11 +12,43 @@ app = Flask(__name__)
 # CONFIG
 # =========================
 Server  = [
-    "https://techbitforge-webui.hf.space/api/models",
-    "https://APINOW-service-server.hf.space",
-    "https://APINOW-service-newserver.hf.space",
 ]
 PING_INTERVAL = 120
 REQUEST_TIMEOUT = 300
@@ -30,6 +62,94 @@ logging.basicConfig(
 logger = logging.getLogger("proxy")
 # =========================
 # HEALTH CHECK
 # =========================
@@ -47,7 +167,7 @@ HEADERS = {"User-Agent": "HF-Proxy-KeepAliveBot"}
 def keep_alive_worker():
     while True:
         logger.info("Pinging HF servers...")
-        for url in Server:
             try:
                 r = requests.get(url, headers=HEADERS, timeout=8)
                 logger.info(f"{url} → {r.status_code}")

 # CONFIG
 # =========================
 Server  = [
+    "https://Techbitforge-server.hf.space"
 ]
+HF_SERVERS = [
+    "https://6lqmgwrrrn-api1.hf.space",
+    "https://6lqmgwrrrn-api2.hf.space",
+    "https://6lqmgwrrrn-api3.hf.space",
+    "https://6lqmgwrrrn-api4.hf.space",
+    "https://6lqmgwrrrn-api5.hf.space",
+    "https://6lqmgwrrrn-api6.hf.space",
+    "https://6lqmgwrrrn-api7.hf.space",
+    "https://6lqmgwrrrn-api8.hf.space",
+    "https://dokek64685-api1.hf.space",
+    "https://dokek64685-api2.hf.space",
+    "https://dokek64685-api3.hf.space",
+    "https://dokek64685-api4.hf.space",
+    "https://dokek64685-api5.hf.space",
+    "https://dokek64685-api6.hf.space",
+    "https://dokek64685-api7.hf.space",
+    "https://dokek64685-api8.hf.space",
+    "https://sayonob407-api1.hf.space",
+    "https://sayonob407-api2.hf.space",
+    "https://sayonob407-api3.hf.space",
+    "https://sayonob407-api4.hf.space",
+    "https://sayonob407-api5.hf.space",
+    "https://sayonob407-api6.hf.space",
+    "https://sayonob407-api7.hf.space",
+    "https://sayonob407-api8.hf.space",
+    "https://Shadowty491-none1.hf.space",
+    "https://Shadowty491-none2.hf.space",
+    "https://Shadowty491-none3.hf.space",
+    "https://Shadowty491-none4.hf.space",
+    "https://Shadowty491-none5.hf.space",
+    "https://Shadowty491-none6.hf.space",
+    "https://Shadowty491-none7.hf.space",
+    "https://Shadowty491-none8.hf.space",
+]
 PING_INTERVAL = 120
 REQUEST_TIMEOUT = 300
 logger = logging.getLogger("proxy")
+def pick_server() -> str:
+    return random.choice(HF_SERVERS)
+def error_response(message: str, code: int = 500):
+    logger.error(message)
+    return jsonify({
+        "error": {
+            "message": message,
+            "type": "proxy_error"
+        }
+    }), code
+# =========================
+# CHAT COMPLETIONS PROXY
+# =========================
+@app.route("/v1/chat/completions", methods=["POST"])
+def chat_completions():
+    try:
+        payload = request.get_json(force=True)
+    except Exception:
+        return error_response("Invalid JSON payload", 400)
+    headers = dict(request.headers)
+    headers.pop("Host", None)
+    target = pick_server() + "/v1/chat/completions"
+    stream = payload.get("stream", False)
+    logger.info(f"Forwarding request to {target} | Stream={stream}")
+    try:
+        if stream:
+            def generate():
+                with requests.post(
+                    target,
+                    json=payload,
+                    headers=headers,
+                    stream=True,
+                    timeout=REQUEST_TIMEOUT
+                ) as res:
+                    res.raise_for_status()
+                    for line in res.iter_lines():
+                        if line:
+                            yield line + b"\n\n"
+            return Response(
+                generate(),
+                mimetype="text/event-stream",
+                headers={"Cache-Control": "no-cache", "X-Accel-Buffering": "no"}
+            )
+        res = requests.post(
+            target,
+            json=payload,
+            headers=headers,
+            timeout=REQUEST_TIMEOUT
+        )
+        res.raise_for_status()
+        return jsonify(res.json())
+    except requests.exceptions.Timeout:
+        return error_response("Upstream server timeout", 504)
+    except requests.exceptions.ConnectionError:
+        return error_response("Failed to connect to upstream server", 502)
+    except Exception as e:
+        return error_response(str(e), 500)
+# =========================
+# MODELS ROUTE
+# =========================
+@app.route("/models", methods=["GET"])
+def models():
+    url = pick_server()
+    target = f"{url}/models"
+    logger.info(f"Fetching models from {target}")
+    try:
+        res = requests.get(target, timeout=20)
+        res.raise_for_status()
+        return jsonify(res.json())
+    except Exception as e:
+        return error_response(f"Failed to fetch models: {e}", 500)
 # =========================
 # HEALTH CHECK
 # =========================
 def keep_alive_worker():
     while True:
         logger.info("Pinging HF servers...")
+        for url in HF_SERVERS + Server:
             try:
                 r = requests.get(url, headers=HEADERS, timeout=8)
                 logger.info(f"{url} → {r.status_code}")