#!/usr/bin/env python3 # -*- coding: utf-8 -*- """Freebuff OpenAI API 反代代理 - Hugging Face Docker Space 版 说明: - 保留原有 OpenAI 兼容接口: - /v1/chat/completions - /v1/responses - /v1/models - /v1/reset-run - /health - 将原来的命令行/TTY 登录改为网页管理页: - / - /admin/login/start - /admin/login/status - 适配 Hugging Face Spaces: - 读取 PORT 环境变量 - 凭据优先保存到 /data(若已开通持久化存储) - 可通过 Secrets 传入 API_KEY / ADMIN_PASSWORD / ACCOUNTS_JSON """ import asyncio import json import os import platform import random import string import sys import time import uuid from pathlib import Path from typing import Any, Dict, List, Optional, Tuple from urllib.parse import quote try: import aiohttp from aiohttp import web except ImportError: print("请先安装 aiohttp: pip install aiohttp") sys.exit(1) API_BASE = os.environ.get("API_BASE", "www.codebuff.com") PORT = int(os.environ.get("PORT", "7860")) HOST = os.environ.get("HOST", "0.0.0.0") POLL_INTERVAL_S = int(os.environ.get("POLL_INTERVAL_S", "5")) TIMEOUT_S = int(os.environ.get("TIMEOUT_S", "300")) # /v1/* 访问鉴权(Bearer) PROXY_API_KEY = os.environ.get("API_KEY", "") # 管理后台鉴权(X-Admin-Password / ?password=) ADMIN_PASSWORD = os.environ.get("ADMIN_PASSWORD", "") FRONTEND_PASSWORD = os.environ.get("FRONTEND_PASSWORD", "") FRONTEND_COOKIE_NAME = "frontend_gate" MODEL_TO_AGENT = { "minimax/minimax-m2.7": "base2-free", "z-ai/glm-5.1": "base2-free", "google/gemini-2.5-flash-lite": "file-picker", "google/gemini-3.1-flash-lite-preview": "file-picker-max", "google/gemini-3.1-pro-preview": "thinker-with-files-gemini", } default_model = os.environ.get("DEFAULT_MODEL", "minimax/minimax-m2.7") # 多账号 Token 池 # token_pool 每项示例: # { # "id": "user-id", # "name": "Alice", # "email": "a@example.com", # "authToken": "...", # "credits": 0, # } token_pool: List[Dict[str, Any]] = [] next_token_index = 0 # Agent Run 缓存按 (token, agent_id) 维度维护 run_cache: Dict[Tuple[str, str], str] = {} # 等待登录态缓存:{ login_id: {fingerprintId, fingerprintHash, expiresAt, loginUrl, createdAt} } pending_logins: Dict[str, Dict[str, Any]] = {} C = { "R": "\033[0m", "B": "\033[1m", "G": "\033[32m", "Y": "\033[33m", "E": "\033[31m", "C": "\033[36m", "D": "\033[90m", } def log(msg: str, t: str = "info") -> None: c = {"success": C["G"], "error": C["E"], "warn": C["Y"]}.get(t, C["C"]) icon = {"success": "✓", "error": "✗", "warn": "⚠"}.get(t, "ℹ") print(f"{c}{icon}{C['R']} {msg}", flush=True) def token_fingerprint(auth_token: str) -> str: if not auth_token: return "none" if len(auth_token) < 12: return auth_token[:3] + "..." return f"{auth_token[:6]}...{auth_token[-4:]}" def generate_fingerprint_id() -> str: chars = string.ascii_lowercase + string.digits return f"codebuff-cli-{''.join(random.choices(chars, k=26))}" def get_config_paths() -> Tuple[Path, Path]: # Hugging Face Spaces 若启用了持久化存储,/data 会持久保存 if Path("/data").exists() and os.access("/data", os.W_OK): config_dir = Path("/data") / "manicode" return config_dir, config_dir / "credentials.json" home = Path.home() if platform.system() == "Windows": config_dir = Path(os.environ.get("APPDATA", str(home))) / "manicode" else: config_dir = home / ".config" / "manicode" return config_dir, config_dir / "credentials.json" def normalize_accounts(creds: Any) -> List[Dict[str, Any]]: """兼容旧格式(default)和新格式(accounts)。""" if not isinstance(creds, dict): return [] accounts: List[Dict[str, Any]] = [] raw_accounts = creds.get("accounts") if isinstance(raw_accounts, list): for entry in raw_accounts: if isinstance(entry, dict) and entry.get("authToken"): accounts.append({ "id": entry.get("id"), "name": entry.get("name") or "unknown", "email": entry.get("email") or "unknown", "authToken": entry.get("authToken"), "credits": entry.get("credits", 0), }) default_entry = creds.get("default") if isinstance(default_entry, dict) and default_entry.get("authToken"): default_token = default_entry.get("authToken") exists = any(acc.get("authToken") == default_token for acc in accounts) if not exists: accounts.insert(0, { "id": default_entry.get("id"), "name": default_entry.get("name") or "default", "email": default_entry.get("email") or "unknown", "authToken": default_token, "credits": default_entry.get("credits", 0), }) return accounts def load_accounts() -> List[Dict[str, Any]]: _, creds_path = get_config_paths() disk_accounts: List[Dict[str, Any]] = [] if creds_path.exists(): try: creds = json.loads(creds_path.read_text(encoding="utf-8")) disk_accounts = normalize_accounts(creds) except Exception as e: log(f"读取本地凭据失败: {e}", "warn") # 可选:通过 HF Secrets 直接注入账号池 env_accounts: List[Dict[str, Any]] = [] raw_env = os.environ.get("ACCOUNTS_JSON", "").strip() if raw_env: try: parsed = json.loads(raw_env) if isinstance(parsed, list): env_accounts = [ { "id": entry.get("id"), "name": entry.get("name") or "unknown", "email": entry.get("email") or "unknown", "authToken": entry.get("authToken"), "credits": entry.get("credits", 0), } for entry in parsed if isinstance(entry, dict) and entry.get("authToken") ] elif isinstance(parsed, dict): env_accounts = normalize_accounts(parsed) except Exception as e: log(f"解析 ACCOUNTS_JSON 失败: {e}", "warn") merged: List[Dict[str, Any]] = [] seen = set() for acc in disk_accounts + env_accounts: token = acc.get("authToken") if token and token not in seen: seen.add(token) merged.append(acc) return merged def save_accounts(accounts: List[Dict[str, Any]]) -> None: config_dir, creds_path = get_config_paths() config_dir.mkdir(parents=True, exist_ok=True) if not accounts: return # default 指向当前首个账号,兼容旧逻辑 data = { "default": { "id": accounts[0].get("id"), "name": accounts[0].get("name"), "email": accounts[0].get("email"), "authToken": accounts[0].get("authToken"), "credits": accounts[0].get("credits", 0), }, "accounts": accounts, } creds_path.write_text(json.dumps(data, indent=2, ensure_ascii=False), encoding="utf-8") async def warm_account_default_agent(session: aiohttp.ClientSession, account: Dict[str, Any]) -> Optional[str]: auth_token = account.get("authToken") if not auth_token: return None default_agent = MODEL_TO_AGENT.get(default_model, "base2-free") try: run_id = await create_agent_run(session, auth_token, default_agent) run_cache[get_run_cache_key(auth_token, default_agent)] = run_id return run_id except Exception as e: log( f"预热失败: user={account.get('name')}, token={token_fingerprint(auth_token)}, err={e}", "warn", ) return None def append_account(user_obj: Dict[str, Any]) -> Tuple[bool, Dict[str, Any]]: """把新登录账号追加到 token 池并持久化(按 authToken 去重)。""" global token_pool new_acc = { "id": user_obj.get("id"), "name": user_obj.get("name") or "unknown", "email": user_obj.get("email") or "unknown", "authToken": user_obj.get("authToken") or user_obj.get("auth_token"), "credits": user_obj.get("credits", 0), } if not new_acc["authToken"]: raise RuntimeError("登录返回中缺少 authToken") existing = {acc.get("authToken") for acc in token_pool} if new_acc["authToken"] not in existing: token_pool.append(new_acc) save_accounts(token_pool) return True, new_acc return False, new_acc def pick_next_account() -> Tuple[Dict[str, Any], int]: """轮询选择下一个账号。""" global next_token_index if not token_pool: raise RuntimeError("没有可用 token,请先在管理页添加至少一个账号") idx = next_token_index % len(token_pool) next_token_index = (next_token_index + 1) % len(token_pool) return token_pool[idx], idx def get_run_cache_key(auth_token: str, agent_id: str) -> Tuple[str, str]: return auth_token, agent_id # ============ HTTP 请求 ============ async def api_request( session: aiohttp.ClientSession, hostname: str, path: str, body: Optional[Dict[str, Any]] = None, auth_token: Optional[str] = None, method: str = "POST", ) -> Dict[str, Any]: url = f"https://{hostname}{path}" headers = { "Content-Type": "application/json", "Accept": "application/json", "User-Agent": "freebuff-proxy/1.0", } if auth_token: headers["Authorization"] = f"Bearer {auth_token}" kwargs: Dict[str, Any] = { "headers": headers, "timeout": aiohttp.ClientTimeout(total=30), } if body is not None and method.upper() != "GET": kwargs["json"] = body async with session.request(method.upper(), url, **kwargs) as resp: try: data = await resp.json() except Exception: data = await resp.text() return {"status": resp.status, "data": data} # ============ 登录流程(网页版) ============ async def start_login_flow(session: aiohttp.ClientSession) -> Dict[str, Any]: fp_id = generate_fingerprint_id() res = await api_request(session, "freebuff.com", "/api/auth/cli/code", {"fingerprintId": fp_id}) if res["status"] != 200 or "loginUrl" not in res["data"]: raise RuntimeError(f"获取登录 URL 失败: {res['data']}") d = res["data"] login_id = uuid.uuid4().hex pending_logins[login_id] = { "fingerprintId": fp_id, "fingerprintHash": d["fingerprintHash"], "expiresAt": d["expiresAt"], "loginUrl": d["loginUrl"], "createdAt": time.time(), } return { "loginId": login_id, "fingerprintId": fp_id, "fingerprintHash": d["fingerprintHash"], "expiresAt": d["expiresAt"], "loginUrl": d["loginUrl"], } async def poll_login_status(session: aiohttp.ClientSession, login_id: str) -> Dict[str, Any]: pending = pending_logins.get(login_id) if not pending: raise RuntimeError("loginId 不存在或已过期") # 清理超过 TIMEOUT_S 的登录任务 if time.time() - float(pending.get("createdAt", 0)) > TIMEOUT_S: pending_logins.pop(login_id, None) raise RuntimeError("登录已超时,请重新发起") path = ( f"/api/auth/cli/status?fingerprintId={quote(str(pending['fingerprintId']))}" f"&fingerprintHash={quote(str(pending['fingerprintHash']))}" f"&expiresAt={quote(str(pending['expiresAt']))}" ) sr = await api_request(session, "freebuff.com", path, method="GET") if sr["status"] == 200 and isinstance(sr["data"], dict) and "user" in sr["data"]: user = sr["data"]["user"] added, new_acc = append_account(user) pending_logins.pop(login_id, None) await warm_account_default_agent(session, new_acc) return { "status": "success", "added": added, "user": { "id": new_acc.get("id"), "name": new_acc.get("name"), "email": new_acc.get("email"), "credits": new_acc.get("credits", 0), "token": token_fingerprint(new_acc.get("authToken", "")), }, } return { "status": "pending", "message": "尚未完成登录,请在新标签页完成授权后继续轮询", "upstream": sr.get("data"), } # ============ Freebuff API ============ async def create_agent_run(session: aiohttp.ClientSession, auth_token: str, agent_id: str) -> str: t = time.time() res = await api_request( session, API_BASE, "/api/v1/agent-runs", {"action": "START", "agentId": agent_id}, auth_token, ) ms = int((time.time() - t) * 1000) if res["status"] != 200 or "runId" not in res["data"]: raise RuntimeError(f"创建 Agent Run 失败: {json.dumps(res['data'], ensure_ascii=False)}") log(f"创建新 Agent Run: {res['data']['runId']} (耗时 {ms}ms, token={token_fingerprint(auth_token)})") return res["data"]["runId"] async def get_or_create_agent_run(session: aiohttp.ClientSession, auth_token: str, agent_id: str) -> str: key = get_run_cache_key(auth_token, agent_id) run_id = run_cache.get(key) if run_id: return run_id run_id = await create_agent_run(session, auth_token, agent_id) run_cache[key] = run_id return run_id async def finish_agent_run(session: aiohttp.ClientSession, auth_token: str, run_id: str) -> None: await api_request(session, API_BASE, "/api/v1/agent-runs", { "action": "FINISH", "runId": run_id, "status": "completed", "totalSteps": 1, "directCredits": 0, "totalCredits": 0, }, auth_token) def make_freebuff_body(openai_body: Dict[str, Any], run_id: str) -> Dict[str, Any]: body = dict(openai_body) body["codebuff_metadata"] = { "run_id": run_id, "client_id": f"freebuff-proxy-{''.join(random.choices(string.ascii_lowercase + string.digits, k=8))}", "cost_mode": "free", } return body def build_openai_response(run_id: str, model: str, choice_data: Dict[str, Any], usage_data: Optional[Dict[str, Any]] = None) -> Dict[str, Any]: choice = choice_data or {} message = choice.get("message", {}) resp = { "id": f"freebuff-{run_id}", "object": "chat.completion", "created": int(time.time()), "model": model, "choices": [{ "index": 0, "message": { "role": "assistant", "content": message.get("content", ""), }, "finish_reason": choice.get("finish_reason", "stop"), }], "usage": { "prompt_tokens": (usage_data or {}).get("prompt_tokens", 0), "completion_tokens": (usage_data or {}).get("completion_tokens", 0), "total_tokens": (usage_data or {}).get("total_tokens", 0), }, } if message.get("tool_calls"): resp["choices"][0]["message"]["tool_calls"] = message["tool_calls"] return resp # ============ 流式转发 ============ async def stream_to_openai_format( session: aiohttp.ClientSession, freebuff_body: Dict[str, Any], auth_token: str, response: web.StreamResponse, model: str, ) -> None: url = f"https://{API_BASE}/api/v1/chat/completions" headers = { "Content-Type": "application/json", "Authorization": f"Bearer {auth_token}", "Accept": "text/event-stream", "User-Agent": "freebuff-proxy/1.0", } response_id = f"freebuff-{int(time.time() * 1000)}" finish_reason = "stop" timeout = aiohttp.ClientTimeout(total=120) async with session.post(url, json=freebuff_body, headers=headers, timeout=timeout) as resp: if resp.status != 200: err = await resp.text() raise RuntimeError(f"HTTP {resp.status}: {err}") buffer = "" async for chunk in resp.content.iter_any(): buffer += chunk.decode("utf-8", errors="replace") lines = buffer.split("\n") buffer = lines.pop() for line in lines: trimmed = line.strip() if not trimmed or not trimmed.startswith("data: "): continue json_str = trimmed[6:].strip() if json_str == "[DONE]": await response.write(b"data: [DONE]\n\n") continue try: parsed = json.loads(json_str) delta = (parsed.get("choices") or [{}])[0].get("delta", {}) cfr = (parsed.get("choices") or [{}])[0].get("finish_reason") if cfr: finish_reason = cfr delta_obj: Dict[str, Any] = {} if delta.get("content"): delta_obj["content"] = delta["content"] if delta.get("tool_calls"): delta_obj["tool_calls"] = delta["tool_calls"] if delta.get("role"): delta_obj["role"] = delta["role"] if delta_obj: openai_chunk = { "id": response_id, "object": "chat.completion.chunk", "created": int(time.time()), "model": model, "choices": [{"index": 0, "delta": delta_obj, "finish_reason": None}], } await response.write(f"data: {json.dumps(openai_chunk, ensure_ascii=False)}\n\n".encode()) except Exception: pass final_chunk = { "id": response_id, "object": "chat.completion.chunk", "created": int(time.time()), "model": model, "choices": [{"index": 0, "delta": {}, "finish_reason": finish_reason}], } await response.write(f"data: {json.dumps(final_chunk, ensure_ascii=False)}\n\n".encode()) await response.write(b"data: [DONE]\n\n") await response.write_eof() # ============ 鉴权中间件 ============ @web.middleware async def auth_middleware(request: web.Request, handler): """当 PROXY_API_KEY 非空时,对 /v1/* 路由强制验证 Bearer token。""" if PROXY_API_KEY and request.path.startswith("/v1/"): auth_header = request.headers.get("Authorization", "") token = auth_header[7:] if auth_header.startswith("Bearer ") else "" if token != PROXY_API_KEY: log(f"鉴权失败: path={request.path}, ip={request.remote}", "warn") return web.json_response( {"error": {"message": "Incorrect API key provided", "type": "invalid_request_error", "code": "invalid_api_key"}}, status=401, ) return await handler(request) def require_admin(request: web.Request) -> Optional[web.Response]: if not ADMIN_PASSWORD: return None supplied = request.headers.get("X-Admin-Password") or request.query.get("password") or "" if supplied != ADMIN_PASSWORD: return web.json_response({"error": {"message": "Admin password required"}}, status=401) return None def get_frontend_gate_password() -> str: return FRONTEND_PASSWORD or ADMIN_PASSWORD def is_frontend_allowed(request: web.Request) -> bool: gate_password = get_frontend_gate_password() if not gate_password: return True return request.cookies.get(FRONTEND_COOKIE_NAME) == gate_password def frontend_gate_page(error: str = "") -> str: escaped_error = quote(error) if error else "" return f""" 进入管理页

进入管理页

这个页面已加简单门禁。输入访问密码后才会展示前端管理面板。

{error}

默认优先读取 FRONTEND_PASSWORD;如果没设置,会回退使用 ADMIN_PASSWORD

""" # ============ Responses API 辅助函数 ============ def _responses_parse_input(data: Dict[str, Any]) -> List[Dict[str, Any]]: """将 Responses API 的 input 字段转换为 OpenAI messages 列表。""" raw_input = data.get("input", "") instructions = data.get("instructions", "") messages: List[Dict[str, Any]] = [] if instructions: messages.append({"role": "system", "content": instructions}) if isinstance(raw_input, str): if raw_input: messages.append({"role": "user", "content": raw_input}) elif isinstance(raw_input, list): for item in raw_input: if isinstance(item, str): messages.append({"role": "user", "content": item}) elif isinstance(item, dict): role = item.get("role", "user") content = item.get("content", "") item_type = item.get("type", "") if item_type == "function_call_output": messages.append({ "role": "tool", "tool_call_id": item.get("call_id", ""), "content": item.get("output", ""), }) elif role in ("user", "assistant", "system", "developer"): if role == "developer": role = "system" if isinstance(content, list): text_parts: List[str] = [] for part in content: if isinstance(part, dict): if part.get("type") in ("input_text", "text"): text_parts.append(part.get("text", "")) elif isinstance(part, str): text_parts.append(part) content = "".join(text_parts) messages.append({"role": role, "content": content}) return messages def _responses_make_base(resp_id: str, model: str, created: float, instructions: Optional[str] = None, status: str = "completed") -> Dict[str, Any]: return { "id": resp_id, "object": "response", "created_at": created, "status": status, "model": model, "output": [], "parallel_tool_calls": True, "tool_choice": "auto", "tools": [], "temperature": 1.0, "top_p": 1.0, "max_output_tokens": None, "truncation": "disabled", "instructions": instructions, "metadata": {}, "incomplete_details": None, "error": None, "usage": None, } # ============ 路由处理 ============ async def handle_chat_completion(request: web.Request) -> web.StreamResponse: start = time.time() session: aiohttp.ClientSession = request.app["client_session"] try: body = await request.json() except Exception: return web.json_response({"error": {"message": "Invalid JSON body"}}, status=400) model = body.get("model", default_model) agent_id = MODEL_TO_AGENT.get(model, "base2-free") try: account, account_idx = pick_next_account() auth_token = account["authToken"] except Exception as e: return web.json_response({"error": {"message": str(e)}}, status=503) log( "收到请求: " f"model={model}, messages={len(body.get('messages', []))}, stream={body.get('stream', False)}, " f"account_index={account_idx}, user={account.get('name')}, token={token_fingerprint(auth_token)}" ) try: run_id = await get_or_create_agent_run(session, auth_token, agent_id) except Exception as e: return web.json_response({"error": {"message": str(e)}}, status=500) fb_body = make_freebuff_body(body, run_id) try: if body.get("stream"): response = web.StreamResponse( status=200, headers={"Content-Type": "text/event-stream", "Cache-Control": "no-cache", "Connection": "keep-alive"}, ) await response.prepare(request) await stream_to_openai_format(session, fb_body, auth_token, response, model) log(f"请求完成,总耗时 {int((time.time() - start) * 1000)}ms", "success") return response res = await api_request(session, API_BASE, "/api/v1/chat/completions", fb_body, auth_token) if res["status"] == 200: choice = (res["data"].get("choices") or [{}])[0] resp = build_openai_response(run_id, model, choice, res["data"].get("usage")) log(f"请求完成,总耗时 {int((time.time() - start) * 1000)}ms", "success") return web.json_response(resp) if res["status"] in (400, 404): log("Agent Run 失效,重新创建...", "warn") run_cache.pop(get_run_cache_key(auth_token, agent_id), None) run_id = await get_or_create_agent_run(session, auth_token, agent_id) fb_body["codebuff_metadata"]["run_id"] = run_id retry = await api_request(session, API_BASE, "/api/v1/chat/completions", fb_body, auth_token) if retry["status"] == 200: choice = (retry["data"].get("choices") or [{}])[0] resp = build_openai_response(run_id, model, choice, retry["data"].get("usage")) log(f"重试成功,总耗时 {int((time.time() - start) * 1000)}ms", "success") return web.json_response(resp) return web.json_response({"error": {"message": retry["data"]}}, status=retry["status"]) return web.json_response({"error": {"message": res["data"]}}, status=res["status"]) except Exception as e: log(f"请求失败: {e}", "error") return web.json_response({"error": {"message": str(e)}}, status=500) async def handle_responses(request: web.Request) -> web.StreamResponse: """OpenAI Responses API 兼容端点 /v1/responses。""" start = time.time() session: aiohttp.ClientSession = request.app["client_session"] try: data = await request.json() except Exception: return web.json_response({"error": {"message": "Invalid JSON body"}}, status=400) model = data.get("model", default_model) stream = data.get("stream", False) instructions = data.get("instructions") agent_id = MODEL_TO_AGENT.get(model, "base2-free") messages = _responses_parse_input(data) if not messages: return web.json_response({"error": {"message": "input is required", "type": "invalid_request_error"}}, status=400) try: account, account_idx = pick_next_account() auth_token = account["authToken"] except Exception as e: return web.json_response({"error": {"message": str(e)}}, status=503) log( f"收到 Responses API 请求: model={model}, msgs={len(messages)}, stream={stream}, " f"account_index={account_idx}, user={account.get('name')}, token={token_fingerprint(auth_token)}" ) try: run_id = await get_or_create_agent_run(session, auth_token, agent_id) except Exception as e: return web.json_response({"error": {"message": str(e)}}, status=500) fb_body = make_freebuff_body({"model": model, "messages": messages, "stream": True}, run_id) resp_id = f"resp_{int(time.time() * 1000)}" msg_id = f"msg_{int(time.time() * 1000)}" created = time.time() msg_chars = sum(len(str(m.get("content", ""))) for m in messages) url = f"https://{API_BASE}/api/v1/chat/completions" headers = { "Content-Type": "application/json", "Authorization": f"Bearer {auth_token}", "Accept": "text/event-stream", "User-Agent": "freebuff-proxy/1.0", } try: if stream: response = web.StreamResponse( status=200, headers={"Content-Type": "text/event-stream", "Cache-Control": "no-cache", "Connection": "keep-alive"}, ) await response.prepare(request) timeout = aiohttp.ClientTimeout(total=120) async with session.post(url, json=fb_body, headers=headers, timeout=timeout) as upstream_resp: if upstream_resp.status != 200: err = await upstream_resp.text() raise RuntimeError(f"HTTP {upstream_resp.status}: {err}") seq = 0 full_text_parts: List[str] = [] base = _responses_make_base(resp_id, model, created, instructions, "in_progress") async def emit(event_type: str, payload: Dict[str, Any]) -> None: nonlocal seq data_str = json.dumps({"type": event_type, "sequence_number": seq, **payload}, ensure_ascii=False) await response.write(f"event: {event_type}\ndata: {data_str}\n\n".encode()) seq += 1 await emit("response.created", {"response": base}) await emit("response.in_progress", {"response": base}) item_skeleton = {"id": msg_id, "type": "message", "role": "assistant", "status": "in_progress", "content": []} await emit("response.output_item.added", {"output_index": 0, "item": item_skeleton}) part_skeleton = {"type": "output_text", "text": "", "annotations": []} await emit("response.content_part.added", {"item_id": msg_id, "output_index": 0, "content_index": 0, "part": part_skeleton}) buffer = "" async for chunk in upstream_resp.content.iter_any(): buffer += chunk.decode("utf-8", errors="replace") lines = buffer.split("\n") buffer = lines.pop() for line in lines: trimmed = line.strip() if not trimmed or not trimmed.startswith("data: "): continue json_str = trimmed[6:].strip() if json_str == "[DONE]": continue try: parsed = json.loads(json_str) delta_content = (parsed.get("choices") or [{}])[0].get("delta", {}).get("content", "") if delta_content: full_text_parts.append(delta_content) await emit("response.output_text.delta", { "item_id": msg_id, "output_index": 0, "content_index": 0, "delta": delta_content, }) except Exception: pass full_text = "".join(full_text_parts) await emit("response.output_text.done", { "item_id": msg_id, "output_index": 0, "content_index": 0, "text": full_text, }) done_part = {"type": "output_text", "text": full_text, "annotations": []} await emit("response.content_part.done", { "item_id": msg_id, "output_index": 0, "content_index": 0, "part": done_part, }) done_item = {"id": msg_id, "type": "message", "role": "assistant", "status": "completed", "content": [done_part]} await emit("response.output_item.done", {"output_index": 0, "item": done_item}) usage = { "input_tokens": msg_chars // 4, "input_tokens_details": {"cached_tokens": 0}, "output_tokens": len(full_text) // 4, "output_tokens_details": {"reasoning_tokens": 0}, "total_tokens": (msg_chars + len(full_text)) // 4, } final = _responses_make_base(resp_id, model, created, instructions, "completed") final["output"] = [done_item] final["usage"] = usage await emit("response.completed", {"response": final}) await response.write_eof() log(f"Responses API 请求完成,总耗时 {int((time.time() - start) * 1000)}ms", "success") return response timeout = aiohttp.ClientTimeout(total=120) content_parts: List[str] = [] async with session.post(url, json=fb_body, headers=headers, timeout=timeout) as upstream_resp: if upstream_resp.status != 200: err = await upstream_resp.text() if upstream_resp.status in (400, 404): log("Responses API: Agent Run 失效,重新创建...", "warn") run_cache.pop(get_run_cache_key(auth_token, agent_id), None) run_id = await get_or_create_agent_run(session, auth_token, agent_id) fb_body["codebuff_metadata"]["run_id"] = run_id async with session.post(url, json=fb_body, headers=headers, timeout=timeout) as retry_resp: if retry_resp.status != 200: raise RuntimeError(f"HTTP {retry_resp.status}: {await retry_resp.text()}") buffer = "" async for chunk in retry_resp.content.iter_any(): buffer += chunk.decode("utf-8", errors="replace") for line in buffer.split("\n"): trimmed = line.strip() if not trimmed or not trimmed.startswith("data: "): continue json_str = trimmed[6:].strip() if json_str == "[DONE]": continue try: parsed = json.loads(json_str) c = (parsed.get("choices") or [{}])[0].get("delta", {}).get("content", "") if c: content_parts.append(c) except Exception: pass else: raise RuntimeError(f"HTTP {upstream_resp.status}: {err}") else: buffer = "" async for chunk in upstream_resp.content.iter_any(): buffer += chunk.decode("utf-8", errors="replace") for line in buffer.split("\n"): trimmed = line.strip() if not trimmed or not trimmed.startswith("data: "): continue json_str = trimmed[6:].strip() if json_str == "[DONE]": continue try: parsed = json.loads(json_str) c = (parsed.get("choices") or [{}])[0].get("delta", {}).get("content", "") if c: content_parts.append(c) except Exception: pass full_text = "".join(content_parts) output_item = { "id": msg_id, "type": "message", "role": "assistant", "status": "completed", "content": [{"type": "output_text", "text": full_text, "annotations": []}], } usage = { "input_tokens": msg_chars // 4, "input_tokens_details": {"cached_tokens": 0}, "output_tokens": len(full_text) // 4, "output_tokens_details": {"reasoning_tokens": 0}, "total_tokens": (msg_chars + len(full_text)) // 4, } result = _responses_make_base(resp_id, model, created, instructions, "completed") result["output"] = [output_item] result["usage"] = usage log(f"Responses API 请求完成,总耗时 {int((time.time() - start) * 1000)}ms", "success") return web.json_response(result) except Exception as e: log(f"Responses API 请求失败: {e}", "error") return web.json_response({"error": {"message": str(e)}}, status=500) async def handle_models(request: web.Request) -> web.Response: models = [{"id": m, "object": "model", "created": 1700000000, "owned_by": "freebuff"} for m in MODEL_TO_AGENT] return web.json_response({"object": "list", "data": models}) async def handle_reset_run(request: web.Request) -> web.Response: run_cache.clear() log("Agent Run 缓存已清除") return web.json_response({"status": "cleared"}) async def handle_health(request: web.Request) -> web.Response: config_dir, creds_path = get_config_paths() account_brief = [ { "index": i, "name": acc.get("name"), "email": acc.get("email"), "token": token_fingerprint(acc.get("authToken", "")), } for i, acc in enumerate(token_pool) ] return web.json_response({ "status": "ok", "model": default_model, "accounts": account_brief, "accountCount": len(token_pool), "nextAccountIndex": next_token_index, "cachedRunCount": len(run_cache), "storage": { "configDir": str(config_dir), "credentialsFile": str(creds_path), "persistentDataMounted": Path("/data").exists(), }, "security": { "apiKeyEnabled": bool(PROXY_API_KEY), "adminPasswordEnabled": bool(ADMIN_PASSWORD), "frontendPasswordEnabled": bool(get_frontend_gate_password()), }, }) async def handle_root(request: web.Request) -> web.Response: if not is_frontend_allowed(request): return web.Response(text=frontend_gate_page(), content_type="text/html") html = f""" Freebuff OpenAI Proxy - HF Space

Freebuff OpenAI Proxy · Hugging Face Space

保留原脚本的 OpenAI 兼容接口、Responses API、账号池轮询、Run 缓存、健康检查与重置能力,并把登录迁移到网页管理页。

{('
' if get_frontend_gate_password() else '')}
聊天接口
POST /v1/chat/completions
Responses API
POST /v1/responses
模型列表 / 健康检查
GET /v1/models
GET /health

管理权限

如果你设置了 ADMIN_PASSWORD,请先输入。它只用于管理页,不影响 /v1 接口。/v1 接口仍由 API_KEY 控制。

账号管理

登录后账号会写入凭据文件。若 Space 挂载了持久化存储,会写入 /data/manicode/credentials.json

尚未发起登录。

当前状态

加载中...

调用示例

curl {(' -H "Authorization: Bearer ' + PROXY_API_KEY + '"') if PROXY_API_KEY else ''} \
  -H "Content-Type: application/json" \
  -X POST "./v1/chat/completions" \
  -d '{{
    "model": "{default_model}",
    "messages": [{{"role": "user", "content": "你好"}}],
    "stream": false
  }}'

在浏览器中用相对路径展示;实际接入请替换成你的 Space 域名。

""" return web.Response(text=html, content_type="text/html") async def handle_frontend_login(request: web.Request) -> web.Response: gate_password = get_frontend_gate_password() if not gate_password: raise web.HTTPFound("/") data = await request.post() supplied = (data.get("password") or "").strip() if supplied != gate_password: return web.Response(text=frontend_gate_page("密码错误,请重试"), content_type="text/html", status=401) response = web.HTTPFound("/") response.set_cookie( FRONTEND_COOKIE_NAME, gate_password, max_age=7 * 24 * 60 * 60, httponly=True, samesite="Lax", ) raise response async def handle_frontend_logout(request: web.Request) -> web.Response: response = web.HTTPFound("/") response.del_cookie(FRONTEND_COOKIE_NAME) raise response async def handle_admin_login_start(request: web.Request) -> web.Response: denied = require_admin(request) if denied: return denied session: aiohttp.ClientSession = request.app["client_session"] try: payload = await start_login_flow(session) return web.json_response(payload) except Exception as e: return web.json_response({"error": {"message": str(e)}}, status=500) async def handle_admin_login_status(request: web.Request) -> web.Response: denied = require_admin(request) if denied: return denied session: aiohttp.ClientSession = request.app["client_session"] login_id = request.query.get("loginId", "") if not login_id: return web.json_response({"error": {"message": "loginId is required"}}, status=400) try: payload = await poll_login_status(session, login_id) return web.json_response(payload) except Exception as e: return web.json_response({"error": {"message": str(e)}}, status=400) # ============ App 生命周期 ============ async def on_startup(app: web.Application) -> None: global token_pool session = aiohttp.ClientSession() app["client_session"] = session token_pool = load_accounts() if token_pool: log(f"已加载账号池: {len(token_pool)} 个") for i, acc in enumerate(token_pool): log( f" [{i}] {acc.get('name')} <{acc.get('email')}> token={token_fingerprint(acc.get('authToken', ''))}" ) log("预热:为账号池创建默认 Agent Run...") warmed = 0 for acc in token_pool: run_id = await warm_account_default_agent(session, acc) if run_id: warmed += 1 if warmed: log(f"预热完成,已缓存 {warmed} 个默认 Agent Run", "success") else: log("当前没有已预热账号;可在管理页登录新增账号", "warn") async def on_cleanup(app: web.Application) -> None: session: aiohttp.ClientSession = app["client_session"] if run_cache: log("关闭代理,结束全部缓存 Agent Run...") for (auth_token, _agent_id), run_id in list(run_cache.items()): try: await finish_agent_run(session, auth_token, run_id) except Exception: pass log("Agent Run 清理完成", "success") await session.close() def create_app() -> web.Application: app = web.Application(middlewares=[auth_middleware], client_max_size=20 * 1024 * 1024) app.on_startup.append(on_startup) app.on_cleanup.append(on_cleanup) app.router.add_get("/", handle_root) app.router.add_post("/gate/login", handle_frontend_login) app.router.add_post("/gate/logout", handle_frontend_logout) app.router.add_get("/health", handle_health) app.router.add_post("/v1/chat/completions", handle_chat_completion) app.router.add_post("/v1/responses", handle_responses) app.router.add_get("/v1/models", handle_models) app.router.add_post("/v1/reset-run", handle_reset_run) app.router.add_post("/admin/login/start", handle_admin_login_start) app.router.add_get("/admin/login/status", handle_admin_login_status) return app if __name__ == "__main__": app = create_app() log(f"代理地址: http://{HOST}:{PORT}/v1/chat/completions") log(f"Responses: http://{HOST}:{PORT}/v1/responses") log(f"模型列表: http://{HOST}:{PORT}/v1/models") log(f"重置缓存: http://{HOST}:{PORT}/v1/reset-run (POST)") log(f"健康检查: http://{HOST}:{PORT}/health") if PROXY_API_KEY: log(f"API 鉴权: 已启用 (Bearer {token_fingerprint(PROXY_API_KEY)})", "success") else: log("API 鉴权: 未启用(所有 /v1 请求均可访问)", "warn") if ADMIN_PASSWORD: log("管理页鉴权: 已启用", "success") else: log("管理页鉴权: 未启用", "warn") web.run_app(app, host=HOST, port=PORT)