Spaces:
Paused
Paused
File size: 10,992 Bytes
8fea9ab 3cdbb76 8fea9ab 3cdbb76 8fea9ab 3cdbb76 8fea9ab 3cdbb76 8fea9ab 876b43a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 |
from fastapi import FastAPI, HTTPException, Request, status
from fastapi.responses import JSONResponse, HTMLResponse
from fastapi.staticfiles import StaticFiles
from fastapi.templating import Jinja2Templates
from app.models import ErrorResponse
from app.services import GeminiClient
from app.utils import (
APIKeyManager,
test_api_key,
format_log_message,
log_manager,
ResponseCacheManager,
ActiveRequestsManager,
clean_expired_stats,
update_api_call_stats,
check_version,
schedule_cache_cleanup,
handle_exception,
log
)
from app.api import router, init_router, dashboard_router, init_dashboard_router
from app.config.settings import (
FAKE_STREAMING,
FAKE_STREAMING_INTERVAL,
RANDOM_STRING,
RANDOM_STRING_LENGTH,
PASSWORD,
MAX_REQUESTS_PER_MINUTE,
MAX_REQUESTS_PER_DAY_PER_IP,
RETRY_DELAY,
MAX_RETRY_DELAY,
CACHE_EXPIRY_TIME,
MAX_CACHE_ENTRIES,
REMOVE_CACHE_AFTER_USE,
REQUEST_HISTORY_EXPIRY_TIME,
ENABLE_RECONNECT_DETECTION,
api_call_stats,
client_request_history,
version,
API_KEY_DAILY_LIMIT
)
from app.config.safety import SAFETY_SETTINGS, SAFETY_SETTINGS_G2
import os
import json
import asyncio
import time
import logging
from datetime import datetime, timedelta
import sys
import pathlib
# Template directory: the "templates" folder located next to this file.
BASE_DIR = pathlib.Path(__file__).parent
templates = Jinja2Templates(directory=str(BASE_DIR / "templates"))
app = FastAPI()
# --------------- Global instances ---------------
# Initialize the API key manager and fetch the key to start with.
key_manager = APIKeyManager()
current_api_key = key_manager.get_available_key()
# Module-level cache dict, handed to the cache manager as its internal storage.
response_cache = {}
# Initialize the cache manager, using the global dict above as storage.
response_cache_manager = ResponseCacheManager(
    expiry_time=CACHE_EXPIRY_TIME,
    max_entries=MAX_CACHE_ENTRIES,
    remove_after_use=REMOVE_CACHE_AFTER_USE,
    cache_dict=response_cache
)
# Active request pool - handed to the active-requests manager as its internal storage.
active_requests_pool = {}
# Initialize the active-requests manager.
active_requests_manager = ActiveRequestsManager(requests_pool=active_requests_pool)
# --------------- Utility functions ---------------
def switch_api_key():
    """Replace the module-level ``current_api_key`` with the next available key.

    Asks ``key_manager.get_available_key()`` for a key. When one is returned,
    it becomes ``current_api_key`` and an info entry carrying its first eight
    characters is logged. When nothing is returned, ``current_api_key`` is
    left untouched and an error entry is logged instead.
    """
    global current_api_key

    # Per the original author's note, get_available_key handles the key-stack logic.
    next_key = key_manager.get_available_key()
    if not next_key:
        log(
            'error',
            "API key 替换失败,所有API key都已尝试,请重新配置或稍后重试",
            extra={'key': 'N/A', 'request_type': 'switch_key', 'status_code': 'N/A'},
        )
        return

    current_api_key = next_key
    # Only a short prefix of the key is ever written to the log.
    key_prefix = next_key[:8]
    log(
        'info',
        f"API key 替换为 → {key_prefix}...",
        extra={'key': key_prefix, 'request_type': 'switch_key'},
    )
async def check_keys():
    """Test every key in ``key_manager.api_keys`` and return the valid ones.

    Keys are tested one after another with ``test_api_key``; the outcome of
    each test is logged together with the first ten characters of the key.
    An error entry is logged when no key passes.

    Returns:
        list: the keys for which ``test_api_key`` returned a truthy result,
        in their original order (possibly empty).
    """
    usable_keys = []
    for candidate in key_manager.api_keys:
        passed = await test_api_key(candidate)
        verdict = "有效" if passed else "无效"
        log('info', f"API Key {candidate[:10]}... {verdict}.")
        if passed:
            usable_keys.append(candidate)

    if not usable_keys:
        log(
            'error',
            "没有可用的 API 密钥!",
            extra={'key': 'N/A', 'request_type': 'startup', 'status_code': 'N/A'},
        )
    return usable_keys
# Install the global handler for uncaught exceptions.
sys.excepthook = handle_exception
# --------------- Event handlers ---------------
@app.on_event("startup")
async def startup_event():
    """Prepare the proxy when the application starts.

    Steps, in order: schedule the cache cleanup job, run the version check,
    validate the configured API keys, load the model list with the first
    valid key, then initialize the API router and the dashboard router.

    NOTE(review): the indentation of this file was lost in SOURCE; the
    nesting below (model loading inside the "keys are available" branch,
    router initialization at function level) is reconstructed - confirm
    against the upstream file.
    """
    log('info', "Starting Gemini API proxy...")

    # Start the scheduled cache cleanup task.
    schedule_cache_cleanup(response_cache_manager, active_requests_manager)

    # Version check.
    await check_version()

    verified_keys = await check_keys()
    if verified_keys:
        # Keep only the keys that passed validation.
        key_manager.api_keys = verified_keys
        # Make sure the randomized key stack is (re)built at startup as well.
        key_manager._reset_key_stack()
        key_manager.show_all_keys()
        log('info', f"可用 API 密钥数量:{len(key_manager.api_keys)}")
        log('info', f"最大重试次数设置为:{len(key_manager.api_keys)}")

        if key_manager.api_keys:
            first_key = key_manager.api_keys[0]
            raw_model_names = await GeminiClient.list_available_models(first_key)
            # Strip the "models/" marker from every returned model name.
            GeminiClient.AVAILABLE_MODELS = [
                name.replace("models/", "") for name in raw_model_names
            ]
            log('info', "Available models loaded.")

    # Initialize the API router.
    init_router(
        key_manager,
        response_cache_manager,
        active_requests_manager,
        SAFETY_SETTINGS,
        SAFETY_SETTINGS_G2,
        current_api_key,
        FAKE_STREAMING,
        FAKE_STREAMING_INTERVAL,
        PASSWORD,
        MAX_REQUESTS_PER_MINUTE,
        MAX_REQUESTS_PER_DAY_PER_IP,
    )

    # Initialize the dashboard router.
    init_dashboard_router(
        key_manager,
        response_cache_manager,
        active_requests_manager,
    )
# --------------- Exception handling ---------------
@app.exception_handler(Exception)
async def global_exception_handler(request: Request, exc: Exception):
    """Log an unhandled exception and answer with an HTTP 500 JSON body.

    The log entry carries the message produced by ``translate_error``; the
    response body carries the untranslated ``str(exc)`` wrapped in an
    ``ErrorResponse`` of type ``"internal_error"``.
    """
    # Imported at call time, as in the original code.
    from app.utils import translate_error

    raw_message = str(exc)
    translated_message = translate_error(raw_message)
    log(
        'error',
        f"Unhandled exception: {translated_message}",
        extra={'status_code': 500, 'error_message': translated_message},
    )

    payload = ErrorResponse(message=raw_message, type="internal_error").dict()
    return JSONResponse(
        status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
        content=payload,
    )
# --------------- Routes ---------------
# Register the API router and the dashboard router on the application.
app.include_router(router)
app.include_router(dashboard_router)
def _sum_recent_calls(buckets, key_format, cutoff):
    """Sum the counts of all buckets whose timestamp key is at or after *cutoff*.

    Args:
        buckets: mapping of timestamp string -> call count.
        key_format: ``strptime`` format used to parse the keys.
        cutoff: naive ``datetime``; buckets older than this are ignored.

    Keys that cannot be parsed with *key_format* are skipped.
    """
    total = 0
    for bucket_key, count in buckets.items():
        try:
            bucket_time = datetime.strptime(bucket_key, key_format)
        except ValueError:
            continue
        if bucket_time >= cutoff:
            total += count
    return total


def _summarize_cache(cache):
    """Return ``(total, valid, by_model)`` for the response cache mapping.

    ``valid`` counts entries whose ``'expiry_time'`` lies in the future;
    ``by_model`` maps the ``model`` attribute of each valid entry's
    ``'response'`` to the number of such entries.
    """
    # One timestamp for the whole scan so every entry is judged consistently.
    current_ts = time.time()
    valid = 0
    by_model = {}
    for entry in cache.values():
        if current_ts >= entry.get('expiry_time', 0):
            continue
        valid += 1
        # An entry without a 'response' (or a response without ``model``) is
        # skipped; previously the ``{}`` default raised AttributeError here.
        model = getattr(entry.get('response'), 'model', None)
        if model:
            by_model[model] = by_model.get(model, 0) + 1
    return len(cache), valid, by_model


def _collect_api_key_stats(api_keys, daily_stats, daily_limit):
    """Build the per-key usage rows, sorted by usage percentage (descending).

    Args:
        api_keys: iterable of full API key strings.
        daily_stats: the ``'last_24h'`` statistics mapping; per-key counters
            are read from its optional ``'by_endpoint'`` entry.
        daily_limit: daily call limit per key; a non-positive value yields a
            usage percentage of 0.
    """
    calls_by_key = daily_stats.get('by_endpoint', {})
    rows = []
    for api_key in api_keys:
        calls_24h = sum(calls_by_key.get(api_key, {}).values())
        usage_percent = (calls_24h / daily_limit) * 100 if daily_limit > 0 else 0
        rows.append({
            # Only the first 8 characters identify the key on the page.
            'api_key': api_key[:8],
            'calls_24h': calls_24h,
            'limit': daily_limit,
            'usage_percent': round(usage_percent, 2),
        })
    rows.sort(key=lambda row: row['usage_percent'], reverse=True)
    return rows


@app.get("/", response_class=HTMLResponse)
async def root(request: Request):
    """Render the ``index.html`` status page.

    Expired statistics, cache entries and completed requests are cleaned
    first; then call counters, recent logs, cache statistics, active-request
    counts and per-key usage are gathered and passed to the template.
    """
    # Clean expired data first so the statistics below are up to date.
    clean_expired_stats(api_call_stats)
    response_cache_manager.clean_expired()
    active_requests_manager.clean_completed()

    # Single timestamp for the whole snapshot.
    now = datetime.now()

    # Call counters: last 24 hours, last hour, last minute.
    last_24h_calls = sum(api_call_stats['last_24h']['total'].values())
    hourly_calls = _sum_recent_calls(
        api_call_stats['hourly']['total'], '%Y-%m-%d %H:00', now - timedelta(hours=1)
    )
    minute_calls = _sum_recent_calls(
        api_call_stats['minute']['total'], '%Y-%m-%d %H:%M', now - timedelta(minutes=1)
    )

    # Fetch the 500 most recent log entries.
    recent_logs = log_manager.get_recent_logs(500)

    # Cache statistics.
    total_cache, valid_cache, cache_by_model = _summarize_cache(
        response_cache_manager.cache
    )

    # Request-history statistics.
    history_count = len(client_request_history)

    # Active-request statistics.
    active_tasks = active_requests_manager.active_requests
    active_count = len(active_tasks)
    active_done = sum(1 for task in active_tasks.values() if task.done())
    active_pending = active_count - active_done

    # Per-key usage statistics.
    api_key_stats = _collect_api_key_stats(
        key_manager.api_keys, api_call_stats['last_24h'], API_KEY_DAILY_LIMIT
    )

    # Template context.
    context = {
        "key_count": len(key_manager.api_keys),
        "model_count": len(GeminiClient.AVAILABLE_MODELS),
        "retry_count": len(key_manager.api_keys),
        "last_24h_calls": last_24h_calls,
        "hourly_calls": hourly_calls,
        "minute_calls": minute_calls,
        "max_requests_per_minute": MAX_REQUESTS_PER_MINUTE,
        "max_requests_per_day_per_ip": MAX_REQUESTS_PER_DAY_PER_IP,
        "current_time": now.strftime('%H:%M:%S'),
        "logs": recent_logs,
        # Version information
        "local_version": version["local_version"],
        "remote_version": version["remote_version"],
        "has_update": version["has_update"],
        # Streaming configuration
        "fake_streaming": FAKE_STREAMING,
        "fake_streaming_interval": FAKE_STREAMING_INTERVAL,
        # Random-string configuration
        "random_string": RANDOM_STRING,
        "random_string_length": RANDOM_STRING_LENGTH,
        # Cache information
        "cache_entries": total_cache,
        "valid_cache": valid_cache,
        "expired_cache": total_cache - valid_cache,
        "cache_expiry_time": CACHE_EXPIRY_TIME,
        "max_cache_entries": MAX_CACHE_ENTRIES,
        "cache_by_model": cache_by_model,
        "request_history_count": history_count,
        "enable_reconnect_detection": ENABLE_RECONNECT_DETECTION,
        "remove_cache_after_use": REMOVE_CACHE_AFTER_USE,
        # Active-request pool information
        "active_count": active_count,
        "active_done": active_done,
        "active_pending": active_pending,
        # API key statistics
        "api_key_stats": api_key_stats,
    }

    # Render the HTML through the Jinja2 template engine.
    return templates.TemplateResponse("index.html", {"request": request, **context})