Spaces:

smyslenny
/

gemini

Paused

App Files Files Community

gemini / app /main.py

smyslenny

Upload 38 files

8e2bad6 verified about 1 year ago

raw

history blame contribute delete

10.4 kB

	from fastapi import FastAPI, HTTPException, Request, status
	from fastapi.responses import JSONResponse, HTMLResponse
	from fastapi.staticfiles import StaticFiles
	from fastapi.templating import Jinja2Templates
	from app.models import ErrorResponse
	from app.services import GeminiClient
	from app.utils import (
	APIKeyManager,
	test_api_key,
	format_log_message,
	log_manager,
	ResponseCacheManager,
	ActiveRequestsManager,
	clean_expired_stats,
	update_api_call_stats,
	check_version,
	schedule_cache_cleanup,
	handle_exception,
	log
	)
	from app.api import router, init_router, dashboard_router, init_dashboard_router
	from app.config.settings import (
	FAKE_STREAMING,
	FAKE_STREAMING_INTERVAL,
	PASSWORD,
	MAX_REQUESTS_PER_MINUTE,
	MAX_REQUESTS_PER_DAY_PER_IP,
	RETRY_DELAY,
	MAX_RETRY_DELAY,
	CACHE_EXPIRY_TIME,
	MAX_CACHE_ENTRIES,
	REMOVE_CACHE_AFTER_USE,
	REQUEST_HISTORY_EXPIRY_TIME,
	ENABLE_RECONNECT_DETECTION,
	api_call_stats,
	client_request_history,
	local_version,
	remote_version,
	has_update,
	API_KEY_DAILY_LIMIT
	)
	from app.config.safety import SAFETY_SETTINGS, SAFETY_SETTINGS_G2
	import os
	import json
	import asyncio
	import time
	import logging
	from datetime import datetime, timedelta
	import sys
	import pathlib

	# 设置模板目录
	BASE_DIR = pathlib.Path(__file__).parent
	templates = Jinja2Templates(directory=str(BASE_DIR / "templates"))

	app = FastAPI()

	# --------------- 全局实例 ---------------

	# 初始化API密钥管理器
	key_manager = APIKeyManager()
	current_api_key = key_manager.get_available_key()

	# 创建全局缓存字典，将作为缓存管理器的内部存储
	response_cache = {}

	# 初始化缓存管理器，使用全局字典作为存储
	response_cache_manager = ResponseCacheManager(
	expiry_time=CACHE_EXPIRY_TIME,
	max_entries=MAX_CACHE_ENTRIES,
	remove_after_use=REMOVE_CACHE_AFTER_USE,
	cache_dict=response_cache
	)

	# 活跃请求池 - 将作为活跃请求管理器的内部存储
	active_requests_pool = {}

	# 初始化活跃请求管理器
	active_requests_manager = ActiveRequestsManager(requests_pool=active_requests_pool)

	# --------------- 工具函数 ---------------

	def switch_api_key():
	global current_api_key
	key = key_manager.get_available_key() # get_available_key 会处理栈的逻辑
	if key:
	current_api_key = key
	log('info', f"API key 替换为 → {current_api_key[:8]}...", extra={'key': current_api_key[:8], 'request_type': 'switch_key'})
	else:
	log('error', "API key 替换失败，所有API key都已尝试，请重新配置或稍后重试", extra={'key': 'N/A', 'request_type': 'switch_key', 'status_code': 'N/A'})

	async def check_keys():
	available_keys = []
	for key in key_manager.api_keys:
	is_valid = await test_api_key(key)
	status_msg = "有效" if is_valid else "无效"
	log('info', f"API Key {key[:10]}... {status_msg}.")
	if is_valid:
	available_keys.append(key)
	if not available_keys:
	log('error', "没有可用的 API 密钥！", extra={'key': 'N/A', 'request_type': 'startup', 'status_code': 'N/A'})
	return available_keys

	# 设置全局异常处理
	sys.excepthook = handle_exception

	# --------------- 事件处理 ---------------

	@app.on_event("startup")
	async def startup_event():
	log('info', "Starting Gemini API proxy...")

	# 启动缓存清理定时任务
	schedule_cache_cleanup(response_cache_manager, active_requests_manager)

	# 检查版本
	await check_version()

	available_keys = await check_keys()
	if available_keys:
	key_manager.api_keys = available_keys
	key_manager._reset_key_stack() # 启动时也确保创建随机栈
	key_manager.show_all_keys()
	log('info', f"可用 API 密钥数量：{len(key_manager.api_keys)}")
	log('info', f"最大重试次数设置为：{len(key_manager.api_keys)}")
	if key_manager.api_keys:
	all_models = await GeminiClient.list_available_models(key_manager.api_keys[0])
	GeminiClient.AVAILABLE_MODELS = [model.replace(
	"models/", "") for model in all_models]
	log('info', "Available models loaded.")

	# 初始化路由器
	init_router(
	key_manager,
	response_cache_manager,
	active_requests_manager,
	SAFETY_SETTINGS,
	SAFETY_SETTINGS_G2,
	current_api_key,
	FAKE_STREAMING,
	FAKE_STREAMING_INTERVAL,
	PASSWORD,
	MAX_REQUESTS_PER_MINUTE,
	MAX_REQUESTS_PER_DAY_PER_IP
	)

	# 初始化仪表盘路由器
	init_dashboard_router(
	key_manager,
	response_cache_manager,
	active_requests_manager
	)

	# --------------- 异常处理 ---------------

	@app.exception_handler(Exception)
	async def global_exception_handler(request: Request, exc: Exception):
	from app.utils import translate_error
	error_message = translate_error(str(exc))
	extra_log_unhandled_exception = {'status_code': 500, 'error_message': error_message}
	log('error', f"Unhandled exception: {error_message}", extra=extra_log_unhandled_exception)
	return JSONResponse(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, content=ErrorResponse(message=str(exc), type="internal_error").dict())

	# --------------- 路由 ---------------

	# 包含API路由
	app.include_router(router)
	app.include_router(dashboard_router)

	@app.get("/", response_class=HTMLResponse)
	async def root(request: Request):
	# 先清理过期数据，确保统计数据是最新的
	clean_expired_stats(api_call_stats)
	response_cache_manager.clean_expired() # 使用管理器清理缓存
	active_requests_manager.clean_completed() # 使用管理器清理活跃请求
	# 获取当前统计数据
	now = datetime.now()

	# 计算过去24小时的调用总数
	last_24h_calls = sum(api_call_stats['last_24h']['total'].values())

	# 计算过去一小时内的调用总数
	one_hour_ago = now - timedelta(hours=1)
	hourly_calls = 0
	for hour_key, count in api_call_stats['hourly']['total'].items():
	try:
	hour_time = datetime.strptime(hour_key, '%Y-%m-%d %H:00')
	if hour_time >= one_hour_ago:
	hourly_calls += count
	except ValueError:
	continue

	# 计算过去一分钟内的调用总数
	one_minute_ago = now - timedelta(minutes=1)
	minute_calls = 0
	for minute_key, count in api_call_stats['minute']['total'].items():
	try:
	minute_time = datetime.strptime(minute_key, '%Y-%m-%d %H:%M')
	if minute_time >= one_minute_ago:
	minute_calls += count
	except ValueError:
	continue

	# 获取最近的日志
	recent_logs = log_manager.get_recent_logs(50) # 获取最近50条日志

	# 获取缓存统计
	total_cache = len(response_cache_manager.cache)
	valid_cache = sum(1 for _, data in response_cache_manager.cache.items()
	if time.time() < data.get('expiry_time', 0))
	cache_by_model = {}

	# 分析缓存数据
	for _, cache_data in response_cache_manager.cache.items():
	if time.time() < cache_data.get('expiry_time', 0):
	# 按模型统计缓存
	model = cache_data.get('response', {}).model
	if model:
	if model in cache_by_model:
	cache_by_model[model] += 1
	else:
	cache_by_model[model] = 1

	# 获取请求历史统计
	history_count = len(client_request_history)

	# 获取活跃请求统计
	active_count = len(active_requests_manager.active_requests)
	active_done = sum(1 for task in active_requests_manager.active_requests.values() if task.done())
	active_pending = active_count - active_done

	# 获取API密钥使用统计
	api_key_stats = []
	for api_key in key_manager.api_keys:
	# 获取API密钥前8位作为标识
	api_key_id = api_key[:8]

	# 计算24小时内的调用次数
	calls_24h = 0
	if 'by_endpoint' in api_call_stats['last_24h'] and api_key in api_call_stats['last_24h']['by_endpoint']:
	calls_24h = sum(api_call_stats['last_24h']['by_endpoint'][api_key].values())

	# 计算使用百分比
	usage_percent = (calls_24h / API_KEY_DAILY_LIMIT) * 100 if API_KEY_DAILY_LIMIT > 0 else 0

	# 添加到结果列表
	api_key_stats.append({
	'api_key': api_key_id,
	'calls_24h': calls_24h,
	'limit': API_KEY_DAILY_LIMIT,
	'usage_percent': round(usage_percent, 2)
	})

	# 按使用百分比降序排序
	api_key_stats.sort(key=lambda x: x['usage_percent'], reverse=True)

	# 准备模板上下文
	context = {
	"key_count": len(key_manager.api_keys),
	"model_count": len(GeminiClient.AVAILABLE_MODELS),
	"retry_count": len(key_manager.api_keys),
	"last_24h_calls": last_24h_calls,
	"hourly_calls": hourly_calls,
	"minute_calls": minute_calls,
	"max_requests_per_minute": MAX_REQUESTS_PER_MINUTE,
	"max_requests_per_day_per_ip": MAX_REQUESTS_PER_DAY_PER_IP,
	"current_time": datetime.now().strftime('%H:%M:%S'),
	"logs": recent_logs,
	# 添加版本信息
	"local_version": local_version,
	"remote_version": remote_version,
	"has_update": has_update,
	# 添加缓存信息
	"cache_entries": total_cache,
	"valid_cache": valid_cache,
	"expired_cache": total_cache - valid_cache,
	"cache_expiry_time": CACHE_EXPIRY_TIME,
	"max_cache_entries": MAX_CACHE_ENTRIES,
	"cache_by_model": cache_by_model,
	"request_history_count": history_count,
	"enable_reconnect_detection": ENABLE_RECONNECT_DETECTION,
	"remove_cache_after_use": REMOVE_CACHE_AFTER_USE,
	# 添加活跃请求池信息
	"active_count": active_count,
	"active_done": active_done,
	"active_pending": active_pending,
	# 添加API密钥统计
	"api_key_stats": api_key_stats,
	}

	# 使用Jinja2模板引擎正确渲染HTML
	return templates.TemplateResponse("index.html", {"request": request, **context})