|
|
import asyncio |
|
|
import json |
|
|
from datetime import datetime, timezone |
|
|
import os |
|
|
|
|
|
from fastapi import FastAPI, HTTPException, Request |
|
|
from fastapi.middleware.cors import CORSMiddleware |
|
|
from fastapi.responses import JSONResponse |
|
|
from fastapi.responses import StreamingResponse |
|
|
from pydantic import BaseModel |
|
|
from typing import List, Optional |
|
|
import time |
|
|
import uuid |
|
|
import logging |
|
|
|
|
|
from gemini_webapi import GeminiClient, set_log_level |
|
|
from gemini_webapi.constants import Model |
|
|
|
|
|
|
|
|
# Configure root logging for the server process.
logging.basicConfig(level=logging.INFO)

# Module-level logger for this file.
logger = logging.getLogger(__name__)

# Align gemini_webapi's internal log verbosity with ours.
set_log_level("INFO")
|
|
|
|
|
app = FastAPI(title="Gemini API FastAPI Server")

# Allow any origin/method/header so browser-based OpenAI clients can call us.
# NOTE(review): allow_origins=["*"] combined with allow_credentials=True is
# not honored by browsers per the CORS spec (a wildcard origin cannot be used
# with credentialed requests) — if credentialed cross-site calls are actually
# needed, list explicit origins instead; confirm intent.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)
|
|
|
|
|
|
|
|
# Lazily-initialized GeminiClient singleton (see get_gemini_client()).
gemini_client = None

# Gemini web-session cookies, supplied via environment variables.
SECURE_1PSID = os.environ.get("SECURE_1PSID", "")
SECURE_1PSIDTS = os.environ.get("SECURE_1PSIDTS", "")

if not SECURE_1PSID or not SECURE_1PSIDTS:
    logger.warning("⚠️ Gemini API credentials are not set or empty! Please check your environment variables.")
else:
    # Security fix: the previous code logged the first 5 characters of each
    # secret cookie. Log only presence and length — never secret material —
    # so credentials cannot leak through log aggregation.
    logger.info(f"Credentials found. SECURE_1PSID length: {len(SECURE_1PSID)}")
    logger.info(f"Credentials found. SECURE_1PSIDTS length: {len(SECURE_1PSIDTS)}")
|
|
|
|
|
|
|
|
class Message(BaseModel):
    """A single chat message in OpenAI chat-completions format."""

    role: str  # "system", "user", or "assistant"; other roles are ignored by prepare_conversation()
    content: str  # message text
    name: Optional[str] = None  # optional participant name (accepted for API compatibility; unused here)
|
|
|
|
|
|
|
|
class ChatCompletionRequest(BaseModel):
    """Request body for POST /v1/chat/completions (OpenAI-compatible).

    Only ``model``, ``messages``, and ``stream`` affect behavior in this
    server; the remaining sampling fields are accepted for wire
    compatibility but are not forwarded to Gemini.
    """

    model: str  # OpenAI-style model name, resolved via map_model_name()
    messages: List[Message]  # conversation history, oldest first
    temperature: Optional[float] = 0.7  # accepted, not forwarded
    top_p: Optional[float] = 1.0  # accepted, not forwarded
    n: Optional[int] = 1  # accepted, not forwarded
    stream: Optional[bool] = False  # True -> SSE streaming response
    max_tokens: Optional[int] = None  # accepted, not forwarded
    presence_penalty: Optional[float] = 0  # accepted, not forwarded
    frequency_penalty: Optional[float] = 0  # accepted, not forwarded
    user: Optional[str] = None  # accepted, not forwarded
|
|
|
|
|
|
|
|
class Choice(BaseModel):
    """One completion choice in an OpenAI-style response.

    Declared for schema documentation; the endpoints below currently
    build and return plain dicts instead of this model.
    """

    index: int  # position of this choice in the choices array
    message: Message  # the assistant's reply
    finish_reason: str  # e.g. "stop"
|
|
|
|
|
|
|
|
class Usage(BaseModel):
    """Token accounting in OpenAI format.

    Declared for schema documentation; the endpoints below currently
    build and return plain dicts instead of this model.
    """

    prompt_tokens: int  # approximated by whitespace word count in this server
    completion_tokens: int  # approximated by whitespace word count in this server
    total_tokens: int  # prompt_tokens + completion_tokens
|
|
|
|
|
|
|
|
class ChatCompletionResponse(BaseModel):
    """Full OpenAI-style chat completion response.

    Declared for schema documentation; the endpoints below currently
    build and return plain dicts instead of this model.
    """

    id: str  # "chatcmpl-<uuid4>"
    object: str = "chat.completion"
    created: int  # Unix timestamp
    model: str  # echoed request model name
    choices: List[Choice]
    usage: Usage
|
|
|
|
|
|
|
|
class ModelData(BaseModel):
    """A single entry in the OpenAI /v1/models listing.

    Declared for schema documentation; list_models() currently returns
    plain dicts instead of this model.
    """

    id: str  # model identifier string
    object: str = "model"
    created: int  # Unix timestamp
    owned_by: str = "google"
|
|
|
|
|
|
|
|
class ModelList(BaseModel):
    """OpenAI-style model list envelope.

    Declared for schema documentation; list_models() currently returns
    a plain dict instead of this model.
    """

    object: str = "list"
    data: List[ModelData]
|
|
|
|
|
|
|
|
|
|
|
@app.middleware("http")
async def error_handling(request: Request, call_next):
    """Catch-all middleware: convert any unhandled exception into an
    OpenAI-style JSON error payload with HTTP 500.

    Exceptions already turned into responses by inner handlers (e.g.
    HTTPException) never reach this except clause.
    """
    try:
        return await call_next(request)
    except Exception as e:
        # logger.exception records the full traceback; the previous
        # logger.error(f"...") discarded it, making 500s hard to debug.
        # Lazy %-args also avoid f-string formatting on the log path.
        logger.exception("Request failed: %s", e)
        return JSONResponse(
            status_code=500,
            content={"error": {"message": str(e), "type": "internal_server_error"}},
        )
|
|
|
|
|
|
|
|
|
|
|
@app.get("/v1/models")
async def list_models():
    """Return the model list declared by gemini_webapi, in OpenAI /v1/models format."""
    # One shared timestamp for every entry in this response.
    now = int(datetime.now(tz=timezone.utc).timestamp())
    data = [
        {
            "id": m.model_name,
            "object": "model",
            "created": now,
            "owned_by": "google-gemini-web"
        }
        for m in Model
    ]
    # Fix: stray debug print(data) replaced with structured logging at
    # debug level so stdout stays clean in production.
    logger.debug("Models listed: %s", data)
    return {"object": "list", "data": data}
|
|
|
|
|
|
|
|
|
|
|
def map_model_name(openai_model_name: str) -> Model:
    """Resolve an OpenAI-style model name to a Model enum member.

    Resolution order: direct substring match against the advertised model
    names, then a keyword-based fallback for well-known aliases, then the
    first declared model as a last resort.
    """

    def display(member) -> str:
        # Some enum members expose .model_name; fall back to str() otherwise.
        return member.model_name if hasattr(member, "model_name") else str(member)

    names = [display(m) for m in Model]
    logger.info(f"Available models: {names}")

    wanted = openai_model_name.lower()

    # 1) Direct substring match.
    direct = next((m for m in Model if wanted in display(m).lower()), None)
    if direct is not None:
        return direct

    # 2) Keyword fallback: every keyword must appear in the model's name.
    model_keywords = {
        "gemini-pro": ["pro", "2.0"],
        "gemini-pro-vision": ["vision", "pro"],
        "gemini-1.5-pro": ["1.5", "pro"],
        "gemini-flash": ["flash", "2.0"],
        "gemini-1.5-flash": ["1.5", "flash"],
    }
    keywords = model_keywords.get(openai_model_name, ["pro"])

    keyword_match = next(
        (
            m
            for m in Model
            if all(kw.lower() in display(m).lower() for kw in keywords)
        ),
        None,
    )
    if keyword_match is not None:
        return keyword_match

    # 3) Nothing matched — default to the first declared model.
    return next(iter(Model))
|
|
|
|
|
|
|
|
|
|
|
def prepare_conversation(messages: List[Message]) -> str:
    """Flatten an OpenAI-style message list into a single prompt string.

    Each recognized role is rendered as "<Label>: <content>\n\n"; messages
    with any other role are silently skipped. The prompt always ends with
    a trailing "Assistant: " cue for the model to complete.
    """
    # Map wire-format roles to the labels used in the flattened prompt.
    role_labels = {
        "system": "System",
        "user": "Human",
        "assistant": "Assistant",
    }

    parts = []
    for msg in messages:
        label = role_labels.get(msg.role)
        if label is not None:
            parts.append(f"{label}: {msg.content}\n\n")

    parts.append("Assistant: ")
    return "".join(parts)
|
|
|
|
|
|
|
|
|
|
|
async def get_gemini_client():
    """Return the shared GeminiClient, initializing it on first use.

    Returns:
        The module-level GeminiClient singleton, fully initialized.

    Raises:
        HTTPException: 500 if the client cannot be constructed or initialized.
    """
    global gemini_client
    if gemini_client is not None:
        return gemini_client
    try:
        client = GeminiClient(SECURE_1PSID, SECURE_1PSIDTS)
        await client.init(timeout=30)
    except Exception as e:
        logger.error(f"Failed to initialize Gemini client: {str(e)}")
        raise HTTPException(
            status_code=500,
            detail=f"Failed to initialize Gemini client: {str(e)}"
        )
    # Bug fix: publish the client only AFTER init() succeeds. The previous
    # code assigned the global before init, so a failed init left a broken,
    # uninitialized client cached — every later call returned it without
    # ever retrying initialization.
    gemini_client = client
    return gemini_client
|
|
|
|
|
|
|
|
@app.post("/v1/chat/completions")
async def create_chat_completion(request: ChatCompletionRequest):
    """OpenAI-compatible chat completions endpoint backed by the Gemini web API.

    Supports both a plain JSON response and SSE streaming (request.stream).
    Sampling parameters (temperature, top_p, ...) are accepted for wire
    compatibility but are not forwarded to Gemini.

    Raises:
        HTTPException: 500 on client-init failure or any generation error.
    """
    try:
        # Consistency fix: reuse the lazy singleton helper instead of
        # duplicating the GeminiClient construction/init logic inline.
        client = await get_gemini_client()

        # Flatten the OpenAI message list into a single prompt string.
        conversation = prepare_conversation(request.messages)
        logger.info(f"Prepared conversation: {conversation}")

        model = map_model_name(request.model)
        logger.info(f"Using model: {model}")

        logger.info("Sending request to Gemini...")
        response = await client.generate_content(conversation, model=model)

        # gemini_webapi responses normally expose .text; fall back to str().
        reply_text = response.text if hasattr(response, "text") else str(response)
        logger.info(f"Response: {reply_text}")

        if not reply_text or reply_text.strip() == "":
            logger.warning("Empty response received from Gemini")
            reply_text = "服务器返回了空响应。请检查 Gemini API 凭据是否有效。"

        completion_id = f"chatcmpl-{uuid.uuid4()}"
        created_time = int(time.time())

        if request.stream:
            def build_chunk(delta: dict, finish_reason: Optional[str]) -> dict:
                # One chunk in OpenAI "chat.completion.chunk" wire format.
                return {
                    "id": completion_id,
                    "object": "chat.completion.chunk",
                    "created": created_time,
                    "model": request.model,
                    "choices": [
                        {
                            "index": 0,
                            "delta": delta,
                            "finish_reason": finish_reason
                        }
                    ]
                }

            async def generate_stream():
                # Role announcement, then one chunk per character, then stop.
                yield f"data: {json.dumps(build_chunk({'role': 'assistant'}, None))}\n\n"
                for char in reply_text:
                    yield f"data: {json.dumps(build_chunk({'content': char}, None))}\n\n"
                    # Small delay so clients render the stream progressively.
                    await asyncio.sleep(0.01)
                yield f"data: {json.dumps(build_chunk({}, 'stop'))}\n\n"
                yield "data: [DONE]\n\n"

            return StreamingResponse(
                generate_stream(),
                media_type="text/event-stream"
            )

        # Non-streaming JSON response. Token counts are whitespace-word
        # approximations — Gemini web does not report real token usage.
        prompt_tokens = len(conversation.split())
        completion_tokens = len(reply_text.split())
        result = {
            "id": completion_id,
            "object": "chat.completion",
            "created": created_time,
            "model": request.model,
            "choices": [
                {
                    "index": 0,
                    "message": {
                        "role": "assistant",
                        "content": reply_text
                    },
                    "finish_reason": "stop"
                }
            ],
            "usage": {
                "prompt_tokens": prompt_tokens,
                "completion_tokens": completion_tokens,
                "total_tokens": prompt_tokens + completion_tokens
            }
        }
        logger.info(f"Returning response: {result}")
        return result

    except HTTPException:
        # Fix: let deliberate HTTP errors (e.g. from get_gemini_client)
        # propagate with their own status/detail instead of being re-wrapped
        # as a generic 500 below.
        raise
    except Exception as e:
        logger.error(f"Error generating completion: {str(e)}", exc_info=True)
        raise HTTPException(
            status_code=500,
            detail=f"Error generating completion: {str(e)}"
        )
|
|
|
|
|
|
|
|
@app.get("/")
async def root():
    """Health-check endpoint confirming the server is up."""
    return {
        "status": "online",
        "message": "Gemini API FastAPI Server is running",
    }
|
|
|
|
|
|
|
|
if __name__ == "__main__":
    # Imported lazily so merely importing this module never pulls in uvicorn.
    import uvicorn

    # Serve on all interfaces for local/container use.
    uvicorn.run("main:app", port=7890, host="0.0.0.0", log_level="info")