deeme committed on
Commit
2789f98
·
verified ·
1 Parent(s): 3c00b29

Upload 4 files

Browse files
Files changed (4) hide show
  1. Dockerfile +16 -0
  2. README.md +10 -10
  3. main.py +349 -0
  4. requirements.txt +4 -0
Dockerfile ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# Minimal image for the FastAPI Gemini proxy; the slim base keeps it small.
FROM python:3.11-slim

WORKDIR /app

# Install dependencies first so Docker layer caching skips the reinstall
# when only application code changes.
COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt

# Copy application code
COPY main.py .

# Expose the port the app runs on (must match the uvicorn --port below)
EXPOSE 7860

# Command to run the application
CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]
README.md CHANGED
@@ -1,10 +1,10 @@
1
- ---
2
- title: Google
3
- emoji: 👁
4
- colorFrom: blue
5
- colorTo: green
6
- sdk: docker
7
- pinned: false
8
- ---
9
-
10
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
1
+ ---
2
+ title: google
3
+ emoji: 🌍
4
+ colorFrom: blue
5
+ colorTo: pink
6
+ sdk: docker
7
+ pinned: false
8
+ license: mit
9
+ ---
10
+
main.py ADDED
@@ -0,0 +1,349 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import asyncio
2
+ import json
3
+ from datetime import datetime, timezone
4
+ import os
5
+
6
+ from fastapi import FastAPI, HTTPException, Request
7
+ from fastapi.middleware.cors import CORSMiddleware
8
+ from fastapi.responses import JSONResponse
9
+ from fastapi.responses import StreamingResponse
10
+ from pydantic import BaseModel
11
+ from typing import List, Optional
12
+ import time
13
+ import uuid
14
+ import logging
15
+
16
+ from gemini_webapi import GeminiClient, set_log_level
17
+ from gemini_webapi.constants import Model
18
+
19
# Configure logging for this module and for the gemini_webapi package.
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
set_log_level("INFO")

app = FastAPI(title="Gemini API FastAPI Server")

# Add CORS middleware: allow any origin/method/header so browser-based
# OpenAI-compatible clients can call this server directly.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)

# Global client, lazily initialized on first use (see get_gemini_client /
# the chat completions endpoint).
gemini_client = None

# Authentication credentials: Google account cookies that gemini_webapi
# uses to authenticate against the Gemini web app.
SECURE_1PSID = os.environ.get("SECURE_1PSID", "")
SECURE_1PSIDTS = os.environ.get("SECURE_1PSIDTS", "")

# Print debug info at startup so misconfigured deployments fail loudly.
if not SECURE_1PSID or not SECURE_1PSIDTS:
    logger.warning("⚠️ Gemini API credentials are not set or empty! Please check your environment variables.")
else:
    # Only log the first few characters for security
    logger.info(f"Credentials found. SECURE_1PSID starts with: {SECURE_1PSID[:5]}...")
    logger.info(f"Credentials found. SECURE_1PSIDTS starts with: {SECURE_1PSIDTS[:5]}...")
49
+
50
+ # Pydantic models for API requests and responses
51
class Message(BaseModel):
    """A single chat message in the OpenAI chat-completions wire format."""

    # Sender role; the conversation builder recognizes "system", "user"
    # and "assistant" and silently skips anything else.
    role: str
    # Plain-text message content.
    content: str
    # Optional participant name (accepted for OpenAI compatibility; not
    # read anywhere in this server).
    name: Optional[str] = None
55
+
56
+
57
class ChatCompletionRequest(BaseModel):
    """Request body for POST /v1/chat/completions (OpenAI-compatible).

    Only ``model``, ``messages`` and ``stream`` are used by the handler;
    the sampling fields (temperature, top_p, n, max_tokens, penalties,
    user) are accepted for wire compatibility but not forwarded to Gemini.
    """

    model: str
    messages: List[Message]
    temperature: Optional[float] = 0.7
    top_p: Optional[float] = 1.0
    n: Optional[int] = 1
    # When True, the endpoint responds with an SSE stream of chunks.
    stream: Optional[bool] = False
    max_tokens: Optional[int] = None
    presence_penalty: Optional[float] = 0
    frequency_penalty: Optional[float] = 0
    user: Optional[str] = None
68
+
69
+
70
class Choice(BaseModel):
    """One generated completion choice in a non-streaming response."""

    index: int
    message: Message
    # e.g. "stop" when generation completed normally.
    finish_reason: str
74
+
75
+
76
class Usage(BaseModel):
    """Token accounting block; this server fills it with whitespace-split
    word counts, not real tokenizer counts."""

    prompt_tokens: int
    completion_tokens: int
    total_tokens: int
80
+
81
+
82
class ChatCompletionResponse(BaseModel):
    """Full (non-streaming) response body mirroring OpenAI's schema.

    NOTE(review): the endpoint currently returns a plain dict of this
    shape rather than instantiating this model.
    """

    id: str
    object: str = "chat.completion"
    # Unix timestamp (seconds) of creation.
    created: int
    model: str
    choices: List[Choice]
    usage: Usage
89
+
90
+
91
class ModelData(BaseModel):
    """A single entry in a /v1/models listing."""

    id: str
    object: str = "model"
    # Unix timestamp (seconds).
    created: int
    owned_by: str = "google"
96
+
97
+
98
class ModelList(BaseModel):
    """Envelope for a /v1/models listing."""

    object: str = "list"
    data: List[ModelData]
101
+
102
+
103
# Simple error handler middleware
@app.middleware("http")
async def error_handling(request: Request, call_next):
    """Catch-all HTTP middleware: convert any unhandled exception into a
    JSON 500 error body instead of letting it propagate to the client."""
    try:
        response = await call_next(request)
    except Exception as exc:
        logger.error(f"Request failed: {str(exc)}")
        payload = {"error": {"message": str(exc), "type": "internal_server_error"}}
        return JSONResponse(status_code=500, content=payload)
    return response
114
+
115
+
116
# Get list of available models
@app.get("/v1/models")
async def list_models():
    """Return the model list declared by gemini_webapi in OpenAI's
    /v1/models response shape.

    Returns:
        dict: ``{"object": "list", "data": [...]}`` where each entry has
        the model id (e.g. "gemini-2.0-flash"), the request timestamp as
        ``created``, and an ``owned_by`` tag.
    """
    now = int(datetime.now(tz=timezone.utc).timestamp())
    data = [
        {
            "id": m.model_name,  # e.g. "gemini-2.0-flash"
            "object": "model",
            "created": now,
            "owned_by": "google-gemini-web"
        }
        for m in Model
    ]
    # Fix: the original left a stray debug print(data) on stdout; use the
    # module logger (lazy %-args) so output goes through logging config.
    logger.debug("Model listing: %s", data)
    return {"object": "list", "data": data}
132
+
133
+
134
# Helper to convert between Gemini and OpenAI model names
def map_model_name(openai_model_name: str) -> Model:
    """Resolve an OpenAI-style model name to a gemini_webapi Model member.

    Resolution order: direct substring match, then keyword-based mapping
    for well-known aliases, and finally the first declared model.
    """

    def label(member):
        # Members normally expose .model_name; fall back to str() otherwise.
        return member.model_name if hasattr(member, "model_name") else str(member)

    # Log every available model to ease debugging of name mismatches.
    logger.info(f"Available models: {[label(m) for m in Model]}")

    wanted = openai_model_name.lower()

    # Pass 1: direct substring match against each declared model name.
    direct = next((m for m in Model if wanted in label(m).lower()), None)
    if direct is not None:
        return direct

    # Pass 2: keyword matching for common OpenAI-ish aliases.
    model_keywords = {
        "gemini-pro": ["pro", "2.0"],
        "gemini-pro-vision": ["vision", "pro"],
        "gemini-flash": ["flash", "2.0"],
        "gemini-1.5-pro": ["1.5", "pro"],
        "gemini-1.5-flash": ["1.5", "flash"],
    }
    keywords = model_keywords.get(openai_model_name, ["pro"])  # default to a "pro" model

    by_keywords = next(
        (m for m in Model if all(kw.lower() in label(m).lower() for kw in keywords)),
        None,
    )
    if by_keywords is not None:
        return by_keywords

    # Pass 3: give up and return the first declared model.
    return next(iter(Model))
166
+
167
+
168
# Prepare conversation history from OpenAI messages format
def prepare_conversation(messages: List[Message]) -> str:
    """Flatten an OpenAI-style message list into one prompt string.

    Roles map to "System:", "Human:" and "Assistant:" paragraphs; unknown
    roles are skipped. A trailing "Assistant: " invites the model to
    produce the next turn.
    """
    role_prefix = {"system": "System", "user": "Human", "assistant": "Assistant"}
    parts = []
    for msg in messages:
        prefix = role_prefix.get(msg.role)
        if prefix is not None:
            parts.append(f"{prefix}: {msg.content}\n\n")
    # Final prompt for the assistant to respond to.
    parts.append("Assistant: ")
    return "".join(parts)
184
+
185
+
186
# Dependency to get the initialized Gemini client
async def get_gemini_client():
    """Return the shared GeminiClient, creating and initializing it on
    first use.

    Raises:
        HTTPException: 500 if client construction or init() fails.
    """
    global gemini_client
    if gemini_client is not None:
        return gemini_client
    try:
        # Fix: the original cached the client in the global *before*
        # init() ran, so a failed init left a half-constructed client
        # cached and every later call returned it without retrying.
        # Assign the global only after init() succeeds.
        client = GeminiClient(SECURE_1PSID, SECURE_1PSIDTS)
        await client.init(timeout=30)
    except Exception as e:
        logger.error(f"Failed to initialize Gemini client: {str(e)}")
        raise HTTPException(
            status_code=500,
            detail=f"Failed to initialize Gemini client: {str(e)}"
        )
    gemini_client = client
    return gemini_client
200
+
201
+
202
@app.post("/v1/chat/completions")
async def create_chat_completion(request: ChatCompletionRequest):
    """OpenAI-compatible chat completions endpoint.

    Flattens the message history into a single prompt, sends it to Gemini,
    and — depending on ``request.stream`` — returns either a complete JSON
    body or a simulated SSE stream (the full reply is generated first,
    then replayed character by character).

    Raises:
        HTTPException: 500 on client-init failure or any generation error.
    """
    try:
        # Fix: reuse the shared lazy-init helper instead of duplicating
        # the client construction/init logic inline (the inline copy also
        # cached a half-initialized client on init failure).
        client = await get_gemini_client()

        # Flatten the OpenAI message list into one prompt string.
        conversation = prepare_conversation(request.messages)
        logger.info(f"Prepared conversation: {conversation}")

        # Resolve the requested model name to a gemini_webapi Model member.
        model = map_model_name(request.model)
        logger.info(f"Using model: {model}")

        logger.info("Sending request to Gemini...")
        response = await client.generate_content(conversation, model=model)

        # Extract the text reply; fall back to str() for unexpected shapes.
        reply_text = response.text if hasattr(response, "text") else str(response)
        logger.info(f"Response: {reply_text}")

        if not reply_text or reply_text.strip() == "":
            logger.warning("Empty response received from Gemini")
            # Chinese user-facing notice kept verbatim ("the server
            # returned an empty response; check that the Gemini API
            # credentials are valid").
            reply_text = "服务器返回了空响应。请检查 Gemini API 凭据是否有效。"

        completion_id = f"chatcmpl-{uuid.uuid4()}"
        created_time = int(time.time())

        if request.stream:
            def sse_chunk(delta: dict, finish_reason) -> str:
                # One OpenAI-style chat.completion.chunk as an SSE event;
                # key order matches the original hand-built dicts.
                payload = {
                    "id": completion_id,
                    "object": "chat.completion.chunk",
                    "created": created_time,
                    "model": request.model,
                    "choices": [
                        {
                            "index": 0,
                            "delta": delta,
                            "finish_reason": finish_reason
                        }
                    ]
                }
                return f"data: {json.dumps(payload)}\n\n"

            async def generate_stream():
                # Opening chunk announces the assistant role.
                yield sse_chunk({"role": "assistant"}, None)

                # Replay the already-complete reply one character at a
                # time to simulate streaming; the short sleep paces it.
                for char in reply_text:
                    yield sse_chunk({"content": char}, None)
                    await asyncio.sleep(0.01)

                # Closing chunk plus the [DONE] sentinel expected by
                # OpenAI SSE clients.
                yield sse_chunk({}, "stop")
                yield "data: [DONE]\n\n"

            return StreamingResponse(
                generate_stream(),
                media_type="text/event-stream"
            )

        # Non-streaming: one complete chat.completion body. Token counts
        # are whitespace-split approximations, not tokenizer counts.
        result = {
            "id": completion_id,
            "object": "chat.completion",
            "created": created_time,
            "model": request.model,
            "choices": [
                {
                    "index": 0,
                    "message": {
                        "role": "assistant",
                        "content": reply_text
                    },
                    "finish_reason": "stop"
                }
            ],
            "usage": {
                "prompt_tokens": len(conversation.split()),
                "completion_tokens": len(reply_text.split()),
                "total_tokens": len(conversation.split()) + len(reply_text.split())
            }
        }
        logger.info(f"Returning response: {result}")
        return result

    except HTTPException:
        # Fix: let deliberate HTTP errors (e.g. failed client init) pass
        # through instead of re-wrapping them as a generic 500 below.
        raise
    except Exception as e:
        logger.error(f"Error generating completion: {str(e)}", exc_info=True)
        raise HTTPException(
            status_code=500,
            detail=f"Error generating completion: {str(e)}"
        )
339
+
340
+
341
@app.get("/")
async def root():
    """Liveness endpoint: report that the server is up and reachable."""
    status_payload = {
        "status": "online",
        "message": "Gemini API FastAPI Server is running",
    }
    return status_payload
344
+
345
+
346
if __name__ == "__main__":
    # Local/dev entry point; in the Docker image the container CMD starts
    # uvicorn directly on the same host/port, so this branch is unused there.
    import uvicorn

    uvicorn.run("main:app", host="0.0.0.0", port=7860, log_level="info")
requirements.txt ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ browser-cookie3>=0.20.1
2
+ fastapi>=0.115.12
3
+ gemini-webapi>=1.11.0
4
+ uvicorn[standard]>=0.34.1