sanbo110 commited on
Commit
f78578c
·
1 Parent(s): 9da15c9

update sth at 2026-01-15 15:33:59

Browse files
Files changed (38) hide show
  1. .env +28 -11
  2. .gitattributes +0 -2
  3. .github/workflows/docker.yml +0 -64
  4. .gitignore +0 -180
  5. Dockerfile +6 -9
  6. NGINX_SETUP.md +10 -10
  7. README_DOCKER.md +10 -10
  8. app/__pycache__/__init__.cpython-311.pyc +0 -0
  9. app/admin/api.py +1 -1
  10. app/core/__pycache__/__init__.cpython-311.pyc +0 -0
  11. app/core/__pycache__/config.cpython-311.pyc +0 -0
  12. app/core/__pycache__/openai.cpython-311.pyc +0 -0
  13. app/core/config.py +11 -11
  14. app/core/openai.py +5 -7
  15. app/models/__pycache__/__init__.cpython-311.pyc +0 -0
  16. app/models/__pycache__/schemas.cpython-311.pyc +0 -0
  17. app/providers/__pycache__/__init__.cpython-311.pyc +0 -0
  18. app/providers/__pycache__/base.cpython-311.pyc +0 -0
  19. app/providers/__pycache__/k2think_provider.cpython-311.pyc +0 -0
  20. app/providers/__pycache__/longcat_provider.cpython-311.pyc +0 -0
  21. app/providers/__pycache__/provider_factory.cpython-311.pyc +0 -0
  22. app/providers/__pycache__/zai_provider.cpython-311.pyc +0 -0
  23. app/providers/zai_provider.py +17 -14
  24. app/templates/config.html +1 -1
  25. app/utils/__pycache__/__init__.cpython-311.pyc +0 -0
  26. app/utils/__pycache__/fe_version.cpython-311.pyc +0 -0
  27. app/utils/__pycache__/logger.cpython-311.pyc +0 -0
  28. app/utils/__pycache__/reload_config.cpython-311.pyc +0 -0
  29. app/utils/__pycache__/signature.cpython-311.pyc +0 -0
  30. app/utils/__pycache__/token_pool.cpython-311.pyc +0 -0
  31. app/utils/__pycache__/tool_call_handler.cpython-311.pyc +0 -0
  32. app/utils/__pycache__/user_agent.cpython-311.pyc +0 -0
  33. app/utils/fe_version.py +112 -0
  34. app/utils/logger.py +0 -1
  35. docker-compose.yml +3 -3
  36. nginx.conf +0 -157
  37. nginx.conf.example +7 -7
  38. xREADME.md +0 -347
.env CHANGED
@@ -1,18 +1,35 @@
1
- # 代理服务配置文件
2
- # 匿名模式配置
 
3
 
4
- # 跳过客户端认证(启用匿名访问)
 
 
 
 
 
 
5
  SKIP_AUTH_TOKEN=true
6
 
7
- # Z.AI 匿名用户模式
8
- # false: 使用认证 Token 令牌,失败时自动降级为匿名请求
9
- # true: 自动从 Z.ai 获取临时访问令牌,避免对话历史共享
 
10
  ANONYMOUS_MODE=true
11
 
12
- # 服务监听端口
13
- LISTEN_PORT=7860
14
 
15
- # 调试日志
16
- DEBUG_LOGGING=true
 
 
 
17
 
18
- AUTH_TOKEN=sk-your-key
 
 
 
 
 
 
 
1
+ # ==============================================
2
+ # Z.AI API Server - Docker 环境变量配置示例
3
+ # ==============================================
4
 
5
+ # 管理后台密码
6
+ ADMIN_PASSWORD=admin123
7
+
8
+ # API 认证密钥 (用于验证客户端请求)
9
+ AUTH_TOKEN=sk-your-key
10
+
11
+ # 是否跳过 API Key 验证 (开发环境可设为 true)
12
  SKIP_AUTH_TOKEN=true
13
 
14
+ # 调试日志 (生产环境建议设为 false)
15
+ DEBUG_LOGGING=true
16
+
17
+ # 匿名模式 (允许无 token 访问,需要配合 SKIP_AUTH_TOKEN=true)
18
  ANONYMOUS_MODE=true
19
 
20
+ # Function Call 功能开关 (是否支持工具调用)
21
+ TOOL_SUPPORT=true
22
 
23
+ # 工具用扫描限制 (字符数)
24
+ SCAN_LIMIT=200000
25
+
26
+ # 数据库路径 (Docker 环境使用持久化卷)
27
+ DB_PATH=/app/data/tokens.db
28
 
29
+ # Token 池配置
30
+ TOKEN_FAILURE_THRESHOLD=3
31
+ TOKEN_RECOVERY_TIMEOUT=300
32
+
33
+ # 服务配置
34
+ SERVICE_NAME=Z.AI_API_Server
35
+ LISTEN_PORT=7860
.gitattributes DELETED
@@ -1,2 +0,0 @@
1
- # Auto detect text files and perform LF normalization
2
- * text=auto
 
 
 
.github/workflows/docker.yml DELETED
@@ -1,64 +0,0 @@
1
- name: Build and Push Docker Image
2
-
3
- on:
4
- push:
5
- branches:
6
- - main
7
- tags:
8
- - 'v*'
9
-
10
- env:
11
- IMAGE_NAME: z-ai2api-python
12
-
13
- jobs:
14
- docker:
15
- runs-on: ubuntu-latest
16
- permissions:
17
- contents: read
18
- packages: write
19
-
20
- steps:
21
- - name: Checkout
22
- uses: actions/checkout@v4
23
-
24
- - name: Set up Docker Buildx
25
- uses: docker/setup-buildx-action@v3
26
-
27
- - name: Login to GitHub Container Registry
28
- uses: docker/login-action@v3
29
- with:
30
- registry: ghcr.io
31
- username: ${{ github.actor }}
32
- password: ${{ secrets.GITHUB_TOKEN }}
33
-
34
- - name: Login to Docker Hub
35
- if: github.event_name != 'pull_request'
36
- uses: docker/login-action@v3
37
- with:
38
- username: ${{ secrets.DOCKERHUB_USERNAME }}
39
- password: ${{ secrets.DOCKERHUB_TOKEN }}
40
-
41
- - name: Extract metadata
42
- id: meta
43
- uses: docker/metadata-action@v5
44
- with:
45
- images: |
46
- ghcr.io/${{ github.repository }}
47
- ${{ secrets.DOCKERHUB_USERNAME }}/${{ env.IMAGE_NAME }}
48
- tags: |
49
- type=ref,event=branch
50
- type=semver,pattern={{version}}
51
- type=semver,pattern={{major}}.{{minor}}
52
- type=raw,value=latest,enable={{is_default_branch}}
53
-
54
- - name: Build and push
55
- uses: docker/build-push-action@v5
56
- with:
57
- context: .
58
- file: ./deploy/Dockerfile
59
- platforms: linux/amd64,linux/arm64
60
- push: true
61
- tags: ${{ steps.meta.outputs.tags }}
62
- labels: ${{ steps.meta.outputs.labels }}
63
- cache-from: type=gha
64
- cache-to: type=gha,mode=max
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
.gitignore DELETED
@@ -1,180 +0,0 @@
1
- # Custom
2
- .vs/
3
- .vscode/
4
- .idea/
5
- .conda/
6
- *.zip
7
- *.txt
8
- *.pid
9
- docs/
10
- output/
11
- main.build/
12
- main.dist/
13
- main.onefile-build/
14
- *report.xml
15
- *.yaml
16
- logs/
17
- backup/
18
- uv.lock
19
- AGENTS.md
20
- *.db
21
-
22
- # AI Toolset
23
- .augment/
24
- .cursor/
25
- .claude/
26
- CLAUDE.md
27
-
28
- # Byte-compiled / optimized / DLL files
29
- __pycache__/
30
- *.py[cod]
31
- *$py.class
32
-
33
- # C extensions
34
- *.so
35
-
36
- # Distribution / packaging
37
- .Python
38
- build/
39
- develop-eggs/
40
- dist/
41
- downloads/
42
- eggs/
43
- .eggs/
44
- lib/
45
- lib64/
46
- parts/
47
- sdist/
48
- var/
49
- wheels/
50
- share/python-wheels/
51
- *.egg-info/
52
- .installed.cfg
53
- *.egg
54
- MANIFEST
55
-
56
- # PyInstaller
57
- # Usually these files are written by a python script from a template
58
- # before PyInstaller builds the exe, so as to inject date/other infos into it.
59
- *.manifest
60
- *.spec
61
-
62
- # Installer logs
63
- pip-log.txt
64
- pip-delete-this-directory.txt
65
-
66
- # Unit test / coverage reports
67
- htmlcov/
68
- .tox/
69
- .nox/
70
- .coverage
71
- .coverage.*
72
- .cache
73
- nosetests.xml
74
- coverage.xml
75
- *.cover
76
- *.py,cover
77
- .hypothesis/
78
- .pytest_cache/
79
- cover/
80
-
81
- # Translations
82
- *.mo
83
- *.pot
84
-
85
- # Django stuff:
86
- *.log
87
- local_settings.py
88
- db.sqlite3
89
- db.sqlite3-journal
90
-
91
- # Flask stuff:
92
- instance/
93
- .webassets-cache
94
-
95
- # Scrapy stuff:
96
- .scrapy
97
-
98
- # Sphinx documentation
99
- docs/_build/
100
-
101
- # PyBuilder
102
- .pybuilder/
103
- target/
104
-
105
- # Jupyter Notebook
106
- .ipynb_checkpoints
107
-
108
- # IPython
109
- profile_default/
110
- ipython_config.py
111
-
112
- # pyenv
113
- # For a library or package, you might want to ignore these files since the code is
114
- # intended to run in multiple environments; otherwise, check them in:
115
- # .python-version
116
-
117
- # pipenv
118
- # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
119
- # However, in case of collaboration, if having platform-specific dependencies or dependencies
120
- # having no cross-platform support, pipenv may install dependencies that don't work, or not
121
- # install all needed dependencies.
122
- #Pipfile.lock
123
-
124
- # poetry
125
- # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
126
- # This is especially recommended for binary packages to ensure reproducibility, and is more
127
- # commonly ignored for libraries.
128
- # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
129
- #poetry.lock
130
-
131
- # pdm
132
- # Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
133
- #pdm.lock
134
- # pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
135
- # in version control.
136
- # https://pdm.fming.dev/#use-with-ide
137
- .pdm.toml
138
-
139
- # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
140
- __pypackages__/
141
-
142
- # Celery stuff
143
- celerybeat-schedule
144
- celerybeat.pid
145
-
146
- # SageMath parsed files
147
- *.sage.py
148
-
149
- # Environments
150
- .env
151
- .venv
152
- env/
153
- venv/
154
- ENV/
155
- env.bak/
156
- venv.bak/
157
-
158
- # Spyder project settings
159
- .spyderproject
160
- .spyproject
161
-
162
- # Rope project settings
163
- .ropeproject
164
-
165
- # mkdocs documentation
166
- /site
167
-
168
- # mypy
169
- .mypy_cache/
170
- .dmypy.json
171
- dmypy.json
172
-
173
- # Pyre type checker
174
- .pyre/
175
-
176
- # pytype static type analyzer
177
- .pytype/
178
-
179
- # Cython debug symbols
180
- cython_debug/
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Dockerfile CHANGED
@@ -4,8 +4,9 @@ FROM python:3.12-slim
4
  WORKDIR /app
5
 
6
  # Create data and logs directories with proper permissions
7
- RUN mkdir -p /app/data /app/logs && \
8
- chmod 755 /app/data /app/logs
 
9
 
10
  # Install dependencies
11
  COPY requirements.txt .
@@ -14,18 +15,14 @@ RUN pip install --no-cache-dir -r requirements.txt
14
  # Copy application code
15
  COPY . .
16
 
17
- # Set environment variable for database path
18
  ENV DB_PATH=/app/data/tokens.db
 
19
  ENV SKIP_AUTH_TOKEN=true
20
  ENV ANONYMOUS_MODE=true
21
- # 服务监听端口
22
- ENV LISTEN_PORT=7860
23
- # 调试日志
24
- ENV DEBUG_LOGGING=true
25
 
26
- # Expose port
27
  EXPOSE 7860
28
 
29
-
30
  # Run the application
31
  CMD ["python", "main.py"]
 
4
  WORKDIR /app
5
 
6
  # Create data and logs directories with proper permissions
7
+ # HuggingFace Spaces runs as non-root user, need proper permissions
8
+ RUN mkdir -p /app/data /app/logs /app/app/static/css /app/app/static/js && \
9
+ chmod -R 777 /app/data /app/logs /app/app/static
10
 
11
  # Install dependencies
12
  COPY requirements.txt .
 
15
  # Copy application code
16
  COPY . .
17
 
18
+ # Set environment variables
19
  ENV DB_PATH=/app/data/tokens.db
20
+ ENV LISTEN_PORT=7860
21
  ENV SKIP_AUTH_TOKEN=true
22
  ENV ANONYMOUS_MODE=true
 
 
 
 
23
 
24
+ # Expose HuggingFace Spaces default port
25
  EXPOSE 7860
26
 
 
27
  # Run the application
28
  CMD ["python", "main.py"]
NGINX_SETUP.md CHANGED
@@ -37,7 +37,7 @@ server {
37
 
38
  location /ai2api {
39
  # 代理到后端服务
40
- proxy_pass http://127.0.0.1:7860;
41
 
42
  # 传递原始请求信息
43
  proxy_set_header Host $host;
@@ -72,7 +72,7 @@ services:
72
  - LISTEN_PORT=7860
73
  # ... 其他环境变量
74
  ports:
75
- - "7860:7860"
76
  ```
77
 
78
  ### 4. 重启服务
@@ -93,8 +93,8 @@ docker-compose restart
93
 
94
  配置完成后,服务访问地址如下:
95
 
96
- - **API 端点**: `http://your-domain.com/ai2api/v1/chat/completions`
97
- - **模型列表**: `http://your-domain.com/ai2api/v1/models`
98
  - **管理后台**: `http://your-domain.com/ai2api/admin/login`
99
  - **根路径**: `http://your-domain.com/ai2api/`
100
 
@@ -110,7 +110,7 @@ ROOT_PATH=/api
110
  **Nginx 配置**:
111
  ```nginx
112
  location /api {
113
- proxy_pass http://127.0.0.1:7860;
114
  # ... 其他配置
115
  }
116
  ```
@@ -127,7 +127,7 @@ ROOT_PATH=
127
  **Nginx 配置**:
128
  ```nginx
129
  location / {
130
- proxy_pass http://127.0.0.1:7860;
131
  # ... 其他配置
132
  }
133
  ```
@@ -144,7 +144,7 @@ ROOT_PATH=/services/ai/chat
144
  **Nginx 配置**:
145
  ```nginx
146
  location /services/ai/chat {
147
- proxy_pass http://127.0.0.1:7860;
148
  # ... 其他配置
149
  }
150
  ```
@@ -215,7 +215,7 @@ proxy_set_header X-Forwarded-Proto $scheme;
215
 
216
  1. **访问健康检查端点**:
217
  ```bash
218
- curl http://your-domain.com/ai2api/v1/models
219
  ```
220
 
221
  2. **访问管理后台**:
@@ -246,7 +246,7 @@ server {
246
  ssl_certificate_key /path/to/key.pem;
247
 
248
  location /ai2api {
249
- proxy_pass http://127.0.0.1:7860;
250
  proxy_set_header X-Forwarded-Proto https;
251
  # ... 其他配置
252
  }
@@ -257,7 +257,7 @@ server {
257
 
258
  ```nginx
259
  upstream ai2api_backend {
260
- server 127.0.0.1:7860;
261
  server 127.0.0.1:8081;
262
  server 127.0.0.1:8082;
263
  }
 
37
 
38
  location /ai2api {
39
  # 代理到后端服务
40
+ proxy_pass http://127.0.0.1:8080;
41
 
42
  # 传递原始请求信息
43
  proxy_set_header Host $host;
 
72
  - LISTEN_PORT=7860
73
  # ... 其他环境变量
74
  ports:
75
+ - "8080:8080"
76
  ```
77
 
78
  ### 4. 重启服务
 
93
 
94
  配置完成后,服务访问地址如下:
95
 
96
+ - **API 端点**: `http://your-domain.com/ai2api/hf/v1/chat/completions`
97
+ - **模型列表**: `http://your-domain.com/ai2api/hf/v1/models`
98
  - **管理后台**: `http://your-domain.com/ai2api/admin/login`
99
  - **根路径**: `http://your-domain.com/ai2api/`
100
 
 
110
  **Nginx 配置**:
111
  ```nginx
112
  location /api {
113
+ proxy_pass http://127.0.0.1:8080;
114
  # ... 其他配置
115
  }
116
  ```
 
127
  **Nginx 配置**:
128
  ```nginx
129
  location / {
130
+ proxy_pass http://127.0.0.1:8080;
131
  # ... 其他配置
132
  }
133
  ```
 
144
  **Nginx 配置**:
145
  ```nginx
146
  location /services/ai/chat {
147
+ proxy_pass http://127.0.0.1:8080;
148
  # ... 其他配置
149
  }
150
  ```
 
215
 
216
  1. **访问健康检查端点**:
217
  ```bash
218
+ curl http://your-domain.com/ai2api/hf/v1/models
219
  ```
220
 
221
  2. **访问管理后台**:
 
246
  ssl_certificate_key /path/to/key.pem;
247
 
248
  location /ai2api {
249
+ proxy_pass http://127.0.0.1:8080;
250
  proxy_set_header X-Forwarded-Proto https;
251
  # ... 其他配置
252
  }
 
257
 
258
  ```nginx
259
  upstream ai2api_backend {
260
+ server 127.0.0.1:8080;
261
  server 127.0.0.1:8081;
262
  server 127.0.0.1:8082;
263
  }
README_DOCKER.md CHANGED
@@ -16,7 +16,7 @@ mkdir -p data logs
16
  # 快速启动
17
  docker run -d \
18
  --name z-ai-api-server \
19
- -p 7860:7860 \
20
  -e ADMIN_PASSWORD=admin123 \
21
  -e AUTH_TOKEN=sk-your-api-key \
22
  -e ANONYMOUS_MODE=true \
@@ -48,7 +48,7 @@ docker compose up -d
48
  docker compose logs -f api-server
49
  ```
50
 
51
- 服务将在 `http://localhost:7860` 启动。
52
 
53
  ## 架构说明
54
 
@@ -222,10 +222,10 @@ docker compose config
222
 
223
  ### 端口冲突
224
 
225
- 如端口 7860 被占用,修改 `docker-compose.yml`:
226
  ```yaml
227
  ports:
228
- - "8081:7860" # 映射到宿主机 8081 端口
229
  ```
230
 
231
  ### 健康检查失败
@@ -235,7 +235,7 @@ ports:
235
  docker compose ps
236
 
237
  # 手动测试接口
238
- curl http://localhost:7860/v1/models
239
 
240
  # 进入容器排查
241
  docker exec -it z-ai-api-server bash
@@ -245,11 +245,11 @@ docker exec -it z-ai-api-server bash
245
 
246
  | 端点 | 地址 | 说明 |
247
  |------|------|------|
248
- | API 根路径 | `http://localhost:7860` | OpenAI 兼容 API |
249
- | 模型列表 | `http://localhost:7860/v1/models` | 获取可用模型 |
250
- | 管理后台 | `http://localhost:7860/admin` | Web 管理界面 |
251
- | API 文档 | `http://localhost:7860/docs` | OpenAPI/Swagger 文档 |
252
- | 健康检查 | `http://localhost:7860/v1/models` | 服务健康状态 |
253
 
254
  ## 高级配置
255
 
 
16
  # 快速启动
17
  docker run -d \
18
  --name z-ai-api-server \
19
+ -p 8080:8080 \
20
  -e ADMIN_PASSWORD=admin123 \
21
  -e AUTH_TOKEN=sk-your-api-key \
22
  -e ANONYMOUS_MODE=true \
 
48
  docker compose logs -f api-server
49
  ```
50
 
51
+ 服务将在 `http://localhost:8080` 启动。
52
 
53
  ## 架构说明
54
 
 
222
 
223
  ### 端口冲突
224
 
225
+ 如端口 8080 被占用,修改 `docker-compose.yml`:
226
  ```yaml
227
  ports:
228
+ - "8081:8080" # 映射到宿主机 8081 端口
229
  ```
230
 
231
  ### 健康检查失败
 
235
  docker compose ps
236
 
237
  # 手动测试接口
238
+ curl http://localhost:8080/hf/v1/models
239
 
240
  # 进入容器排查
241
  docker exec -it z-ai-api-server bash
 
245
 
246
  | 端点 | 地址 | 说明 |
247
  |------|------|------|
248
+ | API 根路径 | `http://localhost:8080` | OpenAI 兼容 API |
249
+ | 模型列表 | `http://localhost:8080/hf/v1/models` | 获取可用模型 |
250
+ | 管理后台 | `http://localhost:8080/admin` | Web 管理界面 |
251
+ | API 文档 | `http://localhost:8080/docs` | OpenAPI/Swagger 文档 |
252
+ | 健康检查 | `http://localhost:8080/hf/v1/models` | 服务健康状态 |
253
 
254
  ## 高级配置
255
 
app/__pycache__/__init__.cpython-311.pyc ADDED
Binary file (268 Bytes). View file
 
app/admin/api.py CHANGED
@@ -166,7 +166,7 @@ async def get_recent_logs(request: Request):
166
  logs = [
167
  {
168
  "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S"),
169
- "endpoint": "/v1/chat/completions",
170
  "model": "gpt-4o",
171
  "status": 200,
172
  "duration": "1.23s",
 
166
  logs = [
167
  {
168
  "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S"),
169
+ "endpoint": "/hf/v1/chat/completions",
170
  "model": "gpt-4o",
171
  "status": 200,
172
  "duration": "1.23s",
app/core/__pycache__/__init__.cpython-311.pyc ADDED
Binary file (267 Bytes). View file
 
app/core/__pycache__/config.cpython-311.pyc ADDED
Binary file (4.86 kB). View file
 
app/core/__pycache__/openai.cpython-311.pyc ADDED
Binary file (9.16 kB). View file
 
app/core/config.py CHANGED
@@ -24,11 +24,11 @@ class Settings(BaseSettings):
24
  GLM45_THINKING_MODEL: str = os.getenv("GLM45_THINKING_MODEL", "GLM-4.5-Thinking")
25
  GLM45_SEARCH_MODEL: str = os.getenv("GLM45_SEARCH_MODEL", "GLM-4.5-Search")
26
  GLM45_AIR_MODEL: str = os.getenv("GLM45_AIR_MODEL", "GLM-4.5-Air")
27
- GLM45V_MODEL: str = os.getenv("GLM45V_MODEL", "GLM-4.5V")
28
- GLM46_MODEL: str = os.getenv("GLM46_MODEL", "GLM-4.6")
29
- GLM46_THINKING_MODEL: str = os.getenv("GLM46_THINKING_MODEL", "GLM-4.6-Thinking")
30
- GLM46_SEARCH_MODEL: str = os.getenv("GLM46_SEARCH_MODEL", "GLM-4.6-Search")
31
- GLM46_ADVANCED_SEARCH_MODEL: str = os.getenv("GLM46_ADVANCED_SEARCH_MODEL", "GLM-4.6-advanced-search")
32
 
33
  # Provider Model Mapping
34
  @property
@@ -40,11 +40,11 @@ class Settings(BaseSettings):
40
  "GLM-4.5-Thinking": "zai",
41
  "GLM-4.5-Search": "zai",
42
  "GLM-4.5-Air": "zai",
43
- "GLM-4.5V": "zai",
44
- "GLM-4.6": "zai",
45
- "GLM-4.6-Thinking": "zai",
46
- "GLM-4.6-Search": "zai",
47
- "GLM-4.6-advanced-search": "zai",
48
  # K2Think models
49
  "MBZUAI-IFM/K2-Think": "k2think",
50
  # LongCat models
@@ -54,7 +54,7 @@ class Settings(BaseSettings):
54
  }
55
 
56
  # Server Configuration
57
- LISTEN_PORT: int = int(os.getenv("LISTEN_PORT", "7860"))
58
  DEBUG_LOGGING: bool = os.getenv("DEBUG_LOGGING", "true").lower() == "true"
59
  SERVICE_NAME: str = os.getenv("SERVICE_NAME", "z-ai2api-server")
60
  ROOT_PATH: str = os.getenv("ROOT_PATH", "") # For Nginx reverse proxy path prefix, e.g., "/api" or "/path-prefix"
 
24
  GLM45_THINKING_MODEL: str = os.getenv("GLM45_THINKING_MODEL", "GLM-4.5-Thinking")
25
  GLM45_SEARCH_MODEL: str = os.getenv("GLM45_SEARCH_MODEL", "GLM-4.5-Search")
26
  GLM45_AIR_MODEL: str = os.getenv("GLM45_AIR_MODEL", "GLM-4.5-Air")
27
+ GLM46V_MODEL: str = os.getenv("GLM46V_MODEL", "GLM-4.6V")
28
+ GLM47_MODEL: str = os.getenv("GLM47_MODEL", "GLM-4.7")
29
+ GLM47_THINKING_MODEL: str = os.getenv("GLM47_THINKING_MODEL", "GLM-4.7-Thinking")
30
+ GLM47_SEARCH_MODEL: str = os.getenv("GLM47_SEARCH_MODEL", "GLM-4.7-Search")
31
+ GLM47_ADVANCED_SEARCH_MODEL: str = os.getenv("GLM47_ADVANCED_SEARCH_MODEL", "GLM-4.7-advanced-search")
32
 
33
  # Provider Model Mapping
34
  @property
 
40
  "GLM-4.5-Thinking": "zai",
41
  "GLM-4.5-Search": "zai",
42
  "GLM-4.5-Air": "zai",
43
+ "GLM-4.6V": "zai",
44
+ "GLM-4.7": "zai",
45
+ "GLM-4.7-Thinking": "zai",
46
+ "GLM-4.7-Search": "zai",
47
+ "GLM-4.7-advanced-search": "zai",
48
  # K2Think models
49
  "MBZUAI-IFM/K2-Think": "k2think",
50
  # LongCat models
 
54
  }
55
 
56
  # Server Configuration
57
+ LISTEN_PORT: int = int(os.getenv("LISTEN_PORT", "7860")) # HuggingFace Spaces 默认端口
58
  DEBUG_LOGGING: bool = os.getenv("DEBUG_LOGGING", "true").lower() == "true"
59
  SERVICE_NAME: str = os.getenv("SERVICE_NAME", "z-ai2api-server")
60
  ROOT_PATH: str = os.getenv("ROOT_PATH", "") # For Nginx reverse proxy path prefix, e.g., "/api" or "/path-prefix"
app/core/openai.py CHANGED
@@ -92,9 +92,8 @@ async def handle_non_stream_response(stream_response, request: OpenAIRequest) ->
92
  return JSONResponse(content=response_data.model_dump(exclude_none=True))
93
 
94
 
95
- @router.get("/v1/models")
96
  @router.get("/hf/v1/models")
97
- @router.get("/api/v1/models")
98
  async def list_models():
99
  """List available models from all providers"""
100
  try:
@@ -107,18 +106,17 @@ async def list_models():
107
  current_time = int(time.time())
108
  fallback_response = ModelsResponse(
109
  data=[
110
- Model(id=settings.GLM46_MODEL, created=current_time, owned_by="z.ai"),
111
- Model(id=settings.GLM46_THINKING_MODEL, created=current_time, owned_by="z.ai"),
112
- Model(id=settings.GLM46_SEARCH_MODEL, created=current_time, owned_by="z.ai"),
113
  Model(id=settings.GLM45_AIR_MODEL, created=current_time, owned_by="z.ai"),
114
  ]
115
  )
116
  return fallback_response
117
 
118
 
119
- @router.post("/v1/chat/completions")
120
  @router.post("/hf/v1/chat/completions")
121
- @router.post("/api/v1/chat/completions")
122
  async def chat_completions(request: OpenAIRequest, authorization: str = Header(...)):
123
  """Handle chat completion requests with multi-provider architecture"""
124
  role = request.messages[0].role if request.messages else "unknown"
 
92
  return JSONResponse(content=response_data.model_dump(exclude_none=True))
93
 
94
 
 
95
  @router.get("/hf/v1/models")
96
+ @router.get("/v1/models")
97
  async def list_models():
98
  """List available models from all providers"""
99
  try:
 
106
  current_time = int(time.time())
107
  fallback_response = ModelsResponse(
108
  data=[
109
+ Model(id=settings.GLM47_MODEL, created=current_time, owned_by="z.ai"),
110
+ Model(id=settings.GLM47_THINKING_MODEL, created=current_time, owned_by="z.ai"),
111
+ Model(id=settings.GLM47_SEARCH_MODEL, created=current_time, owned_by="z.ai"),
112
  Model(id=settings.GLM45_AIR_MODEL, created=current_time, owned_by="z.ai"),
113
  ]
114
  )
115
  return fallback_response
116
 
117
 
 
118
  @router.post("/hf/v1/chat/completions")
119
+ @router.post("/v1/chat/completions")
120
  async def chat_completions(request: OpenAIRequest, authorization: str = Header(...)):
121
  """Handle chat completion requests with multi-provider architecture"""
122
  role = request.messages[0].role if request.messages else "unknown"
app/models/__pycache__/__init__.cpython-311.pyc ADDED
Binary file (239 Bytes). View file
 
app/models/__pycache__/schemas.cpython-311.pyc ADDED
Binary file (8.32 kB). View file
 
app/providers/__pycache__/__init__.cpython-311.pyc ADDED
Binary file (917 Bytes). View file
 
app/providers/__pycache__/base.cpython-311.pyc ADDED
Binary file (12.3 kB). View file
 
app/providers/__pycache__/k2think_provider.cpython-311.pyc ADDED
Binary file (26.1 kB). View file
 
app/providers/__pycache__/longcat_provider.cpython-311.pyc ADDED
Binary file (22.2 kB). View file
 
app/providers/__pycache__/provider_factory.cpython-311.pyc ADDED
Binary file (9.81 kB). View file
 
app/providers/__pycache__/zai_provider.cpython-311.pyc ADDED
Binary file (51.6 kB). View file
 
app/providers/zai_provider.py CHANGED
@@ -20,6 +20,7 @@ import random
20
  from datetime import datetime
21
  from typing import Dict, List, Any, Optional, AsyncGenerator, Union
22
  from app.utils.user_agent import get_random_user_agent
 
23
  from app.utils.signature import generate_signature
24
  from app.providers.base import BaseProvider, ProviderConfig
25
  from app.models.schemas import OpenAIRequest, Message
@@ -42,6 +43,7 @@ def get_zai_dynamic_headers(chat_id: str = "") -> Dict[str, str]:
42
  browser_choices = ["chrome", "chrome", "chrome", "edge", "edge", "firefox", "safari"]
43
  browser_type = random.choice(browser_choices)
44
  user_agent = get_random_user_agent(browser_type)
 
45
 
46
  chrome_version = "139"
47
  edge_version = "139"
@@ -70,7 +72,7 @@ def get_zai_dynamic_headers(chat_id: str = "") -> Dict[str, str]:
70
  "Cache-Control": "no-cache",
71
  "User-Agent": user_agent,
72
  "Accept-Language": "zh-CN,zh;q=0.9,en;q=0.8",
73
- "X-FE-Version": "prod-fe-1.0.106",
74
  "Origin": "https://chat.z.ai",
75
  }
76
 
@@ -141,11 +143,11 @@ class ZAIProvider(BaseProvider):
141
  settings.GLM45_THINKING_MODEL: "0727-360B-API", # GLM-4.5-Thinking
142
  settings.GLM45_SEARCH_MODEL: "0727-360B-API", # GLM-4.5-Search
143
  settings.GLM45_AIR_MODEL: "0727-106B-API", # GLM-4.5-Air
144
- settings.GLM45V_MODEL: "glm-4.5v", # GLM-4.5V多模态
145
- settings.GLM46_MODEL: "GLM-4-6-API-V1", # GLM-4.6
146
- settings.GLM46_THINKING_MODEL: "GLM-4-6-API-V1", # GLM-4.6-Thinking
147
- settings.GLM46_SEARCH_MODEL: "GLM-4-6-API-V1", # GLM-4.6-Search
148
- settings.GLM46_ADVANCED_SEARCH_MODEL: "GLM-4-6-API-V1", # GLM-4.6-advanced-search
149
  }
150
 
151
  def get_supported_models(self) -> List[str]:
@@ -155,11 +157,11 @@ class ZAIProvider(BaseProvider):
155
  settings.GLM45_THINKING_MODEL,
156
  settings.GLM45_SEARCH_MODEL,
157
  settings.GLM45_AIR_MODEL,
158
- settings.GLM45V_MODEL,
159
- settings.GLM46_MODEL,
160
- settings.GLM46_THINKING_MODEL,
161
- settings.GLM46_SEARCH_MODEL,
162
- settings.GLM46_ADVANCED_SEARCH_MODEL,
163
  ]
164
 
165
  def _get_proxy_config(self) -> Optional[str]:
@@ -528,7 +530,7 @@ class ZAIProvider(BaseProvider):
528
  requested_model = request.model
529
  is_thinking = "-thinking" in requested_model.casefold()
530
  is_search = "-search" in requested_model.casefold()
531
- is_advanced_search = requested_model == settings.GLM46_ADVANCED_SEARCH_MODEL
532
  is_air = "-air" in requested_model.casefold()
533
 
534
  # 获取上游模型ID
@@ -636,6 +638,7 @@ class ZAIProvider(BaseProvider):
636
  user_id = _extract_user_id_from_token(token)
637
  timestamp_ms = int(time.time() * 1000)
638
  request_id = generate_uuid()
 
639
  try:
640
  signing_metadata = f"requestId,{request_id},timestamp,{timestamp_ms},user_id,{user_id}"
641
  prompt_for_signature = last_user_text or ""
@@ -650,11 +653,11 @@ class ZAIProvider(BaseProvider):
650
  logger.error(f"[Z.AI] 签名生成失败: {e}")
651
  signature = ""
652
 
653
- # 构建请求头 (匹配 X-FE-Version 和 X-Signature)
654
  headers = {
655
  "Authorization": f"Bearer {token}",
656
  "Content-Type": "application/json",
657
- "X-FE-Version": "prod-fe-1.0.106",
658
  "X-Signature": signature,
659
  }
660
 
 
20
  from datetime import datetime
21
  from typing import Dict, List, Any, Optional, AsyncGenerator, Union
22
  from app.utils.user_agent import get_random_user_agent
23
+ from app.utils.fe_version import get_latest_fe_version
24
  from app.utils.signature import generate_signature
25
  from app.providers.base import BaseProvider, ProviderConfig
26
  from app.models.schemas import OpenAIRequest, Message
 
43
  browser_choices = ["chrome", "chrome", "chrome", "edge", "edge", "firefox", "safari"]
44
  browser_type = random.choice(browser_choices)
45
  user_agent = get_random_user_agent(browser_type)
46
+ fe_version = get_latest_fe_version()
47
 
48
  chrome_version = "139"
49
  edge_version = "139"
 
72
  "Cache-Control": "no-cache",
73
  "User-Agent": user_agent,
74
  "Accept-Language": "zh-CN,zh;q=0.9,en;q=0.8",
75
+ "X-FE-Version": fe_version,
76
  "Origin": "https://chat.z.ai",
77
  }
78
 
 
143
  settings.GLM45_THINKING_MODEL: "0727-360B-API", # GLM-4.5-Thinking
144
  settings.GLM45_SEARCH_MODEL: "0727-360B-API", # GLM-4.5-Search
145
  settings.GLM45_AIR_MODEL: "0727-106B-API", # GLM-4.5-Air
146
+ settings.GLM46V_MODEL: "glm-4.6v", # GLM-4.6V多模态
147
+ settings.GLM47_MODEL: "glm-4.7", # GLM-4.7
148
+ settings.GLM47_THINKING_MODEL: "glm-4.7", # GLM-4.7-Thinking
149
+ settings.GLM47_SEARCH_MODEL: "glm-4.7", # GLM-4.7-Search
150
+ settings.GLM47_ADVANCED_SEARCH_MODEL: "glm-4.7", # GLM-4.7-advanced-search
151
  }
152
 
153
  def get_supported_models(self) -> List[str]:
 
157
  settings.GLM45_THINKING_MODEL,
158
  settings.GLM45_SEARCH_MODEL,
159
  settings.GLM45_AIR_MODEL,
160
+ settings.GLM46V_MODEL,
161
+ settings.GLM47_MODEL,
162
+ settings.GLM47_THINKING_MODEL,
163
+ settings.GLM47_SEARCH_MODEL,
164
+ settings.GLM47_ADVANCED_SEARCH_MODEL,
165
  ]
166
 
167
  def _get_proxy_config(self) -> Optional[str]:
 
530
  requested_model = request.model
531
  is_thinking = "-thinking" in requested_model.casefold()
532
  is_search = "-search" in requested_model.casefold()
533
+ is_advanced_search = requested_model == settings.GLM47_ADVANCED_SEARCH_MODEL
534
  is_air = "-air" in requested_model.casefold()
535
 
536
  # 获取上游模型ID
 
638
  user_id = _extract_user_id_from_token(token)
639
  timestamp_ms = int(time.time() * 1000)
640
  request_id = generate_uuid()
641
+ fe_version = get_latest_fe_version()
642
  try:
643
  signing_metadata = f"requestId,{request_id},timestamp,{timestamp_ms},user_id,{user_id}"
644
  prompt_for_signature = last_user_text or ""
 
653
  logger.error(f"[Z.AI] 签名生成失败: {e}")
654
  signature = ""
655
 
656
+ # 构建请求头
657
  headers = {
658
  "Authorization": f"Bearer {token}",
659
  "Content-Type": "application/json",
660
+ "X-FE-Version": fe_version,
661
  "X-Signature": signature,
662
  }
663
 
app/templates/config.html CHANGED
@@ -43,7 +43,7 @@
43
  <label class="block text-sm font-medium text-gray-700">监听端口</label>
44
  <input type="number"
45
  name="listen_port"
46
- value="{{ config.LISTEN_PORT or 8000 }}"
47
  class="mt-1 block w-full rounded-md border-gray-300 shadow-sm focus:border-indigo-500 focus:ring-indigo-500 sm:text-sm">
48
  <p class="mt-1 text-sm text-gray-500">服务监听的端口号</p>
49
  </div>
 
43
  <label class="block text-sm font-medium text-gray-700">监听端口</label>
44
  <input type="number"
45
  name="listen_port"
46
+ value="{{ config.LISTEN_PORT or 7860 }}"
47
  class="mt-1 block w-full rounded-md border-gray-300 shadow-sm focus:border-indigo-500 focus:ring-indigo-500 sm:text-sm">
48
  <p class="mt-1 text-sm text-gray-500">服务监听的端口号</p>
49
  </div>
app/utils/__pycache__/__init__.cpython-311.pyc ADDED
Binary file (276 Bytes). View file
 
app/utils/__pycache__/fe_version.cpython-311.pyc ADDED
Binary file (4.65 kB). View file
 
app/utils/__pycache__/logger.cpython-311.pyc ADDED
Binary file (4.28 kB). View file
 
app/utils/__pycache__/reload_config.cpython-311.pyc ADDED
Binary file (1.13 kB). View file
 
app/utils/__pycache__/signature.cpython-311.pyc ADDED
Binary file (1.93 kB). View file
 
app/utils/__pycache__/token_pool.cpython-311.pyc ADDED
Binary file (30.3 kB). View file
 
app/utils/__pycache__/tool_call_handler.cpython-311.pyc ADDED
Binary file (13.7 kB). View file
 
app/utils/__pycache__/user_agent.cpython-311.pyc ADDED
Binary file (4.04 kB). View file
 
app/utils/fe_version.py ADDED
@@ -0,0 +1,112 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python
2
+ # -*- coding: utf-8 -*-
3
+
4
+ """
5
+ Utility helpers for resolving the latest X-FE-Version value from chat.z.ai.
6
+
7
+ The upstream service embeds the current front-end release identifier inside
8
+ its landing page static asset URLs (e.g. `prod-fe-1.0.107`). The helpers in
9
+ this module fetch the landing page, extract the version string, and cache it
10
+ with a configurable TTL so the expensive network fetch only happens when
11
+ necessary.
12
+ """
13
+
14
+ from __future__ import annotations
15
+
16
+ import re
17
+ import time
18
+ from typing import Optional
19
+
20
+ import httpx
21
+
22
+ from app.utils.logger import get_logger
23
+ from app.utils.user_agent import get_random_user_agent
24
+
25
+ # Base URL to probe for the version string.
26
+ FE_VERSION_SOURCE_URL = "https://chat.z.ai"
27
+
28
+ # Cache TTL in seconds (default: 30 minutes).
29
+ CACHE_TTL_SECONDS = 1800
30
+
31
+ _logger = get_logger()
32
+ _version_pattern = re.compile(r"prod-fe-\d+\.\d+\.\d+")
33
+
34
+ _cached_version: str = ""
35
+ _cached_at: float = 0.0
36
+
37
+
38
+ def _extract_version(page_content: str) -> Optional[str]:
39
+ """Extract the version string from the page content."""
40
+ if not page_content:
41
+ return None
42
+
43
+ matches = _version_pattern.findall(page_content)
44
+ if not matches:
45
+ return None
46
+
47
+ # Choose the highest lexical value to guard against mixed versions.
48
+ return max(matches)
49
+
50
+
51
+
52
+
53
+ def _should_use_cache(force_refresh: bool) -> bool:
54
+ """Determine whether the cached value can be reused."""
55
+ if force_refresh:
56
+ return False
57
+ if not _cached_version:
58
+ return False
59
+ if _cached_at <= 0:
60
+ return False
61
+ return (time.time() - _cached_at) < CACHE_TTL_SECONDS
62
+
63
+
64
+ def get_latest_fe_version(force_refresh: bool = False) -> str:
65
+ """
66
+ Resolve the latest X-FE-Version value from chat.z.ai.
67
+
68
+ The lookup order is:
69
+ 1. Cached value within TTL.
70
+ 2. Remote fetch from chat.z.ai.
71
+
72
+ Raises:
73
+ Exception: If unable to fetch the version from the remote source.
74
+ """
75
+ global _cached_version, _cached_at
76
+
77
+ if _should_use_cache(force_refresh):
78
+ return _cached_version
79
+
80
+ try:
81
+ headers = {"User-Agent": get_random_user_agent("chrome")}
82
+ except Exception:
83
+ headers = {
84
+ "User-Agent": (
85
+ "Mozilla/5.0 (Windows NT 10.0; Win64; x64) "
86
+ "AppleWebKit/537.36 (KHTML, like Gecko) "
87
+ "Chrome/120.0.0.0 Safari/537.36"
88
+ )
89
+ }
90
+
91
+ try:
92
+ with httpx.Client(timeout=10.0, follow_redirects=True) as client:
93
+ response = client.get(FE_VERSION_SOURCE_URL, headers=headers)
94
+ response.raise_for_status()
95
+ version = _extract_version(response.text)
96
+ if version:
97
+ if version != _cached_version:
98
+ _logger.info(f"[Z.AI] Detected X-FE-Version update: {version}")
99
+ _cached_version = version
100
+ _cached_at = time.time()
101
+ return version
102
+
103
+ _logger.error("[Z.AI] Unable to locate X-FE-Version in landing page")
104
+ raise Exception("Unable to locate X-FE-Version in landing page")
105
+ except Exception as exc:
106
+ _logger.error(f"[Z.AI] Failed to fetch X-FE-Version from {FE_VERSION_SOURCE_URL}: {exc}")
107
+ raise Exception(f"Failed to fetch X-FE-Version: {exc}")
108
+
109
+
110
+ def refresh_fe_version() -> str:
111
+ """Force refresh the cached version by bypassing the TTL."""
112
+ return get_latest_fe_version(force_refresh=True)
app/utils/logger.py CHANGED
@@ -56,7 +56,6 @@ def setup_logger(log_dir, log_retention_days=7, log_rotation="1 day", debug_mode
56
  enqueue=True,
57
  catch=True,
58
  )
59
- logger.info(f"✅ 日志文件输出已启用: {log_dir}")
60
  except (PermissionError, OSError) as e:
61
  # 如果无法创建日志目录或文件,降级为仅控制台输出
62
  logger.warning(f"⚠️ 无法创建日志文件 ({e}),将仅使用控制台输出")
 
56
  enqueue=True,
57
  catch=True,
58
  )
 
59
  except (PermissionError, OSError) as e:
60
  # 如果无法创建日志目录或文件,降级为仅控制台输出
61
  logger.warning(f"⚠️ 无法创建日志文件 ({e}),将仅使用控制台输出")
docker-compose.yml CHANGED
@@ -1,8 +1,8 @@
1
  services:
2
  api-server:
3
  build:
4
- context: ..
5
- dockerfile: deploy/Dockerfile
6
  container_name: z-ai-api-server
7
  ports:
8
  - "7860:7860"
@@ -29,7 +29,7 @@ services:
29
  - DB_PATH=/app/data/tokens.db
30
  restart: unless-stopped
31
  healthcheck:
32
- test: ["CMD", "curl", "-f", "http://localhost:7860/v1/models"]
33
  interval: 30s
34
  timeout: 10s
35
  retries: 3
 
1
  services:
2
  api-server:
3
  build:
4
+ context: .
5
+ dockerfile: Dockerfile
6
  container_name: z-ai-api-server
7
  ports:
8
  - "7860:7860"
 
29
  - DB_PATH=/app/data/tokens.db
30
  restart: unless-stopped
31
  healthcheck:
32
+ test: ["CMD", "curl", "-f", "http://localhost:7860/hf/v1/models"]
33
  interval: 30s
34
  timeout: 10s
35
  retries: 3
nginx.conf DELETED
@@ -1,157 +0,0 @@
1
- # Nginx reverse proxy configuration example for Z.AI2API
2
- # This example shows how to deploy the service behind Nginx with a custom path prefix
3
-
4
- # Example 1: Deploy at http://your-domain.com/ai2api
5
- server {
6
- listen 80;
7
- server_name your-domain.com;
8
-
9
- # Forward requests with /ai2api prefix to the backend service
10
- location /ai2api {
11
- # Remove trailing slash redirect (optional, but recommended)
12
- rewrite ^(/ai2api)$ $1/ permanent;
13
-
14
- # Proxy to the backend service
15
- proxy_pass http://127.0.0.1:7860;
16
-
17
- # Pass original host and IP information
18
- proxy_set_header Host $host;
19
- proxy_set_header X-Real-IP $remote_addr;
20
- proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
21
- proxy_set_header X-Forwarded-Proto $scheme;
22
-
23
- # IMPORTANT: Tell the backend about the path prefix
24
- # This ensures all generated URLs include the prefix
25
- proxy_set_header X-Forwarded-Prefix /ai2api;
26
-
27
- # WebSocket and SSE support (for streaming responses)
28
- proxy_http_version 1.1;
29
- proxy_set_header Upgrade $http_upgrade;
30
- proxy_set_header Connection "upgrade";
31
-
32
- # Disable buffering for streaming responses
33
- proxy_buffering off;
34
- proxy_cache off;
35
-
36
- # Timeout settings (adjust as needed)
37
- proxy_connect_timeout 60s;
38
- proxy_send_timeout 300s;
39
- proxy_read_timeout 300s;
40
- }
41
- }
42
-
43
- # Example 2: Deploy at http://your-domain.com/api/chat
44
- server {
45
- listen 80;
46
- server_name example.com;
47
-
48
- location /api/chat {
49
- # Proxy configuration
50
- proxy_pass http://127.0.0.1:7860;
51
-
52
- # Headers
53
- proxy_set_header Host $host;
54
- proxy_set_header X-Real-IP $remote_addr;
55
- proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
56
- proxy_set_header X-Forwarded-Proto $scheme;
57
- proxy_set_header X-Forwarded-Prefix /api/chat;
58
-
59
- # SSE/WebSocket support
60
- proxy_http_version 1.1;
61
- proxy_set_header Upgrade $http_upgrade;
62
- proxy_set_header Connection "upgrade";
63
- proxy_buffering off;
64
- proxy_cache off;
65
- }
66
- }
67
-
68
- # Example 3: Deploy with SSL (HTTPS)
69
- server {
70
- listen 443 ssl http2;
71
- server_name secure.example.com;
72
-
73
- # SSL configuration
74
- ssl_certificate /path/to/cert.pem;
75
- ssl_certificate_key /path/to/key.pem;
76
-
77
- location /ai2api {
78
- proxy_pass http://127.0.0.1:7860;
79
-
80
- proxy_set_header Host $host;
81
- proxy_set_header X-Real-IP $remote_addr;
82
- proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
83
- proxy_set_header X-Forwarded-Proto https;
84
- proxy_set_header X-Forwarded-Prefix /ai2api;
85
-
86
- # SSE/WebSocket support
87
- proxy_http_version 1.1;
88
- proxy_set_header Upgrade $http_upgrade;
89
- proxy_set_header Connection "upgrade";
90
- proxy_buffering off;
91
- proxy_cache off;
92
-
93
- # Security headers (optional)
94
- add_header X-Content-Type-Options nosniff;
95
- add_header X-Frame-Options DENY;
96
- add_header X-XSS-Protection "1; mode=block";
97
- }
98
- }
99
-
100
- # Example 4: Load balancing with multiple backend instances
101
- upstream ai2api_backend {
102
- # Round-robin by default
103
- server 127.0.0.1:7860;
104
- server 127.0.0.1:8081;
105
- server 127.0.0.1:8082;
106
-
107
- # Or use least connections
108
- # least_conn;
109
-
110
- # Or use IP hash for session persistence
111
- # ip_hash;
112
- }
113
-
114
- server {
115
- listen 80;
116
- server_name loadbalanced.example.com;
117
-
118
- location /ai2api {
119
- proxy_pass http://ai2api_backend;
120
-
121
- proxy_set_header Host $host;
122
- proxy_set_header X-Real-IP $remote_addr;
123
- proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
124
- proxy_set_header X-Forwarded-Proto $scheme;
125
- proxy_set_header X-Forwarded-Prefix /ai2api;
126
-
127
- proxy_http_version 1.1;
128
- proxy_set_header Upgrade $http_upgrade;
129
- proxy_set_header Connection "upgrade";
130
- proxy_buffering off;
131
- proxy_cache off;
132
- }
133
- }
134
-
135
- # Important Notes:
136
- #
137
- # 1. Set ROOT_PATH in your .env file to match the Nginx location path:
138
- # ROOT_PATH=/ai2api
139
- #
140
- # 2. Restart both Nginx and the application after configuration changes:
141
- # sudo systemctl reload nginx
142
- # docker-compose restart (or restart your application)
143
- #
144
- # 3. Access URLs will include the prefix:
145
- # - Admin panel: http://your-domain.com/ai2api/admin/login
146
- # - API endpoint: http://your-domain.com/ai2api/v1/chat/completions
147
- # - Health check: http://your-domain.com/ai2api/v1/models
148
- #
149
- # 4. For Docker deployments, make sure to:
150
- # - Add ROOT_PATH to docker-compose.yml environment variables
151
- # - Expose the container port (7860 by default)
152
- #
153
- # 5. Common issues:
154
- # - 404 errors: Check that ROOT_PATH matches the Nginx location path exactly
155
- # - CORS errors: Verify proxy headers are set correctly
156
- # - Streaming not working: Ensure proxy_buffering is off
157
- # - Admin panel CSS/JS not loading: Confirm static files are served with the prefix
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
nginx.conf.example CHANGED
@@ -12,7 +12,7 @@ server {
12
  rewrite ^(/ai2api)$ $1/ permanent;
13
 
14
  # Proxy to the backend service
15
- proxy_pass http://127.0.0.1:7860;
16
 
17
  # Pass original host and IP information
18
  proxy_set_header Host $host;
@@ -47,7 +47,7 @@ server {
47
 
48
  location /api/chat {
49
  # Proxy configuration
50
- proxy_pass http://127.0.0.1:7860;
51
 
52
  # Headers
53
  proxy_set_header Host $host;
@@ -75,7 +75,7 @@ server {
75
  ssl_certificate_key /path/to/key.pem;
76
 
77
  location /ai2api {
78
- proxy_pass http://127.0.0.1:7860;
79
 
80
  proxy_set_header Host $host;
81
  proxy_set_header X-Real-IP $remote_addr;
@@ -100,7 +100,7 @@ server {
100
  # Example 4: Load balancing with multiple backend instances
101
  upstream ai2api_backend {
102
  # Round-robin by default
103
- server 127.0.0.1:7860;
104
  server 127.0.0.1:8081;
105
  server 127.0.0.1:8082;
106
 
@@ -143,12 +143,12 @@ server {
143
  #
144
  # 3. Access URLs will include the prefix:
145
  # - Admin panel: http://your-domain.com/ai2api/admin/login
146
- # - API endpoint: http://your-domain.com/ai2api/v1/chat/completions
147
- # - Health check: http://your-domain.com/ai2api/v1/models
148
  #
149
  # 4. For Docker deployments, make sure to:
150
  # - Add ROOT_PATH to docker-compose.yml environment variables
151
- # - Expose the container port (7860 by default)
152
  #
153
  # 5. Common issues:
154
  # - 404 errors: Check that ROOT_PATH matches the Nginx location path exactly
 
12
  rewrite ^(/ai2api)$ $1/ permanent;
13
 
14
  # Proxy to the backend service
15
+ proxy_pass http://127.0.0.1:8080;
16
 
17
  # Pass original host and IP information
18
  proxy_set_header Host $host;
 
47
 
48
  location /api/chat {
49
  # Proxy configuration
50
+ proxy_pass http://127.0.0.1:8080;
51
 
52
  # Headers
53
  proxy_set_header Host $host;
 
75
  ssl_certificate_key /path/to/key.pem;
76
 
77
  location /ai2api {
78
+ proxy_pass http://127.0.0.1:8080;
79
 
80
  proxy_set_header Host $host;
81
  proxy_set_header X-Real-IP $remote_addr;
 
100
  # Example 4: Load balancing with multiple backend instances
101
  upstream ai2api_backend {
102
  # Round-robin by default
103
+ server 127.0.0.1:8080;
104
  server 127.0.0.1:8081;
105
  server 127.0.0.1:8082;
106
 
 
143
  #
144
  # 3. Access URLs will include the prefix:
145
  # - Admin panel: http://your-domain.com/ai2api/admin/login
146
+ # - API endpoint: http://your-domain.com/ai2api/hf/v1/chat/completions
147
+ # - Health check: http://your-domain.com/ai2api/hf/v1/models
148
  #
149
  # 4. For Docker deployments, make sure to:
150
  # - Add ROOT_PATH to docker-compose.yml environment variables
151
+ # - Expose the container port (8080 by default)
152
  #
153
  # 5. Common issues:
154
  # - 404 errors: Check that ROOT_PATH matches the Nginx location path exactly
xREADME.md DELETED
@@ -1,347 +0,0 @@
1
- # OpenAI 代理服务
2
-
3
- ![License: MIT](https://img.shields.io/badge/license-MIT-blue.svg)
4
- ![Python: 3.9-3.12](https://img.shields.io/badge/python-3.9--3.12-green.svg)
5
- ![FastAPI](https://img.shields.io/badge/framework-FastAPI-009688.svg)
6
-
7
- 基于 FastAPI 的高性能 OpenAI API 兼容代理服务,采用多提供商架构设计,支持 Z.AI(GLM-4.5/4.6 系列)、K2Think、LongCat 等多种 AI 模型。
8
-
9
- ## ✨ 核心特性
10
-
11
- - 🔌 **OpenAI API 兼容** - 无缝对接现有 OpenAI 客户端
12
- - 🏗️ **多提供商架构** - 统一接口支持 Z.AI、K2Think、LongCat
13
- - 🧬 **数据库管理** - SQLite + Web 后台统一管理 Token
14
- - 🚀 **流式响应** - 高性能 SSE 实时流式输出
15
- - 🧠 **思考模式** - 支持 Thinking 模型的推理过程展示
16
- - 🐳 **容器化部署** - Docker/Docker Compose 一键部署
17
- - 🔄 **Token 池** - 智能轮询、容错恢复、健康检查
18
- - 📊 **管理后台** - 实时监控、配置管理
19
- - 🔐 **安全认证** - 密码保护的管理后台访问
20
-
21
- ❤️ 感谢各位的反馈推动项目改进!
22
-
23
- ## 🚀 快速开始
24
-
25
- ### 环境要求
26
-
27
- - Python 3.9-3.12
28
- - pip 或 uv (推荐)
29
-
30
- ### 本地运行
31
-
32
- ```bash
33
- # 1. 克隆项目
34
- git clone https://github.com/ZyphrZero/z.ai2api_python.git
35
- cd z.ai2api_python
36
-
37
- # 2. 安装依赖(使用 uv 推荐)
38
- curl -LsSf https://astral.sh/uv/install.sh | sh
39
- uv sync
40
-
41
- # 或使用 pip
42
- pip install -r requirements.txt
43
-
44
- # 3. 配置环境变量
45
- cp .env.example .env
46
- # 编辑 .env 文件,设置 AUTH_TOKEN 等配置
47
-
48
- # 4. 启动服务
49
- uv run python main.py # 或 python main.py
50
- ```
51
-
52
- **首次运行会自动初始化数据库**,访问以下地址:
53
- - API 文档:http://localhost:7860/docs
54
- - 管理后台:http://localhost:7860/admin(**需要登录**)
55
- - Token 管理:http://localhost:7860/admin/tokens
56
-
57
- > ⚠️ **重要**:
58
- > - 请妥善保管 `AUTH_TOKEN`,不要泄露给他人
59
- > - 管理后台默认密码为 `admin123`,**首次使用后请立即修改**
60
-
61
- ### Docker 部署
62
-
63
- 从 Docker Hub 拉取镜像:
64
-
65
- ```bash
66
- # 拉取最新镜像
67
- docker pull zyphrzero/z-ai2api-python:latest
68
-
69
- # 快速启动(创建数据目录)
70
- mkdir -p data logs
71
-
72
- # 运行容器
73
- docker run -d \
74
- --name z-ai-api-server \
75
- -p 7860:7860 \
76
- -e ADMIN_PASSWORD=admin123 \
77
- -e AUTH_TOKEN=sk-your-api-key \
78
- -e ANONYMOUS_MODE=true \
79
- -e DB_PATH=/app/data/tokens.db \
80
- -v $(pwd)/data:/app/data \
81
- -v $(pwd)/logs:/app/logs \
82
- --restart unless-stopped \
83
- zyphrzero/z-ai2api-python:latest
84
- ```
85
-
86
- 启动服务:
87
-
88
- ```bash
89
- docker compose up -d
90
- ```
91
-
92
- #### 方式二:本地构建
93
-
94
- ```bash
95
- # 进入部署目录
96
- cd deploy
97
-
98
- # 启动服务(会自动构建镜像)
99
- docker compose up -d
100
-
101
- # 查看日志
102
- docker compose logs -f api-server
103
- ```
104
-
105
- #### 数据持久化
106
-
107
- 容器使用卷映射自动持久化数据:
108
-
109
- ```
110
- data/ # 数据库文件存储目录
111
- ├── tokens.db # SQLite 数据库(自动创建)
112
- logs/ # 日志文件存储目录
113
- ```
114
-
115
- 数据在容器重启或重建后仍然保留,无需担心丢失。
116
-
117
- > 📖 **详细文档**:[Docker 部署指南](deploy/README_DOCKER.md)
118
-
119
- ## 📖 支持的模型
120
-
121
- ### Z.AI 提供商(GLM 系列)
122
-
123
- | 模型 | 上游 ID | 特性 |
124
- |------|---------|------|
125
- | `GLM-4.5` | 0727-360B-API | 标准模型,通用对话 |
126
- | `GLM-4.5-Thinking` | 0727-360B-API | 思考模型,显示推理过程 |
127
- | `GLM-4.5-Search` | 0727-360B-API | 搜索模型,实时联网 |
128
- | `GLM-4.5-Air` | 0727-106B-API | 轻量模型,快速响应 |
129
- | `GLM-4.5V` | glm-4.5v | 多模态模型,支持图像理解 |
130
- | `GLM-4.6` | GLM-4-6-API-V1 | 新版标准模型,200K 上下文 |
131
- | `GLM-4.6-Thinking` | GLM-4-6-API-V1 | 新版思考模型,增强推理 |
132
- | `GLM-4.6-Search` | GLM-4-6-API-V1 | 新版搜索模型,改进联网能力 |
133
- | `GLM-4.6-advanced-search` | GLM-4-6-API-V1 | 高级搜索模型,深度研究 |
134
-
135
- ### K2Think 提供商
136
-
137
- | 模型 | 特性 |
138
- |------|------|
139
- | `MBZUAI-IFM/K2-Think` | 高质量推理模型 |
140
-
141
- ### LongCat 提供商
142
-
143
- | 模型 | 特性 |
144
- |------|------|
145
- | `LongCat-Flash` | 快速响应 |
146
- | `LongCat` | 标准模型 |
147
- | `LongCat-Search` | 搜索增强 |
148
-
149
- ## ⚙️ 配置说明
150
-
151
- ### 核心环境变量
152
-
153
- | 变量名 | 默认值 | 说明 |
154
- |--------|--------|------|
155
- | `AUTH_TOKEN` | `sk-your-api-key` | 客户端访问密钥(必填) |
156
- | `ADMIN_PASSWORD` | `admin123` | 管理后台登录密码(**强烈建议修改**) |
157
- | `LISTEN_PORT` | `7860` | 服务监听端口 |
158
- | `DEBUG_LOGGING` | `false` | 调试日志(支持热重载) |
159
- | `ANONYMOUS_MODE` | `true` | Z.AI 匿名模式 |
160
- | `TOOL_SUPPORT` | `true` | Function Call 开关 |
161
- | `SKIP_AUTH_TOKEN` | `false` | 跳过认证(仅开发) |
162
- | `DB_PATH` | `tokens.db` | 数据库文件路径(Docker: `/app/data/tokens.db`) |
163
-
164
- ### Token 配置
165
-
166
- | 变量名 | 说明 |
167
- |--------|------|
168
- | `LONGCAT_TOKEN` | LongCat 认证 Token(可选) |
169
- | `TOKEN_FAILURE_THRESHOLD` | Token 失败阈值(默认 3) |
170
- | `TOKEN_RECOVERY_TIMEOUT` | Token 恢复超时(默认 1800 秒) |
171
-
172
- > 💡 详细配置请参考 [.env.example](.env.example) 或 [deploy/.env.example](deploy/.env.example)
173
-
174
- ## 🔐 管理后台登录
175
-
176
- ### 首次登录
177
-
178
- 1. 启动服务后访问:http://localhost:7860/admin
179
- 2. 自动跳转到登录页面
180
- 3. 输入管理密码(默认:`admin123`)
181
- 4. 登录成功后进入仪表盘
182
-
183
- ### 修改密码
184
-
185
- 在 `.env` 文件中修改 `ADMIN_PASSWORD`:
186
-
187
- ```bash
188
- # 使用强密码(推荐 12 位以上)
189
- ADMIN_PASSWORD=Your_Secure_Password_2025!
190
- ```
191
-
192
- 重启服务后生效。
193
-
194
- ### 安全特性
195
-
196
- - ✅ **Session 管理**:基于 Cookie 的安全 Session
197
- - ✅ **自动过期**:登录后 24 小时自动失效
198
- - ✅ **HttpOnly Cookie**:防止 XSS 攻击
199
- - ✅ **SameSite 保护**:防止 CSRF 攻击
200
- - ✅ **随机 Token**:使用加密安全的随机数生成
201
-
202
- > 💡 详细文档:[管理后台登录功能使用说明](管理后台登录功能使用说明.md)
203
-
204
- ## 🔄 Token 管理
205
-
206
- ### 数据库方式(推荐)
207
-
208
- 项目使用 SQLite 数据库统一管理 Token,首次运行会自动初始化:
209
-
210
- ```bash
211
- # 首次运行自动创建 tokens.db
212
- python main.py
213
-
214
- # 访问 Web 管理后台
215
- http://localhost:7860/admin
216
- ```
217
-
218
- ### 管理后台功能
219
-
220
- - ✅ **密码保护** - 安全的登录认证
221
- - ✅ Token 增删改查
222
- - ✅ 批量导入/导出
223
- - ✅ 启用/禁用 Token
224
- - ✅ Token 有效性检测
225
- - ✅ 多提供商支持(Z.AI/K2Think/LongCat)
226
-
227
- ### Token 池机制
228
-
229
- - **负载均衡**:轮询使用多个 Token 分散请求
230
- - **自动容错**:Token 失败时自动切换
231
- - **自动恢复**:失败 Token 超时后重试
232
- - **智能去重**:自动检测重复 Token
233
- - **回退机制**:认证失败自动降级匿名模式
234
-
235
- ## ❓ 常见问题
236
-
237
- ### Q: 如何获取 AUTH_TOKEN?
238
- A: `AUTH_TOKEN` 是自定义的 API 密钥,用于客户端访问本服务,需在 `.env` 文件或 `docker-compose.yml` 中配置,确保客户端与服务端一致。
239
-
240
- ### Q: 匿名模式是什么?
241
- A: 匿名模式使用临时 Token 访问 Z.AI,避免对话历史共享,保护隐私。设置 `ANONYMOUS_MODE=true` 启用。
242
-
243
- ### Q: 如何管理 Token?
244
- A: 访问 Web 管理后台 http://localhost:7860/admin/tokens(需要先登录)即可增删改查 Token,支持批量导入导出。
245
-
246
- ### Q: 忘记管理后台密码怎么办?
247
- A: 在 `.env` 文件或 `docker-compose.yml` 中修改 `ADMIN_PASSWORD` 为新密码,然后重启服务即可。
248
-
249
- ### Q: Docker 部署时数据库初始化失败?
250
- A: 错误提示 `unable to open database file` 通常是权限问题。解决方案:
251
- ```bash
252
- cd deploy
253
- mkdir -p ./data ./logs
254
- chmod 755 ./data ./logs
255
- docker compose down && docker compose up -d --build
256
- ```
257
- 详见 [Docker 部署指南](deploy/README_DOCKER.md#故障排查)
258
-
259
- ### Q: 如何禁用管理后台登录?
260
- A: 当前版本暂不支持禁用登录功能。如有需要,请手动移除路由中的 `dependencies=[Depends(require_auth)]`。
261
-
262
-
263
- ## 🔑 获取 Token
264
-
265
- ### Z.AI Token
266
-
267
- 1. 访问 [Z.AI 官网](https://chat.z.ai) 并登录
268
- 2. 按 F12 打开开发者工具
269
- 3. 进入 Application → Local Storage → Cookies
270
- 4. 复制 `token` 值
271
-
272
- > ⚠️ 多模态功能需要非匿名 Token
273
-
274
- ### LongCat Token
275
-
276
- 1. 访问 [LongCat 官网](https://longcat.chat/) 并登录美团账号
277
- 2. 按 F12 打开开发者工具
278
- 3. 进入 "Application" -> "Local Storage" -> "Cookie"列表中找到名为`passport_token_key`的值
279
- 4. 复制 `passport_token_key` 值
280
-
281
- ## 🛠️ 技术栈
282
-
283
- | 组件 | 技术 | 版本 | 说明 |
284
- |------|------|------|------|
285
- | Web 框架 | [FastAPI](https://fastapi.tiangolo.com/) | 0.116.1 | 高性能异步框架 |
286
- | ASGI 服务器 | [Granian](https://github.com/emmett-framework/granian) | 2.5.2 | Rust 高性能服务器 |
287
- | HTTP 客户端 | [HTTPX](https://www.python-httpx.org/) | 0.28.1 | 异步 HTTP 客户端 |
288
- | 数据验证 | [Pydantic](https://pydantic.dev/) | 2.11.7 | 类型安全验证 |
289
- | 数据库 | SQLite (aiosqlite) | 0.20.0 | Token 存储 |
290
- | 模板引擎 | Jinja2 | 3.1.4 | Web 后台模板 |
291
- | 日志系统 | [Loguru](https://loguru.readthedocs.io/) | 0.7.3 | 结构化日志 |
292
-
293
- ## 🏗️ 系统架构
294
-
295
- ```
296
- ┌─────────────┐ ┌────────────────────────────────┐ ┌──────────────┐
297
- │ OpenAI │ │ FastAPI Server │ │ Z.AI API │
298
- │ Client │─────▶│ │─────▶│ (GLM-4.x) │
299
- └─────────────┘ │ ┌──────────────────────────┐ │ └──────────────┘
300
- │ │ Provider Router │ │
301
- │ │ ┌────────┬────────────┐ │ │ ┌──────────────┐
302
- │ │ │ Z.AI │ K2Think │ │ │ │ K2Think API │
303
- │ │ │Provider│ Provider │ │ │─────▶│ │
304
- │ │ └────────┴────────────┘ │ │ └──────────────┘
305
- │ │ ┌────────────┐ │ │
306
- │ │ │ LongCat │ │ │ ┌──────────────┐
307
- │ │ │ Provider │ │ │ │ LongCat API │
308
- │ │ └────────────┘ │ │─────▶│ │
309
- │ └──────────────────────────┘ │ └──────────────┘
310
- │ │
311
- │ ┌──────────────────────────┐ │
312
- │ │ Web Admin Dashboard │ │
313
- │ │ (Token/Stats/Monitor) │ │
314
- │ └──────────────────────────┘ │
315
- └────────────────────────────────┘
316
-
317
- ┌─────────┐
318
- │SQLite DB│
319
- │(tokens) │
320
- └─────────┘
321
- ```
322
-
323
- ## 🤝 贡献指南
324
-
325
- 欢迎提交 Issue 和 Pull Request!请确保代码符合 PEP 8 规范。
326
-
327
- ## ⭐ Star History
328
-
329
- [![Star History Chart](https://api.star-history.com/svg?repos=ZyphrZero/z.ai2api_python&type=Date)](https://star-history.com/#ZyphrZero/z.ai2api_python&Date)
330
-
331
- ## 📄 许可证
332
-
333
- 本项目采用 MIT 许可证 - 详见 [LICENSE](LICENSE) 文件。
334
-
335
- ## ⚠️ 免责声明
336
-
337
- - 本项目与 Z.AI、K2Think、LongCat 等 AI 提供商官方无关
338
- - 使用前请确保遵守各提供商的服务条款
339
- - 请勿用于商业用途或违反使用条款的场景
340
- - 项目仅供学习和研究使用
341
- - 用户需自行承担使用风险
342
-
343
- ---
344
-
345
- <div align="center">
346
- Made with ❤️ by the community
347
- </div>