Spaces:

flysuper
/

tts

Sleeping

App Files Files Community

flysuper committed on Oct 21, 2025

Commit

0c322d0

verified ·

1 Parent(s): 00c8bc6

Upload 5 files

Browse files

Files changed (5) hide show

.dockerignore +57 -0
Dockerfile +32 -0
README.md +168 -10
app.py +279 -0
requirements.txt +6 -0

.dockerignore ADDED Viewed

	@@ -0,0 +1,57 @@

+# Git
+.git
+.gitignore
+# Python
+__pycache__
+*.pyc
+*.pyo
+*.pyd
+.Python
+env
+pip-log.txt
+pip-delete-this-directory.txt
+.tox
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+*.log
+.git
+.mypy_cache
+.pytest_cache
+.hypothesis
+# OS
+.DS_Store
+.DS_Store?
+._*
+.Spotlight-V100
+.Trashes
+ehthumbs.db
+Thumbs.db
+# IDE
+.vscode
+.idea
+*.swp
+*.swo
+*~
+# Project specific
+output/
+*.mp3
+*.wav
+*.ogg
+logs/
+*.log
+# Documentation
+README.md
+HUGGINGFACE_DEPLOYMENT.md
+deploy_to_hf.py
+deploy_hf.bat
+Dockerfile_HF
+README_HF.md

Dockerfile ADDED Viewed

	@@ -0,0 +1,32 @@

+# Container image for the Edge TTS API; the app listens on port 7860.
+FROM python:3.9-slim
+# Set the working directory
+WORKDIR /app
+# Install system dependencies (curl is what the HEALTHCHECK below invokes)
+RUN apt-get update && apt-get install -y \
+    gcc \
+    curl \
+    && rm -rf /var/lib/apt/lists/*
+# Copy the dependency manifest first so the pip layer is cached independently of app.py
+COPY requirements.txt .
+# Install Python dependencies
+RUN pip install --no-cache-dir -r requirements.txt
+# Copy the application code
+COPY app.py .
+# Create required directories (app.py mounts ./static only if it exists)
+RUN mkdir -p static
+# Expose the port (Hugging Face Spaces uses 7860)
+EXPOSE 7860
+# Health check against the app's /health endpoint
+HEALTHCHECK --interval=30s --timeout=30s --start-period=5s --retries=3 \
+    CMD curl -f http://localhost:7860/health || exit 1
+# Start command
+CMD ["python", "app.py"]

README.md CHANGED Viewed

@@ -1,10 +1,168 @@
----
-title: Tts
-emoji: 😻
-colorFrom: indigo
-colorTo: gray
-sdk: docker
-pinned: false
----
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

+---
+title: Edge TTS API
+emoji: 🎤
+colorFrom: blue
+colorTo: purple
+sdk: docker
+pinned: false
+license: mit
+short_description: 基於 Microsoft Edge TTS 的文字轉語音 API 服務
+---
+# Edge TTS API 服務
+這是一個基於 Microsoft Edge TTS 的文字轉語音網路服務，使用 FastAPI 框架構建，現在部署在 Hugging Face Spaces 上。
+## 功能特色
+- 🎤 支援多種語音和語言
+- ⚡ 快速響應的 API 服務
+- 🔧 可調整語速、音量和音調
+- 📱 支援 CORS，可用於前端應用
+- 📊 自動生成的 API 文檔
+- 🗂️ 文件管理功能
+## 快速開始
+### 1. 訪問服務
+- **API 服務**: 點擊右上角的 "View API" 按鈕
+- **API 文檔**: `https://your-space-name.hf.space/docs`
+- **健康檢查**: `https://your-space-name.hf.space/health`
+### 2. 使用 API
+#### 獲取語音列表
+```http
+GET /voices
+```
+#### 文字轉語音 (POST)
+```http
+POST /tts
+Content-Type: application/json
+{
+    "text": "你好，世界！",
+    "voice": "zh-TW-HsiaoChenNeural",
+    "rate": "+0%",
+    "volume": "+0%",
+    "pitch": "+0Hz"
+}
+```
+#### 文字轉語音 (GET)
+```http
+GET /tts?text=你好世界&voice=zh-TW-HsiaoChenNeural&rate=%2B0%25&volume=%2B0%25&pitch=%2B0Hz
+```
+## 使用範例
+### Python 客戶端
+```python
+import requests
+# 替換為您的 Hugging Face Space URL
+base_url = "https://your-space-name.hf.space"
+# 使用 POST 方法
+response = requests.post(f"{base_url}/tts", json={
+    "text": "你好，這是測試文字",
+    "voice": "zh-TW-HsiaoChenNeural"
+})
+if response.json()["success"]:
+    audio_url = response.json()["audio_url"]
+    print(f"音頻文件：{base_url}{audio_url}")
+# 使用 GET 方法
+response = requests.get(f"{base_url}/tts", params={
+    "text": "你好，這是測試文字",
+    "voice": "zh-TW-HsiaoChenNeural"
+})
+# 直接下載音頻文件
+with open("output.mp3", "wb") as f:
+    f.write(response.content)
+```
+### JavaScript 客戶端
+```javascript
+// 替換為您的 Hugging Face Space URL
+const baseUrl = "https://your-space-name.hf.space";
+// 使用 POST 方法
+fetch(`${baseUrl}/tts`, {
+    method: 'POST',
+    headers: {
+        'Content-Type': 'application/json',
+    },
+    body: JSON.stringify({
+        text: '你好，這是測試文字',
+        voice: 'zh-TW-HsiaoChenNeural'
+    })
+})
+.then(response => response.json())
+.then(data => {
+    if (data.success) {
+        console.log('音頻文件：', `${baseUrl}${data.audio_url}`);
+    }
+});
+// 使用 GET 方法
+const audioUrl = `${baseUrl}/tts?text=你好世界&voice=zh-TW-HsiaoChenNeural`;
+window.open(audioUrl, '_blank');
+```
+## 常用語音
+### 🇹🇼 台灣語音
+- `zh-TW-HsiaoChenNeural` - 台灣女聲 (HsiaoChen)
+- `zh-TW-HsiaoYuNeural` - 台灣女聲 (HsiaoYu)
+- `zh-TW-YunJheNeural` - 台灣男聲 (YunJhe)
+### 🇨🇳 中國語音
+- `zh-CN-XiaoxiaoNeural` - 中國女聲 (Xiaoxiao)
+- `zh-CN-XiaoyiNeural` - 中國女聲 (Xiaoyi)
+- `zh-CN-YunjianNeural` - 中國男聲 (Yunjian)
+- `zh-CN-YunxiNeural` - 中國男聲 (Yunxi)
+- `zh-CN-YunxiaNeural` - 中國男聲 (Yunxia)
+- `zh-CN-YunyangNeural` - 中國男聲 (Yunyang)
+### 🇺🇸 美國語音
+- `en-US-JennyNeural` - 美國女聲 (Jenny)
+- `en-US-GuyNeural` - 美國男聲 (Guy)
+### 🇬🇧 英國語音
+- `en-GB-SoniaNeural` - 英國女聲 (Sonia)
+- `en-GB-RyanNeural` - 英國男聲 (Ryan)
+## 參數說明
+### 語速調整 (rate)
+- `+50%` - 加快 50%
+- `-50%` - 減慢 50%
+- `+0%` - 正常速度
+### 音量調整 (volume)
+- `+50%` - 增加音量 50%
+- `-50%` - 減少音量 50%
+- `+0%` - 正常音量
+### 音調調整 (pitch)
+- `+50Hz` - 提高音調
+- `-50Hz` - 降低音調
+- `+0Hz` - 正常音調
+## 注意事項
+1. 生成的音頻文件會保存在臨時目錄中
+2. 文件會自動生成唯一 ID，避免衝突
+3. 服務需要網路連接才能使用 Microsoft Edge TTS
+4. 在 Hugging Face Spaces 上，音頻文件不會定時自動清理：僅在服務關閉時刪除整個臨時目錄，也可透過 `DELETE /audio/{file_id}.mp3` 手動刪除
+## 授權
+本項目基於 MIT 授權條款開源。

app.py ADDED Viewed

	@@ -0,0 +1,279 @@

+"""
+Hugging Face Spaces 入口點
+基於 main.py 但針對 Hugging Face Spaces 進行優化
+"""
+from fastapi import FastAPI, HTTPException, Query, Request
+from fastapi.responses import FileResponse, JSONResponse
+from fastapi.middleware.cors import CORSMiddleware
+from fastapi.staticfiles import StaticFiles
+from pydantic import BaseModel
+import edge_tts
+import asyncio
+import os
+import uuid
+from typing import Optional, List
+import aiofiles
+import json
+from urllib.parse import urlparse
+import tempfile
+import shutil
+# Module-level setup: create the FastAPI application, install CORS handling,
+# prepare the temporary output directory and declare the origin allow-list.
+app = FastAPI(
+    title="Edge TTS API",
+    description="A web service for text-to-speech using Microsoft Edge TTS",
+    version="1.0.0"
+)
+# Add the CORS middleware (all origins allowed to make testing easier)
+# NOTE(review): wildcard origins together with allow_credentials=True is very
+# permissive — confirm this is intended outside of testing.
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+# Create the temporary output directory for generated audio files
+OUTPUT_DIR = tempfile.mkdtemp(prefix="edge_tts_")
+# mkdtemp has already created the directory; with exist_ok=True this is a no-op safeguard
+os.makedirs(OUTPUT_DIR, exist_ok=True)
+# Allow-list of request sources; _is_origin_allowed compares the Origin and
+# Referer headers against these entries.
+ALLOWED_ORIGINS = [
+    "https://www.dfes.ntpc.edu.tw",
+    "https://script.google.com/a/macros/apps.dfes.ntpc.edu.tw",
+    "https://www.dfes.ntpc.edu.tw/"
+]
+# Mount static files (only if the directory exists)
+if os.path.exists("static"):
+    app.mount("/static", StaticFiles(directory="static"), name="static")
+# Request body accepted by POST /tts; every field except `text` has a default.
+class TTSRequest(BaseModel):
+    text: str  # text to convert to speech
+    voice: Optional[str] = "zh-TW-HsiaoChenNeural"  # voice name handed to edge_tts.Communicate
+    rate: Optional[str] = "+0%"  # speaking-rate adjustment
+    volume: Optional[str] = "+0%"  # volume adjustment
+    pitch: Optional[str] = "+0Hz"  # pitch adjustment
+# Response body returned by POST /tts for both success and failure.
+class TTSResponse(BaseModel):
+    success: bool  # True when the audio file was generated
+    message: str  # human-readable status message
+    audio_url: Optional[str] = None  # relative "/audio/<id>.mp3" path, set on success
+    error: Optional[str] = None  # error detail ("forbidden" or the exception text), set on failure
+# 來源檢查函數
+def _is_origin_allowed(request: Request) -> bool:
+    """檢查請求來源是否被允許"""
+    origin = request.headers.get("origin")
+    referer = request.headers.get("referer")
+    # 檢查 Origin 標頭
+    if origin:
+        for allowed_origin in ALLOWED_ORIGINS:
+            if origin.startswith(allowed_origin):
+                return True
+    # 檢查 Referer 標頭（備用檢查）
+    if referer:
+        for allowed_origin in ALLOWED_ORIGINS:
+            if referer.startswith(allowed_origin):
+                return True
+    # 如果沒有 Origin 或 Referer 標頭，檢查是否為直接 API 調用
+    # 允許來自 Hugging Face Spaces 的直接調用
+    user_agent = request.headers.get("user-agent", "")
+    if "huggingface" in user_agent.lower():
+        return True
+    return False
+@app.get("/")
+async def root():
+    """根路徑，返回 API 信息"""
+    return {
+        "message": "Edge TTS API Service - Hugging Face Spaces",
+        "version": "1.0.0",
+        "endpoints": {
+            "GET /voices": "獲取所有可用語音",
+            "POST /tts": "文字轉語音",
+            "GET /tts": "文字轉語音 (GET 方法)",
+            "GET /health": "健康檢查",
+            "GET /allowed-origins": "查看允許的來源網址"
+        },
+        "note": "此服務部署在 Hugging Face Spaces 上，僅允許特定來源網址訪問"
+    }
+@app.get("/health")
+async def health_check():
+    """健康檢查端點"""
+    return {"status": "healthy", "service": "edge-tts-api", "platform": "huggingface-spaces"}
+@app.get("/allowed-origins")
+async def get_allowed_origins():
+    """獲取允許的來源列表（僅供管理員查看）"""
+    return {
+        "allowed_origins": ALLOWED_ORIGINS,
+        "count": len(ALLOWED_ORIGINS),
+        "description": "允許的來源網址清單，支援擴充匹配"
+    }
+@app.get("/voices")
+async def get_voices():
+    """獲取所有可用的語音列表"""
+    try:
+        voices = await edge_tts.list_voices()
+        return {
+            "success": True,
+            "voices": voices,
+            "count": len(voices)
+        }
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=f"獲取語音列表失敗: {str(e)}")
+@app.post("/tts", response_model=TTSResponse)
+async def text_to_speech(request: TTSRequest, http_request: Request):
+    """文字轉語音 API (POST 方法)"""
+    try:
+        # 檢查來源是否被允許
+        if not _is_origin_allowed(http_request):
+            return TTSResponse(
+                success=False,
+                message="來源網站未被允許使用此 API",
+                error="forbidden"
+            )
+        # 生成唯一文件名
+        file_id = str(uuid.uuid4())
+        output_file = os.path.join(OUTPUT_DIR, f"{file_id}.mp3")
+        # 創建 TTS 通信對象
+        communicate = edge_tts.Communicate(
+            text=request.text,
+            voice=request.voice,
+            rate=request.rate,
+            volume=request.volume,
+            pitch=request.pitch
+        )
+        # 生成語音文件
+        await communicate.save(output_file)
+        # 檢查文件是否成功創建
+        if not os.path.exists(output_file):
+            raise Exception("語音文件生成失敗")
+        return TTSResponse(
+            success=True,
+            message="語音生成成功",
+            audio_url=f"/audio/{file_id}.mp3"
+        )
+    except Exception as e:
+        return TTSResponse(
+            success=False,
+            message="語音生成失敗",
+            error=str(e)
+        )
+@app.get("/tts")
+async def text_to_speech_get(
+    text: str = Query(..., description="要轉換的文字"),
+    voice: str = Query("zh-TW-HsiaoChenNeural", description="語音名稱"),
+    rate: str = Query("+0%", description="語速調整"),
+    volume: str = Query("+0%", description="音量調整"),
+    pitch: str = Query("+0Hz", description="音調調整"),
+    http_request: Request = None
+):
+    """文字轉語音 API (GET 方法)"""
+    try:
+        print(f"TTS 請求: text={text}, voice={voice}, rate={rate}, volume={volume}, pitch={pitch}")
+        # 檢查來源是否被允許
+        if http_request and not _is_origin_allowed(http_request):
+            raise HTTPException(
+                status_code=403,
+                detail="來源網站未被允許使用此 API"
+            )
+        # 生成唯一文件名
+        file_id = str(uuid.uuid4())
+        output_file = os.path.join(OUTPUT_DIR, f"{file_id}.mp3")
+        print(f"輸出文件路徑: {output_file}")
+        # 創建 TTS 通信對象
+        communicate = edge_tts.Communicate(
+            text=text,
+            voice=voice,
+            rate=rate,
+            volume=volume,
+            pitch=pitch
+        )
+        # 生成語音文件
+        print("開始生成語音文件...")
+        await communicate.save(output_file)
+        print("語音文件生成完成")
+        # 檢查文件是否成功創建
+        if not os.path.exists(output_file):
+            print(f"文件不存在: {output_file}")
+            raise HTTPException(status_code=500, detail="語音文件生成失敗")
+        file_size = os.path.getsize(output_file)
+        print(f"文件大小: {file_size} bytes")
+        # 返回音頻文件
+        return FileResponse(
+            output_file,
+            media_type="audio/mpeg",
+            filename=f"tts_{file_id}.mp3"
+        )
+    except Exception as e:
+        print(f"TTS 錯誤: {str(e)}")
+        import traceback
+        traceback.print_exc()
+        raise HTTPException(status_code=500, detail=f"語音生成失敗: {str(e)}")
+@app.get("/audio/{file_id}.mp3")
+async def get_audio_file(file_id: str):
+    """獲取生成的音頻文件"""
+    file_path = os.path.join(OUTPUT_DIR, f"{file_id}.mp3")
+    if not os.path.exists(file_path):
+        raise HTTPException(status_code=404, detail="音頻文件不存在")
+    return FileResponse(
+        file_path,
+        media_type="audio/mpeg",
+        filename=f"tts_{file_id}.mp3"
+    )
+@app.delete("/audio/{file_id}.mp3")
+async def delete_audio_file(file_id: str):
+    """刪除音頻文件"""
+    file_path = os.path.join(OUTPUT_DIR, f"{file_id}.mp3")
+    if not os.path.exists(file_path):
+        raise HTTPException(status_code=404, detail="音頻文件不存在")
+    try:
+        os.remove(file_path)
+        return {"success": True, "message": "文件刪除成功"}
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=f"文件刪除失敗: {str(e)}")
+# 清理函數（可選）
+@app.on_event("shutdown")
+async def cleanup():
+    """應用關閉時清理臨時文件"""
+    try:
+        if os.path.exists(OUTPUT_DIR):
+            shutil.rmtree(OUTPUT_DIR)
+    except Exception:
+        pass
+# Script entry point: serve the app with uvicorn on all interfaces, port 7860.
+if __name__ == "__main__":
+    import uvicorn
+    uvicorn.run(app, host="0.0.0.0", port=7860)

requirements.txt ADDED Viewed

	@@ -0,0 +1,6 @@

+fastapi==0.104.1
+uvicorn[standard]==0.24.0
+edge-tts==7.2.0
+python-multipart==0.0.6
+aiofiles==23.2.1
+requests==2.31.0