Spaces:

tudeplom
/

tts

Sleeping

App Files Community

tudeplom committed on Feb 24, 2025

Commit

cb5cebf

verified ·

1 Parent(s): 933e5d5

Update app.py

Browse files

Files changed (1) hide show

app.py +11 -64

app.py CHANGED Viewed

@@ -2,24 +2,17 @@ from fastapi import FastAPI, UploadFile, File
 from fastapi.responses import FileResponse
 from huggingface_hub import InferenceClient
 import os
-import google.generativeai as genai  # Dùng Gemini AI
 # Khởi tạo FastAPI
 app = FastAPI()
 # Lấy API key từ biến môi trường
 HF_API_KEY = os.getenv("HF_API_KEY")
-GOOGLE_API_KEY = os.getenv("GOOGLE_API_KEY")
-if not HF_API_KEY or not GOOGLE_API_KEY:
-    raise ValueError("❌ Missing API keys! Add HF_API_KEY and GOOGLE_API_KEY to Hugging Face Spaces Secrets.")
 # Khởi tạo Hugging Face Client
-hf_client = InferenceClient(token=HF_API_KEY)
-# Khởi tạo Google Gemini AI
-genai.configure(api_key=GOOGLE_API_KEY)
-gemini = genai.GenerativeModel("gemini-pro")
 # Tạo thư mục lưu file tạm
 TEMP_DIR = "temp"
@@ -34,8 +27,8 @@ TTS_MODEL = "facebook/mms-tts-eng"
 async def text_to_speech(text: str):
     output_path = os.path.join(TEMP_DIR, "output.wav")
     try:
-        print(f"🔄 Đang xử lý TTS với model {TTS_MODEL}...")
-        audio = hf_client.text_to_speech(model=TTS_MODEL, text=text)
         with open(output_path, "wb") as f:
             f.write(audio)
         return FileResponse(output_path, media_type="audio/wav", filename="output.wav")
@@ -47,68 +40,22 @@ async def text_to_speech(text: str):
 @app.post("/stt")
 async def speech_to_text(file: UploadFile = File(...)):
     try:
-        print(f"🔄 Đang xử lý STT với model {STT_MODEL}...")
         audio_data = await file.read()
-        response = hf_client.automatic_speech_recognition(model=STT_MODEL, data=audio_data)
-        text = response.get("text", "")
         return {"text": text}
     except Exception as e:
         print(f"❌ Lỗi STT: {e}")
         return {"error": str(e)}
-# 🤖 API Chatbot: Xử lý hội thoại với AI
-@app.post("/chat")
-async def chat_with_ai(message: str):
-    try:
-        print(f"💬 Chatbot nhận tin nhắn: {message}")
-        response = gemini.generate_content(message)
-        reply = response.text
-        return {"reply": reply}
-    except Exception as e:
-        print(f"❌ Lỗi chatbot: {e}")
-        return {"error": str(e)}
-# 🎙 API Voice Chat: Nhận giọng nói -> STT -> AI -> TTS
-@app.post("/voice_chat")
-async def voice_chat(file: UploadFile = File(...)):
-    try:
-        print("🎙 Nhận giọng nói và xử lý...")
-        # 1️⃣ STT: Chuyển giọng nói thành văn bản
-        audio_data = await file.read()
-        stt_response = hf_client.automatic_speech_recognition(model=STT_MODEL, data=audio_data)
-        user_message = stt_response.get("text", "")
-        if not user_message:
-            return {"error": "Không nhận diện được giọng nói."}
-        print(f"📜 Văn bản nhận được: {user_message}")
-        # 2️⃣ Chatbot AI: Phản hồi lại
-        response = gemini.generate_content(user_message)
-        ai_reply = response.text
-        print(f"🤖 Trả lời: {ai_reply}")
-        # 3️⃣ TTS: Chuyển phản hồi thành giọng nói
-        output_path = os.path.join(TEMP_DIR, "response.wav")
-        tts_audio = hf_client.text_to_speech(model=TTS_MODEL, text=ai_reply)
-        with open(output_path, "wb") as f:
-            f.write(tts_audio)
-        return FileResponse(output_path, media_type="audio/wav", filename="response.wav")
-    except Exception as e:
-        print(f"❌ Lỗi voice chat: {e}")
-        return {"error": str(e)}
 # Kiểm tra API
 @app.get("/")
 async def root():
-    return {"message": "✅ Chatbot AI với STT & TTS đang chạy!"}
-# Chạy Uvicorn
 if __name__ == "__main__":
     import uvicorn
     print("🚀 Khởi động FastAPI Server...")
-    uvicorn.run(app, host="0.0.0.0", port=7860)

 from fastapi.responses import FileResponse
 from huggingface_hub import InferenceClient
 import os
 # Khởi tạo FastAPI
 app = FastAPI()
 # Lấy API key từ biến môi trường
 HF_API_KEY = os.getenv("HF_API_KEY")
+if not HF_API_KEY:
+    raise ValueError("❌ Missing HF_API_KEY! Add it to Hugging Face Spaces Secrets.")
 # Khởi tạo Hugging Face Client
+client = InferenceClient(token=HF_API_KEY)
 # Tạo thư mục lưu file tạm
 TEMP_DIR = "temp"
 async def text_to_speech(text: str):
     output_path = os.path.join(TEMP_DIR, "output.wav")
     try:
+        print(f"🔄 Đang xử lý TTS với model {TTS_MODEL}...")  # Debug log
+        audio = client.text_to_speech(model=TTS_MODEL, text=text)  # Sửa lỗi ở đây
         with open(output_path, "wb") as f:
             f.write(audio)
         return FileResponse(output_path, media_type="audio/wav", filename="output.wav")
 @app.post("/stt")
 async def speech_to_text(file: UploadFile = File(...)):
     try:
+        print(f"🔄 Đang xử lý STT với model {STT_MODEL}...")  # Debug log
         audio_data = await file.read()
+        response = client.automatic_speech_recognition(model=STT_MODEL, data=audio_data)
+        text = response.get("text", "")  # Lấy nội dung từ JSON trả về
         return {"text": text}
     except Exception as e:
         print(f"❌ Lỗi STT: {e}")
         return {"error": str(e)}
 # Kiểm tra API
 @app.get("/")
 async def root():
+    return {"message": "✅ TTS & STT API is running!"}
+# Chạy Uvicorn (tránh lỗi "application does not seem to be initialized")
 if __name__ == "__main__":
     import uvicorn
     print("🚀 Khởi động FastAPI Server...")
+    uvicorn.run(app, host="0.0.0.0", port=7860)