Spaces:

kawaiipeace
/

VAJA9_TTS_THAI

Sleeping

App Files Files Community

kawaiipeace committed on Jun 26, 2025

Commit

2aaf0f3

1 Parent(s): 15bc933

Initialization

Browse files

Files changed (5) hide show

.env.example +1 -0
.gitignore +1 -0
app.py +61 -0
dockerfile +24 -0
requirements.txt +3 -0

.env.example ADDED Viewed

	@@ -0,0 +1 @@


1	+ API_KEY=

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ .env

app.py ADDED Viewed

	@@ -0,0 +1,61 @@

+import os
+import tempfile
+import uuid
+import gradio as gr
+import requests
+from dotenv import load_dotenv
+# Load environment variables from .env
+load_dotenv()
+API_KEY = os.getenv("API_KEY")
+API_URL = 'https://api.aiforthai.in.th/vaja9/synth_audiovisual'
+def synthesize(text, speaker):
+    headers = {'Apikey': API_KEY, 'Content-Type': 'application/json'}
+    payload = {
+        'input_text': text,
+        'speaker': speaker,
+        'phrase_break': 0,
+        'audiovisual': 0
+    }
+    response = requests.post(API_URL, json=payload, headers=headers)
+    if response.status_code != 200:
+        return None, "Error in synthesis."
+    audio_url = response.json().get('wav_url')
+    if not audio_url:
+        return None, "No audio URL returned."
+    audio_data = requests.get(audio_url, headers={'Apikey': API_KEY})
+    if audio_data.status_code != 200:
+        return None, "Failed to download audio."
+    file_path = f"output_{uuid.uuid4().hex[:8]}.wav"
+    with open(file_path, 'wb') as f:
+        f.write(audio_data.content)
+    return file_path, file_path
+with gr.Blocks() as demo:
+    gr.Markdown("## 🇹🇭 Thai Text-to-Speech with VAJA9")
+    with gr.Row():
+        text_input = gr.Textbox(label="ใส่ข้อความที่ต้องการสังเคราะห์เสียง (Thai text)", lines=3)
+        speaker_selector = gr.Dropdown(
+        choices=[
+            ("เสียงผู้ชาย", 0),
+            ("เสียงผู้หญิง", 1),
+            ("เสียงเด็กผู้ชาย", 2),
+            ("เสียงเด็กผู้หญิง", 3)
+        ],
+        value=1,
+        label="เลือกเสียงพูด"
+        )
+    convert_button = gr.Button("🎤 สังเคราะห์เสียง")
+    audio_output = gr.Audio(label="🔊 เสียงที่สังเคราะห์", type="filepath")
+    download_output = gr.File(label="📥 ดาวน์โหลดไฟล์เสียง")
+    convert_button.click(fn=synthesize, inputs=[text_input, speaker_selector], outputs=[audio_output, download_output])
+demo.launch()

dockerfile ADDED Viewed

	@@ -0,0 +1,24 @@

+# Use an official Python runtime as a parent image
+FROM python:3.10-slim
+# Skip .pyc files and flush stdout/stderr immediately so logs show up live
+ENV PYTHONDONTWRITEBYTECODE=1
+ENV PYTHONUNBUFFERED=1
+# Gradio binds to 127.0.0.1 by default, which is unreachable from outside the
+# container; listen on all interfaces on the port exposed below
+ENV GRADIO_SERVER_NAME=0.0.0.0
+ENV GRADIO_SERVER_PORT=7860
+# Set work directory
+WORKDIR /app
+# Install dependencies first so this layer stays cached until requirements.txt changes
+COPY requirements.txt /app/
+RUN pip install --no-cache-dir --upgrade pip && pip install --no-cache-dir -r requirements.txt
+# Copy the rest of the application
+COPY . /app/
+# Do not bake .env into the image; supply API_KEY as an environment variable or secret at runtime
+# Expose port for Gradio
+EXPOSE 7860
+# Run the application
+CMD ["python", "app.py"]

requirements.txt ADDED Viewed

	@@ -0,0 +1,3 @@

+gradio==4.33.2
+requests
+python-dotenv