File size: 1,236 Bytes
34227c3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
import gradio as gr
import edge_tts
import asyncio
import tempfile

async def text_to_speech(text, voice, rate, pitch):
    if not text.strip():
        return None
    voice_short_name = voice.split(" - ")[0]
    communicate = edge_tts.Communicate(text, voice_short_name, rate=f"{rate:+d}%", pitch=f"{pitch:+d}Hz")
    with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp:
        await communicate.save(tmp.name)
        return tmp.name

async def build_ui():
    voices = await edge_tts.list_voices()
    voice_map = {f"{v['ShortName']} - {v['Locale']}": v['ShortName'] for v in voices}
    with gr.Blocks() as demo:
        gr.Markdown("# 🗣️ Text to Speech")
        text_in = gr.Textbox(label="Text", lines=4)
        voice = gr.Dropdown(choices=list(voice_map.keys()), label="Voice")
        rate = gr.Slider(-50, 50, 0, step=1, label="Rate (%)")
        pitch = gr.Slider(-20, 20, 0, step=1, label="Pitch (Hz)")
        out = gr.Audio(label="Generated Speech", type="filepath")
        btn = gr.Button("Generate")
        btn.click(lambda t, v, r, p: asyncio.run(text_to_speech(t, v, r, p)),
                  inputs=[text_in, voice, rate, pitch], outputs=out)
    return demo

demo = asyncio.run(build_ui())