Spaces:

NaseemTahir
/

TTS

Sleeping

TTS

File size: 1,621 Bytes

ff72d7d
 
 
9c989b7
ff72d7d
9c989b7
ff72d7d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9c989b7
 
 
 
 
 
 
 
 
ff72d7d
 
9c989b7
ff72d7d
 
608af9e

import streamlit as st
from TTS.api import TTS
import torch
from scipy.io.wavfile import write
from io import BytesIO
import numpy as np

# Initialize the TTS model
device = "cuda" if torch.cuda.is_available() else "cpu"


@st.cache_resource
def _load_tts_model(use_gpu):
    """Build the Coqui TTS model once and reuse it across script reruns.

    Streamlit re-executes this script from the top on every widget
    interaction; without caching, the model would be constructed again on
    each button click.

    Args:
        use_gpu: Whether to ask Coqui TTS to place the model on the GPU.

    Returns:
        The loaded ``TTS`` instance shared by all reruns and sessions.
    """
    return TTS(
        model_name="tts_models/en/ljspeech/tacotron2-DDC",
        progress_bar=True,
        gpu=use_gpu,
    )


tts = _load_tts_model(device == "cuda")

# App title
st.title("🐸 Coqui TTS - Text to Speech App")

# Text input
text = st.text_area("Enter the text to convert to speech", "Imagine being able to offer your clients curated travel insights at their fingertips.")

# Session-state slot for the most recently generated WAV bytes. Keeping the
# result here lets the player and download button survive the rerun that
# Streamlit performs when "Download Audio" is clicked (on that rerun the
# "Generate Speech" button reads as not pressed).
_AUDIO_STATE_KEY = "generated_wav_bytes"

# Submit button
if st.button("Generate Speech"):
    if not text.strip():
        st.warning("Please enter some text.")
    else:
        # Broad catch is deliberate: this is the top-level UI boundary, and
        # any synthesis failure should surface as a message in the page.
        try:
            # The spinner disappears when synthesis ends, unlike a static
            # status line that would stay on the page.
            with st.spinner("Generating speech..."):
                # Generate audio with the default voice
                wav = tts.tts(text=text)

                # Take the sample rate from the loaded model so the WAV
                # header matches the audio; 22050 is the previous hard-coded
                # value, kept as a fallback if the attribute is missing.
                sample_rate = int(
                    getattr(tts.synthesizer, "output_sample_rate", 22050)
                )

                # Encode the amplitude values as an in-memory float32 WAV file
                buffer = BytesIO()
                write(buffer, sample_rate, np.asarray(wav, dtype=np.float32))

                # Store an immutable bytes snapshot rather than the stream,
                # so both widgets below read the same complete data.
                st.session_state[_AUDIO_STATE_KEY] = buffer.getvalue()
        except Exception as e:
            # Drop any stale result so old audio is not shown next to the error.
            if _AUDIO_STATE_KEY in st.session_state:
                del st.session_state[_AUDIO_STATE_KEY]
            st.error(f"An error occurred: {e}")

# Render the latest result outside the button branch so it persists across reruns.
audio_bytes = st.session_state.get(_AUDIO_STATE_KEY)
if audio_bytes is not None:
    # Display audio player
    st.audio(audio_bytes, format="audio/wav")

    # Option to download the audio file
    st.download_button(
        "Download Audio",
        audio_bytes,
        file_name="output.wav",
        mime="audio/wav",
    )