ktts

Running

App Files Files Community

leonelhs committed on Sep 9, 2025

Commit

ce18f8b

verified ·

1 Parent(s): 7eaf5e3

Init app

Browse files

Initial commit for Kokoro TTS API for the Spanish language

Files changed (2) hide show

app.py +82 -0
requirements.txt +5 -0

app.py ADDED Viewed

	@@ -0,0 +1,82 @@

+#######################################################################################
+#
+# MIT License
+#
+# Copyright (c) [2025] [leonelhs@gmail.com]
+#
+# Permission is hereby granted, free of charge, to any person obtaining a copy
+# of this software and associated documentation files (the "Software"), to deal
+# in the Software without restriction, including without limitation the rights
+# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+# copies of the Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice shall be included in all
+# copies or substantial portions of the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+# SOFTWARE.
+#
+#######################################################################################
+# This file implements an API endpoint for the Spanish Kokoro Text-to-Speech (TTS) system.
+# It provides functionality to generate TTS audio from input Spanish text using the Kokoro voice model.
+# Source code is based on or inspired by several projects.
+# For more details and proper attribution, please refer to the following resources:
+#
+# - [Kokoro-82M] - [https://huggingface.co/hexgrad/Kokoro-82M]
+# - [Kokoro-onnx] - [https://github.com/thewh1teagle/kokoro-onnx]
+# - [Misaki] - [https://github.com/hexgrad/misaki]
+import os
+import gradio as gr
+from misaki import espeak
+from misaki.espeak import EspeakG2P
+from kokoro_onnx import Kokoro
+from huggingface_hub import snapshot_download
+KOKORO_REPO_ID = "leonelhs/kokoro-thewh1teagle"
+VOICES = {
+    '🚺 Dora':'ef_dora',
+    '🚹 Alex':'em_alex',
+    '🚹 Santa':'em_santa'
+}
+snapshot = snapshot_download(repo_id=KOKORO_REPO_ID)
+# Misaki G2P with espeak-ng fallback
+fallback = espeak.EspeakFallback(british=False)
+g2p = EspeakG2P(language="es")
+# Kokoro
+model_path = os.path.join(snapshot, "kokoro-v1.0.onnx")
+voices_path = os.path.join(snapshot, "voices-v1.0.bin")
+kokoro = Kokoro(model_path, voices_path)
+def predict(text, voice='ef_dora', speed=1):
+    phonemes, _ = g2p(text)
+    samples, sample_rate = kokoro.create(phonemes, voice, speed, is_phonemes=True)
+    return sample_rate, samples
+app = gr.Interface(
+    predict,
+    [
+        gr.Textbox(label='Input Text'),
+        gr.Dropdown(list(VOICES.items()), value='ef_dora', label='Voice'),
+        gr.Slider(minimum=0.5, maximum=2, value=1, step=0.1, label='Speed')
+    ],
+    gr.Audio(label='Output Audio', interactive=False, streaming=False, autoplay=True),
+    description="Kokoro TTS 🇪🇸 API Endpoint",
+)
+app.launch(share=False, debug=True, show_error=True)
+app.queue()

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+kokoro-onnx
+gradio~=5.44.1
+misaki~=0.9.4
+onnxruntime~=1.22.1
+huggingface-hub~=0.34.4