Spaces:

amedcj
/

gemini_tts

Running

App Files Files Community

amedcj committed on Oct 12, 2025

Commit

b72c5a4

verified ·

1 Parent(s): 2310741

Update app.py

Browse files

Updated the code

Files changed (1) hide show

app.py +16 -8

app.py CHANGED Viewed

@@ -6,13 +6,10 @@ import wave
 import io
 # --- Configuration ---
-# You can change the voice here. Find other names like 'Puck', 'Charon', etc. in the documentation.
 VOICE_NAME = 'Fenrir'
-# We remove the "cheerfully" style instruction to keep the accent attempt cleaner.
 # --- API Client Initialization ---
 try:
-    # Client loads the key from the environment variable GEMINI_API_KEY set in Hugging Face Secrets.
     client = genai.Client(api_key=os.environ.get("GEMINI_API_KEY"))
 except Exception as e:
     print(f"Error initializing Gemini client: {e}. Ensure GEMINI_API_KEY secret is set.")
@@ -30,16 +27,14 @@ def wave_file(filename, pcm, channels=1, rate=24000, sample_width=2):
 # --- The Gradio Interface Function ---
 def gemini_tts_kurmanji(kurmanji_text: str) -> str:
     """
-    Takes a Kurmanji text prompt and uses a natural language instruction to guide the TTS.
     """
     if not client:
-        # Raise a Gradio error if the client failed to initialize (usually the API key issue)
         raise gr.Error("Gemini API Client failed to initialize. Check the GEMINI_API_KEY secret.")
     print(f"Attempting to generate Kurmanji speech: '{kurmanji_text}' with voice {VOICE_NAME}")
     try:
-        # The key change: Instruct the model to speak the text in Kurdish Kurmanji.
         prompt = f"Speak the following text in Kurdish Kurmanji: {kurmanji_text}"
         response = client.models.generate_content(
@@ -57,6 +52,19 @@ def gemini_tts_kurmanji(kurmanji_text: str) -> str:
             )
         )
         data = response.candidates[0].content.parts[0].inline_data.data
         file_name = 'kurmanji_output.wav'
         wave_file(file_name, data)
@@ -75,7 +83,7 @@ demo = gr.Interface(
     fn=gemini_tts_kurmanji,
     inputs=gr.Textbox(
         lines=3,
-        placeholder="Mînak: Silav, roj baş. Ez dixwazim Kurdî biaxivim.", # Example Kurmanji Text
         label="Kurmanji Text to Convert"
     ),
     outputs=gr.Audio(
@@ -83,7 +91,7 @@ demo = gr.Interface(
         label="Generated Kurmanji Speech"
     ),
     title=f"🗣️ Gemini TTS for Kurdish Kurmanji (Voice: {VOICE_NAME})",
-    description="Uses Gemini 2.5 Flash and natural language prompting to generate Kurdish Kurmanji speech."
 )
 if __name__ == "__main__":

 import io
 # --- Configuration ---
 VOICE_NAME = 'Fenrir'
 # --- API Client Initialization ---
 try:
     client = genai.Client(api_key=os.environ.get("GEMINI_API_KEY"))
 except Exception as e:
     print(f"Error initializing Gemini client: {e}. Ensure GEMINI_API_KEY secret is set.")
 # --- The Gradio Interface Function ---
 def gemini_tts_kurmanji(kurmanji_text: str) -> str:
     """
+    Takes a Kurmanji text prompt, handles API errors, and checks the response content.
     """
     if not client:
         raise gr.Error("Gemini API Client failed to initialize. Check the GEMINI_API_KEY secret.")
     print(f"Attempting to generate Kurmanji speech: '{kurmanji_text}' with voice {VOICE_NAME}")
     try:
         prompt = f"Speak the following text in Kurdish Kurmanji: {kurmanji_text}"
         response = client.models.generate_content(
             )
         )
+        # --- NEW: Robust Error Checking ---
+        if not response.candidates or not response.candidates[0].content:
+            # Check for block reasons (e.g., safety, policy)
+            block_reason = response.candidates[0].finish_reason.name if response.candidates else "NO_CANDIDATE"
+            # This is the most important part for debugging your 'NoneType' error:
+            raise gr.Error(
+                f"TTS Generation Failed. Reason: The model returned an empty response. "
+                f"The finish reason was: {block_reason}. "
+                f"This may indicate a quota limit, or the model could not generate the requested Kurmanji speech."
+            )
+        # Proceed if the content part is valid
         data = response.candidates[0].content.parts[0].inline_data.data
         file_name = 'kurmanji_output.wav'
         wave_file(file_name, data)
     fn=gemini_tts_kurmanji,
     inputs=gr.Textbox(
         lines=3,
+        placeholder="Mînak: Silav, roj baş. Ez dixwazim Kurdî biaxivim.",
         label="Kurmanji Text to Convert"
     ),
     outputs=gr.Audio(
         label="Generated Kurmanji Speech"
     ),
     title=f"🗣️ Gemini TTS for Kurdish Kurmanji (Voice: {VOICE_NAME})",
+    description="Uses Gemini 2.5 Flash and natural language prompting. Check the logs for specific failure reasons."
 )
 if __name__ == "__main__":