Spaces:

PlotweaverModel
/

AudioBook

Running

App Files Community

PlotweaverModel committed 11 days ago

Commit

86adbfb

verified ·

1 Parent(s): 3d91d95

Upload app.py

Browse files

Files changed (1) hide show

app.py +24 -29

app.py CHANGED Viewed

@@ -117,6 +117,10 @@ PRESET_VOICES = [
 # YourVoic voices mapped by language
 # Only include CONFIRMED working voice names
 YOURVOIC_VOICE_MAP = {
     # Indian - confirmed working
     "Hindi": ["Rahul", "Deepika", "Aditya"],
     "Bengali": ["Sneha", "Aryan"],
@@ -127,10 +131,6 @@ YOURVOIC_VOICE_MAP = {
     "Kannada": ["Divya", "Karthik"],
     "Malayalam": ["Nikhil", "Ammu"],
     "Punjabi": ["Vikram", "Simran"],
-    # African - NOT confirmed, will use API lookup
-    # "Afrikaans": [],  # unknown - use API
-    # "Amharic": [],    # unknown - use API
-    # "Swahili": [],    # unknown - use API
     # English fallback
     "English": ["Peter", "Sarah", "Caleb"],
 }
@@ -224,25 +224,33 @@ def generate_speech_yourvoic_with_retry(client, text, voice, yv_model, emotion,
     # Get list of candidate voices
     candidates = []
-    # 1. Try user-selected voice
-    user_voice = get_voice_name(voice)
-    candidates.append(user_voice)
-    # 2. Try hardcoded voices
     hardcoded = YOURVOIC_VOICE_MAP.get(language, [])
     candidates.extend(hardcoded)
-    # 3. Try API-fetched voices
     api_voices = _fetch_yourvoic_voice(yourvoic_lang, yv_model)
     if api_voices:
-        candidates.extend(api_voices)
     # Deduplicate preserving order
     seen = set()
     candidates = [x for x in candidates if not (x in seen or seen.add(x))]
     # Try each candidate until one works
-    for i, candidate_voice in enumerate(candidates[:5]):  # try up to 5
         print(f"[YourVoic] Trying voice '{candidate_voice}' for {language} (attempt {i+1})")
         wav_path, transcript, error = generate_speech_yourvoic(
             client, text, candidate_voice, yv_model, emotion, language, lang_config,
@@ -252,12 +260,14 @@ def generate_speech_yourvoic_with_retry(client, text, voice, yv_model, emotion,
             # Cache this working voice for future chunks
             if language not in YOURVOIC_VOICE_MAP or not YOURVOIC_VOICE_MAP.get(language):
                 YOURVOIC_VOICE_MAP[language] = [candidate_voice]
             return wav_path, transcript, None
         if error and "Invalid voice name" not in str(error):
             # Non-voice error (credits, etc) - don't try more voices
             return None, transcript, error
-    return None, text, f"No valid voice found for {language}. Tried: {candidates[:5]}"
 YOURVOIC_MODELS = [
     "aura-prime -- Balanced quality and speed (recommended)",
@@ -774,15 +784,6 @@ And he would smile - that slow, careful smile that seemed to cost him something
 DESCRIPTION = """
 # Audiobook Generator
 ### English Text to Multi-Language Audiobook
-**Three Voice Engines**
-| Engine | Languages | Best for |
-|--------|-----------|----------|
-| **Qwen Preset** (20 voices) | English, Chinese, Japanese, Korean, German, French, Russian, Portuguese, Spanish, Italian, Arabic | General audiobooks |
-| **Qwen Clone** (your voice) | Same 10 core (excl. Arabic) | Personalized narration |
-| **YourVoic** (1000+ emotional voices) | Hindi, Bengali, Marathi, Telugu, Tamil, Gujarati, Kannada, Malayalam, Punjabi, Swahili, Amharic, Afrikaans | Indian/African languages |
-The app automatically selects the right engine based on your chosen language.
 """
 # Build language dropdown
@@ -936,13 +937,7 @@ with gr.Blocks(title="Audiobook Generator") as demo:
     gr.Markdown(
         "---\n"
-        "**Engines:**\n\n"
-        "**Qwen Preset:** 11 languages (EN, ZH, JA, KO, DE, FR, RU, PT, ES, IT, AR) via Qwen3.5-Omni-Plus\n\n"
-        "**Qwen Clone:** 10 languages (same minus Arabic) via Qwen3-TTS-VC\n\n"
-        "**YourVoic:** Hindi, Bengali, Marathi, Telugu, Tamil, Gujarati, Kannada, Malayalam, Punjabi, "
-        "Swahili, Amharic, Afrikaans via YourVoic API with emotional voices\n\n"
-        "Built with Gradio | Qwen by Alibaba | YourVoic by YourVoic Private Limited"
-    )
 if __name__ == "__main__":
     demo.launch()

 # YourVoic voices mapped by language
 # Only include CONFIRMED working voice names
 YOURVOIC_VOICE_MAP = {
+    # African - Peter works as universal voice
+    "Afrikaans": ["Peter", "Sarah"],
+    "Amharic": ["Peter", "Sarah"],
+    "Swahili": ["Peter", "Sarah"],
     # Indian - confirmed working
     "Hindi": ["Rahul", "Deepika", "Aditya"],
     "Bengali": ["Sneha", "Aryan"],
     "Kannada": ["Divya", "Karthik"],
     "Malayalam": ["Nikhil", "Ammu"],
     "Punjabi": ["Vikram", "Simran"],
     # English fallback
     "English": ["Peter", "Sarah", "Caleb"],
 }
     # Get list of candidate voices
     candidates = []
+    # 1. Try hardcoded voices for this language
     hardcoded = YOURVOIC_VOICE_MAP.get(language, [])
     candidates.extend(hardcoded)
+    # 2. Try user-selected voice
+    user_voice = get_voice_name(voice)
+    if user_voice not in candidates:
+        candidates.insert(0, user_voice)
+    # 3. Try universal English voices (work for many languages like Swahili)
+    for universal in ["Peter", "Sarah", "Caleb"]:
+        if universal not in candidates:
+            candidates.append(universal)
+    # 4. Try API-fetched voices last
     api_voices = _fetch_yourvoic_voice(yourvoic_lang, yv_model)
     if api_voices:
+        for av in api_voices:
+            if av not in candidates:
+                candidates.append(av)
     # Deduplicate preserving order
     seen = set()
     candidates = [x for x in candidates if not (x in seen or seen.add(x))]
     # Try each candidate until one works
+    for i, candidate_voice in enumerate(candidates[:8]):  # try up to 8
         print(f"[YourVoic] Trying voice '{candidate_voice}' for {language} (attempt {i+1})")
         wav_path, transcript, error = generate_speech_yourvoic(
             client, text, candidate_voice, yv_model, emotion, language, lang_config,
             # Cache this working voice for future chunks
             if language not in YOURVOIC_VOICE_MAP or not YOURVOIC_VOICE_MAP.get(language):
                 YOURVOIC_VOICE_MAP[language] = [candidate_voice]
+            elif candidate_voice not in YOURVOIC_VOICE_MAP[language]:
+                YOURVOIC_VOICE_MAP[language].insert(0, candidate_voice)
             return wav_path, transcript, None
         if error and "Invalid voice name" not in str(error):
             # Non-voice error (credits, etc) - don't try more voices
             return None, transcript, error
+    return None, text, f"No valid voice found for {language}. This language may not be supported on your plan. Tried: {candidates[:8]}"
 YOURVOIC_MODELS = [
     "aura-prime -- Balanced quality and speed (recommended)",
 DESCRIPTION = """
 # Audiobook Generator
 ### English Text to Multi-Language Audiobook
 """
 # Build language dropdown
     gr.Markdown(
         "---\n"
+        )
 if __name__ == "__main__":
     demo.launch()