Spaces:

kambris
/

Varabic

Sleeping

App Files Files Community

kambris committed on Jun 16, 2025

Commit

9cdcbb7

verified ·

1 Parent(s): 858d077

Update app.py

Browse files

Files changed (1) hide show

app.py +24 -26

app.py CHANGED Viewed

@@ -17,9 +17,15 @@ translit_map = {
     "l": "ل", "m": "م", "n": "ن", "h": "ه",
     "w": "و", "y": "ي", "x": "ء", "o": "أُ",
-    # Vowels
     "i": "إِ", "u": "أُ", "e": "أ",
     # Space and punctuation
     " ": " ", ".": ".", ",": "،", "?": "؟", "!": "!"
 }
@@ -31,7 +37,7 @@ def transliterate(text):
     output = ""
     i = 0
-    text = text.lower()  # Convert to lowercase for consistent mapping
     while i < len(text):
         # Check for two-character combinations first
@@ -49,21 +55,13 @@ def transliterate(text):
     return output
-def arabic_tts(arabic_text, tts_option="standard"):
-    """Generate TTS audio for Arabic text with different pronunciation options."""
     if not arabic_text or not arabic_text.strip():
         return None
     try:
-        # Remove diacritics for more neutral pronunciation
-        if tts_option == "neutral":
-            # Remove common Arabic diacritics that add inflection
-            diacritics = "ًٌٍَُِّْ"
-            cleaned_text = ''.join(char for char in arabic_text if char not in diacritics)
-            tts = gTTS(text=cleaned_text, lang='ar', slow=True)
-        else:
-            tts = gTTS(text=arabic_text, lang='ar', slow=False)
         # Create temporary file
         tmp_file = tempfile.NamedTemporaryFile(delete=False, suffix=".mp3")
         tts.save(tmp_file.name)
@@ -104,14 +102,23 @@ with gr.Blocks(title="Arabic Transliterator") as demo:
                 `S` → ص, `D` → ض, `T` → ط, `Z` → ظ, `'` → ع, `f` → ف, `q` → ق, `k` → ك
                 `l` → ل, `m` → م, `n` → ن, `h` → ه, `w` → و, `y` → ي, `x` → ء
-                **Vowels:**
                 `o` → أُ, `i` → إِ, `u` → أُ, `e` → أ
                 **Tips:**
                 - Use capital letters for emphatic consonants (S, D, T, Z, H)
                 - Combinations like 'th', 'kh' are processed before single letters
                 - Use apostrophe (') for the letter ع (ayn)
                 - Use 'x' for hamza ء when standalone
                 """)
         with gr.Column():
@@ -124,15 +131,10 @@ with gr.Blocks(title="Arabic Transliterator") as demo:
     with gr.Row():
         convert_btn = gr.Button("🔄 Transliterate", variant="primary")
         tts_btn = gr.Button("🔊 Speak Arabic", variant="secondary")
-        neutral_tts_btn = gr.Button("🔊 Neutral Pronunciation", variant="secondary")
         combined_btn = gr.Button("🔄🔊 Transliterate & Speak", variant="secondary")
     tts_audio = gr.Audio(label="Audio Output", type="filepath")
-    # Options
-    with gr.Row():
-        gr.Markdown("**TTS Options:** Standard includes natural inflections, Neutral removes diacritics for clearer pronunciation")
     # Event handlers
     convert_btn.click(
         fn=transliterate,
@@ -141,13 +143,7 @@ with gr.Blocks(title="Arabic Transliterator") as demo:
     )
     tts_btn.click(
-        fn=lambda text: arabic_tts(text, "standard"),
-        inputs=arabic_output,
-        outputs=tts_audio
-    )
-    neutral_tts_btn.click(
-        fn=lambda text: arabic_tts(text, "neutral"),
         inputs=arabic_output,
         outputs=tts_audio
     )
@@ -157,6 +153,8 @@ with gr.Blocks(title="Arabic Transliterator") as demo:
         inputs=latin_input,
         outputs=[arabic_output, tts_audio]
     )
 if __name__ == "__main__":
     demo.launch()

     "l": "ل", "m": "م", "n": "ن", "h": "ه",
     "w": "و", "y": "ي", "x": "ء", "o": "أُ",
+    # Initial vowels (hamza with vowel for word beginnings)
     "i": "إِ", "u": "أُ", "e": "أ",
+    # Short vowels (diacritics)
+    "I": "ِ", "U": "ُ", "A": "َ", "~": "ّ", "^": "ْ",
+    # Tanween (double diacritics)
+    "an": "ً", "un": "ٌ", "in": "ٍ",
     # Space and punctuation
     " ": " ", ".": ".", ",": "،", "?": "؟", "!": "!"
 }
     output = ""
     i = 0
+    # Don't convert to lowercase to preserve capital letter mappings
     while i < len(text):
         # Check for two-character combinations first
     return output
+def arabic_tts(arabic_text):
+    """Generate TTS audio for Arabic text."""
     if not arabic_text or not arabic_text.strip():
         return None
     try:
+        tts = gTTS(text=arabic_text, lang='ar', slow=False)
         # Create temporary file
         tmp_file = tempfile.NamedTemporaryFile(delete=False, suffix=".mp3")
         tts.save(tmp_file.name)
                 `S` → ص, `D` → ض, `T` → ط, `Z` → ظ, `'` → ع, `f` → ف, `q` → ق, `k` → ك
                 `l` → ل, `m` → م, `n` → ن, `h` → ه, `w` → و, `y` → ي, `x` → ء
+                **Initial Vowels (Word Beginnings):**
                 `o` → أُ, `i` → إِ, `u` → أُ, `e` → أ
+                **Short Vowels (Diacritics):**
+                `I` → ِ (Kasra), `U` → ُ (Damma), `A` → َ (Fatha), `~` → ّ (Shadda), `^` → ْ (Sukun)
+                **Tanween (Double Diacritics):**
+                `an` → ً (Fathatan), `un` → ٌ (Dammatan), `in` → ٍ (Kasratan)
                 **Tips:**
                 - Use capital letters for emphatic consonants (S, D, T, Z, H)
+                - Use capital vowels (I, U, A) for diacritics/short vowels
+                - Use 'an', 'un', 'in' for tanween (double diacritics)
                 - Combinations like 'th', 'kh' are processed before single letters
                 - Use apostrophe (') for the letter ع (ayn)
                 - Use 'x' for hamza ء when standalone
+                - Use ~ for shadda (gemination) and ^ for sukun (no vowel)
                 """)
         with gr.Column():
     with gr.Row():
         convert_btn = gr.Button("🔄 Transliterate", variant="primary")
         tts_btn = gr.Button("🔊 Speak Arabic", variant="secondary")
         combined_btn = gr.Button("🔄🔊 Transliterate & Speak", variant="secondary")
     tts_audio = gr.Audio(label="Audio Output", type="filepath")
     # Event handlers
     convert_btn.click(
         fn=transliterate,
     )
     tts_btn.click(
+        fn=arabic_tts,
         inputs=arabic_output,
         outputs=tts_audio
     )
         inputs=latin_input,
         outputs=[arabic_output, tts_audio]
     )
 if __name__ == "__main__":
     demo.launch()