Spaces:

Layer7
/

audio2phoneme

Sleeping

IvanLayer7 committed on Dec 31, 2025

Commit

a7fcc90

verified ·

1 Parent(s): d889cea

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -16,9 +16,9 @@ model = None
 # Load access code from HuggingFace Secrets or environment variable
 # In HuggingFace Spaces, add a secret named "ACCESS_CODE" with value "sensei"
-ACCESS_CODE = os.environ.get("ACCESS_CODE", "sensei")
-def load_model():
     """Load the Wav2Vec2 phoneme model and processor."""
     global processor, model
@@ -159,11 +159,11 @@ with gr.Blocks(title="Phoneme Transcription App", theme=gr.themes.Soft()) as dem
     with gr.Column(visible=False) as main_app:
         gr.Markdown(
             """
-            # 🎙️ Phoneme Transcription with Wav2Vec2
             Upload or record audio to get phoneme transcription in IPA (International Phonetic Alphabet) format.
-            **Model:** `facebook/wav2vec2-lv-60-espeak-cv-ft` (Multilingual - supports Spanish, English, and more)
             """
         )
@@ -182,7 +182,7 @@ with gr.Blocks(title="Phoneme Transcription App", theme=gr.themes.Soft()) as dem
                     ### 💡 Tips:
                     - Supports WAV, MP3, OGG, and other audio formats
                     - Audio will be automatically resampled to 16kHz
-                    - Works best with clear speech
                     - Supports multiple languages including Spanish
                     """
                 )

 # Load access code from HuggingFace Secrets or environment variable
 # In HuggingFace Spaces, add a secret named "ACCESS_CODE" with value "sensei"
+ACCESS_CODE = os.environ.get("ACCESS_CODE")
+def load_model():
     """Load the Wav2Vec2 phoneme model and processor."""
     global processor, model
     with gr.Column(visible=False) as main_app:
         gr.Markdown(
             """
+            # Keywords Spotting (KWS)
+            ## 🎙️ Phoneme Transcription with Wav2Vec2
             Upload or record audio to get phoneme transcription in IPA (International Phonetic Alphabet) format.
+            The first use could be slower than subsequent uses.
             """
         )
                     ### 💡 Tips:
                     - Supports WAV, MP3, OGG, and other audio formats
                     - Audio will be automatically resampled to 16kHz
+                    - Works best with clear speech (ideally)
                     - Supports multiple languages including Spanish
                     """
                 )