Spaces:

Layer7
/

Simple-KWS

Sleeping

App Files Community

IvanLayer7 committed on Oct 18, 2025

Commit

e25c059

verified ·

1 Parent(s): 664bdbb

Upload app.py

Browse files

Files changed (1) hide show

app.py +9 -26

app.py CHANGED Viewed

@@ -181,7 +181,7 @@ def create_gradio_interface():
     """Create and configure the Gradio interface for Hugging Face."""
     # Initialize the app with default model
-    app = KeywordSpottingApp(model_size="base")
     def classify_audio(audio_input, audio_file, keywords, model_size, access_token):
         """Wrapper function for Gradio interface."""
@@ -231,7 +231,7 @@ def create_gradio_interface():
         5. **Click "Analyze Audio"** to get results
         ### 💡 Example Keywords:
-        `hola, gracias, adiós, sí, no, por favor`
         """)
         with gr.Row():
@@ -247,17 +247,18 @@ def create_gradio_interface():
                 gr.Markdown("### 🤖 Model Selection")
                 model_selector = gr.Dropdown(
                     choices=["tiny", "base", "small", "medium"],
-                    value="base",
                     label="Whisper Model",
                     info="tiny=fastest, base=balanced, small=better accuracy, medium=best accuracy"
                 )
                 gr.Markdown("### 🔤 Keywords")
-                gr.Markdown("*Example: hola, gracias, adiós*")
                 keywords_input = gr.Textbox(
                     label="Keywords (comma-separated)",
-                    placeholder="hola, gracias, adiós, sí, no",
-                    lines=2
                 )
                 gr.Markdown("### 🎵 Audio Input")
@@ -301,7 +302,7 @@ def create_gradio_interface():
                 model_status_output = gr.Textbox(
                     label="Model Status",
-                    value="Current model: base",
                     interactive=False,
                     elem_classes=["status-box"]
                 )
@@ -317,30 +318,12 @@ def create_gradio_interface():
         gr.Markdown("""
         ## 💡 Usage Examples:
-        **Suggested Spanish keywords:**
-        - Greetings: `hola, buenos días, buenas tardes, adiós`
-        - Courtesy: `gracias, por favor, disculpe, perdón`
-        - Responses: `sí, no, tal vez, claro`
-        - Numbers: `uno, dos, tres, cuatro, cinco`
-        - Colors: `rojo, azul, verde, amarillo`
         **Tips:**
         - Use clear audio without background noise
         - Speak at normal speed
         - Keywords can appear anywhere in the audio
         - Works best with common Spanish words
-        ## 🔧 Technical Details:
-        - **Model**: OpenAI Whisper (speech transcription)
-        - **Languages**: Optimized for Spanish, works with others
-        - **Processing**: Up to 30 seconds, 48kHz sampling rate
-        - **Approach**: Transcription + text matching
-        ## 🤖 Model Comparison:
-        - **tiny**: Fastest, basic accuracy (72MB)
-        - **base**: Balanced speed/accuracy (139MB)
-        - **small**: Better accuracy, slower (461MB)
-        - **medium**: Best accuracy, slowest (1.46GB)
         """)
     return interface

     """Create and configure the Gradio interface for Hugging Face."""
     # Initialize the app with default model
+    app = KeywordSpottingApp(model_size="tiny")
     def classify_audio(audio_input, audio_file, keywords, model_size, access_token):
         """Wrapper function for Gradio interface."""
         5. **Click "Analyze Audio"** to get results
         ### 💡 Example Keywords:
+        `Sí, Claro, No, Nunca, Quizás, Tal vez, Por supuesto, En absoluto`
         """)
         with gr.Row():
                 gr.Markdown("### 🤖 Model Selection")
                 model_selector = gr.Dropdown(
                     choices=["tiny", "base", "small", "medium"],
+                    value="tiny",
                     label="Whisper Model",
                     info="tiny=fastest, base=balanced, small=better accuracy, medium=best accuracy"
                 )
                 gr.Markdown("### 🔤 Keywords")
+                gr.Markdown("*Example: Sí, No, Quizás, Claro, Nunca*")
                 keywords_input = gr.Textbox(
                     label="Keywords (comma-separated)",
+                    placeholder="Si,Claro,Por supuesto,Exacto,De acuerdo,Seguro,Cierto,Sin duda,Así es,Correcto,No,Nunca,Jamás,De ninguna,En absoluto,Para nada,Negativo,Falso,Ni hablar,Imposible,Quizás,Tal vez,Puede ser,No sé,A lo mejor,Es posible,Dudo mucho,Quién sabe,Probablemente,No estoy seguro",
+                    value="Si,Claro,Por supuesto,Exacto,De acuerdo,Seguro,Cierto,Sin duda,Así es,Correcto,No,Nunca,Jamás,De ninguna,En absoluto,Para nada,Negativo,Falso,Ni hablar,Imposible,Quizás,Tal vez,Puede ser,No sé,A lo mejor,Es posible,Dudo mucho,Quién sabe,Probablemente,No estoy seguro",
+                    lines=3
                 )
                 gr.Markdown("### 🎵 Audio Input")
                 model_status_output = gr.Textbox(
                     label="Model Status",
+                    value="Current model: tiny",
                     interactive=False,
                     elem_classes=["status-box"]
                 )
         gr.Markdown("""
         ## 💡 Usage Examples:
         **Tips:**
         - Use clear audio without background noise
         - Speak at normal speed
         - Keywords can appear anywhere in the audio
         - Works best with common Spanish words
         """)
     return interface