ASR-for-MG-dialects

Sleeping

App Files Files Community

sbompolas committed on Dec 19, 2025

Commit

2b8223d

verified ·

1 Parent(s): 2bfc660

Update app.py

Browse files

Files changed (1) hide show

app.py +34 -44

app.py CHANGED Viewed

@@ -139,48 +139,23 @@ class MultiASRApp:
     # ------------------------
     # Transcription
     # ------------------------
-    def transcribe(self, audio, model_name, return_timestamps):
         if audio is None:
-            return "Ανέβασε ένα ηχητικό αρχείο.", "", ""
         start = time.time()
         if not self.load_model(model_name):
-            return "Σφάλμα φόρτωσης μοντέλου.", "", ""
-        if self.current_kind == "ctc":
-            result = self.pipe(audio)
-            text = result.get("text", "")
-            timestamps = (
-                "Οι χρονικές σημάνσεις δεν υποστηρίζονται για αυτό το μοντέλο."
-                if return_timestamps
-                else ""
-            )
-        else:
-            result = self.pipe(
-                audio,
-                return_timestamps=return_timestamps,
-            )
-            text = result.get("text", "")
-            timestamps = self.format_timestamps(result.get("chunks", []))
-        details = (
             f"Μοντέλο: {model_name}\n"
             f"Χρόνος επεξεργασίας: {time.time() - start:.2f} δευτ."
         )
-        return text.strip(), timestamps, details
-    def format_timestamps(self, chunks):
-        if not chunks:
-            return ""
-        out = ""
-        for c in chunks:
-            ts = c.get("timestamp")
-            if ts and ts[0] is not None and ts[1] is not None:
-                out += f"[{ts[0]:.1f}–{ts[1]:.1f}] {c.get('text','')}\n"
-        return out
     def status(self):
         if not self.current_model:
@@ -193,8 +168,8 @@ class MultiASRApp:
 # ------------------------
 app = MultiASRApp()
-def run(audio, model, timestamps):
-    return app.transcribe(audio, model, timestamps)
 def status():
     return app.status()
@@ -214,11 +189,18 @@ with gr.Blocks(title="Ίντα λαλείς;", theme=gr.themes.Soft()) as demo:
 """
     )
-    model_status = gr.Textbox(label="Κατάσταση μοντέλου", value=status(), interactive=False)
     with gr.Row():
         with gr.Column():
-            audio = gr.Audio(label="🎵 Ανέβασε ηχητικό αρχείο", type="filepath")
             model = gr.Dropdown(
                 choices=app.available_models,
@@ -226,19 +208,27 @@ with gr.Blocks(title="Ίντα λαλείς;", theme=gr.themes.Soft()) as demo:
                 label="Μοντέλο αναγνώρισης ομιλίας",
             )
-            timestamps = gr.Checkbox(label="Χρονικές σημάνσεις", value=True)
-            btn = gr.Button("🗣️ Μετατροπή ομιλίας σε κείμενο", variant="primary")
         with gr.Column():
-            text_out = gr.Textbox(label="📄 Κείμενο", lines=8, show_copy_button=True)
-            ts_out = gr.Textbox(label="Χρονικές σημάνσεις", lines=8)
-            info_out = gr.Textbox(label="Πληροφορίες", lines=4)
     btn.click(
         run,
-        inputs=[audio, model, timestamps],
-        outputs=[text_out, ts_out, info_out],
     )
     model.change(lambda _: status(), outputs=model_status)

     # ------------------------
     # Transcription
     # ------------------------
+    def transcribe(self, audio, model_name):
         if audio is None:
+            return "Ανέβασε ένα ηχητικό αρχείο.", ""
         start = time.time()
         if not self.load_model(model_name):
+            return "Σφάλμα φόρτωσης μοντέλου.", ""
+        result = self.pipe(audio)
+        text = result.get("text", "")
+        info = (
             f"Μοντέλο: {model_name}\n"
             f"Χρόνος επεξεργασίας: {time.time() - start:.2f} δευτ."
         )
+        return text.strip(), info
     def status(self):
         if not self.current_model:
 # ------------------------
 app = MultiASRApp()
+def run(audio, model):
+    return app.transcribe(audio, model)
 def status():
     return app.status()
 """
     )
+    model_status = gr.Textbox(
+        label="Κατάσταση μοντέλου",
+        value=status(),
+        interactive=False,
+    )
     with gr.Row():
         with gr.Column():
+            audio = gr.Audio(
+                label="🎵 Ανέβασε ηχητικό αρχείο",
+                type="filepath",
+            )
             model = gr.Dropdown(
                 choices=app.available_models,
                 label="Μοντέλο αναγνώρισης ομιλίας",
             )
+            btn = gr.Button(
+                "🗣️ Μετατροπή ομιλίας σε κείμενο",
+                variant="primary",
+            )
         with gr.Column():
+            text_out = gr.Textbox(
+                label="📄 Κείμενο",
+                lines=8,
+                show_copy_button=True,
+            )
+            info_out = gr.Textbox(
+                label="Πληροφορίες",
+                lines=4,
+            )
     btn.click(
         run,
+        inputs=[audio, model],
+        outputs=[text_out, info_out],
     )
     model.change(lambda _: status(), outputs=model_status)