conette

Sleeping

Labbeti committed on Nov 16, 2023

Commit

f96230b

1 Parent(s): 1348542

Add: beam size, min pred size and max pred size options to the UI.

Files changed (1) hide show

app.py CHANGED Viewed

@@ -15,6 +15,25 @@ def load_conette(*args, **kwargs) -> CoNeTTEModel:
 def main() -> None:
     st.header("CoNeTTE model test")
     audios = st.file_uploader(
         "Upload an audio file",
         type=["wav", "flac", "mp3", "ogg", "avi"],
@@ -22,13 +41,17 @@ def main() -> None:
     )
     if audios is not None and len(audios) > 0:
-        model = load_conette(model_kwds=dict(device="cpu"))
         for audio in audios:
             with NamedTemporaryFile() as temp:
                 temp.write(audio.getvalue())
                 fpath = temp.name
-                outputs = model(fpath)
                 cand = outputs["cands"][0]
                 st.write(f"Output for {audio.name}:")

 def main() -> None:
     st.header("CoNeTTE model test")
+    model = load_conette(model_kwds=dict(device="cpu"))
+    task = st.selectbox("Task embedding input", model.tasks, 0)
+    beam_size: int = st.select_slider(  # type: ignore
+        "Beam size",
+        list(range(1, 50)),
+        model.config.beam_size,
+    )
+    min_pred_size: int = st.select_slider(  # type: ignore
+        "Minimal number of words",
+        list(range(1, 50)),
+        model.config.min_pred_size,
+    )
+    max_pred_size: int = st.select_slider(  # type: ignore
+        "Maximal number of words",
+        list(range(1, 50)),
+        model.config.max_pred_size,
+    )
     audios = st.file_uploader(
         "Upload an audio file",
         type=["wav", "flac", "mp3", "ogg", "avi"],
     )
     if audios is not None and len(audios) > 0:
         for audio in audios:
             with NamedTemporaryFile() as temp:
                 temp.write(audio.getvalue())
                 fpath = temp.name
+                outputs = model(
+                    fpath,
+                    task=task,
+                    beam_size=beam_size,
+                    min_pred_size=min_pred_size,
+                    max_pred_size=max_pred_size,
+                )
                 cand = outputs["cands"][0]
                 st.write(f"Output for {audio.name}:")