Voice_Assistant_Demo

Runtime error

App Files Community

wanchichen committed on Jan 20

Commit

30a6fae

verified ·

1 Parent(s): f056593

Update app.py

Browse files

Files changed (1) hide show

app.py +5 -264

app.py CHANGED Viewed

@@ -1,10 +1,3 @@
-try:
-    import versa
-except ImportError:
-    from subprocess import call
-    with open('versa.sh', 'rb') as file:
-        script = file.read()
-    rc = call(script, shell=True)
 import os
 import shutil
@@ -16,27 +9,7 @@ import nltk
 import numpy as np
 import torch
 from huggingface_hub import HfApi
-from pyscripts.utils.dialog_eval.ASR_WER import handle_espnet_ASR_WER
-from pyscripts.utils.dialog_eval.human_feedback import (
-    natural_vote1_last_response,
-    natural_vote2_last_response,
-    natural_vote3_last_response,
-    natural_vote4_last_response,
-    relevant_vote1_last_response,
-    relevant_vote2_last_response,
-    relevant_vote3_last_response,
-    relevant_vote4_last_response,
-)
-from pyscripts.utils.dialog_eval.LLM_Metrics import (
-    DialoGPT_perplexity,
-    bert_score,
-    perplexity,
-    vert,
-)
-from pyscripts.utils.dialog_eval.TTS_intelligibility import (
-    handle_espnet_TTS_intelligibility,
-)
-from pyscripts.utils.dialog_eval.TTS_speech_quality import TTS_psuedomos
 from espnet2.sds.espnet_model import ESPnetSDSModelInterface
@@ -153,34 +126,7 @@ def handle_eval_selection(
     """
     global LLM_response_arr
     global total_response_arr
-    yield (option, gr.Textbox(visible=True))
-    if option == "Latency":
-        text = (
-            f"ASR Latency: {latency_ASR:.2f}\n"
-            f"LLM Latency: {latency_LM:.2f}\n"
-            f"TTS Latency: {latency_TTS:.2f}"
-        )
-        yield (None, text)
-    elif option == "TTS Intelligibility":
-        yield (None, handle_espnet_TTS_intelligibility(TTS_audio_output, LLM_Output))
-    elif option == "TTS Speech Quality":
-        yield (None, TTS_psuedomos(TTS_audio_output))
-    elif option == "ASR WER":
-        yield (None, handle_espnet_ASR_WER(ASR_audio_output, ASR_transcript))
-    elif option == "Text Dialog Metrics":
-        yield (
-            None,
-            perplexity(LLM_Output.replace("\n", " "))
-            + vert(LLM_response_arr)
-            + bert_score(total_response_arr)
-            + DialoGPT_perplexity(
-                ASR_transcript.replace("\n", " "), LLM_Output.replace("\n", " ")
-            ),
-        )
-    elif option is None:
-        return
-    else:
-        raise ValueError(f"Unknown option: {option}")
 def handle_eval_selection_E2E(
@@ -244,20 +190,7 @@ def handle_eval_selection_E2E(
     """
     global LLM_response_arr
     global total_response_arr
-    yield (option, gr.Textbox(visible=True))
-    if option == "Latency":
-        text = f"Total Latency: {latency_TTS:.2f}"
-        yield (None, text)
-    elif option == "TTS Intelligibility":
-        yield (None, handle_espnet_TTS_intelligibility(TTS_audio_output, LLM_Output))
-    elif option == "TTS Speech Quality":
-        yield (None, TTS_psuedomos(TTS_audio_output))
-    elif option == "Text Dialog Metrics":
-        yield (None, perplexity(LLM_Output.replace("\n", " ")) + vert(LLM_response_arr))
-    elif option is None:
-        return
-    else:
-        raise ValueError(f"Unknown option: {option}")
 def start_warmup():
@@ -789,198 +722,6 @@ with gr.Blocks(
         None,
         preprocess=False,
     )
-    natural_btn1.click(
-        natural_vote1_last_response,
-        [],
-        [natural_response, ip_address] + natural_btn_list,
-    ).then(
-        lambda *args: callback.flag(list(args)),
-        [
-            user_audio,
-            output_asr_text,
-            output_text,
-            output_audio,
-            output_audio1,
-            type_radio,
-            ASR_radio,
-            LLM_radio,
-            radio,
-            E2Eradio,
-            natural_response,
-            diversity_response,
-            ip_address,
-        ],
-        None,
-        preprocess=False,
-    )
-    natural_btn2.click(
-        natural_vote2_last_response,
-        [],
-        [natural_response, ip_address] + natural_btn_list,
-    ).then(
-        lambda *args: callback.flag(list(args)),
-        [
-            user_audio,
-            output_asr_text,
-            output_text,
-            output_audio,
-            output_audio1,
-            type_radio,
-            ASR_radio,
-            LLM_radio,
-            radio,
-            E2Eradio,
-            natural_response,
-            diversity_response,
-            ip_address,
-        ],
-        None,
-        preprocess=False,
-    )
-    natural_btn3.click(
-        natural_vote3_last_response,
-        [],
-        [natural_response, ip_address] + natural_btn_list,
-    ).then(
-        lambda *args: callback.flag(list(args)),
-        [
-            user_audio,
-            output_asr_text,
-            output_text,
-            output_audio,
-            output_audio1,
-            type_radio,
-            ASR_radio,
-            LLM_radio,
-            radio,
-            E2Eradio,
-            natural_response,
-            diversity_response,
-            ip_address,
-        ],
-        None,
-        preprocess=False,
-    )
-    natural_btn4.click(
-        natural_vote4_last_response,
-        [],
-        [natural_response, ip_address] + natural_btn_list,
-    ).then(
-        lambda *args: callback.flag(list(args)),
-        [
-            user_audio,
-            output_asr_text,
-            output_text,
-            output_audio,
-            output_audio1,
-            type_radio,
-            ASR_radio,
-            LLM_radio,
-            radio,
-            E2Eradio,
-            natural_response,
-            diversity_response,
-            ip_address,
-        ],
-        None,
-        preprocess=False,
-    )
-    relevant_btn1.click(
-        relevant_vote1_last_response,
-        [],
-        [diversity_response, ip_address] + relevant_btn_list,
-    ).then(
-        lambda *args: callback.flag(list(args)),
-        [
-            user_audio,
-            output_asr_text,
-            output_text,
-            output_audio,
-            output_audio1,
-            type_radio,
-            ASR_radio,
-            LLM_radio,
-            radio,
-            E2Eradio,
-            natural_response,
-            diversity_response,
-            ip_address,
-        ],
-        None,
-        preprocess=False,
-    )
-    relevant_btn2.click(
-        relevant_vote2_last_response,
-        [],
-        [diversity_response, ip_address] + relevant_btn_list,
-    ).then(
-        lambda *args: callback.flag(list(args)),
-        [
-            user_audio,
-            output_asr_text,
-            output_text,
-            output_audio,
-            output_audio1,
-            type_radio,
-            ASR_radio,
-            LLM_radio,
-            radio,
-            E2Eradio,
-            natural_response,
-            diversity_response,
-            ip_address,
-        ],
-        None,
-        preprocess=False,
-    )
-    relevant_btn3.click(
-        relevant_vote3_last_response,
-        [],
-        [diversity_response, ip_address] + relevant_btn_list,
-    ).then(
-        lambda *args: callback.flag(list(args)),
-        [
-            user_audio,
-            output_asr_text,
-            output_text,
-            output_audio,
-            output_audio1,
-            type_radio,
-            ASR_radio,
-            LLM_radio,
-            radio,
-            E2Eradio,
-            natural_response,
-            diversity_response,
-            ip_address,
-        ],
-        None,
-        preprocess=False,
-    )
-    relevant_btn4.click(
-        relevant_vote4_last_response,
-        [],
-        [diversity_response, ip_address] + relevant_btn_list,
-    ).then(
-        lambda *args: callback.flag(list(args)),
-        [
-            user_audio,
-            output_asr_text,
-            output_text,
-            output_audio,
-            output_audio1,
-            type_radio,
-            ASR_radio,
-            LLM_radio,
-            radio,
-            E2Eradio,
-            natural_response,
-            diversity_response,
-            ip_address,
-        ],
-        None,
-        preprocess=False,
-    )
 demo.queue(max_size=10, default_concurrency_limit=1)
-demo.launch(share=True)

 import os
 import shutil
 import numpy as np
 import torch
 from huggingface_hub import HfApi
 from espnet2.sds.espnet_model import ESPnetSDSModelInterface
     """
     global LLM_response_arr
     global total_response_arr
+    return None
 def handle_eval_selection_E2E(
     """
     global LLM_response_arr
     global total_response_arr
+    return
 def start_warmup():
         None,
         preprocess=False,
     )
 demo.queue(max_size=10, default_concurrency_limit=1)
+demo.launch(share=True)