Spaces:

nimool
/

gbn_test

Sleeping

App Files Community

nimool committed on Oct 4, 2023

Commit

f9d356e

1 Parent(s): ac48dca

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -10

app.py CHANGED Viewed

@@ -6,6 +6,7 @@ import sox
 import subprocess
 from fuzzywuzzy import fuzz
 def read_file_and_process(wav_file):
     filename = wav_file.split('.')[0]
     filename_16k = filename + "16k.wav"
@@ -36,29 +37,28 @@ def parse(wav_file):
         logits = model(**input_values).logits
     return parse_transcription(logits)
 model_id = "jonatasgrosman/wav2vec2-large-xlsr-53-persian"
 processor = Wav2Vec2Processor.from_pretrained(model_id)
 model = Wav2Vec2ForCTC.from_pretrained(model_id)
-input_ = gr.Audio(source="microphone", type="filepath")
 txtbox = gr.Textbox(
-            label="persian text output:",
             lines=5,
-            placeholder="متن نوشتاری گفتار شما",
-            show_label=True,
-            container=True,
             text_align="right",
             show_copy_button=True,
         )
 title = "Speech-to-Text (persian)"
-description = "Upload a prsian audio, and let AI do the hard work of transcribing."
 article = "<p style='text-align: center'><a href='https://github.com/nimaprgrmr'>Large-Scale Self- and Semi-Supervised Learning for Speech Translation</a></p>"
 demo = gr.Interface(fn=parse, inputs = input_,  outputs=txtbox, title=title, description=description, article = article,
              streaming=True, interactive=True,
              analytics_enabled=False, show_tips=False, enable_queue=True)

 import subprocess
 from fuzzywuzzy import fuzz
 def read_file_and_process(wav_file):
     filename = wav_file.split('.')[0]
     filename_16k = filename + "16k.wav"
         logits = model(**input_values).logits
     return parse_transcription(logits)
 model_id = "jonatasgrosman/wav2vec2-large-xlsr-53-persian"
 processor = Wav2Vec2Processor.from_pretrained(model_id)
 model = Wav2Vec2ForCTC.from_pretrained(model_id)
+input_ = gr.Audio(source="microphone",
+                  type="filepath",
+                  label="لطفا دکمه ضبط صدا را بزنید و شروع به صحبت کنید و بعذ از اتمام صحبت دوباره دکمه ضبط را فشار دهید.",
+                  show_download_button=True,
+                  show_edit_button=True,
+                 )
 txtbox = gr.Textbox(
+            label="متن گفتار شما: ",
             lines=5,
             text_align="right",
+            show_label=True,
             show_copy_button=True,
         )
 title = "Speech-to-Text (persian)"
+description = "، توجه داشته باشید که هرچه گفتار شما شمرده تر باشد خروجی با کیفیت تری دارید.روی دکمه ضبط صدا کلیک کنید و سپس دسترسی مرورگر خود را به میکروفون دستگاه بدهید، سپس شروع به صحبت کنید و برای اتمام ضبط دوباره روی دکمه کلیک کنید"
 article = "<p style='text-align: center'><a href='https://github.com/nimaprgrmr'>Large-Scale Self- and Semi-Supervised Learning for Speech Translation</a></p>"
 demo = gr.Interface(fn=parse, inputs = input_,  outputs=txtbox, title=title, description=description, article = article,
              streaming=True, interactive=True,
              analytics_enabled=False, show_tips=False, enable_queue=True)