Spaces:

cdactvm
/

demoASR

Sleeping

App Files Files Community

cdactvm committed on Jul 2, 2024

Commit

ee6e935

verified ·

1 Parent(s): d4e2ce0

Update app.py

Browse files

Files changed (1) hide show

app.py +46 -2

app.py CHANGED Viewed

@@ -16,6 +16,8 @@ pipe = pipeline(task="automatic-speech-recognition", model="cdactvm/w2v-bert-2.0
 p1 = pipeline(task="automatic-speech-recognition", model="cdactvm/w2v-bert-2.0-odia_v1")
 p2 = pipeline(task="automatic-speech-recognition", model="cdactvm/w2v-bert-2.0-hindi_v1")
 os.system('git clone https://github.com/irshadbhat/indic-trans.git')
 os.system('pip install ./indic-trans/.')
@@ -35,7 +37,16 @@ def transcribe_hindi(speech):
     if text is None:
         return "Error: ASR returned None"
     return text
 def transcribe_odiya_eng(speech):
     trn = Transliterator(source='ori', target='eng', build_lookup=True)
     text = p1(speech)["text"]
@@ -60,6 +71,31 @@ def transcribe_hin_eng(speech):
     processed_sentence = process_doubles(replaced_words)
     return process_transcription(processed_sentence)
 def process_transcription(input_sentence):
     word_to_code_map = {}
     code_to_word_map = {}
@@ -92,6 +128,14 @@ def sel_lng(lng, mic=None, file=None):
         return transcribe_hin_eng(audio)
     elif lng == "Hindi":
         return transcribe_hindi(audio)
 # Function to replace incorrectly spelled words
 def replace_words(sentence):
@@ -316,7 +360,7 @@ demo=gr.Interface(
     inputs=[
-        gr.Dropdown(["Hindi","Hindi-trans","Odiya","Odiya-trans"],value="Hindi",label="Select Language"),
         gr.Audio(sources=["microphone","upload"], type="filepath"),
         #gr.Audio(sources="upload", type="filepath"),
         #"state"

 p1 = pipeline(task="automatic-speech-recognition", model="cdactvm/w2v-bert-2.0-odia_v1")
 p2 = pipeline(task="automatic-speech-recognition", model="cdactvm/w2v-bert-2.0-hindi_v1")
+p3 = pipeline(task="automatic-speech-recognition", model="cdactvm/kannada_w2v-bert_model")
+p4 = pipeline(task="automatic-speech-recognition", model="cdactvm/telugu_w2v-bert_model")
 os.system('git clone https://github.com/irshadbhat/indic-trans.git')
 os.system('pip install ./indic-trans/.')
     if text is None:
         return "Error: ASR returned None"
     return text
+def transcribe_kannada(speech):  # Run the Kannada ASR pipeline on `speech` and return the recognized text.
+    text = p3(speech)["text"]  # p3 is the pipeline loaded from "cdactvm/kannada_w2v-bert_model"; presumably `speech` is an audio file path (gr.Audio uses type="filepath") - confirm against caller
+    if text is None:
+        return "Error: ASR returned None"  # failure is reported as a plain string rather than raised
+    return text
+def transcribe_telugu(speech):  # Run the Telugu ASR pipeline on `speech` and return the recognized text.
+    text = p4(speech)["text"]  # p4 is the pipeline loaded from "cdactvm/telugu_w2v-bert_model"; presumably `speech` is an audio file path (gr.Audio uses type="filepath") - confirm against caller
+    if text is None:
+        return "Error: ASR returned None"  # failure is reported as a plain string rather than raised
+    return text
 def transcribe_odiya_eng(speech):
     trn = Transliterator(source='ori', target='eng', build_lookup=True)
     text = p1(speech)["text"]
     processed_sentence = process_doubles(replaced_words)
     return process_transcription(processed_sentence)
+def transcribe_kan_eng(speech):  # Kannada ASR, then 'kan' -> 'eng' transliteration, then the shared post-processing chain.
+    trn = Transliterator(source='kan', target='eng', build_lookup=True)  # NOTE(review): a new Transliterator is built on every call - consider constructing it once at module level
+    text = p3(speech)["text"]  # p3 is the Kannada ASR pipeline
+    if text is None:
+        return "Error: ASR returned None"  # errors are returned as strings, not raised
+    sentence = trn.transform(text)  # transliterate the ASR output with the 'kan' -> 'eng' Transliterator
+    if sentence is None:
+        return "Error: Transliteration returned None"
+    replaced_words = replace_words(sentence)  # replace_words: "Function to replace incorrectly spelled words" (per its comment in this file)
+    processed_sentence = process_doubles(replaced_words)  # process_doubles is defined elsewhere in app.py; its behavior is not visible here
+    return process_transcription(processed_sentence)  # final result is whatever process_transcription returns
+def transcribe_tel_eng(speech):  # Telugu ASR, then 'tel' -> 'eng' transliteration, then the shared post-processing chain.
+    trn = Transliterator(source='tel', target='eng', build_lookup=True)  # NOTE(review): a new Transliterator is built on every call - consider constructing it once at module level
+    text = p4(speech)["text"]  # p4 is the Telugu ASR pipeline
+    if text is None:
+        return "Error: ASR returned None"  # errors are returned as strings, not raised
+    sentence = trn.transform(text)  # transliterate the ASR output with the 'tel' -> 'eng' Transliterator
+    if sentence is None:
+        return "Error: Transliteration returned None"
+    replaced_words = replace_words(sentence)  # replace_words: "Function to replace incorrectly spelled words" (per its comment in this file)
+    processed_sentence = process_doubles(replaced_words)  # process_doubles is defined elsewhere in app.py; its behavior is not visible here
+    return process_transcription(processed_sentence)  # final result is whatever process_transcription returns
 def process_transcription(input_sentence):
     word_to_code_map = {}
     code_to_word_map = {}
         return transcribe_hin_eng(audio)
     elif lng == "Hindi":
         return transcribe_hindi(audio)
+    elif lng == "Kannada-trans":
+       return transcribe_kan_eng(audio)
+    elif lng == "Kannada":
+       return transcribe_kannada(audio)
+    elif lng == "Telugu-trans":
+       return transcribe_tel_eng(audio)
+    elif lng == "Telugu":
+       return transcribe_telugu(audio)
 # Function to replace incorrectly spelled words
 def replace_words(sentence):
     inputs=[
+        gr.Dropdown(["Hindi","Hindi-trans","Odiya","Odiya-trans","Kannada","Kannada-trans","Telugu","Telugu-trans"],value="Hindi",label="Select Language"),
         gr.Audio(sources=["microphone","upload"], type="filepath"),
         #gr.Audio(sources="upload", type="filepath"),
         #"state"