| import streamlit as st | |
| from audio_recorder_streamlit import audio_recorder | |
| from transformers import pipeline | |
| pipe = pipeline("automatic-speech-recognition", model="Bidwill/whisper-medium-sanskrit-try-2") | |
| recorded_audio = audio_recorder() | |
| if recorded_audio: | |
| audio_file = "audio.mp3" | |
| with open(audio_file,"wb") as f: | |
| f.write(recorded_audio) | |
| if recorded_audio: | |
| out = pipe(audio_file) | |
| st.json(out) | |
| transcribed_text = out['text'] | |
| messages = [ | |
| {"role": "user", "content": transcribed_text}, | |
| ] | |
| pipe2 = pipeline("text-generation", model="thtskaran/sanskritayam-gpt") | |
| out2 = pipe2(messages) | |
| st.write(out2) | |