demo-app / app.py
iSaahil's picture
Update app.py
1cb3650 verified
raw
history blame
685 Bytes
import streamlit as st
from audio_recorder_streamlit import audio_recorder
from transformers import pipeline
pipe = pipeline("automatic-speech-recognition", model="Bidwill/whisper-medium-sanskrit-try-2")
recorded_audio = audio_recorder()
if recorded_audio:
audio_file = "audio.mp3"
with open(audio_file,"wb") as f:
f.write(recorded_audio)
if recorded_audio:
out = pipe(audio_file)
st.json(out)
transcribed_text = out['text']
messages = [
{"role": "user", "content": transcribed_text},
]
pipe2 = pipeline("text-generation", model="thtskaran/sanskritayam-gpt")
out2 = pipe2(messages)
st.write(out2)