Transcript2Word / app.py
Rajor78's picture
Update app.py
88bf030 verified
raw
history blame
940 Bytes
import gradio as gr
import subprocess
import os
import librosa
from transformers import WhisperProcessor, WhisperForConditionalGeneration
from gingerit.gingerit import GingerIt
from pydub import AudioSegment
from docx import Document
# Function to extract the audio track from a video
def extract_audio(video_path, audio_path):
    """Extract the audio track of a video into a WAV-style PCM file via ffmpeg.

    The audio is resampled to 16 kHz (``-ar 16000``), downmixed to a single
    channel (``-ac 1``) and encoded as signed 16-bit little-endian PCM
    (``-c:a pcm_s16le``). An existing file at ``audio_path`` is overwritten
    (``-y``).

    Args:
        video_path: Path of the input media file handed to ffmpeg.
        audio_path: Path where ffmpeg writes the extracted audio.

    Returns:
        ``audio_path``, unchanged, for convenient chaining.

    Raises:
        subprocess.CalledProcessError: If ffmpeg exits with a non-zero status.
        FileNotFoundError: If the ``ffmpeg`` executable is not on ``PATH``.
    """
    # Pass the arguments as a list (no shell) so that paths containing
    # quotes, spaces or shell metacharacters are handed to ffmpeg verbatim
    # and can never be interpreted as shell syntax.
    command = [
        "ffmpeg",
        "-y",  # global option: overwrite the output without prompting
        "-i", video_path,
        "-ar", "16000",
        "-ac", "1",
        "-c:a", "pcm_s16le",
        audio_path,
    ]
    subprocess.run(command, check=True)
    return audio_path
# Function to transcribe the audio using Whisper
def transcribe_audio(audio_path):
# Cargar el procesador y modelo de Whisper
processor = WhisperProcessor.from_pretrained("openai/whisper-base")
model = WhisperForConditionalGeneration.from_pretrained("openai/whisper-base")
# Cargar el archivo de audio usando librosa
audio_input, _ = librosa.load(audio_path, sr=16000)
# Preprocesar el audio para el modelo
inputs =