Abu Naim committed on
Commit
a16931b
·
1 Parent(s): 972de5d

Add application code

Browse files
Files changed (3) hide show
  1. ModelName +1 -0
  2. app.py +34 -0
  3. requirments.txt +5 -0
ModelName ADDED
@@ -0,0 +1 @@
 
 
1
+ model: facebook/wav2vec2-base-960h
app.py ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import warnings
2
+ import torch
3
+ import gradio as gr
4
+ import librosa
5
+ from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
6
+
7
# Silence all warnings raised from this point on.
warnings.filterwarnings("ignore")

# Load the processor and the CTC model once, at import time, from the same
# checkpoint so that every call to the transcription function reuses them.
_CHECKPOINT = "facebook/wav2vec2-base-960h"
processor = Wav2Vec2Processor.from_pretrained(_CHECKPOINT)
model = Wav2Vec2ForCTC.from_pretrained(_CHECKPOINT)
10
+
11
def transcribe_audio(audio_path):
    """Transcribe an audio file to text with the module-level Wav2Vec2 model.

    Args:
        audio_path: Path of the audio file to transcribe, as delivered by the
            Gradio ``Audio`` input configured with ``type='filepath'``.

    Returns:
        The decoded transcription string. If loading or inference raises,
        the exception text is returned instead so the UI displays the error
        rather than crashing. A ``None`` path yields a short notice.
    """
    # The same rate is used to resample on load and to describe the samples
    # to the processor, so the two can never disagree.
    target_rate = 16000

    # Guard against a submission without audio, where no path is supplied.
    if audio_path is None:
        return "No audio file was provided."

    try:
        # librosa.load's keyword for the target rate is `sr`; the previous
        # `sampling_rate=` keyword raised TypeError on every call, which the
        # broad handler below turned into an error string for every request.
        audio, _ = librosa.load(audio_path, sr=target_rate)
        input_values = processor(
            audio, return_tensors='pt', sampling_rate=target_rate
        ).input_values

        # Inference only: gradients are not needed.
        with torch.no_grad():
            logits = model(input_values).logits

        # Pick the highest-scoring token id per frame, then decode the ids.
        predicted_ids = torch.argmax(logits, dim=-1)
        return processor.batch_decode(predicted_ids)[0]
    except Exception as e:
        # Deliberate best-effort: surface the failure text in the text output.
        return str(e)
24
+
25
# Web UI: a single audio input, handed to the callback as a file path, and a
# plain-text output showing whatever transcribe_audio returns.
audio_input = gr.Audio(type='filepath')
demo = gr.Interface(
    fn=transcribe_audio,
    inputs=audio_input,
    outputs='text',
    title="Subtitle Genarator",
    description="This tool transcribes audio file into text",
)

# Start the Gradio server.
demo.launch()
33
+
34
+
requirments.txt ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ torch
2
+ librosa  # audio loading and resampling
3
+ numpy
4
+ transformers
5
+ gradio  # builds the web interface for the AI app