Spaces:
Runtime error
Runtime error
debug
Browse files
app.py
CHANGED
|
@@ -6,6 +6,7 @@ from datasets import Dataset, Audio
|
|
| 6 |
from moviepy.editor import AudioFileClip
|
| 7 |
|
| 8 |
pipe = pipeline(model="Neprox/model")
|
|
|
|
| 9 |
|
| 10 |
def download_from_youtube(url):
|
| 11 |
streams = YouTube(url).streams.filter(only_audio=True, file_extension='mp4')
|
|
@@ -20,6 +21,10 @@ def divide_into_30s_segments(audio_fpath):
|
|
| 20 |
n_full_segments = int(sound.duration / 30)
|
| 21 |
len_last_segment = sound.duration % 30
|
| 22 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 23 |
segment_paths = []
|
| 24 |
segment_start_times = []
|
| 25 |
|
|
@@ -51,6 +56,7 @@ def transcribe(audio, url):
|
|
| 51 |
|
| 52 |
audio_dataset = Dataset.from_dict({"audio": segment_paths}).cast_column("audio", Audio())
|
| 53 |
print(audio_dataset)
|
|
|
|
| 54 |
text = pipe(audio_dataset)
|
| 55 |
print(type(text))
|
| 56 |
print(text)
|
|
|
|
| 6 |
from moviepy.editor import AudioFileClip
|
| 7 |
|
| 8 |
pipe = pipeline(model="Neprox/model")
|
| 9 |
+
MAX_SEGMENTS = 10 # 5 minutes
|
| 10 |
|
| 11 |
def download_from_youtube(url):
|
| 12 |
streams = YouTube(url).streams.filter(only_audio=True, file_extension='mp4')
|
|
|
|
| 21 |
n_full_segments = int(sound.duration / 30)
|
| 22 |
len_last_segment = sound.duration % 30
|
| 23 |
|
| 24 |
+
if n_full_segments > MAX_SEGMENTS:
|
| 25 |
+
n_full_segments = MAX_SEGMENTS
|
| 26 |
+
len_last_segment = 0
|
| 27 |
+
|
| 28 |
segment_paths = []
|
| 29 |
segment_start_times = []
|
| 30 |
|
|
|
|
| 56 |
|
| 57 |
audio_dataset = Dataset.from_dict({"audio": segment_paths}).cast_column("audio", Audio())
|
| 58 |
print(audio_dataset)
|
| 59 |
+
print(audio_dataset[0])
|
| 60 |
text = pipe(audio_dataset)
|
| 61 |
print(type(text))
|
| 62 |
print(text)
|