Spaces:

Sanchayt
/

AutoDub

Runtime error

App Files Files Community

Sanchayt committed on Jul 27, 2023

Commit

7abe680

1 Parent(s): f86362b

working

Browse files

Files changed (2) hide show

.gitignore +1 -0
app.py +35 -22

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ env

app.py CHANGED Viewed

@@ -12,20 +12,19 @@ from moviepy.video.io.ffmpeg_tools import ffmpeg_extract_subclip
 import os
 from elevenlabs import set_api_key
-set_api_key("6d5e981fbb2643b06459981da55c4ae7")
 def shorten_audio(filename):
-    cut_filename = "AutoDub/dub/cut_audio.mp4"
     audio = AudioSegment.from_file(filename)
-    cut_audio = audio[:60 * 1000]
     cut_audio.export(cut_filename, format="mp4")
     return cut_filename
 def generate_translation(original_text, destination_language):
-    anthropic = Anthropic(
-        api_key="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")
     prompt = (
         f"{HUMAN_PROMPT} Please translate this video transcript into {destination_language}. You will get "
@@ -47,18 +46,14 @@ def generate_translation(original_text, destination_language):
 def generate_dubs(text):
-    filename = "AutoDub/dub/output.mp3"
-    set_api_key(st.secrets['xi_api_key'])
-    audio = generate(
-        text=text,
-        voice="Sanchay",
-        model='eleven_multilingual_v1'
-    )
     audio_io = io.BytesIO(audio)
-    insert_audio = AudioSegment.from_file(audio_io, format='mp3')
     insert_audio.export(filename, format="mp3")
     return filename
@@ -67,10 +62,21 @@ def generate_dubs(text):
 def combine_video(video_filename, audio_filename):
     ffmpeg_extract_subclip(video_filename, 0, 60, targetname="cut_video.mp4")
-    output_filename = "AutoDub/dub/output.mp4"
-    command = ["ffmpeg", "-y", "-i", "cut_video.mp4", "-i", audio_filename, "-c:v", "copy", "-c:a", "aac",
-               output_filename]
     subprocess.run(command)
@@ -81,7 +87,10 @@ st.title("AutoDubs 📺🎵")
 link = st.text_input("Link to Youtube Video", key="link")
-language = st.selectbox("Translate to", ("French", "German", "Hindi", "Italian", "Polish", "Portuguese", "Spanish"))
 if st.button("Transcribe!"):
     print(f"downloading from link: {link}")
@@ -105,11 +114,13 @@ if st.button("Transcribe!"):
             print(transcription)
             if transcription:
-                df = pd.DataFrame(transcription['segments'], columns=['start', 'end', 'text'])
                 st.dataframe(df)
-                print(transcription['text'])
                 dubbing_caption = st.caption("Dubbing...")
-                translation = generate_translation(transcription['text'], language)
                 dubbing_caption = st.caption("Begin dubbing...")
                 dubs_audio = generate_dubs(translation)
                 dubbing_caption.caption("Dubs generated! combining with the video...")
@@ -118,7 +129,9 @@ if st.button("Transcribe!"):
                 video_filename = video_streams.first().download()
                 if video_filename:
-                    dubbing_caption.caption("Video downloaded! combining the video and the dubs...")
                     output_filename = combine_video(video_filename, dubs_audio)
                     if os.path.exists(output_filename):

 import os
 from elevenlabs import set_api_key
+set_api_key(st.secrets["xi_api_key"])
 def shorten_audio(filename):
+    cut_filename = "cut_audio.mp4"
     audio = AudioSegment.from_file(filename)
+    cut_audio = audio[: 60 * 1000]
     cut_audio.export(cut_filename, format="mp4")
     return cut_filename
 def generate_translation(original_text, destination_language):
+    anthropic = Anthropic(api_key=st.secrets["anthropic"])
     prompt = (
         f"{HUMAN_PROMPT} Please translate this video transcript into {destination_language}. You will get "
 def generate_dubs(text):
+    filename = "output.mp3"
+    set_api_key(st.secrets["xi_api_key"])
+    audio = generate(text=text, voice="Sanchay", model="eleven_multilingual_v1")
     audio_io = io.BytesIO(audio)
+    insert_audio = AudioSegment.from_file(audio_io, format="mp3")
     insert_audio.export(filename, format="mp3")
     return filename
 def combine_video(video_filename, audio_filename):
     ffmpeg_extract_subclip(video_filename, 0, 60, targetname="cut_video.mp4")
+    output_filename = "output.mp4"
+    command = [
+        "ffmpeg",
+        "-y",
+        "-i",
+        "cut_video.mp4",
+        "-i",
+        audio_filename,
+        "-c:v",
+        "copy",
+        "-c:a",
+        "aac",
+        output_filename,
+    ]
     subprocess.run(command)
 link = st.text_input("Link to Youtube Video", key="link")
+language = st.selectbox(
+    "Translate to",
+    ("French", "German", "Hindi", "Italian", "Polish", "Portuguese", "Spanish"),
+)
 if st.button("Transcribe!"):
     print(f"downloading from link: {link}")
             print(transcription)
             if transcription:
+                df = pd.DataFrame(
+                    transcription["segments"], columns=["start", "end", "text"]
+                )
                 st.dataframe(df)
+                print(transcription["text"])
                 dubbing_caption = st.caption("Dubbing...")
+                translation = generate_translation(transcription["text"], language)
                 dubbing_caption = st.caption("Begin dubbing...")
                 dubs_audio = generate_dubs(translation)
                 dubbing_caption.caption("Dubs generated! combining with the video...")
                 video_filename = video_streams.first().download()
                 if video_filename:
+                    dubbing_caption.caption(
+                        "Video downloaded! combining the video and the dubs..."
+                    )
                     output_filename = combine_video(video_filename, dubs_audio)
                     if os.path.exists(output_filename):