Spaces:

lifesee
/

VoiceoverStudio

Sleeping

App Files Files Community

lifesee committed on Aug 24, 2025

Commit

8593d59

verified ·

1 Parent(s): ab32289

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -46

app.py CHANGED Viewed

@@ -1,5 +1,5 @@
 import gradio as gr
-import io, os, re, uuid, zipfile, tempfile, subprocess
 from pydub import AudioSegment
 from pydub.silence import split_on_silence
@@ -43,7 +43,6 @@ def _atempo_chain(factor: float) -> str:
     return ",".join([f"atempo={s:.5f}" for s in steps])
 def fit_to_seconds(seg: AudioSegment, target_s: float, fmt_out="mp3") -> io.BytesIO:
-    """Pitch-preserving time stretch via FFmpeg atempo."""
     with tempfile.TemporaryDirectory() as d:
         inp = os.path.join(d, "in.wav")
         outp = os.path.join(d, f"out.{fmt_out}")
@@ -64,27 +63,6 @@ def normalize_lufs(seg: AudioSegment, target_lufs=-14.0):
     gain_db = float(target_lufs) - current_db
     return seg.apply_gain(gain_db)
-def sanitize_filename(name: str, default_stem="output"):
-    name = (name or "").strip()
-    # allow letters, digits, spaces, dashes, underscores; collapse spaces to underscores
-    safe = re.sub(r"[^A-Za-z0-9 _.-]", "", name)
-    safe = re.sub(r"\s+", "_", safe)
-    return safe or default_stem
-def write_temp_file_with_name(blob: io.BytesIO, stem: str, ext: str) -> str:
-    stem = sanitize_filename(stem)
-    ext = ext.lower().strip(".")
-    tf = tempfile.NamedTemporaryFile(delete=False, prefix=f"{stem}_", suffix=f".{ext}")
-    tf.write(blob.getvalue())
-    tf.flush(); tf.close()
-    # Rename to exact requested stem if possible (NamedTemporaryFile adds random chars in prefix)
-    exact_path = os.path.join(os.path.dirname(tf.name), f"{stem}.{ext}")
-    try:
-        os.replace(tf.name, exact_path)
-        return exact_path
-    except Exception:
-        return tf.name  # fallback
 # ---------- processors ----------
 def process_single(file, mode, target_seconds, keep_silence_s,
                    min_silence_ms, silence_thresh_db, do_normalize, fmt):
@@ -131,45 +109,42 @@ def write_temp_for_preview(blob: io.BytesIO, fmt: str) -> str:
     tf.flush(); tf.close()
     return tf.name
-# ---------- UI (minimal + custom filename) ----------
 css = """
-.gradio-container { max-width: 880px !important; margin: auto !important; }
 """
 with gr.Blocks(title="AI Voice Studio – Simple", css=css) as demo:
-    gr.Markdown("## AI Voice Studio\nSet pause length. Optionally **Trim** or **Fit** to exact time. Export MP3/WAV/M4A/OGG.\n\n**Tip:** Set a custom file name below for your download.")
     with gr.Row():
-        with gr.Column():
             files = gr.Files(label="Upload audio", file_types=["audio"], type="filepath")
-            mode = gr.Radio(["none", "trim", "fit"], value="none", label="Timing mode")
             target = gr.Number(value=30, label="Target seconds (used for trim/fit)")
             keep = gr.Number(value=0.25, label="Set pause length (seconds)")
-            # NEW: custom filename stem (no extension)
-            out_name = gr.Textbox(value="voiceover", label="Output filename (no extension)")
-            with gr.Accordion("Advanced (optional)", open=False):
-                min_sil = gr.Slider(50, 1000, 120, step=10, label="Count a pause if silence ≥ (ms)")
                 thresh = gr.Slider(-80, -10, -45, step=1, label="Silence threshold (dBFS)")
                 do_norm = gr.Checkbox(True, label="Normalize loudness (~-14 LUFS)")
             fmt = gr.Dropdown(["mp3","wav","m4a","ogg"], value="mp3", label="Output format")
             go = gr.Button("Process", variant="primary")
-        with gr.Column():
             preview = gr.Audio(label="Preview (first file)", type="filepath", interactive=False)
             direct = gr.File(label="Download processed file (single)")
             zip_out = gr.File(label="Download ZIP (if multiple)")
             rep = gr.Textbox(label="Report", lines=1)
-    def run(files, mode, target, keep, min_sil, thresh, do_norm, out_name, fmt):
         files = files or []
         if not files:
             return None, None, None, "Please upload at least one audio file."
-        # process first file
         single_blob, report = process_single(
             open(files[0], "rb"),
             mode=mode, target_seconds=target, keep_silence_s=keep,
@@ -179,25 +154,19 @@ with gr.Blocks(title="AI Voice Studio – Simple", css=css) as demo:
         preview_path = write_temp_for_preview(single_blob, fmt)
         if len(files) == 1:
-            # return a file path with the requested name + extension
-            stem = sanitize_filename(out_name, default_stem="output")
-            out_path = write_temp_file_with_name(single_blob, stem, fmt)
-            return preview_path, out_path, None, report
         else:
-            # multi → zip (named after chosen stem)
             opened = [open(p, "rb") for p in files]
             zipped = process_batch(
                 opened, mode=mode, target_seconds=target, keep_silence_s=keep,
                 min_silence_ms=min_sil, silence_thresh_db=thresh,
                 do_normalize=do_norm, fmt=fmt
             )
-            zip_stem = sanitize_filename(out_name, default_stem="batch_output")
-            zip_path = write_temp_file_with_name(zipped, f"{zip_stem}_batch", "zip")
-            return preview_path, None, zip_path, report
     go.click(
         run,
-        [files, mode, target, keep, min_sil, thresh, do_norm, out_name, fmt],
         [preview, direct, zip_out, rep]
     )

 import gradio as gr
+import io, os, uuid, zipfile, tempfile, subprocess
 from pydub import AudioSegment
 from pydub.silence import split_on_silence
     return ",".join([f"atempo={s:.5f}" for s in steps])
 def fit_to_seconds(seg: AudioSegment, target_s: float, fmt_out="mp3") -> io.BytesIO:
     with tempfile.TemporaryDirectory() as d:
         inp = os.path.join(d, "in.wav")
         outp = os.path.join(d, f"out.{fmt_out}")
     gain_db = float(target_lufs) - current_db
     return seg.apply_gain(gain_db)
 # ---------- processors ----------
 def process_single(file, mode, target_seconds, keep_silence_s,
                    min_silence_ms, silence_thresh_db, do_normalize, fmt):
     tf.flush(); tf.close()
     return tf.name
+# ---------- UI (two-column, compact) ----------
 css = """
+.gradio-container { max-width: 1100px !important; margin: auto !important; }
 """
 with gr.Blocks(title="AI Voice Studio – Simple", css=css) as demo:
+    gr.Markdown("## AI Voice Studio\nSet pause length. Optionally **Trim** or **Fit** to exact time. Export MP3/WAV/M4A/OGG.")
     with gr.Row():
+        # Left column: controls
+        with gr.Column(scale=1):
             files = gr.Files(label="Upload audio", file_types=["audio"], type="filepath")
+            mode = gr.Radio(["none", "trim", "fit"], value="none", label="Timing mode", elem_id="mode")
             target = gr.Number(value=30, label="Target seconds (used for trim/fit)")
             keep = gr.Number(value=0.25, label="Set pause length (seconds)")
+            with gr.Accordion("Advanced options", open=False):
+                min_sil = gr.Slider(50, 1000, 120, step=10, label="Pause if silence ≥ (ms)")
                 thresh = gr.Slider(-80, -10, -45, step=1, label="Silence threshold (dBFS)")
                 do_norm = gr.Checkbox(True, label="Normalize loudness (~-14 LUFS)")
             fmt = gr.Dropdown(["mp3","wav","m4a","ogg"], value="mp3", label="Output format")
             go = gr.Button("Process", variant="primary")
+        # Right column: outputs
+        with gr.Column(scale=1):
             preview = gr.Audio(label="Preview (first file)", type="filepath", interactive=False)
             direct = gr.File(label="Download processed file (single)")
             zip_out = gr.File(label="Download ZIP (if multiple)")
             rep = gr.Textbox(label="Report", lines=1)
+    def run(files, mode, target, keep, min_sil, thresh, do_norm, fmt):
         files = files or []
         if not files:
             return None, None, None, "Please upload at least one audio file."
         single_blob, report = process_single(
             open(files[0], "rb"),
             mode=mode, target_seconds=target, keep_silence_s=keep,
         preview_path = write_temp_for_preview(single_blob, fmt)
         if len(files) == 1:
+            return preview_path, single_blob, None, report
         else:
             opened = [open(p, "rb") for p in files]
             zipped = process_batch(
                 opened, mode=mode, target_seconds=target, keep_silence_s=keep,
                 min_silence_ms=min_sil, silence_thresh_db=thresh,
                 do_normalize=do_norm, fmt=fmt
             )
+            return preview_path, None, zipped, report
     go.click(
         run,
+        [files, mode, target, keep, min_sil, thresh, do_norm, fmt],
         [preview, direct, zip_out, rep]
     )