Spaces:

PlayerBPlaytime
/

dolbyshi

Running

App Files Files Community

PlayerBPlaytime committed on Apr 24

Commit

cbcfe40

verified ·

1 Parent(s): c1408ce

Create app.py

Browse files

Files changed (1) hide show

app.py +218 -0

app.py ADDED Viewed

	@@ -0,0 +1,218 @@

+import gradio as gr
+import numpy as np
+import soundfile as sf
+import os
+import tempfile
+import zipfile
+from pathlib import Path
+# Speaker labels this tool assigns per channel count, in file channel order.
+# Built once at import time instead of on every lookup.
+_CHANNEL_MAPS = {
+    2: ("Left", "Right"),
+    6: ("Left", "Right", "Center", "LFE", "Left Surround", "Right Surround"),
+    8: ("Left", "Right", "Center", "LFE", "Left Surround", "Right Surround",
+        "Left Back", "Right Back"),
+    10: ("Left", "Right", "Center", "LFE", "Left Surround", "Right Surround",
+         "Left Back", "Right Back", "Left Height", "Right Height"),
+    12: ("Left", "Right", "Center", "LFE", "Left Surround", "Right Surround",
+         "Left Back", "Right Back", "Left Height Front", "Right Height Front",
+         "Left Height Rear", "Right Height Rear"),
+    14: ("Left", "Right", "Center", "LFE", "Left Surround", "Right Surround",
+         "Left Back", "Right Back", "Left Height Front", "Right Height Front",
+         "Left Height Rear", "Right Height Rear", "Top Front", "Top Rear"),
+    16: ("Left", "Right", "Center", "LFE", "Left Surround", "Right Surround",
+         "Left Back", "Right Back", "Left Wide", "Right Wide",
+         "Left Height Front", "Right Height Front", "Left Height Rear",
+         "Right Height Rear", "Top Front", "Top Rear"),
+}
+def get_channel_name(index, total_channels):
+    """Return a human-readable label for one channel of a layout.
+
+    Args:
+        index: Zero-based position of the channel within the file.
+        total_channels: Number of channels in the file; selects the layout.
+
+    Returns:
+        The speaker label when ``total_channels`` is a known layout and
+        ``index`` falls inside it, otherwise the generic one-based name
+        ``"Channel_<index + 1>"``.
+    """
+    names = _CHANNEL_MAPS.get(total_channels, ())
+    # Bounds-check explicitly: an out-of-range index must not raise, and a
+    # negative one must not silently wrap around to the end of the layout.
+    if 0 <= index < len(names):
+        return names[index]
+    return f"Channel_{index + 1}"
+def extract_stems(audio_file, output_format):
+    """Split a multichannel audio file into one file per channel, zipped.
+
+    Every channel is peak-normalized on its own to 0.95 of full scale, so
+    the relative levels between channels are not preserved in the stems.
+
+    Args:
+        audio_file: Path of the audio file to split, or None when nothing
+            was provided.
+        output_format: File extension used for each stem (for example
+            "wav", "flac" or "ogg").
+
+    Returns:
+        A ``(zip_path, message)`` tuple. ``zip_path`` is the path of the ZIP
+        holding all stems, or None when no file was given or processing
+        failed. ``message`` is a Markdown report on success and an error
+        description otherwise.
+    """
+    if audio_file is None:
+        return None, "❌ Por favor, sube un archivo de audio"
+    try:
+        # always_2d yields a (frames, channels) array even for mono input,
+        # so no manual reshape is needed.
+        audio_data, sample_rate = sf.read(audio_file, always_2d=True)
+        num_channels = audio_data.shape[1]
+        duration = len(audio_data) / sample_rate
+        source = Path(audio_file)
+        file_name = source.stem
+        info_text = f"""
+## 📊 Información del archivo
+- **Nombre:** {source.name}
+- **Canales detectados:** {num_channels}
+- **Sample Rate:** {sample_rate} Hz
+- **Duración:** {duration:.2f} segundos
+- **Formato de salida:** {output_format.upper()}
+## 🎚️ Canales extraídos:
+"""
+        zip_filename = f"{file_name}_stems.zip"
+        # The individual stems are only needed until they are zipped, so they
+        # live in a directory that is removed when the block exits.
+        with tempfile.TemporaryDirectory() as stems_dir:
+            stem_files = []
+            for i in range(num_channels):
+                channel_name = get_channel_name(i, num_channels)
+                channel_data = audio_data[:, i]
+                # Peak-normalize; skip empty or all-zero channels to avoid a
+                # reduction over nothing or a division by zero.
+                max_val = np.max(np.abs(channel_data)) if channel_data.size else 0
+                if max_val > 0:
+                    channel_data = channel_data / max_val * 0.95
+                stem_filename = f"{file_name}_{channel_name.replace(' ', '_')}.{output_format}"
+                stem_path = os.path.join(stems_dir, stem_filename)
+                sf.write(stem_path, channel_data, sample_rate)
+                stem_files.append(stem_path)
+                info_text += f"- ✅ **{channel_name}** → `{stem_filename}`\n"
+            # The ZIP is returned to the caller, so it goes into its own
+            # directory that outlives this function.
+            zip_path = os.path.join(tempfile.mkdtemp(), zip_filename)
+            with zipfile.ZipFile(zip_path, 'w', zipfile.ZIP_DEFLATED) as zipf:
+                for stem_file in stem_files:
+                    zipf.write(stem_file, os.path.basename(stem_file))
+        info_text += f"\n## 📦 Descarga\n\nTodos los stems empaquetados en: `{zip_filename}`"
+        return zip_path, info_text
+    except Exception as e:
+        # UI boundary: report any failure as a message instead of raising.
+        return None, f"❌ Error procesando el archivo: {str(e)}"
+def create_demo_file():
+    """Write a short six-channel test WAV and return its path.
+
+    The file holds 3 seconds at 48 kHz with a different sine tone on each
+    channel. It is written into a fresh temporary directory that is left
+    on disk so the caller can use the returned path.
+
+    Returns:
+        Path of the generated ``demo_5.1_surround.wav`` file.
+    """
+    sample_rate = 48000
+    duration = 3  # seconds
+    # endpoint=False keeps the sample spacing at exactly 1 / sample_rate;
+    # including the endpoint stretches it to duration / (N - 1) and detunes
+    # every tone slightly.
+    t = np.linspace(0, duration, int(sample_rate * duration), endpoint=False)
+    # (frequency in Hz, amplitude) for each of the six channels, in order.
+    tones = [
+        (440, 0.5),   # Left - A
+        (554, 0.5),   # Right - C#
+        (330, 0.5),   # Center - E
+        (60, 0.8),    # LFE - low tone
+        (392, 0.4),   # Left Surround - G
+        (494, 0.4),   # Right Surround - B
+    ]
+    # One column per channel: shape (frames, 6).
+    audio_data = np.column_stack(
+        [np.sin(2 * np.pi * freq * t) * amp for freq, amp in tones]
+    )
+    demo_path = os.path.join(tempfile.mkdtemp(), "demo_5.1_surround.wav")
+    sf.write(demo_path, audio_data, sample_rate)
+    return demo_path
+# Gradio interface
+# Page copy and theme are named up front so the layout below reads as
+# structure only.
+_APP_THEME = gr.themes.Soft(primary_hue="purple", secondary_hue="blue")
+_INTRO_MARKDOWN = """
+    # 🎵 Dolby Atmos Stem Extractor
+    Extrae todos los canales/stems de archivos de audio **Dolby Atmos** o **Surround**.
+    ### 🎯 Formatos soportados:
+    - **Entrada:** WAV, FLAC, AIFF, OGG (multicanal)
+    - **Configuraciones:** Stereo, 5.1, 7.1, 7.1.4, 9.1.6, y más
+    ### 📝 Instrucciones:
+    1. Sube tu archivo de audio multicanal
+    2. Selecciona el formato de salida
+    3. ¡Descarga tus stems!
+    """
+_TIPS_MARKDOWN = """
+    ---
+    ### 💡 Tips:
+    - Los archivos **Dolby Atmos** típicamente tienen 12-16 canales
+    - El formato **5.1 Surround** tiene 6 canales
+    - El formato **7.1 Surround** tiene 8 canales
+    - Los canales de **altura** (Height) son característicos de Atmos
+    """
+with gr.Blocks(title="🎵 Dolby Atmos Stem Extractor", theme=_APP_THEME) as demo:
+    gr.Markdown(_INTRO_MARKDOWN)
+    with gr.Row():
+        # Left column: upload, output format and action buttons.
+        with gr.Column(scale=1):
+            audio_input = gr.File(
+                label="📁 Sube tu archivo de audio",
+                file_types=[".wav", ".flac", ".aiff", ".ogg", ".mp3", ".m4a"],
+                type="filepath",
+            )
+            output_format = gr.Radio(
+                choices=["wav", "flac", "ogg"],
+                value="wav",
+                label="🎚️ Formato de salida",
+            )
+            extract_btn = gr.Button("🚀 Extraer Stems", variant="primary", size="lg")
+            demo_btn = gr.Button("🎹 Generar archivo demo 5.1", variant="secondary")
+        # Right column: the downloadable ZIP and the Markdown report.
+        with gr.Column(scale=1):
+            output_file = gr.File(label="📦 Descargar Stems (ZIP)")
+            info_output = gr.Markdown(
+                label="📊 Información",
+                value="*Sube un archivo para comenzar...*",
+            )
+    # Tips shown below the two columns.
+    gr.Markdown(_TIPS_MARKDOWN)
+    # Events
+    # Extract: (file, format) -> (zip, report).
+    extract_btn.click(
+        fn=extract_stems,
+        inputs=[audio_input, output_format],
+        outputs=[output_file, info_output],
+    )
+    # Demo: the generated file path is fed back into the upload widget.
+    demo_btn.click(
+        fn=create_demo_file,
+        inputs=[],
+        outputs=[audio_input],
+    )
+# Launch only when run as a script.
+if __name__ == "__main__":
+    demo.launch()