Spaces:

rlackey
/

vynl

Running on Zero

File size: 12,926 Bytes

a3fa32f
 
 
 
 
 
 
 
 
 
 
 
 
892f418
a3fa32f
 
 
892f418
a3fa32f

#!/usr/bin/env python3
"""
VYNL AI Mastering Module
Reference matching + genre presets + loudness normalization
"""

import numpy as np
from pathlib import Path
import tempfile

try:
    import librosa
    import soundfile as sf
    from scipy.ndimage import uniform_filter1d
    HAS_LIBROSA = True
except ImportError:
    HAS_LIBROSA = False
    uniform_filter1d = None

try:
    import pyloudnorm as pyln
    HAS_PYLOUDNORM = True
except ImportError:
    HAS_PYLOUDNORM = False

# ============================================================================
# MASTERING PRESETS
# ============================================================================

PRESETS = {
    'Balanced': {
        'eq_low': 0,
        'eq_mid': 0,
        'eq_high': 0,
        'compression_ratio': 3,
        'compression_threshold': -18,
        'target_lufs': -14,
    },
    'Warm': {
        'eq_low': 2,
        'eq_mid': -1,
        'eq_high': -2,
        'compression_ratio': 2.5,
        'compression_threshold': -16,
        'target_lufs': -14,
    },
    'Bright': {
        'eq_low': -1,
        'eq_mid': 1,
        'eq_high': 3,
        'compression_ratio': 3,
        'compression_threshold': -18,
        'target_lufs': -13,
    },
    'Punchy': {
        'eq_low': 3,
        'eq_mid': 0,
        'eq_high': 1,
        'compression_ratio': 4,
        'compression_threshold': -20,
        'target_lufs': -12,
    },
    'Reference Match': {
        'eq_low': 0,
        'eq_mid': 0,
        'eq_high': 0,
        'compression_ratio': 3,
        'compression_threshold': -18,
        'target_lufs': -14,
    },
}

# ============================================================================
# AUDIO ANALYSIS
# ============================================================================

def analyze_audio(audio_path):
    """Analyze audio file for mastering metrics"""
    if not HAS_LIBROSA:
        return None

    try:
        y, sr = librosa.load(audio_path, sr=44100, mono=False)

        # Handle mono/stereo
        if y.ndim == 1:
            y_mono = y
        else:
            y_mono = librosa.to_mono(y)

        # Peak level
        peak_db = 20 * np.log10(np.max(np.abs(y_mono)) + 1e-10)

        # RMS level
        rms = np.sqrt(np.mean(y_mono**2))
        rms_db = 20 * np.log10(rms + 1e-10)

        # Dynamic range (simplified)
        frame_length = int(sr * 0.1)  # 100ms frames
        hop_length = frame_length // 2

        frames_rms = []
        for i in range(0, len(y_mono) - frame_length, hop_length):
            frame = y_mono[i:i+frame_length]
            frame_rms = np.sqrt(np.mean(frame**2))
            if frame_rms > 0:
                frames_rms.append(20 * np.log10(frame_rms + 1e-10))

        if frames_rms:
            dynamic_range = np.percentile(frames_rms, 95) - np.percentile(frames_rms, 5)
        else:
            dynamic_range = 0

        # LUFS (integrated loudness)
        lufs = -14  # Default
        if HAS_PYLOUDNORM:
            try:
                meter = pyln.Meter(sr)
                lufs = meter.integrated_loudness(y_mono)
            except:
                pass

        # Spectral centroid (brightness)
        spectral_centroid = np.mean(librosa.feature.spectral_centroid(y=y_mono, sr=sr))

        return {
            'peak_db': float(peak_db),
            'rms_db': float(rms_db),
            'lufs': float(lufs) if not np.isinf(lufs) else -24,
            'dynamic_range': float(dynamic_range),
            'spectral_centroid': float(spectral_centroid),
            'duration': float(len(y_mono) / sr),
            'sample_rate': sr,
        }

    except Exception as e:
        return {'error': str(e)}


def analyze_reference(reference_path, target_path):
    """Analyze reference track and compute matching parameters"""
    ref_analysis = analyze_audio(reference_path)
    target_analysis = analyze_audio(target_path)

    if not ref_analysis or not target_analysis:
        return PRESETS['Balanced']

    if 'error' in ref_analysis or 'error' in target_analysis:
        return PRESETS['Balanced']

    # Compute EQ adjustments based on spectral difference
    centroid_diff = ref_analysis['spectral_centroid'] - target_analysis['spectral_centroid']

    # Brightness adjustment
    if centroid_diff > 500:
        eq_high = 2
    elif centroid_diff < -500:
        eq_high = -2
    else:
        eq_high = 0

    # Target LUFS from reference
    target_lufs = ref_analysis['lufs']
    if target_lufs < -20 or target_lufs > -6:
        target_lufs = -14

    return {
        'eq_low': 0,
        'eq_mid': 0,
        'eq_high': eq_high,
        'compression_ratio': 3,
        'compression_threshold': -18,
        'target_lufs': target_lufs,
        'reference_lufs': ref_analysis['lufs'],
        'reference_peak': ref_analysis['peak_db'],
    }


# ============================================================================
# PROCESSING
# ============================================================================

def apply_eq(y, sr, low_db=0, mid_db=0, high_db=0):
    """Apply 3-band EQ"""
    if not HAS_LIBROSA:
        return y

    # Define frequency bands
    low_freq = 200
    high_freq = 4000

    # Get STFT
    D = librosa.stft(y)
    freqs = librosa.fft_frequencies(sr=sr)

    # Create gain masks
    low_mask = freqs < low_freq
    mid_mask = (freqs >= low_freq) & (freqs < high_freq)
    high_mask = freqs >= high_freq

    # Apply gains
    gains = np.ones(len(freqs))
    gains[low_mask] *= 10 ** (low_db / 20)
    gains[mid_mask] *= 10 ** (mid_db / 20)
    gains[high_mask] *= 10 ** (high_db / 20)

    # Apply to STFT
    D_eq = D * gains[:, np.newaxis]

    # Inverse STFT
    y_eq = librosa.istft(D_eq, length=len(y))

    return y_eq


def apply_compression(y, sr, ratio=3, threshold_db=-18, attack_ms=10, release_ms=100):
    """Apply dynamic range compression"""
    if ratio <= 1:
        return y

    # Convert to linear
    threshold = 10 ** (threshold_db / 20)

    # Envelope follower
    attack_samples = int(sr * attack_ms / 1000)
    release_samples = int(sr * release_ms / 1000)

    envelope = np.abs(y)

    # Smooth envelope
    envelope = uniform_filter1d(envelope, size=attack_samples)

    # Compute gain reduction
    gain = np.ones_like(envelope)
    above_thresh = envelope > threshold

    if np.any(above_thresh):
        # Gain reduction for samples above threshold
        gain[above_thresh] = (threshold / envelope[above_thresh]) ** (1 - 1/ratio)

    # Apply gain
    y_compressed = y * gain

    # Makeup gain
    makeup = 1 / np.mean(gain[gain < 1]) if np.any(gain < 1) else 1
    y_compressed *= min(makeup, 2)  # Limit makeup gain

    return y_compressed


def apply_limiter(y, ceiling_db=-0.3):
    """Apply brick-wall limiter"""
    ceiling = 10 ** (ceiling_db / 20)

    # Soft clipping
    y_limited = np.tanh(y / ceiling) * ceiling

    return y_limited


def normalize_loudness(y, sr, target_lufs=-14):
    """Normalize to target LUFS"""
    if not HAS_PYLOUDNORM:
        # Fallback: simple peak normalization
        peak = np.max(np.abs(y))
        if peak > 0:
            target_peak = 10 ** (-1 / 20)  # -1 dB
            y = y * (target_peak / peak)
        return y

    try:
        meter = pyln.Meter(sr)
        current_lufs = meter.integrated_loudness(y)

        if np.isinf(current_lufs) or np.isnan(current_lufs):
            return y

        # Calculate gain needed
        gain_db = target_lufs - current_lufs
        gain = 10 ** (gain_db / 20)

        # Apply gain with limiter
        y_normalized = y * gain
        y_normalized = apply_limiter(y_normalized)

        return y_normalized

    except:
        return y


# ============================================================================
# MAIN MASTERING FUNCTION
# ============================================================================

def master_audio(input_path, output_path=None, preset='Balanced',
                 reference_path=None, target_lufs=None,
                 eq_low=None, eq_mid=None, eq_high=None):
    """
    Master audio file

    Args:
        input_path: Path to input audio
        output_path: Path for output (optional, creates temp file if None)
        preset: Preset name or 'Reference Match'
        reference_path: Path to reference track (for Reference Match)
        target_lufs: Override target LUFS
        eq_low/mid/high: Override EQ settings

    Returns:
        (output_path, analysis_dict)
    """

    if not HAS_LIBROSA:
        return None, {'error': 'librosa not installed'}

    try:
        # Load audio
        y, sr = librosa.load(input_path, sr=44100, mono=True)

        # Get preset settings
        if preset == 'Reference Match' and reference_path:
            settings = analyze_reference(reference_path, input_path)
        else:
            settings = PRESETS.get(preset, PRESETS['Balanced']).copy()

        # Override with manual settings
        if eq_low is not None:
            settings['eq_low'] = eq_low
        if eq_mid is not None:
            settings['eq_mid'] = eq_mid
        if eq_high is not None:
            settings['eq_high'] = eq_high
        if target_lufs is not None:
            settings['target_lufs'] = target_lufs

        # Analyze input
        input_analysis = analyze_audio(input_path)

        # Apply processing chain
        y_processed = y.copy()

        # 1. EQ
        y_processed = apply_eq(
            y_processed, sr,
            low_db=settings['eq_low'],
            mid_db=settings['eq_mid'],
            high_db=settings['eq_high']
        )

        # 2. Compression
        y_processed = apply_compression(
            y_processed, sr,
            ratio=settings['compression_ratio'],
            threshold_db=settings['compression_threshold']
        )

        # 3. Loudness normalization
        y_processed = normalize_loudness(
            y_processed, sr,
            target_lufs=settings['target_lufs']
        )

        # 4. Final limiter
        y_processed = apply_limiter(y_processed, ceiling_db=-0.3)

        # Create output path if needed
        if output_path is None:
            temp_dir = tempfile.mkdtemp()
            output_path = Path(temp_dir) / f"{Path(input_path).stem}_mastered.wav"

        # Save
        sf.write(str(output_path), y_processed, sr)

        # Analyze output
        output_analysis = analyze_audio(str(output_path))

        # Build result
        result = {
            'input': input_analysis,
            'output': output_analysis,
            'settings': settings,
            'preset': preset,
        }

        return str(output_path), result

    except Exception as e:
        return None, {'error': str(e)}


def format_analysis(analysis):
    """Format analysis dict for display"""
    if not analysis:
        return "Analysis unavailable"

    if 'error' in analysis:
        return f"Error: {analysis['error']}"

    lines = []

    if 'input' in analysis:
        inp = analysis['input']
        lines.append("INPUT:")
        lines.append(f"  LUFS: {inp.get('lufs', 'N/A'):.1f}")
        lines.append(f"  Peak: {inp.get('peak_db', 'N/A'):.1f} dB")
        lines.append(f"  Dynamic Range: {inp.get('dynamic_range', 'N/A'):.1f} dB")

    if 'output' in analysis:
        out = analysis['output']
        lines.append("\nOUTPUT:")
        lines.append(f"  LUFS: {out.get('lufs', 'N/A'):.1f}")
        lines.append(f"  Peak: {out.get('peak_db', 'N/A'):.1f} dB")
        lines.append(f"  Dynamic Range: {out.get('dynamic_range', 'N/A'):.1f} dB")

    if 'settings' in analysis:
        settings = analysis['settings']
        lines.append("\nSETTINGS:")
        lines.append(f"  Target LUFS: {settings.get('target_lufs', -14)}")
        lines.append(f"  EQ: Low {settings.get('eq_low', 0):+.0f} / Mid {settings.get('eq_mid', 0):+.0f} / High {settings.get('eq_high', 0):+.0f}")
        lines.append(f"  Compression: {settings.get('compression_ratio', 3)}:1 @ {settings.get('compression_threshold', -18)} dB")

    return "\n".join(lines)


# ============================================================================
# CLI
# ============================================================================

if __name__ == "__main__":
    import sys

    if len(sys.argv) < 2:
        print("Usage: python mastering.py <input.wav> [output.wav] [preset]")
        print("Presets: Balanced, Warm, Bright, Punchy, Reference Match")
        sys.exit(1)

    input_path = sys.argv[1]
    output_path = sys.argv[2] if len(sys.argv) > 2 else None
    preset = sys.argv[3] if len(sys.argv) > 3 else 'Balanced'

    print(f"Mastering: {input_path}")
    print(f"Preset: {preset}")

    out_path, analysis = master_audio(input_path, output_path, preset)

    if out_path:
        print(f"\nOutput: {out_path}")
        print(format_analysis(analysis))
    else:
        print(f"Error: {analysis.get('error', 'Unknown error')}")