Spaces:

Clearwave48
/

clearwave-api

Running

App Files Community

Clearwave48 committed 7 days ago

Commit

d0c4c17

verified ·

1 Parent(s): a960e11

Update denoiser.py

Browse files

Files changed (1) hide show

denoiser.py +16 -15

denoiser.py CHANGED Viewed

@@ -174,7 +174,7 @@ class Denoiser:
         # then convert to MP3 via ffmpeg (already in the Dockerfile).
         tmp_wav  = os.path.join(out_dir, "denoised_tmp.wav")
         out_path = os.path.join(out_dir, out_name)
-        sf.write(tmp_wav, out_audio, sr, subtype="PCM_24")
         result = subprocess.run([
             "ffmpeg", "-y", "-i", tmp_wav,
@@ -324,24 +324,25 @@ class Denoiser:
         except Exception as e:
             logger.warning(f"[Denoiser] DeepFilterNet unavailable ({e})")
-        # ── Fallback: Two-pass noisereduce (voice-preserving) ─────────────
-        # prop_decrease kept LOW on both passes to avoid speech artifacts.
         try:
             import noisereduce as nr
-            pass1 = nr.reduce_noise(
                 y=audio, sr=sr,
                 stationary=True,
-                prop_decrease=0.65,
-            ).astype(np.float32)
-            pass2 = nr.reduce_noise(
-                y=pass1, sr=sr,
-                stationary=False,
-                prop_decrease=0.30,       # very gentle — voice stays natural
-                freq_mask_smooth_hz=400,
-                time_mask_smooth_ms=80,
             ).astype(np.float32)
-            print("[Denoiser] ✅ Two-pass noisereduce done (voice-preserving)")
-            return pass2, "noisereduce_2pass"
         except Exception as e:
             logger.warning(f"noisereduce failed: {e}")
@@ -710,7 +711,7 @@ class Denoiser:
             logger.warning(f"ffmpeg non-zero exit: {stderr[-400:]}")
             # Fallback: soundfile passthrough
             data, sr = sf.read(src, always_2d=True)
-            sf.write(dst, data, sr, subtype="PCM_24")
     def _resample(self, audio: np.ndarray, orig_sr: int, target_sr: int) -> np.ndarray:
         if orig_sr == target_sr:

         # then convert to MP3 via ffmpeg (already in the Dockerfile).
         tmp_wav  = os.path.join(out_dir, "denoised_tmp.wav")
         out_path = os.path.join(out_dir, out_name)
+        sf.write(tmp_wav, out_audio, sr, format="WAV", subtype="PCM_24")
         result = subprocess.run([
             "ffmpeg", "-y", "-i", tmp_wav,
         except Exception as e:
             logger.warning(f"[Denoiser] DeepFilterNet unavailable ({e})")
+        # ── Fallback: Single-pass noisereduce, stationary only ────────────
+        # PHILOSOPHY: do as little as possible to the signal.
+        # - stationary=True  → only targets steady/consistent noise (fan,
+        #                       hum, AC, room hiss). Leaves transient
+        #                       speech harmonics completely untouched.
+        # - prop_decrease=0.5 → reduces noise by ~50%, not 100%.
+        #                       Keeps a thin noise floor so the voice
+        #                       never sounds "hollow" or over-processed.
+        # - No second pass, no non-stationary processing — those modes
+        #   touch voice frequencies and cause the robotic effect.
         try:
             import noisereduce as nr
+            cleaned = nr.reduce_noise(
                 y=audio, sr=sr,
                 stationary=True,
+                prop_decrease=0.50,
             ).astype(np.float32)
+            print("[Denoiser] ✅ noisereduce done (voice-preserving, stationary only)")
+            return cleaned, "noisereduce_stationary"
         except Exception as e:
             logger.warning(f"noisereduce failed: {e}")
             logger.warning(f"ffmpeg non-zero exit: {stderr[-400:]}")
             # Fallback: soundfile passthrough
             data, sr = sf.read(src, always_2d=True)
+            sf.write(dst, data, sr, format="WAV", subtype="PCM_24")
     def _resample(self, audio: np.ndarray, orig_sr: int, target_sr: int) -> np.ndarray:
         if orig_sr == target_sr: