Spaces:

vyluong
/

PoC_ASR_v6_dev

Sleeping

App Files Files Community

vyluong committed on May 19

Commit

d975a12

verified ·

1 Parent(s): 03282ea

Update app/services/denoiser.py

Browse files

Files changed (1) hide show

app/services/denoiser.py +50 -19

app/services/denoiser.py CHANGED Viewed

@@ -5,7 +5,11 @@ import logging
 import torch
 import torchaudio
-from df.enhance import enhance, init_df
 from app.core.config import get_settings
@@ -17,6 +21,8 @@ class DenoiserService:
     _model = None
     _df_state = None
     @classmethod
     def _load_model(cls):
@@ -24,64 +30,89 @@ class DenoiserService:
         if cls._model is not None:
             return
         logger.info("Loading DeepFilterNet...")
         model, df_state, _ = init_df()
         cls._model = model
         cls._df_state = df_state
-        logger.info("DeepFilterNet READY")
     @classmethod
-    async def enhance_audio(
-        cls,
-        input_path: Path
-    ) -> Path:
         if not settings.enable_denoiser:
             return input_path
-        loop = asyncio.get_event_loop()
         return await loop.run_in_executor(
             None,
             lambda: cls._run_enhancement(input_path)
         )
     @classmethod
-    def _run_enhancement(
-        cls,
-        input_path: Path
-    ) -> Path:
         try:
             cls._load_model()
             audio, sr = torchaudio.load(str(input_path))
-            enhanced = enhance(
-                cls._model,
-                cls._df_state,
-                audio
-            )
             output_path = (
                 settings.processed_dir /
                 f"{input_path.stem}_enhanced.wav"
             )
             torchaudio.save(
                 str(output_path),
-                enhanced.cpu(),
                 sr
             )
             return output_path
         except Exception as e:
-            logger.exception(e)
             return input_path

 import torch
 import torchaudio
+try:
+    from df.enhance import enhance, init_df
+    DF_AVAILABLE = True
+except Exception:
+    DF_AVAILABLE = False
 from app.core.config import get_settings
     _model = None
     _df_state = None
+    _device = None
     @classmethod
     def _load_model(cls):
         if cls._model is not None:
             return
+        if not DF_AVAILABLE:
+            raise ImportError("DeepFilterNet is not available")
         logger.info("Loading DeepFilterNet...")
         model, df_state, _ = init_df()
+        cls._device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+        model = model.to(cls._device)
+        model.eval()
         cls._model = model
         cls._df_state = df_state
+        logger.info(f"DeepFilterNet READY on {cls._device}")
     @classmethod
+    async def enhance_audio(cls, input_path: Path) -> Path:
         if not settings.enable_denoiser:
             return input_path
+        loop = asyncio.get_running_loop()
         return await loop.run_in_executor(
             None,
             lambda: cls._run_enhancement(input_path)
         )
     @classmethod
+    def _run_enhancement(cls, input_path: Path) -> Path:
         try:
             cls._load_model()
+            # ----------------------------
+            # LOAD AUDIO
+            # ----------------------------
             audio, sr = torchaudio.load(str(input_path))
+            # mono conversion
+            if audio.shape[0] > 1:
+                audio = torch.mean(audio, dim=0, keepdim=True)
+            audio = audio.float()
+            # move to device
+            audio = audio.to(cls._device)
+            with torch.no_grad():
+                enhanced = enhance(
+                    cls._model,
+                    cls._df_state,
+                    audio
+                )
             output_path = (
                 settings.processed_dir /
                 f"{input_path.stem}_enhanced.wav"
             )
+            output_path.parent.mkdir(parents=True, exist_ok=True)
+            # move back CPU before save
+            enhanced = enhanced.cpu()
             torchaudio.save(
                 str(output_path),
+                enhanced,
                 sr
             )
+            logger.info(f"Denoised audio saved: {output_path}")
             return output_path
         except Exception as e:
+            logger.exception("DeepFilterNet enhancement failed")
+            # fallback = original file
             return input_path