Spaces:

prathameshv07
/

Multilingual-Audio-Intelligence-System

Build error

App Files Files Community

Prathamesh Sarjerao Vaidya committed on Sep 5, 2025

Commit

65f46e8

1 Parent(s): 938d58f

made changes

Browse files

Files changed (4) hide show

Dockerfile +9 -6
model_preloader.py +61 -8
requirements.txt +1 -1
startup.py +12 -0

Dockerfile CHANGED Viewed

@@ -64,18 +64,21 @@ ENV PYTHONPATH=/app \
     HUGGINGFACE_HUB_CACHE=/app/model_cache \
     HF_HUB_CACHE=/app/model_cache \
     FONTCONFIG_PATH=/tmp/fontconfig \
-    # Fix for ONNX Runtime in containers (KEY FIX)
     ORT_DYLIB_DEFAULT_OPTIONS=DisableExecutablePageAllocator=1 \
     ONNXRUNTIME_EXECUTION_PROVIDERS=CPUExecutionProvider \
-    # Fix for audio processing libraries
     CTRANSLATE2_FORCE_CPU_ISA=generic \
-    # Disable problematic features
     TF_CPP_MIN_LOG_LEVEL=2 \
     TOKENIZERS_PARALLELISM=false \
-    # Disable problematic optimizations
     OMP_NUM_THREADS=1 \
-    # Suppress tensorboard warnings
-    TF_ENABLE_ONEDNN_OPTS=0
 # Expose port for Hugging Face Spaces
 EXPOSE 7860

     HUGGINGFACE_HUB_CACHE=/app/model_cache \
     HF_HUB_CACHE=/app/model_cache \
     FONTCONFIG_PATH=/tmp/fontconfig \
+    # Critical ONNX Runtime fixes for containers
     ORT_DYLIB_DEFAULT_OPTIONS=DisableExecutablePageAllocator=1 \
     ONNXRUNTIME_EXECUTION_PROVIDERS=CPUExecutionProvider \
+    ORT_DISABLE_TLS_ARENA=1 \
     CTRANSLATE2_FORCE_CPU_ISA=generic \
+    # Threading and memory optimizations
     TF_CPP_MIN_LOG_LEVEL=2 \
     TOKENIZERS_PARALLELISM=false \
     OMP_NUM_THREADS=1 \
+    MKL_NUM_THREADS=1 \
+    NUMBA_NUM_THREADS=1 \
+    TF_ENABLE_ONEDNN_OPTS=0 \
+    # Limit glibc malloc arenas and disable Python output buffering in containers
+    MALLOC_ARENA_MAX=2 \
+    PYTHONUNBUFFERED=1
 # Expose port for Hugging Face Spaces
 EXPOSE 7860

model_preloader.py CHANGED Viewed

@@ -29,6 +29,32 @@ from rich.panel import Panel
 from rich.text import Text
 import psutil
 # Add src directory to path
 sys.path.insert(0, os.path.join(os.path.dirname(__file__), 'src'))
@@ -372,7 +398,7 @@ class ModelPreloader:
             logger.warning(f"Error saving cache for {model_key}: {e}")
     def load_pyannote_pipeline(self, task_id: str) -> Optional[Pipeline]:
-        """Load pyannote speaker diarization pipeline."""
         try:
             console.print(f"[yellow]Loading pyannote.audio pipeline...[/yellow]")
@@ -381,21 +407,48 @@ class ModelPreloader:
             if not hf_token:
                 console.print("[red]Warning: HUGGINGFACE_TOKEN not found. Some models may not be accessible.[/red]")
-            pipeline = Pipeline.from_pretrained(
-                "pyannote/speaker-diarization-3.1",
-                use_auth_token=hf_token
-            )
-            # Test the pipeline
             console.print(f"[green]SUCCESS: pyannote.audio pipeline loaded successfully on {self.device}[/green]")
             return pipeline
         except Exception as e:
             console.print(f"[red]ERROR: Failed to load pyannote.audio pipeline: {e}[/red]")
             logger.error(f"Pyannote loading failed: {e}")
             return None
     def load_whisper_model(self, task_id: str) -> Optional[whisper.Whisper]:
         """Load Whisper speech recognition model with enhanced cache checking."""
         try:

 from rich.text import Text
 import psutil
+# CRITICAL: Configure ONNX Runtime BEFORE any ML library imports
+import os
+os.environ.update({
+    'ORT_DYLIB_DEFAULT_OPTIONS': 'DisableExecutablePageAllocator=1',
+    'ONNXRUNTIME_EXECUTION_PROVIDERS': 'CPUExecutionProvider',
+    'ORT_DISABLE_TLS_ARENA': '1',
+    'OMP_NUM_THREADS': '1',
+    'MKL_NUM_THREADS': '1',
+    'NUMBA_NUM_THREADS': '1',
+    'TF_ENABLE_ONEDNN_OPTS': '0',
+    'TOKENIZERS_PARALLELISM': 'false',
+    'MALLOC_ARENA_MAX': '2'
+})
+# Import ONNX Runtime with error suppression
+try:
+    import warnings
+    warnings.filterwarnings("ignore", category=UserWarning, module="onnxruntime")
+    import onnxruntime as ort
+    # Quiet ONNX Runtime logging (this call does not select an execution provider)
+    ort.set_default_logger_severity(3)  # ERROR level only
+except ImportError:
+    pass
+except Exception as e:
+    print(f"ONNX Runtime warning (expected in containers): {e}")
 # Add src directory to path
 sys.path.insert(0, os.path.join(os.path.dirname(__file__), 'src'))
             logger.warning(f"Error saving cache for {model_key}: {e}")
     def load_pyannote_pipeline(self, task_id: str) -> Optional[Pipeline]:
+        """Load pyannote speaker diarization pipeline with container-safe settings."""
         try:
             console.print(f"[yellow]Loading pyannote.audio pipeline...[/yellow]")
             if not hf_token:
                 console.print("[red]Warning: HUGGINGFACE_TOKEN not found. Some models may not be accessible.[/red]")
+            # Container-safe pipeline loading with error suppression
+            with warnings.catch_warnings():
+                warnings.filterwarnings("ignore", category=UserWarning)
+                warnings.filterwarnings("ignore", message=".*executable stack.*")
+                pipeline = Pipeline.from_pretrained(
+                    "pyannote/speaker-diarization-3.1",
+                    use_auth_token=hf_token,
+                    cache_dir=str(self.cache_dir / "pyannote")
+                )
+                # Force CPU execution
+                if hasattr(pipeline, '_models'):
+                    for model_name, model in pipeline._models.items():
+                        if hasattr(model, 'to'):
+                            model.to('cpu')
             console.print(f"[green]SUCCESS: pyannote.audio pipeline loaded successfully on {self.device}[/green]")
             return pipeline
         except Exception as e:
+            # Check whether the raised exception is the known ONNX Runtime "executable stack" error
+            if "executable stack" in str(e).lower():
+                console.print("[yellow]ONNX Runtime executable stack warning (expected in containers) - continuing...[/yellow]")
+                # Retry the same load once with all warnings ignored
+                try:
+                    import warnings
+                    with warnings.catch_warnings():
+                        warnings.simplefilter("ignore")
+                        pipeline = Pipeline.from_pretrained(
+                            "pyannote/speaker-diarization-3.1",
+                            use_auth_token=hf_token,
+                            cache_dir=str(self.cache_dir / "pyannote")
+                        )
+                        return pipeline
+                except:
+                    pass
             console.print(f"[red]ERROR: Failed to load pyannote.audio pipeline: {e}[/red]")
             logger.error(f"Pyannote loading failed: {e}")
             return None
     def load_whisper_model(self, task_id: str) -> Optional[whisper.Whisper]:
         """Load Whisper speech recognition model with enhanced cache checking."""
         try:

requirements.txt CHANGED Viewed

@@ -4,7 +4,7 @@ torchaudio==2.0.2
 torchvision==0.15.2
 # Keep regular ONNX Runtime with container-safe environment variables
-onnxruntime==1.16.3
 # Audio processing
 pyannote.audio==3.1.1

 torchvision==0.15.2
 # Keep regular ONNX Runtime with container-safe environment variables
+onnxruntime==1.15.1
 # Audio processing
 pyannote.audio==3.1.1

startup.py CHANGED Viewed

@@ -4,11 +4,23 @@ Startup script for Hugging Face Spaces deployment.
 Handles model preloading and graceful fallbacks for containerized environments.
 """
 import os
 import subprocess
 import sys
 import logging
 # Configure logging
 logging.basicConfig(
     level=logging.INFO,

 Handles model preloading and graceful fallbacks for containerized environments.
 """
+# Suppress ONNX Runtime warnings BEFORE any other imports
+import warnings
+warnings.filterwarnings("ignore", message=".*executable stack.*")
+warnings.filterwarnings("ignore", category=UserWarning, module="onnxruntime")
 import os
 import subprocess
 import sys
 import logging
+# Set critical environment variables immediately
+os.environ.update({
+    'ORT_DYLIB_DEFAULT_OPTIONS': 'DisableExecutablePageAllocator=1',
+    'ONNXRUNTIME_EXECUTION_PROVIDERS': 'CPUExecutionProvider',
+    'ORT_DISABLE_TLS_ARENA': '1'
+})
 # Configure logging
 logging.basicConfig(
     level=logging.INFO,