Spaces:

Csuarezg
/

Final_Assignment_Template_hf-course

Sleeping

App Files Files Community

Csuarezg committed on May 28, 2025

Commit

38d5f80

verified ·

1 Parent(s): 2f56333

Update app.py

Browse files

Files changed (1) hide show

app.py +66 -7

app.py CHANGED Viewed

@@ -9,6 +9,34 @@ import logging
 from typing import List, Dict, Optional, TypedDict, Annotated
 import numpy as np
 import base64
 # Core ML/AI imports
 from langchain_core.messages import HumanMessage, SystemMessage, AnyMessage, ToolMessage
@@ -26,7 +54,15 @@ import wikipedia
 from youtube_transcript_api import YouTubeTranscriptApi, TranscriptsDisabled, NoTranscriptFound
 import speech_recognition as sr
 from PIL import Image
-from transformers import pipeline
 # Audio processing - NEW IMPORTS
 try:
@@ -185,12 +221,19 @@ class GAIAAgent:
         def __init__(self, parent_agent):
             self.parent_agent = parent_agent
             print("🔧 Initializing Enhanced FileAnalyzerTool...")
-            try:
-                self.image_analyzer = pipeline("image-classification", model="google/vit-base-patch16-224")
-                self.text_generator = pipeline("image-to-text", model="Salesforce/blip-image-captioning-base")
-                print("✅ Image analysis models loaded successfully")
-            except Exception as e:
-                print(f"⚠️ Could not load image analysis models: {e}")
                 self.image_analyzer = None
                 self.text_generator = None
@@ -199,6 +242,12 @@ class GAIAAgent:
                 print("✅ Audio processing (pydub) available")
             else:
                 print("⚠️ pydub not available - MP3 conversion will be limited")
         def analyze(self, file_path: str, file_type: str) -> str:
             try:
@@ -1318,6 +1367,16 @@ if __name__ == "__main__":
     else:
         print("⚠️ pydub not available - consider adding to requirements.txt")
     print("="*50 + "\n")
     print("🌟 Launching Enhanced GAIA Agent Interface...")
     demo.launch(debug=True, share=False)

 from typing import List, Dict, Optional, TypedDict, Annotated
 import numpy as np
 import base64
+import subprocess
+import sys
+# Configure ffmpeg for pydub in HuggingFace Spaces
+def setup_ffmpeg():
+    """Setup ffmpeg for audio processing in HuggingFace Spaces"""
+    try:
+        # Check if ffmpeg is already available
+        subprocess.run(['ffmpeg', '-version'], capture_output=True, check=True)
+        print("✅ ffmpeg already available")
+        return True
+    except (subprocess.CalledProcessError, FileNotFoundError):
+        try:
+            # Try to install ffmpeg using apt-get (works in HF Spaces)
+            print("📦 Installing ffmpeg...")
+            subprocess.run(['apt-get', 'update'], capture_output=True, check=True)
+            subprocess.run(['apt-get', 'install', '-y', 'ffmpeg'], capture_output=True, check=True)
+            print("✅ ffmpeg installed successfully")
+            return True
+        except subprocess.CalledProcessError as e:
+            print(f"⚠️ Could not install ffmpeg: {e}")
+            return False
+        except Exception as e:
+            print(f"⚠️ ffmpeg setup failed: {e}")
+            return False
+# Setup ffmpeg early
+FFMPEG_AVAILABLE = setup_ffmpeg()
 # Core ML/AI imports
 from langchain_core.messages import HumanMessage, SystemMessage, AnyMessage, ToolMessage
 from youtube_transcript_api import YouTubeTranscriptApi, TranscriptsDisabled, NoTranscriptFound
 import speech_recognition as sr
 from PIL import Image
+# Transformers with error handling
+try:
+    from transformers import pipeline
+    TRANSFORMERS_AVAILABLE = True
+    print("✅ Transformers library loaded successfully")
+except ImportError:
+    TRANSFORMERS_AVAILABLE = False
+    print("⚠️ Transformers not available - image analysis will be limited")
 # Audio processing - NEW IMPORTS
 try:
         def __init__(self, parent_agent):
             self.parent_agent = parent_agent
             print("🔧 Initializing Enhanced FileAnalyzerTool...")
+            # Initialize image analysis models if transformers is available
+            if TRANSFORMERS_AVAILABLE:
+                try:
+                    self.image_analyzer = pipeline("image-classification", model="google/vit-base-patch16-224")
+                    self.text_generator = pipeline("image-to-text", model="Salesforce/blip-image-captioning-base")
+                    print("✅ Image analysis models loaded successfully")
+                except Exception as e:
+                    print(f"⚠️ Could not load image analysis models: {e}")
+                    self.image_analyzer = None
+                    self.text_generator = None
+            else:
+                print("⚠️ Transformers not available - image analysis models disabled")
                 self.image_analyzer = None
                 self.text_generator = None
                 print("✅ Audio processing (pydub) available")
             else:
                 print("⚠️ pydub not available - MP3 conversion will be limited")
+            # Check ffmpeg availability
+            if FFMPEG_AVAILABLE:
+                print("✅ ffmpeg available for audio conversion")
+            else:
+                print("⚠️ ffmpeg not available - some audio formats may not work")
         def analyze(self, file_path: str, file_type: str) -> str:
             try:
     else:
         print("⚠️ pydub not available - consider adding to requirements.txt")
+    if FFMPEG_AVAILABLE:
+        print("✅ ffmpeg available for audio conversion!")
+    else:
+        print("⚠️ ffmpeg not available - some audio formats may not work")
+    if TRANSFORMERS_AVAILABLE:
+        print("✅ Transformers available for image analysis!")
+    else:
+        print("⚠️ transformers not available - consider adding to requirements.txt")
     print("="*50 + "\n")
     print("🌟 Launching Enhanced GAIA Agent Interface...")
     demo.launch(debug=True, share=False)