Spaces:

shaheerawan3
/

VisionCraft-AI

Sleeping

App Files Files Community

shaheerawan3 committed on Jan 6

Commit

69162b3

verified ·

1 Parent(s): 1ec0cbb

Update app.py

Browse files

Files changed (1) hide show

app.py +104 -11

app.py CHANGED Viewed

@@ -24,12 +24,39 @@ from io import BytesIO
 class ImageScraper:
     def __init__(self):
-        self.headers = {
             'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36',
             'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
             'Accept-Language': 'en-US,en;q=0.5',
             'Connection': 'keep-alive',
-        }
     def get_stock_images(self) -> List[str]:
         """Return preset stock images relevant to digital security and technology"""
@@ -103,6 +130,9 @@ class EnhancedVideoGenerator:
             logging.error(f"Initialization failed: {str(e)}")
             raise RuntimeError("Failed to initialize video generator")
     def setup_logging(self):
         """Configure logging for the application"""
         logging.basicConfig(
@@ -339,20 +369,83 @@ class EnhancedVideoGenerator:
             self.logger.error(f"Progress bar drawing failed: {str(e)}")
     def generate_voice_over(self, script: str) -> AudioFileClip:
-        """Generate voice-over audio using gTTS"""
         try:
             audio_path = self.temp_dir / "voice.mp3"
-            tts = gTTS(
-                text=script,
-                lang='en',
-                slow=False
             )
-            tts.save(str(audio_path))
             return AudioFileClip(str(audio_path))
         except Exception as e:
-            self.logger.error(f"Voice-over generation failed: {str(e)}")
-            return AudioFileClip(duration=len(script.split()) * 0.3)
     def create_video(self, script: str, style: str, duration: int, output_path: str, selected_images: List[str]) -> str:
         """Create video with selected images"""

 class ImageScraper:
     def __init__(self):
+        self.PIXABAY_API_KEY = "48069976-37e20099248207cee12385560"  # Replace with your key
+        self.stock_images = [
+            "https://images.pexels.com/photos/60504/security-protection-anti-virus-software-60504.jpeg",
             'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36',
             'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
             'Accept-Language': 'en-US,en;q=0.5',
             'Connection': 'keep-alive',
+        ]
+     def get_images(self, query: str, num_images: int = 15) -> List[str]:
+        try:
+            search_terms = [
+                query,
+                "digital security technology",
+                "cyber security",
+                "data protection",
+                "digital technology"
+            ]
+            all_urls = []
+            for term in search_terms:
+                url = f"https://pixabay.com/api/?key={self.PIXABAY_API_KEY}&q={term.replace(' ', '+')}&image_type=photo&per_page=5"
+                response = requests.get(url)
+                data = response.json()
+                if 'hits' in data:
+                    all_urls.extend([img['largeImageURL'] for img in data['hits']])
+            return list(set(all_urls))[:num_images] if all_urls else self.stock_images
+        except Exception as e:
+            print(f"Pixabay API error: {e}")
+            return self.stock_images
     def get_stock_images(self) -> List[str]:
         """Return preset stock images relevant to digital security and technology"""
             logging.error(f"Initialization failed: {str(e)}")
             raise RuntimeError("Failed to initialize video generator")
+            self.ELEVEN_LABS_API_KEY = "sk_acdad9d2d82d504bddbe5ed4aa290ca772c106aed5b128ba"  # Replace with your key
     def setup_logging(self):
         """Configure logging for the application"""
         logging.basicConfig(
             self.logger.error(f"Progress bar drawing failed: {str(e)}")
     def generate_voice_over(self, script: str) -> AudioFileClip:
         """Synthesize narration for ``script`` and return it as an audio clip.

         ElevenLabs is tried first. On a non-200 response the Azure Speech SDK
         is used instead. If either path raises, or Azure does not report a
         completed synthesis, the error is logged and
         ``self.generate_fallback_audio(script)`` is returned.

         Args:
             script: The text to be spoken.

         Returns:
             An ``AudioFileClip`` loaded from ``voice.mp3`` in ``self.temp_dir``,
             or whatever ``self.generate_fallback_audio`` returns on failure.

         NOTE(review): ``self.AZURE_SPEECH_KEY``, ``self.AZURE_REGION`` and
         ``self.generate_fallback_audio`` are not defined in the code visible
         here - confirm they exist elsewhere in the class.
         """
         try:
             # Try ElevenLabs first
             audio_path = self.temp_dir / "voice.mp3"
             headers = {
                 "xi-api-key": self.ELEVEN_LABS_API_KEY,
                 "Content-Type": "application/json",
             }
             payload = {
                 "text": script,
                 "model_id": "eleven_monolingual_v1",
                 "voice_settings": {
                     "stability": 0.75,
                     "similarity_boost": 0.75,
                 },
             }
             response = requests.post(
                 "https://api.elevenlabs.io/v1/text-to-speech/21m00Tcm4TlvDq8ikWAM",
                 headers=headers,
                 json=payload,
                 timeout=30,  # a stalled TTS request must not block forever
             )
             if response.status_code == 200:
                 with open(audio_path, "wb") as f:
                     f.write(response.content)
             else:
                 # Fallback to Azure TTS
                 speech_config = speechsdk.SpeechConfig(
                     subscription=self.AZURE_SPEECH_KEY,
                     region=self.AZURE_REGION,
                 )
                 speech_config.speech_synthesis_voice_name = "en-US-JennyNeural"
                 synthesizer = speechsdk.SpeechSynthesizer(speech_config=speech_config)
                 result = synthesizer.speak_text_async(script).get()
                 if result.reason != speechsdk.ResultReason.SynthesizingAudioCompleted:
                     # Without this, nothing is written and a stale voice.mp3
                     # left over from an earlier call could be loaded below.
                     raise RuntimeError(
                         f"Azure speech synthesis did not complete: {result.reason}"
                     )
                 # NOTE(review): the Azure default output format may not be
                 # MP3 even though the file is named voice.mp3 - confirm.
                 with open(audio_path, "wb") as f:
                     f.write(result.audio_data)
             return AudioFileClip(str(audio_path))
         except Exception as e:
             # Logged through the instance logger, like the other methods of
             # this class, instead of printing to stdout.
             self.logger.error(f"Voice generation error: {e}")
             return self.generate_fallback_audio(script)
+    def generate_subtitles(self, script: str, duration: int) -> str:
+        words = script.split()
+        words_per_second = len(words) / duration
+        subtitle_path = self.temp_dir / "subtitles.srt"
+        with open(subtitle_path, 'w') as f:
+            current_time = 0
+            words_per_subtitle = int(words_per_second * 3)  # 3 seconds per subtitle
+            for i in range(0, len(words), words_per_subtitle):
+                subtitle_words = words[i:i + words_per_subtitle]
+                if subtitle_words:
+                    start_time = self.format_time(current_time)
+                    current_time += len(subtitle_words) / words_per_second
+                    end_time = self.format_time(current_time)
+                    f.write(f"{i//words_per_subtitle + 1}\n")
+                    f.write(f"{start_time} --> {end_time}\n")
+                    f.write(f"{' '.join(subtitle_words)}\n\n")
+        return str(subtitle_path)
+    @staticmethod
+    def format_time(seconds: float) -> str:
+        hours = int(seconds // 3600)
+        minutes = int((seconds % 3600) // 60)
+        secs = int(seconds % 60)
+        msecs = int((seconds - int(seconds)) * 1000)
+        return f"{hours:02d}:{minutes:02d}:{secs:02d},{msecs:03d}"
     def create_video(self, script: str, style: str, duration: int, output_path: str, selected_images: List[str]) -> str:
         """Create video with selected images"""