Spaces:

rairo
/

sozo-api

Sleeping

App Files Files

rairo committed on Mar 20, 2025

Commit

cfd4972

verified ·

1 Parent(s): 64f769f

Update video_gen.py

Browse files

Files changed (1) hide show

video_gen.py +24 -19

video_gen.py CHANGED Viewed

@@ -22,23 +22,26 @@ import seaborn as sns
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
 def create_silent_video(images, durations, output_path, logo_path="sozo_logo2.png", font_path="lazy_dog.ttf"):
     try:
         height, width = 720, 1280
         fps = 24
         fourcc = cv2.VideoWriter_fourcc(*'mp4v')
         video = cv2.VideoWriter(output_path, fourcc, fps, (width, height))
         if not video.isOpened():
-            print("Failed to create video file.")
             return None
         # Load font
         try:
             font_size = 45
             font = ImageFont.truetype(font_path, font_size)
         except Exception as e:
-            print(f"Error loading font: {e}")
             font = None
         # Load logo
@@ -47,32 +50,33 @@ def create_silent_video(images, durations, output_path, logo_path="sozo_logo2.pn
             try:
                 logo = cv2.imread(logo_path)
                 if logo is not None:
-                    logo = cv2.resize(logo, (width, height))  # Resize logo to full screen
                 else:
-                    print(f"Warning: Failed to load logo from {logo_path}.")
             except Exception as e:
-                print(f"Error loading logo: {e}")
-        for img, duration in zip(images, durations):
             try:
-                # Convert image to RGB if it's in a different mode
                 if img.mode != "RGB":
                     img = img.convert("RGB")
-                # Resize image
                 img_resized = img.resize((width, height))
-                # Convert to NumPy array
                 frame = np.array(img_resized)
-                # Convert to OpenCV format (BGR)
                 frame_cv = cv2.cvtColor(frame, cv2.COLOR_RGB2BGR)
             except Exception as e:
-                print(f"Invalid image detected, replacing with logo: {e}")
                 if logo is not None:
                     frame_cv = logo
                 else:
-                    frame_cv = np.zeros((height, width, 3), dtype=np.uint8)  # Blank frame fallback
             # Convert frame to PIL for text overlay
             pil_img = Image.fromarray(cv2.cvtColor(frame_cv, cv2.COLOR_BGR2RGB))
@@ -86,8 +90,8 @@ def create_silent_video(images, durations, output_path, logo_path="sozo_logo2.pn
                 bbox = draw.textbbox((0, 0), text1, font=font)
                 text1_height = bbox[3] - bbox[1]
-                text_position1 = (width - 270, height - 120)  # "Made With"
-                text_position2 = (width - 330, height - 120 + text1_height + 5)  # "Sozo Dream Lab"
                 draw.text(text_position1, text1, font=font, fill=(81, 34, 97, 255))
                 draw.text(text_position2, text2, font=font, fill=(81, 34, 97, 255))
@@ -95,20 +99,21 @@ def create_silent_video(images, durations, output_path, logo_path="sozo_logo2.pn
             # Convert back to OpenCV format
             frame_cv = cv2.cvtColor(np.array(pil_img), cv2.COLOR_RGB2BGR)
-            # Write frame multiple times to match duration
             for _ in range(int(duration * fps)):
                 video.write(frame_cv)
-        # Add full-screen logo frame at the end
         if logo is not None:
-            for _ in range(int(3 * fps)):  # Display for 3 seconds
                 video.write(logo)
         video.release()
         return output_path
     except Exception as e:
-        print(f"Error creating silent video: {e}")
         return None

 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
 def create_silent_video(images, durations, output_path, logo_path="sozo_logo2.png", font_path="lazy_dog.ttf"):
     try:
+        print("Initializing video creation...")
         height, width = 720, 1280
         fps = 24
         fourcc = cv2.VideoWriter_fourcc(*'mp4v')
         video = cv2.VideoWriter(output_path, fourcc, fps, (width, height))
         if not video.isOpened():
+            print("❌ ERROR: Failed to create video file.")
             return None
         # Load font
         try:
             font_size = 45
             font = ImageFont.truetype(font_path, font_size)
+            print("✅ Font loaded successfully.")
         except Exception as e:
+            print(f"⚠️ Font load error: {e}")
             font = None
         # Load logo
             try:
                 logo = cv2.imread(logo_path)
                 if logo is not None:
+                    logo = cv2.resize(logo, (width, height))
+                    print("✅ Logo loaded successfully.")
                 else:
+                    print(f"⚠️ Warning: Failed to load logo from {logo_path}.")
             except Exception as e:
+                print(f"⚠️ Error loading logo: {e}")
+        print(f"Processing {len(images)} images...")
+        for idx, (img, duration) in enumerate(zip(images, durations)):
             try:
+                print(f"➡️ Processing image {idx + 1}/{len(images)}...")
                 if img.mode != "RGB":
                     img = img.convert("RGB")
                 img_resized = img.resize((width, height))
                 frame = np.array(img_resized)
+                # Convert to OpenCV format
                 frame_cv = cv2.cvtColor(frame, cv2.COLOR_RGB2BGR)
             except Exception as e:
+                print(f"❌ ERROR: Invalid image detected: {e}")
                 if logo is not None:
                     frame_cv = logo
                 else:
+                    frame_cv = np.zeros((height, width, 3), dtype=np.uint8)
             # Convert frame to PIL for text overlay
             pil_img = Image.fromarray(cv2.cvtColor(frame_cv, cv2.COLOR_BGR2RGB))
                 bbox = draw.textbbox((0, 0), text1, font=font)
                 text1_height = bbox[3] - bbox[1]
+                text_position1 = (width - 270, height - 120)
+                text_position2 = (width - 330, height - 120 + text1_height + 5)
                 draw.text(text_position1, text1, font=font, fill=(81, 34, 97, 255))
                 draw.text(text_position2, text2, font=font, fill=(81, 34, 97, 255))
             # Convert back to OpenCV format
             frame_cv = cv2.cvtColor(np.array(pil_img), cv2.COLOR_RGB2BGR)
+            # Write frame multiple times
             for _ in range(int(duration * fps)):
                 video.write(frame_cv)
+        # Add full-screen logo at the end
         if logo is not None:
+            for _ in range(int(3 * fps)):
                 video.write(logo)
         video.release()
+        print("✅ Video creation completed successfully!")
         return output_path
     except Exception as e:
+        print(f"❌ ERROR in video generation: {e}")
         return None