Spaces:

Elvoro
/

Tools

Running

App Files Files Community

jebin2 commited on Jan 12

Commit

9cee612

1 Parent(s): 3a02405

Refactor: Modularized RunwayML logic and extracted to src/runwayml/

Browse files

Files changed (5) hide show

src/api_clients.py +0 -165
src/automation.py +3 -2
src/runwayml/__init__.py +0 -0
src/runwayml/generate_video.py +168 -0
src/video_generation_process.py +84 -0

src/api_clients.py CHANGED Viewed

@@ -100,171 +100,6 @@ class APIClients:
         except: pass
-    async def generate_video(self, prompt: str, duration: int, image_input: str = None) -> Dict:
-        """
-        Generate video using RunwayML gen4_turbo ($0.25 per video / 25 credits)
-        Args:
-            prompt: Text prompt for video generation
-            duration: Video duration in seconds
-            image_input: A HTTPS URL or a LOCAL FILE PATH to an image.
-        """
-        try:
-            if os.getenv("TEST_AUTOMATION", "").lower() == "true":
-                if image_input:
-                    return {
-                        "task_id": "644319db-5226-42cf-b45f-5388e40d38a6",
-                        "video_url": f"{os.getenv('TEST_DATA_DIRECTORY')}/image-to-video.mp4",
-                        "local_path": f"{os.getenv('TEST_DATA_DIRECTORY')}/image-to-video.mp4",
-                        "duration": 3,
-                        "prompt": prompt,
-                        "status": "SUCCEEDED",
-                        "created_at": "2025-10-15T12:39:24.279Z",
-                        "model": "veo3.1_fast",
-                    }
-                else:
-                    return {
-                        "task_id": "644319db-5226-42cf-b45f-5388e40d38a6",
-                        "video_url": f"{os.getenv('TEST_DATA_DIRECTORY')}/veo_text_to_video.mp4",
-                        "local_path": f"{os.getenv('TEST_DATA_DIRECTORY')}/veo_text_to_video.mp4",
-                        "duration": 3,
-                        "prompt": prompt,
-                        "status": "SUCCEEDED",
-                        "created_at": "2025-10-15T12:39:24.279Z",
-                        "model": "gen4_turbo",
-                    }
-            logger.info(f"🎬 Generating video with: {prompt[:1000]}...")
-            prompt_image_value = ""
-            if image_input:
-                if image_input.startswith("http"):
-                    # It's a URL, use it directly
-                    logger.info("Using provided image URL for RunwayML.")
-                    prompt_image_value = image_input
-                else:
-                    # It's a local file path, convert it to a Base64 Data URI
-                    logger.info(f"Encoding local image {image_input} to Base64 Data URI.")
-                    try:
-                        # Determine the image type from the file extension
-                        image_type = os.path.splitext(image_input)[1].replace('.', '') # e.g., 'png'
-                        with open(image_input, "rb") as image_file:
-                            encoded_string = base64.b64encode(image_file.read()).decode('utf-8')
-                        # Construct the full Data URI
-                        prompt_image_value = f"data:image/{image_type};base64,{encoded_string}"
-                        logger.info("✓ Successfully encoded image to Data URI.")
-                    except Exception as e:
-                        logger.error(f"❌ Failed to encode local image to Base64: {e}")
-                        raise
-            headers = {
-                "Authorization": f"Bearer {self.runway_api_key}",
-                "Content-Type": "application/json",
-                "X-Runway-Version": "2024-11-06",
-            }
-            model_name = "gen4_turbo"
-            ratio = "720:1280"
-            url = "https://api.dev.runwayml.com/v1/image_to_video"
-            duration = 3
-            if not image_input:
-                # ratio = "1080:1920" # not working wih veo3.1_fast
-                model_name = "veo3.1_fast"
-                duration = 4
-                # ratio = "1080:1920" # not working with veo in this ratio
-                url = "https://api.dev.runwayml.com/v1/text_to_video"
-            if os.getenv("USE_GEMIMI_VIDEO", "false").lower() == "true":
-                logger.info("Using Gemini SDK for video generation...")
-                output_path = await self.get_cache_url(f"ai_studio_sdk.generate_video_{model_name}", ".mp4")
-                if not output_path:
-                    output_path = f'/tmp/video_{duration}_{model_name}_{uuid.uuid4().hex[:8]}.mp4'
-                    ai_studio_sdk.generate_video(prompt, output_path, image_input)
-                    await self.store_in_cache(output_path, f"ai_studio_sdk.generate_video_{model_name}", ".mp4")
-                video_result = {
-                    "local_path": output_path,
-                    "task_id": None,
-                    "duration": duration,
-                    "prompt": prompt,
-                    "status": "success",
-                    "created_at": None,
-                    "model": model_name,
-                }
-                return video_result
-            payload = {
-                "promptImage": prompt_image_value,
-                "promptText": prompt[:1000],
-                "model": model_name,
-                "duration": duration,
-                "ratio": ratio,
-            }
-            method_type = "gen4_video_google_video" if image_input else "veo_google_video"
-            content = await self.get_from_cache(method_type, duration)
-            if content:
-                return json.loads(content)
-            if not image_input:
-                payload.pop("promptImage", None)
-            async with aiohttp.ClientSession() as session:
-                # Create task
-                async with session.post(
-                    url, headers=headers, json=payload
-                ) as response:
-                    if response.status != 200:
-                        error_text = await response.text()
-                        # Log the full error for easier debugging
-                        logger.error(f"RunwayML API Error Response: {error_text}")
-                        raise Exception(f"RunwayML error: {error_text}")
-                    task_data = await response.json()
-                    task_id = task_data["id"]
-                    logger.info(f"✓ Task created with {model_name}: {task_id}")
-                # Poll for completion
-                # task_id = "3b6d5a82-923f-4fa6-a7bc-4844de6e31e1"
-                max_attempts = 120
-                for _ in range(max_attempts):
-                    await asyncio.sleep(10)
-                    async with session.get(
-                        f"https://api.dev.runwayml.com/v1/tasks/{task_id}", headers=headers
-                    ) as status_response:
-                        status_data = await status_response.json()
-                        status = status_data["status"]
-                        if status == "SUCCEEDED":
-                            video_url = status_data["output"][0]
-                            logger.info(f"✅ Video generated with {model_name}: {video_url}")
-                            video_result = {
-                                "video_url": video_url,
-                                "task_id": task_id,
-                                "duration": duration,
-                                "prompt": prompt,
-                                "status": status,
-                                "created_at": status_data.get("createdAt"),
-                                "model": model_name,
-                            }
-                            await self.store_in_cache_file(method_type, json.dumps(video_result), duration)
-                            return video_result
-                        elif status == "FAILED":
-                            raise Exception(f"Generation failed: {status_data.get('failure')}")
-                        elif status == "RUNNING":
-                            progress = status_data.get("progress", 0)
-                            logger.info(f"⏳ Progress: {progress*100:.0f}%")
-                raise Exception("Timeout waiting for video generation")
-        except Exception as e:
-            logger.error(f"❌ Video generation error: {e}")
-            raise


100	except: pass
101
102





































































































































































103
104
105

src/automation.py CHANGED Viewed

@@ -7,6 +7,7 @@ import os
 import time
 import json
 from google_src import ai_studio_sdk
 from typing import Dict, List, Optional, Any
 from pathlib import Path
 from api_clients import APIClients
@@ -477,7 +478,7 @@ class ContentAutomation:
             upload_file_to_gcs(image_path)
             # Step 3: Generate video using gen4_turbo
-            video_data = await self.api_clients.generate_video(
                 prompt=strategy["runway_prompt"], image_input=image_path, duration=strategy.get("duration", 3)
             )
@@ -485,7 +486,7 @@ class ContentAutomation:
             video_data["script"] = self.data_holder.tts_script
             if os.getenv("USE_VEO", "false").lower() == "true":
-                veo_video_data = await self.api_clients.generate_video(
                     prompt=strategy["runway_veo_prompt"], duration=strategy.get("duration", 4)
                 )
                 video_data["veo_video_data"] = veo_video_data

 import time
 import json
 from google_src import ai_studio_sdk
+from video_generation_process import generate_video_process
 from typing import Dict, List, Optional, Any
 from pathlib import Path
 from api_clients import APIClients
             upload_file_to_gcs(image_path)
             # Step 3: Generate video using gen4_turbo
+            video_data = await generate_video_process(
                 prompt=strategy["runway_prompt"], image_input=image_path, duration=strategy.get("duration", 3)
             )
             video_data["script"] = self.data_holder.tts_script
             if os.getenv("USE_VEO", "false").lower() == "true":
+                veo_video_data = await generate_video_process(
                     prompt=strategy["runway_veo_prompt"], duration=strategy.get("duration", 4)
                 )
                 video_data["veo_video_data"] = veo_video_data

src/runwayml/__init__.py ADDED Viewed

File without changes

src/runwayml/generate_video.py ADDED Viewed

	@@ -0,0 +1,168 @@

+import os
+import aiohttp
+import asyncio
+import base64
+import logging
+from typing import Dict, Tuple, Optional
+logger = logging.getLogger(__name__)
+def _get_api_key() -> str:
+    """Retrieve RunwayML API key from environment variables."""
+    runway_api_key = os.getenv("RUNWAYML_API_KEY") or os.getenv("RUNWAY_2ND_API_KEY") or os.getenv("SPARK_KEY")
+    if not runway_api_key:
+         logger.error("RunwayML API key not found in environment variables.")
+         raise ValueError("RunwayML API key not found.")
+    return runway_api_key
+def _get_headers(api_key: str) -> Dict[str, str]:
+    """Construct headers for RunwayML API."""
+    return {
+        "Authorization": f"Bearer {api_key}",
+        "Content-Type": "application/json",
+        "X-Runway-Version": "2024-11-06",
+    }
+def _encode_image(image_input: str) -> str:
+    """Encode local image to Base64 Data URI or return URL as is."""
+    if image_input.startswith("http"):
+        logger.info("Using provided image URL for RunwayML.")
+        return image_input
+    logger.info(f"Encoding local image {image_input} to Base64 Data URI.")
+    try:
+        image_type = os.path.splitext(image_input)[1].replace('.', '') # e.g., 'png'
+        with open(image_input, "rb") as image_file:
+            encoded_string = base64.b64encode(image_file.read()).decode('utf-8')
+        data_uri = f"data:image/{image_type};base64,{encoded_string}"
+        logger.info("✓ Successfully encoded image to Data URI.")
+        return data_uri
+    except Exception as e:
+        logger.error(f"❌ Failed to encode local image to Base64: {e}")
+        raise
+async def _submit_task(session: aiohttp.ClientSession, url: str, headers: Dict, payload: Dict, model_name: str) -> str:
+    """Submit generation task to RunwayML API and return task ID."""
+    async with session.post(url, headers=headers, json=payload) as response:
+        if response.status != 200:
+            error_text = await response.text()
+            logger.error(f"RunwayML API Error Response: {error_text}")
+            raise Exception(f"RunwayML error: {error_text}")
+        task_data = await response.json()
+        task_id = task_data["id"]
+        logger.info(f"✓ Task created with {model_name}: {task_id}")
+        return task_id
+async def _poll_task(session: aiohttp.ClientSession, task_id: str, headers: Dict, model_name: str) -> Dict:
+    """Poll RunwayML task until completion."""
+    max_attempts = 120
+    for _ in range(max_attempts):
+        await asyncio.sleep(10)
+        async with session.get(
+            f"https://api.dev.runwayml.com/v1/tasks/{task_id}", headers=headers
+        ) as status_response:
+            status_data = await status_response.json()
+            status = status_data["status"]
+            if status == "SUCCEEDED":
+                video_url = status_data["output"][0]
+                logger.info(f"✅ Video generated with {model_name}: {video_url}")
+                return {
+                    "video_url": video_url,
+                    "status": status,
+                    "created_at": status_data.get("createdAt"),
+                }
+            elif status == "FAILED":
+                raise Exception(f"Generation failed: {status_data.get('failure')}")
+            elif status == "RUNNING":
+                progress = status_data.get("progress", 0)
+                logger.info(f"⏳ Progress: {progress*100:.0f}%")
+    raise Exception("Timeout waiting for video generation")
+async def _handle_image_to_video(
+    session: aiohttp.ClientSession,
+    headers: Dict,
+    prompt: str,
+    duration: int,
+    image_input: str
+) -> Tuple[str, str, int]:
+    """Handle Image-to-Video generation workflow."""
+    model_name = "gen4_turbo"
+    ratio = "720:1280"
+    url = "https://api.dev.runwayml.com/v1/image_to_video"
+    prompt_image_value = _encode_image(image_input)
+    payload = {
+        "promptImage": prompt_image_value,
+        "promptText": prompt[:1000],
+        "model": model_name,
+        "duration": duration,
+        "ratio": ratio,
+    }
+    task_id = await _submit_task(session, url, headers, payload, model_name)
+    return task_id, model_name, duration
+async def _handle_text_to_video(
+    session: aiohttp.ClientSession,
+    headers: Dict,
+    prompt: str
+) -> Tuple[str, str, int]:
+    """Handle Text-to-Video generation workflow."""
+    model_name = "veo3.1_fast"
+    duration = 4 # Fixed duration for Veo text-to-video for now
+    url = "https://api.dev.runwayml.com/v1/text_to_video"
+    payload = {
+        "promptText": prompt[:1000],
+        "model": model_name,
+        "duration": duration,
+        # "ratio": "1080:1920" # Note: Ratio not supported for Veo currently
+    }
+    task_id = await _submit_task(session, url, headers, payload, model_name)
+    return task_id, model_name, duration
+async def generate_video_runway(prompt: str, duration: int, image_input: str = None) -> Dict:
+    """
+    Generate video using RunwayML (Text-to-Video or Image-to-Video).
+    Args:
+        prompt: Text prompt for video generation
+        duration: Video duration in seconds (may be overridden by specific models)
+        image_input: Optional HTTPS URL or local file path to an image.
+    """
+    try:
+        api_key = _get_api_key()
+        headers = _get_headers(api_key)
+        async with aiohttp.ClientSession() as session:
+            if image_input:
+                task_id, model_name, final_duration = await _handle_image_to_video(
+                    session, headers, prompt, duration, image_input
+                )
+            else:
+                task_id, model_name, final_duration = await _handle_text_to_video(
+                    session, headers, prompt
+                )
+            result_data = await _poll_task(session, task_id, headers, model_name)
+            return {
+                "video_url": result_data["video_url"],
+                "task_id": task_id,
+                "duration": final_duration,
+                "prompt": prompt,
+                "status": result_data["status"],
+                "created_at": result_data["created_at"],
+                "model": model_name,
+            }
+    except Exception as e:
+        logger.error(f"❌ Video generation error: {e}")
+        raise

src/video_generation_process.py ADDED Viewed

	@@ -0,0 +1,84 @@

+import os
+import uuid
+import json
+import logging
+from typing import Dict, Optional
+from google_src import ai_studio_sdk
+from runwayml.generate_video import generate_video_runway
+from utils import logger
+from google_src.gcs_utils import upload_file_to_gcs
+async def generate_video_process(prompt: str, duration: int, image_input: str = None) -> Dict:
+    """
+    Orchestrate video generation:
+    1. Check if TEST_AUTOMATION is on -> return mock data.
+    2. Check USE_GEMIMI_VIDEO -> use ai_studio_sdk.
+    3. Else -> use RunwayML.
+    Handles caching implicitly via caller or here if needed (previously cached in api_clients was complex,
+    but automation usually re-checks cache. We can reimplement simple caching here or rely on the fact
+    that the logic is now streamlined).
+    The original api_clients code had extensive caching using APIClients.store_in_cache which uploaded to GCS.
+    We should probably return the result and let the caller handle it or replicate the upload if needed for
+    consistency with 'video_url' in result.
+    RunwayML returns a public URL. Gemini SDK returns a local path, so we upload it to GCS to get a URL,
+    making the result format consistent.
+    """
+    # 1. Test Mode
+    if os.getenv("TEST_AUTOMATION", "").lower() == "true":
+        if image_input:
+            return {
+                "task_id": "644319db-5226-42cf-b45f-5388e40d38a6",
+                "video_url": f"{os.getenv('TEST_DATA_DIRECTORY')}/image-to-video.mp4",
+                "local_path": f"{os.getenv('TEST_DATA_DIRECTORY')}/image-to-video.mp4",
+                "duration": 3,
+                "prompt": prompt,
+                "status": "SUCCEEDED",
+                "created_at": "2025-10-15T12:39:24.279Z",
+                "model": "veo3.1_fast",
+            }
+        else:
+            return {
+                "task_id": "644319db-5226-42cf-b45f-5388e40d38a6",
+                "video_url": f"{os.getenv('TEST_DATA_DIRECTORY')}/veo_text_to_video.mp4",
+                "local_path": f"{os.getenv('TEST_DATA_DIRECTORY')}/veo_text_to_video.mp4",
+                "duration": 3,
+                "prompt": prompt,
+                "status": "SUCCEEDED",
+                "created_at": "2025-10-15T12:39:24.279Z",
+                "model": "gen4_turbo",
+            }
+    # 2. Gemini / Veo
+    if os.getenv("USE_GEMIMI_VIDEO", "false").lower() == "true":
+        logger.info("Using Gemini SDK for video generation...")
+        model_name = "veo3.1_fast" # implied default from context
+        # Original code checked cache here. We'll simplify: generate -> upload -> return.
+        output_path = f'/tmp/video_{duration}_{model_name}_{uuid.uuid4().hex[:8]}.mp4'
+        ai_studio_sdk.generate_video(prompt, output_path, image_input)
+        # Upload to GCS to get a URL to match expectations
+        upload_result = upload_file_to_gcs(output_path)
+        video_url = upload_result.get('url')
+        video_result = {
+            "local_path": output_path,
+            "video_url": video_url,
+            "task_id": None,
+            "duration": duration,
+            "prompt": prompt,
+            "status": "success",
+            "created_at": None,
+            "model": model_name,
+        }
+        return video_result
+    # 3. RunwayML
+    logger.info("Using RunwayML for video generation...")
+    return await generate_video_runway(prompt, duration, image_input)