Spaces:

roll-ai
/

CogVideoXInterp

Paused

App Files Files Community

AhmadMustafa committed on Sep 30

Commit

2fa4732

1 Parent(s): 068b511

add: demo

Browse files

Files changed (2) hide show

app.py +41 -55
requirements.txt +0 -1

app.py CHANGED Viewed

@@ -1,15 +1,18 @@
 import gradio as gr
 import torch
 from diffusers.utils import export_to_video
-from cogvideox_interpolation.pipeline import CogVideoXInterpolationPipeline
 from PIL import Image
-import tempfile
-import os
 # Global variable to store the pipeline
 pipe = None
 device = "cuda" if torch.cuda.is_available() else "cpu"
 def load_model(model_path):
     """Load the CogVideoX-Interpolation model"""
     global pipe
@@ -20,10 +23,7 @@ def load_model(model_path):
     # Determine dtype based on model variant
     dtype = torch.bfloat16 if "5b" in model_path.lower() else torch.float16
-    pipe = CogVideoXInterpolationPipeline.from_pretrained(
-        model_path,
-        torch_dtype=dtype
-    )
     # Memory optimization
     if device == "cuda":
@@ -37,6 +37,7 @@ def load_model(model_path):
     print("Model loaded successfully!")
     return "✓ Model loaded successfully!"
 def generate_interpolation(
     first_image,
     last_image,
@@ -45,7 +46,7 @@ def generate_interpolation(
     num_inference_steps=50,
     guidance_scale=6.0,
     fps=8,
-    seed=42
 ):
     """Generate interpolated video between two keyframes"""
@@ -66,7 +67,9 @@ def generate_interpolation(
             last_image = Image.fromarray(last_image)
         print(f"Generating video with prompt: {prompt}")
-        print(f"Parameters: frames={num_frames}, steps={num_inference_steps}, guidance={guidance_scale}")
         # Generate video
         generator = torch.Generator(device=device).manual_seed(seed)
@@ -99,9 +102,11 @@ def generate_interpolation(
         print(error_msg)
         return None, error_msg
 # Create Gradio interface
 with gr.Blocks(title="CogVideoX Keyframe Interpolation") as demo:
-    gr.Markdown("""
     # 🎬 CogVideoX Keyframe Interpolation
     Generate smooth video transitions between two keyframe images using AI.
@@ -111,7 +116,8 @@ with gr.Blocks(title="CogVideoX Keyframe Interpolation") as demo:
     2. Upload start and end frame images
     3. Describe the motion/transition in the text prompt
     4. Adjust parameters and generate!
-    """)
     with gr.Row():
         with gr.Column():
@@ -119,7 +125,7 @@ with gr.Blocks(title="CogVideoX Keyframe Interpolation") as demo:
             model_path_input = gr.Textbox(
                 label="Model Path",
                 placeholder="e.g., /path/to/CogVideoX-5b-I2V-inter or feizhengcong/CogvideoX-Interpolation",
-                value="feizhengcong/CogvideoX-Interpolation"
             )
             load_btn = gr.Button("Load Model", variant="primary")
             model_status = gr.Textbox(label="Status", interactive=False)
@@ -129,23 +135,15 @@ with gr.Blocks(title="CogVideoX Keyframe Interpolation") as demo:
     with gr.Row():
         with gr.Column():
             gr.Markdown("### 🖼️ Input Keyframes")
-            first_image_input = gr.Image(
-                label="Start Frame",
-                type="pil",
-                height=300
-            )
-            last_image_input = gr.Image(
-                label="End Frame",
-                type="pil",
-                height=300
-            )
         with gr.Column():
             gr.Markdown("### ⚙️ Generation Settings")
             prompt_input = gr.Textbox(
                 label="Motion Description",
                 placeholder="Describe the motion/transition between the frames...",
-                lines=4
             )
             with gr.Row():
@@ -155,14 +153,10 @@ with gr.Blocks(title="CogVideoX Keyframe Interpolation") as demo:
                     maximum=49,
                     step=4,
                     value=49,
-                    info="Must be 4k+1 format (13, 17, 21, ..., 49)"
                 )
                 fps_slider = gr.Slider(
-                    label="FPS",
-                    minimum=4,
-                    maximum=16,
-                    step=2,
-                    value=8
                 )
             with gr.Row():
@@ -172,7 +166,7 @@ with gr.Blocks(title="CogVideoX Keyframe Interpolation") as demo:
                     maximum=100,
                     step=5,
                     value=50,
-                    info="More steps = better quality but slower"
                 )
                 guidance_slider = gr.Slider(
                     label="Guidance Scale",
@@ -180,14 +174,10 @@ with gr.Blocks(title="CogVideoX Keyframe Interpolation") as demo:
                     maximum=15.0,
                     step=0.5,
                     value=6.0,
-                    info="Higher = stronger prompt following"
                 )
-            seed_input = gr.Number(
-                label="Random Seed",
-                value=42,
-                precision=0
-            )
             generate_btn = gr.Button("🎬 Generate Video", variant="primary", size="lg")
@@ -204,22 +194,20 @@ with gr.Blocks(title="CogVideoX Keyframe Interpolation") as demo:
     gr.Markdown("### 💡 Example Prompts")
     gr.Examples(
         examples=[
-            ["A person walks forward slowly, their body moving naturally with each step."],
             ["The camera smoothly pans from left to right, revealing the scene."],
             ["A dancer gracefully transitions from one pose to another."],
             ["The sun sets gradually, changing the lighting and colors of the scene."],
             ["A car accelerates down the street, moving from standstill to motion."],
         ],
         inputs=prompt_input,
-        label="Click to use example prompts"
     )
     # Event handlers
-    load_btn.click(
-        fn=load_model,
-        inputs=[model_path_input],
-        outputs=[model_status]
-    )
     generate_btn.click(
         fn=generate_interpolation,
@@ -231,24 +219,22 @@ with gr.Blocks(title="CogVideoX Keyframe Interpolation") as demo:
             num_steps_slider,
             guidance_slider,
             fps_slider,
-            seed_input
         ],
-        outputs=[output_video, generation_status]
     )
 if __name__ == "__main__":
-    print("="*50)
     print("CogVideoX Keyframe Interpolation Gradio App")
-    print("="*50)
     print(f"Device: {device}")
     print(f"CUDA available: {torch.cuda.is_available()}")
     if torch.cuda.is_available():
         print(f"GPU: {torch.cuda.get_device_name(0)}")
-        print(f"GPU Memory: {torch.cuda.get_device_properties(0).total_memory / 1024**3:.2f} GB")
-    print("="*50)
-    demo.launch(
-        server_name="0.0.0.0",
-        server_port=7860,
-        share=False
-    )

+import os
+import tempfile
 import gradio as gr
 import torch
 from diffusers.utils import export_to_video
 from PIL import Image
+from cogvideox_interpolation.pipeline import CogVideoXInterpolationPipeline
 # Global variable to store the pipeline
 pipe = None
 device = "cuda" if torch.cuda.is_available() else "cpu"
 def load_model(model_path):
     """Load the CogVideoX-Interpolation model"""
     global pipe
     # Determine dtype based on model variant
     dtype = torch.bfloat16 if "5b" in model_path.lower() else torch.float16
+    pipe = CogVideoXInterpolationPipeline.from_pretrained(model_path, torch_dtype=dtype)
     # Memory optimization
     if device == "cuda":
     print("Model loaded successfully!")
     return "✓ Model loaded successfully!"
 def generate_interpolation(
     first_image,
     last_image,
     num_inference_steps=50,
     guidance_scale=6.0,
     fps=8,
+    seed=42,
 ):
     """Generate interpolated video between two keyframes"""
             last_image = Image.fromarray(last_image)
         print(f"Generating video with prompt: {prompt}")
+        print(
+            f"Parameters: frames={num_frames}, steps={num_inference_steps}, guidance={guidance_scale}"
+        )
         # Generate video
         generator = torch.Generator(device=device).manual_seed(seed)
         print(error_msg)
         return None, error_msg
 # Create Gradio interface
 with gr.Blocks(title="CogVideoX Keyframe Interpolation") as demo:
+    gr.Markdown(
+        """
     # 🎬 CogVideoX Keyframe Interpolation
     Generate smooth video transitions between two keyframe images using AI.
     2. Upload start and end frame images
     3. Describe the motion/transition in the text prompt
     4. Adjust parameters and generate!
+    """
+    )
     with gr.Row():
         with gr.Column():
             model_path_input = gr.Textbox(
                 label="Model Path",
                 placeholder="e.g., /path/to/CogVideoX-5b-I2V-inter or feizhengcong/CogvideoX-Interpolation",
+                value="feizhengcong/CogvideoX-Interpolation",
             )
             load_btn = gr.Button("Load Model", variant="primary")
             model_status = gr.Textbox(label="Status", interactive=False)
     with gr.Row():
         with gr.Column():
             gr.Markdown("### 🖼️ Input Keyframes")
+            first_image_input = gr.Image(label="Start Frame", type="pil", height=300)
+            last_image_input = gr.Image(label="End Frame", type="pil", height=300)
         with gr.Column():
             gr.Markdown("### ⚙️ Generation Settings")
             prompt_input = gr.Textbox(
                 label="Motion Description",
                 placeholder="Describe the motion/transition between the frames...",
+                lines=4,
             )
             with gr.Row():
                     maximum=49,
                     step=4,
                     value=49,
+                    info="Must be 4k+1 format (13, 17, 21, ..., 49)",
                 )
                 fps_slider = gr.Slider(
+                    label="FPS", minimum=4, maximum=16, step=2, value=8
                 )
             with gr.Row():
                     maximum=100,
                     step=5,
                     value=50,
+                    info="More steps = better quality but slower",
                 )
                 guidance_slider = gr.Slider(
                     label="Guidance Scale",
                     maximum=15.0,
                     step=0.5,
                     value=6.0,
+                    info="Higher = stronger prompt following",
                 )
+            seed_input = gr.Number(label="Random Seed", value=42, precision=0)
             generate_btn = gr.Button("🎬 Generate Video", variant="primary", size="lg")
     gr.Markdown("### 💡 Example Prompts")
     gr.Examples(
         examples=[
+            [
+                "A person walks forward slowly, their body moving naturally with each step."
+            ],
             ["The camera smoothly pans from left to right, revealing the scene."],
             ["A dancer gracefully transitions from one pose to another."],
             ["The sun sets gradually, changing the lighting and colors of the scene."],
             ["A car accelerates down the street, moving from standstill to motion."],
         ],
         inputs=prompt_input,
+        label="Click to use example prompts",
     )
     # Event handlers
+    load_btn.click(fn=load_model, inputs=[model_path_input], outputs=[model_status])
     generate_btn.click(
         fn=generate_interpolation,
             num_steps_slider,
             guidance_slider,
             fps_slider,
+            seed_input,
         ],
+        outputs=[output_video, generation_status],
     )
 if __name__ == "__main__":
+    print("=" * 50)
     print("CogVideoX Keyframe Interpolation Gradio App")
+    print("=" * 50)
     print(f"Device: {device}")
     print(f"CUDA available: {torch.cuda.is_available()}")
     if torch.cuda.is_available():
         print(f"GPU: {torch.cuda.get_device_name(0)}")
+        print(
+            f"GPU Memory: {torch.cuda.get_device_properties(0).total_memory / 1024**3:.2f} GB"
+        )
+    print("=" * 50)
+    demo.launch()

requirements.txt CHANGED Viewed

@@ -1,7 +1,6 @@
 diffusers==0.30.3
 transformers==4.44.2
 accelerate==0.34.0
-gradio>=4.0.0
 torch>=2.0.0
 torchvision
 Pillow

 diffusers==0.30.3
 transformers==4.44.2
 accelerate==0.34.0
 torch>=2.0.0
 torchvision
 Pillow