Spaces:

MoonMath-ai
/

Continue

Sleeping

App Files Files Community

Shalmoni commited on Sep 29

Commit

c6dce8c

verified ·

1 Parent(s): adbfb86

Update app.py

Browse files

Files changed (1) hide show

app.py +229 -160

app.py CHANGED Viewed

@@ -1,218 +1,286 @@
 import os
-import shutil
 import uuid
 from datetime import datetime
-import numpy as np
-from PIL import Image, ImageDraw, ImageFont
 import gradio as gr
-from moviepy.editor import (
-    ImageClip,
-    ColorClip,
-    TextClip,
-    CompositeVideoClip,
-    concatenate_videoclips,
-    VideoFileClip,
-)
-# ---------- Simple "video generator" stub ----------
-# Replace `generate_video_from_prompt` with your real model call.
-# It creates a short MP4 with a first frame (optionally from a previous video),
-# then overlays prompt text for a few seconds.
 OUT_DIR = "outputs"
-USED_DIR = os.path.join(OUT_DIR, "used")
 TMP_DIR = "tmp"
 os.makedirs(OUT_DIR, exist_ok=True)
-os.makedirs(USED_DIR, exist_ok=True)
 os.makedirs(TMP_DIR, exist_ok=True)
-FPS = 24
-W, H = 768, 432  # 16:9 HD-ish to keep files light
-DURATION = 3.0   # seconds per generated clip for demo
-def _solid_bg(color=(18, 18, 18)):
-    return ColorClip(size=(W, H), color=color, duration=DURATION)
-def _text_overlay(txt: str):
-    # Use TextClip if ImageMagick is available; otherwise fallback to PIL.
-    try:
-        return TextClip(
-            txt,
-            fontsize=48,
-            color="white",
-            font="Arial-Bold",
-            size=(W - 80, None),
-            method="caption",
-        ).set_position(("center", "center")).set_duration(DURATION)
-    except Exception:
-        # PIL fallback
-        img = Image.new("RGBA", (W, H), (0, 0, 0, 0))
-        draw = ImageDraw.Draw(img)
-        # Try to load a font; fallback to default if not available on HF
-        try:
-            font = ImageFont.truetype("DejaVuSans-Bold.ttf", 48)
-        except Exception:
-            font = ImageFont.load_default()
-        # simple multiline center
-        lines = []
-        words = txt.split()
-        line = ""
-        for w in words:
-            test = (line + " " + w).strip()
-            if draw.textlength(test, font=font) > (W - 80):
-                lines.append(line)
-                line = w
-            else:
-                line = test
-        lines.append(line)
-        total_h = sum(font.getbbox(l)[3] for l in lines) + (len(lines)-1)*8
-        y = (H - total_h)//2
-        for l in lines:
-            w_px = draw.textlength(l, font=font)
-            x = (W - w_px)//2
-            draw.text((x, y), l, fill=(255,255,255,255), font=font)
-            y += font.getbbox(l)[3] + 8
-        pil_path = os.path.join(TMP_DIR, f"txt_{uuid.uuid4().hex}.png")
-        img.save(pil_path)
-        return ImageClip(pil_path, duration=DURATION).set_position(("center","center"))
-def extract_last_frame_as_image(video_path: str) -> str:
-    """Save last frame of video to an image file and return its path."""
-    with VideoFileClip(video_path) as v:
-        frame = v.get_frame(v.duration - 1.0 / max(1, v.fps))
-    img = Image.fromarray(frame)
-    frame_path = os.path.join(TMP_DIR, f"seed_{uuid.uuid4().hex}.png")
-    img.save(frame_path)
-    return frame_path
-def generate_video_from_prompt(prompt: str, seed_frame_path: str | None) -> str:
     """
-    Make a short demo MP4 using:
-      - If seed_frame_path: start 0.5s with that still frame
-      - Then a solid background + prompt text
     """
-    # Clips to concatenate
-    clips = []
-    if seed_frame_path and os.path.exists(seed_frame_path):
-        seed = ImageClip(seed_frame_path, duration=0.5).set_fps(FPS)
-        clips.append(seed)
-    bg = _solid_bg().set_fps(FPS)
-    txt = _text_overlay(prompt)
-    comp = CompositeVideoClip([bg, txt]).set_duration(DURATION).set_fps(FPS)
-    clips.append(comp)
-    final = concatenate_videoclips(clips, method="compose")
-    out_name = f"gen_{datetime.utcnow().strftime('%Y%m%d_%H%M%S')}_{uuid.uuid4().hex[:8]}.mp4"
-    out_path = os.path.join(OUT_DIR, out_name)
-    final.write_videofile(out_path, fps=FPS, codec="libx264", audio=False, verbose=False, logger=None)
-    final.close()
     return out_path
-def concat_used_videos(video_paths: list[str]) -> str:
-    clips = [VideoFileClip(p) for p in video_paths]
-    final = concatenate_videoclips(clips, method="compose")
-    out_path = os.path.join(OUT_DIR, f"continuous_{datetime.utcnow().strftime('%Y%m%d_%H%M%S')}.mp4")
-    final.write_videofile(out_path, fps=FPS, codec="libx264", audio=False, verbose=False, logger=None)
-    for c in clips:
-        c.close()
     return out_path
-def zip_used_videos(video_paths: list[str]) -> str:
-    # Copy into a temp folder to zip cleanly
-    stamp = datetime.utcnow().strftime('%Y%m%d_%H%M%S')
-    pack_dir = os.path.join(TMP_DIR, f"used_{stamp}_{uuid.uuid4().hex[:6]}")
     os.makedirs(pack_dir, exist_ok=True)
-    for p in video_paths:
         shutil.copy(p, pack_dir)
     zip_base = os.path.join(OUT_DIR, f"used_{stamp}")
     shutil.make_archive(zip_base, "zip", pack_dir)
     shutil.rmtree(pack_dir, ignore_errors=True)
     return f"{zip_base}.zip"
-# ---------- Gradio App ----------
-with gr.Blocks(css=".grow {flex: 1}") as demo:
-    gr.Markdown("# Continuous Video Prompt → Use → Chain → Download")
-    # Session state
-    state_used_paths = gr.State([])         # list[str]
-    state_seed_frame = gr.State(None)       # str | None
-    state_current_path = gr.State(None)     # str | None
     with gr.Row():
         prompt = gr.Textbox(
             label="Prompt",
             placeholder="Describe your next shot…",
             lines=2,
-            autofocus=True,
         )
-    with gr.Row(equal_height=True):
-        video_out = gr.Video(label="Video Output", interactive=False).style(height=360)
     with gr.Row():
         btn_generate = gr.Button("Generate", variant="primary")
-        btn_use = gr.Button("Use (chain this)", variant="secondary")
-        btn_download = gr.Button("Download (A+B+C & ZIP)", variant="secondary")
         btn_reset = gr.Button("Reset Session", variant="stop")
-    files_out = gr.Files(label="Downloads (concatenated MP4 + ZIP of used clips)", height=100)
-    # ---- Handlers ----
-    def do_generate(prompt_text, seed_frame_path):
         if not prompt_text or not prompt_text.strip():
-            return None, None
-        out_path = generate_video_from_prompt(prompt_text.strip(), seed_frame_path)
-        return out_path, out_path  # gr.Video path AND state_current_path
     btn_generate.click(
-        do_generate,
-        inputs=[prompt, state_seed_frame],
-        outputs=[video_out, state_current_path],
     )
-    def do_use(current_path, used_paths):
-        """
-        Save current_path to used list, extract its last frame as the next seed.
-        """
         if not current_path or not os.path.exists(current_path):
-            # no-op if nothing to use
-            return used_paths, gr.update(interactive=True), None
-        # Append to used list
         new_used = list(used_paths)
         if current_path not in new_used:
             new_used.append(current_path)
-        # Extract last frame for next generation seed
-        next_seed = extract_last_frame_as_image(current_path)
-        return new_used, gr.update(interactive=True), next_seed
     btn_use.click(
-        do_use,
-        inputs=[state_current_path, state_used_paths],
-        outputs=[state_used_paths, prompt, state_seed_frame],
     )
-    def do_download(used_paths):
-        """
-        Build concatenated video (A+B+C) and a ZIP of used clips.
-        Returns list of two files for the Files component.
-        """
         if not used_paths:
             return []
-        concat_path = concat_used_videos(used_paths)
-        zip_path = zip_used_videos(used_paths)
-        return [concat_path, zip_path]
     btn_download.click(
-        do_download,
-        inputs=[state_used_paths],
         outputs=[files_out],
     )
-    def do_reset():
-        # Clear session state and temp
         try:
             for f in os.listdir(TMP_DIR):
                 fp = os.path.join(TMP_DIR, f)
@@ -220,13 +288,14 @@ with gr.Blocks(css=".grow {flex: 1}") as demo:
                     os.remove(fp)
         except Exception:
             pass
-        return None, [], None, None, gr.update(value=None), gr.update(value=[])
     btn_reset.click(
-        do_reset,
         inputs=None,
-        outputs=[state_seed_frame, state_used_paths, state_current_path, prompt, video_out, files_out],
     )
 if __name__ == "__main__":
     demo.launch()

 import os
+import io
+import json
 import uuid
+import time
+import shutil
+import mimetypes
+import requests
+import subprocess
 from datetime import datetime
+from typing import List, Optional
 import gradio as gr
+from PIL import Image
+# ================================
+# Config
+# ================================
+ENDPOINT_URL = "https://moonmath-ai-dev--moonmath-i2v-backend-moonmathinference-run.modal.run"  # your backend
 OUT_DIR = "outputs"
 TMP_DIR = "tmp"
 os.makedirs(OUT_DIR, exist_ok=True)
 os.makedirs(TMP_DIR, exist_ok=True)
+# If ffmpeg is not on PATH for any reason, set absolute path here
+FFMPEG_BIN = "ffmpeg"
+# ================================
+# Helpers
+# ================================
+def _ts() -> str:
+    return datetime.utcnow().strftime("%Y%m%d_%H%M%S")
+def _safe_filename(prefix: str, ext: str) -> str:
+    return f"{prefix}_{_ts()}_{uuid.uuid4().hex[:8]}.{ext}"
+def _run_ffmpeg(args: List[str]) -> None:
+    """Run ffmpeg with given args; raise on failure with readable message."""
+    cmd = [FFMPEG_BIN] + args
+    proc = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
+    if proc.returncode != 0:
+        raise RuntimeError(
+            f"ffmpeg failed ({proc.returncode}).\nSTDOUT:\n{proc.stdout.decode(errors='ignore')}\n\nSTDERR:\n{proc.stderr.decode(errors='ignore')}"
+        )
+def extract_last_frame(video_path: str) -> str:
     """
+    Extract the very last frame as PNG using ffmpeg.
+    Uses -sseof -1 to seek to the last second.
     """
+    out_path = os.path.join(TMP_DIR, _safe_filename("lastframe", "png"))
+    # Seek to last second and output a single frame
+    _run_ffmpeg([
+        "-sseof", "-1",
+        "-i", video_path,
+        "-update", "1",
+        "-frames:v", "1",
+        "-q:v", "2",
+        out_path
+    ])
     return out_path
+def concat_videos_ffmpeg(video_paths: List[str]) -> str:
+    """
+    Concatenate MP4s using ffmpeg concat demuxer.
+    """
+    if len(video_paths) == 1:
+        # copy the single file to a new name to keep UX consistent
+        dst = os.path.join(OUT_DIR, _safe_filename("continuous", "mp4"))
+        shutil.copy(video_paths[0], dst)
+        return dst
+    list_file = os.path.join(TMP_DIR, f"concat_{uuid.uuid4().hex}.txt")
+    with open(list_file, "w") as f:
+        for p in video_paths:
+            # paths must be quoted if they may contain spaces
+            f.write(f"file '{os.path.abspath(p)}'\n")
+    out_path = os.path.join(OUT_DIR, _safe_filename("continuous", "mp4"))
+    _run_ffmpeg([
+        "-f", "concat",
+        "-safe", "0",
+        "-i", list_file,
+        "-c", "copy",
+        out_path
+    ])
+    try:
+        os.remove(list_file)
+    except Exception:
+        pass
     return out_path
+def zip_files(file_paths: List[str]) -> str:
+    base = os.path.join(OUT_DIR, f"used_{_ts()}")
+    shutil.make_archive(base, "zip", root_dir=os.path.dirname(file_paths[0]) if file_paths else ".", base_dir=".")
+    # The above zips the entire directory — better: copy into temp pack dir first
+    # For precision, we’ll do that instead:
+    stamp = _ts()
+    pack_dir = os.path.join(TMP_DIR, f"pack_{stamp}_{uuid.uuid4().hex[:6]}")
     os.makedirs(pack_dir, exist_ok=True)
+    for p in file_paths:
         shutil.copy(p, pack_dir)
     zip_base = os.path.join(OUT_DIR, f"used_{stamp}")
     shutil.make_archive(zip_base, "zip", pack_dir)
     shutil.rmtree(pack_dir, ignore_errors=True)
     return f"{zip_base}.zip"
+def _guess_filename_from_response(resp: requests.Response, default_ext: str = "mp4") -> str:
+    # Try Content-Disposition
+    cd = resp.headers.get("Content-Disposition", "")
+    if "filename=" in cd:
+        name = cd.split("filename=")[-1].strip('"; ')
+        if name:
+            return name
+    # Otherwise, attempt from content-type
+    ctype = resp.headers.get("Content-Type", "")
+    ext = mimetypes.guess_extension(ctype) or f".{default_ext}"
+    return _safe_filename("gen", ext.lstrip("."))
+def save_bytes_to_file(content: bytes, ext: str = "mp4") -> str:
+    path = os.path.join(OUT_DIR, _safe_filename("gen", ext))
+    with open(path, "wb") as f:
+        f.write(content)
+    return path
+# ================================
+# Backend call
+# ================================
+def call_generator(prompt: str, seed_frame_path: Optional[str]) -> str:
+    """
+    Calls your Modal endpoint. Supports two response modes:
+      1) Direct video bytes (Content-Type like video/mp4)
+      2) JSON with {"video_url": "..."} which we then download.
+    We send:
+      - form field: prompt
+      - optional file: seed_frame (PNG/JPG)
+    """
+    files = {}
+    data = {"prompt": prompt}
+    if seed_frame_path and os.path.exists(seed_frame_path):
+        files["seed_frame"] = (os.path.basename(seed_frame_path), open(seed_frame_path, "rb"), "image/png")
+    # Make the request
+    resp = requests.post(ENDPOINT_URL, data=data, files=files, timeout=600)
+    if files:
+        # close file handles
+        for _, f in files.items():
+            # f is a tuple (name, fileobj, mimetype)
+            try:
+                f[1].close()
+            except Exception:
+                pass
+    if resp.status_code != 200:
+        raise RuntimeError(f"Generator returned {resp.status_code}: {resp.text[:500]}")
+    ctype = resp.headers.get("Content-Type", "")
+    if ctype.startswith("video/"):
+        # Direct bytes
+        ext = mimetypes.guess_extension(ctype) or ".mp4"
+        out_path = os.path.join(OUT_DIR, _safe_filename("gen", ext.lstrip(".")))
+        with open(out_path, "wb") as f:
+            f.write(resp.content)
+        return out_path
+    # Assume JSON with URL
+    try:
+        payload = resp.json()
+    except Exception:
+        # fallback: treat body as raw mp4
+        return save_bytes_to_file(resp.content, "mp4")
+    video_url = payload.get("video_url")
+    if not video_url:
+        # Maybe it returned base64? If so, add handling here if needed.
+        raise RuntimeError(f"Unexpected response: {json.dumps(payload)[:500]}")
+    # Download the video
+    r2 = requests.get(video_url, stream=True, timeout=600)
+    if r2.status_code != 200:
+        raise RuntimeError(f"Failed to fetch video from URL: {r2.status_code}")
+    ext = mimetypes.guess_extension(r2.headers.get("Content-Type", "")) or ".mp4"
+    out_path = os.path.join(OUT_DIR, _safe_filename("gen", ext.lstrip(".")))
+    with open(out_path, "wb") as f:
+        for chunk in r2.iter_content(chunk_size=1024 * 1024):
+            if chunk:
+                f.write(chunk)
+    return out_path
+# ================================
+# Gradio UI
+# ================================
+with gr.Blocks() as demo:
+    gr.Markdown("## Continuous Video (Prompt → Use → Chain → Download)")
+    state_used = gr.State([])         # list[str] of used clip paths
+    state_seed = gr.State(None)       # path to last-frame image
+    state_current = gr.State(None)    # most recent generated video path
     with gr.Row():
         prompt = gr.Textbox(
             label="Prompt",
             placeholder="Describe your next shot…",
             lines=2,
+            autofocus=True
         )
+    with gr.Row():
+        video_out = gr.Video(label="Video Output", interactive=False)
     with gr.Row():
         btn_generate = gr.Button("Generate", variant="primary")
+        btn_use = gr.Button("Use (chain this)")
+        btn_download = gr.Button("Download (A+B+C & ZIP)")
         btn_reset = gr.Button("Reset Session", variant="stop")
+    files_out = gr.Files(label="Downloads", height=100)
+    # ---------- Handlers ----------
+    def on_generate(prompt_text, seed_frame):
         if not prompt_text or not prompt_text.strip():
+            return gr.update(value=None), None
+        try:
+            vid_path = call_generator(prompt_text.strip(), seed_frame)
+        except Exception as e:
+            # Surface the error in the UI
+            err_mp4 = os.path.join(OUT_DIR, _safe_filename("error", "txt"))
+            with open(err_mp4, "w") as f:
+                f.write(str(e))
+            return gr.update(value=None), None
+        return vid_path, vid_path
     btn_generate.click(
+        on_generate,
+        inputs=[prompt, state_seed],
+        outputs=[video_out, state_current],
     )
+    def on_use(current_path, used_paths):
         if not current_path or not os.path.exists(current_path):
+            return used_paths, None
         new_used = list(used_paths)
         if current_path not in new_used:
             new_used.append(current_path)
+        # Extract last frame -> seed for next gen
+        try:
+            seed_img = extract_last_frame(current_path)
+        except Exception as e:
+            # If extraction fails, keep chaining logic but without seed
+            seed_img = None
+        return new_used, seed_img
     btn_use.click(
+        on_use,
+        inputs=[state_current, state_used],
+        outputs=[state_used, state_seed],
     )
+    def on_download(used_paths):
         if not used_paths:
             return []
+        try:
+            concat_path = concat_videos_ffmpeg(used_paths)
+        except Exception as e:
+            # If concat fails, skip it but still offer the ZIP
+            concat_path = None
+        zip_path = zip_files(used_paths)
+        files = [zip_path]
+        if concat_path:
+            files.insert(0, concat_path)
+        return files
     btn_download.click(
+        on_download,
+        inputs=[state_used],
         outputs=[files_out],
     )
+    def on_reset():
+        # Clear temp files and state
         try:
             for f in os.listdir(TMP_DIR):
                 fp = os.path.join(TMP_DIR, f)
                     os.remove(fp)
         except Exception:
             pass
+        return None, [], None, gr.update(value=None), gr.update(value=None), gr.update(value=[])
     btn_reset.click(
+        on_reset,
         inputs=None,
+        outputs=[state_seed, state_used, state_current, prompt, video_out, files_out],
     )
 if __name__ == "__main__":
     demo.launch()