Bifrost / app.py
JS6969's picture
Update app.py
f589249 verified
# Bifröst · Video → Frames Extractor
# ────────────────────────────────────────────────────────
# Standard imports
# ────────────────────────────────────────────────────────
import os, re, json, math, time, zipfile, tempfile, subprocess, base64
from pathlib import Path
from typing import List, Optional
import gradio as gr
_num = re.compile(r'(\d+)')
def _natural_key(p: Path | str):
s = str(p)
return [int(t) if t.isdigit() else t.lower() for t in _num.split(s)]
def sample_paths(paths: List[Path] | List[str], n: int = 30) -> List[str]:
    """Pick up to ``n`` evenly spaced entries from ``paths`` in natural order.

    The input is sorted with ``_natural_key`` first. When at least two
    samples are requested the first and last entries are always included.

    Args:
        paths: Paths (or path strings) to sample from.
        n: Maximum number of entries to return; clamped to ``1..len(paths)``.

    Returns:
        The selected paths as strings, in natural sort order. An empty input
        yields an empty list.
    """
    if not paths:
        return []
    ordered = sorted(paths, key=_natural_key)
    total = len(ordered)
    n = max(1, min(n, total))
    if n == total:
        return [str(p) for p in ordered]
    if n == 1:
        # A single sample has no spacing to compute; the general formula
        # below would divide by zero (n - 1 == 0).
        return [str(ordered[0])]
    step = (total - 1) / (n - 1)
    picked: List[str] = []
    seen = set()
    for i in range(n):
        idx = round(i * step)
        # Rounding can map two sample slots onto the same index.
        if idx not in seen:
            seen.add(idx)
            picked.append(str(ordered[idx]))
    return picked
# ────────────────────────────────────────────────────────
# Logo
# ────────────────────────────────────────────────────────
# Directory the logo is looked up in: the process working directory at import.
APP_DIR = os.getcwd()


def load_logo_base64(path: str) -> str:
    """Return the contents of the file at ``path`` encoded as base64 text.

    Args:
        path: File to read (opened in binary mode).

    Returns:
        The base64 encoding of the file's bytes as a ``str``.

    Raises:
        OSError: If the file cannot be opened or read.
    """
    with open(path, "rb") as f:
        return base64.b64encode(f.read()).decode("utf-8")


try:
    LOGO_B64 = load_logo_base64(os.path.join(APP_DIR, "bifrost_logo.png"))
except OSError:
    # The logo is only decoration; a missing or unreadable file must not
    # prevent the module from importing.
    LOGO_B64 = ""
def render_logo_html(px: int = 96) -> str:
    """Return the HTML header block: logo image, title, tagline and a rule.

    Args:
        px: Height of the logo image in CSS pixels.

    Returns:
        An HTML fragment. The ``<img>`` tag embeds ``LOGO_B64`` as a PNG data
        URI and is left out when ``LOGO_B64`` is empty, since an empty data
        URI would render as a broken image.
    """
    logo_tag = (
        f'<img src="data:image/png;base64,{LOGO_B64}" style="height:{px}px;width:auto;" />\n'
        if LOGO_B64
        else ""
    )
    return f"""
<div style="display:flex;align-items:center;gap:16px;">
{logo_tag}<div>
<div style="font-size:1.6rem;font-weight:800;">Bifröst · Video-to-Image Extractor</div>
<div style="opacity:0.8;">The Rainbow Bridge to Frames — split video into images with precision</div>
</div>
</div>
<hr>
"""
# ────────────────────────────────────────────────────────
# System checks
# ────────────────────────────────────────────────────────
def _which(name: str) -> Optional[str]:
    """Look up the executable ``name`` via ``shutil.which``.

    Returns:
        Whatever ``shutil.which`` returns: the path to the executable, or
        ``None`` when it is not found.
    """
    import shutil

    return shutil.which(name)
# Resolved paths of the two external tools, or None when not found.
FFMPEG = _which("ffmpeg")
FFPROBE = _which("ffprobe")

# Setup hint for the UI; empty when both tools were found.
MISSING_MSG = (
    ""
    if FFMPEG and FFPROBE
    else (
        "⚠️ FFmpeg not found. Add a 'packages.txt' with exactly:\n"
        "ffmpeg\n"
        "libsm6\n"
        "libxext6\n"
        "Then restart the Space."
    )
)
# ────────────────────────────────────────────────────────
# Helpers
# ────────────────────────────────────────────────────────
def sanitize_prefix(txt: str) -> str:
    """Turn free-form text into a filename-safe prefix.

    Surrounding whitespace is removed, every run of characters other than
    ASCII letters, digits, ``.``, ``_`` and ``-`` collapses into a single
    ``_``, and the result is cut to at most 80 characters.

    Args:
        txt: User-supplied text; ``None`` or empty is allowed.

    Returns:
        The cleaned prefix, or ``""`` when nothing remains after stripping.
    """
    stripped = txt.strip() if txt else ""
    # An empty string passes through re.sub and slicing unchanged.
    safe = re.sub(r"[^A-Za-z0-9._-]+", "_", stripped)
    return safe[:80]
def ffprobe_json(input_path: str) -> dict:
    """Run ffprobe on ``input_path`` and return its JSON report.

    Args:
        input_path: Path of the media file to inspect.

    Returns:
        The parsed ``-show_streams -show_format`` report as a dict, or ``{}``
        when ffprobe is unavailable, cannot be started, exits non-zero, or
        prints something that is not a JSON object.
    """
    if not FFPROBE:
        return {}
    cmd = [FFPROBE, "-v", "error", "-print_format", "json", "-show_streams", "-show_format", input_path]
    try:
        # Decode explicitly as UTF-8 and replace undecodable bytes, so the
        # result does not depend on the locale and stray bytes in the report
        # cannot raise UnicodeDecodeError.
        res = subprocess.run(cmd, capture_output=True, text=True, encoding="utf-8", errors="replace")
    except OSError:
        # The binary could not be launched; treat it like any other failure.
        return {}
    if res.returncode != 0:
        return {}
    try:
        meta = json.loads(res.stdout)
    except ValueError:  # json.JSONDecodeError is a ValueError
        return {}
    return meta if isinstance(meta, dict) else {}
def _parse_frame_rate(value) -> Optional[float]:
    """Convert a rate such as ``"30000/1001"`` or ``"25"`` to frames/second.

    Returns ``None`` when the value is missing, malformed, has a zero
    denominator, or does not describe a positive finite rate.
    """
    if not value:
        return None
    num_txt, _, den_txt = str(value).partition("/")
    try:
        num = float(num_txt)
        den = float(den_txt) if den_txt else 1.0
    except ValueError:
        return None
    if den == 0:
        return None
    fps = num / den
    # The chained comparison is False for NaN, so NaN is rejected too.
    return fps if 0 < fps < float("inf") else None


def parse_video_info(meta: dict) -> dict:
    """Extract duration, frame rate and frame size from an ffprobe report.

    Args:
        meta: Parsed ffprobe JSON with ``format`` and ``streams`` entries;
            may be empty.

    Returns:
        A dict with keys ``duration`` (seconds), ``fps``, ``width`` and
        ``height``. Any value that cannot be determined is ``None``. Stream
        values come from the first stream whose ``codec_type`` is ``"video"``.
    """
    info = {"duration": None, "fps": None, "width": None, "height": None}
    if not meta:
        return info

    try:
        info["duration"] = float((meta.get("format") or {}).get("duration"))
    except (TypeError, ValueError, AttributeError):
        # Missing, non-numeric, or an unexpected "format" shape.
        pass

    streams = meta.get("streams") or []
    video_streams = [s for s in streams if s.get("codec_type") == "video"]
    if video_streams:
        v = video_streams[0]
        # Try r_frame_rate first, but fall through to avg_frame_rate when it
        # is present yet unusable (e.g. "0/0") instead of giving up.
        for field in ("r_frame_rate", "avg_frame_rate"):
            fps = _parse_frame_rate(v.get(field))
            if fps is not None:
                info["fps"] = fps
                break
        info["width"] = v.get("width")
        info["height"] = v.get("height")
    return info
def estimate_output_count(mode: str, duration: float | None, in_fps: float | None,
every_seconds: float, nth_frame: int, exact_fps: float) -> Optional[int]:
if not duration:
return None
in_fps = in_fps or 30.0
try:
if mode == "All frames":
return int(math.ceil(duration * in_fps))
if mode == "Every N seconds" and every_seconds > 0:
return int(math.ceil(duration / every_seconds))
if mode == "Every Nth frame" and nth_frame > 0:
return int(math.ceil((duration * in_fps) / nth_frame))
if mode == "Exact FPS" and exact_fps > 0:
return int(math.ceil(duration * exact_fps))
except Exception:
return None
return None
def build_ffmpeg_extract(
    input_path: str,
    mode: str,
    every_seconds: float,
    nth_frame: int,
    exact_fps: float,
    start_time: str,
    end_time: str,
    long_side: int,
    out_format: str,
    jpg_quality: int,
    png_level: int,
    scene_detect: bool,
    scene_thresh: float,
    out_pattern: str,
) -> List[str]:
    """Build the ffmpeg argument list that writes frames to ``out_pattern``.

    Args:
        input_path: Video file to read.
        mode: "Every N seconds", "Every Nth frame", "Exact FPS" or
            "All frames"; any other value samples one frame per second.
        every_seconds: Interval for "Every N seconds" (falsy means 1).
        nth_frame: Stride for "Every Nth frame" (falsy means 1, minimum 1).
        exact_fps: Rate for "Exact FPS" (falsy means 1).
        start_time: Start position passed to ``-ss``; empty to disable.
        end_time: End position passed to ``-to``; empty to disable.
        long_side: Target size in pixels of the longer edge; 0/None to keep
            the source size.
        out_format: "jpg" or "png"; selects which quality option is added.
        jpg_quality: Value for ``-q:v`` when writing jpg.
        png_level: Value for ``-compression_level`` when writing png.
        scene_detect: Additionally keep only frames whose scene score exceeds
            ``scene_thresh``.
        scene_thresh: Scene score threshold.
        out_pattern: Output filename pattern (last argument).

    Returns:
        The command as a list of strings, starting with the ffmpeg path.

    Raises:
        RuntimeError: If ffmpeg was not found.
    """
    if not FFMPEG:
        raise RuntimeError("FFmpeg not available")

    cmd = [FFMPEG, "-y"]
    # Both trim options go before -i so they are input options: ffmpeg then
    # reads -to as an absolute position in the input. Placed after -i while
    # -ss is before it, -to would be measured from the seek point and act as
    # a duration, overshooting the requested end time.
    if start_time:
        cmd += ["-ss", start_time]
    if end_time:
        cmd += ["-to", end_time]
    cmd += ["-i", input_path]

    vf = []
    if mode == "Every N seconds":
        vf.append(f"fps={max(1e-6, 1.0/float(every_seconds or 1))}")
    elif mode == "Every Nth frame":
        vf.append(f"select='not(mod(n,{max(1, int(nth_frame or 1))}))'")
        # Re-stamp the kept frames so they are contiguous in time.
        vf.append("setpts=N/FRAME_RATE/TB")
    elif mode == "Exact FPS":
        vf.append(f"fps={max(1e-6, float(exact_fps or 1))}")
    elif mode != "All frames":
        # Unknown mode: fall back to one frame per second.
        vf.append("fps=1")

    if scene_detect:
        vf.append(f"select='gt(scene,{float(scene_thresh)})',showinfo")
        vf.append("setpts=N/FRAME_RATE/TB")

    if long_side and long_side > 0:
        # Pin the longer edge to long_side; -1 lets ffmpeg derive the other.
        vf.append("scale='if(gt(iw,ih),%d,-1)':'if(gt(iw,ih),-1,%d)':force_original_aspect_ratio=decrease" % (long_side, long_side))

    if vf:
        cmd += ["-vf", ",".join(vf)]

    if out_format == "jpg":
        cmd += ["-q:v", str(jpg_quality)]
    elif out_format == "png":
        cmd += ["-compression_level", str(png_level)]

    cmd += ["-frame_pts", "1", out_pattern]
    return cmd
def render_progress(pct: float, label: str = "") -> str:
    """Return the HTML for a progress bar with a caption underneath.

    Args:
        pct: Progress in percent; clamped to the range 0..100.
        label: Text shown in the caption before the percentage.

    Returns:
        An HTML fragment: an outlined track, a fill whose width is the
        clamped percentage, and a caption reading ``"<label> <pct>%"``.
    """
    capped = min(100.0, pct)
    shown = max(0.0, capped)
    track = '<div style="width:100%;border:1px solid #ddd;border-radius:8px;overflow:hidden;height:18px;">'
    fill = f'<div style="height:100%;width:{shown:.1f}%;background:#3b82f6;"></div></div>'
    caption = f'<div style="font-size:12px;opacity:.8;margin-top:4px;">{label} {shown:.1f}%</div>'
    return "\n".join((track, fill, caption))
# ────────────────────────────────────────────────────────
# Extraction (Step 1)
# ────────────────────────────────────────────────────────
def step1_extract(
    video: gr.File | None,
    mode: str,
    every_seconds: float,
    nth_frame: int,
    exact_fps: float,
    start_time: str,
    end_time: str,
    long_side: int,
    out_format: str,
    jpg_quality: int,
    png_level: int,
    scene_detect: bool,
    scene_thresh: float,
    prefix_in: str,
    prog_html: str,
    preview_all: bool,  # ✅ toggle
):
    """Extract frames from the uploaded video, streaming progress updates.

    This is a generator. Every yield is an 8-tuple::

        (gallery paths, zip path, status text, ffmpeg command preview,
         progress HTML, all frame paths, frames directory, filename prefix)

    Intermediate yields carry a sampled preview (up to 36 frames) and the
    current percentage; the last yield carries either the final result or the
    failure message together with the tail of ffmpeg's log.

    Args:
        video: The uploaded file: an object exposing ``.name`` or a plain
            path string; ``None`` when nothing was uploaded.
        mode, every_seconds, nth_frame, exact_fps, start_time, end_time,
        long_side, out_format, jpg_quality, png_level, scene_detect,
        scene_thresh: Forwarded to ``build_ffmpeg_extract``.
        prefix_in: Optional filename prefix; defaults to the video's stem.
        prog_html: Current progress HTML, echoed back when nothing is run.
        preview_all: Show every frame in the final gallery instead of at most
            100 sampled ones.
    """
    # The upload component is declared with type="filepath", so accept a bare
    # path string as well as an object that exposes the path as ``.name``.
    video_path = getattr(video, "name", None) or (video if isinstance(video, str) else None)
    if not video_path:
        yield None, None, "Upload a video.", "", prog_html, None, None, None
        return
    if not FFMPEG or not FFPROBE:
        yield None, None, "FFmpeg missing. See note below.", MISSING_MSG, prog_html, None, None, None
        return

    work = Path(tempfile.mkdtemp(prefix="vid2img_"))
    raw_dir = work / "frames_raw"
    raw_dir.mkdir(parents=True, exist_ok=True)
    prefix = sanitize_prefix(prefix_in) or Path(video_path).stem

    vinfo = parse_video_info(ffprobe_json(video_path))
    total_duration = float(vinfo.get("duration") or 0.0)

    def _parse_ts(ts: str) -> float:
        """Convert ``[[HH:]MM:]SS[.mmm]`` to seconds; 0.0 if empty or malformed."""
        parts = ts.split(":") if ts else []
        if not 1 <= len(parts) <= 3:
            return 0.0
        try:
            secs = 0.0
            for part in parts:
                secs = secs * 60 + float(part)
        except ValueError:
            # Only the progress estimate uses this value; the raw text is
            # still passed to ffmpeg, which reports its own error.
            return 0.0
        return secs

    def _list_frames() -> list:
        """Return the frame files written so far, in natural order."""
        return sorted(raw_dir.glob(f"{prefix}_*.{out_format}"), key=_natural_key)

    start_txt = (start_time or "").strip()
    end_txt = (end_time or "").strip()
    st_s = _parse_ts(start_txt)
    et_s = _parse_ts(end_txt)

    pattern = str(raw_dir / f"{prefix}_%05d.{out_format}")
    cmd = build_ffmpeg_extract(
        input_path=video_path,
        mode=mode,
        every_seconds=every_seconds,
        nth_frame=nth_frame,
        exact_fps=exact_fps,
        start_time=start_txt,
        end_time=end_txt,
        long_side=long_side,
        out_format=out_format,
        jpg_quality=jpg_quality,
        png_level=png_level,
        scene_detect=scene_detect,
        scene_thresh=scene_thresh,
        out_pattern=pattern,
    )

    # Length of the span ffmpeg will process, used as the progress
    # denominator. ffmpeg reads -to as an absolute input position when it
    # precedes -i, and as a cap measured from the seek point when it follows
    # -i after an input-side -ss; mirror whichever form the command uses.
    end_is_absolute = "-to" in cmd and cmd.index("-to") < cmd.index("-i")
    window = total_duration
    if window and st_s > 0:
        window = max(0.0, window - st_s)
    if window and 0 < et_s < total_duration:
        span = et_s - st_s if end_is_absolute else et_s
        window = max(0.0, min(window, span))

    # Ask ffmpeg to print machine-readable key=value progress on stderr.
    cmd = [cmd[0], "-progress", "pipe:2"] + cmd[1:]
    cmd_preview = " ".join([s if " " not in s else f'"{s}"' for s in cmd])

    # Last lines of ffmpeg's log. The read loop consumes stderr, so anything
    # to show on failure has to be collected while reading.
    log_tail: List[str] = []
    last_pct = -1.0  # below 0 so that the first update is always emitted

    with subprocess.Popen(
        cmd,
        stderr=subprocess.PIPE,
        stdout=subprocess.DEVNULL,
        text=True,
        encoding="utf-8",
        errors="replace",  # log lines may contain arbitrary bytes
        bufsize=1,
    ) as proc:
        try:
            for raw_line in proc.stderr:
                line = raw_line.strip()
                if not line:
                    continue
                key, sep, value = line.partition("=")
                if not (sep and key.replace("_", "").isalnum()):
                    # Not a bare key=value line: keep it as log output.
                    log_tail.append(line)
                    del log_tail[:-40]
                    continue
                if key != "out_time" or window <= 0:
                    continue
                try:
                    hh, mm, ss = value.split(":")
                    secs = float(hh) * 3600 + float(mm) * 60 + float(ss)
                except ValueError:
                    continue  # unparseable timestamp; wait for the next one
                pct = max(0.0, min(100.0, (secs / window) * 100.0))
                # Update on each whole-percent step and once on reaching 100%,
                # rather than re-listing the directory on every line.
                if pct - last_pct >= 1.0 or (pct == 100.0 and last_pct < 100.0):
                    last_pct = pct
                    yield (
                        sample_paths(_list_frames(), 36),
                        None,
                        "Extracting…",
                        cmd_preview,
                        render_progress(pct, f"Extracting {pct:.0f}%"),
                        None,
                        str(raw_dir),
                        prefix,
                    )
            ret = proc.wait()
        finally:
            # Reached with ffmpeg still running when the generator is closed
            # early or an error occurs; do not leave the process behind.
            if proc.poll() is None:
                proc.kill()

    frames = _list_frames()
    all_paths = [str(p) for p in frames]
    if preview_all or len(frames) <= 100:
        gallery = all_paths
    else:
        gallery = sample_paths(frames, 100)

    if ret != 0 or not frames:
        err = "\n".join(log_tail)
        yield gallery, None, f"Extraction failed.\n\n{err}", cmd_preview, render_progress(0.0, "Failed"), None, str(raw_dir), prefix
        return

    # ZIP name based on original video / custom prefix
    zip_path = work / f"{prefix}_frames.zip"
    with zipfile.ZipFile(zip_path, "w", zipfile.ZIP_DEFLATED) as zf:
        for p in frames:
            zf.write(p, p.name)

    details = f"Frames extracted: {len(frames)} | Saved to: {raw_dir}"
    yield gallery, str(zip_path), details, cmd_preview, render_progress(100.0, f"Extracted {len(frames)} frames"), all_paths, str(raw_dir), prefix
# ────────────────────────────────────────────────────────
# UI
# ────────────────────────────────────────────────────────
def build_ui():
    """Assemble the Gradio interface and wire up its events.

    Returns:
        The ``gr.Blocks`` app: upload and settings controls, the extract
        button, progress/gallery/download outputs and the live estimate.
    """
    with gr.Blocks(theme=gr.themes.Soft()) as demo:
        gr.HTML(render_logo_html(88))
        gr.Markdown("Extract frames from a video with live progress.")

        with gr.Row():
            video = gr.File(label="Upload video", file_types=[".mp4", ".mov", ".mkv", ".avi", ".webm", ".m4v"], type="filepath")
            preview_all = gr.Checkbox(value=False, label="Preview all frames (may be slow)")

        with gr.Accordion("Extraction Settings", open=True):
            with gr.Row():
                mode = gr.Dropdown(["Every N seconds", "Every Nth frame", "Exact FPS", "All frames"], value="Every N seconds", label="Mode")
                every_seconds = gr.Number(value=1.0, label="Every N seconds")
                nth_frame = gr.Number(value=30, label="Every Nth frame")
                exact_fps = gr.Number(value=1.0, label="Exact FPS")
            with gr.Row():
                start_time = gr.Textbox(value="", label="Start (HH:MM:SS.mmm)")
                end_time = gr.Textbox(value="", label="End (HH:MM:SS.mmm)")
                long_side = gr.Number(value=0, label="Resize long side px (0 = none)")
            with gr.Row():
                out_format = gr.Dropdown(["jpg", "png"], value="jpg", label="Output format")
                jpg_quality = gr.Slider(2, 31, value=3, step=1, label="JPG quality (2=best)")
                png_level = gr.Slider(0, 9, value=2, step=1, label="PNG compression level")
            with gr.Row():
                scene_detect = gr.Checkbox(False, label="Scene-change detect")
                scene_thresh = gr.Slider(0.0, 1.0, value=0.3, step=0.01, label="Scene threshold")
            prefix_vid = gr.Textbox(value="", label="Filename prefix (defaults to input video name)")

        btn_extract = gr.Button("Extract Frames", variant="primary")
        prog = gr.HTML(render_progress(0.0, "Idle"))
        gallery = gr.Gallery(label="Preview (≤100 or all if toggled)", columns=6, height=480)
        zip_out = gr.File(label="Download frames ZIP")
        details = gr.Markdown("Ready.")
        with gr.Accordion("Show FFmpeg command", open=False):
            cmd_preview = gr.Textbox(label="ffmpeg command", lines=4)
        estimate_md = gr.Markdown("Estimated output: —")

        # step1_extract yields eight values; the last three (all frame paths,
        # frames directory, prefix) have no visible widget, so give them
        # invisible State slots to keep outputs and yielded values in step.
        frames_state = gr.State()
        raw_dir_state = gr.State()
        prefix_state = gr.State()

        def _toggle_params(mode_val, fmt):
            """Show only the inputs relevant to the chosen mode and format."""
            return (
                gr.update(visible=(mode_val == "Every N seconds")),
                gr.update(visible=(mode_val == "Every Nth frame")),
                gr.update(visible=(mode_val == "Exact FPS")),
                gr.update(visible=(fmt == "jpg")),
                gr.update(visible=(fmt == "png")),
            )

        def update_estimate(vfile, mode_val, evs, nth, exfps, st, et):
            """Return the "Estimated output" markdown for the current settings."""
            # The upload may arrive as a bare path string or as an object
            # exposing the path as ``.name``.
            path = getattr(vfile, "name", None) or (vfile if isinstance(vfile, str) else None)
            if not path:
                return "Estimated output: —"
            info = parse_video_info(ffprobe_json(path))
            total = info.get("duration")
            dur = total

            def parse_ts(ts: str) -> float:
                """Convert ``[[HH:]MM:]SS[.mmm]`` to seconds; 0.0 if unusable."""
                parts = ts.split(":") if ts else []
                if not 1 <= len(parts) <= 3:
                    return 0.0
                try:
                    secs = 0.0
                    for part in parts:
                        secs = secs * 60 + float(part)
                except ValueError:
                    return 0.0
                return secs

            st_s = parse_ts((st or "").strip())
            et_s = parse_ts((et or "").strip())
            if dur:
                if st_s:
                    dur = max(0.0, dur - st_s)
                if 0 < et_s < total:
                    dur = min(dur, et_s)
            est = estimate_output_count(mode_val, dur, info.get("fps"), evs or 1.0, int(nth or 1), exfps or 1.0)
            return f"Estimated output: **~{est} frames**" if est else "Estimated output: —"

        toggle_inputs = [mode, out_format]
        toggle_outputs = [every_seconds, nth_frame, exact_fps, jpg_quality, png_level]
        mode.change(_toggle_params, toggle_inputs, toggle_outputs)
        out_format.change(_toggle_params, toggle_inputs, toggle_outputs)
        demo.load(_toggle_params, toggle_inputs, toggle_outputs)

        # Recompute the estimate whenever any input that affects it changes.
        for ctrl in [video, mode, every_seconds, nth_frame, exact_fps, start_time, end_time]:
            ctrl.change(update_estimate, inputs=[video, mode, every_seconds, nth_frame, exact_fps, start_time, end_time], outputs=[estimate_md])

        btn_extract.click(
            step1_extract,
            inputs=[video, mode, every_seconds, nth_frame, exact_fps, start_time, end_time, long_side, out_format, jpg_quality, png_level, scene_detect, scene_thresh, prefix_vid, prog, preview_all],
            outputs=[gallery, zip_out, details, cmd_preview, prog, frames_state, raw_dir_state, prefix_state],
        )

        if MISSING_MSG:
            gr.Markdown(f"<span style='color:#b45309'>{MISSING_MSG}</span>")
    return demo
if __name__ == "__main__":
    # Script entry point: build the interface, call queue() on it, then launch.
    app = build_ui()
    app.queue().launch()