| |
|
|
| |
| |
| |
| import os, re, json, math, time, zipfile, tempfile, subprocess, base64 |
| from pathlib import Path |
| from typing import List, Optional |
| import gradio as gr |
|
|
| _num = re.compile(r'(\d+)') |
|
|
| def _natural_key(p: Path | str): |
| s = str(p) |
| return [int(t) if t.isdigit() else t.lower() for t in _num.split(s)] |
|
|
| def sample_paths(paths: List[Path] | List[str], n: int = 30) -> List[str]: |
| if not paths: |
| return [] |
| paths = sorted(paths, key=_natural_key) |
| total = len(paths) |
| n = max(1, min(n, total)) |
| if n == total: |
| return [str(p) for p in paths] |
| step = (total - 1) / (n - 1) |
| idxs = [round(i * step) for i in range(n)] |
| out, seen = [], set() |
| for i in idxs: |
| if i not in seen: |
| out.append(str(paths[int(i)])) |
| seen.add(int(i)) |
| return out |
|
|
| |
| |
| |
| APP_DIR = os.getcwd() |
| def load_logo_base64(path: str) -> str: |
| with open(path, "rb") as f: |
| return base64.b64encode(f.read()).decode("utf-8") |
|
|
| LOGO_B64 = load_logo_base64(os.path.join(APP_DIR, "bifrost_logo.png")) |
|
|
| def render_logo_html(px: int = 96) -> str: |
| return f""" |
| <div style="display:flex;align-items:center;gap:16px;"> |
| <img src="data:image/png;base64,{LOGO_B64}" style="height:{px}px;width:auto;" /> |
| <div> |
| <div style="font-size:1.6rem;font-weight:800;">Bifröst · Video-to-Image Extractor</div> |
| <div style="opacity:0.8;">The Rainbow Bridge to Frames — split video into images with precision</div> |
| </div> |
| </div> |
| <hr> |
| """ |
|
|
| |
| |
| |
| def _which(name: str) -> Optional[str]: |
| from shutil import which |
| return which(name) |
|
|
| FFMPEG = _which("ffmpeg") |
| FFPROBE = _which("ffprobe") |
|
|
| if not FFMPEG or not FFPROBE: |
| MISSING_MSG = ( |
| "⚠️ FFmpeg not found. Add a 'packages.txt' with exactly:\n" |
| "ffmpeg\n" |
| "libsm6\n" |
| "libxext6\n" |
| "Then restart the Space." |
| ) |
| else: |
| MISSING_MSG = "" |
|
|
| |
| |
| |
| def sanitize_prefix(txt: str) -> str: |
| txt = (txt or "").strip() |
| if not txt: |
| return "" |
| return re.sub(r"[^A-Za-z0-9._-]+", "_", txt)[:80] |
|
|
| def ffprobe_json(input_path: str) -> dict: |
| if not FFPROBE: |
| return {} |
| cmd = [FFPROBE, "-v", "error", "-print_format", "json", "-show_streams", "-show_format", input_path] |
| res = subprocess.run(cmd, capture_output=True, text=True) |
| if res.returncode != 0: |
| return {} |
| try: |
| return json.loads(res.stdout) |
| except Exception: |
| return {} |
|
|
| def parse_video_info(meta: dict) -> dict: |
| info = {"duration": None, "fps": None, "width": None, "height": None} |
| if not meta: |
| return info |
| try: |
| info["duration"] = float(meta.get("format", {}).get("duration", None)) |
| except Exception: |
| pass |
| vstreams = [s for s in meta.get("streams", []) if s.get("codec_type") == "video"] |
| if vstreams: |
| v = vstreams[0] |
| rfr = v.get("r_frame_rate") or v.get("avg_frame_rate") |
| if rfr and "/" in rfr: |
| try: |
| num, den = rfr.split("/") |
| num = float(num); den = float(den) |
| if den != 0: |
| info["fps"] = num / den |
| except Exception: |
| pass |
| info["width"] = v.get("width") |
| info["height"] = v.get("height") |
| return info |
|
|
| def estimate_output_count(mode: str, duration: float | None, in_fps: float | None, |
| every_seconds: float, nth_frame: int, exact_fps: float) -> Optional[int]: |
| if not duration: |
| return None |
| in_fps = in_fps or 30.0 |
| try: |
| if mode == "All frames": |
| return int(math.ceil(duration * in_fps)) |
| if mode == "Every N seconds" and every_seconds > 0: |
| return int(math.ceil(duration / every_seconds)) |
| if mode == "Every Nth frame" and nth_frame > 0: |
| return int(math.ceil((duration * in_fps) / nth_frame)) |
| if mode == "Exact FPS" and exact_fps > 0: |
| return int(math.ceil(duration * exact_fps)) |
| except Exception: |
| return None |
| return None |
|
|
| def build_ffmpeg_extract( |
| input_path: str, |
| mode: str, |
| every_seconds: float, |
| nth_frame: int, |
| exact_fps: float, |
| start_time: str, |
| end_time: str, |
| long_side: int, |
| out_format: str, |
| jpg_quality: int, |
| png_level: int, |
| scene_detect: bool, |
| scene_thresh: float, |
| out_pattern: str, |
| ) -> List[str]: |
| if not FFMPEG: |
| raise RuntimeError("FFmpeg not available") |
| cmd = [FFMPEG, "-y"] |
| if start_time: |
| cmd += ["-ss", start_time] |
| cmd += ["-i", input_path] |
| if end_time: |
| cmd += ["-to", end_time] |
| vf = [] |
| if mode == "Every N seconds": |
| vf.append(f"fps={max(1e-6, 1.0/float(every_seconds or 1))}") |
| elif mode == "Every Nth frame": |
| vf.append(f"select='not(mod(n,{max(1, int(nth_frame or 1))}))'") |
| vf.append("setpts=N/FRAME_RATE/TB") |
| elif mode == "Exact FPS": |
| vf.append(f"fps={max(1e-6, float(exact_fps or 1))}") |
| elif mode == "All frames": |
| pass |
| else: |
| vf.append("fps=1") |
| if scene_detect: |
| vf.append(f"select='gt(scene,{float(scene_thresh)})',showinfo") |
| vf.append("setpts=N/FRAME_RATE/TB") |
| if long_side and long_side > 0: |
| vf.append("scale='if(gt(iw,ih),%d,-1)':'if(gt(iw,ih),-1,%d)':force_original_aspect_ratio=decrease" % (long_side, long_side)) |
| if vf: |
| cmd += ["-vf", ",".join(vf)] |
| if out_format == "jpg": |
| cmd += ["-q:v", str(jpg_quality)] |
| elif out_format == "png": |
| cmd += ["-compression_level", str(png_level)] |
| cmd += ["-frame_pts", "1", out_pattern] |
| return cmd |
|
|
| def render_progress(pct: float, label: str = "") -> str: |
| pct = max(0.0, min(100.0, pct)) |
| return f'''<div style="width:100%;border:1px solid #ddd;border-radius:8px;overflow:hidden;height:18px;"> |
| <div style="height:100%;width:{pct:.1f}%;background:#3b82f6;"></div></div> |
| <div style="font-size:12px;opacity:.8;margin-top:4px;">{label} {pct:.1f}%</div>''' |
|
|
| |
| |
| |
| def step1_extract( |
| video: gr.File | None, |
| mode: str, |
| every_seconds: float, |
| nth_frame: int, |
| exact_fps: float, |
| start_time: str, |
| end_time: str, |
| long_side: int, |
| out_format: str, |
| jpg_quality: int, |
| png_level: int, |
| scene_detect: bool, |
| scene_thresh: float, |
| prefix_in: str, |
| prog_html: str, |
| preview_all: bool, |
| ): |
| if not video or not video.name: |
| yield None, None, "Upload a video.", "", prog_html, None, None, None |
| return |
| if not FFMPEG or not FFPROBE: |
| yield None, None, "FFmpeg missing. See note below.", MISSING_MSG, prog_html, None, None, None |
| return |
|
|
| work = Path(tempfile.mkdtemp(prefix="vid2img_")) |
| raw_dir = work / "frames_raw" |
| raw_dir.mkdir(parents=True, exist_ok=True) |
|
|
| prefix = sanitize_prefix(prefix_in) or Path(video.name).stem |
|
|
| vinfo = parse_video_info(ffprobe_json(video.name)) |
| full_duration = float(vinfo.get("duration") or 0.0) |
|
|
| def _parse_ts(ts: str) -> float: |
| if not ts: |
| return 0.0 |
| h, m, s = ts.split(":") if ":" in ts else ("0", "0", ts) |
| return float(h) * 3600 + float(m) * 60 + float(s) |
|
|
| st_s = _parse_ts((start_time or "").strip()) |
| et_s = _parse_ts((end_time or "").strip()) |
| if full_duration and st_s > 0: |
| full_duration = max(0.0, full_duration - st_s) |
| if full_duration and et_s > 0 and et_s < (vinfo.get("duration") or 0): |
| full_duration = max(0.0, min(full_duration, et_s)) |
|
|
| pattern = str(raw_dir / f"{prefix}_%05d.{out_format}") |
| cmd = build_ffmpeg_extract( |
| input_path=video.name, |
| mode=mode, |
| every_seconds=every_seconds, |
| nth_frame=nth_frame, |
| exact_fps=exact_fps, |
| start_time=(start_time or "").strip(), |
| end_time=(end_time or "").strip(), |
| long_side=long_side, |
| out_format=out_format, |
| jpg_quality=jpg_quality, |
| png_level=png_level, |
| scene_detect=scene_detect, |
| scene_thresh=scene_thresh, |
| out_pattern=pattern, |
| ) |
|
|
| cmd = [cmd[0], "-progress", "pipe:2"] + cmd[1:] |
| cmd_preview = " ".join([s if " " not in s else f'"{s}"' for s in cmd]) |
|
|
| proc = subprocess.Popen( |
| cmd, stderr=subprocess.PIPE, stdout=subprocess.DEVNULL, text=True, bufsize=1 |
| ) |
|
|
| last_pct = 0.0 |
| gallery_preview = [] |
| while True: |
| line = proc.stderr.readline() |
| if not line and proc.poll() is not None: |
| break |
| line = (line or "").strip() |
| if line.startswith("out_time=") and full_duration > 0: |
| t = line.split("=", 1)[1] |
| try: |
| h, m, s = t.split(":") |
| secs = float(h) * 3600 + float(m) * 60 + float(s) |
| except Exception: |
| secs = 0.0 |
| pct = max(0.0, min(100.0, (secs / full_duration) * 100.0)) |
| if pct - last_pct >= 1.0 or pct in (0.0, 100.0): |
| last_pct = pct |
| gallery_preview = sample_paths(sorted(raw_dir.glob(f"{prefix}_*.{out_format}"), key=_natural_key), 36) |
| yield gallery_preview, None, "Extracting…", cmd_preview, render_progress(pct, f"Extracting {pct:.0f}%"), None, str(raw_dir), prefix |
|
|
| ret = proc.wait() |
| frames = sorted(raw_dir.glob(f"{prefix}_*.{out_format}"), key=_natural_key) |
|
|
| if preview_all: |
| gallery = [str(p) for p in frames] |
| else: |
| gallery = [str(p) for p in frames] if len(frames) <= 100 else sample_paths(frames, 100) |
|
|
| |
| zip_path = work / f"{prefix}_frames.zip" |
| with zipfile.ZipFile(zip_path, "w", zipfile.ZIP_DEFLATED) as zf: |
| for p in frames: |
| zf.write(p, p.name) |
|
|
| if ret != 0 or not frames: |
| err = "" |
| try: |
| err = proc.stderr.read() if proc.stderr else "" |
| except Exception: |
| pass |
| yield gallery, None, f"Extraction failed.\n\n{err}", cmd_preview, render_progress(0.0, "Failed"), None, str(raw_dir), prefix |
| return |
|
|
| details = f"Frames extracted: {len(frames)} | Saved to: {raw_dir}" |
| yield gallery, str(zip_path), details, cmd_preview, render_progress(100.0, f"Extracted {len(frames)} frames"), [str(p) for p in frames], str(raw_dir), prefix |
|
|
| |
| |
| |
| def build_ui(): |
| with gr.Blocks(theme=gr.themes.Soft()) as demo: |
| gr.HTML(render_logo_html(88)) |
| gr.Markdown("Extract frames from a video with live progress.") |
|
|
| with gr.Row(): |
| video = gr.File(label="Upload video", file_types=[".mp4", ".mov", ".mkv", ".avi", ".webm", ".m4v"], type="filepath") |
|
|
| preview_all = gr.Checkbox(value=False, label="Preview all frames (may be slow)") |
|
|
| with gr.Accordion("Extraction Settings", open=True): |
| with gr.Row(): |
| mode = gr.Dropdown(["Every N seconds", "Every Nth frame", "Exact FPS", "All frames"], value="Every N seconds", label="Mode") |
| every_seconds = gr.Number(value=1.0, label="Every N seconds") |
| nth_frame = gr.Number(value=30, label="Every Nth frame") |
| exact_fps = gr.Number(value=1.0, label="Exact FPS") |
| with gr.Row(): |
| start_time = gr.Textbox(value="", label="Start (HH:MM:SS.mmm)") |
| end_time = gr.Textbox(value="", label="End (HH:MM:SS.mmm)") |
| long_side = gr.Number(value=0, label="Resize long side px (0 = none)") |
| with gr.Row(): |
| out_format = gr.Dropdown(["jpg", "png"], value="jpg", label="Output format") |
| jpg_quality = gr.Slider(2, 31, value=3, step=1, label="JPG quality (2=best)") |
| png_level = gr.Slider(0, 9, value=2, step=1, label="PNG compression level") |
| with gr.Row(): |
| scene_detect = gr.Checkbox(False, label="Scene-change detect") |
| scene_thresh = gr.Slider(0.0, 1.0, value=0.3, step=0.01, label="Scene threshold") |
| prefix_vid = gr.Textbox(value="", label="Filename prefix (defaults to input video name)") |
|
|
| btn_extract = gr.Button("Extract Frames", variant="primary") |
| prog = gr.HTML(render_progress(0.0, "Idle")) |
| gallery = gr.Gallery(label="Preview (≤100 or all if toggled)", columns=6, height=480) |
| zip_out = gr.File(label="Download frames ZIP") |
| details = gr.Markdown("Ready.") |
| with gr.Accordion("Show FFmpeg command", open=False): |
| cmd_preview = gr.Textbox(label="ffmpeg command", lines=4) |
| estimate_md = gr.Markdown("Estimated output: —") |
|
|
| def _toggle_params(mode_val, fmt): |
| return ( |
| gr.update(visible=(mode_val == "Every N seconds")), |
| gr.update(visible=(mode_val == "Every Nth frame")), |
| gr.update(visible=(mode_val == "Exact FPS")), |
| gr.update(visible=(fmt == "jpg")), |
| gr.update(visible=(fmt == "png")), |
| ) |
|
|
| def update_estimate(vfile, mode_val, evs, nth, exfps, st, et): |
| if not vfile or not getattr(vfile, 'name', None): |
| return "Estimated output: —" |
| info = parse_video_info(ffprobe_json(vfile.name)) |
| dur = info.get("duration") |
| def parse_ts(ts: str): |
| if not ts: return 0.0 |
| parts = ts.split(":") |
| if len(parts) == 3: |
| try: return float(parts[0])*3600 + float(parts[1])*60 + float(parts[2]) |
| except Exception: return 0.0 |
| return 0.0 |
| st_s = parse_ts(st or ""); et_s = parse_ts(et or "") |
| if dur: |
| if st_s: dur = max(0.0, dur - st_s) |
| if et_s and et_s < info.get("duration", 0) and et_s > 0: |
| dur = min(dur, et_s) |
| est = estimate_output_count(mode_val, dur, info.get("fps"), evs or 1.0, int(nth or 1), exfps or 1.0) |
| return f"Estimated output: **~{est} frames**" if est else "Estimated output: —" |
|
|
| mode.change(_toggle_params, [mode, out_format], [every_seconds, nth_frame, exact_fps, jpg_quality, png_level]) |
| out_format.change(_toggle_params, [mode, out_format], [every_seconds, nth_frame, exact_fps, jpg_quality, png_level]) |
| demo.load(_toggle_params, [mode, out_format], [every_seconds, nth_frame, exact_fps, jpg_quality, png_level]) |
|
|
| for ctrl in [video, mode, every_seconds, nth_frame, exact_fps, start_time, end_time]: |
| ctrl.change(update_estimate, inputs=[video, mode, every_seconds, nth_frame, exact_fps, start_time, end_time], outputs=[estimate_md]) |
|
|
| btn_extract.click( |
| step1_extract, |
| inputs=[video, mode, every_seconds, nth_frame, exact_fps, start_time, end_time, long_side, out_format, jpg_quality, png_level, scene_detect, scene_thresh, prefix_vid, prog, preview_all], |
| outputs=[gallery, zip_out, details, cmd_preview, prog], |
| ) |
|
|
| if MISSING_MSG: |
| gr.Markdown(f"<span style='color:#b45309'>{MISSING_MSG}</span>") |
|
|
| return demo |
|
|
| if __name__ == "__main__": |
| build_ui().queue().launch() |
|
|