Spaces:

Clara211111
/

flow3r

Running on Zero

App Files Files Community

Clara211111 commited on Feb 27

Commit

225a205

1 Parent(s): fb4b0cb

test

Browse files

Files changed (4) hide show

README.md +1 -1
app copy.py +0 -740
app.py +0 -7
requirements.txt +1 -0

README.md CHANGED Viewed

@@ -4,7 +4,7 @@ emoji: 👁
 colorFrom: pink
 colorTo: green
 sdk: gradio
-sdk_version: 5.17.1
 app_file: app.py
 pinned: false
 ---

 colorFrom: pink
 colorTo: green
 sdk: gradio
+sdk_version: 5.37.0
 app_file: app.py
 pinned: false
 ---

app copy.py DELETED Viewed

@@ -1,740 +0,0 @@
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the license found in the
-# LICENSE file in the root directory of this source tree.
-import os, time, sys
-print("### SPACE BOOT: file =", __file__, flush=True)
-print("### argv =", sys.argv, flush=True)
-print("### cwd =", os.getcwd(), flush=True)
-print("### gradio_ssr =", os.environ.get("GRADIO_SSR_MODE"), "zero =", os.environ.get("SPACES_ZERO_GPU"), flush=True)
-import os
-import cv2
-import torch
-import numpy as np
-import gradio as gr
-import sys
-import shutil
-from datetime import datetime
-import glob
-import gc
-import time
-import trimesh
-import matplotlib
-import spaces
-from flow3r.models.flow3r import Flow3r
-from flow3r.utils.basic import load_images_as_tensor
-from flow3r.utils.geometry import depth_edge
-from scipy.spatial.transform import Rotation
-from huggingface_hub import hf_hub_download
-# sys.path.append("flow3r/")
-device = "cuda" if torch.cuda.is_available() else "cpu"
-print("Initializing and loading Flow3r model...")
-model = Flow3r()
-ckpt_path = hf_hub_download(repo_id="Clara211111/flow3r", filename="flow3r.bin")
-checkpoint = torch.load(ckpt_path, weights_only=False, map_location='cpu')
-model.load_state_dict(checkpoint, strict=True)
-model.eval()
-model = model.to(device)
-# -------------------------------------------------------------------------
-# Utils
-# -------------------------------------------------------------------------
-def predictions_to_glb(
-    predictions,
-    conf_thres=50.0,
-    filter_by_frames="all",
-    show_cam=True,
-) -> trimesh.Scene:
-    """
-    Converts predictions to a 3D scene represented as a GLB file.
-    Args:
-        predictions (dict): Dictionary containing model predictions with keys:
-            - world_points: 3D point coordinates (S, H, W, 3)
-            - world_points_conf: Confidence scores (S, H, W)
-            - images: Input images (S, H, W, 3)
-            - extrinsic: Camera extrinsic matrices (S, 3, 4)
-        conf_thres (float): Percentage of low-confidence points to filter out (default: 50.0)
-        filter_by_frames (str): Frame filter specification (default: "all")
-        show_cam (bool): Include camera visualization (default: True)
-    Returns:
-        trimesh.Scene: Processed 3D scene containing point cloud and cameras
-    Raises:
-        ValueError: If input predictions structure is invalid
-    """
-    if not isinstance(predictions, dict):
-        raise ValueError("predictions must be a dictionary")
-    if conf_thres is None:
-        conf_thres = 10
-    print("Building GLB scene")
-    selected_frame_idx = None
-    if filter_by_frames != "all" and filter_by_frames != "All":
-        try:
-            # Extract the index part before the colon
-            selected_frame_idx = int(filter_by_frames.split(":")[0])
-        except (ValueError, IndexError):
-            pass
-    pred_world_points = predictions["points"]
-    pred_world_points_conf = predictions.get("conf", np.ones_like(pred_world_points[..., 0]))
-    # Get images from predictions
-    images = predictions["images"]
-    # Use extrinsic matrices instead of pred_extrinsic_list
-    camera_poses = predictions["camera_poses"]
-    if selected_frame_idx is not None:
-        pred_world_points = pred_world_points[selected_frame_idx][None]
-        pred_world_points_conf = pred_world_points_conf[selected_frame_idx][None]
-        images = images[selected_frame_idx][None]
-        camera_poses = camera_poses[selected_frame_idx][None]
-    vertices_3d = pred_world_points.reshape(-1, 3)
-    # Handle different image formats - check if images need transposing
-    if images.ndim == 4 and images.shape[1] == 3:  # NCHW format
-        colors_rgb = np.transpose(images, (0, 2, 3, 1))
-    else:  # Assume already in NHWC format
-        colors_rgb = images
-    colors_rgb = (colors_rgb.reshape(-1, 3) * 255).astype(np.uint8)
-    conf = pred_world_points_conf.reshape(-1)
-    # Convert percentage threshold to actual confidence value
-    if conf_thres == 0.0:
-        conf_threshold = 0.0
-    else:
-        # conf_threshold = np.percentile(conf, conf_thres)
-        conf_threshold = conf_thres / 100
-    conf_mask = (conf >= conf_threshold) & (conf > 1e-5)
-    vertices_3d = vertices_3d[conf_mask]
-    colors_rgb = colors_rgb[conf_mask]
-    if vertices_3d is None or np.asarray(vertices_3d).size == 0:
-        vertices_3d = np.array([[1, 0, 0]])
-        colors_rgb = np.array([[255, 255, 255]])
-        scene_scale = 1
-    else:
-        # Calculate the 5th and 95th percentiles along each axis
-        lower_percentile = np.percentile(vertices_3d, 5, axis=0)
-        upper_percentile = np.percentile(vertices_3d, 95, axis=0)
-        # Calculate the diagonal length of the percentile bounding box
-        scene_scale = np.linalg.norm(upper_percentile - lower_percentile)
-    colormap = matplotlib.colormaps.get_cmap("gist_rainbow")
-    # Initialize a 3D scene
-    scene_3d = trimesh.Scene()
-    # Add point cloud data to the scene
-    point_cloud_data = trimesh.PointCloud(vertices=vertices_3d, colors=colors_rgb)
-    scene_3d.add_geometry(point_cloud_data)
-    # Prepare 4x4 matrices for camera extrinsics
-    num_cameras = len(camera_poses)
-    if show_cam:
-        # Add camera models to the scene
-        for i in range(num_cameras):
-            camera_to_world = camera_poses[i]
-            rgba_color = colormap(i / num_cameras)
-            current_color = tuple(int(255 * x) for x in rgba_color[:3])
-            # integrate_camera_into_scene(scene_3d, camera_to_world, current_color, scene_scale)
-            integrate_camera_into_scene(scene_3d, camera_to_world, current_color, 1.)          # fixed camera size
-    # Rotate scene for better visualize
-    align_rotation = np.eye(4)
-    align_rotation[:3, :3] = Rotation.from_euler("y", 100, degrees=True).as_matrix()            # plane rotate
-    align_rotation[:3, :3] = align_rotation[:3, :3] @ Rotation.from_euler("x", 155, degrees=True).as_matrix()           # roll
-    scene_3d.apply_transform(align_rotation)
-    print("GLB Scene built")
-    return scene_3d
-def get_opengl_conversion_matrix() -> np.ndarray:
-    """
-    Constructs and returns the OpenGL conversion matrix.
-    Returns:
-        numpy.ndarray: A 4x4 OpenGL conversion matrix.
-    """
-    # Create an identity matrix
-    matrix = np.identity(4)
-    # Flip the y and z axes
-    matrix[1, 1] = -1
-    matrix[2, 2] = -1
-    return matrix
-def integrate_camera_into_scene(scene: trimesh.Scene, transform: np.ndarray, face_colors: tuple, scene_scale: float):
-    """
-    Integrates a fake camera mesh into the 3D scene.
-    Args:
-        scene (trimesh.Scene): The 3D scene to add the camera model.
-        transform (np.ndarray): Transformation matrix for camera positioning.
-        face_colors (tuple): Color of the camera face.
-        scene_scale (float): Scale of the scene.
-    """
-    cam_width = scene_scale * 0.05
-    cam_height = scene_scale * 0.1
-    # Create cone shape for camera
-    rot_45_degree = np.eye(4)
-    rot_45_degree[:3, :3] = Rotation.from_euler("z", 45, degrees=True).as_matrix()
-    rot_45_degree[2, 3] = -cam_height
-    opengl_transform = get_opengl_conversion_matrix()
-    # Combine transformations
-    complete_transform = transform @ opengl_transform @ rot_45_degree
-    camera_cone_shape = trimesh.creation.cone(cam_width, cam_height, sections=4)
-    # Generate mesh for the camera
-    slight_rotation = np.eye(4)
-    slight_rotation[:3, :3] = Rotation.from_euler("z", 2, degrees=True).as_matrix()
-    vertices_combined = np.concatenate(
-        [
-            camera_cone_shape.vertices,
-            0.95 * camera_cone_shape.vertices,
-            transform_points(slight_rotation, camera_cone_shape.vertices),
-        ]
-    )
-    vertices_transformed = transform_points(complete_transform, vertices_combined)
-    mesh_faces = compute_camera_faces(camera_cone_shape)
-    # Add the camera mesh to the scene
-    camera_mesh = trimesh.Trimesh(vertices=vertices_transformed, faces=mesh_faces)
-    camera_mesh.visual.face_colors[:, :3] = face_colors
-    scene.add_geometry(camera_mesh)
-def transform_points(transformation: np.ndarray, points: np.ndarray, dim: int = None) -> np.ndarray:
-    """
-    Applies a 4x4 transformation to a set of points.
-    Args:
-        transformation (np.ndarray): Transformation matrix.
-        points (np.ndarray): Points to be transformed.
-        dim (int, optional): Dimension for reshaping the result.
-    Returns:
-        np.ndarray: Transformed points.
-    """
-    points = np.asarray(points)
-    initial_shape = points.shape[:-1]
-    dim = dim or points.shape[-1]
-    # Apply transformation
-    transformation = transformation.swapaxes(-1, -2)  # Transpose the transformation matrix
-    points = points @ transformation[..., :-1, :] + transformation[..., -1:, :]
-    # Reshape the result
-    result = points[..., :dim].reshape(*initial_shape, dim)
-    return result
-def compute_camera_faces(cone_shape: trimesh.Trimesh) -> np.ndarray:
-    """
-    Computes the faces for the camera mesh.
-    Args:
-        cone_shape (trimesh.Trimesh): The shape of the camera cone.
-    Returns:
-        np.ndarray: Array of faces for the camera mesh.
-    """
-    # Create pseudo cameras
-    faces_list = []
-    num_vertices_cone = len(cone_shape.vertices)
-    for face in cone_shape.faces:
-        if 0 in face:
-            continue
-        v1, v2, v3 = face
-        v1_offset, v2_offset, v3_offset = face + num_vertices_cone
-        v1_offset_2, v2_offset_2, v3_offset_2 = face + 2 * num_vertices_cone
-        faces_list.extend(
-            [
-                (v1, v2, v2_offset),
-                (v1, v1_offset, v3),
-                (v3_offset, v2, v3),
-                (v1, v2, v2_offset_2),
-                (v1, v1_offset_2, v3),
-                (v3_offset_2, v2, v3),
-            ]
-        )
-    faces_list += [(v3, v2, v1) for v1, v2, v3 in faces_list]
-    return np.array(faces_list)
-# -------------------------------------------------------------------------
-# 1) Core model inference
-# -------------------------------------------------------------------------
-@spaces.GPU(duration=120)
-def run_model(target_dir, model) -> dict:
-    print(f"Processing images from {target_dir}")
-    # Device check
-    device = "cuda" if torch.cuda.is_available() else "cpu"
-    if not torch.cuda.is_available():
-        raise ValueError("CUDA is not available. Check your environment.")
-    # Move model to device
-    model = model.to(device)
-    model.eval()
-    # Load and preprocess images
-    image_names = glob.glob(os.path.join(target_dir, "images", "*"))
-    image_names = sorted(image_names)
-    print(f"Found {len(image_names)} images")
-    if len(image_names) == 0:
-        raise ValueError("No images found. Check your upload.")
-    # interval = 10 if target_dir.endswith('.mp4') else 1
-    interval = 1
-    imgs = load_images_as_tensor(os.path.join(target_dir, "images"), interval=interval).to(device) # (N, 3, H, W)
-    # Run inference
-    print("Running inference...")
-    dtype = torch.bfloat16 if torch.cuda.get_device_capability()[0] >= 8 else torch.float16
-    with torch.no_grad():
-        with torch.cuda.amp.autocast(dtype=dtype):
-            predictions = model(imgs[None]) # Add batch dimension
-    predictions['images'] = imgs[None].permute(0, 1, 3, 4, 2)
-    predictions['conf'] = torch.sigmoid(predictions['conf'])
-    edge = depth_edge(predictions['local_points'][..., 2], rtol=0.03)
-    predictions['conf'][edge] = 0.0
-    del predictions['local_points']
-    # Convert tensors to numpy
-    for key in predictions.keys():
-        if isinstance(predictions[key], torch.Tensor):
-            predictions[key] = predictions[key].cpu().numpy().squeeze(0)  # remove batch dimension
-    # Clean up
-    torch.cuda.empty_cache()
-    return predictions
-# -------------------------------------------------------------------------
-# 2) Handle uploaded video/images --> produce target_dir + images
-# -------------------------------------------------------------------------
-def handle_uploads(input_video, input_images):
-    """
-    Create a new 'target_dir' + 'images' subfolder, and place user-uploaded
-    images or extracted frames from video into it. Return (target_dir, image_paths).
-    """
-    start_time = time.time()
-    gc.collect()
-    torch.cuda.empty_cache()
-    # Create a unique folder name
-    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S_%f")
-    target_dir = f"input_images_{timestamp}"
-    target_dir_images = os.path.join(target_dir, "images")
-    # Clean up if somehow that folder already exists
-    if os.path.exists(target_dir):
-        shutil.rmtree(target_dir)
-    os.makedirs(target_dir)
-    os.makedirs(target_dir_images)
-    image_paths = []
-    # --- Handle images ---
-    if input_images is not None:
-        for file_data in input_images:
-            if isinstance(file_data, dict) and "name" in file_data:
-                file_path = file_data["name"]
-            else:
-                file_path = file_data
-            dst_path = os.path.join(target_dir_images, os.path.basename(file_path))
-            shutil.copy(file_path, dst_path)
-            image_paths.append(dst_path)
-    # --- Handle video ---
-    if input_video is not None:
-        if isinstance(input_video, dict) and "name" in input_video:
-            video_path = input_video["name"]
-        else:
-            video_path = input_video
-        vs = cv2.VideoCapture(video_path)
-        fps = vs.get(cv2.CAP_PROP_FPS)
-        frame_interval = int(fps * 1)  # 1 frame/sec
-        count = 0
-        video_frame_num = 0
-        while True:
-            gotit, frame = vs.read()
-            if not gotit:
-                break
-            count += 1
-            if count % frame_interval == 0:
-                image_path = os.path.join(target_dir_images, f"{video_frame_num:06}.png")
-                cv2.imwrite(image_path, frame)
-                image_paths.append(image_path)
-                video_frame_num += 1
-    # Sort final images for gallery
-    image_paths = sorted(image_paths)
-    end_time = time.time()
-    print(f"Files copied to {target_dir_images}; took {end_time - start_time:.3f} seconds")
-    return target_dir, image_paths
-# -------------------------------------------------------------------------
-# 3) Update gallery on upload
-# -------------------------------------------------------------------------
-def update_gallery_on_upload(input_video, input_images):
-    """
-    Whenever user uploads or changes files, immediately handle them
-    and show in the gallery. Return (target_dir, image_paths).
-    If nothing is uploaded, returns "None" and empty list.
-    """
-    if not input_video and not input_images:
-        return None, None, None, None
-    target_dir, image_paths = handle_uploads(input_video, input_images)
-    return None, target_dir, image_paths, "Upload complete. Click 'Reconstruct' to begin 3D processing."
-# -------------------------------------------------------------------------
-# 4) Reconstruction: uses the target_dir plus any viz parameters
-# -------------------------------------------------------------------------
-@spaces.GPU(duration=120)
-def gradio_demo(
-    target_dir,
-    conf_thres=3.0,
-    frame_filter="All",
-    show_cam=True,
-):
-    """
-    Perform reconstruction using the already-created target_dir/images.
-    """
-    if not os.path.isdir(target_dir) or target_dir == "None":
-        return None, "No valid target directory found. Please upload first.", None, None
-    start_time = time.time()
-    gc.collect()
-    torch.cuda.empty_cache()
-    # Prepare frame_filter dropdown
-    target_dir_images = os.path.join(target_dir, "images")
-    all_files = sorted(os.listdir(target_dir_images)) if os.path.isdir(target_dir_images) else []
-    all_files = [f"{i}: {filename}" for i, filename in enumerate(all_files)]
-    frame_filter_choices = ["All"] + all_files
-    print("Running run_model...")
-    with torch.no_grad():
-        predictions = run_model(target_dir, model)
-    # Save predictions
-    prediction_save_path = os.path.join(target_dir, "predictions.npz")
-    np.savez(prediction_save_path, **predictions)
-    # Handle None frame_filter
-    if frame_filter is None:
-        frame_filter = "All"
-    # Build a GLB file name
-    glbfile = os.path.join(
-        target_dir,
-        f"glbscene_{conf_thres}_{frame_filter.replace('.', '_').replace(':', '').replace(' ', '_')}_cam{show_cam}.glb",
-    )
-    # Convert predictions to GLB
-    glbscene = predictions_to_glb(
-        predictions,
-        conf_thres=conf_thres,
-        filter_by_frames=frame_filter,
-        show_cam=show_cam,
-        # mask_sky=mask_sky,
-    )
-    glbscene.export(file_obj=glbfile)
-    # Cleanup
-    del predictions
-    gc.collect()
-    torch.cuda.empty_cache()
-    end_time = time.time()
-    print(f"Total time: {end_time - start_time:.2f} seconds (including IO)")
-    log_msg = f"Reconstruction Success ({len(all_files)} frames). Waiting for visualization."
-    return glbfile, log_msg, gr.Dropdown(choices=frame_filter_choices, value=frame_filter, interactive=True)
-# -------------------------------------------------------------------------
-# 5) Helper functions for UI resets + re-visualization
-# -------------------------------------------------------------------------
-def clear_fields():
-    """
-    Clears the 3D viewer, the stored target_dir, and empties the gallery.
-    """
-    return None
-def update_log():
-    """
-    Display a quick log message while waiting.
-    """
-    return "Loading and Reconstructing..."
-def update_visualization(
-    target_dir, conf_thres, frame_filter, show_cam, is_example
-):
-    """
-    Reload saved predictions from npz, create (or reuse) the GLB for new parameters,
-    and return it for the 3D viewer. If is_example == "True", skip.
-    """
-    # If it's an example click, skip as requested
-    if is_example == "True":
-        return None, "No reconstruction available. Please click the Reconstruct button first."
-    if not target_dir or target_dir == "None" or not os.path.isdir(target_dir):
-        return None, "No reconstruction available. Please click the Reconstruct button first."
-    predictions_path = os.path.join(target_dir, "predictions.npz")
-    if not os.path.exists(predictions_path):
-        return None, f"No reconstruction available at {predictions_path}. Please run 'Reconstruct' first."
-    key_list = [
-        "images",
-        "points",
-        "conf",
-        "camera_poses",
-    ]
-    loaded = np.load(predictions_path)
-    predictions = {key: np.array(loaded[key]) for key in key_list}
-    glbfile = os.path.join(
-        target_dir,
-        f"glbscene_{conf_thres}_{frame_filter.replace('.', '_').replace(':', '').replace(' ', '_')}_cam{show_cam}.glb",
-    )
-    if not os.path.exists(glbfile):
-        glbscene = predictions_to_glb(
-            predictions,
-            conf_thres=conf_thres,
-            filter_by_frames=frame_filter,
-            show_cam=show_cam,
-            # mask_sky=mask_sky,
-        )
-        glbscene.export(file_obj=glbfile)
-    return glbfile, "Updating Visualization"
-# -------------------------------------------------------------------------
-# Example images
-# -------------------------------------------------------------------------
-great_wall_video = "examples/videos/great_wall.mp4"
-colosseum_video = "examples/videos/Colosseum.mp4"
-room_video = "examples/videos/room.mp4"
-kitchen_video = "examples/videos/kitchen.mp4"
-fern_video = "examples/videos/fern.mp4"
-single_cartoon_video = "examples/videos/single_cartoon.mp4"
-single_oil_painting_video = "examples/videos/single_oil_painting.mp4"
-pyramid_video = "examples/videos/pyramid.mp4"
-# -------------------------------------------------------------------------
-# 6) Build Gradio UI
-# -------------------------------------------------------------------------
-theme = gr.themes.Ocean()
-theme.set(
-    checkbox_label_background_fill_selected="*button_primary_background_fill",
-    checkbox_label_text_color_selected="*button_primary_text_color",
-)
-with gr.Blocks(
-    theme=theme,
-    css="""
-    .custom-log * {
-        font-style: italic;
-        font-size: 22px !important;
-        background-image: linear-gradient(120deg, #0ea5e9 0%, #6ee7b7 60%, #34d399 100%);
-        -webkit-background-clip: text;
-        background-clip: text;
-        font-weight: bold !important;
-        color: transparent !important;
-        text-align: center !important;
-    }
-    .example-log * {
-        font-style: italic;
-        font-size: 16px !important;
-        background-image: linear-gradient(120deg, #0ea5e9 0%, #6ee7b7 60%, #34d399 100%);
-        -webkit-background-clip: text;
-        background-clip: text;
-        color: transparent !important;
-    }
-    #my_radio .wrap {
-        display: flex;
-        flex-wrap: nowrap;
-        justify-content: center;
-        align-items: center;
-    }
-    #my_radio .wrap label {
-        display: flex;
-        width: 50%;
-        justify-content: center;
-        align-items: center;
-        margin: 0;
-        padding: 10px 0;
-        box-sizing: border-box;
-    }
-    """,
-) as demo:
-    # Instead of gr.State, we use a hidden Textbox:
-    is_example = gr.Textbox(label="is_example", visible=False, value="None")
-    num_images = gr.Textbox(label="num_images", visible=False, value="None")
-    gr.HTML(
-        """
-    <h1>Flow3r: Factored Flow Prediction for Visual Geometry Learning</h1>
-    <p>
-    <a href="https://github.com/Kidrauh/flow3r">GitHub Repository</a> |
-    <a href="https://flow3r-project.github.io/">Project Page</a>
-    </p>
-    <div style="font-size: 16px; line-height: 1.5;">
-    <p>Upload a video or a set of images to create a 3D reconstruction of a scene or object. Flow3r takes these images and generates a 3D point cloud, along with estimated camera poses.</p>
-    </div>
-    """
-    )
-    target_dir_output = gr.Textbox(label="Target Dir", visible=False, value="None")
-    with gr.Row():
-        with gr.Column(scale=2):
-            input_video = gr.Video(label="Upload Video", interactive=True)
-            input_images = gr.File(file_count="multiple", label="Upload Images", interactive=True)
-            image_gallery = gr.Gallery(
-                label="Preview",
-                columns=4,
-                height="300px",
-                # show_download_button=True,
-                object_fit="contain",
-                preview=True,
-            )
-        with gr.Column(scale=4):
-            with gr.Column():
-                gr.Markdown("**3D Reconstruction (Point Cloud and Camera Poses)**")
-                log_output = gr.Markdown(
-                    "Please upload a video or images, then click Reconstruct.", elem_classes=["custom-log"]
-                )
-                reconstruction_output = gr.Model3D(height=520, zoom_speed=0.5, pan_speed=0.5)
-            with gr.Row():
-                submit_btn = gr.Button("Reconstruct", scale=1, variant="primary")
-                clear_btn = gr.ClearButton(
-                    [input_video, input_images, reconstruction_output, log_output, target_dir_output, image_gallery],
-                    scale=1,
-                )
-            with gr.Row():
-                conf_thres = gr.Slider(minimum=0, maximum=100, value=0, step=0.1, label="Confidence Threshold (%)")
-                frame_filter = gr.Dropdown(choices=["All"], value="All", label="Show Points from Frame")
-                with gr.Column():
-                    show_cam = gr.Checkbox(label="Show Camera", value=True)
-    submit_btn.click(fn=clear_fields, inputs=[], outputs=[reconstruction_output]).then(
-        fn=update_log, inputs=[], outputs=[log_output]
-    ).then(
-        fn=gradio_demo,
-        inputs=[
-            target_dir_output,
-            conf_thres,
-            frame_filter,
-            show_cam,
-        ],
-        outputs=[reconstruction_output, log_output, frame_filter],
-    ).then(
-        fn=lambda: "False", inputs=[], outputs=[is_example]  # set is_example to "False"
-    )
-    # -------------------------------------------------------------------------
-    # Real-time Visualization Updates
-    # -------------------------------------------------------------------------
-    conf_thres.change(
-        update_visualization,
-        [
-            target_dir_output,
-            conf_thres,
-            frame_filter,
-            show_cam,
-            is_example,
-        ],
-        [reconstruction_output, log_output],
-    )
-    frame_filter.change(
-        update_visualization,
-        [
-            target_dir_output,
-            conf_thres,
-            frame_filter,
-            show_cam,
-            is_example,
-        ],
-        [reconstruction_output, log_output],
-    )
-    show_cam.change(
-        update_visualization,
-        [
-            target_dir_output,
-            conf_thres,
-            frame_filter,
-            show_cam,
-            is_example,
-        ],
-        [reconstruction_output, log_output],
-    )
-    # -------------------------------------------------------------------------
-    # Auto-update gallery whenever user uploads or changes their files
-    # -------------------------------------------------------------------------
-    input_video.change(
-        fn=update_gallery_on_upload,
-        inputs=[input_video, input_images],
-        outputs=[reconstruction_output, target_dir_output, image_gallery, log_output],
-    )
-    input_images.change(
-        fn=update_gallery_on_upload,
-        inputs=[input_video, input_images],
-        outputs=[reconstruction_output, target_dir_output, image_gallery, log_output],
-    )
-    print("### ABOUT TO LAUNCH", flush=True)
-    demo.queue(max_size=20).launch(show_error=True, share=True, ssr_mode=False)

app.py CHANGED Viewed

@@ -4,12 +4,6 @@
 # This source code is licensed under the license found in the
 # LICENSE file in the root directory of this source tree.
 import os, time, sys
-print("### SPACE BOOT: file =", __file__, flush=True)
-print("### argv =", sys.argv, flush=True)
-print("### cwd =", os.getcwd(), flush=True)
-print("### gradio_ssr =", os.environ.get("GRADIO_SSR_MODE"), "zero =", os.environ.get("SPACES_ZERO_GPU"), flush=True)
 import os
 import cv2
 import torch
@@ -736,5 +730,4 @@ with gr.Blocks(
         inputs=[input_video, input_images],
         outputs=[reconstruction_output, target_dir_output, image_gallery, log_output],
     )
-    print("### ABOUT TO LAUNCH", flush=True)
     demo.queue(max_size=20).launch(show_error=True, share=True, ssr_mode=False)

 # This source code is licensed under the license found in the
 # LICENSE file in the root directory of this source tree.
 import os, time, sys
 import os
 import cv2
 import torch
         inputs=[input_video, input_images],
         outputs=[reconstruction_output, target_dir_output, image_gallery, log_output],
     )
     demo.queue(max_size=20).launch(show_error=True, share=True, ssr_mode=False)

requirements.txt CHANGED Viewed

@@ -6,6 +6,7 @@ opencv-python
 plyfile
 huggingface_hub
 safetensors
 # below for gradio
 gradio

 plyfile
 huggingface_hub
 safetensors
+pydantic==2.10.6
 # below for gradio
 gradio