"""TripoSplat Gradio demo with Spark.js in-browser viewer. Usage: python app.py """ import base64 import subprocess import tempfile import time from pathlib import Path from uuid import uuid4 import gradio as gr import spaces import torch from triposplat import TripoSplatPipeline import example_inputs_b64 as _b64 # ---------------------------------------------------------------------------- # Download checkpoints from HuggingFace Hub (VAST-AI/TripoSplat) # ---------------------------------------------------------------------------- subprocess.run( [ "hf", "download", "VAST-AI/TripoSplat", "--local-dir", "ckpts" ], check=True, ) # ---------------------------------------------------------------------------- # Pipeline (loaded once at startup) # ---------------------------------------------------------------------------- PIPE = TripoSplatPipeline( ckpt_path = "ckpts/diffusion_models/triposplat_fp16.safetensors", decoder_path = "ckpts/vae/triposplat_vae_decoder_fp16.safetensors", dinov3_path = "ckpts/clip_vision/dino_v3_vit_h.safetensors", flux2_vae_encoder_path = "ckpts/vae/flux2-vae.safetensors", rmbg_path = "ckpts/background_removal/birefnet.safetensors", device = "cuda", ) OUT_ROOT = Path("gradio_outputs").resolve() OUT_ROOT.mkdir(parents=True, exist_ok=True) VIEWER_HTML = Path("static/viewer/viewer.html").resolve() # Decode example images from base64 into a persistent temp directory so that # gr.Examples (which needs file paths) works without binary files in the repo. _EXAMPLES_TMPDIR = tempfile.mkdtemp(prefix="triposplat_examples_") def _write_example(varname: str, filename: str) -> str: path = Path(_EXAMPLES_TMPDIR) / filename path.write_bytes(base64.b64decode(getattr(_b64, varname))) return str(path) EXAMPLES = [ _write_example("CREATURE_BUTTERFLY", "creature_butterfly.webp"), _write_example("BUILDING_STONE_HOUSE", "building_stone_house.webp"), _write_example("VEHICLE_PIRATE_SHIP", "vehicle_pirate_ship.webp"), _write_example("PLANT_WATER_LILY", "plant_water_lily.webp"), ] PLACEHOLDER_HTML = ( "
" "3D viewer will appear here after generation
" ) def _gr_file(path: Path) -> str: """Gradio serves any file under `allowed_paths` at `/gradio_api/file=`.""" return f"/gradio_api/file={path.as_posix()}" def _viewer_iframe(ply_path: Path) -> str: ts = time.time() # cache-bust so the iframe reloads each generation src = f"{_gr_file(VIEWER_HTML)}?ply={_gr_file(ply_path)}&ts={ts}" return ( f"" ) # ---------------------------------------------------------------------------- # Event handlers # ---------------------------------------------------------------------------- @spaces.GPU def generate(image, seed: int, steps: int, guidance_scale: float, num_gaussians: int, output_format: str, progress=gr.Progress(track_tqdm=True)): """Run the full pipeline (preprocess + encode + sample + decode) in a single GPU acquisition.""" if image is None: raise gr.Error("Please upload an image first.") progress(0, desc="Generating...") t0 = time.time() prepared = PIPE.preprocess_image(image) gen = torch.Generator(device=PIPE._device).manual_seed(int(seed)) cond = PIPE.encode_image(prepared, generator=gen) out = PIPE.sample_latent(cond, steps=int(steps), guidance_scale=float(guidance_scale), generator=gen, show_progress=True) gaussian = PIPE.decode_latent(out["latent"], num_gaussians=int(num_gaussians)) gen_dt = time.time() - t0 out_dir = OUT_ROOT / uuid4().hex[:12] out_dir.mkdir(parents=True, exist_ok=True) ply_path = out_dir / "splat.ply" gaussian.save_ply(str(ply_path)) fmt = output_format.lower() if fmt == "ply": download_path = ply_path elif fmt == "splat": download_path = out_dir / "splat.splat" gaussian.save_splat(str(download_path)) else: raise gr.Error(f"Unknown output format: {output_format}") info = (f"{gaussian.get_xyz.shape[0]:,} gaussians · " f"generation: {gen_dt:.1f}s · saved: {download_path.name}") return prepared, _viewer_iframe(ply_path), gr.update(value=str(download_path), interactive=True), info # ---------------------------------------------------------------------------- # Gradio UI # ---------------------------------------------------------------------------- with gr.Blocks(title="TripoSplat") as demo: gr.Markdown("# TripoSplat") gr.Markdown( "TripoSplat converts a single 2D image into high-quality and variable number of 3D Gaussians, developed by [TripoAI](https://www.tripo3d.ai/). " "It can serve as a powerful pipeline tool for asset creation, AR/VR, game development, simulation environments, and beyond.\n\n" "[Read Paper](https://arxiv.org/abs/2605.16355) | [Technical Blog](https://www.tripo3d.ai/research/triposplat) | [GitHub](https://github.com/VAST-AI-Research/TripoSplat)" ) with gr.Row(): with gr.Column(scale=1): image_in = gr.Image(label="Input image", type="pil", image_mode="RGBA", height=320) gr.Examples( examples=[[p] for p in EXAMPLES], inputs=[image_in], label="Examples (click to load)", examples_per_page=10, cache_examples=False, ) with gr.Accordion("Sampling settings", open=False): seed_in = gr.Number(label="Seed", value=42, precision=0) steps_in = gr.Slider(label="Inference steps", minimum=1, maximum=50, step=1, value=20) cfg_in = gr.Slider(label="Guidance scale", minimum=1.0, maximum=10.0, step=0.5, value=3.0) num_g_in = gr.Dropdown( label="Number of gaussians", choices=["32768", "65536", "131072", "262144"], value="262144", ) fmt_in = gr.Dropdown(label="Download format", choices=["ply", "splat"], value="ply") run_btn = gr.Button("Generate", variant="primary") prepared_out = gr.Image(label="Preprocessed input", interactive=False, height=240) info_out = gr.Markdown() with gr.Column(scale=2): viewer_out = gr.HTML(value=PLACEHOLDER_HTML, label="Spark.js viewer") file_out = gr.DownloadButton(label="Download", value=None, interactive=False) run_btn.click( fn=generate, inputs=[image_in, seed_in, steps_in, cfg_in, num_g_in, fmt_in], outputs=[prepared_out, viewer_out, file_out, info_out], ) if __name__ == "__main__": demo.launch( allowed_paths=[ str(VIEWER_HTML.parent), str(OUT_ROOT), _EXAMPLES_TMPDIR, ], )