TripoSplat / app.py
bennyguo
Inline image_in render; fix example-click misrouted to generate
5df883c
"""TripoSplat Gradio demo with Spark.js in-browser viewer.
Usage: python app.py
"""
import base64
import subprocess
import tempfile
import time
from pathlib import Path
from uuid import uuid4
import gradio as gr
import spaces
import torch
from triposplat import TripoSplatPipeline
import example_inputs_b64 as _b64
# ----------------------------------------------------------------------------
# Download checkpoints from HuggingFace Hub (VAST-AI/TripoSplat)
# ----------------------------------------------------------------------------
subprocess.run(
[
"hf", "download",
"VAST-AI/TripoSplat",
"--local-dir", "ckpts"
],
check=True,
)
# ----------------------------------------------------------------------------
# Pipeline (loaded once at startup)
# ----------------------------------------------------------------------------
PIPE = TripoSplatPipeline(
ckpt_path = "ckpts/diffusion_models/triposplat_fp16.safetensors",
decoder_path = "ckpts/vae/triposplat_vae_decoder_fp16.safetensors",
dinov3_path = "ckpts/clip_vision/dino_v3_vit_h.safetensors",
flux2_vae_encoder_path = "ckpts/vae/flux2-vae.safetensors",
rmbg_path = "ckpts/background_removal/birefnet.safetensors",
device = "cuda",
)
OUT_ROOT = Path("gradio_outputs").resolve()
OUT_ROOT.mkdir(parents=True, exist_ok=True)
VIEWER_HTML = Path("static/viewer/viewer.html").resolve()
# Decode example images from base64 into a persistent temp directory so that
# gr.Examples (which needs file paths) works without binary files in the repo.
_EXAMPLES_TMPDIR = tempfile.mkdtemp(prefix="triposplat_examples_")
def _write_example(varname: str, filename: str) -> str:
path = Path(_EXAMPLES_TMPDIR) / filename
path.write_bytes(base64.b64decode(getattr(_b64, varname)))
return str(path)
EXAMPLES = [
_write_example("CREATURE_BUTTERFLY", "creature_butterfly.webp"),
_write_example("BUILDING_STONE_HOUSE", "building_stone_house.webp"),
_write_example("VEHICLE_PIRATE_SHIP", "vehicle_pirate_ship.webp"),
_write_example("PLANT_WATER_LILY", "plant_water_lily.webp"),
]
PLACEHOLDER_HTML = (
"<div style='display:flex;align-items:center;justify-content:center;height:520px;"
"color:#94a3b8;font:16px system-ui;background:#111318;border-radius:12px'>"
"3D viewer will appear here after generation</div>"
)
def _gr_file(path: Path) -> str:
"""Gradio serves any file under `allowed_paths` at `/gradio_api/file=<abspath>`."""
return f"/gradio_api/file={path.as_posix()}"
def _viewer_iframe(ply_path: Path) -> str:
ts = time.time() # cache-bust so the iframe reloads each generation
src = f"{_gr_file(VIEWER_HTML)}?ply={_gr_file(ply_path)}&ts={ts}"
return (
f"<iframe src='{src}' "
"style='width:100%;height:520px;border:0;border-radius:12px;background:#0a0b0e'></iframe>"
)
# ----------------------------------------------------------------------------
# Event handlers
# ----------------------------------------------------------------------------
@spaces.GPU
def generate(image, seed: int, steps: int, guidance_scale: float,
num_gaussians: int, output_format: str,
progress=gr.Progress(track_tqdm=True)):
"""Run the full pipeline (preprocess + encode + sample + decode) in a
single GPU acquisition."""
if image is None:
raise gr.Error("Please upload an image first.")
progress(0, desc="Generating...")
t0 = time.time()
prepared = PIPE.preprocess_image(image)
gen = torch.Generator(device=PIPE._device).manual_seed(int(seed))
cond = PIPE.encode_image(prepared, generator=gen)
out = PIPE.sample_latent(cond, steps=int(steps),
guidance_scale=float(guidance_scale),
generator=gen, show_progress=True)
gaussian = PIPE.decode_latent(out["latent"], num_gaussians=int(num_gaussians))
gen_dt = time.time() - t0
out_dir = OUT_ROOT / uuid4().hex[:12]
out_dir.mkdir(parents=True, exist_ok=True)
ply_path = out_dir / "splat.ply"
gaussian.save_ply(str(ply_path))
fmt = output_format.lower()
if fmt == "ply":
download_path = ply_path
elif fmt == "splat":
download_path = out_dir / "splat.splat"
gaussian.save_splat(str(download_path))
else:
raise gr.Error(f"Unknown output format: {output_format}")
info = (f"{gaussian.get_xyz.shape[0]:,} gaussians · "
f"generation: {gen_dt:.1f}s · saved: {download_path.name}")
return prepared, _viewer_iframe(ply_path), gr.update(value=str(download_path), interactive=True), info
# ----------------------------------------------------------------------------
# Gradio UI
# ----------------------------------------------------------------------------
with gr.Blocks(title="TripoSplat") as demo:
gr.Markdown("# TripoSplat")
gr.Markdown(
"TripoSplat converts a single 2D image into high-quality and variable number of 3D Gaussians, developed by [TripoAI](https://www.tripo3d.ai/). "
"It can serve as a powerful pipeline tool for asset creation, AR/VR, game development, simulation environments, and beyond.\n\n"
"[Read Paper](https://arxiv.org/abs/2605.16355) | [Technical Blog](https://www.tripo3d.ai/research/triposplat) | [GitHub](https://github.com/VAST-AI-Research/TripoSplat)"
)
with gr.Row():
with gr.Column(scale=1):
image_in = gr.Image(label="Input image", type="pil", image_mode="RGBA",
height=320)
gr.Examples(
examples=[[p] for p in EXAMPLES],
inputs=[image_in],
label="Examples (click to load)",
examples_per_page=10,
cache_examples=False,
)
with gr.Accordion("Sampling settings", open=False):
seed_in = gr.Number(label="Seed", value=42, precision=0)
steps_in = gr.Slider(label="Inference steps", minimum=1, maximum=50, step=1, value=20)
cfg_in = gr.Slider(label="Guidance scale", minimum=1.0, maximum=10.0, step=0.5, value=3.0)
num_g_in = gr.Dropdown(
label="Number of gaussians",
choices=["32768", "65536", "131072", "262144"],
value="262144",
)
fmt_in = gr.Dropdown(label="Download format", choices=["ply", "splat"], value="ply")
run_btn = gr.Button("Generate", variant="primary")
prepared_out = gr.Image(label="Preprocessed input", interactive=False, height=240)
info_out = gr.Markdown()
with gr.Column(scale=2):
viewer_out = gr.HTML(value=PLACEHOLDER_HTML, label="Spark.js viewer")
file_out = gr.DownloadButton(label="Download", value=None, interactive=False)
run_btn.click(
fn=generate,
inputs=[image_in, seed_in, steps_in, cfg_in, num_g_in, fmt_in],
outputs=[prepared_out, viewer_out, file_out, info_out],
)
if __name__ == "__main__":
demo.launch(
allowed_paths=[
str(VIEWER_HTML.parent),
str(OUT_ROOT),
_EXAMPLES_TMPDIR,
],
)