Spaces:
Running on Zero
Running on Zero
File size: 7,302 Bytes
c43e1bf 0798bf7 db54c72 c43e1bf db54c72 c43e1bf db54c72 c43e1bf db54c72 c43e1bf 7f89ce5 c43e1bf 5df883c c43e1bf db54c72 c43e1bf | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 | """TripoSplat Gradio demo with Spark.js in-browser viewer.
Usage: python app.py
"""
import base64
import subprocess
import tempfile
import time
from pathlib import Path
from uuid import uuid4
import gradio as gr
import spaces
import torch
from triposplat import TripoSplatPipeline
import example_inputs_b64 as _b64
# ----------------------------------------------------------------------------
# Download checkpoints from HuggingFace Hub (VAST-AI/TripoSplat)
# ----------------------------------------------------------------------------
subprocess.run(
[
"hf", "download",
"VAST-AI/TripoSplat",
"--local-dir", "ckpts"
],
check=True,
)
# ----------------------------------------------------------------------------
# Pipeline (loaded once at startup)
# ----------------------------------------------------------------------------
PIPE = TripoSplatPipeline(
ckpt_path = "ckpts/diffusion_models/triposplat_fp16.safetensors",
decoder_path = "ckpts/vae/triposplat_vae_decoder_fp16.safetensors",
dinov3_path = "ckpts/clip_vision/dino_v3_vit_h.safetensors",
flux2_vae_encoder_path = "ckpts/vae/flux2-vae.safetensors",
rmbg_path = "ckpts/background_removal/birefnet.safetensors",
device = "cuda",
)
OUT_ROOT = Path("gradio_outputs").resolve()
OUT_ROOT.mkdir(parents=True, exist_ok=True)
VIEWER_HTML = Path("static/viewer/viewer.html").resolve()
# Decode example images from base64 into a persistent temp directory so that
# gr.Examples (which needs file paths) works without binary files in the repo.
_EXAMPLES_TMPDIR = tempfile.mkdtemp(prefix="triposplat_examples_")
def _write_example(varname: str, filename: str) -> str:
path = Path(_EXAMPLES_TMPDIR) / filename
path.write_bytes(base64.b64decode(getattr(_b64, varname)))
return str(path)
EXAMPLES = [
_write_example("CREATURE_BUTTERFLY", "creature_butterfly.webp"),
_write_example("BUILDING_STONE_HOUSE", "building_stone_house.webp"),
_write_example("VEHICLE_PIRATE_SHIP", "vehicle_pirate_ship.webp"),
_write_example("PLANT_WATER_LILY", "plant_water_lily.webp"),
]
PLACEHOLDER_HTML = (
"<div style='display:flex;align-items:center;justify-content:center;height:520px;"
"color:#94a3b8;font:16px system-ui;background:#111318;border-radius:12px'>"
"3D viewer will appear here after generation</div>"
)
def _gr_file(path: Path) -> str:
"""Gradio serves any file under `allowed_paths` at `/gradio_api/file=<abspath>`."""
return f"/gradio_api/file={path.as_posix()}"
def _viewer_iframe(ply_path: Path) -> str:
ts = time.time() # cache-bust so the iframe reloads each generation
src = f"{_gr_file(VIEWER_HTML)}?ply={_gr_file(ply_path)}&ts={ts}"
return (
f"<iframe src='{src}' "
"style='width:100%;height:520px;border:0;border-radius:12px;background:#0a0b0e'></iframe>"
)
# ----------------------------------------------------------------------------
# Event handlers
# ----------------------------------------------------------------------------
@spaces.GPU
def generate(image, seed: int, steps: int, guidance_scale: float,
num_gaussians: int, output_format: str,
progress=gr.Progress(track_tqdm=True)):
"""Run the full pipeline (preprocess + encode + sample + decode) in a
single GPU acquisition."""
if image is None:
raise gr.Error("Please upload an image first.")
progress(0, desc="Generating...")
t0 = time.time()
prepared = PIPE.preprocess_image(image)
gen = torch.Generator(device=PIPE._device).manual_seed(int(seed))
cond = PIPE.encode_image(prepared, generator=gen)
out = PIPE.sample_latent(cond, steps=int(steps),
guidance_scale=float(guidance_scale),
generator=gen, show_progress=True)
gaussian = PIPE.decode_latent(out["latent"], num_gaussians=int(num_gaussians))
gen_dt = time.time() - t0
out_dir = OUT_ROOT / uuid4().hex[:12]
out_dir.mkdir(parents=True, exist_ok=True)
ply_path = out_dir / "splat.ply"
gaussian.save_ply(str(ply_path))
fmt = output_format.lower()
if fmt == "ply":
download_path = ply_path
elif fmt == "splat":
download_path = out_dir / "splat.splat"
gaussian.save_splat(str(download_path))
else:
raise gr.Error(f"Unknown output format: {output_format}")
info = (f"{gaussian.get_xyz.shape[0]:,} gaussians · "
f"generation: {gen_dt:.1f}s · saved: {download_path.name}")
return prepared, _viewer_iframe(ply_path), gr.update(value=str(download_path), interactive=True), info
# ----------------------------------------------------------------------------
# Gradio UI
# ----------------------------------------------------------------------------
with gr.Blocks(title="TripoSplat") as demo:
gr.Markdown("# TripoSplat")
gr.Markdown(
"TripoSplat converts a single 2D image into high-quality and variable number of 3D Gaussians, developed by [TripoAI](https://www.tripo3d.ai/). "
"It can serve as a powerful pipeline tool for asset creation, AR/VR, game development, simulation environments, and beyond.\n\n"
"[Read Paper](https://arxiv.org/abs/2605.16355) | [Technical Blog](https://www.tripo3d.ai/research/triposplat) | [GitHub](https://github.com/VAST-AI-Research/TripoSplat)"
)
with gr.Row():
with gr.Column(scale=1):
image_in = gr.Image(label="Input image", type="pil", image_mode="RGBA",
height=320)
gr.Examples(
examples=[[p] for p in EXAMPLES],
inputs=[image_in],
label="Examples (click to load)",
examples_per_page=10,
cache_examples=False,
)
with gr.Accordion("Sampling settings", open=False):
seed_in = gr.Number(label="Seed", value=42, precision=0)
steps_in = gr.Slider(label="Inference steps", minimum=1, maximum=50, step=1, value=20)
cfg_in = gr.Slider(label="Guidance scale", minimum=1.0, maximum=10.0, step=0.5, value=3.0)
num_g_in = gr.Dropdown(
label="Number of gaussians",
choices=["32768", "65536", "131072", "262144"],
value="262144",
)
fmt_in = gr.Dropdown(label="Download format", choices=["ply", "splat"], value="ply")
run_btn = gr.Button("Generate", variant="primary")
prepared_out = gr.Image(label="Preprocessed input", interactive=False, height=240)
info_out = gr.Markdown()
with gr.Column(scale=2):
viewer_out = gr.HTML(value=PLACEHOLDER_HTML, label="Spark.js viewer")
file_out = gr.DownloadButton(label="Download", value=None, interactive=False)
run_btn.click(
fn=generate,
inputs=[image_in, seed_in, steps_in, cfg_in, num_g_in, fmt_in],
outputs=[prepared_out, viewer_out, file_out, info_out],
)
if __name__ == "__main__":
demo.launch(
allowed_paths=[
str(VIEWER_HTML.parent),
str(OUT_ROOT),
_EXAMPLES_TMPDIR,
],
)
|