| import os |
| import torch |
| import argparse |
| from PIL import Image |
|
|
| |
| import sys |
| sys.path.append(os.getcwd()) |
| sys.path.append(os.path.join(os.getcwd(), 'third_parties/dsine')) |
|
|
| from anigen.pipelines import AnigenImageTo3DPipeline |
| from anigen.utils.random_utils import set_random_seed |
| from anigen.utils.image_utils import _expand_image_inputs |
| from anigen.utils.ckpt_utils import ensure_ckpts |
|
|
|
|
| @torch.no_grad() |
| def main(): |
|
|
| parser = argparse.ArgumentParser() |
| parser.add_argument('--image_path', type=str, required=True, help='Path to input image or a folder of images') |
| parser.add_argument('--ss_flow_path', type=str, required=False, default='ckpts/anigen/ss_flow_duet', help='Path to SS Flow model directory') |
| parser.add_argument('--slat_flow_path', type=str, required=False, default='ckpts/anigen/slat_flow_auto', help='Path to SLat Flow model directory') |
| parser.add_argument('--output_dir', type=str, default='results/', help='Output directory') |
| parser.add_argument('--seed', type=int, default=42) |
| parser.add_argument('--cfg_scale_ss', type=float, default=7.5, help='Classifier-free guidance scale') |
| parser.add_argument('--cfg_scale', type=float, default=3.0, help='Classifier-free guidance scale') |
| parser.add_argument('--deterministic', action='store_true', help='Enable mostly-deterministic torch behavior (may be slower)') |
| parser.add_argument('--device', type=str, default='cuda') |
| parser.add_argument('--use_ema', action='store_true', help='Use EMA checkpoint if available') |
|
|
| parser.add_argument( |
| '--output_name', |
| type=str, |
| default=None, |
| help='Optional subfolder name to save outputs under `--output_dir`. If not provided, the image filename stem is used.', |
| ) |
|
|
| parser.add_argument('--no_smooth_skin_weights', action='store_true', help='Disable skin-weight smoothing') |
| parser.add_argument('--smooth_skin_weights_iters', type=int, default=100, help='Number of smoothing iterations (default: 100)') |
| parser.add_argument('--smooth_skin_weights_alpha', type=float, default=1.0, help='Smoothing alpha (default: 1.0)') |
|
|
| parser.add_argument( |
| '--no_filter_skin_weights', |
| action='store_true', |
| help='Use geodesic distribution to filter mesh skinning weights.', |
| ) |
|
|
| parser.add_argument( |
| '--joints_density', '--joint_density', |
| type=int, |
| default=1, |
| help='Optional joint density level for Slat flow (from 0 to 4, higher means more joints)', |
| ) |
| args = parser.parse_args() |
|
|
| base_output_dir = args.output_dir |
| input_image_paths, is_dir = _expand_image_inputs(args.image_path) |
| if is_dir and len(input_image_paths) == 0: |
| raise ValueError(f"No supported images found under directory: {args.image_path}") |
|
|
| |
| |
| batch_folder_name = None |
| if is_dir: |
| batch_folder_name = args.output_name if (args.output_name is not None and str(args.output_name).strip() != '') else os.path.basename(os.path.normpath(args.image_path)) |
| set_random_seed(args.seed, deterministic=args.deterministic) |
|
|
| ensure_ckpts() |
|
|
| print("Loading models...") |
| pipeline = AnigenImageTo3DPipeline.from_pretrained( |
| ss_flow_path=args.ss_flow_path, |
| slat_flow_path=args.slat_flow_path, |
| device=args.device, |
| use_ema=args.use_ema |
| ) |
| pipeline.cuda() |
|
|
| for idx, cur_image_path in enumerate(input_image_paths): |
| |
| image_stem = os.path.splitext(os.path.basename(cur_image_path))[0] |
| if is_dir: |
| args.output_dir = os.path.join(base_output_dir, str(batch_folder_name), image_stem) |
| else: |
| |
| folder_name = args.output_name if (args.output_name is not None and str(args.output_name).strip() != '') else image_stem |
| args.output_dir = os.path.join(base_output_dir, folder_name) |
| os.makedirs(args.output_dir, exist_ok=True) |
|
|
| |
| args.image_path = cur_image_path |
| print(f"Processing image {idx + 1}/{len(input_image_paths)}: {cur_image_path}") |
| image = Image.open(cur_image_path) |
| |
| |
| output_glb_path = os.path.join(args.output_dir, 'mesh.glb') |
| outputs = pipeline.run( |
| image, |
| seed=args.seed, |
| cfg_scale_ss=args.cfg_scale_ss, |
| cfg_scale_slat=args.cfg_scale, |
| joints_density=args.joints_density, |
| no_smooth_skin_weights=args.no_smooth_skin_weights, |
| no_filter_skin_weights=args.no_filter_skin_weights, |
| smooth_skin_weights_iters=args.smooth_skin_weights_iters, |
| smooth_skin_weights_alpha=args.smooth_skin_weights_alpha, |
| output_glb=output_glb_path |
| ) |
| |
| |
| outputs['processed_image'].save(os.path.join(args.output_dir, 'processed_image.png')) |
|
|
| |
| if __name__ == '__main__': |
| main() |
|
|