Upload folder using huggingface_hub
Browse files
- ckpts/hdri_encoder_4096tokens_fp16.json +11 -0
- ckpts/hdri_encoder_4096tokens_fp16.pt +3 -0
- ckpts/neural_basis_3layer_relu_fp16.json +14 -0
- ckpts/neural_basis_3layer_relu_fp16.pt +3 -0
- ckpts/slat_dec_gs_swin8_B_64l8gs32_fp16.json +16 -0
- ckpts/slat_dec_gs_swin8_B_64l8gs32_fp16.pt +3 -0
- ckpts/slat_flow_img_dit_L_64l8p2_fp16.json +19 -0
- ckpts/slat_flow_img_dit_L_64l8p2_fp16_18w.pt +3 -0
- ckpts/slat_flow_img_dit_L_64l8p2_fp16_23w.pt +3 -0
- ckpts/slat_renderder_gs_swin8_B_64l8gs32_fp16.json +42 -0
- ckpts/slat_renderder_gs_swin8_B_64l8gs32_fp16.pt +3 -0
- pipeline.yaml +51 -0
- weights/RealESRGAN_x4plus.pth +3 -0
ckpts/hdri_encoder_4096tokens_fp16.json
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"name": "Hdri_Encoder",
|
| 3 |
+
"args": {
|
| 4 |
+
"output_dim": 768,
|
| 5 |
+
"num_tokens": 4096,
|
| 6 |
+
"cnn_out_channels": 256,
|
| 7 |
+
"n_heads": 12,
|
| 8 |
+
"num_transformer_layers": 3,
|
| 9 |
+
"rope_base": 10000.0
|
| 10 |
+
}
|
| 11 |
+
}
|
ckpts/hdri_encoder_4096tokens_fp16.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c763776c1fe8d4857283356349f26bcd286b8f631d4e3951f087348b031af052
|
| 3 |
+
size 868756605
|
ckpts/neural_basis_3layer_relu_fp16.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"name": "NeuralBasis",
|
| 3 |
+
"args":{
|
| 4 |
+
"input_dim": 32,
|
| 5 |
+
"output_dim": 5,
|
| 6 |
+
"hidden_dim": 64,
|
| 7 |
+
"num_layers": 3,
|
| 8 |
+
"use_normal": true,
|
| 9 |
+
"activation": "relu",
|
| 10 |
+
"normal_dim": 3,
|
| 11 |
+
"num_frequencies": 4,
|
| 12 |
+
"use_residual": false
|
| 13 |
+
}
|
| 14 |
+
}
|
ckpts/neural_basis_3layer_relu_fp16.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0b4ca2ec379c93784841ed3be7c7042117accfa3d93c9e893e9fcbccc51d022
|
| 3 |
+
size 840373734
|
ckpts/slat_dec_gs_swin8_B_64l8gs32_fp16.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"name": "SLatGaussianDecoder",
|
| 3 |
+
"args": {
|
| 4 |
+
"resolution": 64,
|
| 5 |
+
"model_channels": 768,
|
| 6 |
+
"latent_channels": 8,
|
| 7 |
+
"cond_channels": 768,
|
| 8 |
+
"num_blocks": 12,
|
| 9 |
+
"num_register_tokens": 16,
|
| 10 |
+
"num_heads": 12,
|
| 11 |
+
"mlp_ratio": 4,
|
| 12 |
+
"attn_mode": "swin",
|
| 13 |
+
"window_size": 8,
|
| 14 |
+
"use_fp16": true
|
| 15 |
+
}
|
| 16 |
+
}
|
ckpts/slat_dec_gs_swin8_B_64l8gs32_fp16.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6eda01884ae8746b44d977aff0514287224bc7f63bedf67269c974a35db3723c
|
| 3 |
+
size 840401603
|
ckpts/slat_flow_img_dit_L_64l8p2_fp16.json
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"name": "SLatFlowModel",
|
| 3 |
+
"args": {
|
| 4 |
+
"resolution": 64,
|
| 5 |
+
"in_channels": 8,
|
| 6 |
+
"out_channels": 8,
|
| 7 |
+
"model_channels": 1024,
|
| 8 |
+
"cond_channels": 1024,
|
| 9 |
+
"num_blocks": 24,
|
| 10 |
+
"num_heads": 16,
|
| 11 |
+
"mlp_ratio": 4,
|
| 12 |
+
"patch_size": 2,
|
| 13 |
+
"num_io_res_blocks": 2,
|
| 14 |
+
"io_block_channels": [128],
|
| 15 |
+
"pe_mode": "ape",
|
| 16 |
+
"qk_rms_norm": true,
|
| 17 |
+
"use_fp16": true
|
| 18 |
+
}
|
| 19 |
+
}
|
ckpts/slat_flow_img_dit_L_64l8p2_fp16_18w.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:decc9df7523b0aefc87fd097acedfd6777e93e85d3b9eb74b56fffa8348a2015
|
| 3 |
+
size 2401821834
|
ckpts/slat_flow_img_dit_L_64l8p2_fp16_23w.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d92835a8792e90687fed8c939d34959e94e73c30768d3343581a9f7b951c22ff
|
| 3 |
+
size 2401821834
|
ckpts/slat_renderder_gs_swin8_B_64l8gs32_fp16.json
ADDED
|
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"name": "SLatGaussianRenderer",
|
| 3 |
+
"args": {
|
| 4 |
+
"resolution": 64,
|
| 5 |
+
"model_channels": 768,
|
| 6 |
+
"latent_channels": 768,
|
| 7 |
+
"cond_channels": 768,
|
| 8 |
+
"num_blocks": 6,
|
| 9 |
+
"num_register_tokens": 16,
|
| 10 |
+
"num_heads": 12,
|
| 11 |
+
"mlp_ratio": 4,
|
| 12 |
+
"attn_mode": "swin",
|
| 13 |
+
"window_size": 8,
|
| 14 |
+
"use_fp16": true,
|
| 15 |
+
"representation_config": {
|
| 16 |
+
"lr": {
|
| 17 |
+
"_xyz": 1.0,
|
| 18 |
+
"_base_color": 1.0,
|
| 19 |
+
"_roughness": 1.0,
|
| 20 |
+
"_metallic": 1.0,
|
| 21 |
+
"_scaling": 1.0,
|
| 22 |
+
"_scaling_view": 1.0,
|
| 23 |
+
"_rotation": 0.2,
|
| 24 |
+
"_opacity": 1.0,
|
| 25 |
+
"_shadow": 0.5,
|
| 26 |
+
"_brightness": 0.5,
|
| 27 |
+
"_pbr1": 0.5,
|
| 28 |
+
"_hdri1": 0.5,
|
| 29 |
+
"_hdri2": 0.5,
|
| 30 |
+
"_rgb": 1.0
|
| 31 |
+
},
|
| 32 |
+
"perturb_offset": true,
|
| 33 |
+
"voxel_size": 1.5,
|
| 34 |
+
"num_gaussians": 32,
|
| 35 |
+
"2d_filter_kernel_size": 0.1,
|
| 36 |
+
"3d_filter_kernel_size": 9e-4,
|
| 37 |
+
"scaling_bias": 4e-3,
|
| 38 |
+
"opacity_bias": 0.1,
|
| 39 |
+
"scaling_activation": "softplus"
|
| 40 |
+
}
|
| 41 |
+
}
|
| 42 |
+
}
|
ckpts/slat_renderder_gs_swin8_B_64l8gs32_fp16.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b9c8f5fc1acb8477656bf5391f92051c80dfe212d8f0035207d92d8966573547
|
| 3 |
+
size 840392413
|
pipeline.yaml
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
name: NeARImageToRelightable3DPipeline
|
| 2 |
+
args:
|
| 3 |
+
models:
|
| 4 |
+
decoder: ckpts/slat_dec_gs_swin8_B_64l8gs32_fp16
|
| 5 |
+
hdri_encoder: ckpts/hdri_encoder_4096tokens_fp16
|
| 6 |
+
neural_basis: ckpts/neural_basis_3layer_relu_fp16
|
| 7 |
+
renderer: ckpts/slat_renderder_gs_swin8_B_64l8gs32_fp16
|
| 8 |
+
slat_flow_model: ckpts/slat_flow_img_dit_L_64l8p2_fp16
|
| 9 |
+
|
| 10 |
+
hyshape:
|
| 11 |
+
model_id: tencent/Hunyuan3D-2.1 # or a custom local path if you have already downloaded the model; see https://huggingface.co/tencent/Hunyuan3D-2.1/tree/main/hunyuan3d-dit-v2-1
|
| 12 |
+
|
| 13 |
+
# ultrashape:
|
| 14 |
+
# model_id: infinith/UltraShape # or a custom local path if you have already downloaded the model; see https://huggingface.co/infinith/UltraShape
|
| 15 |
+
|
| 16 |
+
sr_model:
|
| 17 |
+
model_path: weights/RealESRGAN_x4plus.pth
|
| 18 |
+
|
| 19 |
+
slat_sampler:
|
| 20 |
+
name: FlowEulerGuidanceIntervalSampler
|
| 21 |
+
args:
|
| 22 |
+
sigma_min: 0.00001
|
| 23 |
+
params:
|
| 24 |
+
steps: 25
|
| 25 |
+
cfg_strength: 5.0
|
| 26 |
+
cfg_interval:
|
| 27 |
+
- 0.5
|
| 28 |
+
- 1.0
|
| 29 |
+
rescale_t: 3.0
|
| 30 |
+
|
| 31 |
+
slat_normalization:
|
| 32 |
+
mean:
|
| 33 |
+
- -2.1687545776367188
|
| 34 |
+
- -0.004347046371549368
|
| 35 |
+
- -0.13352349400520325
|
| 36 |
+
- -0.08418072760105133
|
| 37 |
+
- -0.5271206498146057
|
| 38 |
+
- 0.7238689064979553
|
| 39 |
+
- -1.1414450407028198
|
| 40 |
+
- 1.2039363384246826
|
| 41 |
+
std:
|
| 42 |
+
- 2.377650737762451
|
| 43 |
+
- 2.386378288269043
|
| 44 |
+
- 2.124418020248413
|
| 45 |
+
- 2.1748552322387695
|
| 46 |
+
- 2.663944721221924
|
| 47 |
+
- 2.371192216873169
|
| 48 |
+
- 2.6217446327209473
|
| 49 |
+
- 2.684523105621338
|
| 50 |
+
|
| 51 |
+
image_cond_model: dinov2_vitl14_reg
|
weights/RealESRGAN_x4plus.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4fa0d38905f75ac06eb49a7951b426670021be3018265fd191d2125df9d682f1
|
| 3 |
+
size 67040989
|