luh0502 committed on
Commit
fab99f0
·
verified ·
1 Parent(s): bff2bf4

Upload folder using huggingface_hub

Browse files
ckpts/hdri_encoder_4096tokens_fp16.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "Hdri_Encoder",
3
+ "args": {
4
+ "output_dim": 768,
5
+ "num_tokens": 4096,
6
+ "cnn_out_channels": 256,
7
+ "n_heads": 12,
8
+ "num_transformer_layers": 3,
9
+ "rope_base": 10000.0
10
+ }
11
+ }
ckpts/hdri_encoder_4096tokens_fp16.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c763776c1fe8d4857283356349f26bcd286b8f631d4e3951f087348b031af052
3
+ size 868756605
ckpts/neural_basis_3layer_relu_fp16.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "NeuralBasis",
3
+ "args":{
4
+ "input_dim": 32,
5
+ "output_dim": 5,
6
+ "hidden_dim": 64,
7
+ "num_layers": 3,
8
+ "use_normal": true,
9
+ "activation": "relu",
10
+ "normal_dim": 3,
11
+ "num_frequencies": 4,
12
+ "use_residual": false
13
+ }
14
+ }
ckpts/neural_basis_3layer_relu_fp16.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0b4ca2ec379c93784841ed3be7c7042117accfa3d93c9e893e9fcbccc51d022
3
+ size 840373734
ckpts/slat_dec_gs_swin8_B_64l8gs32_fp16.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "SLatGaussianDecoder",
3
+ "args": {
4
+ "resolution": 64,
5
+ "model_channels": 768,
6
+ "latent_channels": 8,
7
+ "cond_channels": 768,
8
+ "num_blocks": 12,
9
+ "num_register_tokens": 16,
10
+ "num_heads": 12,
11
+ "mlp_ratio": 4,
12
+ "attn_mode": "swin",
13
+ "window_size": 8,
14
+ "use_fp16": true
15
+ }
16
+ }
ckpts/slat_dec_gs_swin8_B_64l8gs32_fp16.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6eda01884ae8746b44d977aff0514287224bc7f63bedf67269c974a35db3723c
3
+ size 840401603
ckpts/slat_flow_img_dit_L_64l8p2_fp16.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "SLatFlowModel",
3
+ "args": {
4
+ "resolution": 64,
5
+ "in_channels": 8,
6
+ "out_channels": 8,
7
+ "model_channels": 1024,
8
+ "cond_channels": 1024,
9
+ "num_blocks": 24,
10
+ "num_heads": 16,
11
+ "mlp_ratio": 4,
12
+ "patch_size": 2,
13
+ "num_io_res_blocks": 2,
14
+ "io_block_channels": [128],
15
+ "pe_mode": "ape",
16
+ "qk_rms_norm": true,
17
+ "use_fp16": true
18
+ }
19
+ }
ckpts/slat_flow_img_dit_L_64l8p2_fp16_18w.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:decc9df7523b0aefc87fd097acedfd6777e93e85d3b9eb74b56fffa8348a2015
3
+ size 2401821834
ckpts/slat_flow_img_dit_L_64l8p2_fp16_23w.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d92835a8792e90687fed8c939d34959e94e73c30768d3343581a9f7b951c22ff
3
+ size 2401821834
ckpts/slat_renderder_gs_swin8_B_64l8gs32_fp16.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "SLatGaussianRenderer",
3
+ "args": {
4
+ "resolution": 64,
5
+ "model_channels": 768,
6
+ "latent_channels": 768,
7
+ "cond_channels": 768,
8
+ "num_blocks": 6,
9
+ "num_register_tokens": 16,
10
+ "num_heads": 12,
11
+ "mlp_ratio": 4,
12
+ "attn_mode": "swin",
13
+ "window_size": 8,
14
+ "use_fp16": true,
15
+ "representation_config": {
16
+ "lr": {
17
+ "_xyz": 1.0,
18
+ "_base_color": 1.0,
19
+ "_roughness": 1.0,
20
+ "_metallic": 1.0,
21
+ "_scaling": 1.0,
22
+ "_scaling_view": 1.0,
23
+ "_rotation": 0.2,
24
+ "_opacity": 1.0,
25
+ "_shadow": 0.5,
26
+ "_brightness": 0.5,
27
+ "_pbr1": 0.5,
28
+ "_hdri1": 0.5,
29
+ "_hdri2": 0.5,
30
+ "_rgb": 1.0
31
+ },
32
+ "perturb_offset": true,
33
+ "voxel_size": 1.5,
34
+ "num_gaussians": 32,
35
+ "2d_filter_kernel_size": 0.1,
36
+ "3d_filter_kernel_size": 9e-4,
37
+ "scaling_bias": 4e-3,
38
+ "opacity_bias": 0.1,
39
+ "scaling_activation": "softplus"
40
+ }
41
+ }
42
+ }
ckpts/slat_renderder_gs_swin8_B_64l8gs32_fp16.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9c8f5fc1acb8477656bf5391f92051c80dfe212d8f0035207d92d8966573547
3
+ size 840392413
pipeline.yaml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: NeARImageToRelightable3DPipeline
2
+ args:
3
+ models:
4
+ decoder: ckpts/slat_dec_gs_swin8_B_64l8gs32_fp16
5
+ hdri_encoder: ckpts/hdri_encoder_4096tokens_fp16
6
+ neural_basis: ckpts/neural_basis_3layer_relu_fp16
7
+ renderer: ckpts/slat_renderder_gs_swin8_B_64l8gs32_fp16
8
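+ slat_flow_model: ckpts/slat_flow_img_dit_L_64l8p2_fp16 # NOTE(review): this commit adds only *_fp16_18w.pt and *_fp16_23w.pt weights for this model (the .json matches this stem) - confirm how the loader picks the weight file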
9
+
10
+ hyshape:
11
+ model_id: tencent/Hunyuan3D-2.1 # Hub repo id, or a local path if the model has already been downloaded (see https://huggingface.co/tencent/Hunyuan3D-2.1/tree/main/hunyuan3d-dit-v2-1)
12
+
13
+ # ultrashape:
14
+ # model_id: infinith/UltraShape # Hub repo id, or a local path if the model has already been downloaded (see https://huggingface.co/infinith/UltraShape)
15
+
16
+ sr_model:
17
+ model_path: weights/RealESRGAN_x4plus.pth
18
+
19
+ slat_sampler:
20
+ name: FlowEulerGuidanceIntervalSampler
21
+ args:
22
+ sigma_min: 0.00001
23
+ params:
24
+ steps: 25
25
+ cfg_strength: 5.0
26
+ cfg_interval:
27
+ - 0.5
28
+ - 1.0
29
+ rescale_t: 3.0
30
+
31
+ slat_normalization:
32
+ mean:
33
+ - -2.1687545776367188
34
+ - -0.004347046371549368
35
+ - -0.13352349400520325
36
+ - -0.08418072760105133
37
+ - -0.5271206498146057
38
+ - 0.7238689064979553
39
+ - -1.1414450407028198
40
+ - 1.2039363384246826
41
+ std:
42
+ - 2.377650737762451
43
+ - 2.386378288269043
44
+ - 2.124418020248413
45
+ - 2.1748552322387695
46
+ - 2.663944721221924
47
+ - 2.371192216873169
48
+ - 2.6217446327209473
49
+ - 2.684523105621338
50
+
51
+ image_cond_model: dinov2_vitl14_reg
weights/RealESRGAN_x4plus.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fa0d38905f75ac06eb49a7951b426670021be3018265fd191d2125df9d682f1
3
+ size 67040989