File size: 3,512 Bytes
1c3643f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
{
    "models": {
        "property_encoder": {
            "name": "ElasticPropertyEncoder",
            "args": {
                "resolution": 64,
                "in_channels": 3072,
                "in_channels_phy": 14,
                "model_channels": 768,
                "latent_channels": 8,
                "num_blocks": 4,
                "num_heads": 12,
                "mlp_ratio": 4,
                "attn_mode": "swin",
                "window_size": 8,
                "use_fp16": true
            }
        },
        "property_decoder": {
            "name": "ElasticPropertyDecoder",
            "args": {
                "resolution": 64,
                "model_channels": 2048,
                "latent_channels": 8,
                "num_blocks": 4,
                "num_heads": 16,
                "mlp_ratio": 4,
                "attn_mode": "swin",
                "window_size": 8,
                "use_fp16": true,
                "representation_config": {
                    "use_color": true
                }
            }
        },
        "property_output": {
            "name": "PropertyOutput",
            "args": {
                "model_channels": 32,
                "output_channels_lang": 3072,
                "output_channels_phy": 14,
                "use_fp16": true
            }
        },
        "decoder": {
            "name": "ElasticSLatMeshDecodernew",
            "args": {
                "resolution": 64,
                "model_channels": 768,
                "phy_channels": 2048,
                "latent_channels": 8,
                "num_blocks": 12,
                "num_heads": 12,
                "mlp_ratio": 4,
                "attn_mode": "swin",
                "window_size": 8,
                "use_fp16": true,
                "representation_config": {
                    "use_color": true
                }
            }
        }
    },
    "dataset": {
        "name": "Slat2RenderGeomesh",
        "args": {
            "image_size": 384,
            "latent_model": "dinov2_vitl14_reg_slat_enc_swin8_B_64l8_fp16",
            "min_aesthetic_score": 4.5,
            "max_num_voxels": 28000
        }
    },
    "trainer": {
        "name": "SLatVaeMeshTrainer",
        "args": {
            "onlyphy_property": true,
            "max_steps": 1000000,
            "batch_size_per_gpu": 4,
            "batch_split": 4,
            "optimizer": {
                "name": "AdamW",
                "args": {
                    "lr": 0.0001,
                    "weight_decay": 0.0
                }
            },
            "ema_rate": [
                0.9999
            ],
            "fp16_mode": "inflat_all",
            "fp16_scale_growth": 0.001,
            "elastic": {
                "name": "LinearMemoryController",
                "args": {
                    "target_ratio": 0.6,
                    "max_mem_ratio_start": 0.5
                }
            },
            "grad_clip": {
                "name": "AdaptiveGradClipper",
                "args": {
                    "max_norm": 1.0,
                    "clip_percentile": 95
                }
            },
            "i_log": 10,
            "i_sample": 5000,
            "i_save": 10000,
            "lambda_ssim": 0.2,
            "lambda_lpips": 0.2,
            "lambda_tsdf": 0.01,
            "lambda_depth": 10.0,
            "lambda_color": 0.1,
            "lambda_kl": 1e-06,
            "depth_loss_type": "smooth_l1"
        }
    }
}