apozz committed on
Commit
9bc54ed
·
verified ·
1 Parent(s): 94d3272

Upload ss_generator.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. ss_generator.yaml +141 -0
ss_generator.yaml ADDED
@@ -0,0 +1,141 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ module:
2
+ condition_embedder:
3
+ backbone:
4
+ _target_: sam3d_objects.model.backbone.dit.embedder.embedder_fuser.EmbedderFuser
5
+ drop_modalities_weight:
6
+ - - - pointmap
7
+ - rgb_pointmap
8
+ - 1.0
9
+ dropout_prob: 0.1
10
+ embedder_list:
11
+ - - _target_: sam3d_objects.model.backbone.dit.embedder.dino.Dino
12
+ dino_model: dinov2_vitl14_reg
13
+ input_size: 518
14
+ normalize_images: true
15
+ - - - image
16
+ - cropped
17
+ - - rgb_image
18
+ - full
19
+ - - _target_: sam3d_objects.model.backbone.dit.embedder.dino.Dino
20
+ dino_model: dinov2_vitl14_reg
21
+ input_size: 518
22
+ normalize_images: true
23
+ - - - mask
24
+ - cropped
25
+ - - rgb_image_mask
26
+ - full
27
+ - - _target_: sam3d_objects.model.backbone.dit.embedder.pointmap.PointPatchEmbed
28
+ embed_dim: 512
29
+ input_size: 256
30
+ patch_size: 8
31
+ remap_output: linear
32
+ - - - pointmap
33
+ - cropped
34
+ - - rgb_pointmap
35
+ - full
36
+ force_drop_modalities: null
37
+ freeze: true
38
+ projection_net_hidden_dim_multiplier: 4.0
39
+ use_pos_embedding: learned
40
+ generator:
41
+ backbone:
42
+ _target_: sam3d_objects.model.backbone.generator.shortcut.model.ShortCut
43
+ batch_mode: true
44
+ cfg_modalities:
45
+ - shape
46
+ inference_steps: 2
47
+ loss_weights:
48
+ 6drotation_normalized: 0.1
49
+ _target_: sam3d_objects.config.utils.make_dict
50
+ scale: 0.1
51
+ shape: 0
52
+ translation: 1.0
53
+ translation_scale: 0.0
54
+ ratio_cfg_samples_in_self_consistency_target: 0.25
55
+ rescale_t: 1
56
+ reverse_fn:
57
+ _target_: sam3d_objects.model.backbone.generator.classifier_free_guidance.ClassifierFreeGuidanceWithExternalUnconditionalProbability
58
+ backbone:
59
+ _target_: sam3d_objects.model.backbone.tdfy_dit.models.mot_sparse_structure_flow.SparseStructureFlowTdfyWrapper
60
+ cond_channels: 1024
61
+ condition_embedder: null
62
+ force_zeros_cond: true
63
+ freeze_d_time_embedder: true
64
+ freeze_shared_parameters: true
65
+ in_channels: 8
66
+ is_shortcut_model: true
67
+ latent_mapping:
68
+ 6drotation_normalized:
69
+ _target_: sam3d_objects.model.backbone.tdfy_dit.models.mm_latent.Latent
70
+ in_channels: 6
71
+ model_channels: 1024
72
+ pos_embedder:
73
+ _target_: sam3d_objects.model.backbone.tdfy_dit.models.mm_latent.LearntPositionEmbedder
74
+ model_channels: 1024
75
+ token_len: 1
76
+ scale:
77
+ _target_: sam3d_objects.model.backbone.tdfy_dit.models.mm_latent.Latent
78
+ in_channels: 3
79
+ model_channels: 1024
80
+ pos_embedder:
81
+ _target_: sam3d_objects.model.backbone.tdfy_dit.models.mm_latent.LearntPositionEmbedder
82
+ model_channels: 1024
83
+ token_len: 1
84
+ shape:
85
+ _target_: sam3d_objects.model.backbone.tdfy_dit.models.mm_latent.Latent
86
+ in_channels: 8
87
+ model_channels: 1024
88
+ pos_embedder:
89
+ _target_: sam3d_objects.model.backbone.tdfy_dit.models.mm_latent.ShapePositionEmbedder
90
+ model_channels: 1024
91
+ patch_size: 1
92
+ resolution: 16
93
+ translation:
94
+ _target_: sam3d_objects.model.backbone.tdfy_dit.models.mm_latent.Latent
95
+ in_channels: 3
96
+ model_channels: 1024
97
+ pos_embedder:
98
+ _target_: sam3d_objects.model.backbone.tdfy_dit.models.mm_latent.LearntPositionEmbedder
99
+ model_channels: 1024
100
+ token_len: 1
101
+ translation_scale:
102
+ _target_: sam3d_objects.model.backbone.tdfy_dit.models.mm_latent.Latent
103
+ in_channels: 1
104
+ model_channels: 1024
105
+ pos_embedder:
106
+ _target_: sam3d_objects.model.backbone.tdfy_dit.models.mm_latent.LearntPositionEmbedder
107
+ model_channels: 1024
108
+ token_len: 1
109
+ latent_share_transformer:
110
+ 6drotation_normalized:
111
+ - 6drotation_normalized
112
+ - translation
113
+ - scale
114
+ - translation_scale
115
+ mlp_ratio: 4
116
+ model_channels: 1024
117
+ num_blocks: 24
118
+ num_heads: 16
119
+ out_channels: 8
120
+ patch_size: 1
121
+ pe_mode: ape
122
+ qk_rms_norm: true
123
+ resolution: 16
124
+ use_checkpoint: false
125
+ use_fp16: false
126
+ interval:
127
+ - 0
128
+ - 500
129
+ p_unconditional: 0.1
130
+ strength: 2.0
131
+ unconditional_handling: add_flag
132
+ self_consistency_cfg_strength: 2.0
133
+ self_consistency_prob: 0.25
134
+ shortcut_loss_weight: 1.0
135
+ sigma_min: 0.0
136
+ time_scale: 1000.0
137
+ training_time_sampler_fn:
138
+ _partial_: true
139
+ _target_: sam3d_objects.model.backbone.generator.flow_matching.model.lognorm_sampler
140
+ mean: -1.0
141
+ std: 1.0