bag100 committed on
Commit
c7604cd
·
verified ·
1 Parent(s): af9004f

Add fullscale_no_qp config

Browse files
Files changed (1) hide show
  1. fullscale_no_qp/config.json +180 -0
fullscale_no_qp/config.json ADDED
@@ -0,0 +1,180 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "sam3_defaults": false,
3
+ "da3_model": "depth-anything/DA3NESTED-GIANT-LARGE",
4
+ "da3_resolution": 1008,
5
+ "use_cached_depth": true,
6
+ "da3_cache_name": "da3_nested_cache_1008",
7
+ "d_model": 256,
8
+ "n_heads": 8,
9
+ "num_decoder_layers": 6,
10
+ "num_queries": 10,
11
+ "multi_object": false,
12
+ "match_strategy": "hungarian",
13
+ "per_text_decode": false,
14
+ "grouped_text_attn": false,
15
+ "sam3_multi_object": false,
16
+ "num_objects": 1,
17
+ "max_objects": 0,
18
+ "train_seghead": false,
19
+ "dataset": "scannetpp",
20
+ "frames_per_sequence": 50,
21
+ "samples_per_sequence": 1,
22
+ "part_query_mode": "random",
23
+ "augment": false,
24
+ "data_root": null,
25
+ "split": "train_balanced_v5",
26
+ "views": 8,
27
+ "sampling_strategy": "stratified",
28
+ "da3_chunk_size": 8,
29
+ "max_scenes": 245,
30
+ "resolution": 1008,
31
+ "min_mask_coverage": 0.0,
32
+ "epochs": 100,
33
+ "stop_at_epoch": 0,
34
+ "val_every": 0,
35
+ "val_split": "val_cache_good",
36
+ "val_max_samples": null,
37
+ "save_best_val": true,
38
+ "no_save_best_val": false,
39
+ "min_ram_gb": 100.0,
40
+ "batch_size": 8,
41
+ "num_workers": 4,
42
+ "prefetch_factor": 2,
43
+ "no_persistent_workers": false,
44
+ "lr": 0.0002,
45
+ "lr_scheduler": "cosine",
46
+ "lr_warmup_epochs": 2,
47
+ "lr_min": 1e-06,
48
+ "lr_step_size": 10,
49
+ "lr_gamma": 0.5,
50
+ "grad_accum": 1,
51
+ "grad_clip": 1.0,
52
+ "run_name": "fullscale_no_qp_245s_100ep",
53
+ "checkpoint_dir": "/home/nvidia/mv_sam3/checkpoints",
54
+ "resume": "checkpoints/fullscale_no_qp_245s_100ep",
55
+ "load_weights": null,
56
+ "focal_weight": 0.0,
57
+ "focal_alpha": 0.75,
58
+ "focal_gamma": 2.0,
59
+ "dice_weight": 5.0,
60
+ "boundary_weight": 0.0,
61
+ "lovasz_weight": 0.0,
62
+ "use_point_sampling": false,
63
+ "num_sample_points": 4096,
64
+ "loss_at_native_res": false,
65
+ "attn_map_size": 64,
66
+ "seed": 42,
67
+ "use_presence_token": true,
68
+ "use_box_prompts": true,
69
+ "box_prompt_dropout": 0.2,
70
+ "use_point_prompts": true,
71
+ "point_prompt_dropout": 0.2,
72
+ "num_pos_points": 10,
73
+ "num_neg_points": 2,
74
+ "samples_per_scene": 1,
75
+ "min_category_samples": 1,
76
+ "exclude_categories": null,
77
+ "prompt_type": "all",
78
+ "use_world_pe": true,
79
+ "use_gasa": true,
80
+ "gasa_beta_init": 1.0,
81
+ "gasa_kernel_dim": 32,
82
+ "gasa_fixed_kernel": false,
83
+ "gasa_kernel_type": "learned",
84
+ "gasa_bidirectional": false,
85
+ "use_image_to_token": false,
86
+ "use_pos_refine": false,
87
+ "use_box_rpb": false,
88
+ "dim_feedforward": 2048,
89
+ "post_norm": true,
90
+ "ffn_fp32": true,
91
+ "use_query_pe": false,
92
+ "use_depth_crossattn": false,
93
+ "per_layer_text": true,
94
+ "no_initial_text": false,
95
+ "no_text_proj": false,
96
+ "clean_v": false,
97
+ "additive_pe": true,
98
+ "cross_view": false,
99
+ "use_da3_poses_for_gasa": true,
100
+ "use_gt_poses_for_gasa": false,
101
+ "no_gt_poses": false,
102
+ "sheaf_use_gt_poses": false,
103
+ "pe_type": "world",
104
+ "no_pointmap_normalize": false,
105
+ "use_iterative_pos": false,
106
+ "presence_weight": 2.0,
107
+ "presence_focal": true,
108
+ "presence_alpha": 0.5,
109
+ "presence_gamma": 0.0,
110
+ "use_centroid_head": true,
111
+ "centroid_weight": 0.5,
112
+ "mask_based_centroid": false,
113
+ "use_triangulation": false,
114
+ "eval_localization": false,
115
+ "use_iou_head": false,
116
+ "iou_head_weight": 1.0,
117
+ "pred_logits_source": "mask_mean",
118
+ "contrastive_weight": 0.0,
119
+ "contrastive_margin": 0.5,
120
+ "contrastive_source": "logits",
121
+ "no_object_weight": 1.0,
122
+ "align_weight": 1.0,
123
+ "align_alpha": 0.5,
124
+ "align_gamma": 2.0,
125
+ "align_tau": 2.0,
126
+ "per_layer_align": false,
127
+ "per_layer_align_weight": null,
128
+ "use_sheaf_loss": false,
129
+ "sheaf_weight": 0.1,
130
+ "sheaf_type": "constant",
131
+ "sheaf_d_edge": 32,
132
+ "sheaf_threshold": 0.1,
133
+ "sheaf_soft_correspondences": false,
134
+ "sheaf_sigma": 0.1,
135
+ "sheaf_detach_target": true,
136
+ "sheaf_max_frame_distance": 0,
137
+ "sheaf_symmetric_detach": true,
138
+ "sheaf_mutual_nn": true,
139
+ "output_localization": false,
140
+ "output_depth": false,
141
+ "output_pointcloud": false,
142
+ "semantic_union": false,
143
+ "mask_selection": "confidence",
144
+ "vis_every_epochs": 0,
145
+ "vis_every_batches": 0,
146
+ "use_lora": false,
147
+ "lora_rank": 8,
148
+ "lora_alpha": 16.0,
149
+ "lora_sam3": false,
150
+ "lora_da3": false,
151
+ "lora_mask_embed": false,
152
+ "query_proj_mlp": false,
153
+ "no_query_proj": true,
154
+ "train_mask_embed": true,
155
+ "use_mask_refiner": false,
156
+ "init_scoring_from_sam3": false,
157
+ "init_text_crossattn_from_sam3": false,
158
+ "init_decoder_from_sam3": false,
159
+ "torch_compile": false,
160
+ "compile_mode": "reduce-overhead",
161
+ "batch_views": false,
162
+ "profile": false,
163
+ "use_spatial_tokens": true,
164
+ "use_spatial_attn_bias": false,
165
+ "use_text_spatial_bias": true,
166
+ "use_spatial_points": false,
167
+ "use_object_aware_spatial": true,
168
+ "spatial_augment_prob": 0.5,
169
+ "spatial_multi_instance_only": true,
170
+ "spatial_relational_prob": 0.0,
171
+ "spatial_gt_aware": true,
172
+ "spatial_ranking_weight": 0.0,
173
+ "spatial_ranking_margin": 0.5,
174
+ "mask_smooth_kernel": 0,
175
+ "include_categories": null,
176
+ "class_balanced": true,
177
+ "class_balance_power": 0.7,
178
+ "world_size": 7,
179
+ "resumed_from": "checkpoints/fullscale_no_qp_245s_100ep"
180
+ }