# Flat module-level configuration for the "groundingdino" model.
#
# Every setting is a plain top-level assignment; the code that consumes these
# names is not part of this file. The section headings below are only a
# reading aid inferred from the setting names -- confirm the exact meaning of
# each value against the consumer before changing it.
#
# NOTE(review): the assignment order is kept exactly as in the original file
# in case a loader depends on it.

# --- Run / model identity ---
batch_size = 1
modelname = "groundingdino"

# --- Backbone and position embedding ---
backbone = "swin_T_224_1k"
position_embedding = "sine"
pe_temperatureH = 20
pe_temperatureW = 20
return_interm_indices = [1, 2, 3]
backbone_freeze_keywords = None

# --- Transformer encoder / decoder ---
enc_layers = 6
dec_layers = 6
pre_norm = False
dim_feedforward = 2048
hidden_dim = 256
dropout = 0.0
nheads = 8
num_queries = 900
query_dim = 4
num_patterns = 0
num_feature_levels = 4
enc_n_points = 4
dec_n_points = 4
two_stage_type = "standard"
two_stage_bbox_embed_share = False
two_stage_class_embed_share = False
transformer_activation = "relu"
dec_pred_bbox_embed_share = True

# --- dn_* settings (embed_init_tgt sits here in the original order) ---
dn_box_noise_scale = 1.0
dn_label_noise_ratio = 0.5
dn_label_coef = 1.0
dn_bbox_coef = 1.0
embed_init_tgt = True
dn_labelbook_size = 2000

# --- Text encoder and fusion ---
max_text_len = 256
text_encoder_type = "bert-base-uncased"
use_text_enhancer = True
use_fusion_layer = True
use_checkpoint = True
use_transformer_ckpt = True
use_text_cross_attention = True
text_dropout = 0.0
fusion_dropout = 0.0
fusion_droppath = 0.1
sub_sentence_present = True