Upload 3 files
Browse files
- config.json +5 -5
- pytorch_model.bin +2 -2
config.json
CHANGED
|
@@ -19,7 +19,7 @@
|
|
| 19 |
"decoder_attention_heads": 8,
|
| 20 |
"decoder_depth_residual": false,
|
| 21 |
"decoder_ffn_dim": 256,
|
| 22 |
-
"decoder_layers":
|
| 23 |
"decoder_n_points": 4,
|
| 24 |
"decoder_self_attn": false,
|
| 25 |
"decoder_text_residual": false,
|
|
@@ -32,7 +32,7 @@
|
|
| 32 |
"dropout": 0.1,
|
| 33 |
"encoder_attention_heads": 8,
|
| 34 |
"encoder_ffn_dim": 256,
|
| 35 |
-
"encoder_layers":
|
| 36 |
"encoder_n_points": 4,
|
| 37 |
"focal_alpha": 0.25,
|
| 38 |
"freeze_backbone": true,
|
|
@@ -69,7 +69,7 @@
|
|
| 69 |
"num_depth_bins": 80,
|
| 70 |
"num_feature_levels": 4,
|
| 71 |
"num_queries": 1,
|
| 72 |
-
"num_text_output_layers":
|
| 73 |
"position_embedding_type": "sine",
|
| 74 |
"pretrained_backbone_path": "pretrained-models/swin_large_patch4_window7_224/model.safetensors",
|
| 75 |
"text_encoder_type": "pretrained-models/roberta-base",
|
|
@@ -78,8 +78,8 @@
|
|
| 78 |
"two_stage": false,
|
| 79 |
"use_dab": true,
|
| 80 |
"use_pretrained_backbone": true,
|
| 81 |
-
"use_text_guided_adapter":
|
| 82 |
"use_timm_backbone": true,
|
| 83 |
-
"vl_encoder_type": "
|
| 84 |
"with_box_refine": true
|
| 85 |
}
|
|
|
|
| 19 |
"decoder_attention_heads": 8,
|
| 20 |
"decoder_depth_residual": false,
|
| 21 |
"decoder_ffn_dim": 256,
|
| 22 |
+
"decoder_layers": 3,
|
| 23 |
"decoder_n_points": 4,
|
| 24 |
"decoder_self_attn": false,
|
| 25 |
"decoder_text_residual": false,
|
|
|
|
| 32 |
"dropout": 0.1,
|
| 33 |
"encoder_attention_heads": 8,
|
| 34 |
"encoder_ffn_dim": 256,
|
| 35 |
+
"encoder_layers": 6,
|
| 36 |
"encoder_n_points": 4,
|
| 37 |
"focal_alpha": 0.25,
|
| 38 |
"freeze_backbone": true,
|
|
|
|
| 69 |
"num_depth_bins": 80,
|
| 70 |
"num_feature_levels": 4,
|
| 71 |
"num_queries": 1,
|
| 72 |
+
"num_text_output_layers": 6,
|
| 73 |
"position_embedding_type": "sine",
|
| 74 |
"pretrained_backbone_path": "pretrained-models/swin_large_patch4_window7_224/model.safetensors",
|
| 75 |
"text_encoder_type": "pretrained-models/roberta-base",
|
|
|
|
| 78 |
"two_stage": false,
|
| 79 |
"use_dab": true,
|
| 80 |
"use_pretrained_backbone": true,
|
| 81 |
+
"use_text_guided_adapter": false,
|
| 82 |
"use_timm_backbone": true,
|
| 83 |
+
"vl_encoder_type": "simple-bridge-tower",
|
| 84 |
"with_box_refine": true
|
| 85 |
}
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b548993b0f92b4f4e1c18f2823f32c9b39cae8225277afa4b00a29447d940ea3
|
| 3 |
+
size 1365911480
|