vladislavbro committed on
Commit
a74dd14
·
verified ·
1 Parent(s): 0883a20

Add config from convert_d_fine_original_pytorch_checkpoint_to_hf.py

Browse files
Files changed (1) hide show
  1. config.json +24 -53
config.json CHANGED
@@ -1,21 +1,13 @@
1
  {
 
2
  "activation_dropout": 0.0,
3
  "activation_function": "silu",
4
  "anchor_image_size": null,
5
- "architectures": [
6
- "DFineForObjectDetection"
7
- ],
8
  "attention_dropout": 0.0,
9
  "auxiliary_loss": true,
10
  "backbone": null,
11
  "backbone_config": {
12
  "embedding_size": 32,
13
- "hidden_sizes": [
14
- 64,
15
- 128,
16
- 256,
17
- 512
18
- ],
19
  "layer_type": "basic",
20
  "model_type": "d_fine_resnet",
21
  "out_features": [
@@ -28,47 +20,23 @@
28
  3,
29
  4
30
  ],
31
- "stage_config": [
32
- [
33
- 64,
34
- 64,
35
- 128,
36
- 1,
37
- false,
38
- false,
39
- 3,
40
- 6
41
- ],
42
- [
43
- 128,
44
- 128,
45
- 512,
46
- 2,
47
- true,
48
- false,
49
- 3,
50
- 6
51
- ],
52
- [
53
- 512,
54
- 256,
55
- 1024,
56
- 5,
57
- true,
58
- true,
59
- 5,
60
- 6
61
- ],
62
- [
63
- 1024,
64
- 512,
65
- 2048,
66
- 2,
67
- true,
68
- true,
69
- 5,
70
- 6
71
- ]
72
  ],
73
  "stem_channels": [
74
  3,
@@ -89,6 +57,7 @@
89
  384
90
  ],
91
  "decoder_layers": 6,
 
92
  "decoder_n_points": [
93
  3,
94
  6,
@@ -294,21 +263,23 @@
294
  "layer_norm_eps": 1e-05,
295
  "layer_scale": 1,
296
  "learn_initial_query": false,
 
 
297
  "matcher_alpha": 0.25,
298
  "matcher_bbox_cost": 5.0,
299
  "matcher_class_cost": 2.0,
300
  "matcher_gamma": 2.0,
301
  "matcher_giou_cost": 2.0,
 
302
  "model_type": "d_fine",
303
  "normalize_before": false,
304
  "num_denoising": 100,
305
  "num_feature_levels": 3,
306
  "num_queries": 300,
307
  "positional_encoding_temperature": 10000,
308
- "reg_max": 32,
309
  "reg_scale": 4.0,
310
- "torch_dtype": "float32",
311
- "transformers_version": "4.49.0.dev0",
312
  "use_focal_loss": true,
313
  "use_pretrained_backbone": false,
314
  "use_timm_backbone": false,
 
1
  {
2
+ "_attn_implementation_autoset": true,
3
  "activation_dropout": 0.0,
4
  "activation_function": "silu",
5
  "anchor_image_size": null,
 
 
 
6
  "attention_dropout": 0.0,
7
  "auxiliary_loss": true,
8
  "backbone": null,
9
  "backbone_config": {
10
  "embedding_size": 32,
 
 
 
 
 
 
11
  "layer_type": "basic",
12
  "model_type": "d_fine_resnet",
13
  "out_features": [
 
20
  3,
21
  4
22
  ],
23
+ "stage_in_channels": [
24
+ 64,
25
+ 128,
26
+ 512,
27
+ 1024
28
+ ],
29
+ "stage_mid_channels": [
30
+ 64,
31
+ 128,
32
+ 256,
33
+ 512
34
+ ],
35
+ "stage_num_blocks": [
36
+ 1,
37
+ 2,
38
+ 5,
39
+ 2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
  ],
41
  "stem_channels": [
42
  3,
 
57
  384
58
  ],
59
  "decoder_layers": 6,
60
+ "decoder_method": "default",
61
  "decoder_n_points": [
62
  3,
63
  6,
 
263
  "layer_norm_eps": 1e-05,
264
  "layer_scale": 1,
265
  "learn_initial_query": false,
266
+ "lqe_hidden_dim": 64,
267
+ "lqe_layers": 2,
268
  "matcher_alpha": 0.25,
269
  "matcher_bbox_cost": 5.0,
270
  "matcher_class_cost": 2.0,
271
  "matcher_gamma": 2.0,
272
  "matcher_giou_cost": 2.0,
273
+ "max_num_bins": 32,
274
  "model_type": "d_fine",
275
  "normalize_before": false,
276
  "num_denoising": 100,
277
  "num_feature_levels": 3,
278
  "num_queries": 300,
279
  "positional_encoding_temperature": 10000,
 
280
  "reg_scale": 4.0,
281
+ "top_prob_values": 4,
282
+ "transformers_version": "4.50.0.dev0",
283
  "use_focal_loss": true,
284
  "use_pretrained_backbone": false,
285
  "use_timm_backbone": false,