vladislavbro commited on
Commit
e0f0534
·
verified ·
1 Parent(s): e659afa

Add config from convert_d_fine_original_pytorch_checkpoint_to_hf.py

Browse files
Files changed (1) hide show
  1. config.json +43 -6
config.json CHANGED
@@ -1,15 +1,22 @@
1
  {
 
2
  "activation_dropout": 0.0,
3
  "activation_function": "silu",
4
  "anchor_image_size": null,
5
- "architectures": [
6
- "DFineForObjectDetection"
7
- ],
8
  "attention_dropout": 0.0,
9
  "auxiliary_loss": true,
10
  "backbone": null,
11
  "backbone_config": {
 
 
 
 
 
 
 
 
12
  "embedding_size": 32,
 
13
  "hidden_sizes": [
14
  192,
15
  384,
@@ -17,7 +24,8 @@
17
  1536
18
  ],
19
  "layer_type": "basic",
20
- "model_type": "d_fine_resnet",
 
21
  "out_features": [
22
  "stage2",
23
  "stage3",
@@ -28,18 +36,49 @@
28
  3,
29
  4
30
  ],
 
 
 
 
 
 
31
  "stage_in_channels": [
32
  32,
33
  96,
34
  384,
35
  768
36
  ],
 
 
 
 
 
 
 
 
 
 
 
 
37
  "stage_mid_channels": [
38
  32,
39
  64,
40
  128,
41
  256
42
  ],
 
 
 
 
 
 
 
 
 
 
 
 
 
43
  "stage_numb_of_layers": [
44
  4,
45
  4,
@@ -80,7 +119,6 @@
80
  ],
81
  "decoder_offset_scale": 0.5,
82
  "depth_mult": 0.67,
83
- "disable_custom_kernels": true,
84
  "dropout": 0.0,
85
  "encode_proj_layers": [
86
  2
@@ -294,7 +332,6 @@
294
  "positional_encoding_temperature": 10000,
295
  "reg_scale": 4.0,
296
  "top_prob_values": 4,
297
- "torch_dtype": "float32",
298
  "transformers_version": "4.50.0.dev0",
299
  "use_focal_loss": true,
300
  "use_pretrained_backbone": false,
 
1
  {
2
+ "_attn_implementation_autoset": true,
3
  "activation_dropout": 0.0,
4
  "activation_function": "silu",
5
  "anchor_image_size": null,
 
 
 
6
  "attention_dropout": 0.0,
7
  "auxiliary_loss": true,
8
  "backbone": null,
9
  "backbone_config": {
10
+ "depths": [
11
+ 3,
12
+ 4,
13
+ 6,
14
+ 3
15
+ ],
16
+ "downsample_in_bottleneck": false,
17
+ "downsample_in_first_stage": false,
18
  "embedding_size": 32,
19
+ "hidden_act": "relu",
20
  "hidden_sizes": [
21
  192,
22
  384,
 
24
  1536
25
  ],
26
  "layer_type": "basic",
27
+ "model_type": "hgnet_v2",
28
+ "num_channels": 3,
29
  "out_features": [
30
  "stage2",
31
  "stage3",
 
36
  3,
37
  4
38
  ],
39
+ "stage_downsample": [
40
+ false,
41
+ true,
42
+ true,
43
+ true
44
+ ],
45
  "stage_in_channels": [
46
  32,
47
  96,
48
  384,
49
  768
50
  ],
51
+ "stage_kernel_size": [
52
+ 3,
53
+ 3,
54
+ 5,
55
+ 5
56
+ ],
57
+ "stage_light_block": [
58
+ false,
59
+ false,
60
+ true,
61
+ true
62
+ ],
63
  "stage_mid_channels": [
64
  32,
65
  64,
66
  128,
67
  256
68
  ],
69
+ "stage_names": [
70
+ "stem",
71
+ "stage1",
72
+ "stage2",
73
+ "stage3",
74
+ "stage4"
75
+ ],
76
+ "stage_num_blocks": [
77
+ 1,
78
+ 1,
79
+ 3,
80
+ 1
81
+ ],
82
  "stage_numb_of_layers": [
83
  4,
84
  4,
 
119
  ],
120
  "decoder_offset_scale": 0.5,
121
  "depth_mult": 0.67,
 
122
  "dropout": 0.0,
123
  "encode_proj_layers": [
124
  2
 
332
  "positional_encoding_temperature": 10000,
333
  "reg_scale": 4.0,
334
  "top_prob_values": 4,
 
335
  "transformers_version": "4.50.0.dev0",
336
  "use_focal_loss": true,
337
  "use_pretrained_backbone": false,