File size: 1,574 Bytes
9ce1696
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
{
  "backbone": {
    "embed_dim": 256,
    "embed_layer": "ConvPyramidPatchEmbed",
    "ffn_layer": "mlp",
    "ffn_ratio": 4,
    "interaction_indexes": [
      10,
      11
    ],
    "name": "ecpose_vittplus",
    "num_heads": 4,
    "num_levels": 3,
    "patch_size": 16,
    "proj_dim": null,
    "skip_load_backbone": false
  },
  "decoder": {
    "activation": "relu",
    "aux_loss": true,
    "cls_no_bias": false,
    "dec_n_points": 4,
    "dec_pred_class_embed_share": false,
    "dec_pred_pose_embed_share": false,
    "dim_feedforward": 512,
    "dropout": 0.0,
    "eval_spatial_size": [
      640,
      640
    ],
    "feat_strides": [
      8,
      16,
      32
    ],
    "hidden_dim": 256,
    "learnable_tgt_init": true,
    "nhead": 8,
    "normalize_before": false,
    "num_body_points": 17,
    "num_decoder_layers": 4,
    "num_feature_levels": 3,
    "num_queries": 60,
    "reg_max": 32,
    "reg_scale": 4,
    "return_intermediate_dec": true,
    "two_stage_bbox_embed_share": false,
    "two_stage_class_embed_share": false,
    "two_stage_type": "standard"
  },
  "encoder": {
    "act": "silu",
    "csp_type": "csp2",
    "depth_mult": 0.67,
    "dim_feedforward": 512,
    "dropout": 0.0,
    "expansion": 0.75,
    "feat_strides": [
      8,
      16,
      32
    ],
    "fuse_op": "sum",
    "hidden_dim": 256,
    "in_channels": [
      256,
      256,
      256
    ],
    "nhead": 8,
    "num_encoder_layers": 1,
    "use_encoder_idx": [
      2
    ]
  },
  "postprocessor": {
    "num_body_points": 17,
    "num_select": 60
  }
}