File size: 1,507 Bytes
f8e2b26 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 |
{
"aggregator_params": {},
"aggregator_type": "sum",
"common_params": {
"dropout": 0.1,
"hidden_dim": 512,
"interaction_encoder_enable": true,
"interaction_encoder_ffn_dim": 1024,
"interaction_encoder_n_heads": 8,
"interaction_encoder_n_layers": 4,
"projector_intermediate_dim": 512,
"track_encoder_ffn_dim": 1024,
"track_encoder_n_heads": 8,
"track_encoder_n_layers": 4
},
"mm_dim": 1024,
"object_interaction_encoder_enable": true,
"object_interaction_encoder_params": {
"dropout": 0.1,
"hidden_dim": 1024,
"n_heads": 8,
"n_layers": 2
},
"per_feature_params": {
"appearance": {
"feature_encoder_params": {
"emb_size": 128,
"hidden_dim": 512
},
"feature_encoder_type": "parts_appearance",
"hidden_dim": 512,
"interaction_encoder_ffn_dim": 1024,
"track_encoder_enable_motion_encoder": false,
"track_encoder_ffn_dim": 1024
},
"bbox": {
"feature_encoder_params": {
"input_dim": 5
},
"feature_encoder_type": "motion"
},
"keypoints": {
"feature_encoder_params": {
"input_dim": 35
},
"feature_encoder_type": "motion"
}
},
"similarity_prediction_head_hidden_dim": 1024,
"sph_common_params": {
"hidden_dim": 512
},
"sph_per_feature_params": {
"appearance": {
"hidden_dim": 512
},
"bbox": {
"hidden_dim": 512
},
"keypoints": {
"hidden_dim": 512
}
}
}