{
  "architectures": [
    "HierarchicalTwoStreamTransformer"
  ],
  "model_type": "custom_transformer",
  "cnn_backbone": "mobilenetv3_large_100",
  "visual_feature_dim": 256,
  "pose_feature_dim": 256,
  "fusion_type": "gated",
  "num_transformer_layers": 1,
  "num_attention_heads": 4,
  "embedding_dim": 256,
  "num_classes": 8,
  "image_size": [128, 128],
  "num_frames": 30
}