| {"vit_model": "facebook/dino-vitb8", "bert_model": "bert-base-uncased", "num_answers": 25, "architecture": "ViT+BERT with Cross-Attention and Contrastive Loss"} |
| {"vit_model": "facebook/dino-vitb8", "bert_model": "bert-base-uncased", "num_answers": 25, "architecture": "ViT+BERT with Cross-Attention and Contrastive Loss"} |