[ { "dataset": "DocVQA", "image": "sample_images/docvqa_sample1.png", "question": "What is the 'actual' value per 1000, during the year 1975?", "ground_truth": "0.28", "description": "Document question answering about statistical data" }, { "dataset": "DocVQA", "image": "sample_images/docvqa_sample2.png", "question": "What is name of university?", "ground_truth": "University of California", "description": "Document question answering about institutional information" }, { "dataset": "InfographicVQA", "image": "sample_images/infovqa_sample1.jpeg", "question": "Which social platform has heavy female audience?", "ground_truth": "Pinterest", "description": "Infographic question answering about social media demographics" }, { "dataset": "ChartQA", "image": "sample_images/chartqa_sample1.jpeg", "question": "What is the highest value in the chart?", "ground_truth": "Unknown (sample chart)", "description": "Chart question answering about data visualization" }, { "dataset": "TextVQA", "image": "sample_images/textvqa_sample1.jpg", "question": "What text is visible in the image?", "ground_truth": "Various text (sample image)", "description": "Text-based visual question answering" }, { "dataset": "VQAv2", "image": "sample_images/vqav2_sample1.png", "question": "What is in the image?", "ground_truth": "Various objects (sample image)", "description": "General visual question answering" } ]