UniGenBench_Leaderboard_English_Long / leaderboard_data.json
CodeGoat24's picture
Update leaderboard_data.json
9a89940 verified
raw
history blame
18 kB
{
"leaderboard": [
{
"model": "BLIP-3o",
"link": "https://arxiv.org/pdf/2505.09568",
"hf": "https://huggingface.co/BLIP3o/BLIP3o-Model-8B",
"open_source": true,
"release_date": "2025-5",
"Overall": 59.87,
"Style": 92.80,
"World Knowledge": 80.22,
"Attribute-Overall": 63.89,
"Quantity": 51.39,
"Expression": 60.26,
"Material": 64.62,
"Size": 75.00,
"Shape": 54.37,
"Color": 81.67,
"Action-Overall": 63.97,
"Hand": 58.33,
"Full body": 70.11,
"Animal": 70.59,
"Non Contact": 60.20,
"Contact": 51.79,
"State": 71.70,
"Relationship-Overall": 66.50,
"Composition": 70.61,
"Similarity": 60.00,
"Inclusion": 67.39,
"Comparison": 64.84,
"Compound-Overall": 53.74,
"Imagination": 61.73,
"Feature matching": 45.57,
"Grammar-Overall": 68.58,
"Pronoun Reference": 79.04,
"Consistency": 61.11,
"Negation": 63.85,
"Layout-Overall": 68.47,
"2D": 72.79,
"3D": 64.02,
"Logical Reasoning": 39.55,
"Text": 1.15
},
{
"model": "CogVew4",
"link": "https://arxiv.org/pdf/2403.05121",
"hf": "https://huggingface.co/zai-org/CogView4-6B",
"open_source": true,
"release_date": "2024-3",
"Overall": 56.30,
"Style": 82.00,
"World Knowledge": 83.07,
"Attribute-Overall": 63.25,
"Quantity": 71.53,
"Expression": 44.23,
"Material": 55.19,
"Size": 72.22,
"Shape": 57.50,
"Color": 89.17,
"Action-Overall": 57.51,
"Hand": 53.85,
"Full body": 59.78,
"Animal": 68.38,
"Non Contact": 50.51,
"Contact": 51.19,
"State": 62.74,
"Relationship-Overall": 62.44,
"Composition": 60.47,
"Similarity": 60.00,
"Inclusion": 69.57,
"Comparison": 60.16,
"Compound-Overall": 44.72,
"Imagination": 47.19,
"Feature matching": 42.19,
"Grammar-Overall": 54.81,
"Pronoun Reference": 69.49,
"Consistency": 56.02,
"Negation": 38.46,
"Layout-Overall": 69.22,
"2D": 77.21,
"3D": 60.98,
"Logical Reasoning": 28.18,
"Text": 17.82
},
{
"model": "Hunyuan-DiT",
"link": "https://arxiv.org/pdf/2405.08748",
"hf": "https://huggingface.co/Tencent-Hunyuan/HunyuanDiT",
"open_source": true,
"release_date": "2024-5",
"Overall": 51.38,
"Style": 94.10,
"World Knowledge": 80.70,
"Attribute-Overall": 62.71,
"Quantity": 67.36,
"Expression": 44.23,
"Material": 71.70,
"Size": 61.81,
"Shape": 47.50,
"Color": 86.67,
"Action-Overall": 49.05,
"Hand": 35.90,
"Full body": 54.89,
"Animal": 54.41,
"Non Contact": 46.94,
"Contact": 35.71,
"State": 62.74,
"Relationship-Overall": 59.64,
"Composition": 60.14,
"Similarity": 64.44,
"Inclusion": 60.33,
"Comparison": 50.78,
"Compound-Overall": 41.62,
"Imagination": 46.68,
"Feature matching": 36.46,
"Grammar-Overall": 55.48,
"Pronoun Reference": 62.87,
"Consistency": 57.87,
"Negation": 45.77,
"Layout-Overall": 44.78,
"2D": 39.34,
"3D": 50.38,
"Logical Reasoning": 24.55,
"Text": 1.15
},
{
"model": "Janus",
"link": "https://arxiv.org/pdf/2410.13848",
"hf": "https://huggingface.co/deepseek-ai/Janus-1.3B",
"open_source": true,
"release_date": "2024-10",
"Overall": 51.23,
"Style": 89.90,
"World Knowledge": 73.58,
"Attribute-Overall": 54.81,
"Quantity": 37.50,
"Expression": 37.82,
"Material": 58.96,
"Size": 65.97,
"Shape": 47.50,
"Color": 86.67,
"Action-Overall": 50.38,
"Hand": 32.69,
"Full body": 51.63,
"Animal": 61.76,
"Non Contact": 48.47,
"Contact": 38.10,
"State": 66.51,
"Relationship-Overall": 55.08,
"Composition": 56.76,
"Similarity": 53.89,
"Inclusion": 59.24,
"Comparison": 46.88,
"Compound-Overall": 46.65,
"Imagination": 58.16,
"Feature matching": 34.90,
"Grammar-Overall": 59.09,
"Pronoun Reference": 66.18,
"Consistency": 51.39,
"Negation": 58.08,
"Layout-Overall": 54.85,
"2D": 57.72,
"3D": 51.89,
"Logical Reasoning": 26.82,
"Text": 1.15
},
{
"model": "Janus-flow",
"link": "https://arxiv.org/pdf/2411.07975",
"hf": "https://huggingface.co/deepseek-ai/JanusFlow-1.3B",
"open_source": true,
"release_date": "2024-11",
"Overall": 46.39,
"Style": 86.20,
"World Knowledge": 62.50,
"Attribute-Overall": 47.97,
"Quantity": 43.06,
"Expression": 30.77,
"Material": 55.19,
"Size": 55.56,
"Shape": 30.00,
"Color": 78.33,
"Action-Overall": 43.35,
"Hand": 23.08,
"Full body": 48.37,
"Animal": 58.82,
"Non Contact": 36.73,
"Contact": 36.31,
"State": 55.66,
"Relationship-Overall": 50.00,
"Composition": 59.80,
"Similarity": 38.89,
"Inclusion": 51.63,
"Comparison": 40.62,
"Compound-Overall": 45.10,
"Imagination": 57.65,
"Feature matching": 32.29,
"Grammar-Overall": 60.29,
"Pronoun Reference": 66.18,
"Consistency": 48.61,
"Negation": 63.85,
"Layout-Overall": 46.46,
"2D": 49.26,
"3D": 43.56,
"Logical Reasoning": 21.14,
"Text": 0.86
},
{
"model": "Emu-3",
"link": "https://arxiv.org/pdf/2409.18869",
"hf": "https://huggingface.co/BAAI/Emu3-Gen",
"open_source": true,
"release_date": "2024-09",
"Overall": 46.02,
"Style": 86.80,
"World Knowledge": 77.06,
"Attribute-Overall": 51.39,
"Quantity": 44.44,
"Expression": 45.51,
"Material": 53.77,
"Size": 43.06,
"Shape": 46.25,
"Color": 80.00,
"Action-Overall": 40.11,
"Hand": 25.00,
"Full body": 47.28,
"Animal": 50.74,
"Non Contact": 35.20,
"Contact": 27.98,
"State": 52.36,
"Relationship-Overall": 49.75,
"Composition": 56.76,
"Similarity": 46.67,
"Inclusion": 48.37,
"Comparison": 39.84,
"Compound-Overall": 36.86,
"Imagination": 41.33,
"Feature matching": 32.29,
"Grammar-Overall": 52.94,
"Pronoun Reference": 59.56,
"Consistency": 53.70,
"Negation": 45.38,
"Layout-Overall": 44.78,
"2D": 45.22,
"3D": 44.32,
"Logical Reasoning": 19.32,
"Text": 1.15
},
{
"model": "Playground2.5",
"link": "https://arxiv.org/pdf/2402.17245",
"hf": "https://huggingface.co/playgroundai/playground-v2-512px-base",
"open_source": true,
"release_date": "2024-02",
"Overall": 45.61,
"Style": 89.50,
"World Knowledge": 76.11,
"Attribute-Overall": 52.78,
"Quantity": 58.33,
"Expression": 43.59,
"Material": 57.08,
"Size": 44.44,
"Shape": 41.25,
"Color": 75.83,
"Action-Overall": 42.68,
"Hand": 28.85,
"Full body": 50.00,
"Animal": 52.21,
"Non Contact": 35.20,
"Contact": 29.17,
"State": 58.02,
"Relationship-Overall": 51.52,
"Composition": 60.14,
"Similarity": 49.44,
"Inclusion": 48.37,
"Comparison": 39.06,
"Compound-Overall": 35.44,
"Imagination": 43.88,
"Feature matching": 26.82,
"Grammar-Overall": 53.21,
"Pronoun Reference": 58.82,
"Consistency": 50.00,
"Negation": 50.00,
"Layout-Overall": 37.13,
"2D": 34.56,
"3D": 39.77,
"Logical Reasoning": 16.59,
"Text": 1.15
},
{
"model": "SDXL",
"link": "https://arxiv.org/pdf/2307.01952",
"hf": "https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0",
"open_source": true,
"release_date": "2023-07",
"Overall": 39.75,
"Style": 87.40,
"World Knowledge": 72.63,
"Attribute-Overall": 44.34,
"Quantity": 44.44,
"Expression": 25.00,
"Material": 52.83,
"Size": 44.44,
"Shape": 33.75,
"Color": 68.33,
"Action-Overall": 34.22,
"Hand": 19.23,
"Full body": 35.33,
"Animal": 43.38,
"Non Contact": 26.53,
"Contact": 24.40,
"State": 53.30,
"Relationship-Overall": 44.92,
"Composition": 53.72,
"Similarity": 38.33,
"Inclusion": 39.67,
"Comparison": 41.41,
"Compound-Overall": 26.68,
"Imagination": 33.93,
"Feature matching": 19.27,
"Grammar-Overall": 47.33,
"Pronoun Reference": 50.37,
"Consistency": 42.59,
"Negation": 48.08,
"Layout-Overall": 29.85,
"2D": 26.47,
"3D": 33.33,
"Logical Reasoning": 9.55,
"Text": 1.15
},
{
"model": "GPT-4o",
"link": "https://platform.openai.com/docs/guides/image-generation",
"hf": "-",
"open_source": false,
"release_date": "2025-04",
"Overall": 92.77,
"Style": 98.57,
"World Knowledge": 98.87,
"Attribute-Overall": 93.59,
"Quantity": 90.00,
"Expression": 94.70,
"Material": 94.20,
"Size": 91.61,
"Shape": 92.50,
"Color": 99.17,
"Action-Overall": 90.79,
"Hand": 89.74,
"Full body": 92.22,
"Animal": 87.12,
"Non Contact": 90.43,
"Contact": 89.82,
"State": 93.75,
"Relationship-Overall": 94.97,
"Composition": 96.23,
"Similarity": 95.00,
"Inclusion": 94.89,
"Comparison": 92.19,
"Compound-Overall": 93.55,
"Imagination": 95.64,
"Feature matching": 91.40,
"Grammar-Overall": 91.76,
"Pronoun Reference": 92.91,
"Consistency": 91.67,
"Negation": 90.57,
"Layout-Overall": 91.35,
"2D": 91.04,
"3D": 91.67,
"Logical Reasoning": 84.97,
"Text": 89.24
},
{
"model": "Imagen-4.0-Ultra",
"link": "https://deepmind.google/models/imagen/",
"hf": "-",
"open_source": false,
"release_date": "2025-06",
"Overall": 91.54,
"Style": 99.20,
"World Knowledge": 97.47,
"Attribute-Overall": 92.52,
"Quantity": 93.06,
"Expression": 81.41,
"Material": 94.34,
"Size": 95.83,
"Shape": 91.88,
"Color": 100.0,
"Action-Overall": 92.20,
"Hand": 90.38,
"Full body": 93.44,
"Animal": 91.91,
"Non Contact": 90.31,
"Contact": 89.29,
"State": 96.70,
"Relationship-Overall": 93.02,
"Composition": 95.27,
"Similarity": 84.44,
"Inclusion": 98.37,
"Comparison": 92.19,
"Compound-Overall": 91.37,
"Imagination": 92.86,
"Feature matching": 89.84,
"Grammar-Overall": 87.97,
"Pronoun Reference": 94.12,
"Consistency": 87.04,
"Negation": 82.31,
"Layout-Overall": 93.10,
"2D": 92.65,
"3D": 93.56,
"Logical Reasoning": 79.55,
"Text": 89.08
},
{
"model": "Seedream-3.0",
"link": "https://www.byteplus.com/en/product/Seedream",
"hf": "-",
"open_source": false,
"release_date": "2025-05",
"Overall": 78.95,
"Style": 98.10,
"World Knowledge": 95.25,
"Attribute-Overall": 85.58,
"Quantity": 80.56,
"Expression": 82.05,
"Material": 90.57,
"Size": 85.42,
"Shape": 78.12,
"Color": 97.50,
"Action-Overall": 82.98,
"Hand": 75.00,
"Full body": 89.67,
"Animal": 85.29,
"Non Contact": 75.51,
"Contact": 80.95,
"State": 90.09,
"Relationship-Overall": 80.84,
"Composition": 82.77,
"Similarity": 73.89,
"Inclusion": 84.24,
"Comparison": 81.25,
"Compound-Overall": 73.84,
"Imagination": 78.57,
"Feature matching": 69.01,
"Grammar-Overall": 61.36,
"Pronoun Reference": 79.78,
"Consistency": 69.91,
"Negation": 35.00,
"Layout-Overall": 87.31,
"2D": 86.76,
"3D": 87.88,
"Logical Reasoning": 52.73,
"Text": 71.55
},
{
"model": "Imagen-3.0",
"link": "https://arxiv.org/pdf/2408.07009",
"hf": "-",
"open_source": false,
"release_date": "2025-02",
"Overall": 71.85,
"Style": 89.25,
"World Knowledge": 94.75,
"Attribute-Overall": 77.33,
"Quantity": 75.78,
"Expression": 64.67,
"Material": 80.66,
"Size": 82.84,
"Shape": 70.00,
"Color": 93.10,
"Action-Overall": 81.46,
"Hand": 80.00,
"Full body": 83.89,
"Animal": 85.29,
"Non Contact": 77.37,
"Contact": 74.40,
"State": 87.38,
"Relationship-Overall": 82.86,
"Composition": 83.90,
"Similarity": 73.33,
"Inclusion": 88.64,
"Comparison": 83.90,
"Compound-Overall": 71.71,
"Imagination": 79.23,
"Feature matching": 64.06,
"Grammar-Overall": 69.84,
"Pronoun Reference": 79.04,
"Consistency": 70.75,
"Negation": 59.13,
"Layout-Overall": 81.34,
"2D": 82.72,
"3D": 79.92,
"Logical Reasoning": 48.36,
"Text": 21.55
},
{
"model": "DALL-E-3",
"link": "https://openai.com/zh-Hans-CN/index/dall-e-3/",
"hf": "-",
"open_source": false,
"release_date": "2024-09",
"Overall": 69.18,
"Style": 95.06,
"World Knowledge": 93.51,
"Attribute-Overall": 75.97,
"Quantity": 62.14,
"Expression": 59.87,
"Material": 87.74,
"Size": 87.50,
"Shape": 65.00,
"Color": 92.50,
"Action-Overall": 69.83,
"Hand": 60.90,
"Full body": 75.00,
"Animal": 76.47,
"Non Contact": 66.84,
"Contact": 63.41,
"State": 75.47,
"Relationship-Overall": 78.06,
"Composition": 82.43,
"Similarity": 69.44,
"Inclusion": 87.78,
"Comparison": 66.41,
"Compound-Overall": 70.60,
"Imagination": 76.79,
"Feature matching": 64.21,
"Grammar-Overall": 68.07,
"Pronoun Reference": 74.24,
"Consistency": 74.07,
"Negation": 56.64,
"Layout-Overall": 66.67,
"2D": 57.72,
"3D": 76.17,
"Logical Reasoning": 48.18,
"Text": 25.86
},
{
"model": "FLUX-pro-1.1-Ultra",
"link": "https://bfl.ai/",
"hf": "-",
"open_source": false,
"release_date": "2025-03",
"Overall": 70.67,
"Style": 90.60,
"World Knowledge": 91.61,
"Attribute-Overall": 76.50,
"Quantity": 75.69,
"Expression": 59.62,
"Material": 78.77,
"Size": 77.78,
"Shape": 74.38,
"Color": 96.67,
"Action-Overall": 76.50,
"Hand": 57.69,
"Full body": 68.48,
"Animal": 77.21,
"Non Contact": 76.53,
"Contact": 64.29,
"State": 76.89,
"Relationship-Overall": 77.54,
"Composition": 80.41,
"Similarity": 72.78,
"Inclusion": 82.07,
"Comparison": 71.09,
"Compound-Overall": 67.78,
"Imagination": 74.74,
"Feature matching": 60.68,
"Grammar-Overall": 70.05,
"Pronoun Reference": 84.56,
"Consistency": 68.98,
"Negation": 55.77,
"Layout-Overall": 81.53,
"2D": 80.15,
"3D": 82.95,
"Logical Reasoning": 43.18,
"Text": 37.36
},
{
"model": "Keling-Ketu",
"link": "https://kolors.kuaishou.com/",
"hf": "-",
"open_source": false,
"release_date": "2025-04",
"Overall": 65.93,
"Style": 92.27,
"World Knowledge": 86.62,
"Attribute-Overall": 71.66,
"Quantity": 75.00,
"Expression": 56.41,
"Material": 78.77,
"Size": 79.17,
"Shape": 53.12,
"Color": 91.38,
"Action-Overall": 68.73,
"Hand": 54.49,
"Full body": 76.09,
"Animal": 72.79,
"Non Contact": 69.90,
"Contact": 58.93,
"State": 76.89,
"Relationship-Overall": 70.94,
"Composition": 68.92,
"Similarity": 70.56,
"Inclusion": 74.46,
"Comparison": 71.09,
"Compound-Overall": 60.81,
"Imagination": 66.24,
"Feature matching": 55.26,
"Grammar-Overall": 71.26,
"Pronoun Reference": 77.21,
"Consistency": 67.59,
"Negation": 68.08,
"Layout-Overall": 77.23,
"2D": 80.97,
"3D": 73.36,
"Logical Reasoning": 43.75,
"Text": 16.03
},
{
"model": "Qwen-Image",
"link": "https://arxiv.org/pdf/2508.02324",
"hf": "https://huggingface.co/Qwen/Qwen-Image",
"open_source": true,
"release_date": "2025-08",
"Overall": 78.81,
"Style": 95.10,
"World Knowledge": 94.30,
"Attribute-Overall": 87.61,
"Quantity": 81.94,
"Expression": 84.62,
"Material": 91.98,
"Size": 84.03,
"Shape": 84.38,
"Color": 99.17,
"Action-Overall": 84.13,
"Hand": 82.05,
"Full body": 88.59,
"Animal": 88.24,
"Non Contact": 80.61,
"Contact": 77.38,
"State": 87.74,
"Relationship-Overall": 79.70,
"Composition": 81.76,
"Similarity": 67.78,
"Inclusion": 86.96,
"Comparison": 81.25,
"Compound-Overall": 73.32,
"Imagination": 73.21,
"Feature matching": 73.44,
"Grammar-Overall": 60.29,
"Pronoun Reference": 83.82,
"Consistency": 70.37,
"Negation": 27.31,
"Layout-Overall": 85.52,
"2D": 86.40,
"3D": 85.23,
"Logical Reasoning": 53.64,
"Text": 76.14
}
]
}