| { |
| "leaderboard": [ |
| { |
| "model": "Janus-Pro", |
| "link": "https://arxiv.org/pdf/2501.17811", |
| "hf": "https://huggingface.co/deepseek-ai/Janus-Pro-7B", |
| "open_source": true, |
| "release_date": "2025-01", |
|
|
| "Overall": 71.11, |
| "Style": 94.02, |
| "World Knowledge": 88.15, |
| "Attribute-Overall": 81.81, |
| "Quantity": 62.23, |
| "Expression": 66.39, |
| "Material": 83.43, |
| "Size": 85.42, |
| "Shape": 75.87, |
| "Color": 89.20, |
| |
| "Action-Overall": 69.14, |
| "Hand": 57.69, |
| "Full body": 73.44, |
| "Animal": 76.09, |
| "Non Contact": 62.95, |
| "Contact": 61.21, |
| "State": 73.52, |
| |
| "Relationship-Overall": 77.96, |
| "Composition": 77.42, |
| "Similarity": 71.15, |
| "Inclusion": 82.18, |
| "Comparison": 80.58, |
| |
| "Compound-Overall": 76.53, |
| "Imagination": 80.59, |
| "Feature matching": 67.52, |
| |
| "Grammar-Overall": 74.62, |
| "Pronoun Reference": 87.30, |
| "Consistency": 73.81, |
| "Negation": 64.08, |
| |
| "Layout-Overall": 82.14, |
| "2D": 81.78, |
| "3D": 82.61, |
| |
| "Logical Reasoning": 62.62, |
| |
| "Text": 4.08 |
| }, |
| { |
| "model": "SD-3.5-Large", |
| "link": "https://stability.ai/news/introducing-stable-diffusion-3-5", |
| "hf": "https://huggingface.co/stabilityai/stable-diffusion-3.5-large", |
| "open_source": true, |
| "release_date": "2024-10", |
|
|
| "Overall": 64.35, |
| "Style": 88.12, |
| "World Knowledge": 88.15, |
|
|
| "Attribute-Overall": 78.78, |
| "Quantity": 68.62, |
| "Expression": 62.22, |
| "Material": 81.85, |
| "Size": 78.79, |
| "Shape": 70.63, |
| "Color": 86.32, |
| |
| "Action-Overall": 59.63, |
| "Hand": 57.69, |
| "Full body": 52.81, |
| "Animal": 57.25, |
| "Non Contact": 50.89, |
| "Contact": 48.85, |
| "State": 68.68, |
| |
| "Relationship-Overall": 67.62, |
| "Composition": 70.15, |
| "Similarity": 62.18, |
| "Inclusion": 70.11, |
| "Comparison": 64.81, |
| |
| "Compound-Overall": 62.21, |
| "Imagination": 65.82, |
| "Feature matching": 54.21, |
| |
| "Grammar-Overall": 65.23, |
| "Pronoun Reference": 75.79, |
| "Consistency": 61.51, |
| "Negation": 59.15, |
| |
| "Layout-Overall": 71.19, |
| "2D": 73.45, |
| "3D": 68.30, |
| |
| "Logical Reasoning": 44.90, |
| |
| "Text": 17.66 |
| }, |
| { |
| "model": "Seedream-4.0", |
| "link": "https://www.volcengine.com/docs/82379/1541523", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2025-09", |
|
|
| "Overall": 89.77, |
|
|
| "Style": 98.42, |
|
|
| "World Knowledge": 95.95, |
|
|
| "Attribute-Overall": 95.06, |
| "Quantity": 92.02, |
| "Expression": 89.31, |
| "Material": 95.26, |
| "Size": 94.70, |
| "Shape": 92.48, |
| "Color": 98.27, |
|
|
| "Action-Overall": 86.76, |
| "Hand": 83.01, |
| "Full body": 87.50, |
| "Animal": 81.52, |
| "Non Contact": 88.39, |
| "Contact": 83.62, |
| "State": 89.82, |
|
|
| "Relationship-Overall": 88.69, |
| "Composition": 87.37, |
| "Similarity": 80.77, |
| "Inclusion": 93.97, |
| "Comparison": 92.72, |
|
|
| "Compound-Overall": 87.79, |
| "Imagination": 88.19, |
| "Feature matching": 86.92, |
|
|
| "Grammar-Overall": 82.74, |
| "Pronoun Reference": 95.63, |
| "Consistency": 83.33, |
| "Negation": 70.77, |
|
|
| "Layout-Overall": 92.38, |
| "2D": 92.94, |
| "3D": 91.67, |
|
|
| "Logical Reasoning": 79.13, |
|
|
| "Text": 90.76 |
| }, |
| { |
| "model": "DALL-E-3", |
| "link": "https://openai.com/zh-Hans-CN/index/dall-e-3/", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2023-09", |
|
|
| "Overall": 70.82, |
|
|
| "Style": 95.08, |
|
|
| "World Knowledge": 92.71, |
|
|
| "Attribute-Overall": 84.98, |
| "Quantity": 64.67, |
| "Expression": 72.59, |
| "Material": 88.72, |
| "Size": 89.48, |
| "Shape": 77.14, |
| "Color": 90.15, |
|
|
| "Action-Overall": 68.36, |
| "Hand": 63.49, |
| "Full body": 63.96, |
| "Animal": 67.03, |
| "Non Contact": 59.55, |
| "Contact": 60.17, |
| "State": 76.29, |
|
|
| "Relationship-Overall": 77.90, |
| "Composition": 80.57, |
| "Similarity": 70.51, |
| "Inclusion": 83.53, |
| "Comparison": 73.76, |
|
|
| "Compound-Overall": 73.88, |
| "Imagination": 77.67, |
| "Feature matching": 65.00, |
|
|
| "Grammar-Overall": 68.19, |
| "Pronoun Reference": 82.92, |
| "Consistency": 66.27, |
| "Negation": 56.99, |
|
|
| "Layout-Overall": 71.76, |
| "2D": 69.22, |
| "3D": 75.00, |
|
|
| "Logical Reasoning": 57.11, |
|
|
| "Text": 18.26 |
| }, |
| { |
| "model": "Runway-Gen4-Image", |
| "link": "https://docs.dev.runwayml.com/api/#tag/Start-generating/paths/~1v1~1text_to_image/post", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2024-11", |
|
|
| "Overall": 68.29, |
|
|
| "Style": 91.72, |
|
|
| "World Knowledge": 88.82, |
|
|
| "Attribute-Overall": 79.83, |
| "Quantity": 70.65, |
| "Expression": 65.43, |
| "Material": 85.33, |
| "Size": 81.01, |
| "Shape": 67.38, |
| "Color": 85.64, |
|
|
| "Action-Overall": 64.30, |
| "Hand": 55.33, |
| "Full body": 63.92, |
| "Animal": 70.65, |
| "Non Contact": 56.82, |
| "Contact": 56.10, |
| "State": 69.76, |
|
|
| "Relationship-Overall": 69.53, |
| "Composition": 70.05, |
| "Similarity": 59.09, |
| "Inclusion": 76.76, |
| "Comparison": 70.39, |
|
|
| "Compound-Overall": 68.57, |
| "Imagination": 69.47, |
| "Feature matching": 66.50, |
|
|
| "Grammar-Overall": 70.55, |
| "Pronoun Reference": 76.23, |
| "Consistency": 62.70, |
| "Negation": 72.76, |
|
|
| "Layout-Overall": 73.79, |
| "2D": 72.56, |
| "3D": 75.37, |
|
|
| "Logical Reasoning": 48.28, |
|
|
| "Text": 27.47 |
| }, |
| { |
| "model": "Imagen-4.0-generate-preview-06-06", |
| "link": "https://deepmind.google/models/imagen/", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2025-01", |
|
|
| "Overall": 85.34, |
|
|
| "Style": 94.44, |
|
|
| "World Knowledge": 97.11, |
|
|
| "Attribute-Overall": 90.14, |
| "Quantity": 82.45, |
| "Expression": 77.64, |
| "Material": 90.96, |
| "Size": 92.23, |
| "Shape": 86.36, |
| "Color": 95.60, |
|
|
| "Action-Overall": 82.62, |
| "Hand": 83.65, |
| "Full body": 82.81, |
| "Animal": 78.62, |
| "Non Contact": 85.27, |
| "Contact": 78.74, |
| "State": 84.09, |
|
|
| "Relationship-Overall": 86.42, |
| "Composition": 86.48, |
| "Similarity": 80.13, |
| "Inclusion": 91.38, |
| "Comparison": 86.89, |
|
|
| "Compound-Overall": 86.56, |
| "Imagination": 86.81, |
| "Feature matching": 85.98, |
|
|
| "Grammar-Overall": 81.35, |
| "Pronoun Reference": 94.05, |
| "Consistency": 80.56, |
| "Negation": 70.77, |
|
|
| "Layout-Overall": 90.24, |
| "2D": 90.40, |
| "3D": 90.04, |
|
|
| "Logical Reasoning": 72.82, |
|
|
| "Text": 71.74 |
| }, |
| { |
| "model": "Imagen-3.0-generate-002", |
| "link": "https://arxiv.org/pdf/2408.07009", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2025-02", |
|
|
| "Overall": 75.76, |
|
|
| "Style": 92.41, |
|
|
| "World Knowledge": 94.19, |
|
|
| "Attribute-Overall": 86.32, |
| "Quantity": 75.58, |
| "Expression": 71.41, |
| "Material": 88.34, |
| "Size": 88.52, |
| "Shape": 78.27, |
| "Color": 93.13, |
|
|
| "Action-Overall": 75.81, |
| "Hand": 73.63, |
| "Full body": 77.12, |
| "Animal": 76.81, |
| "Non Contact": 69.44, |
| "Contact": 65.48, |
| "State": 80.62, |
|
|
| "Relationship-Overall": 80.76, |
| "Composition": 80.15, |
| "Similarity": 74.17, |
| "Inclusion": 90.59, |
| "Comparison": 78.54, |
|
|
| "Compound-Overall": 78.70, |
| "Imagination": 81.14, |
| "Feature matching": 73.22, |
|
|
| "Grammar-Overall": 77.96, |
| "Pronoun Reference": 91.67, |
| "Consistency": 76.61, |
| "Negation": 66.67, |
|
|
| "Layout-Overall": 86.06, |
| "2D": 83.97, |
| "3D": 88.69, |
|
|
| "Logical Reasoning": 61.25, |
|
|
| "Text": 24.18 |
| }, |
| { |
| "model": "Stability-AI-stable-image-ultra", |
| "link": "https://platform.stability.ai/docs/api-reference#tag/Generate/paths/~1v2beta~1stable-image~1generate~1ultra/post", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2024-06", |
|
|
| "Overall": 62.01, |
|
|
| "Style": 85.63, |
|
|
| "World Knowledge": 86.71, |
|
|
| "Attribute-Overall": 74.73, |
| "Quantity": 66.49, |
| "Expression": 55.69, |
| "Material": 76.43, |
| "Size": 77.27, |
| "Shape": 67.48, |
| "Color": 83.02, |
|
|
| "Action-Overall": 58.27, |
| "Hand": 58.33, |
| "Full body": 49.38, |
| "Animal": 59.42, |
| "Non Contact": 52.23, |
| "Contact": 45.98, |
| "State": 66.30, |
|
|
| "Relationship-Overall": 63.63, |
| "Composition": 64.92, |
| "Similarity": 56.73, |
| "Inclusion": 67.53, |
| "Comparison": 63.11, |
|
|
| "Compound-Overall": 58.28, |
| "Imagination": 62.66, |
| "Feature matching": 48.60, |
|
|
| "Grammar-Overall": 65.10, |
| "Pronoun Reference": 76.19, |
| "Consistency": 61.11, |
| "Negation": 58.80, |
|
|
| "Layout-Overall": 71.67, |
| "2D": 74.86, |
| "3D": 67.57, |
|
|
| "Logical Reasoning": 40.29, |
|
|
| "Text": 15.76 |
| }, |
| { |
| "model": "FLUX-pro-1.1-Ultra", |
| "link": "https://bfl.ai/", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2024-11", |
|
|
| "Overall": 75.40, |
|
|
| "Style": 91.36, |
|
|
| "World Knowledge": 91.76, |
|
|
| "Attribute-Overall": 84.97, |
| "Quantity": 79.26, |
| "Expression": 68.58, |
| "Material": 82.98, |
| "Size": 89.96, |
| "Shape": 80.59, |
| "Color": 93.01, |
|
|
| "Action-Overall": 72.43, |
| "Hand": 67.31, |
| "Full body": 66.25, |
| "Animal": 73.19, |
| "Non Contact": 66.96, |
| "Contact": 62.07, |
| "State": 80.53, |
|
|
| "Relationship-Overall": 81.90, |
| "Composition": 81.89, |
| "Similarity": 74.04, |
| "Inclusion": 90.52, |
| "Comparison": 80.58, |
|
|
| "Compound-Overall": 78.07, |
| "Imagination": 80.40, |
| "Feature matching": 72.88, |
|
|
| "Grammar-Overall": 71.94, |
| "Pronoun Reference": 84.52, |
| "Consistency": 68.55, |
| "Negation": 63.73, |
|
|
| "Layout-Overall": 82.62, |
| "2D": 81.78, |
| "3D": 83.70, |
|
|
| "Logical Reasoning": 60.92, |
|
|
| "Text": 38.04 |
| }, |
| { |
| "model": "Qwen-Image", |
| "link": "https://arxiv.org/pdf/2508.02324", |
| "hf": "https://huggingface.co/Qwen/Qwen-Image", |
| "open_source": true, |
| "release_date": "2025-08", |
|
|
| "Overall": 83.94, |
|
|
| "Style": 96.93, |
|
|
| "World Knowledge": 95.09, |
|
|
| "Attribute-Overall": 93.65, |
| "Quantity": 92.02, |
| "Expression": 89.86, |
| "Material": 94.50, |
| "Size": 89.58, |
| "Shape": 86.71, |
| "Color": 97.85, |
|
|
| "Action-Overall": 81.86, |
| "Hand": 78.53, |
| "Full body": 81.88, |
| "Animal": 83.70, |
| "Non Contact": 83.04, |
| "Contact": 71.84, |
| "State": 85.57, |
|
|
| "Relationship-Overall": 83.41, |
| "Composition": 81.76, |
| "Similarity": 79.17, |
| "Inclusion": 88.79, |
| "Comparison": 85.19, |
|
|
| "Compound-Overall": 81.98, |
| "Imagination": 82.38, |
| "Feature matching": 81.07, |
|
|
| "Grammar-Overall": 73.86, |
| "Pronoun Reference": 90.48, |
| "Consistency": 78.57, |
| "Negation": 54.93, |
|
|
| "Layout-Overall": 88.97, |
| "2D": 91.24, |
| "3D": 86.05, |
|
|
| "Logical Reasoning": 66.75, |
|
|
| "Text": 76.90 |
| }, |
| { |
| "model": "FLUX-kontext-pro", |
| "link": "https://bfl.ai/models/flux-kontext", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2025-05", |
|
|
| "Overall": 78.58, |
| "Style": 94.83, |
| "World Knowledge": 93.60, |
|
|
| "Attribute-Overall": 86.24, |
| "Quantity": 74.47, |
| "Expression": 75.00, |
| "Material": 85.47, |
| "Size": 89.58, |
| "Shape": 80.63, |
| "Color": 92.89, |
| |
| "Action-Overall": 74.44, |
| "Hand": 73.05, |
| "Full body": 73.12, |
| "Animal": 75.00, |
| "Non Contact": 67.73, |
| "Contact": 70.40, |
| "State": 77.98, |
| |
| "Relationship-Overall": 78.40, |
| "Composition": 73.85, |
| "Similarity": 72.08, |
| "Inclusion": 89.08, |
| "Comparison": 82.77, |
| |
| "Compound-Overall": 79.75, |
| "Imagination": 83.58, |
| "Feature matching": 71.23, |
| |
| "Grammar-Overall": 77.05, |
| "Pronoun Reference": 90.32, |
| "Consistency": 75.40, |
| "Negation": 66.90, |
| |
| "Layout-Overall": 85.46, |
| "2D": 84.09, |
| "3D": 87.23, |
| |
| "Logical Reasoning": 66.26, |
| |
| "Text": 49.73 |
| }, |
| { |
| "model": "Hunyuan-DiT", |
| "link": "https://arxiv.org/pdf/2405.08748", |
| "hf": "https://huggingface.co/Tencent-Hunyuan/HunyuanDiT", |
| "open_source": true, |
| "release_date": "2024-05", |
|
|
| "Overall": 54.88, |
|
|
| "Style": 92.94, |
|
|
| "World Knowledge": 80.06, |
|
|
| "Attribute-Overall": 69.47, |
| "Quantity": 65.43, |
| "Expression": 52.22, |
| "Material": 72.14, |
| "Size": 75.19, |
| "Shape": 58.22, |
| "Color": 76.31, |
|
|
| "Action-Overall": 48.80, |
| "Hand": 39.10, |
| "Full body": 46.25, |
| "Animal": 47.46, |
| "Non Contact": 41.07, |
| "Contact": 34.48, |
| "State": 59.58, |
|
|
| "Relationship-Overall": 55.66, |
| "Composition": 56.89, |
| "Similarity": 55.45, |
| "Inclusion": 57.18, |
| "Comparison": 52.18, |
|
|
| "Compound-Overall": 50.22, |
| "Imagination": 55.49, |
| "Feature matching": 38.55, |
|
|
| "Grammar-Overall": 58.76, |
| "Pronoun Reference": 64.68, |
| "Consistency": 59.52, |
| "Negation": 52.82, |
|
|
| "Layout-Overall": 61.43, |
| "2D": 60.45, |
| "3D": 62.68, |
|
|
| "Logical Reasoning": 29.85, |
|
|
| "Text": 1.63 |
| }, |
| { |
| "model": "FLUX.1-dev", |
| "link": "https://bfl.ai/blog/24-08-01-bfl", |
| "hf": "https://huggingface.co/black-forest-labs/FLUX.1-dev", |
| "open_source": true, |
| "release_date": "2024-08", |
|
|
| "Overall": 69.42, |
| "Style": 89.29, |
| "World Knowledge": 89.45, |
|
|
| "Attribute-Overall": 79.90, |
| "Quantity": 73.94, |
| "Expression": 64.44, |
| "Material": 80.05, |
| "Size": 84.47, |
| "Shape": 71.50, |
| "Color": 87.47, |
| |
| "Action-Overall": 64.54, |
| "Hand": 63.78, |
| "Full body": 62.50, |
| "Animal": 65.94, |
| "Non Contact": 56.70, |
| "Contact": 56.32, |
| "State": 69.57, |
| |
| "Relationship-Overall": 69.40, |
| "Composition": 65.05, |
| "Similarity": 66.03, |
| "Inclusion": 79.60, |
| "Comparison": 71.60, |
| |
| "Compound-Overall": 68.46, |
| "Imagination": 71.10, |
| "Feature matching": 62.62, |
| |
| "Grammar-Overall": 70.56, |
| "Pronoun Reference": 83.33, |
| "Consistency": 67.46, |
| "Negation": 61.97, |
| |
| "Layout-Overall": 77.54, |
| "2D": 81.21, |
| "3D": 72.83, |
| |
| "Logical Reasoning": 54.37, |
| |
| "Text": 30.71 |
| }, |
| { |
| "model": "FLUX-kontext-max", |
| "link": "https://bfl.ai/models/flux-kontext", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2025-05", |
|
|
| "Overall": 80.88, |
| "Style": 96.51, |
| "World Knowledge": 93.35, |
|
|
| "Attribute-Overall": 87.45, |
| "Quantity": 79.79, |
| "Expression": 76.68, |
| "Material": 87.35, |
| "Size": 88.83, |
| "Shape": 81.51, |
| "Color": 93.74, |
| |
| "Action-Overall": 75.52, |
| "Hand": 73.08, |
| "Full body": 75.94, |
| "Animal": 74.28, |
| "Non Contact": 66.82, |
| "Contact": 71.55, |
| "State": 79.76, |
| |
| "Relationship-Overall": 80.78, |
| "Composition": 77.30, |
| "Similarity": 73.05, |
| "Inclusion": 89.94, |
| "Comparison": 85.44, |
| |
| "Compound-Overall": 82.24, |
| "Imagination": 84.75, |
| "Feature matching": 76.65, |
| |
| "Grammar-Overall": 79.34, |
| "Pronoun Reference": 90.08, |
| "Consistency": 76.61, |
| "Negation": 72.18, |
| |
| "Layout-Overall": 87.58, |
| "2D": 85.73, |
| "3D": 89.96, |
| |
| "Logical Reasoning": 71.12, |
| |
| "Text": 54.89 |
| }, |
| { |
| "model": "Recraft", |
| "link": "https://www.recraft.ai/docs#generate-image", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2024-12", |
|
|
| "Overall": 60.93, |
| "Style": 87.13, |
| "World Knowledge": 86.99, |
|
|
| "Attribute-Overall": 73.23, |
| "Quantity": 56.38, |
| "Expression": 57.22, |
| "Material": 72.82, |
| "Size": 76.89, |
| "Shape": 63.64, |
| "Color": 83.07, |
| |
| "Action-Overall": 51.77, |
| "Hand": 40.06, |
| "Full body": 54.37, |
| "Animal": 55.07, |
| "Non Contact": 45.09, |
| "Contact": 37.36, |
| "State": 60.08, |
| |
| "Relationship-Overall": 55.82, |
| "Composition": 51.79, |
| "Similarity": 46.47, |
| "Inclusion": 66.09, |
| "Comparison": 61.89, |
| |
| "Compound-Overall": 49.56, |
| "Imagination": 50.21, |
| "Feature matching": 48.13, |
| |
| "Grammar-Overall": 60.28, |
| "Pronoun Reference": 73.41, |
| "Consistency": 55.56, |
| "Negation": 52.82, |
| |
| "Layout-Overall": 63.81, |
| "2D": 65.96, |
| "3D": 61.05, |
| |
| "Logical Reasoning": 34.22, |
| |
| "Text": 46.47 |
| }, |
| { |
| "model": "wan2.2-t2i-plus", |
| "link": "https://help.aliyun.com/zh/model-studio/text-to-image-v2-api-reference", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2025-07", |
|
|
| "Overall": 68.76, |
| "Style": 90.28, |
| "World Knowledge": 87.57, |
|
|
| "Attribute-Overall": 81.08, |
| "Quantity": 78.19, |
| "Expression": 69.17, |
| "Material": 80.42, |
| "Size": 82.77, |
| "Shape": 73.60, |
| "Color": 88.10, |
| |
| "Action-Overall": 66.49, |
| "Hand": 64.10, |
| "Full body": 60.94, |
| "Animal": 70.29, |
| "Non Contact": 59.38, |
| "Contact": 55.46, |
| "State": 73.32, |
| |
| "Relationship-Overall": 72.79, |
| "Composition": 69.13, |
| "Similarity": 66.67, |
| "Inclusion": 81.03, |
| "Comparison": 77.43, |
| |
| "Compound-Overall": 71.73, |
| "Imagination": 74.16, |
| "Feature matching": 66.36, |
| |
| "Grammar-Overall": 70.18, |
| "Pronoun Reference": 86.90, |
| "Consistency": 61.11, |
| "Negation": 63.38, |
| |
| "Layout-Overall": 79.13, |
| "2D": 82.34, |
| "3D": 75.00, |
| |
| "Logical Reasoning": 55.58, |
| |
| "Text": 12.77 |
| }, |
| { |
| "model": "Nano Banana", |
| "link": "https://ainanobanana.io/", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2025-08", |
|
|
| "Overall": 88.82, |
|
|
| "Style": 98.83, |
|
|
| "World Knowledge": 95.78, |
|
|
| "Attribute-Overall": 93.06, |
| "Quantity": 88.24, |
| "Expression": 86.09, |
| "Material": 93.05, |
| "Size": 93.70, |
| "Shape": 88.73, |
| "Color": 97.31, |
|
|
| "Action-Overall": 83.93, |
| "Hand": 84.57, |
| "Full body": 84.95, |
| "Animal": 81.16, |
| "Non Contact": 83.41, |
| "Contact": 78.16, |
| "State": 86.28, |
|
|
| "Relationship-Overall": 91.59, |
| "Composition": 90.98, |
| "Similarity": 91.32, |
| "Inclusion": 92.80, |
| "Comparison": 91.91, |
|
|
| "Compound-Overall": 90.63, |
| "Imagination": 92.15, |
| "Feature matching": 87.23, |
|
|
| "Grammar-Overall": 89.33, |
| "Pronoun Reference": 94.84, |
| "Consistency": 89.24, |
| "Negation": 84.51, |
|
|
| "Layout-Overall": 94.04, |
| "2D": 94.77, |
| "3D": 93.12, |
|
|
| "Logical Reasoning": 81.27, |
|
|
| "Text": 69.75 |
| }, |
| { |
| "model": "GPT-4o", |
| "link": "https://platform.openai.com/docs/guides/image-generation", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2025-03", |
|
|
| "Overall": 92.63, |
|
|
| "Style": 99.08, |
|
|
| "World Knowledge": 97.95, |
|
|
| "Attribute-Overall": 93.53, |
| "Quantity": 86.70, |
| "Expression": 93.44, |
| "Material": 92.45, |
| "Size": 94.89, |
| "Shape": 92.48, |
| "Color": 94.95, |
|
|
| "Action-Overall": 87.78, |
| "Hand": 89.94, |
| "Full body": 87.19, |
| "Animal": 90.94, |
| "Non Contact": 89.29, |
| "Contact": 83.05, |
| "State": 87.75, |
|
|
| "Relationship-Overall": 91.13, |
| "Composition": 89.18, |
| "Similarity": 90.71, |
| "Inclusion": 96.84, |
| "Comparison": 90.29, |
|
|
| "Compound-Overall": 93.99, |
| "Imagination": 94.39, |
| "Feature matching": 93.10, |
|
|
| "Grammar-Overall": 94.46, |
| "Pronoun Reference": 95.97, |
| "Consistency": 91.67, |
| "Negation": 95.65, |
|
|
| "Layout-Overall": 93.59, |
| "2D": 94.29, |
| "3D": 92.70, |
|
|
| "Logical Reasoning": 91.02, |
|
|
| "Text": 83.79 |
| }, |
| { |
| "model": "Seedream-3.0", |
| "link": "https://www.byteplus.com/en/product/Seedream", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2025-06", |
|
|
| "Overall": 80.99, |
|
|
| "Style": 97.18, |
|
|
| "World Knowledge": 93.79, |
|
|
| "Attribute-Overall": 91.90, |
| "Quantity": 83.51, |
| "Expression": 81.25, |
| "Material": 93.07, |
| "Size": 88.26, |
| "Shape": 90.03, |
| "Color": 97.48, |
|
|
| "Action-Overall": 79.94, |
| "Hand": 77.88, |
| "Full body": 84.69, |
| "Animal": 78.26, |
| "Non Contact": 74.11, |
| "Contact": 71.84, |
| "State": 83.60, |
|
|
| "Relationship-Overall": 83.41, |
| "Composition": 81.63, |
| "Similarity": 79.17, |
| "Inclusion": 87.64, |
| "Comparison": 86.41, |
|
|
| "Compound-Overall": 81.03, |
| "Imagination": 80.49, |
| "Feature matching": 82.24, |
|
|
| "Grammar-Overall": 75.13, |
| "Pronoun Reference": 90.48, |
| "Consistency": 80.56, |
| "Negation": 56.69, |
|
|
| "Layout-Overall": 88.41, |
| "2D": 87.85, |
| "3D": 89.13, |
|
|
| "Logical Reasoning": 62.62, |
|
|
| "Text": 56.52 |
| }, |
| { |
| "model": "Imagen-4.0-Fast-preview-06-06", |
| "link": "https://deepmind.google/models/imagen/", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2025-06", |
|
|
| "Overall": 81.54, |
|
|
| "Style": 93.77, |
|
|
| "World Knowledge": 93.64, |
|
|
| "Attribute-Overall": 90.33, |
| "Quantity": 78.72, |
| "Expression": 78.89, |
| "Material": 91.11, |
| "Size": 90.15, |
| "Shape": 86.89, |
| "Color": 96.33, |
|
|
| "Action-Overall": 80.18, |
| "Hand": 82.05, |
| "Full body": 84.06, |
| "Animal": 81.88, |
| "Non Contact": 75.00, |
| "Contact": 74.71, |
| "State": 80.93, |
|
|
| "Relationship-Overall": 84.05, |
| "Composition": 82.53, |
| "Similarity": 80.13, |
| "Inclusion": 92.82, |
| "Comparison": 82.52, |
|
|
| "Compound-Overall": 84.01, |
| "Imagination": 86.18, |
| "Feature matching": 79.21, |
|
|
| "Grammar-Overall": 79.57, |
| "Pronoun Reference": 91.27, |
| "Consistency": 81.35, |
| "Negation": 67.61, |
|
|
| "Layout-Overall": 90.48, |
| "2D": 90.11, |
| "3D": 90.94, |
|
|
| "Logical Reasoning": 67.72, |
|
|
| "Text": 51.63 |
| }, |
| { |
| "model": "Imagen-4.0-Ultra-preview-06-06", |
| "link": "https://deepmind.google/models/imagen/", |
| "hf": "-", |
| "open_source": false, |
| "release_date": "2025-06", |
|
|
| "Overall": 90.95, |
|
|
| "Style": 97.67, |
|
|
| "World Knowledge": 98.26, |
|
|
| "Attribute-Overall": 93.21, |
| "Quantity": 89.84, |
| "Expression": 83.17, |
| "Material": 94.20, |
| "Size": 94.69, |
| "Shape": 89.86, |
| "Color": 97.22, |
|
|
| "Action-Overall": 86.91, |
| "Hand": 89.10, |
| "Full body": 86.56, |
| "Animal": 85.14, |
| "Non Contact": 86.61, |
| "Contact": 81.84, |
| "State": 88.63, |
|
|
| "Relationship-Overall": 90.57, |
| "Composition": 90.05, |
| "Similarity": 84.62, |
| "Inclusion": 94.52, |
| "Comparison": 92.72, |
|
|
| "Compound-Overall": 91.42, |
| "Imagination": 92.82, |
| "Feature matching": 88.32, |
|
|
| "Grammar-Overall": 88.07, |
| "Pronoun Reference": 96.83, |
| "Consistency": 87.70, |
| "Negation": 80.63, |
|
|
| "Layout-Overall": 93.49, |
| "2D": 92.64, |
| "3D": 94.57, |
|
|
| "Logical Reasoning": 83.50, |
|
|
| "Text": 86.41 |
| } |
| ] |
| } |
|
|