{ "leaderboard": [ { "model": "Runway-Gen4-Image", "link": "https://docs.dev.runwayml.com/api/#tag/Start-generating/paths/~1v1~1text_to_image/post", "hf": "-", "open_source": false, "release_date": "2024-11", "Overall": 69.75, "Style": 93.44, "World Knowledge": 90.36, "Attribute-Overall": 74.03, "Quantity": 72.86, "Expression": 51.97, "Material": 89.42, "Size": 68.06, "Shape": 65.62, "Color": 95.00, "Action-Overall": 70.21, "Hand": 62.18, "Full body": 79.35, "Animal": 82.35, "Non Contact": 66.15, "Contact": 60.37, "State": 71.70, "Relationship-Overall": 72.56, "Composition": 74.32, "Similarity": 62.22, "Inclusion": 77.84, "Comparison": 75.78, "Compound-Overall": 67.76, "Imagination": 71.65, "Feature matching": 63.71, "Grammar-Overall": 70.08, "Pronoun Reference": 71.21, "Consistency": 67.59, "Negation": 71.03, "Layout-Overall": 76.33, "2D": 77.61, "3D": 75.00, "Logical Reasoning": 49.31, "Text": 33.43 }, { "model": "Nano Banana", "link": "https://ainanobanana.io/", "hf": "-", "open_source": false, "release_date": "2025-08", "Overall": 87.45, "Style": 98.87, "World Knowledge": 96.32, "Attribute-Overall": 87.84, "Quantity": 85.00, "Expression": 83.33, "Material": 88.50, "Size": 95.74, "Shape": 78.21, "Color": 99.17, "Action-Overall": 86.83, "Hand": 82.05, "Full body": 93.41, "Animal": 86.03, "Non Contact": 82.47, "Contact": 83.33, "State": 91.98, "Relationship-Overall": 92.00, "Composition": 94.76, "Similarity": 86.52, "Inclusion": 91.26, "Comparison": 94.53, "Compound-Overall": 87.83, "Imagination": 89.66, "Feature matching": 86.02, "Grammar-Overall": 83.36, "Pronoun Reference": 90.71, "Consistency": 82.08, "Negation": 76.59, "Layout-Overall": 91.96, "2D": 92.65, "3D": 91.25, "Logical Reasoning": 74.26, "Text": 75.22 }, { "model": "Stability-AI-stable-image-ultra", "link": "https://platform.stability.ai/docs/api-reference#tag/Generate/paths/~1v2beta~1stable-image~1generate~1ultra/post", "hf": "-", "open_source": false, "release_date": "2024-06", "Overall": 61.96, 
"Style": 87.20, "World Knowledge": 87.18, "Attribute-Overall": 66.35, "Quantity": 67.36, "Expression": 48.08, "Material": 64.15, "Size": 69.44, "Shape": 64.38, "Color": 91.67, "Action-Overall": 59.22, "Hand": 55.77, "Full body": 58.15, "Animal": 63.24, "Non Contact": 61.22, "Contact": 51.79, "State": 64.15, "Relationship-Overall": 69.04, "Composition": 72.64, "Similarity": 66.67, "Inclusion": 70.11, "Comparison": 62.50, "Compound-Overall": 54.25, "Imagination": 60.97, "Feature matching": 47.40, "Grammar-Overall": 61.10, "Pronoun Reference": 78.68, "Consistency": 58.33, "Negation": 45.00, "Layout-Overall": 64.55, "2D": 67.28, "3D": 61.74, "Logical Reasoning": 31.59, "Text": 39.08 }, { "model": "HiDream_v2L", "link": "https://hidreamai.com/doc/txt2img/request", "hf": "-", "open_source": false, "release_date": "2025-07", "Overall": 61.64, "Style": 87.99, "World Knowledge": 89.62, "Attribute-Overall": 64.38, "Quantity": 65.71, "Expression": 44.87, "Material": 57.82, "Size": 74.26, "Shape": 59.87, "Color": 94.92, "Action-Overall": 59.50, "Hand": 51.28, "Full body": 58.56, "Animal": 67.65, "Non Contact": 61.98, "Contact": 51.52, "State": 65.09, "Relationship-Overall": 66.62, "Composition": 71.23, "Similarity": 64.20, "Inclusion": 65.93, "Comparison": 60.32, "Compound-Overall": 49.28, "Imagination": 53.75, "Feature matching": 44.76, "Grammar-Overall": 58.86, "Pronoun Reference": 72.35, "Consistency": 60.00, "Negation": 44.23, "Layout-Overall": 69.06, "2D": 70.41, "3D": 67.68, "Logical Reasoning": 26.73, "Text": 44.31 }, { "model": "Imagen-4.0-Fast-preview-06-06", "link": "https://deepmind.google/models/imagen/", "hf": "-", "open_source": false, "release_date": "2025-01", "Overall": 77.75, "Style": 92.00, "World Knowledge": 94.78, "Attribute-Overall": 83.65, "Quantity": 77.08, "Expression": 75.00, "Material": 85.85, "Size": 89.58, "Shape": 78.75, "Color": 98.33, "Action-Overall": 79.85, "Hand": 73.72, "Full body": 84.24, "Animal": 81.62, "Non Contact": 76.53, "Contact": 
76.79, "State": 84.91, "Relationship-Overall": 82.36, "Composition": 83.45, "Similarity": 73.89, "Inclusion": 89.13, "Comparison": 82.03, "Compound-Overall": 74.10, "Imagination": 80.10, "Feature matching": 67.97, "Grammar-Overall": 76.74, "Pronoun Reference": 86.03, "Consistency": 75.00, "Negation": 68.46, "Layout-Overall": 86.19, "2D": 88.24, "3D": 84.09, "Logical Reasoning": 56.36, "Text": 51.44 }, { "model": "Recraft", "link": "https://www.recraft.ai/docs#generate-image", "hf": "-", "open_source": false, "release_date": "2024-12", "Overall": 62.63, "Style": 87.20, "World Knowledge": 90.19, "Attribute-Overall": 68.16, "Quantity": 68.06, "Expression": 56.41, "Material": 70.75, "Size": 65.97, "Shape": 57.50, "Color": 95.83, "Action-Overall": 60.55, "Hand": 50.00, "Full body": 70.65, "Animal": 76.47, "Non Contact": 55.61, "Contact": 48.81, "State": 63.21, "Relationship-Overall": 62.56, "Composition": 64.53, "Similarity": 59.44, "Inclusion": 59.24, "Comparison": 67.19, "Compound-Overall": 44.85, "Imagination": 43.37, "Feature matching": 46.35, "Grammar-Overall": 63.64, "Pronoun Reference": 73.16, "Consistency": 58.33, "Negation": 58.08, "Layout-Overall": 57.84, "2D": 58.82, "3D": 56.82, "Logical Reasoning": 29.55, "Text": 61.78 }, { "model": "FLUX-kontext-max", "link": "https://bfl.ai/models/flux-kontext", "hf": "-", "open_source": false, "release_date": "2025-05", "Overall": 80.00, "Style": 96.59, "World Knowledge": 94.19, "Attribute-Overall": 80.93, "Quantity": 75.69, "Expression": 74.32, "Material": 82.55, "Size": 86.81, "Shape": 74.38, "Color": 94.17, "Action-Overall": 77.38, "Hand": 67.95, "Full body": 83.15, "Animal": 77.94, "Non Contact": 77.04, "Contact": 70.83, "State": 84.43, "Relationship-Overall": 85.08, "Composition": 87.50, "Similarity": 78.89, "Inclusion": 90.00, "Comparison": 81.25, "Compound-Overall": 78.99, "Imagination": 83.93, "Feature matching": 73.96, "Grammar-Overall": 78.53, "Pronoun Reference": 84.23, "Consistency": 78.70, "Negation": 72.69, 
"Layout-Overall": 85.04, "2D": 86.74, "3D": 88.33, "Logical Reasoning": 61.36, "Text": 61.92 }, { "model": "FLUX-kontext-pro", "link": "https://bfl.ai/models/flux-kontext", "hf": "-", "open_source": false, "release_date": "2025-05", "Overall": 75.84, "Style": 94.78, "World Knowledge": 91.61, "Attribute-Overall": 79.20, "Quantity": 75.00, "Expression": 71.62, "Material": 76.89, "Size": 84.72, "Shape": 74.38, "Color": 97.50, "Action-Overall": 77.66, "Hand": 75.00, "Full body": 79.35, "Animal": 80.88, "Non Contact": 71.94, "Contact": 73.21, "State": 84.91, "Relationship-Overall": 79.34, "Composition": 81.42, "Similarity": 75.56, "Inclusion": 83.33, "Comparison": 74.22, "Compound-Overall": 72.68, "Imagination": 75.00, "Feature matching": 70.31, "Grammar-Overall": 72.69, "Pronoun Reference": 84.23, "Consistency": 76.85, "Negation": 57.69, "Layout-Overall": 84.47, "2D": 85.98, "3D": 82.95, "Logical Reasoning": 55.68, "Text": 50.29 }, { "model": "wan2.2-t2i-plus", "link": "https://help.aliyun.com/zh/model-studio/text-to-image-v2-api-reference", "hf": "-", "open_source": false, "release_date": "2025-07", "Overall": 64.82, "Style": 91.10, "World Knowledge": 87.34, "Attribute-Overall": 70.19, "Quantity": 76.39, "Expression": 55.77, "Material": 66.51, "Size": 71.53, "Shape": 64.38, "Color": 94.17, "Action-Overall": 68.00, "Hand": 58.33, "Full body": 75.82, "Animal": 69.12, "Non Contact": 68.88, "Contact": 57.74, "State": 75.00, "Relationship-Overall": 73.03, "Composition": 70.27, "Similarity": 67.98, "Inclusion": 77.72, "Comparison": 76.69, "Compound-Overall": 61.37, "Imagination": 66.92, "Feature matching": 55.73, "Grammar-Overall": 66.53, "Pronoun Reference": 73.90, "Consistency": 56.74, "Negation": 66.92, "Layout-Overall": 74.77, "2D": 77.49, "3D": 71.97, "Logical Reasoning": 42.05, "Text": 13.83 }, { "model": "FLUX.1-dev", "link": "https://bfl.ai/blog/24-08-01-bfl", "hf": "https://huggingface.co/black-forest-labs/FLUX.1-dev", "open_source": true, "release_date": 
"2024-08", "Overall": 61.30, "Style": 83.90, "World Knowledge": 88.92, "Attribute-Overall": 67.84, "Quantity": 72.22, "Expression": 53.85, "Material": 58.96, "Size": 75.00, "Shape": 65.00, "Color": 91.67, "Action-Overall": 62.17, "Hand": 51.28, "Full body": 67.39, "Animal": 69.85, "Non Contact": 59.69, "Contact": 58.93, "State": 65.57, "Relationship-Overall": 67.26, "Composition": 62.50, "Similarity": 66.67, "Inclusion": 72.83, "Comparison": 62.50, "Compound-Overall": 47.04, "Imagination": 47.96, "Feature matching": 46.09, "Grammar-Overall": 60.96, "Pronoun Reference": 73.16, "Consistency": 63.43, "Negation": 46.15, "Layout-Overall": 71.83, "2D": 74.26, "3D": 69.32, "Logical Reasoning": 30.91, "Text": 32.18 }, { "model": "HiDream-I1-Full", "link": "https://arxiv.org/pdf/2505.22705", "hf": "https://huggingface.co/HiDream-ai/HiDream-I1-Full", "open_source": true, "release_date": "2025-05", "Overall": 71.81, "Style": 92.50, "World Knowledge": 94.15, "Attribute-Overall": 72.97, "Quantity": 73.61, "Expression": 59.62, "Material": 72.17, "Size": 79.17, "Shape": 61.88, "Color": 98.33, "Action-Overall": 73.00, "Hand": 62.18, "Full body": 76.09, "Animal": 73.53, "Non Contact": 74.49, "Contact": 70.24, "State": 78.77, "Relationship-Overall": 75.38, "Composition": 79.05, "Similarity": 68.33, "Inclusion": 78.26, "Comparison": 72.66, "Compound-Overall": 62.63, "Imagination": 64.29, "Feature matching": 60.94, "Grammar-Overall": 63.24, "Pronoun Reference": 83.09, "Consistency": 65.74, "Negation": 40.38, "Layout-Overall": 78.17, "2D": 82.72, "3D": 73.48, "Logical Reasoning": 41.14, "Text": 64.94 }, { "model": "Pref-GRPO", "link": "https://github.com/CodeGoat24/UnifiedReward", "hf": "https://huggingface.co/CodeGoat24/FLUX.1-dev-PrefGRPO", "open_source": true, "release_date": "2025-08", "Overall": 69.46, "Style": 88.40, "World Knowledge": 90.35, "Attribute-Overall": 75.00, "Quantity": 71.53, "Expression": 60.90, "Material": 73.11, "Size": 77.08, "Shape": 74.38, "Color": 99.17, 
"Action-Overall": 69.77, "Hand": 60.90, "Full body": 72.28, "Animal": 77.21, "Non Contact": 68.37, "Contact": 64.88, "State": 74.53, "Relationship-Overall": 76.52, "Composition": 81.42, "Similarity": 76.67, "Inclusion": 76.09, "Comparison": 65.62, "Compound-Overall": 63.27, "Imagination": 65.56, "Feature matching": 60.94, "Grammar-Overall": 62.43, "Pronoun Reference": 79.04, "Consistency": 66.20, "Negation": 41.92, "Layout-Overall": 77.61, "2D": 82.35, "3D": 72.73, "Logical Reasoning": 47.13, "Text": 47.13 }, { "model": "SD-3.5-Large", "link": "https://stability.ai/news/introducing-stable-diffusion-3-5", "hf": "https://huggingface.co/stabilityai/stable-diffusion-3.5-large", "open_source": true, "release_date": "2024-10", "Overall": 62.99, "Style": 88.60, "World Knowledge": 88.92, "Attribute-Overall": 68.59, "Quantity": 71.53, "Expression": 51.92, "Material": 68.87, "Size": 68.06, "Shape": 65.62, "Color": 90.83, "Action-Overall": 62.17, "Hand": 57.05, "Full body": 61.96, "Animal": 63.24, "Non Contact": 62.24, "Contact": 59.52, "State": 67.45, "Relationship-Overall": 69.80, "Composition": 75.34, "Similarity": 68.33, "Inclusion": 68.48, "Comparison": 60.94, "Compound-Overall": 58.76, "Imagination": 64.80, "Feature matching": 52.60, "Grammar-Overall": 58.96, "Pronoun Reference": 74.63, "Consistency": 61.11, "Negation": 40.77, "Layout-Overall": 69.03, "2D": 70.96, "3D": 67.05, "Logical Reasoning": 32.27, "Text": 32.76 }, { "model": "Janus-Pro", "link": "https://arxiv.org/pdf/2501.17811", "hf": "https://huggingface.co/deepseek-ai/Janus-Pro-7B", "open_source": true, "release_date": "2025-01", "Overall": 61.61, "Style": 90.80, "World Knowledge": 86.71, "Attribute-Overall": 67.74, "Quantity": 56.25, "Expression": 55.77, "Material": 71.70, "Size": 73.61, "Shape": 61.88, "Color": 90.83, "Action-Overall": 64.26, "Hand": 50.64, "Full body": 63.04, "Animal": 75.00, "Non Contact": 62.24, "Contact": 56.55, "State": 76.42, "Relationship-Overall": 68.40, "Composition": 76.01, 
"Similarity": 56.11, "Inclusion": 75.00, "Comparison": 58.59, "Compound-Overall": 62.11, "Imagination": 69.64, "Feature matching": 54.43, "Grammar-Overall": 64.44, "Pronoun Reference": 75.37, "Consistency": 66.20, "Negation": 51.54, "Layout-Overall": 72.01, "2D": 74.63, "3D": 69.32, "Logical Reasoning": 37.05, "Text": 2.59 }, { "model": "Show-o2", "link": "https://arxiv.org/pdf/2506.15564", "hf": "https://huggingface.co/showlab/show-o2-7B", "open_source": true, "release_date": "2025-06", "Overall": 62.73, "Style": 87.20, "World Knowledge": 86.08, "Attribute-Overall": 70.51, "Quantity": 59.03, "Expression": 63.46, "Material": 73.58, "Size": 72.92, "Shape": 63.12, "Color": 95.00, "Action-Overall": 69.58, "Hand": 56.41, "Full body": 77.72, "Animal": 72.79, "Non Contact": 70.41, "Contact": 52.38, "State": 83.02, "Relationship-Overall": 70.18, "Composition": 79.05, "Similarity": 61.11, "Inclusion": 70.11, "Comparison": 62.50, "Compound-Overall": 64.69, "Imagination": 69.90, "Feature matching": 59.38, "Grammar-Overall": 61.63, "Pronoun Reference": 75.37, "Consistency": 65.28, "Negation": 44.23, "Layout-Overall": 75.37, "2D": 77.94, "3D": 72.73, "Logical Reasoning": 40.91, "Text": 1.15 }, { "model": "Bagel", "link": "https://arxiv.org/pdf/2505.14683", "hf": "https://huggingface.co/ByteDance-Seed/BAGEL-7B-MoT", "open_source": true, "release_date": "2025-05", "Overall": 61.53, "Style": 90.20, "World Knowledge": 85.60, "Attribute-Overall": 67.74, "Quantity": 59.03, "Expression": 50.00, "Material": 72.64, "Size": 76.39, "Shape": 59.38, "Color": 93.33, "Action-Overall": 61.98, "Hand": 52.56, "Full body": 60.87, "Animal": 69.12, "Non Contact": 62.24, "Contact": 58.93, "State": 67.45, "Relationship-Overall": 70.69, "Composition": 76.35, "Similarity": 70.56, "Inclusion": 69.57, "Comparison": 59.38, "Compound-Overall": 58.12, "Imagination": 67.35, "Feature matching": 48.70, "Grammar-Overall": 66.44, "Pronoun Reference": 71.69, "Consistency": 68.52, "Negation": 59.23, 
"Layout-Overall": 76.49, "2D": 79.04, "3D": 73.86, "Logical Reasoning": 30.23, "Text": 7.76 }, { "model": "BLIP3-o", "link": "https://arxiv.org/pdf/2505.09568", "hf": "https://huggingface.co/BLIP3o/BLIP3o-Model-8B", "open_source": true, "release_date": "2025-05", "Overall": 59.87, "Style": 92.80, "World Knowledge": 80.22, "Attribute-Overall": 63.89, "Quantity": 51.39, "Expression": 60.26, "Material": 64.62, "Size": 75.00, "Shape": 54.37, "Color": 81.67, "Action-Overall": 63.97, "Hand": 58.33, "Full body": 70.11, "Animal": 70.59, "Non Contact": 60.20, "Contact": 51.79, "State": 71.70, "Relationship-Overall": 66.50, "Composition": 70.61, "Similarity": 60.00, "Inclusion": 67.39, "Comparison": 64.84, "Compound-Overall": 53.74, "Imagination": 61.73, "Feature matching": 45.57, "Grammar-Overall": 68.58, "Pronoun Reference": 79.04, "Consistency": 61.11, "Negation": 63.85, "Layout-Overall": 68.47, "2D": 72.79, "3D": 64.02, "Logical Reasoning": 39.55, "Text": 1.15 }, { "model": "CogView4", "link": "https://arxiv.org/pdf/2403.05121", "hf": "https://huggingface.co/zai-org/CogView4-6B", "open_source": true, "release_date": "2024-03", "Overall": 56.30, "Style": 82.00, "World Knowledge": 83.07, "Attribute-Overall": 63.25, "Quantity": 71.53, "Expression": 44.23, "Material": 55.19, "Size": 72.22, "Shape": 57.50, "Color": 89.17, "Action-Overall": 57.51, "Hand": 53.85, "Full body": 59.78, "Animal": 68.38, "Non Contact": 50.51, "Contact": 51.19, "State": 62.74, "Relationship-Overall": 62.44, "Composition": 60.47, "Similarity": 60.00, "Inclusion": 69.57, "Comparison": 60.16, "Compound-Overall": 44.72, "Imagination": 47.19, "Feature matching": 42.19, "Grammar-Overall": 54.81, "Pronoun Reference": 69.49, "Consistency": 56.02, "Negation": 38.46, "Layout-Overall": 69.22, "2D": 77.21, "3D": 60.98, "Logical Reasoning": 28.18, "Text": 17.82 }, { "model": "Hunyuan-DiT", "link": "https://arxiv.org/pdf/2405.08748", "hf": "https://huggingface.co/Tencent-Hunyuan/HunyuanDiT", "open_source": true, 
"release_date": "2024-05", "Overall": 51.38, "Style": 94.10, "World Knowledge": 80.70, "Attribute-Overall": 62.71, "Quantity": 67.36, "Expression": 44.23, "Material": 71.70, "Size": 61.81, "Shape": 47.50, "Color": 86.67, "Action-Overall": 49.05, "Hand": 35.90, "Full body": 54.89, "Animal": 54.41, "Non Contact": 46.94, "Contact": 35.71, "State": 62.74, "Relationship-Overall": 59.64, "Composition": 60.14, "Similarity": 64.44, "Inclusion": 60.33, "Comparison": 50.78, "Compound-Overall": 41.62, "Imagination": 46.68, "Feature matching": 36.46, "Grammar-Overall": 55.48, "Pronoun Reference": 62.87, "Consistency": 57.87, "Negation": 45.77, "Layout-Overall": 44.78, "2D": 39.34, "3D": 50.38, "Logical Reasoning": 24.55, "Text": 1.15 }, { "model": "Janus", "link": "https://arxiv.org/pdf/2410.13848", "hf": "https://huggingface.co/deepseek-ai/Janus-1.3B", "open_source": true, "release_date": "2024-10", "Overall": 51.23, "Style": 89.90, "World Knowledge": 73.58, "Attribute-Overall": 54.81, "Quantity": 37.50, "Expression": 37.82, "Material": 58.96, "Size": 65.97, "Shape": 47.50, "Color": 86.67, "Action-Overall": 50.38, "Hand": 32.69, "Full body": 51.63, "Animal": 61.76, "Non Contact": 48.47, "Contact": 38.10, "State": 66.51, "Relationship-Overall": 55.08, "Composition": 56.76, "Similarity": 53.89, "Inclusion": 59.24, "Comparison": 46.88, "Compound-Overall": 46.65, "Imagination": 58.16, "Feature matching": 34.90, "Grammar-Overall": 59.09, "Pronoun Reference": 66.18, "Consistency": 51.39, "Negation": 58.08, "Layout-Overall": 54.85, "2D": 57.72, "3D": 51.89, "Logical Reasoning": 26.82, "Text": 1.15 }, { "model": "Janus-flow", "link": "https://arxiv.org/pdf/2411.07975", "hf": "https://huggingface.co/deepseek-ai/JanusFlow-1.3B", "open_source": true, "release_date": "2024-11", "Overall": 46.39, "Style": 86.20, "World Knowledge": 62.50, "Attribute-Overall": 47.97, "Quantity": 43.06, "Expression": 30.77, "Material": 55.19, "Size": 55.56, "Shape": 30.00, "Color": 78.33, "Action-Overall": 
43.35, "Hand": 23.08, "Full body": 48.37, "Animal": 58.82, "Non Contact": 36.73, "Contact": 36.31, "State": 55.66, "Relationship-Overall": 50.00, "Composition": 59.80, "Similarity": 38.89, "Inclusion": 51.63, "Comparison": 40.62, "Compound-Overall": 45.10, "Imagination": 57.65, "Feature matching": 32.29, "Grammar-Overall": 60.29, "Pronoun Reference": 66.18, "Consistency": 48.61, "Negation": 63.85, "Layout-Overall": 46.46, "2D": 49.26, "3D": 43.56, "Logical Reasoning": 21.14, "Text": 0.86 }, { "model": "Emu3", "link": "https://arxiv.org/pdf/2409.18869", "hf": "https://huggingface.co/BAAI/Emu3-Gen", "open_source": true, "release_date": "2024-09", "Overall": 46.02, "Style": 86.80, "World Knowledge": 77.06, "Attribute-Overall": 51.39, "Quantity": 44.44, "Expression": 45.51, "Material": 53.77, "Size": 43.06, "Shape": 46.25, "Color": 80.00, "Action-Overall": 40.11, "Hand": 25.00, "Full body": 47.28, "Animal": 50.74, "Non Contact": 35.20, "Contact": 27.98, "State": 52.36, "Relationship-Overall": 49.75, "Composition": 56.76, "Similarity": 46.67, "Inclusion": 48.37, "Comparison": 39.84, "Compound-Overall": 36.86, "Imagination": 41.33, "Feature matching": 32.29, "Grammar-Overall": 52.94, "Pronoun Reference": 59.56, "Consistency": 53.70, "Negation": 45.38, "Layout-Overall": 44.78, "2D": 45.22, "3D": 44.32, "Logical Reasoning": 19.32, "Text": 1.15 }, { "model": "Playground2.5", "link": "https://arxiv.org/pdf/2402.17245", "hf": "https://huggingface.co/playgroundai/playground-v2.5-1024px-aesthetic", "open_source": true, "release_date": "2024-02", "Overall": 45.61, "Style": 89.50, "World Knowledge": 76.11, "Attribute-Overall": 52.78, "Quantity": 58.33, "Expression": 43.59, "Material": 57.08, "Size": 44.44, "Shape": 41.25, "Color": 75.83, "Action-Overall": 42.68, "Hand": 28.85, "Full body": 50.00, "Animal": 52.21, "Non Contact": 35.20, "Contact": 29.17, "State": 58.02, "Relationship-Overall": 51.52, "Composition": 60.14, "Similarity": 49.44, "Inclusion": 48.37, "Comparison": 
39.06, "Compound-Overall": 35.44, "Imagination": 43.88, "Feature matching": 26.82, "Grammar-Overall": 53.21, "Pronoun Reference": 58.82, "Consistency": 50.00, "Negation": 50.00, "Layout-Overall": 37.13, "2D": 34.56, "3D": 39.77, "Logical Reasoning": 16.59, "Text": 1.15 }, { "model": "SDXL", "link": "https://arxiv.org/pdf/2307.01952", "hf": "https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0", "open_source": true, "release_date": "2023-07", "Overall": 39.75, "Style": 87.40, "World Knowledge": 72.63, "Attribute-Overall": 44.34, "Quantity": 44.44, "Expression": 25.00, "Material": 52.83, "Size": 44.44, "Shape": 33.75, "Color": 68.33, "Action-Overall": 34.22, "Hand": 19.23, "Full body": 35.33, "Animal": 43.38, "Non Contact": 26.53, "Contact": 24.40, "State": 53.30, "Relationship-Overall": 44.92, "Composition": 53.72, "Similarity": 38.33, "Inclusion": 39.67, "Comparison": 41.41, "Compound-Overall": 26.68, "Imagination": 33.93, "Feature matching": 19.27, "Grammar-Overall": 47.33, "Pronoun Reference": 50.37, "Consistency": 42.59, "Negation": 48.08, "Layout-Overall": 29.85, "2D": 26.47, "3D": 33.33, "Logical Reasoning": 9.55, "Text": 1.15 }, { "model": "GPT-4o", "link": "https://platform.openai.com/docs/guides/image-generation", "hf": "-", "open_source": false, "release_date": "2025-03", "Overall": 92.77, "Style": 98.57, "World Knowledge": 98.87, "Attribute-Overall": 93.59, "Quantity": 90.00, "Expression": 94.70, "Material": 94.20, "Size": 91.61, "Shape": 92.50, "Color": 99.17, "Action-Overall": 90.79, "Hand": 89.74, "Full body": 92.22, "Animal": 87.12, "Non Contact": 90.43, "Contact": 89.82, "State": 93.75, "Relationship-Overall": 94.97, "Composition": 96.23, "Similarity": 95.00, "Inclusion": 94.89, "Comparison": 92.19, "Compound-Overall": 93.55, "Imagination": 95.64, "Feature matching": 91.40, "Grammar-Overall": 91.76, "Pronoun Reference": 92.91, "Consistency": 91.67, "Negation": 90.57, "Layout-Overall": 91.35, "2D": 91.04, "3D": 91.67, "Logical Reasoning": 
84.97, "Text": 89.24 }, { "model": "Imagen-4.0-Ultra-preview-06-06", "link": "https://deepmind.google/models/imagen/", "hf": "-", "open_source": false, "release_date": "2025-06", "Overall": 91.54, "Style": 99.20, "World Knowledge": 97.47, "Attribute-Overall": 92.52, "Quantity": 93.06, "Expression": 81.41, "Material": 94.34, "Size": 95.83, "Shape": 91.88, "Color": 100.0, "Action-Overall": 92.20, "Hand": 90.38, "Full body": 93.44, "Animal": 91.91, "Non Contact": 90.31, "Contact": 89.29, "State": 96.70, "Relationship-Overall": 93.02, "Composition": 95.27, "Similarity": 84.44, "Inclusion": 98.37, "Comparison": 92.19, "Compound-Overall": 91.37, "Imagination": 92.86, "Feature matching": 89.84, "Grammar-Overall": 87.97, "Pronoun Reference": 94.12, "Consistency": 87.04, "Negation": 82.31, "Layout-Overall": 93.10, "2D": 92.65, "3D": 93.56, "Logical Reasoning": 79.55, "Text": 89.08 }, { "model": "Seedream-3.0", "link": "https://www.byteplus.com/en/product/Seedream", "hf": "-", "open_source": false, "release_date": "2025-06", "Overall": 78.95, "Style": 98.10, "World Knowledge": 95.25, "Attribute-Overall": 85.58, "Quantity": 80.56, "Expression": 82.05, "Material": 90.57, "Size": 85.42, "Shape": 78.12, "Color": 97.50, "Action-Overall": 82.98, "Hand": 75.00, "Full body": 89.67, "Animal": 85.29, "Non Contact": 75.51, "Contact": 80.95, "State": 90.09, "Relationship-Overall": 80.84, "Composition": 82.77, "Similarity": 73.89, "Inclusion": 84.24, "Comparison": 81.25, "Compound-Overall": 73.84, "Imagination": 78.57, "Feature matching": 69.01, "Grammar-Overall": 61.36, "Pronoun Reference": 79.78, "Consistency": 69.91, "Negation": 35.00, "Layout-Overall": 87.31, "2D": 86.76, "3D": 87.88, "Logical Reasoning": 52.73, "Text": 71.55 }, { "model": "Imagen-3.0-generate-002", "link": "https://arxiv.org/pdf/2408.07009", "hf": "-", "open_source": false, "release_date": "2025-02", "Overall": 71.85, "Style": 89.25, "World Knowledge": 94.75, "Attribute-Overall": 77.33, "Quantity": 75.78, 
"Expression": 64.67, "Material": 80.66, "Size": 82.84, "Shape": 70.00, "Color": 93.10, "Action-Overall": 81.46, "Hand": 80.00, "Full body": 83.89, "Animal": 85.29, "Non Contact": 77.37, "Contact": 74.40, "State": 87.38, "Relationship-Overall": 82.86, "Composition": 83.90, "Similarity": 73.33, "Inclusion": 88.64, "Comparison": 83.90, "Compound-Overall": 71.71, "Imagination": 79.23, "Feature matching": 64.06, "Grammar-Overall": 69.84, "Pronoun Reference": 79.04, "Consistency": 70.75, "Negation": 59.13, "Layout-Overall": 81.34, "2D": 82.72, "3D": 79.92, "Logical Reasoning": 48.36, "Text": 21.55 }, { "model": "DALL-E-3", "link": "https://openai.com/zh-Hans-CN/index/dall-e-3/", "hf": "-", "open_source": false, "release_date": "2023-09", "Overall": 69.18, "Style": 95.06, "World Knowledge": 93.51, "Attribute-Overall": 75.97, "Quantity": 62.14, "Expression": 59.87, "Material": 87.74, "Size": 87.50, "Shape": 65.00, "Color": 92.50, "Action-Overall": 69.83, "Hand": 60.90, "Full body": 75.00, "Animal": 76.47, "Non Contact": 66.84, "Contact": 63.41, "State": 75.47, "Relationship-Overall": 78.06, "Composition": 82.43, "Similarity": 69.44, "Inclusion": 87.78, "Comparison": 66.41, "Compound-Overall": 70.60, "Imagination": 76.79, "Feature matching": 64.21, "Grammar-Overall": 68.07, "Pronoun Reference": 74.24, "Consistency": 74.07, "Negation": 56.64, "Layout-Overall": 66.67, "2D": 57.72, "3D": 76.17, "Logical Reasoning": 48.18, "Text": 25.86 }, { "model": "FLUX-pro-1.1-Ultra", "link": "https://bfl.ai/", "hf": "-", "open_source": false, "release_date": "2024-11", "Overall": 70.67, "Style": 90.60, "World Knowledge": 91.61, "Attribute-Overall": 76.50, "Quantity": 75.69, "Expression": 59.62, "Material": 78.77, "Size": 77.78, "Shape": 74.38, "Color": 96.67, "Action-Overall": 76.50, "Hand": 57.69, "Full body": 68.48, "Animal": 77.21, "Non Contact": 76.53, "Contact": 64.29, "State": 76.89, "Relationship-Overall": 77.54, "Composition": 80.41, "Similarity": 72.78, "Inclusion": 82.07, 
"Comparison": 71.09, "Compound-Overall": 67.78, "Imagination": 74.74, "Feature matching": 60.68, "Grammar-Overall": 70.05, "Pronoun Reference": 84.56, "Consistency": 68.98, "Negation": 55.77, "Layout-Overall": 81.53, "2D": 80.15, "3D": 82.95, "Logical Reasoning": 43.18, "Text": 37.36 }, { "model": "Keling-Ketu", "link": "https://kolors.kuaishou.com/", "hf": "-", "open_source": false, "release_date": "2025-04", "Overall": 65.93, "Style": 92.27, "World Knowledge": 86.62, "Attribute-Overall": 71.66, "Quantity": 75.00, "Expression": 56.41, "Material": 78.77, "Size": 79.17, "Shape": 53.12, "Color": 91.38, "Action-Overall": 68.73, "Hand": 54.49, "Full body": 76.09, "Animal": 72.79, "Non Contact": 69.90, "Contact": 58.93, "State": 76.89, "Relationship-Overall": 70.94, "Composition": 68.92, "Similarity": 70.56, "Inclusion": 74.46, "Comparison": 71.09, "Compound-Overall": 60.81, "Imagination": 66.24, "Feature matching": 55.26, "Grammar-Overall": 71.26, "Pronoun Reference": 77.21, "Consistency": 67.59, "Negation": 68.08, "Layout-Overall": 77.23, "2D": 80.97, "3D": 73.36, "Logical Reasoning": 43.75, "Text": 16.03 }, { "model": "Qwen-Image", "link": "https://arxiv.org/pdf/2508.02324", "hf": "https://huggingface.co/Qwen/Qwen-Image", "open_source": true, "release_date": "2025-08", "Overall": 78.81, "Style": 95.10, "World Knowledge": 94.30, "Attribute-Overall": 87.61, "Quantity": 81.94, "Expression": 84.62, "Material": 91.98, "Size": 84.03, "Shape": 84.38, "Color": 99.17, "Action-Overall": 84.13, "Hand": 82.05, "Full body": 88.59, "Animal": 88.24, "Non Contact": 80.61, "Contact": 77.38, "State": 87.74, "Relationship-Overall": 79.70, "Composition": 81.76, "Similarity": 67.78, "Inclusion": 86.96, "Comparison": 81.25, "Compound-Overall": 73.32, "Imagination": 73.21, "Feature matching": 73.44, "Grammar-Overall": 60.29, "Pronoun Reference": 83.82, "Consistency": 70.37, "Negation": 27.31, "Layout-Overall": 85.52, "2D": 86.40, "3D": 85.23, "Logical Reasoning": 53.64, "Text": 76.14 } ] }