UniGenBench_Leaderboard_Chinese / leaderboard_data.json
CodeGoat24's picture
Update leaderboard_data.json
dd69fb3 verified
{
"leaderboard": [
{
"model": "wan2.5-t2i-preview",
"link": "https://help.aliyun.com/zh/model-studio/text-to-image-v2-api-reference",
"hf": "-",
"open_source": false,
"release_date": "2025-09",
"Overall": 78.40,
"Style": 93.30,
"World Knowledge": 93.51,
"Attribute-Overall": 83.65,
"Quantity": 78.47,
"Expression": 75.64,
"Material": 90.09,
"Size": 84.72,
"Shape": 76.88,
"Color": 96.67,
"Action-Overall": 76.62,
"Hand": 73.72,
"Full body": 72.28,
"Animal": 81.62,
"Non Contact": 77.04,
"Contact": 73.81,
"State": 81.13,
"Relationship-Overall": 81.85,
"Composition": 80.07,
"Similarity": 73.33,
"Inclusion": 88.04,
"Comparison": 89.06,
"Compound-Overall": 78.74,
"Imagination": 84.95,
"Feature matching": 72.40,
"Grammar-Overall": 72.58,
"Pronoun Reference": 82.72,
"Consistency": 70.37,
"Negation": 63.67,
"Layout-Overall": 75.93,
"2D": 76.10,
"3D": 75.76,
"Logical Reasoning": 63.64,
"Text": 64.22
},
{
"model": "Echo-4o",
"link": "https://arxiv.org/pdf/2508.09987",
"hf": "https://huggingface.co/Yejy53/Echo-4o",
"open_source": true,
"release_date": "2025-8",
"Overall": 72.40,
"Style": 92.80,
"World Knowledge": 87.66,
"Attribute-Overall": 84.29,
"Quantity": 72.92,
"Expression": 77.56,
"Material": 89.15,
"Size": 88.19,
"Shape": 80.00,
"Color": 99.17,
"Action-Overall": 76.05,
"Hand": 73.08,
"Full body": 83.15,
"Animal": 85.29,
"Non Contact": 75.00,
"Contact": 65.48,
"State": 75.47,
"Relationship-Overall": 82.23,
"Composition": 85.81,
"Similarity": 75.00,
"Inclusion": 88.04,
"Comparison": 75.78,
"Compound-Overall": 77.96,
"Imagination": 82.91,
"Feature matching": 72.92,
"Grammar-Overall": 75.40,
"Pronoun Reference": 80.15,
"Consistency": 77.31,
"Negation": 68.85,
"Layout-Overall": 83.02,
"2D": 84.19,
"3D": 81.82,
"Logical Reasoning": 56.82,
"Text": 7.76
},
{
"model": "Emu3",
"link": "https://arxiv.org/pdf/2409.18869",
"hf": "https://huggingface.co/BAAI/Emu3-Gen",
"open_source": true,
"release_date": "2024-09",
"Overall": 33.91,
"Style": 78.08,
"World Knowledge": 55.54,
"Attribute-Overall": 38.29,
"Quantity": 27.78,
"Expression": 30.13,
"Material": 44.34,
"Size": 32.64,
"Shape": 27.67,
"Color": 71.67,
"Action-Overall": 31.18,
"Hand": 16.67,
"Full body": 36.96,
"Animal": 49.26,
"Non Contact": 26.02,
"Contact": 17.86,
"State": 40.57,
"Relationship-Overall": 36.68,
"Composition": 43.58,
"Similarity": 31.67,
"Inclusion": 38.04,
"Comparison": 25.78,
"Compound-Overall": 21.65,
"Imagination": 29.85,
"Feature matching": 13.28,
"Grammar-Overall": 41.31,
"Pronoun Reference": 41.91,
"Consistency": 38.89,
"Negation": 42.69,
"Layout-Overall": 22.43,
"2D": 17.71,
"3D": 27.27,
"Logical Reasoning": 13.90,
"Text": 0.00
},
{
"model": "UniWorld-V1",
"link": "https://arxiv.org/pdf/2506.03147",
"hf": "https://huggingface.co/LanguageBind/UniWorld-V1",
"open_source": true,
"release_date": "2025-06",
"Overall": 15.21,
"Style": 49.40,
"World Knowledge": 16.61,
"Attribute-Overall": 15.06,
"Quantity": 14.58,
"Expression": 19.87,
"Material": 8.02,
"Size": 13.19,
"Shape": 5.00,
"Color": 37.50,
"Action-Overall": 14.64,
"Hand": 9.62,
"Full body": 17.93,
"Animal": 18.38,
"Non Contact": 9.69,
"Contact": 6.55,
"State": 24.06,
"Relationship-Overall": 11.80,
"Composition": 16.55,
"Similarity": 6.67,
"Inclusion": 12.50,
"Comparison": 7.03,
"Compound-Overall": 4.38,
"Imagination": 6.63,
"Feature matching": 2.08,
"Grammar-Overall": 27.81,
"Pronoun Reference": 19.85,
"Consistency": 16.20,
"Negation": 45.77,
"Layout-Overall": 9.14,
"2D": 8.09,
"3D": 10.23,
"Logical Reasoning": 2.95,
"Text": 0.29
},
{
"model": "Lumina-DiMOO",
"link": "https://synbol.github.io/Lumina-DiMOO/",
"hf": "https://huggingface.co/Alpha-VLLM/Lumina-DiMOO",
"open_source": true,
"release_date": "2025-09",
"Overall": 58.35,
"Style": 80.90,
"World Knowledge": 69.46,
"Attribute-Overall": 75.64,
"Quantity": 62.50,
"Expression": 71.79,
"Material": 77.83,
"Size": 78.47,
"Shape": 70.00,
"Color": 96.67,
"Action-Overall": 61.12,
"Hand": 42.95,
"Full body": 61.41,
"Animal": 76.47,
"Non Contact": 58.67,
"Contact": 51.79,
"State": 74.06,
"Relationship-Overall": 67.13,
"Composition": 68.58,
"Similarity": 62.78,
"Inclusion": 76.09,
"Comparison": 57.03,
"Compound-Overall": 56.06,
"Imagination": 56.96,
"Feature matching": 52.34,
"Grammar-Overall": 64.84,
"Pronoun Reference": 76.10,
"Consistency": 70.37,
"Negation": 48.46,
"Layout-Overall": 69.22,
"2D": 73.53,
"3D": 64.77,
"Logical Reasoning": 39.09,
"Text": 0.00
},
{
"model": "MMaDA",
"link": "https://arxiv.org/pdf/2505.15809",
"hf": "https://huggingface.co/Gen-Verse/MMaDA-8B-MixCoT",
"open_source": true,
"release_date": "2025-05",
"Overall": 44.00,
"Style": 78.20,
"World Knowledge": 52.06,
"Attribute-Overall": 55.24,
"Quantity": 52.78,
"Expression": 33.97,
"Material": 58.49,
"Size": 61.11,
"Shape": 45.00,
"Color": 86.67,
"Action-Overall": 43.44,
"Hand": 24.36,
"Full body": 54.35,
"Animal": 47.06,
"Non Contact": 31.63,
"Contact": 29.17,
"State": 67.92,
"Relationship-Overall": 56.22,
"Composition": 59.80,
"Similarity": 52.22,
"Inclusion": 60.87,
"Comparison": 46.88,
"Compound-Overall": 32.86,
"Imagination": 39.29,
"Feature matching": 26.30,
"Grammar-Overall": 58.56,
"Pronoun Reference": 59.93,
"Consistency": 46.30,
"Negation": 67.31,
"Layout-Overall": 37.31,
"2D": 38.97,
"3D": 35.61,
"Logical Reasoning": 26.14,
"Text": 0.00
},
{
"model": "OmniGen2",
"link": "https://arxiv.org/pdf/2506.18871",
"hf": "https://huggingface.co/OmniGen2/OmniGen2",
"open_source": true,
"release_date": "2025-06",
"Overall": 63.20,
"Style": 93.00,
"World Knowledge": 86.39,
"Attribute-Overall": 75.43,
"Quantity": 67.36,
"Expression": 69.87,
"Material": 78.30,
"Size": 77.78,
"Shape": 68.75,
"Color": 93.33,
"Action-Overall": 66.54,
"Hand": 64.10,
"Full body": 69.57,
"Animal": 74.26,
"Non Contact": 61.73,
"Contact": 55.95,
"State": 73.58,
"Relationship-Overall": 70.69,
"Composition": 77.03,
"Similarity": 66.67,
"Inclusion": 71.74,
"Comparison": 60.16,
"Compound-Overall": 59.92,
"Imagination": 66.33,
"Feature matching": 53.39,
"Grammar-Overall": 65.64,
"Pronoun Reference": 71.69,
"Consistency": 71.30,
"Negation": 54.62,
"Layout-Overall": 69.96,
"2D": 76.84,
"3D": 62.88,
"Logical Reasoning": 44.09,
"Text": 0.29
},
{
"model": "OneCAT",
"link": "https://arxiv.org/pdf/2509.03498",
"hf": "https://huggingface.co/onecat-ai/OneCAT-3B",
"open_source": true,
"release_date": "2025-09",
"Overall": 58.50,
"Style": 94.40,
"World Knowledge": 86.55,
"Attribute-Overall": 63.89,
"Quantity": 56.94,
"Expression": 66.03,
"Material": 73.58,
"Size": 65.28,
"Shape": 38.75,
"Color": 84.17,
"Action-Overall": 63.12,
"Hand": 42.31,
"Full body": 75.00,
"Animal": 80.88,
"Non Contact": 61.22,
"Contact": 44.05,
"State": 73.58,
"Relationship-Overall": 67.39,
"Composition": 72.64,
"Similarity": 61.67,
"Inclusion": 69.57,
"Comparison": 60.16,
"Compound-Overall": 51.55,
"Imagination": 63.52,
"Feature matching": 39.32,
"Grammar-Overall": 59.00,
"Pronoun Reference": 64.34,
"Consistency": 60.19,
"Negation": 52.69,
"Layout-Overall": 60.45,
"2D": 61.76,
"3D": 59.09,
"Logical Reasoning": 38.64,
"Text": 0.00
},
{
"model": "X-Omni",
"link": "https://arxiv.org/pdf/2507.22058",
"hf": "https://huggingface.co/X-Omni/X-Omni-Zh",
"open_source": true,
"release_date": "2025-08",
"Overall": 53.69,
"Style": 70.07,
"World Knowledge": 71.52,
"Attribute-Overall": 63.85,
"Quantity": 61.81,
"Expression": 52.56,
"Material": 63.51,
"Size": 67.36,
"Shape": 57.50,
"Color": 85.83,
"Action-Overall": 58.37,
"Hand": 48.72,
"Full body": 68.48,
"Animal": 63.97,
"Non Contact": 56.53,
"Contact": 43.45,
"State": 66.51,
"Relationship-Overall": 59.77,
"Composition": 60.14,
"Similarity": 60.00,
"Inclusion": 62.50,
"Comparison": 54.69,
"Compound-Overall": 41.75,
"Imagination": 48.72,
"Feature matching": 34.64,
"Grammar-Overall": 56.28,
"Pronoun Reference": 63.97,
"Consistency": 53.70,
"Negation": 50.38,
"Layout-Overall": 59.51,
"2D": 66.91,
"3D": 51.89,
"Logical Reasoning": 34.77,
"Text": 20.98
},
{
"model": "Bagel",
"link": "https://arxiv.org/pdf/2505.14683",
"hf": "https://huggingface.co/ByteDance-Seed/BAGEL-7B-MoT",
"open_source": true,
"release_date": "2025-05",
"Overall": 65.69,
"Style": 92.30,
"World Knowledge": 86.71,
"Attribute-Overall": 75.21,
"Quantity": 64.58,
"Expression": 63.46,
"Material": 83.49,
"Size": 79.86,
"Shape": 66.25,
"Color": 95.00,
"Action-Overall": 65.78,
"Hand": 61.54,
"Full body": 63.59,
"Animal": 75.74,
"Non Contact": 65.31,
"Contact": 61.90,
"State": 67.92,
"Relationship-Overall": 75.38,
"Composition": 77.70,
"Similarity": 67.78,
"Inclusion": 82.07,
"Comparison": 71.09,
"Compound-Overall": 69.85,
"Imagination": 79.59,
"Feature matching": 59.90,
"Grammar-Overall": 69.52,
"Pronoun Reference": 73.16,
"Consistency": 75.00,
"Negation": 61.15,
"Layout-Overall": 77.61,
"2D": 82.72,
"3D": 72.35,
"Logical Reasoning": 37.95,
"Text": 6.61
},
{
"model": "HiDream-I1-Full",
"link": "https://arxiv.org/pdf/2505.22705",
"hf": "https://huggingface.co/HiDream-ai/HiDream-I1-Full",
"open_source": true,
"release_date": "2025-05",
"Overall": 50.65,
"Style": 83.30,
"World Knowledge": 78.32,
"Attribute-Overall": 62.18,
"Quantity": 69.44,
"Expression": 45.51,
"Material": 55.66,
"Size": 70.14,
"Shape": 55.00,
"Color": 86.67,
"Action-Overall": 53.71,
"Hand": 44.23,
"Full body": 57.61,
"Animal": 55.88,
"Non Contact": 53.06,
"Contact": 47.62,
"State": 61.32,
"Relationship-Overall": 57.23,
"Composition": 57.77,
"Similarity": 52.78,
"Inclusion": 63.04,
"Comparison": 53.91,
"Compound-Overall": 34.54,
"Imagination": 38.01,
"Feature matching": 30.99,
"Grammar-Overall": 53.88,
"Pronoun Reference": 62.13,
"Consistency": 51.85,
"Negation": 46.92,
"Layout-Overall": 59.70,
"2D": 63.60,
"3D": 55.68,
"Logical Reasoning": 23.64,
"Text": 0.00
},
{
"model": "Hunyuan-Image-2.1",
"link": "https://github.com/Tencent-Hunyuan/HunyuanImage-2.1",
"hf": "https://huggingface.co/spaces/tencent/HunyuanImage-2.1",
"open_source": true,
"release_date": "2025-09",
"Overall": 77.76,
"Style": 92.20,
"World Knowledge": 90.51,
"Attribute-Overall": 84.19,
"Quantity": 87.50,
"Expression": 80.77,
"Material": 82.55,
"Size": 86.11,
"Shape": 75.00,
"Color": 97.50,
"Action-Overall": 80.51,
"Hand": 76.28,
"Full body": 84.24,
"Animal": 85.29,
"Non Contact": 78.06,
"Contact": 79.17,
"State": 80.66,
"Relationship-Overall": 82.74,
"Composition": 80.74,
"Similarity": 80.56,
"Inclusion": 87.50,
"Comparison": 83.59,
"Compound-Overall": 70.62,
"Imagination": 71.68,
"Feature matching": 69.53,
"Grammar-Overall": 61.50,
"Pronoun Reference": 80.15,
"Consistency": 67.13,
"Negation": 37.31,
"Layout-Overall": 85.45,
"2D": 88.24,
"3D": 82.58,
"Logical Reasoning": 50.23,
"Text": 79.60
},
{
"model": "BLIP3-o",
"link": "https://arxiv.org/pdf/2505.09568",
"hf": "https://huggingface.co/BLIP3o/BLIP3o-NEXT-SFT-3B",
"open_source": true,
"release_date": "2025-08",
"Overall": 59.25,
"Style": 92.60,
"World Knowledge": 81.17,
"Attribute-Overall": 66.56,
"Quantity": 57.64,
"Expression": 65.38,
"Material": 67.92,
"Size": 77.08,
"Shape": 47.50,
"Color": 89.17,
"Action-Overall": 64.35,
"Hand": 57.69,
"Full body": 73.37,
"Animal": 68.38,
"Non Contact": 59.18,
"Contact": 55.95,
"State": 70.28,
"Relationship-Overall": 65.36,
"Composition": 69.26,
"Similarity": 58.33,
"Inclusion": 63.04,
"Comparison": 69.53,
"Compound-Overall": 51.80,
"Imagination": 61.99,
"Feature matching": 41.41,
"Grammar-Overall": 63.37,
"Pronoun Reference": 70.22,
"Consistency": 57.41,
"Negation": 61.16,
"Layout-Overall": 65.67,
"2D": 69.12,
"3D": 62.12,
"Logical Reasoning": 41.59,
"Text": 0.00
},
{
"model": "BLIP3-o-Next",
"link": "https://arxiv.org/pdf/2505.09568",
"hf": "https://huggingface.co/BLIP3o/BLIP3o-NEXT-SFT-3B",
"open_source": true,
"release_date": "2025-08",
"Overall": 44.48,
"Style": 74.60,
"World Knowledge": 50.00,
"Attribute-Overall": 55.98,
"Quantity": 44.44,
"Expression": 57.69,
"Material": 56.13,
"Size": 63.89,
"Shape": 48.12,
"Color": 68.33,
"Action-Overall": 47.62,
"Hand": 37.82,
"Full body": 61.41,
"Animal": 45.59,
"Non Contact": 45.41,
"Contact": 36.90,
"State": 54.72,
"Relationship-Overall": 53.55,
"Composition": 54.05,
"Similarity": 48.33,
"Inclusion": 50.00,
"Comparison": 64.84,
"Compound-Overall": 26.55,
"Imagination": 32.14,
"Feature matching": 20.83,
"Grammar-Overall": 54.14,
"Pronoun Reference": 65.07,
"Consistency": 49.54,
"Negation": 46.54,
"Layout-Overall": 54.85,
"2D": 58.82,
"3D": 50.76,
"Logical Reasoning": 27.50,
"Text": 0.00
},
{
"model": "Janus-flow",
"link": "https://arxiv.org/pdf/2411.07975",
"hf": "https://huggingface.co/deepseek-ai/JanusFlow-1.3B",
"open_source": true,
"release_date": "2024-11",
"Overall": 20.93,
"Style": 58.50,
"World Knowledge": 18.67,
"Attribute-Overall": 19.23,
"Quantity": 22.92,
"Expression": 10.90,
"Material": 21.70,
"Size": 24.31,
"Shape": 8.12,
"Color": 30.00,
"Action-Overall": 22.05,
"Hand": 4.49,
"Full body": 31.52,
"Animal": 22.06,
"Non Contact": 14.80,
"Contact": 19.05,
"State": 35.85,
"Relationship-Overall": 19.54,
"Composition": 23.65,
"Similarity": 16.11,
"Inclusion": 20.11,
"Comparison": 14.06,
"Compound-Overall": 10.70,
"Imagination": 19.13,
"Feature matching": 2.08,
"Grammar-Overall": 35.03,
"Pronoun Reference": 32.72,
"Consistency": 16.67,
"Negation": 52.69,
"Layout-Overall": 14.93,
"2D": 12.13,
"3D": 17.80,
"Logical Reasoning": 10.68,
"Text": 0.00
},
{
"model": "CogView4",
"link": "https://arxiv.org/pdf/2403.05121",
"hf": "https://huggingface.co/zai-org/CogView4-6B",
"open_source": true,
"release_date": "2024-03",
"Overall": 55.14,
"Style": 82.40,
"World Knowledge": 84.18,
"Attribute-Overall": 63.35,
"Quantity": 68.75,
"Expression": 44.87,
"Material": 56.60,
"Size": 72.92,
"Shape": 53.75,
"Color": 94.17,
"Action-Overall": 61.69,
"Hand": 61.54,
"Full body": 66.30,
"Animal": 64.71,
"Non Contact": 52.04,
"Contact": 54.76,
"State": 70.28,
"Relationship-Overall": 61.68,
"Composition": 61.82,
"Similarity": 62.22,
"Inclusion": 63.59,
"Comparison": 57.81,
"Compound-Overall": 45.75,
"Imagination": 51.02,
"Feature matching": 40.36,
"Grammar-Overall": 54.55,
"Pronoun Reference": 67.65,
"Consistency": 57.41,
"Negation": 38.46,
"Layout-Overall": 65.30,
"2D": 75.00,
"3D": 55.30,
"Logical Reasoning": 30.23,
"Text": 2.30
},
{
"model": "Janus",
"link": "https://arxiv.org/pdf/2410.13848",
"hf": "https://huggingface.co/deepseek-ai/Janus-1.3B",
"open_source": true,
"release_date": "2024-10",
"Overall": 30.98,
"Style": 78.10,
"World Knowledge": 27.85,
"Attribute-Overall": 30.88,
"Quantity": 29.17,
"Expression": 17.31,
"Material": 35.85,
"Size": 45.83,
"Shape": 14.37,
"Color": 17.31,
"Action-Overall": 31.37,
"Hand": 14.10,
"Full body": 38.59,
"Animal": 42.65,
"Non Contact": 24.49,
"Contact": 23.21,
"State": 43.40,
"Relationship-Overall": 30.58,
"Composition": 32.43,
"Similarity": 32.22,
"Inclusion": 27.72,
"Comparison": 28.12,
"Compound-Overall": 17.53,
"Imagination": 25.26,
"Feature matching": 9.64,
"Grammar-Overall": 48.40,
"Pronoun Reference": 48.53,
"Consistency": 33.33,
"Negation": 60.77,
"Layout-Overall": 31.72,
"2D": 31.25,
"3D": 32.20,
"Logical Reasoning": 13.41,
"Text": 0.00
},
{
"model": "Janus-Pro",
"link": "https://arxiv.org/pdf/2501.17811",
"hf": "https://huggingface.co/deepseek-ai/Janus-Pro-7B",
"open_source": true,
"release_date": "2025-01",
"Overall": 30.83,
"Style": 75.60,
"World Knowledge": 39.08,
"Attribute-Overall": 33.12,
"Quantity": 24.31,
"Expression": 19.23,
"Material": 43.87,
"Size": 45.14,
"Shape": 18.75,
"Color": 47.50,
"Action-Overall": 26.33,
"Hand": 13.46,
"Full body": 26.09,
"Animal": 34.56,
"Non Contact": 22.45,
"Contact": 20.83,
"State": 38.68,
"Relationship-Overall": 32.74,
"Composition": 38.85,
"Similarity": 35.56,
"Inclusion": 26.09,
"Comparison": 24.22,
"Compound-Overall": 24.48,
"Imagination": 33.42,
"Feature matching": 15.36,
"Grammar-Overall": 36.63,
"Pronoun Reference": 36.76,
"Consistency": 31.94,
"Negation": 40.38,
"Layout-Overall": 30.04,
"2D": 29.78,
"3D": 30.30,
"Logical Reasoning": 10.23,
"Text": 0.00
},
{
"model": "Kolors",
"link": "https://github.com/Kwai-Kolors/Kolors/blob/master/imgs/Kolors_paper.pdf",
"hf": "https://huggingface.co/Kwai-Kolors/Kolors",
"open_source": true,
"release_date": "2024-7",
"Overall": 58.80,
"Style": 85.20,
"World Knowledge": 86.23,
"Attribute-Overall": 69.34,
"Quantity": 70.14,
"Expression": 51.92,
"Material": 73.11,
"Size": 77.78,
"Shape": 56.25,
"Color": 91.67,
"Action-Overall": 65.02,
"Hand": 58.33,
"Full body": 59.24,
"Animal": 71.32,
"Non Contact": 63.78,
"Contact": 57.54,
"State": 77.83,
"Relationship-Overall": 67.13,
"Composition": 71.96,
"Similarity": 69.44,
"Inclusion": 67.39,
"Comparison": 52.34,
"Compound-Overall": 66.03,
"Imagination": 64.80,
"Feature matching": 45.05,
"Grammar-Overall": 56.68,
"Pronoun Reference": 67.28,
"Consistency": 59.26,
"Negation": 43.46,
"Layout-Overall": 62.31,
"2D": 58.82,
"3D": 65.91,
"Logical Reasoning": 36.14,
"Text": 4.89
},
{
"model": "Seedream-4.0",
"link": "https://www.volcengine.com/docs/82379/1541523",
"hf": "-",
"open_source": false,
"release_date": "2025-09",
"Overall": 87.31,
"Style": 99.00,
"World Knowledge": 94.94,
"Attribute-Overall": 90.06,
"Quantity": 86.81,
"Expression": 85.90,
"Material": 97.64,
"Size": 86.81,
"Shape": 83.12,
"Color": 99.17,
"Action-Overall": 87.55,
"Hand": 82.69,
"Full body": 90.22,
"Animal": 91.91,
"Non Contact": 84.69,
"Contact": 82.74,
"State": 92.45,
"Relationship-Overall": 88.58,
"Composition": 85.14,
"Similarity": 84.44,
"Inclusion": 95.65,
"Comparison": 92.19,
"Compound-Overall": 81.57,
"Imagination": 85.20,
"Feature matching": 77.86,
"Grammar-Overall": 78.48,
"Pronoun Reference": 89.71,
"Consistency": 75.00,
"Negation": 69.62,
"Layout-Overall": 90.30,
"2D": 90.81,
"3D": 89.77,
"Logical Reasoning": 68.64,
"Text": 93.97
},
{
"model": "Imagen-4.0-generate-preview-06-06",
"link": "https://deepmind.google/models/imagen/",
"hf": "-",
"open_source": false,
"release_date": "2025-01",
"Overall": 79.52,
"Style": 97.50,
"World Knowledge": 96.84,
"Attribute-Overall": 86.22,
"Quantity": 83.33,
"Expression": 77.56,
"Material": 92.92,
"Size": 93.75,
"Shape": 72.50,
"Color": 98.33,
"Action-Overall": 90.40,
"Hand": 89.10,
"Full body": 89.67,
"Animal": 93.38,
"Non Contact": 86.73,
"Contact": 90.48,
"State": 93.40,
"Relationship-Overall": 90.74,
"Composition": 91.55,
"Similarity": 83.33,
"Inclusion": 94.57,
"Comparison": 93.75,
"Compound-Overall": 85.70,
"Imagination": 92.60,
"Feature matching": 78.65,
"Grammar-Overall": 82.89,
"Pronoun Reference": 92.65,
"Consistency": 82.87,
"Negation": 72.69,
"Layout-Overall": 89.18,
"2D": 91.54,
"3D": 86.74,
"Logical Reasoning": 73.18,
"Text": 2.59
},
{
"model": "Runway-Gen4-Image",
"link": "https://docs.dev.runwayml.com/api/#tag/Start-generating/paths/~1v1~1text_to_image/post",
"hf": "-",
"open_source": false,
"release_date": "2024-11",
"Overall": 54.93,
"Style": 64.75,
"World Knowledge": 71.05,
"Attribute-Overall": 60.43,
"Quantity": 54.29,
"Expression": 46.05,
"Material": 72.60,
"Size": 57.64,
"Shape": 50.62,
"Color": 81.90,
"Action-Overall": 60.42,
"Hand": 52.63,
"Full body": 65.22,
"Animal": 75.00,
"Non Contact": 51.56,
"Contact": 54.37,
"State": 65.09,
"Relationship-Overall": 65.90,
"Composition": 66.89,
"Similarity": 51.11,
"Inclusion": 74.43,
"Comparison": 72.66,
"Compound-Overall": 61.00,
"Imagination": 68.22,
"Feature matching": 53.49,
"Grammar-Overall": 58.38,
"Pronoun Reference": 55.38,
"Consistency": 55.09,
"Negation": 64.29,
"Layout-Overall": 64.71,
"2D": 59.93,
"3D": 69.62,
"Logical Reasoning": 42.03,
"Text": 0.59
},
{
"model": "HiDream_v2L",
"link": "https://hidreamai.com/doc/txt2img/request",
"hf": "-",
"open_source": false,
"release_date": "2025-07",
"Overall": 59.95,
"Style": 89.34,
"World Knowledge": 91.02,
"Attribute-Overall": 67.87,
"Quantity": 71.43,
"Expression": 42.31,
"Material": 70.59,
"Size": 70.00,
"Shape": 64.52,
"Color": 94.17,
"Action-Overall": 64.90,
"Hand": 48.72,
"Full body": 65.22,
"Animal": 75.00,
"Non Contact": 71.88,
"Contact": 55.95,
"State": 71.15,
"Relationship-Overall": 72.67,
"Composition": 78.82,
"Similarity": 65.00,
"Inclusion": 75.56,
"Comparison": 65.32,
"Compound-Overall": 53.19,
"Imagination": 62.63,
"Feature matching": 43.55,
"Grammar-Overall": 62.57,
"Pronoun Reference": 75.38,
"Consistency": 68.75,
"Negation": 44.53,
"Layout-Overall": 64.77,
"2D": 66.29,
"3D": 63.26,
"Logical Reasoning": 32.01,
"Text": 1.16
},
{
"model": "FLUX-kontext-pro",
"link": "https://bfl.ai/models/flux-kontext",
"hf": "-",
"open_source": false,
"release_date": "2025-05",
"Overall": 1.27,
"Style": 6.93,
"World Knowledge": 0.00,
"Attribute-Overall": 0.11,
"Quantity": 0.69,
"Expression": 0.00,
"Material": 0.00,
"Size": 0.00,
"Shape": 0.00,
"Color": 0.00,
"Action-Overall": 0.29,
"Hand": 0.00,
"Full body": 0.00,
"Animal": 0.00,
"Non Contact": 0.00,
"Contact": 0.00,
"State": 1.47,
"Relationship-Overall": 0.13,
"Composition": 0.34,
"Similarity": 0.00,
"Inclusion": 0.00,
"Comparison": 0.00,
"Compound-Overall": 0.00,
"Imagination": 0.00,
"Feature matching": 0.00,
"Grammar-Overall": 5.24,
"Pronoun Reference": 0.00,
"Consistency": 2.31,
"Negation": 13.28,
"Layout-Overall": 0.00,
"2D": 0.00,
"3D": 0.00,
"Logical Reasoning": 0.00,
"Text": 0.00
},
{
"model": "FLUX-pro-1.1-Ultra",
"link": "https://bfl.ai/",
"hf": "-",
"open_source": false,
"release_date": "2024-11",
"Overall": 1.31,
"Style": 7.63,
"World Knowledge": 0.32,
"Attribute-Overall": 0.32,
"Quantity": 0.00,
"Expression": 0.00,
"Material": 0.94,
"Size": 0.00,
"Shape": 0.00,
"Color": 0.83,
"Action-Overall": 0.00,
"Hand": 0.00,
"Full body": 0.00,
"Animal": 0.00,
"Non Contact": 0.00,
"Contact": 0.00,
"State": 0.00,
"Relationship-Overall": 0.26,
"Composition": 0.34,
"Similarity": 0.57,
"Inclusion": 0.00,
"Comparison": 0.00,
"Compound-Overall": 0.00,
"Imagination": 0.00,
"Feature matching": 0.00,
"Grammar-Overall": 4.30,
"Pronoun Reference": 0.37,
"Consistency": 1.39,
"Negation": 10.94,
"Layout-Overall": 0.19,
"2D": 0.37,
"3D": 0.00,
"Logical Reasoning": 0.00,
"Text": 0.00
},
{
"model": "DALL-E-3",
"link": "https://openai.com/zh-Hans-CN/index/dall-e-3/",
"hf": "-",
"open_source": false,
"release_date": "2023-09",
"Overall": 67.93,
"Style": 95.90,
"World Knowledge": 93.04,
"Attribute-Overall": 78.42,
"Quantity": 60.42,
"Expression": 68.59,
"Material": 91.04,
"Size": 90.28,
"Shape": 65.00,
"Color": 94.17,
"Action-Overall": 72.24,
"Hand": 69.87,
"Full body": 77.17,
"Animal": 82.35,
"Non Contact": 66.33,
"Contact": 61.90,
"State": 76.89,
"Relationship-Overall": 79.95,
"Composition": 81.76,
"Similarity": 77.78,
"Inclusion": 87.50,
"Comparison": 67.97,
"Compound-Overall": 72.94,
"Imagination": 82.14,
"Feature matching": 63.54,
"Grammar-Overall": 71.52,
"Pronoun Reference": 79.78,
"Consistency": 76.39,
"Negation": 58.85,
"Layout-Overall": 62.50,
"2D": 54.41,
"3D": 70.83,
"Logical Reasoning": 51.59,
"Text": 1.15
},
{
"model": "Qwen-Image",
"link": "https://arxiv.org/pdf/2508.02324",
"hf": "https://huggingface.co/Qwen/Qwen-Image",
"open_source": true,
"release_date": "2025-08",
"Overall": 81.04,
"Style": 95.50,
"World Knowledge": 92.41,
"Attribute-Overall": 91.88,
"Quantity": 88.89,
"Expression": 91.03,
"Material": 96.23,
"Size": 90.28,
"Shape": 86.25,
"Color": 98.33,
"Action-Overall": 85.74,
"Hand": 83.33,
"Full body": 87.50,
"Animal": 89.71,
"Non Contact": 81.63,
"Contact": 82.14,
"State": 90.09,
"Relationship-Overall": 82.99,
"Composition": 85.47,
"Similarity": 73.33,
"Inclusion": 90.76,
"Comparison": 79.69,
"Compound-Overall": 76.16,
"Imagination": 80.10,
"Feature matching": 72.14,
"Grammar-Overall": 62.83,
"Pronoun Reference": 83.46,
"Consistency": 74.07,
"Negation": 31.92,
"Layout-Overall": 82.65,
"2D": 84.93,
"3D": 80.30,
"Logical Reasoning": 57.73,
"Text": 82.47
},
{
"model": "wan2.2-t2i-plus",
"link": "https://help.aliyun.com/zh/model-studio/text-to-image-v2-api-reference",
"hf": "-",
"open_source": false,
"release_date": "2025-07",
"Overall": 66.96,
"Style": 91.06,
"World Knowledge": 84.39,
"Attribute-Overall": 73.93,
"Quantity": 75.00,
"Expression": 67.31,
"Material": 74.06,
"Size": 74.31,
"Shape": 66.25,
"Color": 90.83,
"Action-Overall": 72.52,
"Hand": 69.23,
"Full body": 80.00,
"Animal": 84.56,
"Non Contact": 65.31,
"Contact": 61.90,
"State": 75.94,
"Relationship-Overall": 76.78,
"Composition": 71.28,
"Similarity": 72.78,
"Inclusion": 85.87,
"Comparison": 82.03,
"Compound-Overall": 64.77,
"Imagination": 74.23,
"Feature matching": 55.00,
"Grammar-Overall": 70.59,
"Pronoun Reference": 77.21,
"Consistency": 63.43,
"Negation": 69.62,
"Layout-Overall": 71.83,
"2D": 73.16,
"3D": 70.45,
"Logical Reasoning": 51.82,
"Text": 11.92
},
{
"model": "FLUX.1-dev",
"link": "https://bfl.ai/blog/24-08-01-bfl",
"hf": "https://huggingface.co/black-forest-labs/FLUX.1-dev",
"open_source": true,
"release_date": "2024-08",
"Overall": 2.74,
"Style": 10.50,
"World Knowledge": 0.63,
"Attribute-Overall": 0.43,
"Quantity": 0.00,
"Expression": 1.92,
"Material": 0.47,
"Size": 0.00,
"Shape": 0.00,
"Color": 0.00,
"Action-Overall": 0.95,
"Hand": 1.92,
"Full body": 0.54,
"Animal": 0.74,
"Non Contact": 0.00,
"Contact": 0.00,
"State": 2.36,
"Relationship-Overall": 0.13,
"Composition": 0.34,
"Similarity": 0.00,
"Inclusion": 0.00,
"Comparison": 0.00,
"Compound-Overall": 0.13,
"Imagination": 0.26,
"Feature matching": 0.00,
"Grammar-Overall": 7.75,
"Pronoun Reference": 0.74,
"Consistency": 1.39,
"Negation": 20.38,
"Layout-Overall": 0.19,
"2D": 0.00,
"3D": 0.38,
"Logical Reasoning": 0.00,
"Text": 0.00
},
{
"model": "Nano Banana",
"link": "https://ainanobanana.io/",
"hf": "-",
"open_source": false,
"release_date": "2025-08",
"Overall": 80.91,
"Style": 99.27,
"World Knowledge": 96.47,
"Attribute-Overall": 87.76,
"Quantity": 81.62,
"Expression": 80.79,
"Material": 89.66,
"Size": 95.74,
"Shape": 82.05,
"Color": 98.33,
"Action-Overall": 86.99,
"Hand": 86.54,
"Full body": 91.38,
"Animal": 90.44,
"Non Contact": 81.96,
"Contact": 81.44,
"State": 90.64,
"Relationship-Overall": 91.39,
"Composition": 92.33,
"Similarity": 83.89,
"Inclusion": 93.44,
"Comparison": 96.88,
"Compound-Overall": 86.89,
"Imagination": 90.40,
"Feature matching": 83.42,
"Grammar-Overall": 83.33,
"Pronoun Reference": 87.27,
"Consistency": 84.69,
"Negation": 78.12,
"Layout-Overall": 88.80,
"2D": 91.82,
"3D": 85.66,
"Logical Reasoning": 76.10,
"Text": 12.06
},
{
"model": "Hunyuan-DiT",
"link": "https://arxiv.org/pdf/2405.08748",
"hf": "https://huggingface.co/Tencent-Hunyuan/HunyuanDiT",
"open_source": true,
"release_date": "2024-05",
"Overall": 53.36,
"Style": 92.50,
"World Knowledge": 84.97,
"Attribute-Overall": 62.93,
"Quantity": 63.19,
"Expression": 46.15,
"Material": 72.17,
"Size": 63.89,
"Shape": 49.38,
"Color": 85.00,
"Action-Overall": 57.22,
"Hand": 45.51,
"Full body": 67.93,
"Animal": 61.76,
"Non Contact": 48.47,
"Contact": 47.02,
"State": 69.81,
"Relationship-Overall": 59.39,
"Composition": 65.88,
"Similarity": 64.44,
"Inclusion": 56.52,
"Comparison": 41.41,
"Compound-Overall": 44.59,
"Imagination": 52.04,
"Feature matching": 36.98,
"Grammar-Overall": 54.68,
"Pronoun Reference": 59.93,
"Consistency": 62.04,
"Negation": 43.08,
"Layout-Overall": 47.76,
"2D": 39.71,
"3D": 56.06,
"Logical Reasoning": 29.55,
"Text": 0.00
},
{
"model": "Recraft",
"link": "https://www.recraft.ai/docs#generate-image",
"hf": "-",
"open_source": false,
"release_date": "2024-12",
"Overall": 57.67,
"Style": 87.70,
"World Knowledge": 90.03,
"Attribute-Overall": 69.34,
"Quantity": 66.67,
"Expression": 59.62,
"Material": 66.51,
"Size": 73.61,
"Shape": 61.25,
"Color": 95.83,
"Action-Overall": 63.88,
"Hand": 50.64,
"Full body": 72.28,
"Animal": 77.94,
"Non Contact": 63.78,
"Contact": 45.24,
"State": 72.17,
"Relationship-Overall": 64.47,
"Composition": 65.54,
"Similarity": 58.89,
"Inclusion": 65.22,
"Comparison": 68.75,
"Compound-Overall": 43.94,
"Imagination": 45.92,
"Feature matching": 41.93,
"Grammar-Overall": 60.56,
"Pronoun Reference": 62.87,
"Consistency": 59.26,
"Negation": 59.23,
"Layout-Overall": 58.40,
"2D": 55.15,
"3D": 61.74,
"Logical Reasoning": 34.09,
"Text": 4.31
},
{
"model": "Imagen-3.0-generate-002",
"link": "https://arxiv.org/pdf/2408.07009",
"hf": "-",
"open_source": false,
"release_date": "2025-02",
"Overall": 13.62,
"Style": 8.30,
"World Knowledge": 0.00,
"Attribute-Overall": 0.00,
"Quantity": 0.00,
"Expression": 0.00,
"Material": 0.00,
"Size": 0.00,
"Shape": 0.00,
"Color": 0.00,
"Action-Overall": 0.38,
"Hand": 0.00,
"Full body": 0.54,
"Animal": 0.00,
"Non Contact": 0.00,
"Contact": 0.00,
"State": 1.42,
"Relationship-Overall": 0.13,
"Composition": 0.34,
"Similarity": 0.00,
"Inclusion": 0.00,
"Comparison": 0.00,
"Compound-Overall": 0.00,
"Imagination": 0.00,
"Feature matching": 0.00,
"Grammar-Overall": 4.81,
"Pronoun Reference": 0.00,
"Consistency": 0.46,
"Negation": 13.46,
"Layout-Overall": 0.00,
"2D": 0.00,
"3D": 0.00,
"Logical Reasoning": 0.00,
"Text": 0.00
},
{
"model": "Imagen-4.0-Fast-preview-06-06",
"link": "https://deepmind.google/models/imagen/",
"hf": "-",
"open_source": false,
"release_date": "2025-06",
"Overall": 71.60,
"Style": 93.30,
"World Knowledge": 91.30,
"Attribute-Overall": 80.98,
"Quantity": 76.39,
"Expression": 66.03,
"Material": 83.49,
"Size": 88.19,
"Shape": 78.75,
"Color": 95.83,
"Action-Overall": 79.28,
"Hand": 74.36,
"Full body": 79.35,
"Animal": 83.82,
"Non Contact": 73.47,
"Contact": 75.60,
"State": 88.21,
"Relationship-Overall": 82.49,
"Composition": 82.09,
"Similarity": 78.33,
"Inclusion": 88.04,
"Comparison": 81.25,
"Compound-Overall": 73.97,
"Imagination": 83.67,
"Feature matching": 64.06,
"Grammar-Overall": 77.41,
"Pronoun Reference": 83.82,
"Consistency": 78.24,
"Negation": 70.00,
"Layout-Overall": 78.73,
"2D": 80.51,
"3D": 76.89,
"Logical Reasoning": 54.77,
"Text": 3.74
},
{
"model": "FLUX-kontext-max",
"link": "https://bfl.ai/models/flux-kontext",
"hf": "-",
"open_source": false,
"release_date": "2025-05",
"Overall": 71.85,
"Style": 96.38,
"World Knowledge": 92.83,
"Attribute-Overall": 76.41,
"Quantity": 65.97,
"Expression": 69.44,
"Material": 80.19,
"Size": 84.72,
"Shape": 66.67,
"Color": 93.33,
"Action-Overall": 78.59,
"Hand": 76.32,
"Full body": 83.15,
"Animal": 83.33,
"Non Contact": 69.90,
"Contact": 73.17,
"State": 85.78,
"Relationship-Overall": 83.97,
"Composition": 85.14,
"Similarity": 74.43,
"Inclusion": 91.67,
"Comparison": 83.59,
"Compound-Overall": 75.13,
"Imagination": 82.65,
"Feature matching": 67.12,
"Grammar-Overall": 75.68,
"Pronoun Reference": 79.85,
"Consistency": 75.46,
"Negation": 71.48,
"Layout-Overall": 81.34,
"2D": 81.62,
"3D": 81.06,
"Logical Reasoning": 56.48,
"Text": 1.72
},
{
"model": "Seedream-3.0",
"link": "https://www.byteplus.com/en/product/Seedream",
"hf": "-",
"open_source": false,
"release_date": "2025-06",
"Overall": 81.68,
"Style": 97.50,
"World Knowledge": 93.99,
"Attribute-Overall": 88.03,
"Quantity": 84.03,
"Expression": 82.69,
"Material": 94.34,
"Size": 89.58,
"Shape": 80.00,
"Color": 97.50,
"Action-Overall": 86.98,
"Hand": 85.26,
"Full body": 90.76,
"Animal": 89.71,
"Non Contact": 85.20,
"Contact": 80.36,
"State": 90.09,
"Relationship-Overall": 84.39,
"Composition": 86.82,
"Similarity": 74.44,
"Inclusion": 90.22,
"Comparison": 84.38,
"Compound-Overall": 76.68,
"Imagination": 82.14,
"Feature matching": 71.09,
"Grammar-Overall": 67.25,
"Pronoun Reference": 84.19,
"Consistency": 79.17,
"Negation": 39.62,
"Layout-Overall": 84.14,
"2D": 89.34,
"3D": 78.79,
"Logical Reasoning": 59.09,
"Text": 78.74
},
{
"model": "Imagen-4.0-Ultra-preview-06-06",
"link": "https://deepmind.google/models/imagen/",
"hf": "-",
"open_source": false,
"release_date": "2025-06",
"Overall": 83.21,
"Style": 98.90,
"World Knowledge": 97.94,
"Attribute-Overall": 90.71,
"Quantity": 88.89,
"Expression": 79.49,
"Material": 94.81,
"Size": 93.75,
"Shape": 88.12,
"Color": 100.0,
"Action-Overall": 93.82,
"Hand": 94.87,
"Full body": 92.93,
"Animal": 95.59,
"Non Contact": 87.76,
"Contact": 95.24,
"State": 97.17,
"Relationship-Overall": 92.13,
"Composition": 91.22,
"Similarity": 87.22,
"Inclusion": 97.83,
"Comparison": 92.97,
"Compound-Overall": 89.95,
"Imagination": 94.90,
"Feature matching": 84.90,
"Grammar-Overall": 87.43,
"Pronoun Reference": 93.01,
"Consistency": 85.65,
"Negation": 83.08,
"Layout-Overall": 92.16,
"2D": 93.75,
"3D": 90.53,
"Logical Reasoning": 79.32,
"Text": 9.77
},
{
"model": "GPT-4o",
"link": "https://platform.openai.com/docs/guides/image-generation",
"hf": "-",
"open_source": false,
"release_date": "2025-03",
"Overall": 91.02,
"Style": 99.39,
"World Knowledge": 98.72,
"Attribute-Overall": 94.99,
"Quantity": 93.62,
"Expression": 94.59,
"Material": 96.19,
"Size": 93.06,
"Shape": 92.95,
"Color": 100.0,
"Action-Overall": 92.34,
"Hand": 94.08,
"Full body": 97.28,
"Animal": 90.91,
"Non Contact": 90.31,
"Contact": 88.34,
"State": 92.65,
"Relationship-Overall": 95.77,
"Composition": 97.30,
"Similarity": 93.18,
"Inclusion": 96.69,
"Comparison": 94.53,
"Compound-Overall": 93.91,
"Imagination": 95.92,
"Feature matching": 91.74,
"Grammar-Overall": 91.02,
"Pronoun Reference": 95.15,
"Consistency": 89.35,
"Negation": 88.05,
"Layout-Overall": 89.27,
"2D": 89.18,
"3D": 89.35,
"Logical Reasoning": 91.44,
"Text": 63.37
}
]
}