๐Ÿค Do Chatbot LLMs Talk Too Much?
YapBench Benchmark
Measuring how wordy (length-biased) LLMs are when a short answer would do.
tabularis.ai | Total models: 76 | Last Update: 27 December 2025
{
  • "headers": [
    • "Rank",
    • "model",
    • "YapIndex",
    • "Cat A",
    • "Cat B",
    • "Cat C"
    ],
  • "data": [
    • [
      • "🥇",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-3.5-turbo</a>",
      • 22.7,
      • 18,
      • 36,
      • 14
      ],
    • [
      • "🥈",
      • "<a target="_blank" href="https://huggingface.co/moonshotai/kimi-k2-0905" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">moonshotai/kimi-k2-0905</a>",
      • 44.7,
      • 81,
      • 38.5,
      • 14.5
      ],
    • [
      • "🥉",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4</a>",
      • 51.2,
      • 44,
      • 28,
      • 81.5
      ],
    • [
      • "4",
      • "<a target="_blank" href="https://huggingface.co/z-ai/glm-4.7" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">z-ai/glm-4.7</a>",
      • 66.3,
      • 138.5,
      • 58.5,
      • 2
      ],
    • [
      • "5",
      • "<a target="_blank" href="https://x.ai/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">x-ai/grok-4-fast</a>",
      • 70.2,
      • 55.5,
      • 153.5,
      • 1.5
      ],
    • [
      • "6",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4.1-mini</a>",
      • 75.7,
      • 30,
      • 42,
      • 155
      ],
    • [
      • "7",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/o3</a>",
      • 84.3,
      • 96.5,
      • 47,
      • 109.5
      ],
    • [
      • "8",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5.1-codex</a>",
      • 85.3,
      • 61.5,
      • 41,
      • 153.5
      ],
    • [
      • "9",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5.2</a>",
      • 86.8,
      • 190,
      • 49.5,
      • 21
      ],
    • [
      • "10",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5.2 (reasoning)</a>",
      • 89.8,
      • 196.5,
      • 45.5,
      • 27.5
      ],
    • [
      • "11",
      • "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-opus-4.5</a>",
      • 97,
      • 217.5,
      • 50.5,
      • 23
      ],
    • [
      • "12",
      • "<a target="_blank" href="https://x.ai/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">x-ai/grok-4.1-fast</a>",
      • 98,
      • 27,
      • 263,
      • 4
      ],
    • [
      • "13",
      • "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-opus-4.5 (reasoning)</a>",
      • 99.2,
      • 224.5,
      • 50,
      • 23
      ],
    • [
      • "14",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5</a>",
      • 100.7,
      • 272.5,
      • 8.5,
      • 21
      ],
    • [
      • "15",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4.1-nano</a>",
      • 105.2,
      • 54.5,
      • 41.5,
      • 219.5
      ],
    • [
      • "16",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5.1</a>",
      • 111.8,
      • 214,
      • 44,
      • 77.5
      ],
    • [
      • "17",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/o4-mini</a>",
      • 115.5,
      • 88,
      • 80,
      • 178.5
      ],
    • [
      • "18",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5.1 (reasoning)</a>",
      • 120.8,
      • 223,
      • 46,
      • 93.5
      ],
    • [
      • "19",
      • "<a target="_blank" href="https://x.ai/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">x-ai/grok-4</a>",
      • 126.3,
      • 129,
      • 248,
      • 2
      ],
    • [
      • "20",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/o3-mini</a>",
      • 153.2,
      • 142,
      • 160.5,
      • 157
      ],
    • [
      • "21",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4o</a>",
      • 167.2,
      • 57.5,
      • 48.5,
      • 395.5
      ],
    • [
      • "22",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4.1</a>",
      • 168,
      • 92.5,
      • 83.5,
      • 328
      ],
    • [
      • "23",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5-nano</a>",
      • 175,
      • 353,
      • 82.5,
      • 89.5
      ],
    • [
      • "24",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4o-mini</a>",
      • 183.2,
      • 72.5,
      • 104.5,
      • 372.5
      ],
    • [
      • "25",
      • "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.5-flash (reasoning)</a>",
      • 195.2,
      • 337.5,
      • 68.5,
      • 179.5
      ],
    • [
      • "26",
      • "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-3.5-sonnet</a>",
      • 199.7,
      • 132.5,
      • 180.5,
      • 286
      ],
    • [
      • "27",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-oss-20b</a>",
      • 199.7,
      • 110.5,
      • 67,
      • 421.5
      ],
    • [
      • "28",
      • "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.5-flash</a>",
      • 210.5,
      • 482.5,
      • 42,
      • 107
      ],
    • [
      • "29",
      • "<a target="_blank" href="https://www.deepseek.com/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">deepseek/deepseek-v3.2 (reasoning)</a>",
      • 215,
      • 123.5,
      • 314,
      • 207.5
      ],
    • [
      • "30",
      • "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-3-pro-preview</a>",
      • 226,
      • 334.5,
      • 86.5,
      • 257
      ],
    • [
      • "31",
      • "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.0-flash-lite-001</a>",
      • 227.7,
      • 138,
      • 42,
      • 503
      ],
    • [
      • "32",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5-mini</a>",
      • 250.5,
      • 412,
      • 105,
      • 234.5
      ],
    • [
      • "33",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4-turbo</a>",
      • 252.5,
      • 78.5,
      • 63,
      • 616
      ],
    • [
      • "34",
      • "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-235b-a22b-2507 (reasoning)</a>",
      • 260.3,
      • 130,
      • 124,
      • 527
      ],
    • [
      • "35",
      • "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-235b-a22b-2507</a>",
      • 264,
      • 138,
      • 136.5,
      • 517.5
      ],
    • [
      • "36",
      • "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen-plus</a>",
      • 267.3,
      • 124,
      • 119.5,
      • 558.5
      ],
    • [
      • "37",
      • "<a target="_blank" href="https://huggingface.co/allenai/olmo-2-0325-32b-instruct" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">allenai/olmo-2-0325-32b-instruct</a>",
      • 268.7,
      • 620.5,
      • 164.5,
      • 21
      ],
    • [
      • "38",
      • "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-oss-120b</a>",
      • 269.7,
      • 142,
      • 128.5,
      • 538.5
      ],
    • [
      • "39",
      • "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-sonnet-4.5 (reasoning)</a>",
      • 278.7,
      • 289.5,
      • 131.5,
      • 415
      ],
    • [
      • "40",
      • "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.5-flash-lite (reasoning)</a>",
      • 280.5,
      • 186,
      • 47.5,
      • 608
      ],
    • [
      • "41",
      • "<a target="_blank" href="https://huggingface.co/microsoft/phi-4-reasoning-plus" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">microsoft/phi-4-reasoning-plus (reasoning)</a>",
      • 281,
      • 207,
      • 184.5,
      • 451.5
      ],
    • [
      • "42",
      • "<a target="_blank" href="https://huggingface.co/microsoft/phi-4-reasoning-plus" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">microsoft/phi-4-reasoning-plus</a>",
      • 281.2,
      • 210,
      • 187.5,
      • 446
      ],
    • [
      • "43",
      • "<a target="_blank" href="https://x.ai/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">x-ai/grok-code-fast-1</a>",
      • 284.5,
      • 137.5,
      • 474.5,
      • 241.5
      ],
    • [
      • "44",
      • "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-sonnet-4.5</a>",
      • 285,
      • 283.5,
      • 130,
      • 441.5
      ],
    • [
      • "45",
      • "<a target="_blank" href="https://huggingface.co/minimax/minimax-m2" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">minimax/minimax-m2</a>",
      • 297.3,
      • 138.5,
      • 385.5,
      • 368
      ],
    • [
      • "46",
      • "<a target="_blank" href="https://huggingface.co/meta-llama/llama-3.3-70b-instruct" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">meta-llama/llama-3.3-70b-instruct</a>",
      • 312.8,
      • 164,
      • 125.5,
      • 649
      ],
    • [
      • "47",
      • "<a target="_blank" href="https://huggingface.co/meta-llama/llama-3.1-8b-instruct" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">meta-llama/llama-3.1-8b-instruct</a>",
      • 315.7,
      • 135,
      • 96.5,
      • 715.5
      ],
    • [
      • "48",
      • "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-coder (reasoning)</a>",
      • 325.5,
      • 197,
      • 214.5,
      • 565
      ],
    • [
      • "49",
      • "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-coder</a>",
      • 326.3,
      • 194,
      • 202,
      • 583
      ],
    • [
      • "50",
      • "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.0-flash-001</a>",
      • 326.5,
      • 273,
      • 40,
      • 666.5
      ],
    • [
      • "51",
      • "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-haiku-4.5</a>",
      • 333.2,
      • 231,
      • 125,
      • 643.5
      ],
    • [
      • "52",
      • "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-haiku-4.5 (reasoning)</a>",
      • 335.2,
      • 237,
      • 125,
      • 643.5
      ],
    • [
      • "53",
      • "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-3-flash-preview</a>",
      • 339.3,
      • 426.5,
      • 120.5,
      • 471
      ],
    • [
      • "54",
      • "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-3-flash-preview (reasoning)</a>",
      • 340.8,
      • 395,
      • 117.5,
      • 510
      ],
    • [
      • "55",
      • "<a target="_blank" href="https://huggingface.co/meta-llama/llama-4-maverick" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">meta-llama/llama-4-maverick</a>",
      • 342.8,
      • 139,
      • 232,
      • 657.5
      ],
    • [
      • "56",
      • "<a target="_blank" href="https://www.deepseek.com/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">deepseek/deepseek-chat</a>",
      • 345.7,
      • 142,
      • 329.5,
      • 565.5
      ],
    • [
      • "57",
      • "<a target="_blank" href="https://huggingface.co/meta-llama/llama-4-scout" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">meta-llama/llama-4-scout</a>",
      • 350.5,
      • 138.5,
      • 177.5,
      • 735.5
      ],
    • [
      • "58",
      • "<a target="_blank" href="https://docs.mistral.ai/getting-started/models/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">mistralai/mistral-medium-3</a>",
      • 361,
      • 138,
      • 376.5,
      • 568.5
      ],
    • [
      • "59",
      • "<a target="_blank" href="https://docs.mistral.ai/getting-started/models/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">mistralai/mistral-small-3.1-24b-instruct</a>",
      • 389.2,
      • 190,
      • 215,
      • 762.5
      ],
    • [
      • "60",
      • "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-3.5-haiku</a>",
      • 401.2,
      • 168,
      • 280.5,
      • 755
      ],
    • [
      • "61",
      • "<a target="_blank" href="https://huggingface.co/z-ai/glm-4.6v" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">z-ai/glm-4.6v</a>",
      • 410.5,
      • 196,
      • 143,
      • 892.5
      ],
    • [
      • "62",
      • "<a target="_blank" href="https://www.deepseek.com/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">deepseek/deepseek-v3.2</a>",
      • 426.2,
      • 234.5,
      • 303,
      • 741
      ],
    • [
      • "63",
      • "<a target="_blank" href="https://docs.mistral.ai/getting-started/models/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">mistralai/mistral-large-2512</a>",
      • 444,
      • 405,
      • 370.5,
      • 556.5
      ],
    • [
      • "64",
      • "<a target="_blank" href="https://docs.mistral.ai/getting-started/models/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">mistralai/devstral-2512</a>",
      • 449,
      • 341,
      • 447,
      • 559
      ],
    • [
      • "65",
      • "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.5-flash-lite</a>",
      • 476.2,
      • 450,
      • 42.5,
      • 936
      ],
    • [
      • "66",
      • "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-vl-8b-instruct</a>",
      • 518,
      • 281,
      • 564.5,
      • 708.5
      ],
    • [
      • "67",
      • "<a target="_blank" href="https://huggingface.co/allenai/olmo-3.1-32b-think:free" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">allenai/olmo-3.1-32b-think:free</a>",
      • 530.5,
      • 172,
      • 596,
      • 823.5
      ],
    • [
      • "68",
      • "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.5-pro</a>",
      • 539.8,
      • 391,
      • 195.5,
      • 1033
      ],
    • [
      • "69",
      • "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-14b</a>",
      • 558,
      • 134,
      • 536,
      • 1004
      ],
    • [
      • "70",
      • "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-vl-235b-a22b-thinking</a>",
      • 602.8,
      • 214.5,
      • 830.5,
      • 763.5
      ],
    • [
      • "71",
      • "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-32b</a>",
      • 725.3,
      • 205,
      • 805,
      • 1166
      ],
    • [
      • "72",
      • "<a target="_blank" href="https://huggingface.co/amazon/nova-2-lite-v1" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">amazon/nova-2-lite-v1 (reasoning)</a>",
      • 788.3,
      • 1155.5,
      • 228.5,
      • 981
      ],
    • [
      • "73",
      • "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen-plus (reasoning)</a>",
      • 800.3,
      • 265,
      • 1125.5,
      • 1010.5
      ],
    • [
      • "74",
      • "<a target="_blank" href="https://huggingface.co/amazon/nova-2-lite-v1" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">amazon/nova-2-lite-v1</a>",
      • 896.3,
      • 568.5,
      • 585,
      • 1535.5
      ],
    • [
      • "75",
      • "<a target="_blank" href="https://huggingface.co/z-ai/glm-4.6:exacto" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">z-ai/glm-4.6:exacto</a>",
      • 930.7,
      • 1064,
      • 410.5,
      • 1317.5
      ],
    • [
      • "76",
      • "<a target="_blank" href="https://huggingface.co/z-ai/glm-4.5" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">z-ai/glm-4.5</a>",
      • 1427,
      • 1199.5,
      • 985.5,
      • 2096
      ]
    ],
  • "metadata": null
}