{
- "headers": [
- "Rank",
- "model",
- "YapIndex",
- "Cat A",
- "Cat B",
- "Cat C",
- "YapTax$"
- "data": [
- [
- "🥇",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-3.5-turbo</a>",
- "<span style="display:none">000022.7</span>22.7<span style="font-size:0.75em;color:#888;"> ±4.8</span>",
- "<span style="display:none">000018.0</span>18.0<span style="font-size:0.75em;color:#888;"> ±8.5</span>",
- "<span style="display:none">000036.0</span>36.0<span style="font-size:0.75em;color:#888;"> ±6.3</span>",
- "<span style="display:none">000014.0</span>14.0<span style="font-size:0.75em;color:#888;"> ±7.5</span>",
- 0.02
- [
- "🥈",
- "<a target="_blank" href="https://huggingface.co/moonshotai/kimi-k2-0905" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">moonshotai/kimi-k2-0905</a>",
- "<span style="display:none">000044.7</span>44.7<span style="font-size:0.75em;color:#888;"> ±4.8</span>",
- "<span style="display:none">000081.0</span>81.0<span style="font-size:0.75em;color:#888;"> ±11.5</span>",
- "<span style="display:none">000038.5</span>38.5<span style="font-size:0.75em;color:#888;"> ±5.0</span>",
- "<span style="display:none">000014.5</span>14.5<span style="font-size:0.75em;color:#888;"> ±4.2</span>",
- 0.05
- [
- "🥉",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4</a>",
- "<span style="display:none">000051.2</span>51.2<span style="font-size:0.75em;color:#888;"> ±20.6</span>",
- "<span style="display:none">000044.0</span>44.0<span style="font-size:0.75em;color:#888;"> ±16.0</span>",
- "<span style="display:none">000028.0</span>28.0<span style="font-size:0.75em;color:#888;"> ±2.8</span>",
- "<span style="display:none">000081.5</span>81.5<span style="font-size:0.75em;color:#888;"> ±56.5</span>",
- 1.39
- [
- "4",
- "<a target="_blank" href="https://huggingface.co/z-ai/glm-4.7" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">z-ai/glm-4.7</a>",
- "<span style="display:none">000066.3</span>66.3<span style="font-size:0.75em;color:#888;"> ±40.8</span>",
- "<span style="display:none">000138.5</span>138.5<span style="font-size:0.75em;color:#888;"> ±111.5</span>",
- "<span style="display:none">000058.5</span>58.5<span style="font-size:0.75em;color:#888;"> ±22.5</span>",
- "<span style="display:none">000002.0</span>2.0<span style="font-size:0.75em;color:#888;"> ±1.8</span>",
- 0.07
- [
- "5",
- "<a target="_blank" href="https://x.ai/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">x-ai/grok-4-fast</a>",
- "<span style="display:none">000070.2</span>70.2<span style="font-size:0.75em;color:#888;"> ±15.0</span>",
- "<span style="display:none">000055.5</span>55.5<span style="font-size:0.75em;color:#888;"> ±18.0</span>",
- "<span style="display:none">000153.5</span>153.5<span style="font-size:0.75em;color:#888;"> ±39.8</span>",
- "<span style="display:none">000001.5</span>1.5<span style="font-size:0.75em;color:#888;"> ±2.5</span>",
- 0.02
- [
- "6",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4.1-mini</a>",
- "<span style="display:none">000075.7</span>75.7<span style="font-size:0.75em;color:#888;"> ±15.3</span>",
- "<span style="display:none">000030.0</span>30.0<span style="font-size:0.75em;color:#888;"> ±5.5</span>",
- "<span style="display:none">000042.0</span>42.0<span style="font-size:0.75em;color:#888;"> ±5.8</span>",
- "<span style="display:none">000155.0</span>155.0<span style="font-size:0.75em;color:#888;"> ±43.5</span>",
- 0.06
- [
- "7",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/o3</a>",
- "<span style="display:none">000084.3</span>84.3<span style="font-size:0.75em;color:#888;"> ±14.7</span>",
- "<span style="display:none">000096.5</span>96.5<span style="font-size:0.75em;color:#888;"> ±25.0</span>",
- "<span style="display:none">000047.0</span>47.0<span style="font-size:0.75em;color:#888;"> ±7.8</span>",
- "<span style="display:none">000109.5</span>109.5<span style="font-size:0.75em;color:#888;"> ±33.0</span>",
- 0.29
- [
- "8",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5.1-codex</a>",
- "<span style="display:none">000085.3</span>85.3<span style="font-size:0.75em;color:#888;"> ±7.4</span>",
- "<span style="display:none">000061.5</span>61.5<span style="font-size:0.75em;color:#888;"> ±14.2</span>",
- "<span style="display:none">000041.0</span>41.0<span style="font-size:0.75em;color:#888;"> ±4.5</span>",
- "<span style="display:none">000153.5</span>153.5<span style="font-size:0.75em;color:#888;"> ±14.0</span>",
- 0.27
- [
- "9",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5.2</a>",
- "<span style="display:none">000086.8</span>86.8<span style="font-size:0.75em;color:#888;"> ±16.7</span>",
- "<span style="display:none">000190.0</span>190.0<span style="font-size:0.75em;color:#888;"> ±33.5</span>",
- "<span style="display:none">000049.5</span>49.5<span style="font-size:0.75em;color:#888;"> ±11.0</span>",
- "<span style="display:none">000021.0</span>21.0<span style="font-size:0.75em;color:#888;"> ±31.0</span>",
- 0.55
- [
- "10",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5.2 (reasoning)</a>",
- "<span style="display:none">000089.8</span>89.8<span style="font-size:0.75em;color:#888;"> ±22.0</span>",
- "<span style="display:none">000196.5</span>196.5<span style="font-size:0.75em;color:#888;"> ±49.0</span>",
- "<span style="display:none">000045.5</span>45.5<span style="font-size:0.75em;color:#888;"> ±9.8</span>",
- "<span style="display:none">000027.5</span>27.5<span style="font-size:0.75em;color:#888;"> ±34.8</span>",
- 0.52
- [
- "11",
- "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-opus-4.5</a>",
- "<span style="display:none">000097.0</span>97.0<span style="font-size:0.75em;color:#888;"> ±28.9</span>",
- "<span style="display:none">000217.5</span>217.5<span style="font-size:0.75em;color:#888;"> ±88.8</span>",
- "<span style="display:none">000050.5</span>50.5<span style="font-size:0.75em;color:#888;"> ±18.5</span>",
- "<span style="display:none">000023.0</span>23.0<span style="font-size:0.75em;color:#888;"> ±5.5</span>",
- 1.52
- [
- "12",
- "<a target="_blank" href="https://x.ai/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">x-ai/grok-4.1-fast</a>",
- "<span style="display:none">000098.0</span>98.0<span style="font-size:0.75em;color:#888;"> ±11.0</span>",
- "<span style="display:none">000027.0</span>27.0<span style="font-size:0.75em;color:#888;"> ±11.0</span>",
- "<span style="display:none">000263.0</span>263.0<span style="font-size:0.75em;color:#888;"> ±28.5</span>",
- "<span style="display:none">000004.0</span>4.0<span style="font-size:0.75em;color:#888;"> ±4.2</span>",
- 0.03
- [
- "13",
- "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-opus-4.5 (reasoning)</a>",
- "<span style="display:none">000099.2</span>99.2<span style="font-size:0.75em;color:#888;"> ±29.3</span>",
- "<span style="display:none">000224.5</span>224.5<span style="font-size:0.75em;color:#888;"> ±90.3</span>",
- "<span style="display:none">000050.0</span>50.0<span style="font-size:0.75em;color:#888;"> ±18.5</span>",
- "<span style="display:none">000023.0</span>23.0<span style="font-size:0.75em;color:#888;"> ±5.5</span>",
- 1.44
- [
- "14",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5</a>",
- "<span style="display:none">000100.7</span>100.7<span style="font-size:0.75em;color:#888;"> ±22.8</span>",
- "<span style="display:none">000272.5</span>272.5<span style="font-size:0.75em;color:#888;"> ±70.0</span>",
- "<span style="display:none">000008.5</span>8.5<span style="font-size:0.75em;color:#888;"> ±16.0</span>",
- "<span style="display:none">000021.0</span>21.0<span style="font-size:0.75em;color:#888;"> ±14.5</span>",
- 0.33
- [
- "15",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4.1-nano</a>",
- "<span style="display:none">000105.2</span>105.2<span style="font-size:0.75em;color:#888;"> ±10.7</span>",
- "<span style="display:none">000054.5</span>54.5<span style="font-size:0.75em;color:#888;"> ±16.0</span>",
- "<span style="display:none">000041.5</span>41.5<span style="font-size:0.75em;color:#888;"> ±4.2</span>",
- "<span style="display:none">000219.5</span>219.5<span style="font-size:0.75em;color:#888;"> ±23.0</span>",
- 0.02
- [
- "16",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5.1</a>",
- "<span style="display:none">000111.8</span>111.8<span style="font-size:0.75em;color:#888;"> ±22.6</span>",
- "<span style="display:none">000214.0</span>214.0<span style="font-size:0.75em;color:#888;"> ±58.0</span>",
- "<span style="display:none">000044.0</span>44.0<span style="font-size:0.75em;color:#888;"> ±12.8</span>",
- "<span style="display:none">000077.5</span>77.5<span style="font-size:0.75em;color:#888;"> ±43.3</span>",
- 0.42
- [
- "17",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/o4-mini</a>",
- "<span style="display:none">000115.5</span>115.5<span style="font-size:0.75em;color:#888;"> ±27.0</span>",
- "<span style="display:none">000088.0</span>88.0<span style="font-size:0.75em;color:#888;"> ±79.5</span>",
- "<span style="display:none">000080.0</span>80.0<span style="font-size:0.75em;color:#888;"> ±17.5</span>",
- "<span style="display:none">000178.5</span>178.5<span style="font-size:0.75em;color:#888;"> ±35.8</span>",
- 0.27
- [
- "18",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5.1 (reasoning)</a>",
- "<span style="display:none">000120.8</span>120.8<span style="font-size:0.75em;color:#888;"> ±22.3</span>",
- "<span style="display:none">000223.0</span>223.0<span style="font-size:0.75em;color:#888;"> ±48.0</span>",
- "<span style="display:none">000046.0</span>46.0<span style="font-size:0.75em;color:#888;"> ±12.5</span>",
- "<span style="display:none">000093.5</span>93.5<span style="font-size:0.75em;color:#888;"> ±44.8</span>",
- 0.43
- [
- "19",
- "<a target="_blank" href="https://x.ai/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">x-ai/grok-4</a>",
- "<span style="display:none">000126.3</span>126.3<span style="font-size:0.75em;color:#888;"> ±19.8</span>",
- "<span style="display:none">000129.0</span>129.0<span style="font-size:0.75em;color:#888;"> ±9.8</span>",
- "<span style="display:none">000248.0</span>248.0<span style="font-size:0.75em;color:#888;"> ±54.3</span>",
- "<span style="display:none">000002.0</span>2.0<span style="font-size:0.75em;color:#888;"> ±6.5</span>",
- 1.02
- [
- "20",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/o3-mini</a>",
- "<span style="display:none">000153.2</span>153.2<span style="font-size:0.75em;color:#888;"> ±15.6</span>",
- "<span style="display:none">000142.0</span>142.0<span style="font-size:0.75em;color:#888;"> ±27.0</span>",
- "<span style="display:none">000160.5</span>160.5<span style="font-size:0.75em;color:#888;"> ±33.5</span>",
- "<span style="display:none">000157.0</span>157.0<span style="font-size:0.75em;color:#888;"> ±18.2</span>",
- 0.17
- [
- "21",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4o</a>",
- "<span style="display:none">000167.2</span>167.2<span style="font-size:0.75em;color:#888;"> ±16.6</span>",
- "<span style="display:none">000057.5</span>57.5<span style="font-size:0.75em;color:#888;"> ±23.0</span>",
- "<span style="display:none">000048.5</span>48.5<span style="font-size:0.75em;color:#888;"> ±21.0</span>",
- "<span style="display:none">000395.5</span>395.5<span style="font-size:0.75em;color:#888;"> ±30.8</span>",
- 0.56
- [
- "22",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4.1</a>",
- "<span style="display:none">000168.0</span>168.0<span style="font-size:0.75em;color:#888;"> ±19.6</span>",
- "<span style="display:none">000092.5</span>92.5<span style="font-size:0.75em;color:#888;"> ±27.8</span>",
- "<span style="display:none">000083.5</span>83.5<span style="font-size:0.75em;color:#888;"> ±39.0</span>",
- "<span style="display:none">000328.0</span>328.0<span style="font-size:0.75em;color:#888;"> ±41.0</span>",
- 0.54
- [
- "23",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5-nano</a>",
- "<span style="display:none">000175.0</span>175.0<span style="font-size:0.75em;color:#888;"> ±24.5</span>",
- "<span style="display:none">000353.0</span>353.0<span style="font-size:0.75em;color:#888;"> ±56.0</span>",
- "<span style="display:none">000082.5</span>82.5<span style="font-size:0.75em;color:#888;"> ±20.8</span>",
- "<span style="display:none">000089.5</span>89.5<span style="font-size:0.75em;color:#888;"> ±48.0</span>",
- 0.02
- [
- "24",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4o-mini</a>",
- "<span style="display:none">000183.2</span>183.2<span style="font-size:0.75em;color:#888;"> ±25.8</span>",
- "<span style="display:none">000072.5</span>72.5<span style="font-size:0.75em;color:#888;"> ±35.8</span>",
- "<span style="display:none">000104.5</span>104.5<span style="font-size:0.75em;color:#888;"> ±48.0</span>",
- "<span style="display:none">000372.5</span>372.5<span style="font-size:0.75em;color:#888;"> ±53.5</span>",
- 0.04
- [
- "25",
- "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.5-flash (reasoning)</a>",
- "<span style="display:none">000195.2</span>195.2<span style="font-size:0.75em;color:#888;"> ±76.7</span>",
- "<span style="display:none">000337.5</span>337.5<span style="font-size:0.75em;color:#888;"> ±143.2</span>",
- "<span style="display:none">000068.5</span>68.5<span style="font-size:0.75em;color:#888;"> ±24.5</span>",
- "<span style="display:none">000179.5</span>179.5<span style="font-size:0.75em;color:#888;"> ±150.8</span>",
- 0.28
- [
- "26",
- "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-3.5-sonnet</a>",
- "<span style="display:none">000199.7</span>199.7<span style="font-size:0.75em;color:#888;"> ±24.5</span>",
- "<span style="display:none">000132.5</span>132.5<span style="font-size:0.75em;color:#888;"> ±14.5</span>",
- "<span style="display:none">000180.5</span>180.5<span style="font-size:0.75em;color:#888;"> ±38.5</span>",
- "<span style="display:none">000286.0</span>286.0<span style="font-size:0.75em;color:#888;"> ±53.8</span>",
- 2.53
- [
- "27",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-oss-20b</a>",
- "<span style="display:none">000199.7</span>199.7<span style="font-size:0.75em;color:#888;"> ±40.0</span>",
- "<span style="display:none">000110.5</span>110.5<span style="font-size:0.75em;color:#888;"> ±14.8</span>",
- "<span style="display:none">000067.0</span>67.0<span style="font-size:0.75em;color:#888;"> ±47.0</span>",
- "<span style="display:none">000421.5</span>421.5<span style="font-size:0.75em;color:#888;"> ±111.5</span>",
- 0.02
- [
- "28",
- "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.5-flash</a>",
- "<span style="display:none">000210.5</span>210.5<span style="font-size:0.75em;color:#888;"> ±84.2</span>",
- "<span style="display:none">000482.5</span>482.5<span style="font-size:0.75em;color:#888;"> ±92.2</span>",
- "<span style="display:none">000042.0</span>42.0<span style="font-size:0.75em;color:#888;"> ±4.8</span>",
- "<span style="display:none">000107.0</span>107.0<span style="font-size:0.75em;color:#888;"> ±179.5</span>",
- 0.31
- [
- "29",
- "<a target="_blank" href="https://www.deepseek.com/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">deepseek/deepseek-v3.2 (reasoning)</a>",
- "<span style="display:none">000215.0</span>215.0<span style="font-size:0.75em;color:#888;"> ±82.1</span>",
- "<span style="display:none">000123.5</span>123.5<span style="font-size:0.75em;color:#888;"> ±58.0</span>",
- "<span style="display:none">000314.0</span>314.0<span style="font-size:0.75em;color:#888;"> ±85.0</span>",
- "<span style="display:none">000207.5</span>207.5<span style="font-size:0.75em;color:#888;"> ±215.0</span>",
- 0.03
- [
- "30",
- "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-3-pro-preview</a>",
- "<span style="display:none">000226.0</span>226.0<span style="font-size:0.75em;color:#888;"> ±63.1</span>",
- "<span style="display:none">000334.5</span>334.5<span style="font-size:0.75em;color:#888;"> ±175.8</span>",
- "<span style="display:none">000086.5</span>86.5<span style="font-size:0.75em;color:#888;"> ±32.8</span>",
- "<span style="display:none">000257.0</span>257.0<span style="font-size:0.75em;color:#888;"> ±43.0</span>",
- 1.2
- [
- "31",
- "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.0-flash-lite-001</a>",
- "<span style="display:none">000227.7</span>227.7<span style="font-size:0.75em;color:#888;"> ±95.2</span>",
- "<span style="display:none">000138.0</span>138.0<span style="font-size:0.75em;color:#888;"> ±183.5</span>",
- "<span style="display:none">000042.0</span>42.0<span style="font-size:0.75em;color:#888;"> ±4.0</span>",
- "<span style="display:none">000503.0</span>503.0<span style="font-size:0.75em;color:#888;"> ±188.8</span>",
- 0.04
- [
- "32",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-5-mini</a>",
- "<span style="display:none">000250.5</span>250.5<span style="font-size:0.75em;color:#888;"> ±28.5</span>",
- "<span style="display:none">000412.0</span>412.0<span style="font-size:0.75em;color:#888;"> ±68.0</span>",
- "<span style="display:none">000105.0</span>105.0<span style="font-size:0.75em;color:#888;"> ±17.0</span>",
- "<span style="display:none">000234.5</span>234.5<span style="font-size:0.75em;color:#888;"> ±39.0</span>",
- 0.15
- [
- "33",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-4-turbo</a>",
- "<span style="display:none">000252.5</span>252.5<span style="font-size:0.75em;color:#888;"> ±36.8</span>",
- "<span style="display:none">000078.5</span>78.5<span style="font-size:0.75em;color:#888;"> ±45.5</span>",
- "<span style="display:none">000063.0</span>63.0<span style="font-size:0.75em;color:#888;"> ±45.5</span>",
- "<span style="display:none">000616.0</span>616.0<span style="font-size:0.75em;color:#888;"> ±93.2</span>",
- 2.66
- [
- "34",
- "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-235b-a22b-2507 (reasoning)</a>",
- "<span style="display:none">000260.3</span>260.3<span style="font-size:0.75em;color:#888;"> ±38.8</span>",
- "<span style="display:none">000130.0</span>130.0<span style="font-size:0.75em;color:#888;"> ±18.5</span>",
- "<span style="display:none">000124.0</span>124.0<span style="font-size:0.75em;color:#888;"> ±64.0</span>",
- "<span style="display:none">000527.0</span>527.0<span style="font-size:0.75em;color:#888;"> ±76.0</span>",
- 0.04
- [
- "35",
- "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-235b-a22b-2507</a>",
- "<span style="display:none">000264.0</span>264.0<span style="font-size:0.75em;color:#888;"> ±37.0</span>",
- "<span style="display:none">000138.0</span>138.0<span style="font-size:0.75em;color:#888;"> ±20.0</span>",
- "<span style="display:none">000136.5</span>136.5<span style="font-size:0.75em;color:#888;"> ±62.5</span>",
- "<span style="display:none">000517.5</span>517.5<span style="font-size:0.75em;color:#888;"> ±74.1</span>",
- 0.04
- [
- "36",
- "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen-plus</a>",
- "<span style="display:none">000267.3</span>267.3<span style="font-size:0.75em;color:#888;"> ±35.5</span>",
- "<span style="display:none">000124.0</span>124.0<span style="font-size:0.75em;color:#888;"> ±18.0</span>",
- "<span style="display:none">000119.5</span>119.5<span style="font-size:0.75em;color:#888;"> ±68.2</span>",
- "<span style="display:none">000558.5</span>558.5<span style="font-size:0.75em;color:#888;"> ±68.8</span>",
- 0.11
- [
- "37",
- "<a target="_blank" href="https://huggingface.co/allenai/olmo-2-0325-32b-instruct" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">allenai/olmo-2-0325-32b-instruct</a>",
- "<span style="display:none">000268.7</span>268.7<span style="font-size:0.75em;color:#888;"> ±50.3</span>",
- "<span style="display:none">000620.5</span>620.5<span style="font-size:0.75em;color:#888;"> ±129.0</span>",
- "<span style="display:none">000164.5</span>164.5<span style="font-size:0.75em;color:#888;"> ±42.0</span>",
- "<span style="display:none">000021.0</span>21.0<span style="font-size:0.75em;color:#888;"> ±22.0</span>",
- 0.02
- [
- "38",
- "<a target="_blank" href="https://platform.openai.com/docs/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">openai/gpt-oss-120b</a>",
- "<span style="display:none">000269.7</span>269.7<span style="font-size:0.75em;color:#888;"> ±69.6</span>",
- "<span style="display:none">000142.0</span>142.0<span style="font-size:0.75em;color:#888;"> ±64.1</span>",
- "<span style="display:none">000128.5</span>128.5<span style="font-size:0.75em;color:#888;"> ±56.1</span>",
- "<span style="display:none">000538.5</span>538.5<span style="font-size:0.75em;color:#888;"> ±214.0</span>",
- 0.03
- [
- "39",
- "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-sonnet-4.5 (reasoning)</a>",
- "<span style="display:none">000278.7</span>278.7<span style="font-size:0.75em;color:#888;"> ±41.7</span>",
- "<span style="display:none">000289.5</span>289.5<span style="font-size:0.75em;color:#888;"> ±96.0</span>",
- "<span style="display:none">000131.5</span>131.5<span style="font-size:0.75em;color:#888;"> ±22.8</span>",
- "<span style="display:none">000415.0</span>415.0<span style="font-size:0.75em;color:#888;"> ±66.3</span>",
- 1.65
- [
- "40",
- "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.5-flash-lite (reasoning)</a>",
- "<span style="display:none">000280.5</span>280.5<span style="font-size:0.75em;color:#888;"> ±56.8</span>",
- "<span style="display:none">000186.0</span>186.0<span style="font-size:0.75em;color:#888;"> ±125.5</span>",
- "<span style="display:none">000047.5</span>47.5<span style="font-size:0.75em;color:#888;"> ±16.8</span>",
- "<span style="display:none">000608.0</span>608.0<span style="font-size:0.75em;color:#888;"> ±122.5</span>",
- 0.06
- [
- "41",
- "<a target="_blank" href="https://huggingface.co/microsoft/phi-4-reasoning-plus (reasoning)" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">microsoft/phi-4-reasoning-plus (reasoning)</a>",
- "<span style="display:none">000281.0</span>281.0<span style="font-size:0.75em;color:#888;"> ±19.7</span>",
- "<span style="display:none">000207.0</span>207.0<span style="font-size:0.75em;color:#888;"> ±21.5</span>",
- "<span style="display:none">000184.5</span>184.5<span style="font-size:0.75em;color:#888;"> ±34.2</span>",
- "<span style="display:none">000451.5</span>451.5<span style="font-size:0.75em;color:#888;"> ±43.8</span>",
- 0.03
- [
- "42",
- "<a target="_blank" href="https://huggingface.co/microsoft/phi-4-reasoning-plus" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">microsoft/phi-4-reasoning-plus</a>",
- "<span style="display:none">000281.2</span>281.2<span style="font-size:0.75em;color:#888;"> ±18.2</span>",
- "<span style="display:none">000210.0</span>210.0<span style="font-size:0.75em;color:#888;"> ±16.5</span>",
- "<span style="display:none">000187.5</span>187.5<span style="font-size:0.75em;color:#888;"> ±33.8</span>",
- "<span style="display:none">000446.0</span>446.0<span style="font-size:0.75em;color:#888;"> ±38.8</span>",
- 0.03
- [
- "43",
- "<a target="_blank" href="https://x.ai/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">x-ai/grok-code-fast-1</a>",
- "<span style="display:none">000284.5</span>284.5<span style="font-size:0.75em;color:#888;"> ±41.8</span>",
- "<span style="display:none">000137.5</span>137.5<span style="font-size:0.75em;color:#888;"> ±48.5</span>",
- "<span style="display:none">000474.5</span>474.5<span style="font-size:0.75em;color:#888;"> ±72.8</span>",
- "<span style="display:none">000241.5</span>241.5<span style="font-size:0.75em;color:#888;"> ±114.8</span>",
- 0.14
- [
- "44",
- "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-sonnet-4.5</a>",
- "<span style="display:none">000285.0</span>285.0<span style="font-size:0.75em;color:#888;"> ±39.4</span>",
- "<span style="display:none">000283.5</span>283.5<span style="font-size:0.75em;color:#888;"> ±84.8</span>",
- "<span style="display:none">000130.0</span>130.0<span style="font-size:0.75em;color:#888;"> ±27.3</span>",
- "<span style="display:none">000441.5</span>441.5<span style="font-size:0.75em;color:#888;"> ±62.3</span>",
- 1.63
- [
- "45",
- "<a target="_blank" href="https://huggingface.co/minimax/minimax-m2" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">minimax/minimax-m2</a>",
- "<span style="display:none">000297.3</span>297.3<span style="font-size:0.75em;color:#888;"> ±106.3</span>",
- "<span style="display:none">000138.5</span>138.5<span style="font-size:0.75em;color:#888;"> ±34.5</span>",
- "<span style="display:none">000385.5</span>385.5<span style="font-size:0.75em;color:#888;"> ±147.1</span>",
- "<span style="display:none">000368.0</span>368.0<span style="font-size:0.75em;color:#888;"> ±254.5</span>",
- 0.1
- [
- "46",
- "<a target="_blank" href="https://huggingface.co/meta-llama/llama-3.3-70b-instruct" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">meta-llama/llama-3.3-70b-instruct</a>",
- "<span style="display:none">000312.8</span>312.8<span style="font-size:0.75em;color:#888;"> ±45.0</span>",
- "<span style="display:none">000164.0</span>164.0<span style="font-size:0.75em;color:#888;"> ±33.2</span>",
- "<span style="display:none">000125.5</span>125.5<span style="font-size:0.75em;color:#888;"> ±73.8</span>",
- "<span style="display:none">000649.0</span>649.0<span style="font-size:0.75em;color:#888;"> ±102.2</span>",
- 0.03
- [
- "47",
- "<a target="_blank" href="https://huggingface.co/meta-llama/llama-3.1-8b-instruct" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">meta-llama/llama-3.1-8b-instruct</a>",
- "<span style="display:none">000315.7</span>315.7<span style="font-size:0.75em;color:#888;"> ±45.2</span>",
- "<span style="display:none">000135.0</span>135.0<span style="font-size:0.75em;color:#888;"> ±19.2</span>",
- "<span style="display:none">000096.5</span>96.5<span style="font-size:0.75em;color:#888;"> ±56.0</span>",
- "<span style="display:none">000715.5</span>715.5<span style="font-size:0.75em;color:#888;"> ±116.0</span>",
- 0
- [
- "48",
- "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-coder (reasoning)</a>",
- "<span style="display:none">000325.5</span>325.5<span style="font-size:0.75em;color:#888;"> ±30.3</span>",
- "<span style="display:none">000197.0</span>197.0<span style="font-size:0.75em;color:#888;"> ±35.3</span>",
- "<span style="display:none">000214.5</span>214.5<span style="font-size:0.75em;color:#888;"> ±41.8</span>",
- "<span style="display:none">000565.0</span>565.0<span style="font-size:0.75em;color:#888;"> ±76.5</span>",
- 0.1
- [
- "49",
- "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-coder</a>",
- "<span style="display:none">000326.3</span>326.3<span style="font-size:0.75em;color:#888;"> ±22.3</span>",
- "<span style="display:none">000194.0</span>194.0<span style="font-size:0.75em;color:#888;"> ±25.0</span>",
- "<span style="display:none">000202.0</span>202.0<span style="font-size:0.75em;color:#888;"> ±39.1</span>",
- "<span style="display:none">000583.0</span>583.0<span style="font-size:0.75em;color:#888;"> ±45.5</span>",
- 0.1
- [
- "50",
- "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.0-flash-001</a>",
- "<span style="display:none">000326.5</span>326.5<span style="font-size:0.75em;color:#888;"> ±87.0</span>",
- "<span style="display:none">000273.0</span>273.0<span style="font-size:0.75em;color:#888;"> ±141.5</span>",
- "<span style="display:none">000040.0</span>40.0<span style="font-size:0.75em;color:#888;"> ±4.0</span>",
- "<span style="display:none">000666.5</span>666.5<span style="font-size:0.75em;color:#888;"> ±204.9</span>",
- 0.06
- [
- "51",
- "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-haiku-4.5</a>",
- "<span style="display:none">000333.2</span>333.2<span style="font-size:0.75em;color:#888;"> ±26.7</span>",
- "<span style="display:none">000231.0</span>231.0<span style="font-size:0.75em;color:#888;"> ±54.2</span>",
- "<span style="display:none">000125.0</span>125.0<span style="font-size:0.75em;color:#888;"> ±29.0</span>",
- "<span style="display:none">000643.5</span>643.5<span style="font-size:0.75em;color:#888;"> ±43.0</span>",
- 0.64
- [
- "52",
- "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-haiku-4.5 (reasoning)</a>",
- "<span style="display:none">000335.2</span>335.2<span style="font-size:0.75em;color:#888;"> ±26.8</span>",
- "<span style="display:none">000237.0</span>237.0<span style="font-size:0.75em;color:#888;"> ±54.8</span>",
- "<span style="display:none">000125.0</span>125.0<span style="font-size:0.75em;color:#888;"> ±32.8</span>",
- "<span style="display:none">000643.5</span>643.5<span style="font-size:0.75em;color:#888;"> ±40.0</span>",
- 0.65
- [
- "53",
- "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-3-flash-preview</a>",
- "<span style="display:none">000339.3</span>339.3<span style="font-size:0.75em;color:#888;"> ±50.4</span>",
- "<span style="display:none">000426.5</span>426.5<span style="font-size:0.75em;color:#888;"> ±123.5</span>",
- "<span style="display:none">000120.5</span>120.5<span style="font-size:0.75em;color:#888;"> ±49.8</span>",
- "<span style="display:none">000471.0</span>471.0<span style="font-size:0.75em;color:#888;"> ±58.0</span>",
- 0.37
- [
- "54",
- "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-3-flash-preview (reasoning)</a>",
- "<span style="display:none">000340.8</span>340.8<span style="font-size:0.75em;color:#888;"> ±66.4</span>",
- "<span style="display:none">000395.0</span>395.0<span style="font-size:0.75em;color:#888;"> ±175.5</span>",
- "<span style="display:none">000117.5</span>117.5<span style="font-size:0.75em;color:#888;"> ±60.3</span>",
- "<span style="display:none">000510.0</span>510.0<span style="font-size:0.75em;color:#888;"> ±53.8</span>",
- 0.42
- [
- "55",
- "<a target="_blank" href="https://huggingface.co/meta-llama/llama-4-maverick" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">meta-llama/llama-4-maverick</a>",
- "<span style="display:none">000342.8</span>342.8<span style="font-size:0.75em;color:#888;"> ±64.6</span>",
- "<span style="display:none">000139.0</span>139.0<span style="font-size:0.75em;color:#888;"> ±33.0</span>",
- "<span style="display:none">000232.0</span>232.0<span style="font-size:0.75em;color:#888;"> ±55.8</span>",
- "<span style="display:none">000657.5</span>657.5<span style="font-size:0.75em;color:#888;"> ±173.5</span>",
- 0.07
- [
- "56",
- "<a target="_blank" href="https://www.deepseek.com/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">deepseek/deepseek-chat</a>",
- "<span style="display:none">000345.7</span>345.7<span style="font-size:0.75em;color:#888;"> ±22.3</span>",
- "<span style="display:none">000142.0</span>142.0<span style="font-size:0.75em;color:#888;"> ±28.5</span>",
- "<span style="display:none">000329.5</span>329.5<span style="font-size:0.75em;color:#888;"> ±45.5</span>",
- "<span style="display:none">000565.5</span>565.5<span style="font-size:0.75em;color:#888;"> ±41.0</span>",
- 0.15
- [
- "57",
- "<a target="_blank" href="https://huggingface.co/meta-llama/llama-4-scout" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">meta-llama/llama-4-scout</a>",
- "<span style="display:none">000350.5</span>350.5<span style="font-size:0.75em;color:#888;"> ±39.3</span>",
- "<span style="display:none">000138.5</span>138.5<span style="font-size:0.75em;color:#888;"> ±16.0</span>",
- "<span style="display:none">000177.5</span>177.5<span style="font-size:0.75em;color:#888;"> ±73.0</span>",
- "<span style="display:none">000735.5</span>735.5<span style="font-size:0.75em;color:#888;"> ±85.5</span>",
- 0.04
- [
- "58",
- "<a target="_blank" href="https://docs.mistral.ai/getting-started/models/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">mistralai/mistral-medium-3</a>",
- "<span style="display:none">000361.0</span>361.0<span style="font-size:0.75em;color:#888;"> ±34.0</span>",
- "<span style="display:none">000138.0</span>138.0<span style="font-size:0.75em;color:#888;"> ±51.0</span>",
- "<span style="display:none">000376.5</span>376.5<span style="font-size:0.75em;color:#888;"> ±59.5</span>",
- "<span style="display:none">000568.5</span>568.5<span style="font-size:0.75em;color:#888;"> ±53.2</span>",
- 0.28
- [
- "59",
- "<a target="_blank" href="https://docs.mistral.ai/getting-started/models/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">mistralai/mistral-small-3.1-24b-instruct</a>",
- "<span style="display:none">000389.2</span>389.2<span style="font-size:0.75em;color:#888;"> ±37.0</span>",
- "<span style="display:none">000190.0</span>190.0<span style="font-size:0.75em;color:#888;"> ±37.0</span>",
- "<span style="display:none">000215.0</span>215.0<span style="font-size:0.75em;color:#888;"> ±37.0</span>",
- "<span style="display:none">000762.5</span>762.5<span style="font-size:0.75em;color:#888;"> ±83.6</span>",
- 0.01
- [
- "60",
- "<a target="_blank" href="https://docs.anthropic.com/en/docs/models-overview" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">anthropic/claude-3.5-haiku</a>",
- "<span style="display:none">000401.2</span>401.2<span style="font-size:0.75em;color:#888;"> ±25.4</span>",
- "<span style="display:none">000168.0</span>168.0<span style="font-size:0.75em;color:#888;"> ±30.5</span>",
- "<span style="display:none">000280.5</span>280.5<span style="font-size:0.75em;color:#888;"> ±15.5</span>",
- "<span style="display:none">000755.0</span>755.0<span style="font-size:0.75em;color:#888;"> ±61.5</span>",
- 0.59
- [
- "61",
- "<a target="_blank" href="https://huggingface.co/z-ai/glm-4.6v" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">z-ai/glm-4.6v</a>",
- "<span style="display:none">000410.5</span>410.5<span style="font-size:0.75em;color:#888;"> ±104.0</span>",
- "<span style="display:none">000196.0</span>196.0<span style="font-size:0.75em;color:#888;"> ±55.3</span>",
- "<span style="display:none">000143.0</span>143.0<span style="font-size:0.75em;color:#888;"> ±70.3</span>",
- "<span style="display:none">000892.5</span>892.5<span style="font-size:0.75em;color:#888;"> ±310.3</span>",
- 0.14
- [
- "62",
- "<a target="_blank" href="https://www.deepseek.com/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">deepseek/deepseek-v3.2</a>",
- "<span style="display:none">000426.2</span>426.2<span style="font-size:0.75em;color:#888;"> ±61.5</span>",
- "<span style="display:none">000234.5</span>234.5<span style="font-size:0.75em;color:#888;"> ±128.3</span>",
- "<span style="display:none">000303.0</span>303.0<span style="font-size:0.75em;color:#888;"> ±109.0</span>",
- "<span style="display:none">000741.0</span>741.0<span style="font-size:0.75em;color:#888;"> ±62.2</span>",
- 0.06
- [
- "63",
- "<a target="_blank" href="https://docs.mistral.ai/getting-started/models/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">mistralai/mistral-large-2512</a>",
- "<span style="display:none">000444.0</span>444.0<span style="font-size:0.75em;color:#888;"> ±60.3</span>",
- "<span style="display:none">000405.0</span>405.0<span style="font-size:0.75em;color:#888;"> ±126.0</span>",
- "<span style="display:none">000370.5</span>370.5<span style="font-size:0.75em;color:#888;"> ±77.0</span>",
- "<span style="display:none">000556.5</span>556.5<span style="font-size:0.75em;color:#888;"> ±75.8</span>",
- 0.28
- [
- "64",
- "<a target="_blank" href="https://docs.mistral.ai/getting-started/models/" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">mistralai/devstral-2512</a>",
- "<span style="display:none">000449.0</span>449.0<span style="font-size:0.75em;color:#888;"> ±53.3</span>",
- "<span style="display:none">000341.0</span>341.0<span style="font-size:0.75em;color:#888;"> ±113.5</span>",
- "<span style="display:none">000447.0</span>447.0<span style="font-size:0.75em;color:#888;"> ±74.5</span>",
- "<span style="display:none">000559.0</span>559.0<span style="font-size:0.75em;color:#888;"> ±60.5</span>",
- 0.03
- [
- "65",
- "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.5-flash-lite</a>",
- "<span style="display:none">000476.2</span>476.2<span style="font-size:0.75em;color:#888;"> ±73.5</span>",
- "<span style="display:none">000450.0</span>450.0<span style="font-size:0.75em;color:#888;"> ±121.5</span>",
- "<span style="display:none">000042.5</span>42.5<span style="font-size:0.75em;color:#888;"> ±4.5</span>",
- "<span style="display:none">000936.0</span>936.0<span style="font-size:0.75em;color:#888;"> ±174.5</span>",
- 0.07
- [
- "66",
- "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-vl-8b-instruct</a>",
- "<span style="display:none">000518.0</span>518.0<span style="font-size:0.75em;color:#888;"> ±38.6</span>",
- "<span style="display:none">000281.0</span>281.0<span style="font-size:0.75em;color:#888;"> ±48.8</span>",
- "<span style="display:none">000564.5</span>564.5<span style="font-size:0.75em;color:#888;"> ±54.3</span>",
- "<span style="display:none">000708.5</span>708.5<span style="font-size:0.75em;color:#888;"> ±93.5</span>",
- 0.1
- [
- "67",
- "<a target="_blank" href="https://huggingface.co/allenai/olmo-3.1-32b-think:free" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">allenai/olmo-3.1-32b-think:free</a>",
- "<span style="display:none">000530.5</span>530.5<span style="font-size:0.75em;color:#888;"> ±48.2</span>",
- "<span style="display:none">000172.0</span>172.0<span style="font-size:0.75em;color:#888;"> ±42.3</span>",
- "<span style="display:none">000596.0</span>596.0<span style="font-size:0.75em;color:#888;"> ±105.8</span>",
- "<span style="display:none">000823.5</span>823.5<span style="font-size:0.75em;color:#888;"> ±91.0</span>",
- 0
- [
- "68",
- "<a target="_blank" href="https://ai.google.dev/models" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">google/gemini-2.5-pro</a>",
- "<span style="display:none">000539.8</span>539.8<span style="font-size:0.75em;color:#888;"> ±98.2</span>",
- "<span style="display:none">000391.0</span>391.0<span style="font-size:0.75em;color:#888;"> ±139.5</span>",
- "<span style="display:none">000195.5</span>195.5<span style="font-size:0.75em;color:#888;"> ±73.0</span>",
- "<span style="display:none">001033.0</span>1033.0<span style="font-size:0.75em;color:#888;"> ±230.5</span>",
- 2.71
- [
- "69",
- "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-14b</a>",
- "<span style="display:none">000558.0</span>558.0<span style="font-size:0.75em;color:#888;"> ±32.0</span>",
- "<span style="display:none">000134.0</span>134.0<span style="font-size:0.75em;color:#888;"> ±18.2</span>",
- "<span style="display:none">000536.0</span>536.0<span style="font-size:0.75em;color:#888;"> ±87.3</span>",
- "<span style="display:none">001004.0</span>1004.0<span style="font-size:0.75em;color:#888;"> ±46.0</span>",
- 0.04
- [
- "70",
- "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-vl-235b-a22b-thinking</a>",
- "<span style="display:none">000602.8</span>602.8<span style="font-size:0.75em;color:#888;"> ±59.9</span>",
- "<span style="display:none">000214.5</span>214.5<span style="font-size:0.75em;color:#888;"> ±79.0</span>",
- "<span style="display:none">000830.5</span>830.5<span style="font-size:0.75em;color:#888;"> ±110.0</span>",
- "<span style="display:none">000763.5</span>763.5<span style="font-size:0.75em;color:#888;"> ±106.5</span>",
- 0.25
- [
- "71",
- "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen3-32b</a>",
- "<span style="display:none">000725.3</span>725.3<span style="font-size:0.75em;color:#888;"> ±47.8</span>",
- "<span style="display:none">000205.0</span>205.0<span style="font-size:0.75em;color:#888;"> ±47.0</span>",
- "<span style="display:none">000805.0</span>805.0<span style="font-size:0.75em;color:#888;"> ±95.8</span>",
- "<span style="display:none">001166.0</span>1166.0<span style="font-size:0.75em;color:#888;"> ±92.2</span>",
- 0.05
- [
- "72",
- "<a target="_blank" href="https://huggingface.co/amazon/nova-2-lite-v1" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">amazon/nova-2-lite-v1 (reasoning)</a>",
- "<span style="display:none">000788.3</span>788.3<span style="font-size:0.75em;color:#888;"> ±123.8</span>",
- "<span style="display:none">001155.5</span>1155.5<span style="font-size:0.75em;color:#888;"> ±319.5</span>",
- "<span style="display:none">000228.5</span>228.5<span style="font-size:0.75em;color:#888;"> ±74.0</span>",
- "<span style="display:none">000981.0</span>981.0<span style="font-size:0.75em;color:#888;"> ±182.0</span>",
- 1.96
- [
- "73",
- "<a target="_blank" href="https://huggingface.co/Qwen" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">qwen/qwen-plus (reasoning)</a>",
- "<span style="display:none">000800.3</span>800.3<span style="font-size:0.75em;color:#888;"> ±78.9</span>",
- "<span style="display:none">000265.0</span>265.0<span style="font-size:0.75em;color:#888;"> ±70.0</span>",
- "<span style="display:none">001125.5</span>1125.5<span style="font-size:0.75em;color:#888;"> ±160.3</span>",
- "<span style="display:none">001010.5</span>1010.5<span style="font-size:0.75em;color:#888;"> ±129.0</span>",
- 0.37
- [
- "74",
- "<a target="_blank" href="https://huggingface.co/amazon/nova-2-lite-v1" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">amazon/nova-2-lite-v1</a>",
- "<span style="display:none">000896.3</span>896.3<span style="font-size:0.75em;color:#888;"> ±91.3</span>",
- "<span style="display:none">000568.5</span>568.5<span style="font-size:0.75em;color:#888;"> ±121.8</span>",
- "<span style="display:none">000585.0</span>585.0<span style="font-size:0.75em;color:#888;"> ±120.0</span>",
- "<span style="display:none">001535.5</span>1535.5<span style="font-size:0.75em;color:#888;"> ±184.8</span>",
- 0.81
- [
- "75",
- "<a target="_blank" href="https://huggingface.co/z-ai/glm-4.6:exacto" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">z-ai/glm-4.6:exacto</a>",
- "<span style="display:none">000930.7</span>930.7<span style="font-size:0.75em;color:#888;"> ±244.3</span>",
- "<span style="display:none">001064.0</span>1064.0<span style="font-size:0.75em;color:#888;"> ±438.0</span>",
- "<span style="display:none">000410.5</span>410.5<span style="font-size:0.75em;color:#888;"> ±123.5</span>",
- "<span style="display:none">001317.5</span>1317.5<span style="font-size:0.75em;color:#888;"> ±522.0</span>",
- 0.56
- [
- "76",
- "<a target="_blank" href="https://huggingface.co/z-ai/glm-4.5" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">z-ai/glm-4.5</a>",
- "<span style="display:none">001427.0</span>1427.0<span style="font-size:0.75em;color:#888;"> ±487.2</span>",
- "<span style="display:none">001199.5</span>1199.5<span style="font-size:0.75em;color:#888;"> ±784.5</span>",
- "<span style="display:none">000985.5</span>985.5<span style="font-size:0.75em;color:#888;"> ±322.6</span>",
- "<span style="display:none">002096.0</span>2096.0<span style="font-size:0.75em;color:#888;"> ±822.5</span>",
- 0.76
- [
- "metadata": null