1 claude-opus-4-6-thinking 1505±10 ±3,679 Unknown
2 claude-opus-4-6 1503±9 ±4,427 Unknown
3 gemini-3-pro 1486±4 ±35,513 Unknown
4 grok-4.1-thinking 1475±4 ±35,214 Unknown
5 gemini-3-flash 1472±5 ±26,167 Unknown
6 claude-opus-4-5-20251101-thinking-32k 1471±5 ±27,282 Unknown
7 claude-opus-4-5-20251101 1467±4 ±32,179 Unknown
8 grok-4.1 1464±4 ±39,284 Unknown
9 gemini-3-flash (thinking-minimal) 1462±5 ±17,361 Unknown
10 gpt-5.1-high 1458±4 ±31,519 Unknown
11 ernie-5.0-0110 1452±6Preliminary ±11,080 Unknown
12 claude-sonnet-4-5-20250929 1451±4 ±43,519 Unknown
13 claude-sonnet-4-5-20250929-thinking-32k 1450±4 ±45,809 Unknown
14 ernie-5.0-preview-1203 1449±7 ±9,773 Unknown
15 gemini-2.5-pro 1449±3 ±94,838 Unknown
16 claude-opus-4-1-20250805-thinking-16k 1449±4 ±49,947 Unknown
17 kimi-k2.5-thinking 1448±7 ±8,083 Unknown
18 claude-opus-4-1-20250805 1445±3 ±74,911 Unknown
19 gpt-4.5-preview-2025-02-27 1444±6 ±14,549 Unknown
20 chatgpt-4o-latest-20250326 1442±3 ±82,329 Unknown
21 glm-4.7 1441±6 ±12,013 Unknown
22 kimi-k2.5-instant 1438±10 ±3,830 Unknown
23 gpt-5.1 1438±4 ±33,736 Unknown
24 gpt-5.2 1438±6 ±12,759 Unknown
25 gpt-5.2-high 1436±6 ±16,100 Unknown
26 gpt-5-high 1434±5 ±32,619 Unknown
27 qwen3-max-preview 1434±5 ±27,842 Unknown
28 o3-2025-04-16 1432±4 ±61,351 Unknown
29 grok-4-1-fast-reasoning 1431±4 ±28,142 Unknown
30 kimi-k2-thinking-turbo 1429±4 ±33,118 Unknown
31 gpt-5-chat 1426±4 ±31,821 Unknown
32 glm-4.6 1425±4 ±35,331 Unknown
33 qwen3-max-2025-09-23 1425±6 ±9,223 Unknown
34 claude-opus-4-20250514-thinking-16k 1424±4 ±37,973 Unknown
35 deepseek-v3.2-exp 1423±6 ±11,762 Unknown
36 deepseek-v3.2-exp-thinking 1423±7 ±8,999 Unknown
37 qwen3-235b-a22b-instruct-2507 1422±3 ±69,176 Unknown
38 grok-4-fast-chat 1422±8 ±6,989 Unknown
39 deepseek-v3.2 1421±5 ±27,695 Unknown
40 deepseek-v3.2-thinking 1421±5 ±22,732 Unknown
41 deepseek-r1-0528 1418±6 ±19,289 Unknown
42 ernie-5.0-preview-1022 1418±9 ±4,616 Unknown
43 deepseek-v3.1 1418±6 ±15,298 Unknown
44 kimi-k2-0905-preview 1417±6 ±11,973 Unknown
45 deepseek-v3.1-thinking 1417±7 ±11,985 Unknown
46 kimi-k2-0711-preview 1417±5 ±28,662 Unknown
47 mistral-large-3 1416±5 ±24,050 Unknown
48 deepseek-v3.1-terminus 1416±10 ±3,761 Unknown
49 deepseek-v3.1-terminus-thinking 1415±10 ±3,548 Unknown
50 qwen3-vl-235b-a22b-instruct 1415±6 ±11,684 Unknown
51 gpt-4.1-2025-04-14 1413±4 ±52,211 Unknown
52 claude-opus-4-20250514 1413±4 ±45,573 Unknown
53 grok-3-preview-02-24 1411±4 ±33,970 Unknown
54 mistral-medium-2508 1411±3 ±63,013 Unknown
55 gemini-2.5-flash 1410±3 ±94,114 Unknown
56 glm-4.5 1410±5 ±24,792 Unknown
57 grok-4-0709 1410±4 ±42,143 Unknown
58 gemini-2.5-flash-preview-09-2025 1405±4 ±32,875 Unknown
59 claude-haiku-4-5-20251001 1404±4 ±44,511 Unknown
60 grok-4-fast-reasoning 1403±5 ±18,637 Unknown
61 o1-2024-12-17 1402±4 ±27,822 Unknown
62 qwen3-235b-a22b-no-thinking 1401±4 ±39,546 Unknown
63 qwen3-next-80b-a3b-instruct 1401±5 ±22,856 Unknown
64 claude-sonnet-4-20250514-thinking-32k 1400±4 ±36,207 Unknown
65 longcat-flash-chat 1399±6 ±11,548 Unknown
66 qwen3-235b-a22b-thinking-2507 1398±6 ±9,254 Unknown
67 deepseek-r1 1398±5 ±18,537 Unknown
68 qwen3-vl-235b-a22b-thinking 1395±7 ±7,971 Unknown
69 amazon-nova-experimental-chat-12-10 1395±10 ±3,718 Unknown
70 mimo-v2-flash (non-thinking) 1394±5 ±16,651 Unknown
71 deepseek-v3-0324 1394±4 ±46,690 Unknown
72 hunyuan-vision-1.5-thinking 1393±12 ±2,225 Unknown
73 mai-1-preview 1391±5 ±18,134 Unknown
74 o4-mini-2025-04-16 1391±4 ±46,676 Unknown
75 gpt-5-mini-high 1390±5 ±27,145 Unknown
76 claude-sonnet-4-20250514 1390±4 ±41,645 Unknown
77 claude-3-7-sonnet-20250219-thinking-32k 1388±4 ±39,889 Unknown
78 o1-preview 1388±5 ±31,120 Unknown
79 minimax-m2.1-preview 1387±5 ±16,114 Unknown
80 hunyuan-t1-20250711 1387±9 ±4,801 Unknown
81 qwen3-coder-480b-a35b-instruct 1386±5 ±26,652 Unknown
82 step-3.5-flash 1386±8 ±5,571 Unknown
83 mistral-medium-2505 1385±5 ±34,548 Unknown
84 qwen3-30b-a3b-instruct-2507 1383±5 ±24,092 Unknown
85 hunyuan-turbos-20250416 1382±6 ±11,053 Unknown
86 gpt-4.1-mini-2025-04-14 1382±4 ±40,532 Unknown
87 gemini-2.5-flash-lite-preview-09-2025-no-thinking 1380±4 ±47,414 Unknown
88 glm-4.6v 1378±11 ±2,819 Unknown
89 gemini-2.5-flash-lite-preview-06-17-thinking 1375±4 ±33,929 Unknown
90 qwen3-235b-a22b 1375±5 ±27,164 Unknown
91 qwen2.5-max 1374±4 ±33,294 Unknown
92 claude-3-5-sonnet-20241022 1373±3 ±89,471 Unknown
93 claude-3-7-sonnet-20250219 1372±4 ±44,434 Unknown
94 glm-4.5-air 1371±4 ±31,382 Unknown
95 qwen3-next-80b-a3b-thinking 1369±6 ±13,859 Unknown
96 minimax-m1 1367±4 ±36,838 Unknown
97 amazon-nova-experimental-chat-11-10 1367±5 ±16,393 Unknown
98 gemma-3-27b-it 1365±4 ±48,694 Unknown
99 o3-mini-high 1364±5 ±18,584 Unknown
100 glm-4.7-flash 1363±7 ±7,376 Unknown
101 grok-3-mini-high 1363±5 ±17,523 Unknown
102 gemini-2.0-flash-001 1361±4 ±44,828 Unknown
103 deepseek-v3 1358±5 ±21,788 Unknown
104 grok-3-mini-beta 1357±5 ±23,765 Unknown
105 intellect-3 1356±8 ±5,325 Unknown
106 mistral-small-2506 1356±5 ±18,343 Unknown
107 gpt-oss-120b 1354±4 ±30,963 Unknown
108 gemini-2.0-flash-lite-preview-02-05 1353±4 ±24,951 Unknown
109 glm-4.5v 1353±8 ±4,973 Unknown
110 command-a-03-2025 1353±3 ±57,439 Unknown
111 gemini-1.5-pro-002 1351±3 ±55,607 Unknown
112 amazon-nova-experimental-chat-10-20 1349±6 ±11,439 Unknown
113 hunyuan-turbos-20250226 1349±12 ±2,226 Unknown
114 o3-mini 1348±3 ±58,638 Unknown
115 amazon-nova-experimental-chat-10-09 1347±11 ±2,890 Unknown
116 llama-3.1-nemotron-ultra-253b-v1 1347±12 ±2,546 Unknown
117 qwen3-32b 1347±9 ±3,932 Unknown
118 ling-flash-2.0 1347±7 ±7,038 Unknown
119 minimax-m2 1347±8 ±6,742 Unknown
120 step-3 1346±7 ±6,592 Unknown
121 qwen-plus-0125 1346±8 ±5,823 Unknown
122 gpt-4o-2024-05-13 1346±3 ±112,863 Unknown
123 glm-4-plus-0111 1343±8 ±5,760 Unknown
124 claude-3-5-sonnet-20240620 1343±3 ±82,417 Unknown
125 gemma-3-12b-it 1342±10 ±3,829 Unknown
126 nvidia-llama-3.3-nemotron-super-49b-v1.5 1341±10 ±3,432 Unknown
127 hunyuan-turbo-0110 1340±12 ±2,295 Unknown
128 gpt-5-nano-high 1338±7 ±8,399 Unknown
129 nova-2-lite 1337±6 ±12,258 Unknown
130 o1-mini 1337±4 ±51,986 Unknown
131 qwq-32b 1336±4 ±26,118 Unknown
132 llama-3.1-405b-instruct-bf16 1335±4 ±41,392 Unknown
133 gpt-4o-2024-08-06 1335±4 ±45,498 Unknown
134 grok-2-2024-08-13 1335±4 ±63,495 Unknown
135 gemini-advanced-0514 1335±5 ±50,142 Unknown
136 step-2-16k-exp-202412 1334±9 ±4,829 Unknown
137 llama-3.1-405b-instruct-fp8 1334±4 ±59,655 Unknown
138 olmo-3.1-32b-instruct 1331±6 ±11,634 Unknown
139 yi-lightning 1329±5 ±27,340 Unknown
140 qwen3-30b-a3b 1328±5 ±27,431 Unknown
141 llama-4-maverick-17b-128e-instruct 1328±4 ±41,136 Unknown
142 llama-3.3-nemotron-49b-super-v1 1327±12 ±2,230 Unknown
143 hunyuan-large-2025-02-10 1326±10 ±3,738 Unknown
144 gpt-4-turbo-2024-04-09 1324±4 ±98,130 Unknown
145 claude-3-5-haiku-20241022 1324±3 ±71,183 Unknown
146 deepseek-v2.5-1210 1323±8 ±6,793 Unknown
147 gemini-1.5-pro-001 1323±4 ±79,132 Unknown
148 llama-4-scout-17b-16e-instruct 1323±5 ±31,235 Unknown
149 claude-3-opus-20240229 1322±3 ±194,904 Unknown
150 gpt-4.1-nano-2025-04-14 1322±8 ±6,107 Unknown
151 step-1o-turbo-202506 1321±7 ±9,687 Unknown
152 ring-flash-2.0 1320±7 ±7,204 Unknown
153 llama-3.3-70b-instruct 1320±3 ±55,576 Unknown
154 glm-4-plus 1319±5 ±26,134 Unknown
155 gemma-3n-e4b-it 1319±5 ±23,342 Unknown
156 qwen-max-0919 1318±6 ±16,479 Unknown
157 gpt-4o-mini-2024-07-18 1318±3 ±68,801 Unknown
158 gpt-oss-20b 1317±6 ±10,810 Unknown
159 nvidia-nemotron-3-nano-30b-a3b-bf16 1317±6 ±15,500 Unknown
160 qwen2.5-plus-1127 1315±6 ±10,179 Unknown
161 athene-v2-chat 1314±5 ±24,746 Unknown
162 mistral-large-2407 1314±4 ±45,460 Unknown
163 gpt-4-0125-preview 1313±4 ±93,439 Unknown
164 gpt-4-1106-preview 1313±4 ±100,107 Unknown
165 hunyuan-standard-2025-02-10 1312±10 ±3,905 Unknown
166 mercury 1310±14 ±1,920 Unknown
167 gemini-1.5-flash-002 1310±4 ±34,909 Unknown
168 grok-2-mini-2024-08-13 1308±4 ±52,574 Unknown
169 deepseek-v2.5 1307±5 ±24,574 Unknown
170 athene-70b-0725 1306±6 ±19,622 Unknown
171 olmo-3-32b-think 1306±8 ±5,892 Unknown
172 mistral-large-2411 1305±4 ±28,081 Unknown
173 magistral-medium-2506 1305±6 ±12,065 Unknown
174 mistral-small-3.1-24b-instruct-2503 1305±4 ±34,130 Unknown
175 gemma-3-4b-it 1303±9 ±4,177 Unknown
176 qwen2.5-72b-instruct 1303±4 ±39,409 Unknown
177 llama-3.1-nemotron-70b-instruct 1299±8 ±7,136 Unknown
178 hunyuan-large-vision 1296±9 ±5,600 Unknown
179 llama-3.1-70b-instruct 1294±4 ±55,234 Unknown
180 amazon-nova-pro-v1.0 1290±5 ±24,753 Unknown
181 jamba-1.5-large 1289±7 ±8,659 Unknown
182 gemma-2-27b-it 1288±3 ±75,764 Unknown
183 ibm-granite-h-small 1288±8 ±5,682 Unknown
184 reka-core-20240904 1288±7 ±7,309 Unknown
185 gpt-4-0314 1287±5 ±54,167 Unknown
186 llama-3.1-tulu-3-70b 1287±10 ±2,846 Unknown
187 llama-3.1-nemotron-51b-instruct 1287±10 ±3,749 Unknown
188 olmo-3.1-32b-think 1286±7 ±8,479 Unknown
189 gemini-1.5-flash-001 1286±4 ±62,823 Unknown
190 claude-3-sonnet-20240229 1281±4 ±109,289 Unknown
191 gemma-2-9b-it-simpo 1280±7 ±10,069 Unknown
192 nemotron-4-340b-instruct 1278±5 ±19,661 Unknown
193 command-r-plus-08-2024 1277±7 ±9,869 Unknown
194 llama-3-70b-instruct 1276±4 ±156,880 Unknown
195 gpt-4-0613 1276±4 ±88,721 Unknown
196 mistral-small-24b-instruct-2501 1274±6 ±14,677 Unknown
197 glm-4-0520 1274±7 ±9,788 Unknown
198 reka-flash-20240904 1272±7 ±7,537 Unknown
199 qwen2.5-coder-32b-instruct 1271±8 ±5,430 Unknown
200 c4ai-aya-expanse-32b 1267±5 ±27,123 Unknown
201 gemma-2-9b-it 1266±4 ±54,615 Unknown
202 deepseek-coder-v2 1264±6 ±15,147 Unknown
203 command-r-plus 1262±4 ±77,556 Unknown
204 qwen2-72b-instruct 1262±5 ±37,325 Unknown
205 claude-3-haiku-20240307 1261±4 ±117,705 Unknown
206 amazon-nova-lite-v1.0 1261±5 ±19,376 Unknown
207 gemini-1.5-flash-8b-001 1259±4 ±35,556 Unknown
208 phi-4 1256±5 ±24,126 Unknown
209 olmo-2-0325-32b-instruct 1252±11 ±3,335 Unknown
210 command-r-08-2024 1251±7 ±10,141 Unknown
211 mistral-large-2402 1243±5 ±62,437 Unknown
212 amazon-nova-micro-v1.0 1241±5 ±19,355 Unknown
213 jamba-1.5-mini 1239±7 ±8,854 Unknown
214 ministral-8b-2410 1237±9 ±4,780 Unknown
215 gemini-pro-dev-api 1235±7 ±18,352 Unknown
216 qwen1.5-110b-chat 1234±6 ±26,191 Unknown
217 reka-flash-21b-20240226-online 1234±7 ±15,451 Unknown
218 qwen1.5-72b-chat 1234±5 ±39,296 Unknown
219 hunyuan-standard-256k 1233±12 ±2,729 Unknown
220 mixtral-8x22b-instruct-v0.1 1230±5 ±51,417 Unknown
221 command-r 1227±5 ±54,038 Unknown
222 reka-flash-21b-20240226 1227±6 ±24,806 Unknown
223 gpt-3.5-turbo-0125 1224±5 ±66,191 Unknown
224 llama-3-8b-instruct 1223±4 ±104,636 Unknown
225 mistral-medium 1223±6 ±34,552 Unknown
226 c4ai-aya-expanse-8b 1223±7 ±9,827 Unknown
227 gemini-pro 1222±12 ±6,390 Unknown
228 llama-3.1-tulu-3-8b 1221±11 ±2,895 Unknown
229 yi-1.5-34b-chat 1214±5 ±24,142 Unknown
230 zephyr-orpo-141b-A35b-v0.1 1213±11 ±4,653 Unknown
231 llama-3.1-8b-instruct 1212±4 ±49,605 Unknown
232 granite-3.1-8b-instruct 1209±11 ±3,092 Unknown
233 qwen1.5-32b-chat 1204±6 ±21,744 Unknown
234 gpt-3.5-turbo-1106 1203±9 ±16,616 Unknown
235 gemma-2-2b-it 1199±4 ±46,618 Unknown
236 phi-3-medium-4k-instruct 1198±5 ±25,055 Unknown
237 mixtral-8x7b-instruct-v0.1 1198±4 ±73,505 Unknown
238 dbrx-instruct-preview 1195±6 ±32,196 Unknown
239 internlm2_5-20b-chat 1191±7 ±9,902 Unknown
240 qwen1.5-14b-chat 1191±7 ±17,841 Unknown
241 wizardlm-70b 1185±9 ±8,214 Unknown
242 deepseek-llm-67b-chat 1185±12 ±4,933 Unknown
243 yi-34b-chat 1184±7 ±15,483 Unknown
244 openchat-3.5-0106 1183±8 ±12,636 Unknown
245 openchat-3.5 1183±10 ±7,967 Unknown
246 granite-3.0-8b-instruct 1182±9 ±6,643 Unknown
247 gemma-1.1-7b-it 1180±6 ±23,893 Unknown
248 snowflake-arctic-instruct 1180±6 ±32,836 Unknown
249 granite-3.1-2b-instruct 1180±11 ±3,191 Unknown
250 tulu-2-dpo-70b 1178±10 ±6,534 Unknown
251 openhermes-2.5-mistral-7b 1176±10 ±5,006 Unknown
252 vicuna-33b 1173±6 ±22,479 Unknown
253 starling-lm-7b-beta 1172±7 ±16,057 Unknown
254 phi-3-small-8k-instruct 1172±6 ±17,763 Unknown
255 llama-2-70b-chat 1171±6 ±38,491 Unknown
256 starling-lm-7b-alpha 1168±8 ±10,224 Unknown
257 llama-3.2-3b-instruct 1167±8 ±7,936 Unknown
258 nous-hermes-2-mixtral-8x7b-dpo 1165±12 ±3,776 Unknown
259 qwq-32b-preview 1157±12 ±3,233 Unknown
260 granite-3.0-2b-instruct 1156±8 ±6,837 Unknown
261 llama2-70b-steerlm-chat 1156±13 ±3,584 Unknown
262 solar-10.7b-instruct-v1.0 1153±13 ±4,155 Unknown
263 dolphin-2.2.1-mistral-7b 1152±15 ±1,679 Unknown
264 mpt-30b-chat 1151±12 ±2,571 Unknown
265 mistral-7b-instruct-v0.2 1150±7 ±19,402 Unknown
266 wizardlm-13b 1150±9 ±7,046 Unknown
267 falcon-180b-chat 1147±17 ±1,295 Unknown
268 qwen1.5-7b-chat 1144±10 ±4,735 Unknown
269 phi-3-mini-4k-instruct-june-2024 1143±6 ±12,296 Unknown
270 llama-2-13b-chat 1142±7 ±19,171 Unknown
271 vicuna-13b 1141±7 ±19,366 Unknown
272 qwen-14b-chat 1139±11 ±4,964 Unknown
273 palm-2 1138±9 ±8,554 Unknown
274 codellama-34b-instruct 1137±9 ±7,363 Unknown
275 gemma-7b-it 1136±10 ±8,925 Unknown
276 zephyr-7b-beta 1131±9 ±11,116 Unknown
277 phi-3-mini-128k-instruct 1130±7 ±20,691 Unknown
278 phi-3-mini-4k-instruct 1129±6 ±20,115 Unknown
279 guanaco-33b 1128±12 ±2,921 Unknown
280 zephyr-7b-alpha 1127±16 ±1,785 Unknown
281 stripedhyena-nous-7b 1121±11 ±5,184 Unknown
282 codellama-70b-instruct 1119±18 ±1,143 Unknown
283 vicuna-7b 1115±9 ±6,923 Unknown
284 smollm2-1.7b-instruct 1115±14 ±2,201 Unknown
285 gemma-1.1-2b-it 1114±8 ±10,853 Unknown
286 llama-3.2-1b-instruct 1112±8 ±8,045 Unknown
287 mistral-7b-instruct 1110±9 ±8,977 Unknown
288 llama-2-7b-chat 1108±7 ±14,148 Unknown
289 gemma-2b-it 1092±12 ±4,779 Unknown
290 qwen1.5-4b-chat 1091±9 ±7,598 Unknown
291 olmo-7b-instruct 1075±11 ±6,329 Unknown
292 koala-13b 1071±10 ±6,964 Unknown
293 alpaca-13b 1068±12 ±5,745 Unknown
294 gpt4all-13b-snoozy 1066±15 ±1,743 Unknown
295 mpt-7b-chat 1062±12 ±3,925 Unknown
296 chatglm3-6b 1056±12 ±4,658 Unknown
297 RWKV-4-Raven-14B 1042±11 ±4,845 Unknown
298 chatglm2-6b 1025±14 ±2,657 Unknown
299 oasst-pythia-12b 1023±11 ±6,311 Unknown
300 chatglm-6b 996±13 ±4,914 Unknown
301 fastchat-t5-3b 992±12 ±4,203 Unknown
302 dolly-v2-12b 981±14 ±3,412 Unknown
303 llama-13b 973±16 ±2,391 Unknown
304 stablelm-tuned-alpha-7b 953±13 ±3,287 Unknown