Spaces:
Running
Running
add opus 4.5
Browse files- index.html +79 -43
index.html
CHANGED
|
@@ -94,8 +94,44 @@
|
|
| 94 |
</thead>
|
| 95 |
<tbody>
|
| 96 |
|
| 97 |
-
<tr data-model="litellm_proxy/gemini/gemini-3-pro-preview">
|
| 98 |
<td class="rank mono sticky-0" data-label="#">#1</td>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 99 |
<td class="model-name sticky-1" data-label="Модель">Gemini 3 Pro Preview</td>
|
| 100 |
<td class="num mono" data-label="Критичные/1000">
|
| 101 |
|
|
@@ -131,7 +167,7 @@
|
|
| 131 |
</tr>
|
| 132 |
|
| 133 |
<tr data-model="openrouter/anthropic/claude-sonnet-4.5">
|
| 134 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 135 |
<td class="model-name sticky-1" data-label="Модель">Claude Sonnet 4.5</td>
|
| 136 |
<td class="num mono" data-label="Критичные/1000">
|
| 137 |
|
|
@@ -167,7 +203,7 @@
|
|
| 167 |
</tr>
|
| 168 |
|
| 169 |
<tr data-model="openrouter/openai/gpt-4o">
|
| 170 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 171 |
<td class="model-name sticky-1" data-label="Модель">GPT-4o</td>
|
| 172 |
<td class="num mono" data-label="Критичные/1000">
|
| 173 |
|
|
@@ -203,7 +239,7 @@
|
|
| 203 |
</tr>
|
| 204 |
|
| 205 |
<tr data-model="litellm_proxy/gemini-2.5-flash">
|
| 206 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 207 |
<td class="model-name sticky-1" data-label="Модель">Gemini 2.5 Flash (GA)</td>
|
| 208 |
<td class="num mono" data-label="Критичные/1000">
|
| 209 |
|
|
@@ -239,7 +275,7 @@
|
|
| 239 |
</tr>
|
| 240 |
|
| 241 |
<tr data-model="openrouter/minimax/minimax-01">
|
| 242 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 243 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-Text-01 (Minimax API)</td>
|
| 244 |
<td class="num mono" data-label="Критичные/1000">
|
| 245 |
|
|
@@ -275,7 +311,7 @@
|
|
| 275 |
</tr>
|
| 276 |
|
| 277 |
<tr data-model="openai/Vikhrmodels/Vistral-24B-Instruct">
|
| 278 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 279 |
<td class="model-name sticky-1" data-label="Модель">Vikhrmodels/Vistral-24B-Instruct (SGLang)</td>
|
| 280 |
<td class="num mono" data-label="Критичные/1000">
|
| 281 |
|
|
@@ -311,7 +347,7 @@
|
|
| 311 |
</tr>
|
| 312 |
|
| 313 |
<tr data-model="openai/unsloth/gemma-3-27b-it">
|
| 314 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 315 |
<td class="model-name sticky-1" data-label="Модель">Gemma-3-27b-it (SGLang)</td>
|
| 316 |
<td class="num mono" data-label="Критичные/1000">
|
| 317 |
|
|
@@ -347,7 +383,7 @@
|
|
| 347 |
</tr>
|
| 348 |
|
| 349 |
<tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
|
| 350 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 351 |
<td class="model-name sticky-1" data-label="Модель">Qwen/Qwen3-235B-A22B-Instruct-2507 (Vertex AI API)</td>
|
| 352 |
<td class="num mono" data-label="Критичные/1000">
|
| 353 |
|
|
@@ -383,7 +419,7 @@
|
|
| 383 |
</tr>
|
| 384 |
|
| 385 |
<tr data-model="openai/mistralai/Mistral-Small-3.2-24B-Instruct-2506">
|
| 386 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 387 |
<td class="model-name sticky-1" data-label="Модель">Mistral-Small-3.2-24B-Instruct-2506 (vllm)</td>
|
| 388 |
<td class="num mono" data-label="Критичные/1000">
|
| 389 |
|
|
@@ -419,7 +455,7 @@
|
|
| 419 |
</tr>
|
| 420 |
|
| 421 |
<tr data-model="openrouter/deepseek/deepseek-chat">
|
| 422 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 423 |
<td class="model-name sticky-1" data-label="Модель">DeepSeek V3 (Novita API)</td>
|
| 424 |
<td class="num mono" data-label="Критичные/1000">
|
| 425 |
|
|
@@ -455,7 +491,7 @@
|
|
| 455 |
</tr>
|
| 456 |
|
| 457 |
<tr data-model="openai/RefalMachine/RuadaptQwen3-32B-Instruct">
|
| 458 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 459 |
<td class="model-name sticky-1" data-label="Модель">RefalMachine/RuadaptQwen3-32B-Instruct (SGLang)</td>
|
| 460 |
<td class="num mono" data-label="Критичные/1000">
|
| 461 |
|
|
@@ -491,7 +527,7 @@
|
|
| 491 |
</tr>
|
| 492 |
|
| 493 |
<tr data-model="openai/yandex/YandexGPT-5-Lite-8B-instruct">
|
| 494 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 495 |
<td class="model-name sticky-1" data-label="Модель">yandex/YandexGPT-5-Lite-8B-instruct (SGLang)</td>
|
| 496 |
<td class="num mono" data-label="Критичные/1000">
|
| 497 |
|
|
@@ -527,7 +563,7 @@
|
|
| 527 |
</tr>
|
| 528 |
|
| 529 |
<tr data-model="deepseek/deepseek-chat">
|
| 530 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 531 |
<td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-chat (Deepseek API)</td>
|
| 532 |
<td class="num mono" data-label="Критичные/1000">
|
| 533 |
|
|
@@ -563,7 +599,7 @@
|
|
| 563 |
</tr>
|
| 564 |
|
| 565 |
<tr data-model="openrouter/anthropic/claude-haiku-4.5">
|
| 566 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 567 |
<td class="model-name sticky-1" data-label="Модель">Claude Haiku 4.5</td>
|
| 568 |
<td class="num mono" data-label="Критичные/1000">
|
| 569 |
|
|
@@ -599,7 +635,7 @@
|
|
| 599 |
</tr>
|
| 600 |
|
| 601 |
<tr data-model="openai/Qwen/Qwen3-VL-32B-Instruct">
|
| 602 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 603 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-VL-32B-Instruct (SGLang)</td>
|
| 604 |
<td class="num mono" data-label="Критичные/1000">
|
| 605 |
|
|
@@ -635,7 +671,7 @@
|
|
| 635 |
</tr>
|
| 636 |
|
| 637 |
<tr data-model="openai/AvitoTech/avibe">
|
| 638 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 639 |
<td class="model-name sticky-1" data-label="Модель">AvitoTech/avibe</td>
|
| 640 |
<td class="num mono" data-label="Критичные/1000">
|
| 641 |
|
|
@@ -671,7 +707,7 @@
|
|
| 671 |
</tr>
|
| 672 |
|
| 673 |
<tr data-model="openai/ai-sage/GigaChat-20B-A3B-instruct-v1.5-bf16">
|
| 674 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 675 |
<td class="model-name sticky-1" data-label="Модель">GigaChat-20B-A3B-instruct-v1.5 (SGLang)</td>
|
| 676 |
<td class="num mono" data-label="Критичные/1000">
|
| 677 |
|
|
@@ -707,7 +743,7 @@
|
|
| 707 |
</tr>
|
| 708 |
|
| 709 |
<tr data-model="deepseek/deepseek-reasoner">
|
| 710 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 711 |
<td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-reasoner (Deepseek API)</td>
|
| 712 |
<td class="num mono" data-label="Критичные/1000">
|
| 713 |
|
|
@@ -743,7 +779,7 @@
|
|
| 743 |
</tr>
|
| 744 |
|
| 745 |
<tr data-model="litellm_proxy/deepseek-v3">
|
| 746 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 747 |
<td class="model-name sticky-1" data-label="Модель">Deepseek V3.2-Exp (Deepseek API)</td>
|
| 748 |
<td class="num mono" data-label="Критичные/1000">
|
| 749 |
|
|
@@ -779,7 +815,7 @@
|
|
| 779 |
</tr>
|
| 780 |
|
| 781 |
<tr data-model="litellm_proxy/tmp-gemma-3n-e4b-it">
|
| 782 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 783 |
<td class="model-name sticky-1" data-label="Модель">google/gemma-3n-E4B-it (AI Studio)</td>
|
| 784 |
<td class="num mono" data-label="Критичные/1000">
|
| 785 |
|
|
@@ -815,7 +851,7 @@
|
|
| 815 |
</tr>
|
| 816 |
|
| 817 |
<tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
|
| 818 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 819 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
|
| 820 |
<td class="num mono" data-label="Критичные/1000">
|
| 821 |
|
|
@@ -851,7 +887,7 @@
|
|
| 851 |
</tr>
|
| 852 |
|
| 853 |
<tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
|
| 854 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 855 |
<td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
|
| 856 |
<td class="num mono" data-label="Критичные/1000">
|
| 857 |
|
|
@@ -887,7 +923,7 @@
|
|
| 887 |
</tr>
|
| 888 |
|
| 889 |
<tr data-model="openai/Qwen/Qwen3-32B">
|
| 890 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 891 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoning)</td>
|
| 892 |
<td class="num mono" data-label="Критичные/1000">
|
| 893 |
|
|
@@ -923,7 +959,7 @@
|
|
| 923 |
</tr>
|
| 924 |
|
| 925 |
<tr data-model="openai/t-tech/T-pro-it-2.0">
|
| 926 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 927 |
<td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
|
| 928 |
<td class="num mono" data-label="Критичные/1000">
|
| 929 |
|
|
@@ -959,7 +995,7 @@
|
|
| 959 |
</tr>
|
| 960 |
|
| 961 |
<tr data-model="openrouter/openrouter/polaris-alpha">
|
| 962 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 963 |
<td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
|
| 964 |
<td class="num mono" data-label="Критичные/1000">
|
| 965 |
|
|
@@ -995,7 +1031,7 @@
|
|
| 995 |
</tr>
|
| 996 |
|
| 997 |
<tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
|
| 998 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 999 |
<td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
|
| 1000 |
<td class="num mono" data-label="Критичные/1000">
|
| 1001 |
|
|
@@ -1031,7 +1067,7 @@
|
|
| 1031 |
</tr>
|
| 1032 |
|
| 1033 |
<tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
|
| 1034 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1035 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
|
| 1036 |
<td class="num mono" data-label="Критичные/1000">
|
| 1037 |
|
|
@@ -1067,7 +1103,7 @@
|
|
| 1067 |
</tr>
|
| 1068 |
|
| 1069 |
<tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
|
| 1070 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1071 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
|
| 1072 |
<td class="num mono" data-label="Критичные/1000">
|
| 1073 |
|
|
@@ -1103,7 +1139,7 @@
|
|
| 1103 |
</tr>
|
| 1104 |
|
| 1105 |
<tr data-model="openrouter/moonshotai/kimi-k2-0905">
|
| 1106 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1107 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
|
| 1108 |
<td class="num mono" data-label="Критичные/1000">
|
| 1109 |
|
|
@@ -1139,7 +1175,7 @@
|
|
| 1139 |
</tr>
|
| 1140 |
|
| 1141 |
<tr data-model="openrouter/z-ai/glm-4.6">
|
| 1142 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1143 |
<td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
|
| 1144 |
<td class="num mono" data-label="Критичные/1000">
|
| 1145 |
|
|
@@ -1175,7 +1211,7 @@
|
|
| 1175 |
</tr>
|
| 1176 |
|
| 1177 |
<tr data-model="openrouter/openai/gpt-5">
|
| 1178 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1179 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
|
| 1180 |
<td class="num mono" data-label="Критичные/1000">
|
| 1181 |
|
|
@@ -1211,7 +1247,7 @@
|
|
| 1211 |
</tr>
|
| 1212 |
|
| 1213 |
<tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
|
| 1214 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1215 |
<td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
|
| 1216 |
<td class="num mono" data-label="Критичные/1000">
|
| 1217 |
|
|
@@ -1247,7 +1283,7 @@
|
|
| 1247 |
</tr>
|
| 1248 |
|
| 1249 |
<tr data-model="openrouter/openai/gpt-5">
|
| 1250 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1251 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
|
| 1252 |
<td class="num mono" data-label="Критичные/1000">
|
| 1253 |
|
|
@@ -1283,7 +1319,7 @@
|
|
| 1283 |
</tr>
|
| 1284 |
|
| 1285 |
<tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
|
| 1286 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1287 |
<td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
|
| 1288 |
<td class="num mono" data-label="Критичные/1000">
|
| 1289 |
|
|
@@ -1319,7 +1355,7 @@
|
|
| 1319 |
</tr>
|
| 1320 |
|
| 1321 |
<tr data-model="openrouter/openai/gpt-oss-120b">
|
| 1322 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1323 |
<td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
|
| 1324 |
<td class="num mono" data-label="Критичные/1000">
|
| 1325 |
|
|
@@ -1355,7 +1391,7 @@
|
|
| 1355 |
</tr>
|
| 1356 |
|
| 1357 |
<tr data-model="openai/gpt-4.1">
|
| 1358 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1359 |
<td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
|
| 1360 |
<td class="num mono" data-label="Критичные/1000">
|
| 1361 |
|
|
@@ -1391,7 +1427,7 @@
|
|
| 1391 |
</tr>
|
| 1392 |
|
| 1393 |
<tr data-model="openrouter/mistralai/mistral-nemo">
|
| 1394 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1395 |
<td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
|
| 1396 |
<td class="num mono" data-label="Критичные/1000">
|
| 1397 |
|
|
@@ -1427,7 +1463,7 @@
|
|
| 1427 |
</tr>
|
| 1428 |
|
| 1429 |
<tr data-model="openai/gpt-4.1-mini">
|
| 1430 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1431 |
<td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
|
| 1432 |
<td class="num mono" data-label="Критичные/1000">
|
| 1433 |
|
|
@@ -1463,7 +1499,7 @@
|
|
| 1463 |
</tr>
|
| 1464 |
|
| 1465 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1466 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1467 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
|
| 1468 |
<td class="num mono" data-label="Критичные/1000">
|
| 1469 |
|
|
@@ -1499,7 +1535,7 @@
|
|
| 1499 |
</tr>
|
| 1500 |
|
| 1501 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1502 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1503 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommended params)</td>
|
| 1504 |
<td class="num mono" data-label="Критичные/1000">
|
| 1505 |
|
|
@@ -1535,7 +1571,7 @@
|
|
| 1535 |
</tr>
|
| 1536 |
|
| 1537 |
<tr data-model="openai/gpt-4.1-nano">
|
| 1538 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1539 |
<td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
|
| 1540 |
<td class="num mono" data-label="Критичные/1000">
|
| 1541 |
|
|
@@ -1571,7 +1607,7 @@
|
|
| 1571 |
</tr>
|
| 1572 |
|
| 1573 |
<tr data-model="openrouter/openai/gpt-oss-20b">
|
| 1574 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1575 |
<td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
|
| 1576 |
<td class="num mono" data-label="Критичные/1000">
|
| 1577 |
|
|
@@ -1629,7 +1665,7 @@
|
|
| 1629 |
</div>
|
| 1630 |
<p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд — не стесняйтесь открыть issue/pull request на GitHub.</p>
|
| 1631 |
<p class="info-text">
|
| 1632 |
-
Обновлено: 2025-12-01
|
| 1633 |
</p>
|
| 1634 |
</div>
|
| 1635 |
<script>
|
|
|
|
| 94 |
</thead>
|
| 95 |
<tbody>
|
| 96 |
|
| 97 |
+
<tr data-model="litellm_proxy/opus-4-5">
|
| 98 |
<td class="rank mono sticky-0" data-label="#">#1</td>
|
| 99 |
+
<td class="model-name sticky-1" data-label="Модель">Claude Opus 4.5</td>
|
| 100 |
+
<td class="num mono" data-label="Критичные/1000">
|
| 101 |
+
|
| 102 |
+
0.05 ± 0.01
|
| 103 |
+
|
| 104 |
+
</td>
|
| 105 |
+
<td class="num mono" data-label="Обычные/1000">
|
| 106 |
+
|
| 107 |
+
0.12 ± 0.02
|
| 108 |
+
|
| 109 |
+
</td>
|
| 110 |
+
<td class="num mono" data-label="Доп./1000">
|
| 111 |
+
|
| 112 |
+
0.05 ± 0.02
|
| 113 |
+
|
| 114 |
+
</td>
|
| 115 |
+
<td data-label="Нормировано ошибок">
|
| 116 |
+
<div class="score-cell">
|
| 117 |
+
<div class="progress-bar">
|
| 118 |
+
|
| 119 |
+
|
| 120 |
+
|
| 121 |
+
<div class="progress-fill" style="width: 94.0%"></div>
|
| 122 |
+
</div>
|
| 123 |
+
<span class="score-value">
|
| 124 |
+
|
| 125 |
+
0.24 ± 0.04
|
| 126 |
+
|
| 127 |
+
</span>
|
| 128 |
+
</div>
|
| 129 |
+
</td>
|
| 130 |
+
<td class="num mono" data-label="Всего токенов">125,802</td>
|
| 131 |
+
</tr>
|
| 132 |
+
|
| 133 |
+
<tr data-model="litellm_proxy/gemini/gemini-3-pro-preview">
|
| 134 |
+
<td class="rank mono sticky-0" data-label="#">#2</td>
|
| 135 |
<td class="model-name sticky-1" data-label="Модель">Gemini 3 Pro Preview</td>
|
| 136 |
<td class="num mono" data-label="Критичные/1000">
|
| 137 |
|
|
|
|
| 167 |
</tr>
|
| 168 |
|
| 169 |
<tr data-model="openrouter/anthropic/claude-sonnet-4.5">
|
| 170 |
+
<td class="rank mono sticky-0" data-label="#">#3</td>
|
| 171 |
<td class="model-name sticky-1" data-label="Модель">Claude Sonnet 4.5</td>
|
| 172 |
<td class="num mono" data-label="Критичные/1000">
|
| 173 |
|
|
|
|
| 203 |
</tr>
|
| 204 |
|
| 205 |
<tr data-model="openrouter/openai/gpt-4o">
|
| 206 |
+
<td class="rank mono sticky-0" data-label="#">#4</td>
|
| 207 |
<td class="model-name sticky-1" data-label="Модель">GPT-4o</td>
|
| 208 |
<td class="num mono" data-label="Критичные/1000">
|
| 209 |
|
|
|
|
| 239 |
</tr>
|
| 240 |
|
| 241 |
<tr data-model="litellm_proxy/gemini-2.5-flash">
|
| 242 |
+
<td class="rank mono sticky-0" data-label="#">#5</td>
|
| 243 |
<td class="model-name sticky-1" data-label="Модель">Gemini 2.5 Flash (GA)</td>
|
| 244 |
<td class="num mono" data-label="Критичные/1000">
|
| 245 |
|
|
|
|
| 275 |
</tr>
|
| 276 |
|
| 277 |
<tr data-model="openrouter/minimax/minimax-01">
|
| 278 |
+
<td class="rank mono sticky-0" data-label="#">#6</td>
|
| 279 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-Text-01 (Minimax API)</td>
|
| 280 |
<td class="num mono" data-label="Критичные/1000">
|
| 281 |
|
|
|
|
| 311 |
</tr>
|
| 312 |
|
| 313 |
<tr data-model="openai/Vikhrmodels/Vistral-24B-Instruct">
|
| 314 |
+
<td class="rank mono sticky-0" data-label="#">#7</td>
|
| 315 |
<td class="model-name sticky-1" data-label="Модель">Vikhrmodels/Vistral-24B-Instruct (SGLang)</td>
|
| 316 |
<td class="num mono" data-label="Критичные/1000">
|
| 317 |
|
|
|
|
| 347 |
</tr>
|
| 348 |
|
| 349 |
<tr data-model="openai/unsloth/gemma-3-27b-it">
|
| 350 |
+
<td class="rank mono sticky-0" data-label="#">#8</td>
|
| 351 |
<td class="model-name sticky-1" data-label="Модель">Gemma-3-27b-it (SGLang)</td>
|
| 352 |
<td class="num mono" data-label="Критичные/1000">
|
| 353 |
|
|
|
|
| 383 |
</tr>
|
| 384 |
|
| 385 |
<tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
|
| 386 |
+
<td class="rank mono sticky-0" data-label="#">#9</td>
|
| 387 |
<td class="model-name sticky-1" data-label="Модель">Qwen/Qwen3-235B-A22B-Instruct-2507 (Vertex AI API)</td>
|
| 388 |
<td class="num mono" data-label="Критичные/1000">
|
| 389 |
|
|
|
|
| 419 |
</tr>
|
| 420 |
|
| 421 |
<tr data-model="openai/mistralai/Mistral-Small-3.2-24B-Instruct-2506">
|
| 422 |
+
<td class="rank mono sticky-0" data-label="#">#10</td>
|
| 423 |
<td class="model-name sticky-1" data-label="Модель">Mistral-Small-3.2-24B-Instruct-2506 (vllm)</td>
|
| 424 |
<td class="num mono" data-label="Критичные/1000">
|
| 425 |
|
|
|
|
| 455 |
</tr>
|
| 456 |
|
| 457 |
<tr data-model="openrouter/deepseek/deepseek-chat">
|
| 458 |
+
<td class="rank mono sticky-0" data-label="#">#11</td>
|
| 459 |
<td class="model-name sticky-1" data-label="Модель">DeepSeek V3 (Novita API)</td>
|
| 460 |
<td class="num mono" data-label="Критичные/1000">
|
| 461 |
|
|
|
|
| 491 |
</tr>
|
| 492 |
|
| 493 |
<tr data-model="openai/RefalMachine/RuadaptQwen3-32B-Instruct">
|
| 494 |
+
<td class="rank mono sticky-0" data-label="#">#12</td>
|
| 495 |
<td class="model-name sticky-1" data-label="Модель">RefalMachine/RuadaptQwen3-32B-Instruct (SGLang)</td>
|
| 496 |
<td class="num mono" data-label="Критичные/1000">
|
| 497 |
|
|
|
|
| 527 |
</tr>
|
| 528 |
|
| 529 |
<tr data-model="openai/yandex/YandexGPT-5-Lite-8B-instruct">
|
| 530 |
+
<td class="rank mono sticky-0" data-label="#">#13</td>
|
| 531 |
<td class="model-name sticky-1" data-label="Модель">yandex/YandexGPT-5-Lite-8B-instruct (SGLang)</td>
|
| 532 |
<td class="num mono" data-label="Критичные/1000">
|
| 533 |
|
|
|
|
| 563 |
</tr>
|
| 564 |
|
| 565 |
<tr data-model="deepseek/deepseek-chat">
|
| 566 |
+
<td class="rank mono sticky-0" data-label="#">#14</td>
|
| 567 |
<td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-chat (Deepseek API)</td>
|
| 568 |
<td class="num mono" data-label="Критичные/1000">
|
| 569 |
|
|
|
|
| 599 |
</tr>
|
| 600 |
|
| 601 |
<tr data-model="openrouter/anthropic/claude-haiku-4.5">
|
| 602 |
+
<td class="rank mono sticky-0" data-label="#">#15</td>
|
| 603 |
<td class="model-name sticky-1" data-label="Модель">Claude Haiku 4.5</td>
|
| 604 |
<td class="num mono" data-label="Критичные/1000">
|
| 605 |
|
|
|
|
| 635 |
</tr>
|
| 636 |
|
| 637 |
<tr data-model="openai/Qwen/Qwen3-VL-32B-Instruct">
|
| 638 |
+
<td class="rank mono sticky-0" data-label="#">#16</td>
|
| 639 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-VL-32B-Instruct (SGLang)</td>
|
| 640 |
<td class="num mono" data-label="Критичные/1000">
|
| 641 |
|
|
|
|
| 671 |
</tr>
|
| 672 |
|
| 673 |
<tr data-model="openai/AvitoTech/avibe">
|
| 674 |
+
<td class="rank mono sticky-0" data-label="#">#17</td>
|
| 675 |
<td class="model-name sticky-1" data-label="Модель">AvitoTech/avibe</td>
|
| 676 |
<td class="num mono" data-label="Критичные/1000">
|
| 677 |
|
|
|
|
| 707 |
</tr>
|
| 708 |
|
| 709 |
<tr data-model="openai/ai-sage/GigaChat-20B-A3B-instruct-v1.5-bf16">
|
| 710 |
+
<td class="rank mono sticky-0" data-label="#">#18</td>
|
| 711 |
<td class="model-name sticky-1" data-label="Модель">GigaChat-20B-A3B-instruct-v1.5 (SGLang)</td>
|
| 712 |
<td class="num mono" data-label="Критичные/1000">
|
| 713 |
|
|
|
|
| 743 |
</tr>
|
| 744 |
|
| 745 |
<tr data-model="deepseek/deepseek-reasoner">
|
| 746 |
+
<td class="rank mono sticky-0" data-label="#">#19</td>
|
| 747 |
<td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-reasoner (Deepseek API)</td>
|
| 748 |
<td class="num mono" data-label="Критичные/1000">
|
| 749 |
|
|
|
|
| 779 |
</tr>
|
| 780 |
|
| 781 |
<tr data-model="litellm_proxy/deepseek-v3">
|
| 782 |
+
<td class="rank mono sticky-0" data-label="#">#20</td>
|
| 783 |
<td class="model-name sticky-1" data-label="Модель">Deepseek V3.2-Exp (Deepseek API)</td>
|
| 784 |
<td class="num mono" data-label="Критичные/1000">
|
| 785 |
|
|
|
|
| 815 |
</tr>
|
| 816 |
|
| 817 |
<tr data-model="litellm_proxy/tmp-gemma-3n-e4b-it">
|
| 818 |
+
<td class="rank mono sticky-0" data-label="#">#21</td>
|
| 819 |
<td class="model-name sticky-1" data-label="Модель">google/gemma-3n-E4B-it (AI Studio)</td>
|
| 820 |
<td class="num mono" data-label="Критичные/1000">
|
| 821 |
|
|
|
|
| 851 |
</tr>
|
| 852 |
|
| 853 |
<tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
|
| 854 |
+
<td class="rank mono sticky-0" data-label="#">#22</td>
|
| 855 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
|
| 856 |
<td class="num mono" data-label="Критичные/1000">
|
| 857 |
|
|
|
|
| 887 |
</tr>
|
| 888 |
|
| 889 |
<tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
|
| 890 |
+
<td class="rank mono sticky-0" data-label="#">#23</td>
|
| 891 |
<td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
|
| 892 |
<td class="num mono" data-label="Критичные/1000">
|
| 893 |
|
|
|
|
| 923 |
</tr>
|
| 924 |
|
| 925 |
<tr data-model="openai/Qwen/Qwen3-32B">
|
| 926 |
+
<td class="rank mono sticky-0" data-label="#">#24</td>
|
| 927 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoning)</td>
|
| 928 |
<td class="num mono" data-label="Критичные/1000">
|
| 929 |
|
|
|
|
| 959 |
</tr>
|
| 960 |
|
| 961 |
<tr data-model="openai/t-tech/T-pro-it-2.0">
|
| 962 |
+
<td class="rank mono sticky-0" data-label="#">#25</td>
|
| 963 |
<td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
|
| 964 |
<td class="num mono" data-label="Критичные/1000">
|
| 965 |
|
|
|
|
| 995 |
</tr>
|
| 996 |
|
| 997 |
<tr data-model="openrouter/openrouter/polaris-alpha">
|
| 998 |
+
<td class="rank mono sticky-0" data-label="#">#26</td>
|
| 999 |
<td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
|
| 1000 |
<td class="num mono" data-label="Критичные/1000">
|
| 1001 |
|
|
|
|
| 1031 |
</tr>
|
| 1032 |
|
| 1033 |
<tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
|
| 1034 |
+
<td class="rank mono sticky-0" data-label="#">#27</td>
|
| 1035 |
<td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
|
| 1036 |
<td class="num mono" data-label="Критичные/1000">
|
| 1037 |
|
|
|
|
| 1067 |
</tr>
|
| 1068 |
|
| 1069 |
<tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
|
| 1070 |
+
<td class="rank mono sticky-0" data-label="#">#28</td>
|
| 1071 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
|
| 1072 |
<td class="num mono" data-label="Критичные/1000">
|
| 1073 |
|
|
|
|
| 1103 |
</tr>
|
| 1104 |
|
| 1105 |
<tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
|
| 1106 |
+
<td class="rank mono sticky-0" data-label="#">#29</td>
|
| 1107 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
|
| 1108 |
<td class="num mono" data-label="Критичные/1000">
|
| 1109 |
|
|
|
|
| 1139 |
</tr>
|
| 1140 |
|
| 1141 |
<tr data-model="openrouter/moonshotai/kimi-k2-0905">
|
| 1142 |
+
<td class="rank mono sticky-0" data-label="#">#30</td>
|
| 1143 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
|
| 1144 |
<td class="num mono" data-label="Критичные/1000">
|
| 1145 |
|
|
|
|
| 1175 |
</tr>
|
| 1176 |
|
| 1177 |
<tr data-model="openrouter/z-ai/glm-4.6">
|
| 1178 |
+
<td class="rank mono sticky-0" data-label="#">#31</td>
|
| 1179 |
<td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
|
| 1180 |
<td class="num mono" data-label="Критичные/1000">
|
| 1181 |
|
|
|
|
| 1211 |
</tr>
|
| 1212 |
|
| 1213 |
<tr data-model="openrouter/openai/gpt-5">
|
| 1214 |
+
<td class="rank mono sticky-0" data-label="#">#32</td>
|
| 1215 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
|
| 1216 |
<td class="num mono" data-label="Критичные/1000">
|
| 1217 |
|
|
|
|
| 1247 |
</tr>
|
| 1248 |
|
| 1249 |
<tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
|
| 1250 |
+
<td class="rank mono sticky-0" data-label="#">#33</td>
|
| 1251 |
<td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
|
| 1252 |
<td class="num mono" data-label="Критичные/1000">
|
| 1253 |
|
|
|
|
| 1283 |
</tr>
|
| 1284 |
|
| 1285 |
<tr data-model="openrouter/openai/gpt-5">
|
| 1286 |
+
<td class="rank mono sticky-0" data-label="#">#34</td>
|
| 1287 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
|
| 1288 |
<td class="num mono" data-label="Критичные/1000">
|
| 1289 |
|
|
|
|
| 1319 |
</tr>
|
| 1320 |
|
| 1321 |
<tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
|
| 1322 |
+
<td class="rank mono sticky-0" data-label="#">#35</td>
|
| 1323 |
<td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
|
| 1324 |
<td class="num mono" data-label="Критичные/1000">
|
| 1325 |
|
|
|
|
| 1355 |
</tr>
|
| 1356 |
|
| 1357 |
<tr data-model="openrouter/openai/gpt-oss-120b">
|
| 1358 |
+
<td class="rank mono sticky-0" data-label="#">#36</td>
|
| 1359 |
<td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
|
| 1360 |
<td class="num mono" data-label="Критичные/1000">
|
| 1361 |
|
|
|
|
| 1391 |
</tr>
|
| 1392 |
|
| 1393 |
<tr data-model="openai/gpt-4.1">
|
| 1394 |
+
<td class="rank mono sticky-0" data-label="#">#37</td>
|
| 1395 |
<td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
|
| 1396 |
<td class="num mono" data-label="Критичные/1000">
|
| 1397 |
|
|
|
|
| 1427 |
</tr>
|
| 1428 |
|
| 1429 |
<tr data-model="openrouter/mistralai/mistral-nemo">
|
| 1430 |
+
<td class="rank mono sticky-0" data-label="#">#38</td>
|
| 1431 |
<td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
|
| 1432 |
<td class="num mono" data-label="Критичные/1000">
|
| 1433 |
|
|
|
|
| 1463 |
</tr>
|
| 1464 |
|
| 1465 |
<tr data-model="openai/gpt-4.1-mini">
|
| 1466 |
+
<td class="rank mono sticky-0" data-label="#">#39</td>
|
| 1467 |
<td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
|
| 1468 |
<td class="num mono" data-label="Критичные/1000">
|
| 1469 |
|
|
|
|
| 1499 |
</tr>
|
| 1500 |
|
| 1501 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1502 |
+
<td class="rank mono sticky-0" data-label="#">#40</td>
|
| 1503 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
|
| 1504 |
<td class="num mono" data-label="Критичные/1000">
|
| 1505 |
|
|
|
|
| 1535 |
</tr>
|
| 1536 |
|
| 1537 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1538 |
+
<td class="rank mono sticky-0" data-label="#">#41</td>
|
| 1539 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommended params)</td>
|
| 1540 |
<td class="num mono" data-label="Критичные/1000">
|
| 1541 |
|
|
|
|
| 1571 |
</tr>
|
| 1572 |
|
| 1573 |
<tr data-model="openai/gpt-4.1-nano">
|
| 1574 |
+
<td class="rank mono sticky-0" data-label="#">#42</td>
|
| 1575 |
<td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
|
| 1576 |
<td class="num mono" data-label="Критичные/1000">
|
| 1577 |
|
|
|
|
| 1607 |
</tr>
|
| 1608 |
|
| 1609 |
<tr data-model="openrouter/openai/gpt-oss-20b">
|
| 1610 |
+
<td class="rank mono sticky-0" data-label="#">#43</td>
|
| 1611 |
<td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
|
| 1612 |
<td class="num mono" data-label="Критичные/1000">
|
| 1613 |
|
|
|
|
| 1665 |
</div>
|
| 1666 |
<p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд — не стесняйтесь открыть issue/pull request на GitHub.</p>
|
| 1667 |
<p class="info-text">
|
| 1668 |
+
Обновлено: 2025-12-01 20:43:49 | Всего моделей: 43 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
|
| 1669 |
</p>
|
| 1670 |
</div>
|
| 1671 |
<script>
|