Spaces:
Running
Running
add pony alpha
Browse files- index.html +75 -39
index.html
CHANGED
|
@@ -778,8 +778,44 @@
|
|
| 778 |
<td class="num mono" data-label="Всего токенов">88,360</td>
|
| 779 |
</tr>
|
| 780 |
|
| 781 |
-
<tr data-model="
|
| 782 |
<td class="rank mono sticky-0" data-label="#">#20</td>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 783 |
<td class="model-name sticky-1" data-label="Модель">GigaChat-20B-A3B-instruct-v1.5 (SGLang)</td>
|
| 784 |
<td class="num mono" data-label="Критичные/1000">
|
| 785 |
|
|
@@ -815,7 +851,7 @@
|
|
| 815 |
</tr>
|
| 816 |
|
| 817 |
<tr data-model="deepseek/deepseek-reasoner">
|
| 818 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 819 |
<td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-reasoner (Deepseek API)</td>
|
| 820 |
<td class="num mono" data-label="Критичные/1000">
|
| 821 |
|
|
@@ -851,7 +887,7 @@
|
|
| 851 |
</tr>
|
| 852 |
|
| 853 |
<tr data-model="mistral/ministral-14b-2512">
|
| 854 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 855 |
<td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-14B-Instruct-2512 (Mistral API)</td>
|
| 856 |
<td class="num mono" data-label="Критичные/1000">
|
| 857 |
|
|
@@ -887,7 +923,7 @@
|
|
| 887 |
</tr>
|
| 888 |
|
| 889 |
<tr data-model="litellm_proxy/deepseek-v3">
|
| 890 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 891 |
<td class="model-name sticky-1" data-label="Модель">Deepseek V3.2-Exp (Deepseek API)</td>
|
| 892 |
<td class="num mono" data-label="Критичные/1000">
|
| 893 |
|
|
@@ -923,7 +959,7 @@
|
|
| 923 |
</tr>
|
| 924 |
|
| 925 |
<tr data-model="litellm_proxy/tmp-gemma-3n-e4b-it">
|
| 926 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 927 |
<td class="model-name sticky-1" data-label="Модель">google/gemma-3n-E4B-it (AI Studio)</td>
|
| 928 |
<td class="num mono" data-label="Критичные/1000">
|
| 929 |
|
|
@@ -959,7 +995,7 @@
|
|
| 959 |
</tr>
|
| 960 |
|
| 961 |
<tr data-model="mistral/ministral-8b-2512">
|
| 962 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 963 |
<td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-8B-Instruct-2512 (Mistral API)</td>
|
| 964 |
<td class="num mono" data-label="Критичные/1000">
|
| 965 |
|
|
@@ -995,7 +1031,7 @@
|
|
| 995 |
</tr>
|
| 996 |
|
| 997 |
<tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
|
| 998 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 999 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
|
| 1000 |
<td class="num mono" data-label="Критичные/1000">
|
| 1001 |
|
|
@@ -1031,7 +1067,7 @@
|
|
| 1031 |
</tr>
|
| 1032 |
|
| 1033 |
<tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
|
| 1034 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1035 |
<td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
|
| 1036 |
<td class="num mono" data-label="Критичные/1000">
|
| 1037 |
|
|
@@ -1067,7 +1103,7 @@
|
|
| 1067 |
</tr>
|
| 1068 |
|
| 1069 |
<tr data-model="openai/mimo-v2-flash">
|
| 1070 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1071 |
<td class="model-name sticky-1" data-label="Модель">Xiaomi Mimo V2 Flash (Xiaomi API, non-reasoning)</td>
|
| 1072 |
<td class="num mono" data-label="Критичные/1000">
|
| 1073 |
|
|
@@ -1103,7 +1139,7 @@
|
|
| 1103 |
</tr>
|
| 1104 |
|
| 1105 |
<tr data-model="openai/Qwen/Qwen3-32B">
|
| 1106 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1107 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoining)</td>
|
| 1108 |
<td class="num mono" data-label="Критичные/1000">
|
| 1109 |
|
|
@@ -1139,7 +1175,7 @@
|
|
| 1139 |
</tr>
|
| 1140 |
|
| 1141 |
<tr data-model="openrouter/moonshotai/kimi-k2.5">
|
| 1142 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1143 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (non-reasoning, Moonshot AI API)</td>
|
| 1144 |
<td class="num mono" data-label="Критичные/1000">
|
| 1145 |
|
|
@@ -1175,7 +1211,7 @@
|
|
| 1175 |
</tr>
|
| 1176 |
|
| 1177 |
<tr data-model="openai/t-tech/T-pro-it-2.0">
|
| 1178 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1179 |
<td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
|
| 1180 |
<td class="num mono" data-label="Критичные/1000">
|
| 1181 |
|
|
@@ -1211,7 +1247,7 @@
|
|
| 1211 |
</tr>
|
| 1212 |
|
| 1213 |
<tr data-model="openrouter/openrouter/polaris-alpha">
|
| 1214 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1215 |
<td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
|
| 1216 |
<td class="num mono" data-label="Критичные/1000">
|
| 1217 |
|
|
@@ -1247,7 +1283,7 @@
|
|
| 1247 |
</tr>
|
| 1248 |
|
| 1249 |
<tr data-model="openrouter/arcee-ai/trinity-large-preview:free">
|
| 1250 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1251 |
<td class="model-name sticky-1" data-label="Модель">arcee-ai/Trinity-Large-Preview 0.6 (Arcee-AI API)</td>
|
| 1252 |
<td class="num mono" data-label="Критичные/1000">
|
| 1253 |
|
|
@@ -1283,7 +1319,7 @@
|
|
| 1283 |
</tr>
|
| 1284 |
|
| 1285 |
<tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
|
| 1286 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1287 |
<td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
|
| 1288 |
<td class="num mono" data-label="Критичные/1000">
|
| 1289 |
|
|
@@ -1319,7 +1355,7 @@
|
|
| 1319 |
</tr>
|
| 1320 |
|
| 1321 |
<tr data-model="openrouter/z-ai/glm-4.7-flash">
|
| 1322 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1323 |
<td class="model-name sticky-1" data-label="Модель">zai-org/GLM-4.7-Flash (z.ai API, reasoning, temp=0.6)</td>
|
| 1324 |
<td class="num mono" data-label="Критичные/1000">
|
| 1325 |
|
|
@@ -1355,7 +1391,7 @@
|
|
| 1355 |
</tr>
|
| 1356 |
|
| 1357 |
<tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
|
| 1358 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1359 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
|
| 1360 |
<td class="num mono" data-label="Критичные/1000">
|
| 1361 |
|
|
@@ -1391,7 +1427,7 @@
|
|
| 1391 |
</tr>
|
| 1392 |
|
| 1393 |
<tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
|
| 1394 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1395 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
|
| 1396 |
<td class="num mono" data-label="Критичные/1000">
|
| 1397 |
|
|
@@ -1427,7 +1463,7 @@
|
|
| 1427 |
</tr>
|
| 1428 |
|
| 1429 |
<tr data-model="openrouter/moonshotai/kimi-k2.5">
|
| 1430 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1431 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (reasoning, temp=1, Moonshot AI API)</td>
|
| 1432 |
<td class="num mono" data-label="Критичные/1000">
|
| 1433 |
|
|
@@ -1463,7 +1499,7 @@
|
|
| 1463 |
</tr>
|
| 1464 |
|
| 1465 |
<tr data-model="openrouter/moonshotai/kimi-k2-0905">
|
| 1466 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1467 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
|
| 1468 |
<td class="num mono" data-label="Критичные/1000">
|
| 1469 |
|
|
@@ -1499,7 +1535,7 @@
|
|
| 1499 |
</tr>
|
| 1500 |
|
| 1501 |
<tr data-model="openrouter/z-ai/glm-4.6">
|
| 1502 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1503 |
<td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
|
| 1504 |
<td class="num mono" data-label="Критичные/1000">
|
| 1505 |
|
|
@@ -1535,7 +1571,7 @@
|
|
| 1535 |
</tr>
|
| 1536 |
|
| 1537 |
<tr data-model="openrouter/arcee-ai/trinity-large-preview:free">
|
| 1538 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1539 |
<td class="model-name sticky-1" data-label="Модель">arcee-ai/Trinity-Large-Preview (Arcee-AI API)</td>
|
| 1540 |
<td class="num mono" data-label="Критичные/1000">
|
| 1541 |
|
|
@@ -1571,7 +1607,7 @@
|
|
| 1571 |
</tr>
|
| 1572 |
|
| 1573 |
<tr data-model="openrouter/openai/gpt-5">
|
| 1574 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1575 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
|
| 1576 |
<td class="num mono" data-label="Критичные/1000">
|
| 1577 |
|
|
@@ -1607,7 +1643,7 @@
|
|
| 1607 |
</tr>
|
| 1608 |
|
| 1609 |
<tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
|
| 1610 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1611 |
<td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
|
| 1612 |
<td class="num mono" data-label="Критичные/1000">
|
| 1613 |
|
|
@@ -1643,7 +1679,7 @@
|
|
| 1643 |
</tr>
|
| 1644 |
|
| 1645 |
<tr data-model="openrouter/openai/gpt-5">
|
| 1646 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1647 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
|
| 1648 |
<td class="num mono" data-label="Критичные/1000">
|
| 1649 |
|
|
@@ -1679,7 +1715,7 @@
|
|
| 1679 |
</tr>
|
| 1680 |
|
| 1681 |
<tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
|
| 1682 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1683 |
<td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
|
| 1684 |
<td class="num mono" data-label="Критичные/1000">
|
| 1685 |
|
|
@@ -1715,7 +1751,7 @@
|
|
| 1715 |
</tr>
|
| 1716 |
|
| 1717 |
<tr data-model="openrouter/stepfun/step-3.5-flash:free">
|
| 1718 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1719 |
<td class="model-name sticky-1" data-label="Модель">Step-3.5-flash (StepFun API, fp8, temp=0.6, reasoning)</td>
|
| 1720 |
<td class="num mono" data-label="Критичные/1000">
|
| 1721 |
|
|
@@ -1751,7 +1787,7 @@
|
|
| 1751 |
</tr>
|
| 1752 |
|
| 1753 |
<tr data-model="openrouter/openai/gpt-oss-120b">
|
| 1754 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1755 |
<td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
|
| 1756 |
<td class="num mono" data-label="Критичные/1000">
|
| 1757 |
|
|
@@ -1787,7 +1823,7 @@
|
|
| 1787 |
</tr>
|
| 1788 |
|
| 1789 |
<tr data-model="openai/gpt-4.1">
|
| 1790 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1791 |
<td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
|
| 1792 |
<td class="num mono" data-label="Критичные/1000">
|
| 1793 |
|
|
@@ -1823,7 +1859,7 @@
|
|
| 1823 |
</tr>
|
| 1824 |
|
| 1825 |
<tr data-model="openrouter/nvidia/nemotron-3-nano-30b-a3b:free">
|
| 1826 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1827 |
<td class="model-name sticky-1" data-label="Модель">Nemotron-3-Nano-30B-A3B (NVIDIA API, non-reasoning)</td>
|
| 1828 |
<td class="num mono" data-label="Критичные/1000">
|
| 1829 |
|
|
@@ -1859,7 +1895,7 @@
|
|
| 1859 |
</tr>
|
| 1860 |
|
| 1861 |
<tr data-model="mistral/ministral-3b-2512">
|
| 1862 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1863 |
<td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-3B-Instruct-2512 (Mistral API)</td>
|
| 1864 |
<td class="num mono" data-label="Критичные/1000">
|
| 1865 |
|
|
@@ -1895,7 +1931,7 @@
|
|
| 1895 |
</tr>
|
| 1896 |
|
| 1897 |
<tr data-model="openrouter/mistralai/mistral-nemo">
|
| 1898 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1899 |
<td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
|
| 1900 |
<td class="num mono" data-label="Критичные/1000">
|
| 1901 |
|
|
@@ -1931,7 +1967,7 @@
|
|
| 1931 |
</tr>
|
| 1932 |
|
| 1933 |
<tr data-model="openai/gpt-4.1-mini">
|
| 1934 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1935 |
<td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
|
| 1936 |
<td class="num mono" data-label="Критичные/1000">
|
| 1937 |
|
|
@@ -1967,7 +2003,7 @@
|
|
| 1967 |
</tr>
|
| 1968 |
|
| 1969 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 1970 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 1971 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
|
| 1972 |
<td class="num mono" data-label="Критичные/1000">
|
| 1973 |
|
|
@@ -2003,7 +2039,7 @@
|
|
| 2003 |
</tr>
|
| 2004 |
|
| 2005 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 2006 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 2007 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
|
| 2008 |
<td class="num mono" data-label="Критичные/1000">
|
| 2009 |
|
|
@@ -2039,7 +2075,7 @@
|
|
| 2039 |
</tr>
|
| 2040 |
|
| 2041 |
<tr data-model="openai/gpt-4.1-nano">
|
| 2042 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 2043 |
<td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
|
| 2044 |
<td class="num mono" data-label="Критичные/1000">
|
| 2045 |
|
|
@@ -2075,7 +2111,7 @@
|
|
| 2075 |
</tr>
|
| 2076 |
|
| 2077 |
<tr data-model="openai/ai-sage/GigaChat3-10B-A1.8B-bf16">
|
| 2078 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 2079 |
<td class="model-name sticky-1" data-label="Модель">ai-sage/GigaChat3-10B-A1.8B-bf16 (sglang)</td>
|
| 2080 |
<td class="num mono" data-label="Критичные/1000">
|
| 2081 |
|
|
@@ -2111,7 +2147,7 @@
|
|
| 2111 |
</tr>
|
| 2112 |
|
| 2113 |
<tr data-model="openrouter/openai/gpt-oss-20b">
|
| 2114 |
-
<td class="rank mono sticky-0" data-label="#">#
|
| 2115 |
<td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
|
| 2116 |
<td class="num mono" data-label="Критичные/1000">
|
| 2117 |
|
|
@@ -2169,7 +2205,7 @@
|
|
| 2169 |
</div>
|
| 2170 |
<p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
|
| 2171 |
<p class="info-text">
|
| 2172 |
-
Обновлено: 2026-02-
|
| 2173 |
</p>
|
| 2174 |
</div>
|
| 2175 |
<script>
|
|
|
|
| 778 |
<td class="num mono" data-label="Всего токенов">88,360</td>
|
| 779 |
</tr>
|
| 780 |
|
| 781 |
+
<tr data-model="openrouter/openrouter/pony-alpha">
|
| 782 |
<td class="rank mono sticky-0" data-label="#">#20</td>
|
| 783 |
+
<td class="model-name sticky-1" data-label="Модель">Pony Alpha (temp=0.6)</td>
|
| 784 |
+
<td class="num mono" data-label="Критичные/1000">
|
| 785 |
+
|
| 786 |
+
0.22 ± 0.04
|
| 787 |
+
|
| 788 |
+
</td>
|
| 789 |
+
<td class="num mono" data-label="Обычные/1000">
|
| 790 |
+
|
| 791 |
+
0.43 ± 0.04
|
| 792 |
+
|
| 793 |
+
</td>
|
| 794 |
+
<td class="num mono" data-label="Доп./1000">
|
| 795 |
+
|
| 796 |
+
0.24 ± 0.02
|
| 797 |
+
|
| 798 |
+
</td>
|
| 799 |
+
<td data-label="Нормировано ошибок">
|
| 800 |
+
<div class="score-cell">
|
| 801 |
+
<div class="progress-bar">
|
| 802 |
+
|
| 803 |
+
|
| 804 |
+
|
| 805 |
+
<div class="progress-fill" style="width: 75.25%"></div>
|
| 806 |
+
</div>
|
| 807 |
+
<span class="score-value">
|
| 808 |
+
|
| 809 |
+
0.99 ± 0.07
|
| 810 |
+
|
| 811 |
+
</span>
|
| 812 |
+
</div>
|
| 813 |
+
</td>
|
| 814 |
+
<td class="num mono" data-label="Всего токенов">126,482</td>
|
| 815 |
+
</tr>
|
| 816 |
+
|
| 817 |
+
<tr data-model="openai/ai-sage/GigaChat-20B-A3B-instruct-v1.5-bf16">
|
| 818 |
+
<td class="rank mono sticky-0" data-label="#">#21</td>
|
| 819 |
<td class="model-name sticky-1" data-label="Модель">GigaChat-20B-A3B-instruct-v1.5 (SGLang)</td>
|
| 820 |
<td class="num mono" data-label="Критичные/1000">
|
| 821 |
|
|
|
|
| 851 |
</tr>
|
| 852 |
|
| 853 |
<tr data-model="deepseek/deepseek-reasoner">
|
| 854 |
+
<td class="rank mono sticky-0" data-label="#">#22</td>
|
| 855 |
<td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-reasoner (Deepseek API)</td>
|
| 856 |
<td class="num mono" data-label="Критичные/1000">
|
| 857 |
|
|
|
|
| 887 |
</tr>
|
| 888 |
|
| 889 |
<tr data-model="mistral/ministral-14b-2512">
|
| 890 |
+
<td class="rank mono sticky-0" data-label="#">#23</td>
|
| 891 |
<td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-14B-Instruct-2512 (Mistral API)</td>
|
| 892 |
<td class="num mono" data-label="Критичные/1000">
|
| 893 |
|
|
|
|
| 923 |
</tr>
|
| 924 |
|
| 925 |
<tr data-model="litellm_proxy/deepseek-v3">
|
| 926 |
+
<td class="rank mono sticky-0" data-label="#">#24</td>
|
| 927 |
<td class="model-name sticky-1" data-label="Модель">Deepseek V3.2-Exp (Deepseek API)</td>
|
| 928 |
<td class="num mono" data-label="Критичные/1000">
|
| 929 |
|
|
|
|
| 959 |
</tr>
|
| 960 |
|
| 961 |
<tr data-model="litellm_proxy/tmp-gemma-3n-e4b-it">
|
| 962 |
+
<td class="rank mono sticky-0" data-label="#">#25</td>
|
| 963 |
<td class="model-name sticky-1" data-label="Модель">google/gemma-3n-E4B-it (AI Studio)</td>
|
| 964 |
<td class="num mono" data-label="Критичные/1000">
|
| 965 |
|
|
|
|
| 995 |
</tr>
|
| 996 |
|
| 997 |
<tr data-model="mistral/ministral-8b-2512">
|
| 998 |
+
<td class="rank mono sticky-0" data-label="#">#26</td>
|
| 999 |
<td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-8B-Instruct-2512 (Mistral API)</td>
|
| 1000 |
<td class="num mono" data-label="Критичные/1000">
|
| 1001 |
|
|
|
|
| 1031 |
</tr>
|
| 1032 |
|
| 1033 |
<tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
|
| 1034 |
+
<td class="rank mono sticky-0" data-label="#">#27</td>
|
| 1035 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
|
| 1036 |
<td class="num mono" data-label="Критичные/1000">
|
| 1037 |
|
|
|
|
| 1067 |
</tr>
|
| 1068 |
|
| 1069 |
<tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
|
| 1070 |
+
<td class="rank mono sticky-0" data-label="#">#28</td>
|
| 1071 |
<td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
|
| 1072 |
<td class="num mono" data-label="Критичные/1000">
|
| 1073 |
|
|
|
|
| 1103 |
</tr>
|
| 1104 |
|
| 1105 |
<tr data-model="openai/mimo-v2-flash">
|
| 1106 |
+
<td class="rank mono sticky-0" data-label="#">#29</td>
|
| 1107 |
<td class="model-name sticky-1" data-label="Модель">Xiaomi Mimo V2 Flash (Xiaomi API, non-reasoning)</td>
|
| 1108 |
<td class="num mono" data-label="Критичные/1000">
|
| 1109 |
|
|
|
|
| 1139 |
</tr>
|
| 1140 |
|
| 1141 |
<tr data-model="openai/Qwen/Qwen3-32B">
|
| 1142 |
+
<td class="rank mono sticky-0" data-label="#">#30</td>
|
| 1143 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoining)</td>
|
| 1144 |
<td class="num mono" data-label="Критичные/1000">
|
| 1145 |
|
|
|
|
| 1175 |
</tr>
|
| 1176 |
|
| 1177 |
<tr data-model="openrouter/moonshotai/kimi-k2.5">
|
| 1178 |
+
<td class="rank mono sticky-0" data-label="#">#31</td>
|
| 1179 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (non-reasoning, Moonshot AI API)</td>
|
| 1180 |
<td class="num mono" data-label="Критичные/1000">
|
| 1181 |
|
|
|
|
| 1211 |
</tr>
|
| 1212 |
|
| 1213 |
<tr data-model="openai/t-tech/T-pro-it-2.0">
|
| 1214 |
+
<td class="rank mono sticky-0" data-label="#">#32</td>
|
| 1215 |
<td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
|
| 1216 |
<td class="num mono" data-label="Критичные/1000">
|
| 1217 |
|
|
|
|
| 1247 |
</tr>
|
| 1248 |
|
| 1249 |
<tr data-model="openrouter/openrouter/polaris-alpha">
|
| 1250 |
+
<td class="rank mono sticky-0" data-label="#">#33</td>
|
| 1251 |
<td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
|
| 1252 |
<td class="num mono" data-label="Критичные/1000">
|
| 1253 |
|
|
|
|
| 1283 |
</tr>
|
| 1284 |
|
| 1285 |
<tr data-model="openrouter/arcee-ai/trinity-large-preview:free">
|
| 1286 |
+
<td class="rank mono sticky-0" data-label="#">#34</td>
|
| 1287 |
<td class="model-name sticky-1" data-label="Модель">arcee-ai/Trinity-Large-Preview 0.6 (Arcee-AI API)</td>
|
| 1288 |
<td class="num mono" data-label="Критичные/1000">
|
| 1289 |
|
|
|
|
| 1319 |
</tr>
|
| 1320 |
|
| 1321 |
<tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
|
| 1322 |
+
<td class="rank mono sticky-0" data-label="#">#35</td>
|
| 1323 |
<td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
|
| 1324 |
<td class="num mono" data-label="Критичные/1000">
|
| 1325 |
|
|
|
|
| 1355 |
</tr>
|
| 1356 |
|
| 1357 |
<tr data-model="openrouter/z-ai/glm-4.7-flash">
|
| 1358 |
+
<td class="rank mono sticky-0" data-label="#">#36</td>
|
| 1359 |
<td class="model-name sticky-1" data-label="Модель">zai-org/GLM-4.7-Flash (z.ai API, reasoning, temp=0.6)</td>
|
| 1360 |
<td class="num mono" data-label="Критичные/1000">
|
| 1361 |
|
|
|
|
| 1391 |
</tr>
|
| 1392 |
|
| 1393 |
<tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
|
| 1394 |
+
<td class="rank mono sticky-0" data-label="#">#37</td>
|
| 1395 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
|
| 1396 |
<td class="num mono" data-label="Критичные/1000">
|
| 1397 |
|
|
|
|
| 1427 |
</tr>
|
| 1428 |
|
| 1429 |
<tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
|
| 1430 |
+
<td class="rank mono sticky-0" data-label="#">#38</td>
|
| 1431 |
<td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
|
| 1432 |
<td class="num mono" data-label="Критичные/1000">
|
| 1433 |
|
|
|
|
| 1463 |
</tr>
|
| 1464 |
|
| 1465 |
<tr data-model="openrouter/moonshotai/kimi-k2.5">
|
| 1466 |
+
<td class="rank mono sticky-0" data-label="#">#39</td>
|
| 1467 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (reasoning, temp=1, Moonshot AI API)</td>
|
| 1468 |
<td class="num mono" data-label="Критичные/1000">
|
| 1469 |
|
|
|
|
| 1499 |
</tr>
|
| 1500 |
|
| 1501 |
<tr data-model="openrouter/moonshotai/kimi-k2-0905">
|
| 1502 |
+
<td class="rank mono sticky-0" data-label="#">#40</td>
|
| 1503 |
<td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
|
| 1504 |
<td class="num mono" data-label="Критичные/1000">
|
| 1505 |
|
|
|
|
| 1535 |
</tr>
|
| 1536 |
|
| 1537 |
<tr data-model="openrouter/z-ai/glm-4.6">
|
| 1538 |
+
<td class="rank mono sticky-0" data-label="#">#41</td>
|
| 1539 |
<td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
|
| 1540 |
<td class="num mono" data-label="Критичные/1000">
|
| 1541 |
|
|
|
|
| 1571 |
</tr>
|
| 1572 |
|
| 1573 |
<tr data-model="openrouter/arcee-ai/trinity-large-preview:free">
|
| 1574 |
+
<td class="rank mono sticky-0" data-label="#">#42</td>
|
| 1575 |
<td class="model-name sticky-1" data-label="Модель">arcee-ai/Trinity-Large-Preview (Arcee-AI API)</td>
|
| 1576 |
<td class="num mono" data-label="Критичные/1000">
|
| 1577 |
|
|
|
|
| 1607 |
</tr>
|
| 1608 |
|
| 1609 |
<tr data-model="openrouter/openai/gpt-5">
|
| 1610 |
+
<td class="rank mono sticky-0" data-label="#">#43</td>
|
| 1611 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
|
| 1612 |
<td class="num mono" data-label="Критичные/1000">
|
| 1613 |
|
|
|
|
| 1643 |
</tr>
|
| 1644 |
|
| 1645 |
<tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
|
| 1646 |
+
<td class="rank mono sticky-0" data-label="#">#44</td>
|
| 1647 |
<td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
|
| 1648 |
<td class="num mono" data-label="Критичные/1000">
|
| 1649 |
|
|
|
|
| 1679 |
</tr>
|
| 1680 |
|
| 1681 |
<tr data-model="openrouter/openai/gpt-5">
|
| 1682 |
+
<td class="rank mono sticky-0" data-label="#">#45</td>
|
| 1683 |
<td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
|
| 1684 |
<td class="num mono" data-label="Критичные/1000">
|
| 1685 |
|
|
|
|
| 1715 |
</tr>
|
| 1716 |
|
| 1717 |
<tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
|
| 1718 |
+
<td class="rank mono sticky-0" data-label="#">#46</td>
|
| 1719 |
<td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
|
| 1720 |
<td class="num mono" data-label="Критичные/1000">
|
| 1721 |
|
|
|
|
| 1751 |
</tr>
|
| 1752 |
|
| 1753 |
<tr data-model="openrouter/stepfun/step-3.5-flash:free">
|
| 1754 |
+
<td class="rank mono sticky-0" data-label="#">#47</td>
|
| 1755 |
<td class="model-name sticky-1" data-label="Модель">Step-3.5-flash (StepFun API, fp8, temp=0.6, reasoning)</td>
|
| 1756 |
<td class="num mono" data-label="Критичные/1000">
|
| 1757 |
|
|
|
|
| 1787 |
</tr>
|
| 1788 |
|
| 1789 |
<tr data-model="openrouter/openai/gpt-oss-120b">
|
| 1790 |
+
<td class="rank mono sticky-0" data-label="#">#48</td>
|
| 1791 |
<td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
|
| 1792 |
<td class="num mono" data-label="Критичные/1000">
|
| 1793 |
|
|
|
|
| 1823 |
</tr>
|
| 1824 |
|
| 1825 |
<tr data-model="openai/gpt-4.1">
|
| 1826 |
+
<td class="rank mono sticky-0" data-label="#">#49</td>
|
| 1827 |
<td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
|
| 1828 |
<td class="num mono" data-label="Критичные/1000">
|
| 1829 |
|
|
|
|
| 1859 |
</tr>
|
| 1860 |
|
| 1861 |
<tr data-model="openrouter/nvidia/nemotron-3-nano-30b-a3b:free">
|
| 1862 |
+
<td class="rank mono sticky-0" data-label="#">#50</td>
|
| 1863 |
<td class="model-name sticky-1" data-label="Модель">Nemotron-3-Nano-30B-A3B (NVIDIA API, non-reasoning)</td>
|
| 1864 |
<td class="num mono" data-label="Критичные/1000">
|
| 1865 |
|
|
|
|
| 1895 |
</tr>
|
| 1896 |
|
| 1897 |
<tr data-model="mistral/ministral-3b-2512">
|
| 1898 |
+
<td class="rank mono sticky-0" data-label="#">#51</td>
|
| 1899 |
<td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-3B-Instruct-2512 (Mistral API)</td>
|
| 1900 |
<td class="num mono" data-label="Критичные/1000">
|
| 1901 |
|
|
|
|
| 1931 |
</tr>
|
| 1932 |
|
| 1933 |
<tr data-model="openrouter/mistralai/mistral-nemo">
|
| 1934 |
+
<td class="rank mono sticky-0" data-label="#">#52</td>
|
| 1935 |
<td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
|
| 1936 |
<td class="num mono" data-label="Критичные/1000">
|
| 1937 |
|
|
|
|
| 1967 |
</tr>
|
| 1968 |
|
| 1969 |
<tr data-model="openai/gpt-4.1-mini">
|
| 1970 |
+
<td class="rank mono sticky-0" data-label="#">#53</td>
|
| 1971 |
<td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
|
| 1972 |
<td class="num mono" data-label="Критичные/1000">
|
| 1973 |
|
|
|
|
| 2003 |
</tr>
|
| 2004 |
|
| 2005 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 2006 |
+
<td class="rank mono sticky-0" data-label="#">#54</td>
|
| 2007 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
|
| 2008 |
<td class="num mono" data-label="Критичные/1000">
|
| 2009 |
|
|
|
|
| 2039 |
</tr>
|
| 2040 |
|
| 2041 |
<tr data-model="openrouter/minimax/minimax-m2:free">
|
| 2042 |
+
<td class="rank mono sticky-0" data-label="#">#55</td>
|
| 2043 |
<td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
|
| 2044 |
<td class="num mono" data-label="Критичные/1000">
|
| 2045 |
|
|
|
|
| 2075 |
</tr>
|
| 2076 |
|
| 2077 |
<tr data-model="openai/gpt-4.1-nano">
|
| 2078 |
+
<td class="rank mono sticky-0" data-label="#">#56</td>
|
| 2079 |
<td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
|
| 2080 |
<td class="num mono" data-label="Критичные/1000">
|
| 2081 |
|
|
|
|
| 2111 |
</tr>
|
| 2112 |
|
| 2113 |
<tr data-model="openai/ai-sage/GigaChat3-10B-A1.8B-bf16">
|
| 2114 |
+
<td class="rank mono sticky-0" data-label="#">#57</td>
|
| 2115 |
<td class="model-name sticky-1" data-label="Модель">ai-sage/GigaChat3-10B-A1.8B-bf16 (sglang)</td>
|
| 2116 |
<td class="num mono" data-label="Критичные/1000">
|
| 2117 |
|
|
|
|
| 2147 |
</tr>
|
| 2148 |
|
| 2149 |
<tr data-model="openrouter/openai/gpt-oss-20b">
|
| 2150 |
+
<td class="rank mono sticky-0" data-label="#">#58</td>
|
| 2151 |
<td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
|
| 2152 |
<td class="num mono" data-label="Критичные/1000">
|
| 2153 |
|
|
|
|
| 2205 |
</div>
|
| 2206 |
<p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
|
| 2207 |
<p class="info-text">
|
| 2208 |
+
Обновлено: 2026-02-09 17:13:53 | Всего моделей: 58 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
|
| 2209 |
</p>
|
| 2210 |
</div>
|
| 2211 |
<script>
|