kristaller486 committed on
Commit
32b05d5
·
verified ·
1 Parent(s): 35b5bbd

add pony alpha

Browse files
Files changed (1) hide show
  1. index.html +75 -39
index.html CHANGED
@@ -778,8 +778,44 @@
778
  <td class="num mono" data-label="Всего токенов">88,360</td>
779
  </tr>
780
 
781
- <tr data-model="openai/ai-sage/GigaChat-20B-A3B-instruct-v1.5-bf16">
782
  <td class="rank mono sticky-0" data-label="#">#20</td>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
783
  <td class="model-name sticky-1" data-label="Модель">GigaChat-20B-A3B-instruct-v1.5 (SGLang)</td>
784
  <td class="num mono" data-label="Критичные/1000">
785
 
@@ -815,7 +851,7 @@
815
  </tr>
816
 
817
  <tr data-model="deepseek/deepseek-reasoner">
818
- <td class="rank mono sticky-0" data-label="#">#21</td>
819
  <td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-reasoner (Deepseek API)</td>
820
  <td class="num mono" data-label="Критичные/1000">
821
 
@@ -851,7 +887,7 @@
851
  </tr>
852
 
853
  <tr data-model="mistral/ministral-14b-2512">
854
- <td class="rank mono sticky-0" data-label="#">#22</td>
855
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-14B-Instruct-2512 (Mistral API)</td>
856
  <td class="num mono" data-label="Критичные/1000">
857
 
@@ -887,7 +923,7 @@
887
  </tr>
888
 
889
  <tr data-model="litellm_proxy/deepseek-v3">
890
- <td class="rank mono sticky-0" data-label="#">#23</td>
891
  <td class="model-name sticky-1" data-label="Модель">Deepseek V3.2-Exp (Deepseek API)</td>
892
  <td class="num mono" data-label="Критичные/1000">
893
 
@@ -923,7 +959,7 @@
923
  </tr>
924
 
925
  <tr data-model="litellm_proxy/tmp-gemma-3n-e4b-it">
926
- <td class="rank mono sticky-0" data-label="#">#24</td>
927
  <td class="model-name sticky-1" data-label="Модель">google/gemma-3n-E4B-it (AI Studio)</td>
928
  <td class="num mono" data-label="Критичные/1000">
929
 
@@ -959,7 +995,7 @@
959
  </tr>
960
 
961
  <tr data-model="mistral/ministral-8b-2512">
962
- <td class="rank mono sticky-0" data-label="#">#25</td>
963
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-8B-Instruct-2512 (Mistral API)</td>
964
  <td class="num mono" data-label="Критичные/1000">
965
 
@@ -995,7 +1031,7 @@
995
  </tr>
996
 
997
  <tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
998
- <td class="rank mono sticky-0" data-label="#">#26</td>
999
  <td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
1000
  <td class="num mono" data-label="Критичные/1000">
1001
 
@@ -1031,7 +1067,7 @@
1031
  </tr>
1032
 
1033
  <tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
1034
- <td class="rank mono sticky-0" data-label="#">#27</td>
1035
  <td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
1036
  <td class="num mono" data-label="Критичные/1000">
1037
 
@@ -1067,7 +1103,7 @@
1067
  </tr>
1068
 
1069
  <tr data-model="openai/mimo-v2-flash">
1070
- <td class="rank mono sticky-0" data-label="#">#28</td>
1071
  <td class="model-name sticky-1" data-label="Модель">Xiaomi Mimo V2 Flash (Xiaomi API, non-reasoning)</td>
1072
  <td class="num mono" data-label="Критичные/1000">
1073
 
@@ -1103,7 +1139,7 @@
1103
  </tr>
1104
 
1105
  <tr data-model="openai/Qwen/Qwen3-32B">
1106
- <td class="rank mono sticky-0" data-label="#">#29</td>
1107
  <td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoining)</td>
1108
  <td class="num mono" data-label="Критичные/1000">
1109
 
@@ -1139,7 +1175,7 @@
1139
  </tr>
1140
 
1141
  <tr data-model="openrouter/moonshotai/kimi-k2.5">
1142
- <td class="rank mono sticky-0" data-label="#">#30</td>
1143
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (non-reasoning, Moonshot AI API)</td>
1144
  <td class="num mono" data-label="Критичные/1000">
1145
 
@@ -1175,7 +1211,7 @@
1175
  </tr>
1176
 
1177
  <tr data-model="openai/t-tech/T-pro-it-2.0">
1178
- <td class="rank mono sticky-0" data-label="#">#31</td>
1179
  <td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
1180
  <td class="num mono" data-label="Критичные/1000">
1181
 
@@ -1211,7 +1247,7 @@
1211
  </tr>
1212
 
1213
  <tr data-model="openrouter/openrouter/polaris-alpha">
1214
- <td class="rank mono sticky-0" data-label="#">#32</td>
1215
  <td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
1216
  <td class="num mono" data-label="Критичные/1000">
1217
 
@@ -1247,7 +1283,7 @@
1247
  </tr>
1248
 
1249
  <tr data-model="openrouter/arcee-ai/trinity-large-preview:free">
1250
- <td class="rank mono sticky-0" data-label="#">#33</td>
1251
  <td class="model-name sticky-1" data-label="Модель">arcee-ai/Trinity-Large-Preview 0.6 (Arcee-AI API)</td>
1252
  <td class="num mono" data-label="Критичные/1000">
1253
 
@@ -1283,7 +1319,7 @@
1283
  </tr>
1284
 
1285
  <tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
1286
- <td class="rank mono sticky-0" data-label="#">#34</td>
1287
  <td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
1288
  <td class="num mono" data-label="Критичные/1000">
1289
 
@@ -1319,7 +1355,7 @@
1319
  </tr>
1320
 
1321
  <tr data-model="openrouter/z-ai/glm-4.7-flash">
1322
- <td class="rank mono sticky-0" data-label="#">#35</td>
1323
  <td class="model-name sticky-1" data-label="Модель">zai-org/GLM-4.7-Flash (z.ai API, reasoning, temp=0.6)</td>
1324
  <td class="num mono" data-label="Критичные/1000">
1325
 
@@ -1355,7 +1391,7 @@
1355
  </tr>
1356
 
1357
  <tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
1358
- <td class="rank mono sticky-0" data-label="#">#36</td>
1359
  <td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
1360
  <td class="num mono" data-label="Критичные/1000">
1361
 
@@ -1391,7 +1427,7 @@
1391
  </tr>
1392
 
1393
  <tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
1394
- <td class="rank mono sticky-0" data-label="#">#37</td>
1395
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
1396
  <td class="num mono" data-label="Критичные/1000">
1397
 
@@ -1427,7 +1463,7 @@
1427
  </tr>
1428
 
1429
  <tr data-model="openrouter/moonshotai/kimi-k2.5">
1430
- <td class="rank mono sticky-0" data-label="#">#38</td>
1431
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (reasoning, temp=1, Moonshot AI API)</td>
1432
  <td class="num mono" data-label="Критичные/1000">
1433
 
@@ -1463,7 +1499,7 @@
1463
  </tr>
1464
 
1465
  <tr data-model="openrouter/moonshotai/kimi-k2-0905">
1466
- <td class="rank mono sticky-0" data-label="#">#39</td>
1467
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
1468
  <td class="num mono" data-label="Критичные/1000">
1469
 
@@ -1499,7 +1535,7 @@
1499
  </tr>
1500
 
1501
  <tr data-model="openrouter/z-ai/glm-4.6">
1502
- <td class="rank mono sticky-0" data-label="#">#40</td>
1503
  <td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
1504
  <td class="num mono" data-label="Критичные/1000">
1505
 
@@ -1535,7 +1571,7 @@
1535
  </tr>
1536
 
1537
  <tr data-model="openrouter/arcee-ai/trinity-large-preview:free">
1538
- <td class="rank mono sticky-0" data-label="#">#41</td>
1539
  <td class="model-name sticky-1" data-label="Модель">arcee-ai/Trinity-Large-Preview (Arcee-AI API)</td>
1540
  <td class="num mono" data-label="Критичные/1000">
1541
 
@@ -1571,7 +1607,7 @@
1571
  </tr>
1572
 
1573
  <tr data-model="openrouter/openai/gpt-5">
1574
- <td class="rank mono sticky-0" data-label="#">#42</td>
1575
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
1576
  <td class="num mono" data-label="Критичные/1000">
1577
 
@@ -1607,7 +1643,7 @@
1607
  </tr>
1608
 
1609
  <tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
1610
- <td class="rank mono sticky-0" data-label="#">#43</td>
1611
  <td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
1612
  <td class="num mono" data-label="Критичные/1000">
1613
 
@@ -1643,7 +1679,7 @@
1643
  </tr>
1644
 
1645
  <tr data-model="openrouter/openai/gpt-5">
1646
- <td class="rank mono sticky-0" data-label="#">#44</td>
1647
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
1648
  <td class="num mono" data-label="Критичные/1000">
1649
 
@@ -1679,7 +1715,7 @@
1679
  </tr>
1680
 
1681
  <tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
1682
- <td class="rank mono sticky-0" data-label="#">#45</td>
1683
  <td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
1684
  <td class="num mono" data-label="Критичные/1000">
1685
 
@@ -1715,7 +1751,7 @@
1715
  </tr>
1716
 
1717
  <tr data-model="openrouter/stepfun/step-3.5-flash:free">
1718
- <td class="rank mono sticky-0" data-label="#">#46</td>
1719
  <td class="model-name sticky-1" data-label="Модель">Step-3.5-flash (StepFun API, fp8, temp=0.6, reasoning)</td>
1720
  <td class="num mono" data-label="Критичные/1000">
1721
 
@@ -1751,7 +1787,7 @@
1751
  </tr>
1752
 
1753
  <tr data-model="openrouter/openai/gpt-oss-120b">
1754
- <td class="rank mono sticky-0" data-label="#">#47</td>
1755
  <td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
1756
  <td class="num mono" data-label="Критичные/1000">
1757
 
@@ -1787,7 +1823,7 @@
1787
  </tr>
1788
 
1789
  <tr data-model="openai/gpt-4.1">
1790
- <td class="rank mono sticky-0" data-label="#">#48</td>
1791
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
1792
  <td class="num mono" data-label="Критичные/1000">
1793
 
@@ -1823,7 +1859,7 @@
1823
  </tr>
1824
 
1825
  <tr data-model="openrouter/nvidia/nemotron-3-nano-30b-a3b:free">
1826
- <td class="rank mono sticky-0" data-label="#">#49</td>
1827
  <td class="model-name sticky-1" data-label="Модель">Nemotron-3-Nano-30B-A3B (NVIDIA API, non-reasoning)</td>
1828
  <td class="num mono" data-label="Критичные/1000">
1829
 
@@ -1859,7 +1895,7 @@
1859
  </tr>
1860
 
1861
  <tr data-model="mistral/ministral-3b-2512">
1862
- <td class="rank mono sticky-0" data-label="#">#50</td>
1863
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-3B-Instruct-2512 (Mistral API)</td>
1864
  <td class="num mono" data-label="Критичные/1000">
1865
 
@@ -1895,7 +1931,7 @@
1895
  </tr>
1896
 
1897
  <tr data-model="openrouter/mistralai/mistral-nemo">
1898
- <td class="rank mono sticky-0" data-label="#">#51</td>
1899
  <td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
1900
  <td class="num mono" data-label="Критичные/1000">
1901
 
@@ -1931,7 +1967,7 @@
1931
  </tr>
1932
 
1933
  <tr data-model="openai/gpt-4.1-mini">
1934
- <td class="rank mono sticky-0" data-label="#">#52</td>
1935
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
1936
  <td class="num mono" data-label="Критичные/1000">
1937
 
@@ -1967,7 +2003,7 @@
1967
  </tr>
1968
 
1969
  <tr data-model="openrouter/minimax/minimax-m2:free">
1970
- <td class="rank mono sticky-0" data-label="#">#53</td>
1971
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
1972
  <td class="num mono" data-label="Критичные/1000">
1973
 
@@ -2003,7 +2039,7 @@
2003
  </tr>
2004
 
2005
  <tr data-model="openrouter/minimax/minimax-m2:free">
2006
- <td class="rank mono sticky-0" data-label="#">#54</td>
2007
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
2008
  <td class="num mono" data-label="Критичные/1000">
2009
 
@@ -2039,7 +2075,7 @@
2039
  </tr>
2040
 
2041
  <tr data-model="openai/gpt-4.1-nano">
2042
- <td class="rank mono sticky-0" data-label="#">#55</td>
2043
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
2044
  <td class="num mono" data-label="Критичные/1000">
2045
 
@@ -2075,7 +2111,7 @@
2075
  </tr>
2076
 
2077
  <tr data-model="openai/ai-sage/GigaChat3-10B-A1.8B-bf16">
2078
- <td class="rank mono sticky-0" data-label="#">#56</td>
2079
  <td class="model-name sticky-1" data-label="Модель">ai-sage/GigaChat3-10B-A1.8B-bf16 (sglang)</td>
2080
  <td class="num mono" data-label="Критичные/1000">
2081
 
@@ -2111,7 +2147,7 @@
2111
  </tr>
2112
 
2113
  <tr data-model="openrouter/openai/gpt-oss-20b">
2114
- <td class="rank mono sticky-0" data-label="#">#57</td>
2115
  <td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
2116
  <td class="num mono" data-label="Критичные/1000">
2117
 
@@ -2169,7 +2205,7 @@
2169
  </div>
2170
  <p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
2171
  <p class="info-text">
2172
- Обновлено: 2026-02-02 10:15:23 | Всего моделей: 57 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
2173
  </p>
2174
  </div>
2175
  <script>
 
778
  <td class="num mono" data-label="Всего токенов">88,360</td>
779
  </tr>
780
 
781
+ <tr data-model="openrouter/openrouter/pony-alpha">
782
  <td class="rank mono sticky-0" data-label="#">#20</td>
783
+ <td class="model-name sticky-1" data-label="Модель">Pony Alpha (temp=0.6)</td>
784
+ <td class="num mono" data-label="Критичные/1000">
785
+
786
+ 0.22 ± 0.04
787
+
788
+ </td>
789
+ <td class="num mono" data-label="Обычные/1000">
790
+
791
+ 0.43 ± 0.04
792
+
793
+ </td>
794
+ <td class="num mono" data-label="Доп./1000">
795
+
796
+ 0.24 ± 0.02
797
+
798
+ </td>
799
+ <td data-label="Нормировано ошибок">
800
+ <div class="score-cell">
801
+ <div class="progress-bar">
802
+
803
+
804
+
805
+ <div class="progress-fill" style="width: 75.25%"></div>
806
+ </div>
807
+ <span class="score-value">
808
+
809
+ 0.99 ± 0.07
810
+
811
+ </span>
812
+ </div>
813
+ </td>
814
+ <td class="num mono" data-label="Всего токенов">126,482</td>
815
+ </tr>
816
+
817
+ <tr data-model="openai/ai-sage/GigaChat-20B-A3B-instruct-v1.5-bf16">
818
+ <td class="rank mono sticky-0" data-label="#">#21</td>
819
  <td class="model-name sticky-1" data-label="Модель">GigaChat-20B-A3B-instruct-v1.5 (SGLang)</td>
820
  <td class="num mono" data-label="Критичные/1000">
821
 
 
851
  </tr>
852
 
853
  <tr data-model="deepseek/deepseek-reasoner">
854
+ <td class="rank mono sticky-0" data-label="#">#22</td>
855
  <td class="model-name sticky-1" data-label="Модель">Deepseek-V3.2-reasoner (Deepseek API)</td>
856
  <td class="num mono" data-label="Критичные/1000">
857
 
 
887
  </tr>
888
 
889
  <tr data-model="mistral/ministral-14b-2512">
890
+ <td class="rank mono sticky-0" data-label="#">#23</td>
891
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-14B-Instruct-2512 (Mistral API)</td>
892
  <td class="num mono" data-label="Критичные/1000">
893
 
 
923
  </tr>
924
 
925
  <tr data-model="litellm_proxy/deepseek-v3">
926
+ <td class="rank mono sticky-0" data-label="#">#24</td>
927
  <td class="model-name sticky-1" data-label="Модель">Deepseek V3.2-Exp (Deepseek API)</td>
928
  <td class="num mono" data-label="Критичные/1000">
929
 
 
959
  </tr>
960
 
961
  <tr data-model="litellm_proxy/tmp-gemma-3n-e4b-it">
962
+ <td class="rank mono sticky-0" data-label="#">#25</td>
963
  <td class="model-name sticky-1" data-label="Модель">google/gemma-3n-E4B-it (AI Studio)</td>
964
  <td class="num mono" data-label="Критичные/1000">
965
 
 
995
  </tr>
996
 
997
  <tr data-model="mistral/ministral-8b-2512">
998
+ <td class="rank mono sticky-0" data-label="#">#26</td>
999
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-8B-Instruct-2512 (Mistral API)</td>
1000
  <td class="num mono" data-label="Критичные/1000">
1001
 
 
1031
  </tr>
1032
 
1033
  <tr data-model="openrouter/qwen/qwen3-next-80b-a3b-instruct">
1034
+ <td class="rank mono sticky-0" data-label="#">#27</td>
1035
  <td class="model-name sticky-1" data-label="Модель">Qwen3-Next-80B-A3B-Instruct (Alibaba API)</td>
1036
  <td class="num mono" data-label="Критичные/1000">
1037
 
 
1067
  </tr>
1068
 
1069
  <tr data-model="openrouter/baidu/ernie-4.5-300b-a47b">
1070
+ <td class="rank mono sticky-0" data-label="#">#28</td>
1071
  <td class="model-name sticky-1" data-label="Модель">baidu/ERNIE-4.5-300B-A47B-PT (Novita API)</td>
1072
  <td class="num mono" data-label="Критичные/1000">
1073
 
 
1103
  </tr>
1104
 
1105
  <tr data-model="openai/mimo-v2-flash">
1106
+ <td class="rank mono sticky-0" data-label="#">#29</td>
1107
  <td class="model-name sticky-1" data-label="Модель">Xiaomi Mimo V2 Flash (Xiaomi API, non-reasoning)</td>
1108
  <td class="num mono" data-label="Критичные/1000">
1109
 
 
1139
  </tr>
1140
 
1141
  <tr data-model="openai/Qwen/Qwen3-32B">
1142
+ <td class="rank mono sticky-0" data-label="#">#30</td>
1143
  <td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoining)</td>
1144
  <td class="num mono" data-label="Критичные/1000">
1145
 
 
1175
  </tr>
1176
 
1177
  <tr data-model="openrouter/moonshotai/kimi-k2.5">
1178
+ <td class="rank mono sticky-0" data-label="#">#31</td>
1179
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (non-reasoning, Moonshot AI API)</td>
1180
  <td class="num mono" data-label="Критичные/1000">
1181
 
 
1211
  </tr>
1212
 
1213
  <tr data-model="openai/t-tech/T-pro-it-2.0">
1214
+ <td class="rank mono sticky-0" data-label="#">#32</td>
1215
  <td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
1216
  <td class="num mono" data-label="Критичные/1000">
1217
 
 
1247
  </tr>
1248
 
1249
  <tr data-model="openrouter/openrouter/polaris-alpha">
1250
+ <td class="rank mono sticky-0" data-label="#">#33</td>
1251
  <td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
1252
  <td class="num mono" data-label="Критичные/1000">
1253
 
 
1283
  </tr>
1284
 
1285
  <tr data-model="openrouter/arcee-ai/trinity-large-preview:free">
1286
+ <td class="rank mono sticky-0" data-label="#">#34</td>
1287
  <td class="model-name sticky-1" data-label="Модель">arcee-ai/Trinity-Large-Preview 0.6 (Arcee-AI API)</td>
1288
  <td class="num mono" data-label="Критичные/1000">
1289
 
 
1319
  </tr>
1320
 
1321
  <tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
1322
+ <td class="rank mono sticky-0" data-label="#">#35</td>
1323
  <td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
1324
  <td class="num mono" data-label="Критичные/1000">
1325
 
 
1355
  </tr>
1356
 
1357
  <tr data-model="openrouter/z-ai/glm-4.7-flash">
1358
+ <td class="rank mono sticky-0" data-label="#">#36</td>
1359
  <td class="model-name sticky-1" data-label="Модель">zai-org/GLM-4.7-Flash (z.ai API, reasoning, temp=0.6)</td>
1360
  <td class="num mono" data-label="Критичные/1000">
1361
 
 
1391
  </tr>
1392
 
1393
  <tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
1394
+ <td class="rank mono sticky-0" data-label="#">#37</td>
1395
  <td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
1396
  <td class="num mono" data-label="Критичные/1000">
1397
 
 
1427
  </tr>
1428
 
1429
  <tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
1430
+ <td class="rank mono sticky-0" data-label="#">#38</td>
1431
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
1432
  <td class="num mono" data-label="Критичные/1000">
1433
 
 
1463
  </tr>
1464
 
1465
  <tr data-model="openrouter/moonshotai/kimi-k2.5">
1466
+ <td class="rank mono sticky-0" data-label="#">#39</td>
1467
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2.5 (reasoning, temp=1, Moonshot AI API)</td>
1468
  <td class="num mono" data-label="Критичные/1000">
1469
 
 
1499
  </tr>
1500
 
1501
  <tr data-model="openrouter/moonshotai/kimi-k2-0905">
1502
+ <td class="rank mono sticky-0" data-label="#">#40</td>
1503
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
1504
  <td class="num mono" data-label="Критичные/1000">
1505
 
 
1535
  </tr>
1536
 
1537
  <tr data-model="openrouter/z-ai/glm-4.6">
1538
+ <td class="rank mono sticky-0" data-label="#">#41</td>
1539
  <td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
1540
  <td class="num mono" data-label="Критичные/1000">
1541
 
 
1571
  </tr>
1572
 
1573
  <tr data-model="openrouter/arcee-ai/trinity-large-preview:free">
1574
+ <td class="rank mono sticky-0" data-label="#">#42</td>
1575
  <td class="model-name sticky-1" data-label="Модель">arcee-ai/Trinity-Large-Preview (Arcee-AI API)</td>
1576
  <td class="num mono" data-label="Критичные/1000">
1577
 
 
1607
  </tr>
1608
 
1609
  <tr data-model="openrouter/openai/gpt-5">
1610
+ <td class="rank mono sticky-0" data-label="#">#43</td>
1611
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
1612
  <td class="num mono" data-label="Критичные/1000">
1613
 
 
1643
  </tr>
1644
 
1645
  <tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
1646
+ <td class="rank mono sticky-0" data-label="#">#44</td>
1647
  <td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
1648
  <td class="num mono" data-label="Критичные/1000">
1649
 
 
1679
  </tr>
1680
 
1681
  <tr data-model="openrouter/openai/gpt-5">
1682
+ <td class="rank mono sticky-0" data-label="#">#45</td>
1683
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
1684
  <td class="num mono" data-label="Критичные/1000">
1685
 
 
1715
  </tr>
1716
 
1717
  <tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
1718
+ <td class="rank mono sticky-0" data-label="#">#46</td>
1719
  <td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
1720
  <td class="num mono" data-label="Критичные/1000">
1721
 
 
1751
  </tr>
1752
 
1753
  <tr data-model="openrouter/stepfun/step-3.5-flash:free">
1754
+ <td class="rank mono sticky-0" data-label="#">#47</td>
1755
  <td class="model-name sticky-1" data-label="Модель">Step-3.5-flash (StepFun API, fp8, temp=0.6, reasoning)</td>
1756
  <td class="num mono" data-label="Критичные/1000">
1757
 
 
1787
  </tr>
1788
 
1789
  <tr data-model="openrouter/openai/gpt-oss-120b">
1790
+ <td class="rank mono sticky-0" data-label="#">#48</td>
1791
  <td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
1792
  <td class="num mono" data-label="Критичные/1000">
1793
 
 
1823
  </tr>
1824
 
1825
  <tr data-model="openai/gpt-4.1">
1826
+ <td class="rank mono sticky-0" data-label="#">#49</td>
1827
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
1828
  <td class="num mono" data-label="Критичные/1000">
1829
 
 
1859
  </tr>
1860
 
1861
  <tr data-model="openrouter/nvidia/nemotron-3-nano-30b-a3b:free">
1862
+ <td class="rank mono sticky-0" data-label="#">#50</td>
1863
  <td class="model-name sticky-1" data-label="Модель">Nemotron-3-Nano-30B-A3B (NVIDIA API, non-reasoning)</td>
1864
  <td class="num mono" data-label="Критичные/1000">
1865
 
 
1895
  </tr>
1896
 
1897
  <tr data-model="mistral/ministral-3b-2512">
1898
+ <td class="rank mono sticky-0" data-label="#">#51</td>
1899
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-3B-Instruct-2512 (Mistral API)</td>
1900
  <td class="num mono" data-label="Критичные/1000">
1901
 
 
1931
  </tr>
1932
 
1933
  <tr data-model="openrouter/mistralai/mistral-nemo">
1934
+ <td class="rank mono sticky-0" data-label="#">#52</td>
1935
  <td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
1936
  <td class="num mono" data-label="Критичные/1000">
1937
 
 
1967
  </tr>
1968
 
1969
  <tr data-model="openai/gpt-4.1-mini">
1970
+ <td class="rank mono sticky-0" data-label="#">#53</td>
1971
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
1972
  <td class="num mono" data-label="Критичные/1000">
1973
 
 
2003
  </tr>
2004
 
2005
  <tr data-model="openrouter/minimax/minimax-m2:free">
2006
+ <td class="rank mono sticky-0" data-label="#">#54</td>
2007
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
2008
  <td class="num mono" data-label="Критичные/1000">
2009
 
 
2039
  </tr>
2040
 
2041
  <tr data-model="openrouter/minimax/minimax-m2:free">
2042
+ <td class="rank mono sticky-0" data-label="#">#55</td>
2043
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
2044
  <td class="num mono" data-label="Критичные/1000">
2045
 
 
2075
  </tr>
2076
 
2077
  <tr data-model="openai/gpt-4.1-nano">
2078
+ <td class="rank mono sticky-0" data-label="#">#56</td>
2079
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
2080
  <td class="num mono" data-label="Критичные/1000">
2081
 
 
2111
  </tr>
2112
 
2113
  <tr data-model="openai/ai-sage/GigaChat3-10B-A1.8B-bf16">
2114
+ <td class="rank mono sticky-0" data-label="#">#57</td>
2115
  <td class="model-name sticky-1" data-label="Модель">ai-sage/GigaChat3-10B-A1.8B-bf16 (sglang)</td>
2116
  <td class="num mono" data-label="Критичные/1000">
2117
 
 
2147
  </tr>
2148
 
2149
  <tr data-model="openrouter/openai/gpt-oss-20b">
2150
+ <td class="rank mono sticky-0" data-label="#">#58</td>
2151
  <td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
2152
  <td class="num mono" data-label="Критичные/1000">
2153
 
 
2205
  </div>
2206
  <p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
2207
  <p class="info-text">
2208
+ Обновлено: 2026-02-09 17:13:53 | Всего моделей: 58 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
2209
  </p>
2210
  </div>
2211
  <script>