kristaller486 committed on
Commit
595a1ac
·
verified ·
1 Parent(s): 4421455

add xiaomi mimo v2 flash

Browse files
Files changed (1) hide show
  1. index.html +60 -24
index.html CHANGED
@@ -1030,8 +1030,44 @@
1030
  <td class="num mono" data-label="Всего токенов">95,684</td>
1031
  </tr>
1032
 
1033
- <tr data-model="openai/Qwen/Qwen3-32B">
1034
  <td class="rank mono sticky-0" data-label="#">#27</td>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1035
  <td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoning)</td>
1036
  <td class="num mono" data-label="Критичные/1000">
1037
 
@@ -1067,7 +1103,7 @@
1067
  </tr>
1068
 
1069
  <tr data-model="openai/t-tech/T-pro-it-2.0">
1070
- <td class="rank mono sticky-0" data-label="#">#28</td>
1071
  <td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
1072
  <td class="num mono" data-label="Критичные/1000">
1073
 
@@ -1103,7 +1139,7 @@
1103
  </tr>
1104
 
1105
  <tr data-model="openrouter/openrouter/polaris-alpha">
1106
- <td class="rank mono sticky-0" data-label="#">#29</td>
1107
  <td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
1108
  <td class="num mono" data-label="Критичные/1000">
1109
 
@@ -1139,7 +1175,7 @@
1139
  </tr>
1140
 
1141
  <tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
1142
- <td class="rank mono sticky-0" data-label="#">#30</td>
1143
  <td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
1144
  <td class="num mono" data-label="Критичные/1000">
1145
 
@@ -1175,7 +1211,7 @@
1175
  </tr>
1176
 
1177
  <tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
1178
- <td class="rank mono sticky-0" data-label="#">#31</td>
1179
  <td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
1180
  <td class="num mono" data-label="Критичные/1000">
1181
 
@@ -1211,7 +1247,7 @@
1211
  </tr>
1212
 
1213
  <tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
1214
- <td class="rank mono sticky-0" data-label="#">#32</td>
1215
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
1216
  <td class="num mono" data-label="Критичные/1000">
1217
 
@@ -1247,7 +1283,7 @@
1247
  </tr>
1248
 
1249
  <tr data-model="openrouter/moonshotai/kimi-k2-0905">
1250
- <td class="rank mono sticky-0" data-label="#">#33</td>
1251
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
1252
  <td class="num mono" data-label="Критичные/1000">
1253
 
@@ -1283,7 +1319,7 @@
1283
  </tr>
1284
 
1285
  <tr data-model="openrouter/z-ai/glm-4.6">
1286
- <td class="rank mono sticky-0" data-label="#">#34</td>
1287
  <td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
1288
  <td class="num mono" data-label="Критичные/1000">
1289
 
@@ -1319,7 +1355,7 @@
1319
  </tr>
1320
 
1321
  <tr data-model="openrouter/openai/gpt-5">
1322
- <td class="rank mono sticky-0" data-label="#">#35</td>
1323
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
1324
  <td class="num mono" data-label="Критичные/1000">
1325
 
@@ -1355,7 +1391,7 @@
1355
  </tr>
1356
 
1357
  <tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
1358
- <td class="rank mono sticky-0" data-label="#">#36</td>
1359
  <td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
1360
  <td class="num mono" data-label="Критичные/1000">
1361
 
@@ -1391,7 +1427,7 @@
1391
  </tr>
1392
 
1393
  <tr data-model="openrouter/openai/gpt-5">
1394
- <td class="rank mono sticky-0" data-label="#">#37</td>
1395
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
1396
  <td class="num mono" data-label="Критичные/1000">
1397
 
@@ -1427,7 +1463,7 @@
1427
  </tr>
1428
 
1429
  <tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
1430
- <td class="rank mono sticky-0" data-label="#">#38</td>
1431
  <td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
1432
  <td class="num mono" data-label="Критичные/1000">
1433
 
@@ -1463,7 +1499,7 @@
1463
  </tr>
1464
 
1465
  <tr data-model="openrouter/openai/gpt-oss-120b">
1466
- <td class="rank mono sticky-0" data-label="#">#39</td>
1467
  <td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
1468
  <td class="num mono" data-label="Критичные/1000">
1469
 
@@ -1499,7 +1535,7 @@
1499
  </tr>
1500
 
1501
  <tr data-model="openai/gpt-4.1">
1502
- <td class="rank mono sticky-0" data-label="#">#40</td>
1503
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
1504
  <td class="num mono" data-label="Критичные/1000">
1505
 
@@ -1535,7 +1571,7 @@
1535
  </tr>
1536
 
1537
  <tr data-model="openrouter/nvidia/nemotron-3-nano-30b-a3b:free">
1538
- <td class="rank mono sticky-0" data-label="#">#41</td>
1539
  <td class="model-name sticky-1" data-label="Модель">Nemotron-3-Nano-30B-A3B (NVIDIA API, non-reasoning)</td>
1540
  <td class="num mono" data-label="Критичные/1000">
1541
 
@@ -1571,7 +1607,7 @@
1571
  </tr>
1572
 
1573
  <tr data-model="mistral/ministral-3b-2512">
1574
- <td class="rank mono sticky-0" data-label="#">#42</td>
1575
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-3B-Instruct-2512 (Mistral API)</td>
1576
  <td class="num mono" data-label="Критичные/1000">
1577
 
@@ -1607,7 +1643,7 @@
1607
  </tr>
1608
 
1609
  <tr data-model="openrouter/mistralai/mistral-nemo">
1610
- <td class="rank mono sticky-0" data-label="#">#43</td>
1611
  <td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
1612
  <td class="num mono" data-label="Критичные/1000">
1613
 
@@ -1643,7 +1679,7 @@
1643
  </tr>
1644
 
1645
  <tr data-model="openai/gpt-4.1-mini">
1646
- <td class="rank mono sticky-0" data-label="#">#44</td>
1647
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
1648
  <td class="num mono" data-label="Критичные/1000">
1649
 
@@ -1679,7 +1715,7 @@
1679
  </tr>
1680
 
1681
  <tr data-model="openrouter/minimax/minimax-m2:free">
1682
- <td class="rank mono sticky-0" data-label="#">#45</td>
1683
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
1684
  <td class="num mono" data-label="Критичные/1000">
1685
 
@@ -1715,7 +1751,7 @@
1715
  </tr>
1716
 
1717
  <tr data-model="openrouter/minimax/minimax-m2:free">
1718
- <td class="rank mono sticky-0" data-label="#">#46</td>
1719
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
1720
  <td class="num mono" data-label="Критичные/1000">
1721
 
@@ -1751,7 +1787,7 @@
1751
  </tr>
1752
 
1753
  <tr data-model="openai/gpt-4.1-nano">
1754
- <td class="rank mono sticky-0" data-label="#">#47</td>
1755
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
1756
  <td class="num mono" data-label="Критичные/1000">
1757
 
@@ -1787,7 +1823,7 @@
1787
  </tr>
1788
 
1789
  <tr data-model="openai/ai-sage/GigaChat3-10B-A1.8B-bf16">
1790
- <td class="rank mono sticky-0" data-label="#">#48</td>
1791
  <td class="model-name sticky-1" data-label="Модель">ai-sage/GigaChat3-10B-A1.8B-bf16 (sglang)</td>
1792
  <td class="num mono" data-label="Критичные/1000">
1793
 
@@ -1823,7 +1859,7 @@
1823
  </tr>
1824
 
1825
  <tr data-model="openrouter/openai/gpt-oss-20b">
1826
- <td class="rank mono sticky-0" data-label="#">#49</td>
1827
  <td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
1828
  <td class="num mono" data-label="Критичные/1000">
1829
 
@@ -1881,7 +1917,7 @@
1881
  </div>
1882
  <p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
1883
  <p class="info-text">
1884
- Обновлено: 2025-12-16 09:18:53 | Всего моделей: 49 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
1885
  </p>
1886
  </div>
1887
  <script>
 
1030
  <td class="num mono" data-label="Всего токенов">95,684</td>
1031
  </tr>
1032
 
1033
+ <tr data-model="openai/mimo-v2-flash">
1034
  <td class="rank mono sticky-0" data-label="#">#27</td>
1035
+ <td class="model-name sticky-1" data-label="Модель">Xiaomi Mimo V2 Flash (Xiaomi API, non-reasoning)</td>
1036
+ <td class="num mono" data-label="Критичные/1000">
1037
+
1038
+ 0.28 ± 0.05
1039
+
1040
+ </td>
1041
+ <td class="num mono" data-label="Обычные/1000">
1042
+
1043
+ 0.59 ± 0.01
1044
+
1045
+ </td>
1046
+ <td class="num mono" data-label="Доп./1000">
1047
+
1048
+ 0.20 ± 0.03
1049
+
1050
+ </td>
1051
+ <td data-label="Нормировано ошибок">
1052
+ <div class="score-cell">
1053
+ <div class="progress-bar">
1054
+
1055
+
1056
+
1057
+ <div class="progress-fill" style="width: 69.0%"></div>
1058
+ </div>
1059
+ <span class="score-value">
1060
+
1061
+ 1.24 ± 0.11
1062
+
1063
+ </span>
1064
+ </div>
1065
+ </td>
1066
+ <td class="num mono" data-label="Всего токенов">140,821</td>
1067
+ </tr>
1068
+
1069
+ <tr data-model="openai/Qwen/Qwen3-32B">
1070
+ <td class="rank mono sticky-0" data-label="#">#28</td>
1071
  <td class="model-name sticky-1" data-label="Модель">Qwen3-32B (SGLang, without reasoning)</td>
1072
  <td class="num mono" data-label="Критичные/1000">
1073
 
 
1103
  </tr>
1104
 
1105
  <tr data-model="openai/t-tech/T-pro-it-2.0">
1106
+ <td class="rank mono sticky-0" data-label="#">#29</td>
1107
  <td class="model-name sticky-1" data-label="Модель">t-tech/T-pro-it-2.0 (SGLang, without reasoning)</td>
1108
  <td class="num mono" data-label="Критичные/1000">
1109
 
 
1139
  </tr>
1140
 
1141
  <tr data-model="openrouter/openrouter/polaris-alpha">
1142
+ <td class="rank mono sticky-0" data-label="#">#30</td>
1143
  <td class="model-name sticky-1" data-label="Модель">Polaris Alpha</td>
1144
  <td class="num mono" data-label="Критичные/1000">
1145
 
 
1175
  </tr>
1176
 
1177
  <tr data-model="openai/tiiuae/Falcon-H1-34B-Instruct">
1178
+ <td class="rank mono sticky-0" data-label="#">#31</td>
1179
  <td class="model-name sticky-1" data-label="Модель">tiiuae/Falcon-H1-34B-Instruct (vllm)</td>
1180
  <td class="num mono" data-label="Критичные/1000">
1181
 
 
1211
  </tr>
1212
 
1213
  <tr data-model="openrouter/qwen/qwen3-235b-a22b-2507">
1214
+ <td class="rank mono sticky-0" data-label="#">#32</td>
1215
  <td class="model-name sticky-1" data-label="Модель">Qwen3-235B-A22B-2507-Instruct (Alibaba API)</td>
1216
  <td class="num mono" data-label="Критичные/1000">
1217
 
 
1247
  </tr>
1248
 
1249
  <tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
1250
+ <td class="rank mono sticky-0" data-label="#">#33</td>
1251
  <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
1252
  <td class="num mono" data-label="Критичные/1000">
1253
 
 
1283
  </tr>
1284
 
1285
  <tr data-model="openrouter/moonshotai/kimi-k2-0905">
1286
+ <td class="rank mono sticky-0" data-label="#">#34</td>
1287
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
1288
  <td class="num mono" data-label="Критичные/1000">
1289
 
 
1319
  </tr>
1320
 
1321
  <tr data-model="openrouter/z-ai/glm-4.6">
1322
+ <td class="rank mono sticky-0" data-label="#">#35</td>
1323
  <td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
1324
  <td class="num mono" data-label="Критичные/1000">
1325
 
 
1355
  </tr>
1356
 
1357
  <tr data-model="openrouter/openai/gpt-5">
1358
+ <td class="rank mono sticky-0" data-label="#">#36</td>
1359
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
1360
  <td class="num mono" data-label="Критичные/1000">
1361
 
 
1391
  </tr>
1392
 
1393
  <tr data-model="openai/aquif-3.5-Max-42B-A3B.Q8_0.gguf">
1394
+ <td class="rank mono sticky-0" data-label="#">#37</td>
1395
  <td class="model-name sticky-1" data-label="Модель">aquif-ai/aquif-3.5-Plus-30B-A3B (Q8_0 llama.cpp, without reasoning)</td>
1396
  <td class="num mono" data-label="Критичные/1000">
1397
 
 
1427
  </tr>
1428
 
1429
  <tr data-model="openrouter/openai/gpt-5">
1430
+ <td class="rank mono sticky-0" data-label="#">#38</td>
1431
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
1432
  <td class="num mono" data-label="Критичные/1000">
1433
 
 
1463
  </tr>
1464
 
1465
  <tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
1466
+ <td class="rank mono sticky-0" data-label="#">#39</td>
1467
  <td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
1468
  <td class="num mono" data-label="Критичные/1000">
1469
 
 
1499
  </tr>
1500
 
1501
  <tr data-model="openrouter/openai/gpt-oss-120b">
1502
+ <td class="rank mono sticky-0" data-label="#">#40</td>
1503
  <td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
1504
  <td class="num mono" data-label="Критичные/1000">
1505
 
 
1535
  </tr>
1536
 
1537
  <tr data-model="openai/gpt-4.1">
1538
+ <td class="rank mono sticky-0" data-label="#">#41</td>
1539
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1</td>
1540
  <td class="num mono" data-label="Критичные/1000">
1541
 
 
1571
  </tr>
1572
 
1573
  <tr data-model="openrouter/nvidia/nemotron-3-nano-30b-a3b:free">
1574
+ <td class="rank mono sticky-0" data-label="#">#42</td>
1575
  <td class="model-name sticky-1" data-label="Модель">Nemotron-3-Nano-30B-A3B (NVIDIA API, non-reasoning)</td>
1576
  <td class="num mono" data-label="Критичные/1000">
1577
 
 
1607
  </tr>
1608
 
1609
  <tr data-model="mistral/ministral-3b-2512">
1610
+ <td class="rank mono sticky-0" data-label="#">#43</td>
1611
  <td class="model-name sticky-1" data-label="Модель">mistralai/Ministral-3-3B-Instruct-2512 (Mistral API)</td>
1612
  <td class="num mono" data-label="Критичные/1000">
1613
 
 
1643
  </tr>
1644
 
1645
  <tr data-model="openrouter/mistralai/mistral-nemo">
1646
+ <td class="rank mono sticky-0" data-label="#">#44</td>
1647
  <td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
1648
  <td class="num mono" data-label="Критичные/1000">
1649
 
 
1679
  </tr>
1680
 
1681
  <tr data-model="openai/gpt-4.1-mini">
1682
+ <td class="rank mono sticky-0" data-label="#">#45</td>
1683
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-mini</td>
1684
  <td class="num mono" data-label="Критичные/1000">
1685
 
 
1715
  </tr>
1716
 
1717
  <tr data-model="openrouter/minimax/minimax-m2:free">
1718
+ <td class="rank mono sticky-0" data-label="#">#46</td>
1719
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API)</td>
1720
  <td class="num mono" data-label="Критичные/1000">
1721
 
 
1751
  </tr>
1752
 
1753
  <tr data-model="openrouter/minimax/minimax-m2:free">
1754
+ <td class="rank mono sticky-0" data-label="#">#47</td>
1755
  <td class="model-name sticky-1" data-label="Модель">MiniMaxAI/MiniMax-M2 (Minimax API, recommend params)</td>
1756
  <td class="num mono" data-label="Критичные/1000">
1757
 
 
1787
  </tr>
1788
 
1789
  <tr data-model="openai/gpt-4.1-nano">
1790
+ <td class="rank mono sticky-0" data-label="#">#48</td>
1791
  <td class="model-name sticky-1" data-label="Модель">GPT-4.1-nano</td>
1792
  <td class="num mono" data-label="Критичные/1000">
1793
 
 
1823
  </tr>
1824
 
1825
  <tr data-model="openai/ai-sage/GigaChat3-10B-A1.8B-bf16">
1826
+ <td class="rank mono sticky-0" data-label="#">#49</td>
1827
  <td class="model-name sticky-1" data-label="Модель">ai-sage/GigaChat3-10B-A1.8B-bf16 (sglang)</td>
1828
  <td class="num mono" data-label="Критичные/1000">
1829
 
 
1859
  </tr>
1860
 
1861
  <tr data-model="openrouter/openai/gpt-oss-20b">
1862
+ <td class="rank mono sticky-0" data-label="#">#50</td>
1863
  <td class="model-name sticky-1" data-label="Модель">openai/gpt-oss-20b (Vertex API)</td>
1864
  <td class="num mono" data-label="Критичные/1000">
1865
 
 
1917
  </div>
1918
  <p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
1919
  <p class="info-text">
1920
+ Обновлено: 2025-12-16 17:37:47 | Всего моделей: 50 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
1921
  </p>
1922
  </div>
1923
  <script>