kristaller486 committed on
Commit
2863afb
·
verified ·
1 Parent(s): cb8f2c6

add Qwen3-VL-8B-Instruct

Browse files
Files changed (1) hide show
  1. index.html +44 -8
index.html CHANGED
@@ -706,8 +706,44 @@
706
  <td class="num mono" data-label="Всего токенов">137,855</td>
707
  </tr>
708
 
709
- <tr data-model="openrouter/moonshotai/kimi-k2-0905">
710
  <td class="rank mono sticky-0" data-label="#">#18</td>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
711
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
712
  <td class="num mono" data-label="Критичные/1000">
713
 
@@ -743,7 +779,7 @@
743
  </tr>
744
 
745
  <tr data-model="openrouter/z-ai/glm-4.6">
746
- <td class="rank mono sticky-0" data-label="#">#19</td>
747
  <td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
748
  <td class="num mono" data-label="Критичные/1000">
749
 
@@ -779,7 +815,7 @@
779
  </tr>
780
 
781
  <tr data-model="openrouter/openai/gpt-5">
782
- <td class="rank mono sticky-0" data-label="#">#20</td>
783
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
784
  <td class="num mono" data-label="Критичные/1000">
785
 
@@ -815,7 +851,7 @@
815
  </tr>
816
 
817
  <tr data-model="openrouter/openai/gpt-5">
818
- <td class="rank mono sticky-0" data-label="#">#21</td>
819
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
820
  <td class="num mono" data-label="Критичные/1000">
821
 
@@ -851,7 +887,7 @@
851
  </tr>
852
 
853
  <tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
854
- <td class="rank mono sticky-0" data-label="#">#22</td>
855
  <td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
856
  <td class="num mono" data-label="Критичные/1000">
857
 
@@ -887,7 +923,7 @@
887
  </tr>
888
 
889
  <tr data-model="openrouter/openai/gpt-oss-120b">
890
- <td class="rank mono sticky-0" data-label="#">#23</td>
891
  <td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
892
  <td class="num mono" data-label="Критичные/1000">
893
 
@@ -923,7 +959,7 @@
923
  </tr>
924
 
925
  <tr data-model="openrouter/mistralai/mistral-nemo">
926
- <td class="rank mono sticky-0" data-label="#">#24</td>
927
  <td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
928
  <td class="num mono" data-label="Критичные/1000">
929
 
@@ -981,7 +1017,7 @@
981
  </div>
982
  <p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
983
  <p class="info-text">
984
- Обновлено: 2025-10-23 17:11:18 | Всего моделей: 24 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
985
  </p>
986
  </div>
987
  <script>
 
706
  <td class="num mono" data-label="Всего токенов">137,855</td>
707
  </tr>
708
 
709
+ <tr data-model="openrouter/qwen/qwen3-vl-8b-instruct">
710
  <td class="rank mono sticky-0" data-label="#">#18</td>
711
+ <td class="model-name sticky-1" data-label="Модель">Qwen3-VL-8B-Instruct (Alibaba API, presence_penalty=2)</td>
712
+ <td class="num mono" data-label="Критичные/1000">
713
+
714
+ 0.24 ± 0.03
715
+
716
+ </td>
717
+ <td class="num mono" data-label="Обычные/1000">
718
+
719
+ 1.02 ± 0.05
720
+
721
+ </td>
722
+ <td class="num mono" data-label="Доп./1000">
723
+
724
+ 0.32 ± 0.01
725
+
726
+ </td>
727
+ <td data-label="Нормировано ошибок">
728
+ <div class="score-cell">
729
+ <div class="progress-bar">
730
+
731
+
732
+
733
+ <div class="progress-fill" style="width: 40.07220216606498%"></div>
734
+ </div>
735
+ <span class="score-value">
736
+
737
+ 1.66 ± 0.11
738
+
739
+ </span>
740
+ </div>
741
+ </td>
742
+ <td class="num mono" data-label="Всего токенов">165,307</td>
743
+ </tr>
744
+
745
+ <tr data-model="openrouter/moonshotai/kimi-k2-0905">
746
+ <td class="rank mono sticky-0" data-label="#">#19</td>
747
  <td class="model-name sticky-1" data-label="Модель">moonshotai/Kimi-K2-Instruct-0905 (Novita API)</td>
748
  <td class="num mono" data-label="Критичные/1000">
749
 
 
779
  </tr>
780
 
781
  <tr data-model="openrouter/z-ai/glm-4.6">
782
+ <td class="rank mono sticky-0" data-label="#">#20</td>
783
  <td class="model-name sticky-1" data-label="Модель">GLM-4.6 (Z.ai API)</td>
784
  <td class="num mono" data-label="Критичные/1000">
785
 
 
815
  </tr>
816
 
817
  <tr data-model="openrouter/openai/gpt-5">
818
+ <td class="rank mono sticky-0" data-label="#">#21</td>
819
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: minimal)</td>
820
  <td class="num mono" data-label="Критичные/1000">
821
 
 
851
  </tr>
852
 
853
  <tr data-model="openrouter/openai/gpt-5">
854
+ <td class="rank mono sticky-0" data-label="#">#22</td>
855
  <td class="model-name sticky-1" data-label="Модель">GPT-5 (reasoning: low)</td>
856
  <td class="num mono" data-label="Критичные/1000">
857
 
 
887
  </tr>
888
 
889
  <tr data-model="openai/nvidia/NVIDIA-Nemotron-Nano-12B-v2">
890
+ <td class="rank mono sticky-0" data-label="#">#23</td>
891
  <td class="model-name sticky-1" data-label="Модель">nvidia/NVIDIA-Nemotron-Nano-12B-v2 (vllm, reasoning=false)</td>
892
  <td class="num mono" data-label="Критичные/1000">
893
 
 
923
  </tr>
924
 
925
  <tr data-model="openrouter/openai/gpt-oss-120b">
926
+ <td class="rank mono sticky-0" data-label="#">#24</td>
927
  <td class="model-name sticky-1" data-label="Модель">GPT-OSS-120B (Vertex AI API)</td>
928
  <td class="num mono" data-label="Критичные/1000">
929
 
 
959
  </tr>
960
 
961
  <tr data-model="openrouter/mistralai/mistral-nemo">
962
+ <td class="rank mono sticky-0" data-label="#">#25</td>
963
  <td class="model-name sticky-1" data-label="Модель">Mistral-Nemo (Mistral API)</td>
964
  <td class="num mono" data-label="Критичные/1000">
965
 
 
1017
  </div>
1018
  <p class="info-text">Если хотите, чтобы я добавил ту или иную модель в лидерборд - не стесняйтесь открыть issue/pull request на Github.</p>
1019
  <p class="info-text">
1020
+ Обновлено: 2025-10-24 14:31:35 | Всего моделей: 25 | <a href="https://github.com/kristaller486/RuQualBench">GitHub</a> | <a href="https://t.me/krists">Telegram</a>
1021
  </p>
1022
  </div>
1023
  <script>