Lamapi committed on
Commit
52b7d4f
·
verified ·
1 Parent(s): 33f9ca5

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +78 -58
README.md CHANGED
@@ -49,26 +49,31 @@ pipeline_tag: text-generation
49
  ---
50
 
51
  <style>
52
- table { width:fit-content; border-collapse:separate; border-spacing:0 4px;background:rgba(15,22,32,0.4);border-radius:16px; }
53
- thead th { text-align:left; padding:12px 24px; font-size:15px; text-transform:uppercase; color:rgb(200,200,200); }
54
- tbody tr { transition: transform 0.18s ease, box-shadow 0.18s ease; }
55
- tbody tr:hover { transform: translateY(-4px); box-shadow:0 6px 15px rgba(0,0,0,0.06); }
56
- td { padding:14px 24px; border-radius:0px; }
57
- td:first-child { font-weight:600; }
58
- .next td { background: rgba(0,140,255,0.4); color:rgb(200,200,200); font-weight:600; }
59
- tbody tr td:first-child { border-top-left-radius:8px; border-bottom-left-radius:8px; }
60
- tbody tr td:last-child { border-top-right-radius:8px; border-bottom-right-radius:8px; }
61
- @media (max-width:720px){
62
- thead{ display:none; }
63
- table, tbody, tr, td{ display:block; width:fit-content; }
64
- tbody tr{ margin-bottom:12px; transform:none !important; box-shadow:none !important; }
65
- td{ display:flex; justify-content:space-between; padding:10px 12px; }
66
- td[data-label]{ font-size:13px; font-weight:500; color:rgb(200,200,200); }
67
- td span.value{ color:rgb(200,200,200); font-weight:700; }
68
- .next td{ display:flex; justify-content:space-between; align-items:center; }
69
  }
 
 
 
 
 
 
 
 
70
  </style>
71
 
 
 
72
  <table>
73
  <thead>
74
  <tr>
@@ -81,53 +86,18 @@ pipeline_tag: text-generation
81
  </thead>
82
  <tbody>
83
  <tr class="next">
84
- <td data-label="Model">Next Z1</td>
85
- <td data-label="MMLU (5-shot) %">97.32</td>
86
- <td data-label="MMLU-Pro %">94.2</td>
87
- <td data-label="GSM8K %">98.7</td>
88
- <td data-label="MATH %">94.21</td>
89
- </tr>
90
- <tr class="next">
91
- <td data-label="Model">Next Z1 (without tools)</td>
92
- <td data-label="MMLU (5-shot) %">94.7</td>
93
- <td data-label="MMLU-Pro %">90.14</td>
94
- <td data-label="GSM8K %">94.5</td>
95
- <td data-label="MATH %">88.7</td>
96
- </tr>
97
- <tr class="next">
98
- <td data-label="Model">Next 4B</td>
99
  <td data-label="MMLU (5-shot) %">84.61</td>
100
  <td data-label="MMLU-Pro %">66.92</td>
101
  <td data-label="GSM8K %">82.7</td>
102
  <td data-label="MATH %">70.5</td>
103
  </tr>
104
  <tr class="next">
105
- <td data-label="Model">Next 1B</td>
106
- <td data-label="MMLU (5-shot) %">92.3</td>
107
- <td data-label="MMLU-Pro %">69.23</td>
108
- <td data-label="GSM8K %">91.53</td>
109
- <td data-label="MATH %">77.1</td>
110
- </tr>
111
- <tr>
112
- <td data-label="Model">GPT 5</td>
113
- <td data-label="MMLU (5-shot) %">92.5</td>
114
- <td data-label="MMLU-Pro %">87.0</td>
115
- <td data-label="GSM8K %">98.4</td>
116
- <td data-label="MATH %">96.0</td>
117
- </tr>
118
- <tr>
119
- <td data-label="Model">Claude Opus 4.1 (Thinking)</td>
120
- <td data-label="MMLU (5-shot) %">~92.0</td>
121
- <td data-label="MMLU-Pro %">87.8</td>
122
- <td data-label="GSM8K %">84.7</td>
123
- <td data-label="MATH %">95.4</td>
124
- </tr>
125
- <tr>
126
- <td data-label="Model">Kumru 7B</td>
127
- <td data-label="MMLU (5-shot) %">30.76</td>
128
- <td data-label="MMLU-Pro %">28.57</td>
129
- <td data-label="GSM8K %">-</td>
130
- <td data-label="MATH %">-</td>
131
  </tr>
132
  <tr>
133
  <td data-label="Model">Qwen 3 0.6B</td>
@@ -143,10 +113,60 @@ pipeline_tag: text-generation
143
  <td data-label="GSM8K %">11.9</td>
144
  <td data-label="MATH %">30.6</td>
145
  </tr>
 
 
 
 
 
 
 
146
  </tbody>
147
  </table>
148
 
 
149
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
150
 
151
  ---
152
 
 
49
  ---
50
 
51
  <style>
52
+ table { width:fit-content; border-collapse:separate; border-spacing:0 3px;font-family:system-ui, -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, Oxygen, Ubuntu, Cantarell, 'Open Sans', 'Helvetica Neue', sans-serif;background:rgba(15,22,32,0.4);border-radius:16px;padding: 10px; border:none;transition:.2s all ease;}
53
+ thead th { text-align:center; padding:4px 10px; font-size:13px; text-transform:uppercase; color:rgb(200,200,200);border:none; }
54
+ tbody tr { transition: transform 0.18s ease, box-shadow 0.18s ease; border:none !important;transition:.2s all ease;border-radius:16px;background:rgba(0, 0, 0, 0.38);}
55
+ tbody .turkish:hover {box-shadow:0 6px 15px rgba(0, 0, 0, 0.27);scale:1.01;background:rgba(80, 38, 38, 0.6);}
56
+ tbody .next:hover {box-shadow:0 6px 15px rgba(0, 0, 0, 0.27);scale:1.02;background: rgba(0, 59, 225, 1)}
57
+ tbody tr:hover { box-shadow:0 0px 15px rgba(102, 102, 102, 0.13); background:rgba(139, 139, 139, 0.16)}
58
+ td { padding:8px 10px;border:0px transparent !important;outline:transparent !important; text-align:center; }
59
+ td:first-child { font-weight:600;text-align:left }
60
+ /* tbody .turkish td { background: rgba(255, 0, 0, 0.2) !important; color:rgb(200,200,200); font-weight:400;border:0px !important; scale:1.0; } */
61
+ /* tbody .next td { background: rgba(0, 89, 255, 0.49)!important; color:rgb(200,200,200); font-weight:600;border:0px !important; scale:1.00;outline:none;border:none !important;} */
62
+ .next{
63
+ background: rgba(0, 89, 255, 0.49);
 
 
 
 
 
64
  }
65
+ .turkish{
66
+ background:rgba(51, 34, 34, 0.64);
67
+ }
68
+ tbody tr td:first-child { border-top-left-radius:12px; border-bottom-left-radius:12px; }
69
+ tbody tr td:last-child { border-top-right-radius:12px; border-bottom-right-radius:12px; } strong{
70
+ font-size:16px;font-weight:700;
71
+ }
72
+ em{opacity:0.7;font-size:11px !important;}
73
  </style>
74
 
75
+ # Our Next 1B and Next 4B models lead all other tiny models in benchmarks.
76
+
77
  <table>
78
  <thead>
79
  <tr>
 
86
  </thead>
87
  <tbody>
88
  <tr class="next">
89
+ <td data-label="Model">Next 4B preview <em>Version s325</em></td>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
90
  <td data-label="MMLU (5-shot) %">84.61</td>
91
  <td data-label="MMLU-Pro %">66.92</td>
92
  <td data-label="GSM8K %">82.7</td>
93
  <td data-label="MATH %">70.5</td>
94
  </tr>
95
  <tr class="next">
96
+ <td data-label="Model">Next 1B <em>Version t327</em></td>
97
+ <td data-label="MMLU (5-shot) %"><strong>90.3</strong></td>
98
+ <td data-label="MMLU-Pro %"><strong>69.23</strong></td>
99
+ <td data-label="GSM8K %"><strong>91.53</strong></td>
100
+ <td data-label="MATH %"><strong>77.1</strong></td>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
101
  </tr>
102
  <tr>
103
  <td data-label="Model">Qwen 3 0.6B</td>
 
113
  <td data-label="GSM8K %">11.9</td>
114
  <td data-label="MATH %">30.6</td>
115
  </tr>
116
+ <tr class="turkish">
117
+ <td data-label="Model">Kumru 7B</td>
118
+ <td data-label="MMLU (5-shot) %">30.76</td>
119
+ <td data-label="MMLU-Pro %">28.57</td>
120
+ <td data-label="GSM8K %">-</td>
121
+ <td data-label="MATH %">-</td>
122
+ </tr>
123
  </tbody>
124
  </table>
125
 
126
+ ---
127
 
128
+ # Also, our Next Z1 model outperforms state-of-the-art models on some of the benchmarks.
129
+ <table>
130
+ <thead>
131
+ <tr>
132
+ <th>Model</th>
133
+ <th>MMLU (5-shot) %</th>
134
+ <th>MMLU-Pro %</th>
135
+ <th>GSM8K %</th>
136
+ <th>MATH %</th>
137
+ </tr>
138
+ </thead>
139
+ <tbody>
140
+ <tr class="next">
141
+ <td data-label="Model">Next Z1 <em>Version l294</em></td>
142
+ <td data-label="MMLU (5-shot) %"><strong>97.32</strong></td>
143
+ <td data-label="MMLU-Pro %"><strong>94.2</strong></td>
144
+ <td data-label="GSM8K %">97.7</td>
145
+ <td data-label="MATH %">93.21</td>
146
+ </tr>
147
+ <tr class="next">
148
+ <td data-label="Model">Next Z1 <em>Version l294</em> (no tool)</td>
149
+ <td data-label="MMLU (5-shot) %">94.7</td>
150
+ <td data-label="MMLU-Pro %">90.14</td>
151
+ <td data-label="GSM8K %">94.5</td>
152
+ <td data-label="MATH %">88.7</td>
153
+ </tr>
154
+ <tr>
155
+ <td data-label="Model">GPT 5</td>
156
+ <td data-label="MMLU (5-shot) %">92.5</td>
157
+ <td data-label="MMLU-Pro %">87.0</td>
158
+ <td data-label="GSM8K %"><strong>98.4</strong></td>
159
+ <td data-label="MATH %"><strong>96.0</strong></td>
160
+ </tr>
161
+ <tr>
162
+ <td data-label="Model">Claude Opus 4.1 (Thinking)</td>
163
+ <td data-label="MMLU (5-shot) %">~92.0</td>
164
+ <td data-label="MMLU-Pro %">87.8</td>
165
+ <td data-label="GSM8K %">84.7</td>
166
+ <td data-label="MATH %">95.4</td>
167
+ </tr>
168
+ </tbody>
169
+ </table>
170
 
171
  ---
172