Upload index.html
Browse files- index.html +111 -7
index.html
CHANGED
|
@@ -4,6 +4,7 @@
|
|
| 4 |
<meta charset="UTF-8">
|
| 5 |
<meta name="viewport" content="width=device-width, initial-scale=1.0">
|
| 6 |
<title>Tiny-ML Leaderboard</title>
|
|
|
|
| 7 |
<style>
|
| 8 |
:root {
|
| 9 |
--bg: #0d1117;
|
|
@@ -13,7 +14,8 @@
|
|
| 13 |
--accent: #58a6ff;
|
| 14 |
--green: #3fb950;
|
| 15 |
--orange: #d29922;
|
| 16 |
-
--
|
|
|
|
| 17 |
}
|
| 18 |
* { margin: 0; padding: 0; box-sizing: border-box; }
|
| 19 |
body { font-family: -apple-system,BlinkMacSystemFont,'Segoe UI',Helvetica,Arial,sans-serif; background: var(--bg); color: var(--text); padding: 2rem; }
|
|
@@ -22,20 +24,27 @@
|
|
| 22 |
.subtitle { color: #8b949e; margin-bottom: 2rem; font-size: .95rem; }
|
| 23 |
.note { background: var(--card); border: 1px solid var(--border); border-radius: 8px; padding: 1rem; margin-bottom: 2rem; font-size: .9rem; line-height: 1.5; }
|
| 24 |
.note a { color: var(--accent); }
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 25 |
table { width: 100%; border-collapse: collapse; font-size: .85rem; }
|
| 26 |
th { background: var(--card); padding: .75rem .5rem; text-align: center; border: 1px solid var(--border); font-weight: 600; white-space: nowrap; }
|
| 27 |
td { padding: .6rem .5rem; text-align: center; border: 1px solid var(--border); }
|
| 28 |
td:first-child, th:first-child { text-align: left; padding-left: 1rem; }
|
| 29 |
tr:hover td { background: rgba(88,166,255,.05); }
|
| 30 |
-
.group-row td { background: var(--bg); font-weight: 700; font-size: .8rem; text-transform: uppercase; letter-spacing: .08em; padding: .5rem; border-bottom: 2px solid var(--accent); color: var(--accent); }
|
| 31 |
.org-tag { display: inline-block; padding: .15rem .5rem; border-radius: 4px; font-size: .75rem; font-weight: 600; }
|
| 32 |
-
.org-compactai { background: #1f6feb33; color:
|
| 33 |
-
.org-supralabs { background: #3fb95033; color:
|
| 34 |
.best { color: var(--green); font-weight: 700; }
|
| 35 |
.na { color: #484f58; font-style: italic; }
|
| 36 |
.links a { color: var(--accent); text-decoration: none; }
|
| 37 |
.links a:hover { text-decoration: underline; }
|
| 38 |
-
.section-title { font-size: 1.2rem; margin: 2rem 0 1rem; padding-bottom: .5rem; border-bottom: 1px solid var(--border); }
|
| 39 |
footer { margin-top: 3rem; padding-top: 1.5rem; border-top: 1px solid var(--border); font-size: .8rem; color: #484f58; text-align: center; }
|
| 40 |
footer a { color: var(--accent); }
|
| 41 |
.methodology { margin-top: 2rem; }
|
|
@@ -43,6 +52,7 @@
|
|
| 43 |
.methodology p { font-size: .85rem; line-height: 1.6; color: #8b949e; }
|
| 44 |
@media (max-width: 768px) {
|
| 45 |
body { padding: 1rem; }
|
|
|
|
| 46 |
table { font-size: .75rem; }
|
| 47 |
th, td { padding: .4rem .3rem; }
|
| 48 |
}
|
|
@@ -61,7 +71,29 @@
|
|
| 61 |
<small>Also see the <a href="https://lh-tech.de/ai/compare-tiny-models.html" target="_blank">independent comparison page</a> by LH-Tech-AI.</small>
|
| 62 |
</div>
|
| 63 |
|
| 64 |
-
<h2 class="section-title">Benchmark
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 65 |
|
| 66 |
<table>
|
| 67 |
<thead>
|
|
@@ -242,7 +274,6 @@
|
|
| 242 |
</tbody>
|
| 243 |
</table>
|
| 244 |
|
| 245 |
-
|
| 246 |
<div class="methodology" style="margin-top:1.5rem">
|
| 247 |
<h3>Regarding the claim that Glint-1.3 is a "fake model with fake benchmarks"</h3>
|
| 248 |
|
|
@@ -333,5 +364,78 @@ All benchmark data is self-reported by model authors unless otherwise noted.</p>
|
|
| 333 |
</footer>
|
| 334 |
|
| 335 |
</div>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 336 |
</body>
|
| 337 |
</html>
|
|
|
|
| 4 |
<meta charset="UTF-8">
|
| 5 |
<meta name="viewport" content="width=device-width, initial-scale=1.0">
|
| 6 |
<title>Tiny-ML Leaderboard</title>
|
| 7 |
+
<script src="https://cdn.jsdelivr.net/npm/chart.js@4"></script>
|
| 8 |
<style>
|
| 9 |
:root {
|
| 10 |
--bg: #0d1117;
|
|
|
|
| 14 |
--accent: #58a6ff;
|
| 15 |
--green: #3fb950;
|
| 16 |
--orange: #d29922;
|
| 17 |
+
--compactai: #58a6ff;
|
| 18 |
+
--supralabs: #3fb950;
|
| 19 |
}
|
| 20 |
* { margin: 0; padding: 0; box-sizing: border-box; }
|
| 21 |
body { font-family: -apple-system,BlinkMacSystemFont,'Segoe UI',Helvetica,Arial,sans-serif; background: var(--bg); color: var(--text); padding: 2rem; }
|
|
|
|
| 24 |
.subtitle { color: #8b949e; margin-bottom: 2rem; font-size: .95rem; }
|
| 25 |
.note { background: var(--card); border: 1px solid var(--border); border-radius: 8px; padding: 1rem; margin-bottom: 2rem; font-size: .9rem; line-height: 1.5; }
|
| 26 |
.note a { color: var(--accent); }
|
| 27 |
+
.section-title { font-size: 1.2rem; margin: 2rem 0 1rem; padding-bottom: .5rem; border-bottom: 1px solid var(--border); }
|
| 28 |
+
.chart-grid { display: grid; grid-template-columns: 1fr 1fr; gap: 1.5rem; margin-bottom: 2rem; }
|
| 29 |
+
.chart-card { background: var(--card); border: 1px solid var(--border); border-radius: 8px; padding: 1rem; }
|
| 30 |
+
.chart-card.full { grid-column: 1 / -1; }
|
| 31 |
+
.chart-card h3 { font-size: .95rem; margin-bottom: .75rem; color: var(--text); }
|
| 32 |
+
.chart-card canvas { max-height: 360px; }
|
| 33 |
+
.legend { display: flex; gap: 1.5rem; margin-bottom: .75rem; font-size: .8rem; }
|
| 34 |
+
.legend-item { display: flex; align-items: center; gap: .4rem; }
|
| 35 |
+
.legend-dot { width: 10px; height: 10px; border-radius: 50%; }
|
| 36 |
table { width: 100%; border-collapse: collapse; font-size: .85rem; }
|
| 37 |
th { background: var(--card); padding: .75rem .5rem; text-align: center; border: 1px solid var(--border); font-weight: 600; white-space: nowrap; }
|
| 38 |
td { padding: .6rem .5rem; text-align: center; border: 1px solid var(--border); }
|
| 39 |
td:first-child, th:first-child { text-align: left; padding-left: 1rem; }
|
| 40 |
tr:hover td { background: rgba(88,166,255,.05); }
|
|
|
|
| 41 |
.org-tag { display: inline-block; padding: .15rem .5rem; border-radius: 4px; font-size: .75rem; font-weight: 600; }
|
| 42 |
+
.org-compactai { background: #1f6feb33; color: var(--compactai); }
|
| 43 |
+
.org-supralabs { background: #3fb95033; color: var(--supralabs); }
|
| 44 |
.best { color: var(--green); font-weight: 700; }
|
| 45 |
.na { color: #484f58; font-style: italic; }
|
| 46 |
.links a { color: var(--accent); text-decoration: none; }
|
| 47 |
.links a:hover { text-decoration: underline; }
|
|
|
|
| 48 |
footer { margin-top: 3rem; padding-top: 1.5rem; border-top: 1px solid var(--border); font-size: .8rem; color: #484f58; text-align: center; }
|
| 49 |
footer a { color: var(--accent); }
|
| 50 |
.methodology { margin-top: 2rem; }
|
|
|
|
| 52 |
.methodology p { font-size: .85rem; line-height: 1.6; color: #8b949e; }
|
| 53 |
@media (max-width: 768px) {
|
| 54 |
body { padding: 1rem; }
|
| 55 |
+
.chart-grid { grid-template-columns: 1fr; }
|
| 56 |
table { font-size: .75rem; }
|
| 57 |
th, td { padding: .4rem .3rem; }
|
| 58 |
}
|
|
|
|
| 71 |
<small>Also see the <a href="https://lh-tech.de/ai/compare-tiny-models.html" target="_blank">independent comparison page</a> by LH-Tech-AI.</small>
|
| 72 |
</div>
|
| 73 |
|
| 74 |
+
<h2 class="section-title">Benchmark Overview</h2>
|
| 75 |
+
|
| 76 |
+
<div class="legend">
|
| 77 |
+
<span class="legend-item"><span class="legend-dot" style="background:var(--compactai)"></span> CompactAI</span>
|
| 78 |
+
<span class="legend-item"><span class="legend-dot" style="background:var(--supralabs)"></span> SupraLabs</span>
|
| 79 |
+
</div>
|
| 80 |
+
|
| 81 |
+
<div class="chart-grid">
|
| 82 |
+
<div class="chart-card">
|
| 83 |
+
<h3>BLiMP ↑ (higher is better)</h3>
|
| 84 |
+
<canvas id="blimpChart"></canvas>
|
| 85 |
+
</div>
|
| 86 |
+
<div class="chart-card">
|
| 87 |
+
<h3>ARC-Easy ↑ (higher is better)</h3>
|
| 88 |
+
<canvas id="arcChart"></canvas>
|
| 89 |
+
</div>
|
| 90 |
+
<div class="chart-card full">
|
| 91 |
+
<h3>WikiText-2 ↓ (lower is better)</h3>
|
| 92 |
+
<canvas id="wikiChart"></canvas>
|
| 93 |
+
</div>
|
| 94 |
+
</div>
|
| 95 |
+
|
| 96 |
+
<h2 class="section-title">Detailed Results</h2>
|
| 97 |
|
| 98 |
<table>
|
| 99 |
<thead>
|
|
|
|
| 274 |
</tbody>
|
| 275 |
</table>
|
| 276 |
|
|
|
|
| 277 |
<div class="methodology" style="margin-top:1.5rem">
|
| 278 |
<h3>Regarding the claim that Glint-1.3 is a "fake model with fake benchmarks"</h3>
|
| 279 |
|
|
|
|
| 364 |
</footer>
|
| 365 |
|
| 366 |
</div>
|
| 367 |
+
<script>
|
| 368 |
+
const models = [
|
| 369 |
+
{ name: 'Supra-50M-Instruct', org: 'supralabs', blimp: 76.3, arc: 52.2, wiki: null },
|
| 370 |
+
{ name: 'Glint-1.3 (merged)', org: 'compactai', blimp: 68.7, arc: 32.5, wiki: 3.08 },
|
| 371 |
+
{ name: 'Supra-Mini-v5', org: 'supralabs', blimp: 63.5, arc: 34.4, wiki: 2.66 },
|
| 372 |
+
{ name: 'Glint-1', org: 'compactai', blimp: 61.2, arc: 32.0, wiki: 4.07 },
|
| 373 |
+
{ name: 'Supra-Mini-v4', org: 'supralabs', blimp: 60.7, arc: 31.5, wiki: 3.17 },
|
| 374 |
+
{ name: 'Glint-0.4', org: 'compactai', blimp: 58.5, arc: 31.0, wiki: 5.24 },
|
| 375 |
+
{ name: 'Supra-Mini-v3', org: 'supralabs', blimp: 55.3, arc: 27.3, wiki: 4.49 },
|
| 376 |
+
{ name: 'Supra-Mini-v2', org: 'supralabs', blimp: 53.5, arc: 26.8, wiki: 7.79 },
|
| 377 |
+
{ name: 'Glint-0.2', org: 'compactai', blimp: 49.8, arc: 27.0, wiki: null },
|
| 378 |
+
{ name: 'Glint-0.3', org: 'compactai', blimp: 47.3, arc: 25.5, wiki: null },
|
| 379 |
+
{ name: 'Glint-0.1', org: 'compactai', blimp: 46.7, arc: 21.0, wiki: null },
|
| 380 |
+
];
|
| 381 |
+
|
| 382 |
+
const colorMap = { compactai: '#58a6ff', supralabs: '#3fb950' };
|
| 383 |
+
const bgMap = { compactai: 'rgba(88,166,255,0.7)', supralabs: 'rgba(63,185,80,0.7)' };
|
| 384 |
+
|
| 385 |
+
function buildChart(canvasId, metric, label, reverse) {
|
| 386 |
+
const m = metric === 'wiki' ? 'wiki' : metric;
|
| 387 |
+
const fmt = metric === 'wiki' ? v => v.toFixed(2) : v => v.toFixed(1) + '%';
|
| 388 |
+
const sorted = models
|
| 389 |
+
.filter(d => d[metric] !== null)
|
| 390 |
+
.sort((a, b) => reverse ? a[metric] - b[metric] : b[metric] - a[metric]);
|
| 391 |
+
|
| 392 |
+
new Chart(document.getElementById(canvasId), {
|
| 393 |
+
type: 'bar',
|
| 394 |
+
data: {
|
| 395 |
+
labels: sorted.map(d => d.name),
|
| 396 |
+
datasets: [{
|
| 397 |
+
data: sorted.map(d => d[metric]),
|
| 398 |
+
backgroundColor: sorted.map(d => bgMap[d.org]),
|
| 399 |
+
borderColor: sorted.map(d => colorMap[d.org]),
|
| 400 |
+
borderWidth: 1,
|
| 401 |
+
borderRadius: 3,
|
| 402 |
+
}]
|
| 403 |
+
},
|
| 404 |
+
options: {
|
| 405 |
+
indexAxis: 'y',
|
| 406 |
+
responsive: true,
|
| 407 |
+
maintainAspectRatio: true,
|
| 408 |
+
plugins: {
|
| 409 |
+
legend: { display: false },
|
| 410 |
+
tooltip: {
|
| 411 |
+
callbacks: {
|
| 412 |
+
label: ctx => fmt(ctx.parsed.x)
|
| 413 |
+
}
|
| 414 |
+
}
|
| 415 |
+
},
|
| 416 |
+
scales: {
|
| 417 |
+
x: {
|
| 418 |
+
beginAtZero: true,
|
| 419 |
+
grid: { color: 'rgba(255,255,255,0.06)' },
|
| 420 |
+
ticks: { color: '#8b949e', callback: v => metric === 'wiki' ? v.toFixed(1) : v + '%' }
|
| 421 |
+
},
|
| 422 |
+
y: {
|
| 423 |
+
grid: { display: false },
|
| 424 |
+
ticks: {
|
| 425 |
+
color: '#c9d1d9',
|
| 426 |
+
font: { size: 11 },
|
| 427 |
+
autoSkip: false,
|
| 428 |
+
callback: label => label.length > 18 ? label.slice(0, 17) + '…' : label
|
| 429 |
+
}
|
| 430 |
+
}
|
| 431 |
+
}
|
| 432 |
+
}
|
| 433 |
+
});
|
| 434 |
+
}
|
| 435 |
+
|
| 436 |
+
buildChart('blimpChart', 'blimp', 'BLiMP Accuracy', false);
|
| 437 |
+
buildChart('arcChart', 'arc', 'ARC-Easy Accuracy', false);
|
| 438 |
+
buildChart('wikiChart', 'wiki', 'WikiText-2 Perplexity', true);
|
| 439 |
+
</script>
|
| 440 |
</body>
|
| 441 |
</html>
|