Update benchmark leaderboard
Browse files- index.html +73 -1
index.html
CHANGED
|
@@ -89,6 +89,27 @@
|
|
| 89 |
background: #111827; border: 1px solid #1e2a3a;
|
| 90 |
border-radius: 10px; padding: 24px 20px;
|
| 91 |
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 92 |
.footer { margin-top: 20px; font-size: 11px; color: #2d3748; text-align: right; }
|
| 93 |
::-webkit-scrollbar { height: 5px; background: #0d1117; }
|
| 94 |
::-webkit-scrollbar-thumb { background: #2d3748; border-radius: 3px; }
|
|
@@ -119,7 +140,16 @@
|
|
| 119 |
</table>
|
| 120 |
</div>
|
| 121 |
|
| 122 |
-
<p class="section-title">
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 123 |
<p class="subtitle" style="margin-bottom:20px">Weighted Score vs Exact Accuracy — all languages combined, sorted by Weighted Score</p>
|
| 124 |
<div class="chart-wrap">
|
| 125 |
<canvas id="globalChart"></canvas>
|
|
@@ -133,6 +163,7 @@
|
|
| 133 |
// Codes of the benchmark subsets, one entry per key of LANG_COUNTS.
// NOTE(review): the codes are project-specific rather than strict ISO 639-1, and "stack"
// is not a language code at all — presumably a source-code subset; confirm with the data owner.
const ALL_LANGS = ["ar", "az", "be", "bg", "bo", "ca", "cn", "cs", "da", "de", "el", "en", "es", "et", "eu", "fa", "fi", "fr", "gl", "hu", "hv", "is", "it", "ka", "la", "li", "lv", "mk", "mt", "nl", "no", "pl", "pt", "ro", "ru", "sk", "sl", "sq", "sr", "stack", "sv", "tr", "uk"];
|
| 134 |
// Display names keyed by language code; langName() falls back to the upper-cased code
// for any code that has no entry here (e.g. "stack").
// The keys follow the dataset's own codes, which are not always ISO 639-1
// (for instance "bo" is Bosnian, "li" is Lithuanian, "cn" is Chinese, "hv" is Croatian).
const LANG_NAMES = {"af": "Afrikaans", "ar": "Arabic", "az": "Azerbaijani", "be": "Belarusian", "bo": "Bosnian", "bg": "Bulgarian", "bn": "Bengali", "ca": "Catalan", "cs": "Czech", "cn": "Chinese", "cy": "Welsh", "da": "Danish", "de": "German", "el": "Greek", "en": "English", "eo": "Esperanto", "es": "Spanish", "et": "Estonian", "eu": "Basque", "fa": "Persian", "fi": "Finnish", "fr": "French", "ga": "Irish", "gl": "Galician", "gu": "Gujarati", "he": "Hebrew", "hi": "Hindi", "hr": "Croatian", "hu": "Hungarian", "hy": "Armenian", "hv": "Croatian", "id": "Indonesian", "is": "Icelandic", "it": "Italian", "ja": "Japanese", "ka": "Georgian", "kk": "Kazakh", "km": "Khmer", "kn": "Kannada", "ko": "Korean", "la": "Latin", "li": "Lithuanian", "lv": "Latvian", "mk": "Macedonian", "ml": "Malayalam", "mn": "Mongolian", "mr": "Marathi", "ms": "Malay", "mt": "Maltese", "my": "Burmese", "ne": "Nepali", "nl": "Dutch", "no": "Norwegian", "pa": "Punjabi", "pl": "Polish", "pt": "Portuguese", "ro": "Romanian", "ru": "Russian", "si": "Sinhala", "sk": "Slovak", "sl": "Slovenian", "sq": "Albanian", "sr": "Serbian", "sv": "Swedish", "sw": "Swahili", "ta": "Tamil", "te": "Telugu", "th": "Thai", "tl": "Filipino", "tr": "Turkish", "uk": "Ukrainian", "ur": "Urdu", "uz": "Uzbek", "vi": "Vietnamese", "zh": "Chinese", "zu": "Zulu"};
|
| 135 |
// Per-code totals, keyed by the same codes as ALL_LANGS.
// NOTE(review): presumably the number of benchmark texts per language — confirm against the data pipeline.
const LANG_COUNTS = {"ar": 1388, "az": 1395, "be": 1394, "bg": 1359, "bo": 1395, "ca": 1353, "cn": 2086, "cs": 1379, "da": 1384, "de": 688, "el": 1394, "en": 1391, "es": 1319, "et": 1388, "eu": 2087, "fa": 2097, "fi": 1384, "fr": 1379, "gl": 2098, "hu": 1396, "hv": 1396, "is": 1390, "it": 1391, "ka": 1311, "la": 2009, "li": 1393, "lv": 1395, "mk": 1399, "mt": 1397, "nl": 1395, "no": 1399, "pl": 2066, "pt": 1395, "ro": 1390, "ru": 1121, "sk": 1384, "sl": 1388, "sq": 1393, "sr": 1398, "stack": 2041, "sv": 1397, "tr": 1399, "uk": 1370};
|
|
|
|
| 136 |
|
| 137 |
/**
 * Resolve a language code to its display name.
 * @param {string} c - language code used as a key into LANG_NAMES
 * @returns {string} the mapped name, or the code in upper case when no (truthy) name is mapped
 */
function langName(c) {
  const mapped = LANG_NAMES[c];
  if (mapped) {
    return mapped;
  }
  return c.toUpperCase();
}
|
| 138 |
|
|
@@ -267,6 +298,46 @@
|
|
| 267 |
});
|
| 268 |
}
|
| 269 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 270 |
// table
|
| 271 |
function render() {
|
| 272 |
renderChips();
|
|
@@ -334,6 +405,7 @@
|
|
| 334 |
|
| 335 |
render();
|
| 336 |
renderChart();
|
|
|
|
| 337 |
})();
|
| 338 |
</script>
|
| 339 |
</body>
|
|
|
|
| 89 |
background: #111827; border: 1px solid #1e2a3a;
|
| 90 |
border-radius: 10px; padding: 24px 20px;
|
| 91 |
}
|
| 92 |
+
.dist-wrap {
|
| 93 |
+
overflow-x: auto; border-radius: 10px;
|
| 94 |
+
border: 1px solid #1e2a3a; margin-bottom: 16px;
|
| 95 |
+
}
|
| 96 |
+
.dist-wrap table { border-collapse: collapse; width: auto; min-width: 100%; font-size: 12px; }
|
| 97 |
+
.dist-wrap thead tr { background: #111827; border-bottom: 2px solid #1e2a3a; }
|
| 98 |
+
.dist-wrap th {
|
| 99 |
+
padding: 10px 10px; white-space: nowrap; font-size: 10px;
|
| 100 |
+
text-transform: uppercase; letter-spacing: 0.07em; color: #475569; font-weight: 700;
|
| 101 |
+
}
|
| 102 |
+
.dist-wrap th.lang-h { text-align: left; width: 140px; padding-left: 14px; color: #64748b; }
|
| 103 |
+
.dist-wrap th.score-h { width: 70px; text-align: center; }
|
| 104 |
+
.dist-wrap th.total-h { width: 80px; text-align: center; color: #94a3b8; }
|
| 105 |
+
.dist-wrap td { padding: 8px 10px; border-bottom: 1px solid #0f1520; white-space: nowrap; }
|
| 106 |
+
.dist-wrap td.lang-d { padding-left: 14px; color: #cbd5e1; font-weight: 600; font-size: 12px; }
|
| 107 |
+
.dist-wrap td.count-d { text-align: center; font-size: 12px; }
|
| 108 |
+
.dist-wrap td.total-d { text-align: center; font-weight: 700; font-size: 12px; color: #94a3b8; }
|
| 109 |
+
.dist-bar {
|
| 110 |
+
display: inline-block; height: 6px; border-radius: 3px;
|
| 111 |
+
background: #2563eb; vertical-align: middle; margin-left: 4px; opacity: 0.7;
|
| 112 |
+
}
|
| 113 |
.footer { margin-top: 20px; font-size: 11px; color: #2d3748; text-align: right; }
|
| 114 |
::-webkit-scrollbar { height: 5px; background: #0d1117; }
|
| 115 |
::-webkit-scrollbar-thumb { background: #2d3748; border-radius: 3px; }
|
|
|
|
| 140 |
</table>
|
| 141 |
</div>
|
| 142 |
|
| 143 |
+
<p class="section-title">Dataset Distribution</p>
|
| 144 |
+
<p class="subtitle" style="margin-bottom:20px">Number of unique texts per rating score (1–6) for each language</p>
|
| 145 |
+
<div class="dist-wrap">
|
| 146 |
+
<table id="dist-table">
|
| 147 |
+
<thead id="dist-head"></thead>
|
| 148 |
+
<tbody id="dist-body"></tbody>
|
| 149 |
+
</table>
|
| 150 |
+
</div>
|
| 151 |
+
|
| 152 |
+
<p class="section-title" style="margin-top:52px">Global Model Comparison</p>
|
| 153 |
<p class="subtitle" style="margin-bottom:20px">Weighted Score vs Exact Accuracy — all languages combined, sorted by Weighted Score</p>
|
| 154 |
<div class="chart-wrap">
|
| 155 |
<canvas id="globalChart"></canvas>
|
|
|
|
| 163 |
// Codes of the benchmark subsets; renderDist() emits one distribution-table row per entry,
// in this order. Every entry is also a key of LANG_COUNTS and LANG_DIST.
// NOTE(review): the codes are project-specific rather than strict ISO 639-1, and "stack"
// is not a language code at all — presumably a source-code subset; confirm with the data owner.
const ALL_LANGS = ["ar", "az", "be", "bg", "bo", "ca", "cn", "cs", "da", "de", "el", "en", "es", "et", "eu", "fa", "fi", "fr", "gl", "hu", "hv", "is", "it", "ka", "la", "li", "lv", "mk", "mt", "nl", "no", "pl", "pt", "ro", "ru", "sk", "sl", "sq", "sr", "stack", "sv", "tr", "uk"];
|
| 164 |
// Display names keyed by language code; langName() falls back to the upper-cased code
// for any code that has no entry here (e.g. "stack").
// The keys follow the dataset's own codes, which are not always ISO 639-1
// (for instance "bo" is Bosnian, "li" is Lithuanian, "cn" is Chinese, "hv" is Croatian).
const LANG_NAMES = {"af": "Afrikaans", "ar": "Arabic", "az": "Azerbaijani", "be": "Belarusian", "bo": "Bosnian", "bg": "Bulgarian", "bn": "Bengali", "ca": "Catalan", "cs": "Czech", "cn": "Chinese", "cy": "Welsh", "da": "Danish", "de": "German", "el": "Greek", "en": "English", "eo": "Esperanto", "es": "Spanish", "et": "Estonian", "eu": "Basque", "fa": "Persian", "fi": "Finnish", "fr": "French", "ga": "Irish", "gl": "Galician", "gu": "Gujarati", "he": "Hebrew", "hi": "Hindi", "hr": "Croatian", "hu": "Hungarian", "hy": "Armenian", "hv": "Croatian", "id": "Indonesian", "is": "Icelandic", "it": "Italian", "ja": "Japanese", "ka": "Georgian", "kk": "Kazakh", "km": "Khmer", "kn": "Kannada", "ko": "Korean", "la": "Latin", "li": "Lithuanian", "lv": "Latvian", "mk": "Macedonian", "ml": "Malayalam", "mn": "Mongolian", "mr": "Marathi", "ms": "Malay", "mt": "Maltese", "my": "Burmese", "ne": "Nepali", "nl": "Dutch", "no": "Norwegian", "pa": "Punjabi", "pl": "Polish", "pt": "Portuguese", "ro": "Romanian", "ru": "Russian", "si": "Sinhala", "sk": "Slovak", "sl": "Slovenian", "sq": "Albanian", "sr": "Serbian", "sv": "Swedish", "sw": "Swahili", "ta": "Tamil", "te": "Telugu", "th": "Thai", "tl": "Filipino", "tr": "Turkish", "uk": "Ukrainian", "ur": "Urdu", "uz": "Uzbek", "vi": "Vietnamese", "zh": "Chinese", "zu": "Zulu"};
|
| 165 |
// Per-code totals, keyed by the same codes as ALL_LANGS.
// Spot-checked against LANG_DIST: each value equals the sum of that code's per-rating counts
// (e.g. "de": 346 + 342 = 688, "ru": 348 + 349 + 349 + 75 = 1121).
const LANG_COUNTS = {"ar": 1388, "az": 1395, "be": 1394, "bg": 1359, "bo": 1395, "ca": 1353, "cn": 2086, "cs": 1379, "da": 1384, "de": 688, "el": 1394, "en": 1391, "es": 1319, "et": 1388, "eu": 2087, "fa": 2097, "fi": 1384, "fr": 1379, "gl": 2098, "hu": 1396, "hv": 1396, "is": 1390, "it": 1391, "ka": 1311, "la": 2009, "li": 1393, "lv": 1395, "mk": 1399, "mt": 1397, "nl": 1395, "no": 1399, "pl": 2066, "pt": 1395, "ro": 1390, "ru": 1121, "sk": 1384, "sl": 1388, "sq": 1393, "sr": 1398, "stack": 2041, "sv": 1397, "tr": 1399, "uk": 1370};
|
| 166 |
+
// Per-code distribution of texts over rating scores: { code: { "<rating>": count } }.
// Ratings are the string keys "1".."6"; a rating with no texts is simply absent
// (most codes only have 1, 2, 5 and 6), and renderDist() shows an em dash for it.
const LANG_DIST = {"ar": {"1": 347, "2": 345, "5": 347, "6": 349}, "az": {"1": 349, "2": 349, "5": 349, "6": 348}, "be": {"1": 347, "2": 348, "5": 350, "6": 349}, "bg": {"1": 349, "2": 349, "5": 349, "6": 312}, "bo": {"1": 350, "2": 349, "5": 349, "6": 347}, "ca": {"1": 322, "2": 348, "5": 347, "6": 336}, "cn": {"1": 342, "2": 349, "3": 348, "4": 349, "5": 349, "6": 349}, "cs": {"1": 341, "2": 344, "5": 348, "6": 346}, "da": {"1": 348, "2": 346, "5": 343, "6": 347}, "de": {"1": 346, "5": 342}, "el": {"1": 349, "2": 347, "5": 350, "6": 348}, "en": {"1": 347, "3": 347, "4": 350, "5": 347}, "es": {"1": 347, "2": 346, "5": 347, "6": 279}, "et": {"1": 347, "2": 347, "5": 346, "6": 348}, "eu": {"1": 345, "2": 348, "3": 347, "4": 348, "5": 349, "6": 350}, "fa": {"1": 349, "2": 350, "3": 349, "4": 350, "5": 349, "6": 350}, "fi": {"1": 344, "2": 347, "5": 346, "6": 347}, "fr": {"1": 349, "2": 348, "5": 350, "6": 332}, "gl": {"1": 350, "2": 349, "3": 350, "4": 349, "5": 350, "6": 350}, "hu": {"1": 350, "2": 349, "5": 347, "6": 350}, "hv": {"1": 350, "2": 348, "5": 348, "6": 350}, "is": {"1": 346, "2": 348, "5": 349, "6": 347}, "it": {"1": 346, "2": 349, "5": 348, "6": 348}, "ka": {"1": 265, "2": 349, "5": 348, "6": 349}, "la": {"1": 350, "2": 344, "3": 267, "4": 350, "5": 349, "6": 349}, "li": {"1": 347, "2": 350, "5": 348, "6": 348}, "lv": {"1": 349, "2": 350, "5": 348, "6": 348}, "mk": {"1": 350, "2": 350, "5": 349, "6": 350}, "mt": {"1": 350, "2": 348, "5": 349, "6": 350}, "nl": {"1": 348, "2": 350, "5": 349, "6": 348}, "no": {"1": 350, "2": 350, "5": 349, "6": 350}, "pl": {"1": 348, "2": 350, "3": 350, "4": 349, "5": 348, "6": 321}, "pt": {"1": 348, "2": 349, "5": 349, "6": 349}, "ro": {"1": 348, "2": 346, "5": 347, "6": 349}, "ru": {"1": 348, "2": 349, "5": 349, "6": 75}, "sk": {"1": 346, "2": 348, "5": 346, "6": 344}, "sl": {"1": 347, "2": 350, "5": 344, "6": 347}, "sq": {"1": 347, "2": 348, "5": 348, "6": 350}, "sr": {"1": 349, "2": 350, "5": 350, "6": 349}, "stack": 
{"1": 298, "2": 347, "3": 349, "4": 349, "5": 349, "6": 349}, "sv": {"1": 349, "2": 350, "5": 348, "6": 350}, "tr": {"1": 349, "2": 350, "5": 350, "6": 350}, "uk": {"1": 350, "2": 350, "5": 349, "6": 321}};
|
| 167 |
|
| 168 |
/**
 * Resolve a language code to its display name.
 * @param {string} c - language code used as a key into LANG_NAMES
 * @returns {string} the mapped name, or the code in upper case when no (truthy) name is mapped
 */
function langName(c) {
  const mapped = LANG_NAMES[c];
  if (mapped) {
    return mapped;
  }
  return c.toUpperCase();
}
|
| 169 |
|
|
|
|
| 298 |
});
|
| 299 |
}
|
| 300 |
|
| 301 |
+
// distribution table
|
| 302 |
+
/**
 * Render the "Dataset Distribution" table.
 *
 * Builds one header row (Language, Rating 1..6, Total texts) into #dist-head and one
 * body row per entry of ALL_LANGS into #dist-body, reading per-rating counts from
 * LANG_DIST. Each non-zero cell shows the count followed by a small bar whose width is
 * proportional to the largest single cell in the whole table; empty cells show an em dash.
 *
 * Does nothing when either target element is missing, so the page is never left with a
 * header but no body (or the reverse).
 *
 * @returns {void}
 */
function renderDist() {
  const head = document.getElementById('dist-head');
  const body = document.getElementById('dist-body');
  if (!head || !body) return;

  const scores = [1, 2, 3, 4, 5, 6];
  const langs = [...ALL_LANGS];
  // Width in px of the bar drawn for the largest cell; all other bars scale down from it.
  const barMaxPx = 48;

  // Largest count in any (language, rating) cell — the common scale for every bar.
  const maxCount = langs.reduce((tableMax, lang) => {
    const d = LANG_DIST[lang] || {};
    return scores.reduce((rowMax, s) => Math.max(rowMax, d[s] || 0), tableMax);
  }, 0);

  // header
  head.innerHTML = `<tr>
    <th class="lang-h">Language</th>
    ${scores.map(s => `<th class="score-h">Rating ${s}</th>`).join('')}
    <th class="total-h">Total texts</th>
  </tr>`;

  // body
  body.innerHTML = langs.map(lang => {
    // A code without a LANG_DIST entry still gets a row: all dashes, total 0.
    const d = LANG_DIST[lang] || {};
    const total = Object.values(d).reduce((a, b) => a + b, 0);
    const cells = scores.map(s => {
      const n = d[s] || 0;
      const bar = maxCount > 0 ? Math.round((n / maxCount) * barMaxPx) : 0;
      return `<td class="count-d">
        ${n > 0 ? `${n}<span class="dist-bar" style="width:${bar}px"></span>` : '<span style="color:#2d3748">—</span>'}
      </td>`;
    }).join('');
    return `<tr>
      <td class="lang-d">${langName(lang)}</td>
      ${cells}
      <td class="total-d">${total.toLocaleString()}</td>
    </tr>`;
  }).join('');
}
|
| 340 |
+
|
| 341 |
// table
|
| 342 |
function render() {
|
| 343 |
renderChips();
|
|
|
|
| 405 |
|
| 406 |
render();
|
| 407 |
renderChart();
|
| 408 |
+
renderDist();
|
| 409 |
})();
|
| 410 |
</script>
|
| 411 |
</body>
|