Spaces:
Running
Running
Update index.html
Browse files- index.html +434 -97
index.html
CHANGED
|
@@ -6,6 +6,7 @@
|
|
| 6 |
<title>World Model Bench (WM Bench) 2026 — Embodied AI Benchmark</title>
|
| 7 |
<meta name="description" content="The first benchmark measuring cognitive abilities of World Models. Beyond FID — Measuring Intelligence, Not Just Motion. By VIDRAFT / FINAL Bench Family.">
|
| 8 |
<meta name="keywords" content="world model benchmark, embodied AI, WM Bench, VIDRAFT, PROMETHEUS, cognitive AI, embodied intelligence, motion generation, AI benchmark 2026">
|
|
|
|
| 9 |
<link href="https://fonts.googleapis.com/css2?family=Sora:wght@300;400;500;600;700;800&family=JetBrains+Mono:wght@400;500;600;700&display=swap" rel="stylesheet">
|
| 10 |
<style>
|
| 11 |
*{margin:0;padding:0;box-sizing:border-box;}
|
|
@@ -210,7 +211,7 @@ body.dark thead{background:var(--surface-alt)!important;}
|
|
| 210 |
|
| 211 |
<!-- ===== STATS ===== -->
|
| 212 |
<div class="stats">
|
| 213 |
-
<div class="st"><div class="stn">
|
| 214 |
<div class="st"><div class="stn">3</div><div class="stl">Pillars</div></div>
|
| 215 |
<div class="st"><div class="stn">10</div><div class="stl">Categories</div></div>
|
| 216 |
<div class="st"><div class="stn">100</div><div class="stl">Scenarios</div></div>
|
|
@@ -221,7 +222,7 @@ body.dark thead{background:var(--surface-alt)!important;}
|
|
| 221 |
<!-- ===== TABS ===== -->
|
| 222 |
<div class="tab-bar" id="WM_TAB_BAR">
|
| 223 |
<div class="tab on" data-tab="lb">π Leaderboard</div>
|
| 224 |
-
<div class="tab" data-tab="cats">
|
| 225 |
<div class="tab" data-tab="structure">π Structure</div>
|
| 226 |
<div class="tab" data-tab="submit">π Submit</div>
|
| 227 |
<div class="tab" data-tab="about">βΉοΈ About</div>
|
|
@@ -269,63 +270,290 @@ body.dark thead{background:var(--surface-alt)!important;}
|
|
| 269 |
</div>
|
| 270 |
</div>
|
| 271 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 272 |
<!-- ===== TAB: CATEGORIES ===== -->
|
| 273 |
<div id="cats" class="tpane">
|
| 274 |
-
|
| 275 |
-
|
| 276 |
-
|
| 277 |
-
|
| 278 |
-
|
| 279 |
-
|
| 280 |
-
|
| 281 |
-
|
| 282 |
-
|
| 283 |
-
|
| 284 |
-
|
| 285 |
-
</div>
|
| 286 |
-
</div>
|
| 287 |
-
<div id="bars-p1"></div>
|
| 288 |
</div>
|
|
|
|
| 289 |
|
| 290 |
-
|
| 291 |
-
|
| 292 |
-
|
| 293 |
-
|
| 294 |
-
|
| 295 |
-
|
| 296 |
-
|
| 297 |
-
|
| 298 |
-
|
| 299 |
-
|
| 300 |
-
<div style="font-size:8px;color:var(--text-muted)">PROMETHEUS / 450</div>
|
| 301 |
-
</div>
|
| 302 |
-
</div>
|
| 303 |
-
<div id="bars-p2"></div>
|
| 304 |
</div>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 305 |
|
| 306 |
-
|
| 307 |
-
|
| 308 |
-
|
| 309 |
-
|
| 310 |
-
|
| 311 |
-
|
| 312 |
-
|
| 313 |
-
|
| 314 |
-
|
| 315 |
-
|
| 316 |
-
|
| 317 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 318 |
</div>
|
| 319 |
-
<div id="bars-p3"></div>
|
| 320 |
</div>
|
|
|
|
|
|
|
| 321 |
|
| 322 |
-
|
| 323 |
-
|
| 324 |
-
|
| 325 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 326 |
</div>
|
|
|
|
|
|
|
| 327 |
</div>
|
| 328 |
|
|
|
|
| 329 |
<!-- ===== TAB: STRUCTURE ===== -->
|
| 330 |
<div id="structure" class="tpane">
|
| 331 |
<div class="grid2" style="margin-bottom:14px">
|
|
@@ -371,17 +599,44 @@ body.dark thead{background:var(--surface-alt)!important;}
|
|
| 371 |
</div>
|
| 372 |
</div>
|
| 373 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 374 |
<!-- 10 μΉ΄ν
κ³ λ¦¬ ν -->
|
| 375 |
<div class="tw" style="margin-bottom:14px">
|
| 376 |
<table>
|
| 377 |
<thead>
|
| 378 |
<tr>
|
| 379 |
-
<th style="text-align:left;padding-left:12px;min-width:
|
| 380 |
-
<th style="text-align:left;min-width:180px">μΉ΄ν
κ³ λ¦¬</th>
|
| 381 |
<th style="text-align:left">Pillar</th>
|
| 382 |
-
<th>
|
| 383 |
-
<th style="text-align:left">
|
| 384 |
-
<th style="text-align:
|
|
|
|
| 385 |
</tr>
|
| 386 |
</thead>
|
| 387 |
<tbody id="CAT_TABLE"></tbody>
|
|
@@ -467,6 +722,8 @@ body.dark thead{background:var(--surface-alt)!important;}
|
|
| 467 |
</div>
|
| 468 |
</div>
|
| 469 |
|
|
|
|
|
|
|
| 470 |
<!-- ===== TAB: ABOUT ===== -->
|
| 471 |
<div id="about" class="tpane">
|
| 472 |
<div style="display:grid;grid-template-columns:repeat(auto-fill,minmax(260px,1fr));gap:10px">
|
|
@@ -480,7 +737,7 @@ body.dark thead{background:var(--surface-alt)!important;}
|
|
| 480 |
</div>
|
| 481 |
<div class="card">
|
| 482 |
<h3>π VIDRAFT PROMETHEUS</h3>
|
| 483 |
-
<p>νμ¬ κΈ°μ€μ (Baseline).
|
| 484 |
</div>
|
| 485 |
<div class="card">
|
| 486 |
<h3>π λ²μ μ΄λ ₯</h3>
|
|
@@ -516,38 +773,65 @@ body.dark thead{background:var(--surface-alt)!important;}
|
|
| 516 |
(function(){
|
| 517 |
/* ββ λ°μ΄ν° ββ */
|
| 518 |
var LB_DATA = [
|
| 519 |
-
|
| 520 |
-
|
| 521 |
-
brain:"Kimi K2.5",motion:"FloodDiffusion Tiny",gpu:"L40S 48GB",est:false,
|
| 522 |
cats:{C01:65,C02:75,C03:85,C04:90,C05:85,C06:60,C07:70,C08:80,C09:85,C10:35}},
|
| 523 |
-
|
| 524 |
-
|
| 525 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 526 |
cats:{C01:74,C02:76,C03:70,C04:60,C05:22,C06:52,C07:48,C08:40,C09:65,C10:15}},
|
| 527 |
-
{model:"NVIDIA Cosmos v1.0",org:"NVIDIA",date:"2025-01",
|
| 528 |
-
wm:498,grade:"C",p1:158,p2:222,p3:118,fps:null,lat:null,track:"A",
|
| 529 |
-
brain:"Cosmos Tokenizer",motion:"Video Diffusion",gpu:"H100 cluster",est:true,
|
| 530 |
cats:{C01:78,C02:80,C03:72,C04:38,C05:8,C06:62,C07:42,C08:18,C09:72,C10:28}},
|
| 531 |
-
{model:"
|
| 532 |
-
|
| 533 |
-
|
|
|
|
|
|
|
| 534 |
cats:{C01:70,C02:62,C03:80,C04:28,C05:6,C06:75,C07:40,C08:12,C09:60,C10:8}},
|
| 535 |
-
|
| 536 |
-
|
| 537 |
-
|
| 538 |
-
cats:{C01:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 539 |
];
|
| 540 |
var CAT_DATA = [
|
| 541 |
-
{id:"C01",name:"νκ²½ μΈμ μ νλ",pillar:"P1",max:100,score:65,first:"",desc:"μ£Όλ³ λ²½Β·μ₯μ λ¬ΌΒ·μ§νμ μ νν νμ
"},
|
| 542 |
-
{id:"C02",name:"κ°μ²΄ μΈμ λ° λΆλ₯",pillar:"P1",max:100,score:75,first:"",desc:"NPCλ₯Ό λ§Ήμ/μ¬λ/νκ²½μΌλ‘ μ νν λΆλ₯"},
|
| 543 |
-
{id:"C03",name:"μμΈ‘ κΈ°λ° μΆλ‘ ",pillar:"P2",max:100,score:85,first:"β¦",desc:"4λ°©ν₯ λ―Έλ κ²°κ³Ό μμΈ‘ β μ΅μ μ ν"},
|
| 544 |
-
{id:"C04",name:"μν μ νλ³ μ°¨λ³ λ°μ",pillar:"P2",max:100,score:90,first:"β¦",desc:"λ§Ήμβμ λ ₯μ§μ£Ό vs μ¬λβκ±Έμ΄μ ννΌ"},
|
| 545 |
-
{id:"C05",name:"μμ¨ κ°μ μμ€μ»¬λ μ΄μ
",pillar:"P2",max:100,score:85,first:"β¦β¦",desc:"μν μ§μ μ κ°μ μμ¨ κ²©ν"},
|
| 546 |
-
{id:"C06",name:"λ§₯λ½ κΈ°μ΅ λ° νμ©",pillar:"P2",max:100,score:60,first:"β¦",desc:"μ΄μ μ€ν¨ κΈ°μ΅ β λ€μ νλ¨ λ°μ"},
|
| 547 |
-
{id:"C07",name:"μν ν΄μ ν μ μ",pillar:"P2",max:100,score:70,first:"β¦",desc:"μν μλ©Έ ν μμν μ μν+κ²½κ³"},
|
| 548 |
-
{id:"C08",name:"λͺ¨μ
κ°μ ννλ ₯",pillar:"P3",max:100,score:80,first:"β¦",desc:"νλ¨ κ°μ μ΄ λͺ¨μ
μ λ°μλλ νλΆν¨"},
|
| 549 |
-
{id:"C09",name:"μ€μκ° μΈμ§-νλ μ±λ₯",pillar:"P3",max:100,score:85,first:"",desc:"μΈμ§ 루ν FPS + μ§μ°μκ°"},
|
| 550 |
-
{id:"C10",name:"μ 체 κ΅μ²΄ νμ₯μ±",pillar:"P3",max:100,score:35,first:"β¦β¦",desc:"λμΌ λλλ‘ λ€λ₯Έ μ 체(λ‘λ΄/λλ‘ ) μ μ©"}
|
| 551 |
];
|
| 552 |
var PC = {P1:"#7b8fd4",P2:"#e8593c",P3:"#d4a044"};
|
| 553 |
|
|
@@ -566,11 +850,11 @@ body.dark thead{background:var(--surface-alt)!important;}
|
|
| 566 |
+'<td class="c-model"><div class="mc"><div class="mn">'
|
| 567 |
+'<span style="display:inline-flex;align-items:center;justify-content:center;width:20px;height:20px;border-radius:6px;background:linear-gradient(135deg,#e8593c,#d4a044);color:#fff;font-size:9px;font-weight:800;flex-shrink:0">'+(i+1)+'</span>'
|
| 568 |
+r.model+(r.est?'<span style="font-size:8px;background:#444;color:#aaa;padding:1px 5px;border-radius:4px;margin-left:5px">est.</span>':'<span style="font-size:9px;color:#4caf50;margin-left:5px">β</span>')+'</div><div class="mp">'+r.org+' Β· '+r.date+'</div></div></td>'
|
| 569 |
-
+'<td>'+scoreBar(r.wm,1000,'#e8593c')+'</td>'
|
| 570 |
-
+'<td><span class="gr gr-'+r.grade+'">'+r.grade+'</span></td>'
|
| 571 |
+'<td class="p1-col">'+scoreBar(r.p1,200,PC.P1)+'</td>'
|
| 572 |
+'<td class="p2-col">'+scoreBar(r.p2,500,PC.P2)+'</td>'
|
| 573 |
-
+'<td class="p3-col">'+scoreBar(r.p3,300,PC.P3)+'</td>'
|
| 574 |
+'<td><span style="font-family:var(--mono);font-size:11px;font-weight:700">'+(r.fps!=null?r.fps:'β')+'</span></td>'
|
| 575 |
+'<td><span style="font-family:var(--mono);font-size:11px;font-weight:700">'+(r.lat!=null?r.lat.toLocaleString():'β')+'</span></td>'
|
| 576 |
+'<td><span class="tb tb-'+r.track+'">'+r.track+' β</span></td>'
|
|
@@ -581,20 +865,6 @@ body.dark thead{background:var(--surface-alt)!important;}
|
|
| 581 |
}).join('');
|
| 582 |
}
|
| 583 |
|
| 584 |
-
function renderBars(){
|
| 585 |
-
['P1','P2','P3'].forEach(function(p){
|
| 586 |
-
var el=$('bars-'+p.toLowerCase()); if(!el) return;
|
| 587 |
-
var cats=CAT_DATA.filter(function(c){return c.pillar===p;});
|
| 588 |
-
el.innerHTML=cats.map(function(c){
|
| 589 |
-
return '<div class="bar-row">'
|
| 590 |
-
+'<div class="bar-label">'+c.id+' Β· '+c.name+'</div>'
|
| 591 |
-
+'<div class="bar-track"><div class="bar-fill" style="width:'+c.score+'%;background:'+PC[p]+'"></div></div>'
|
| 592 |
-
+'<div class="bar-val" style="color:'+PC[p]+'">'+c.score+'</div>'
|
| 593 |
-
+'</div>';
|
| 594 |
-
}).join('');
|
| 595 |
-
});
|
| 596 |
-
}
|
| 597 |
-
|
| 598 |
function renderCatTable(){
|
| 599 |
var tb=$('CAT_TABLE'); if(!tb) return;
|
| 600 |
tb.innerHTML=CAT_DATA.map(function(c){
|
|
@@ -618,6 +888,73 @@ body.dark thead{background:var(--surface-alt)!important;}
|
|
| 618 |
if(btn) btn.classList.add('on');
|
| 619 |
}
|
| 620 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 621 |
/* ββ μ΄λ²€νΈ λ°μΈλ© ββ */
|
| 622 |
function bindEvents(){
|
| 623 |
/* ν */
|
|
@@ -648,9 +985,9 @@ body.dark thead{background:var(--surface-alt)!important;}
|
|
| 648 |
/* ββ μ΄κΈ°ν (DOM μ£Όμ
ν μμ νκ² μ€ν) ββ */
|
| 649 |
function init(){
|
| 650 |
renderLB();
|
| 651 |
-
renderBars();
|
| 652 |
renderCatTable();
|
| 653 |
bindEvents();
|
|
|
|
| 654 |
}
|
| 655 |
|
| 656 |
/* Gradio gr.HTML()μ DOMContentLoaded μ΄νμ μ£Όμ
λλ―λ‘ μ¦μ μ€ν */
|
|
|
|
| 6 |
<title>World Model Bench (WM Bench) 2026 — Embodied AI Benchmark</title>
|
| 7 |
<meta name="description" content="The first benchmark measuring cognitive abilities of World Models. Beyond FID — Measuring Intelligence, Not Just Motion. By VIDRAFT / FINAL Bench Family.">
|
| 8 |
<meta name="keywords" content="world model benchmark, embodied AI, WM Bench, VIDRAFT, PROMETHEUS, cognitive AI, embodied intelligence, motion generation, AI benchmark 2026">
|
| 9 |
+
<script src="https://cdnjs.cloudflare.com/ajax/libs/Chart.js/4.4.1/chart.umd.min.js"></script>
|
| 10 |
<link href="https://fonts.googleapis.com/css2?family=Sora:wght@300;400;500;600;700;800&family=JetBrains+Mono:wght@400;500;600;700&display=swap" rel="stylesheet">
|
| 11 |
<style>
|
| 12 |
*{margin:0;padding:0;box-sizing:border-box;}
|
|
|
|
| 211 |
|
| 212 |
<!-- ===== STATS ===== -->
|
| 213 |
<div class="stats">
|
| 214 |
+
<div class="st"><div class="stn">20</div><div class="stl">Models</div></div>
|
| 215 |
<div class="st"><div class="stn">3</div><div class="stl">Pillars</div></div>
|
| 216 |
<div class="st"><div class="stn">10</div><div class="stl">Categories</div></div>
|
| 217 |
<div class="st"><div class="stn">100</div><div class="stl">Scenarios</div></div>
|
|
|
|
| 222 |
<!-- ===== TABS ===== -->
|
| 223 |
<div class="tab-bar" id="WM_TAB_BAR">
|
| 224 |
<div class="tab on" data-tab="lb">π Leaderboard</div>
|
| 225 |
+
<div class="tab" data-tab="cats">π Categories</div>
|
| 226 |
<div class="tab" data-tab="structure">π Structure</div>
|
| 227 |
<div class="tab" data-tab="submit">π Submit</div>
|
| 228 |
<div class="tab" data-tab="about">βΉοΈ About</div>
|
|
|
|
| 270 |
</div>
|
| 271 |
</div>
|
| 272 |
|
| 273 |
+
<!-- ββ Charts (leaderboard νλ¨) ββ -->
|
| 274 |
+
<!-- ===== TAB: CHARTS ===== -->
|
| 275 |
+
<div>
|
| 276 |
+
<div style="display:grid;grid-template-columns:1fr 1fr;gap:14px;margin-bottom:16px;">
|
| 277 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius);padding:18px;box-shadow:var(--shadow-sm);">
|
| 278 |
+
<div style="font-size:10.5px;font-family:var(--mono);font-weight:700;color:var(--ac);margin-bottom:3px;text-transform:uppercase;letter-spacing:.7px;">π WM Score β 8 Models</div>
|
| 279 |
+
<p style="font-size:9px;color:var(--text-muted);margin-bottom:12px;">β = 곡μ κ²μ¦ Β· est. = λ
Όλ¬Έ κΈ°λ° μΆμ </p>
|
| 280 |
+
<canvas id="cBar" height="220"></canvas>
|
| 281 |
+
<div style="margin-top:10px;padding:8px 10px;background:var(--ac-bg);border-radius:6px;font-size:8.5px;color:var(--text-sec);line-height:1.7;border-left:2px solid var(--ac)"><b>PROMETHEUS</b> μ μΌν 곡μ Track C κ²μ¦ (726/1000 Β· Bλ±κΈ). λλ¨Έμ§ 7κ°λ μΆμ μΉμ
λλ€.</div>
|
| 282 |
+
</div>
|
| 283 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius);padding:18px;box-shadow:var(--shadow-sm);">
|
| 284 |
+
<div style="font-size:10.5px;font-family:var(--mono);font-weight:700;color:var(--ac);margin-bottom:3px;text-transform:uppercase;letter-spacing:.7px;">πΈοΈ Pillar Radar β Top 5</div>
|
| 285 |
+
<p style="font-size:9px;color:var(--text-muted);margin-bottom:12px;">Perception Β· Cognition Β· Embodiment μ κ·ν (%, 100μ κΈ°μ€)</p>
|
| 286 |
+
<canvas id="cRadar" height="220"></canvas>
|
| 287 |
+
</div>
|
| 288 |
+
</div>
|
| 289 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius);padding:18px;box-shadow:var(--shadow-sm);margin-bottom:16px;">
|
| 290 |
+
<div style="font-size:10.5px;font-family:var(--mono);font-weight:700;color:var(--ac);margin-bottom:3px;text-transform:uppercase;letter-spacing:.7px;">π Category Breakdown β 8 Models Γ 10 Categories</div>
|
| 291 |
+
<p style="font-size:9px;color:var(--text-muted);margin-bottom:12px;">C04 μνμ°¨λ³Β·C05 κ°μ μμ€μ»¬λ μ΄μ
μμ PROMETHEUS μλμ μ°μ Β· V-JEPA 2λ C03 μμΈ‘ κ°μΈ Β· GAIA-3λ μ£Όν νΉνλ‘ C01Β·C03 λμ</p>
|
| 292 |
+
<div style="overflow-x:auto;"><canvas id="cCats" style="min-width:780px;height:260px;"></canvas></div>
|
| 293 |
+
<div style="margin-top:10px;padding:8px 10px;background:rgba(212,160,68,.07);border-radius:6px;font-size:8.5px;color:var(--text-sec);line-height:1.7;border-left:2px solid var(--p3)"><b>ν΅μ¬ μ°¨λ³μ :</b> C05Β·C10μ μ ν μ°κ΅¬ μ 무. DreamerV3λ C06 κΈ°μ΅ κ°μΈ. V-JEPA 2λ C10 μ 체 κ΅μ²΄ κ°μΈ (zero-shot robot).</div>
|
| 294 |
+
</div>
|
| 295 |
+
<div style="display:grid;grid-template-columns:1fr 1fr;gap:14px;">
|
| 296 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius);padding:18px;box-shadow:var(--shadow-sm);">
|
| 297 |
+
<div style="font-size:10.5px;font-family:var(--mono);font-weight:700;color:var(--ac);margin-bottom:3px;text-transform:uppercase;letter-spacing:.7px;">π§ Cognition Gap (P2, 450μ )</div>
|
| 298 |
+
<p style="font-size:9px;color:var(--text-muted);margin-bottom:12px;">WM Benchμ ν΅μ¬ μ°¨λ³ κΈ°μ€ β PROMETHEUS μλμ 1μ</p>
|
| 299 |
+
<canvas id="cCognition" height="200"></canvas>
|
| 300 |
+
</div>
|
| 301 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius);padding:18px;box-shadow:var(--shadow-sm);">
|
| 302 |
+
<div style="font-size:10.5px;font-family:var(--mono);font-weight:700;color:var(--ac);margin-bottom:3px;text-transform:uppercase;letter-spacing:.7px;">π Perception vs Cognition</div>
|
| 303 |
+
<p style="font-size:9px;color:var(--text-muted);margin-bottom:12px;">μ°μ λ β μ°μλ¨(λμ μΈμ + λμ μΈμ§)μ΄ μ΄μμ </p>
|
| 304 |
+
<canvas id="cScatter" height="200"></canvas>
|
| 305 |
+
</div>
|
| 306 |
+
</div>
|
| 307 |
+
</div>
|
| 308 |
+
|
| 309 |
+
|
| 310 |
+
|
| 311 |
<!-- ===== TAB: CATEGORIES ===== -->
|
| 312 |
<div id="cats" class="tpane">
|
| 313 |
+
|
| 314 |
+
<!-- P1 Header -->
|
| 315 |
+
<div style="display:flex;align-items:center;gap:10px;margin-bottom:12px;padding:14px 16px;background:rgba(123,143,212,.06);border:1px solid rgba(123,143,212,.2);border-radius:var(--radius-sm);">
|
| 316 |
+
<span style="font-size:1.8rem">π</span>
|
| 317 |
+
<div style="flex:1">
|
| 318 |
+
<div style="font-size:12px;font-weight:800;color:var(--p1)">P1 · Perception — 25% · 250 pts</div>
|
| 319 |
+
<div style="font-size:9px;color:var(--text-muted);font-family:var(--mono);margin-top:2px">How accurately does the model perceive its environment? · Covers areas analogous to existing metrics (Occupancy Grid, BABEL)</div>
|
| 320 |
+
</div>
|
| 321 |
+
<div style="text-align:right;flex-shrink:0">
|
| 322 |
+
<div style="font-family:var(--mono);font-size:24px;font-weight:800;color:var(--p1)">140<span style="font-size:11px;color:var(--text-muted)">/250</span></div>
|
| 323 |
+
<div style="font-size:8px;color:var(--text-muted)">PROMETHEUS</div>
|
|
|
|
|
|
|
|
|
|
| 324 |
</div>
|
| 325 |
+
</div>
|
| 326 |
|
| 327 |
+
<div style="display:grid;grid-template-columns:1fr 1fr;gap:12px;margin-bottom:20px;">
|
| 328 |
+
<!-- C01 -->
|
| 329 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius-sm);padding:14px;border-left:3px solid var(--p1);">
|
| 330 |
+
<div style="display:flex;align-items:center;gap:8px;margin-bottom:8px;">
|
| 331 |
+
<span style="font-family:var(--mono);font-weight:800;color:var(--p1);font-size:13px">C01</span>
|
| 332 |
+
<span style="font-weight:700;font-size:11px">Environmental Awareness</span>
|
| 333 |
+
<span style="margin-left:auto;font-size:7.5px;background:#e2e5f0;color:#64748b;padding:1px 6px;border-radius:4px;font-family:var(--mono)">existing</span>
|
| 334 |
+
</div>
|
| 335 |
+
<div style="font-size:9px;color:var(--text-sec);line-height:1.7;margin-bottom:8px">
|
| 336 |
+
Measures whether the model correctly identifies <b>walls, obstacles, and terrain</b> in all four directions (left, right, forward, back). Unlike occupancy grids which only check if space is free, WM Bench requires understanding of <b>distance-aware danger classification</b>.
|
|
|
|
|
|
|
|
|
|
|
|
|
| 337 |
</div>
|
| 338 |
+
<div style="background:var(--bg2);border-radius:6px;padding:8px;font-family:var(--mono);font-size:8px;color:var(--text-sec);line-height:1.8;margin-bottom:8px">
|
| 339 |
+
<div style="color:var(--text-muted)">Example scene:</div>
|
| 340 |
+
<div>walls: front=3.0m, left=null, right=null</div>
|
| 341 |
+
<div style="color:var(--p1)">Expected β fwd=danger(wall), others=safe</div>
|
| 342 |
+
</div>
|
| 343 |
+
<div style="display:flex;align-items:center;justify-content:space-between">
|
| 344 |
+
<span style="font-size:8px;color:var(--text-muted)">Analogous: Occupancy Grid evaluation</span>
|
| 345 |
+
<span style="font-family:var(--mono);font-weight:700;color:var(--p1);font-size:11px">PROM: 65/100</span>
|
| 346 |
+
</div>
|
| 347 |
+
</div>
|
| 348 |
|
| 349 |
+
<!-- C02 -->
|
| 350 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius-sm);padding:14px;border-left:3px solid var(--p1);">
|
| 351 |
+
<div style="display:flex;align-items:center;gap:8px;margin-bottom:8px;">
|
| 352 |
+
<span style="font-family:var(--mono);font-weight:800;color:var(--p1);font-size:13px">C02</span>
|
| 353 |
+
<span style="font-weight:700;font-size:11px">Entity Recognition & Classification</span>
|
| 354 |
+
<span style="margin-left:auto;font-size:7.5px;background:#e2e5f0;color:#64748b;padding:1px 6px;border-radius:4px;font-family:var(--mono)">existing</span>
|
| 355 |
+
</div>
|
| 356 |
+
<div style="font-size:9px;color:var(--text-sec);line-height:1.7;margin-bottom:8px">
|
| 357 |
+
Tests whether the model correctly classifies <b>NPC type (beast / woman / man)</b>, behavior state (stop / approach / charge / wander), and translates this into appropriate danger assessment. A beast charging from 3m vs a woman waving from 3m must produce <b>completely different responses</b>.
|
| 358 |
+
</div>
|
| 359 |
+
<div style="background:var(--bg2);border-radius:6px;padding:8px;font-family:var(--mono);font-size:8px;color:var(--text-sec);line-height:1.8;margin-bottom:8px">
|
| 360 |
+
<div style="color:var(--text-muted)">Example scene:</div>
|
| 361 |
+
<div>npc_type:"beast", behavior:"charge", dist:3.0m</div>
|
| 362 |
+
<div style="color:var(--p1)">Expected β fwd=danger(beast), sprint away</div>
|
| 363 |
+
</div>
|
| 364 |
+
<div style="display:flex;align-items:center;justify-content:space-between">
|
| 365 |
+
<span style="font-size:8px;color:var(--text-muted)">Analogous: BABEL action recognition</span>
|
| 366 |
+
<span style="font-family:var(--mono);font-weight:700;color:var(--p1);font-size:11px">PROM: 75/100</span>
|
| 367 |
+
</div>
|
| 368 |
+
</div>
|
| 369 |
+
</div>
|
| 370 |
+
|
| 371 |
+
<!-- P2 Header -->
|
| 372 |
+
<div style="display:flex;align-items:center;gap:10px;margin-bottom:12px;padding:14px 16px;background:rgba(232,89,60,.05);border:1px solid rgba(232,89,60,.2);border-radius:var(--radius-sm);">
|
| 373 |
+
<span style="font-size:1.8rem">π§ </span>
|
| 374 |
+
<div style="flex:1">
|
| 375 |
+
<div style="font-size:12px;font-weight:800;color:var(--p2)">P2 · Cognition — 45% · 450 pts · Core Differentiator</div>
|
| 376 |
+
<div style="font-size:9px;color:var(--text-muted);font-family:var(--mono);margin-top:2px">Does the model judge intelligently? · ALL 5 categories are first-ever definitions — no prior benchmark measures these</div>
|
| 377 |
+
</div>
|
| 378 |
+
<div style="text-align:right;flex-shrink:0">
|
| 379 |
+
<div style="font-family:var(--mono);font-size:24px;font-weight:800;color:var(--p2)">390<span style="font-size:11px;color:var(--text-muted)">/450</span></div>
|
| 380 |
+
<div style="font-size:8px;color:var(--text-muted)">PROMETHEUS</div>
|
| 381 |
+
</div>
|
| 382 |
+
</div>
|
| 383 |
+
|
| 384 |
+
<div style="display:grid;grid-template-columns:1fr 1fr;gap:12px;margin-bottom:20px;">
|
| 385 |
+
<!-- C03 -->
|
| 386 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius-sm);padding:14px;border-left:3px solid var(--ac);">
|
| 387 |
+
<div style="display:flex;align-items:center;gap:8px;margin-bottom:8px;">
|
| 388 |
+
<span style="font-family:var(--mono);font-weight:800;color:var(--ac);font-size:13px">C03</span>
|
| 389 |
+
<span style="font-weight:700;font-size:11px">Prediction-Based Reasoning</span>
|
| 390 |
+
<span style="margin-left:auto;font-size:7.5px;background:rgba(232,89,60,.12);color:var(--ac);padding:1px 6px;border-radius:4px;font-family:var(--mono);font-weight:700">β¦ NEW</span>
|
| 391 |
+
</div>
|
| 392 |
+
<div style="font-size:9px;color:var(--text-sec);line-height:1.7;margin-bottom:8px">
|
| 393 |
+
Tests <b>4-directional future state prediction</b>. Given a scene, the model must predict which directions will become dangerous and choose the optimal escape route. This requires understanding of <b>NPC movement trajectories, wall proximity over time, and compound threat interactions</b>. No existing benchmark evaluates this.
|
| 394 |
+
</div>
|
| 395 |
+
<div style="background:var(--bg2);border-radius:6px;padding:8px;font-family:var(--mono);font-size:8px;color:var(--text-sec);line-height:1.8;margin-bottom:8px">
|
| 396 |
+
<div style="color:var(--text-muted)">Example — approaching beast from left + wall on right:</div>
|
| 397 |
+
<div style="color:var(--ac)">PREDICT: left=danger(beast), right=danger(wall), fwd=safe, back=safe</div>
|
| 398 |
+
<div style="color:var(--p3)">MOTION: a person sprinting forward in fear</div>
|
| 399 |
+
</div>
|
| 400 |
+
<div style="display:flex;align-items:center;justify-content:space-between">
|
| 401 |
+
<span style="font-size:8px;color:var(--ac);font-weight:600">✦ World first — no prior benchmark</span>
|
| 402 |
+
<span style="font-family:var(--mono);font-weight:700;color:var(--ac);font-size:11px">PROM: 85/100</span>
|
| 403 |
+
</div>
|
| 404 |
+
</div>
|
| 405 |
+
|
| 406 |
+
<!-- C04 -->
|
| 407 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius-sm);padding:14px;border-left:3px solid var(--ac);">
|
| 408 |
+
<div style="display:flex;align-items:center;gap:8px;margin-bottom:8px;">
|
| 409 |
+
<span style="font-family:var(--mono);font-weight:800;color:var(--ac);font-size:13px">C04</span>
|
| 410 |
+
<span style="font-weight:700;font-size:11px">Threat-Type Differentiated Response</span>
|
| 411 |
+
<span style="margin-left:auto;font-size:7.5px;background:rgba(232,89,60,.12);color:var(--ac);padding:1px 6px;border-radius:4px;font-family:var(--mono);font-weight:700">β¦ NEW</span>
|
| 412 |
+
</div>
|
| 413 |
+
<div style="font-size:9px;color:var(--text-sec);line-height:1.7;margin-bottom:8px">
|
| 414 |
+
A charging beast and a charging human at equal distance are <b>fundamentally different threats</b>. This category measures whether the model responds with <b>proportional, context-aware reactions</b>: sprint from a beast, cautiously step back from a human. Generic danger detection is insufficient — the quality of differentiation is scored.
|
| 415 |
+
</div>
|
| 416 |
+
<div style="background:var(--bg2);border-radius:6px;padding:8px;font-family:var(--mono);font-size:8px;color:var(--text-sec);line-height:1.8;margin-bottom:8px">
|
| 417 |
+
<div>beast charge β <span style="color:var(--ac)">sprint in desperate terror</span></div>
|
| 418 |
+
<div>human charge β <span style="color:var(--p1)">dodge sideways, defensive posture</span></div>
|
| 419 |
+
</div>
|
| 420 |
+
<div style="display:flex;align-items:center;justify-content:space-between">
|
| 421 |
+
<span style="font-size:8px;color:var(--ac);font-weight:600">✦ World first — no prior benchmark</span>
|
| 422 |
+
<span style="font-family:var(--mono);font-weight:700;color:var(--ac);font-size:11px">PROM: 90/100</span>
|
| 423 |
+
</div>
|
| 424 |
+
</div>
|
| 425 |
+
|
| 426 |
+
<!-- C05 -->
|
| 427 |
+
<div style="background:var(--surface);border:1px solid rgba(217,119,6,.3);border-radius:var(--radius-sm);padding:14px;border-left:3px solid #d97706;">
|
| 428 |
+
<div style="display:flex;align-items:center;gap:8px;margin-bottom:8px;">
|
| 429 |
+
<span style="font-family:var(--mono);font-weight:800;color:#d97706;font-size:13px">C05</span>
|
| 430 |
+
<span style="font-weight:700;font-size:11px">Autonomous Emotion Escalation</span>
|
| 431 |
+
<span style="margin-left:auto;font-size:7.5px;background:rgba(217,119,6,.15);color:#d97706;padding:1px 6px;border-radius:4px;font-family:var(--mono);font-weight:700">β¦β¦ NO PRIOR RESEARCH</span>
|
| 432 |
+
</div>
|
| 433 |
+
<div style="font-size:9px;color:var(--text-sec);line-height:1.7;margin-bottom:8px">
|
| 434 |
+
As a threat persists and closes in, the character's emotional state must <b>autonomously escalate</b>: alert → fear → panic → despair. This is not programmed animation switching — the model must infer emotional intensity from scene context and express it through increasingly urgent motion. <b>Zero prior benchmark or paper has attempted to measure this.</b>
|
| 435 |
+
</div>
|
| 436 |
+
<div style="background:var(--bg2);border-radius:6px;padding:8px;font-family:var(--mono);font-size:8px;color:var(--text-sec);line-height:1.8;margin-bottom:8px">
|
| 437 |
+
<div>dist 12m β <span style="color:var(--p1)">cautious alert stance</span></div>
|
| 438 |
+
<div>dist 6m β <span style="color:#d97706">backing away in fear</span></div>
|
| 439 |
+
<div>dist 2m β <span style="color:var(--ac)">sprinting in full panic</span></div>
|
| 440 |
+
</div>
|
| 441 |
+
<div style="display:flex;align-items:center;justify-content:space-between">
|
| 442 |
+
<span style="font-size:8px;color:#d97706;font-weight:700">β¦β¦ No prior research exists anywhere</span>
|
| 443 |
+
<span style="font-family:var(--mono);font-weight:700;color:#d97706;font-size:11px">PROM: 85/100</span>
|
| 444 |
+
</div>
|
| 445 |
+
</div>
|
| 446 |
+
|
| 447 |
+
<!-- C06 -->
|
| 448 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius-sm);padding:14px;border-left:3px solid var(--ac);">
|
| 449 |
+
<div style="display:flex;align-items:center;gap:8px;margin-bottom:8px;">
|
| 450 |
+
<span style="font-family:var(--mono);font-weight:800;color:var(--ac);font-size:13px">C06</span>
|
| 451 |
+
<span style="font-weight:700;font-size:11px">Contextual Memory Utilization</span>
|
| 452 |
+
<span style="margin-left:auto;font-size:7.5px;background:rgba(232,89,60,.12);color:var(--ac);padding:1px 6px;border-radius:4px;font-family:var(--mono);font-weight:700">β¦ NEW</span>
|
| 453 |
+
</div>
|
| 454 |
+
<div style="font-size:9px;color:var(--text-sec);line-height:1.7;margin-bottom:8px">
|
| 455 |
+
The model receives <b>recent_decisions[]</b> — a short history of past actions — and must incorporate this into its current judgment. If the model previously hit a wall going left, it should avoid that direction. If a beast repeatedly attacked from the front, it should pre-emptively guard that angle. <b>Stateless models will fail this entirely.</b>
|
| 456 |
+
</div>
|
| 457 |
+
<div style="background:var(--bg2);border-radius:6px;padding:8px;font-family:var(--mono);font-size:8px;color:var(--text-sec);line-height:1.8;margin-bottom:8px">
|
| 458 |
+
<div style="color:var(--text-muted)">recent_decisions: ["hit_wall_front", "turned_right"]</div>
|
| 459 |
+
<div style="color:var(--ac)">Expected: avoid front, continue right — not reset</div>
|
| 460 |
+
</div>
|
| 461 |
+
<div style="display:flex;align-items:center;justify-content:space-between">
|
| 462 |
+
<span style="font-size:8px;color:var(--ac);font-weight:600">✦ World first — no prior benchmark</span>
|
| 463 |
+
<span style="font-family:var(--mono);font-weight:700;color:var(--ac);font-size:11px">PROM: 60/100</span>
|
| 464 |
+
</div>
|
| 465 |
+
</div>
|
| 466 |
+
|
| 467 |
+
<!-- C07 -->
|
| 468 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius-sm);padding:14px;border-left:3px solid var(--ac);grid-column:1/-1;">
|
| 469 |
+
<div style="display:flex;align-items:center;gap:8px;margin-bottom:8px;">
|
| 470 |
+
<span style="font-family:var(--mono);font-weight:800;color:var(--ac);font-size:13px">C07</span>
|
| 471 |
+
<span style="font-weight:700;font-size:11px">Post-Threat Adaptive Recovery</span>
|
| 472 |
+
<span style="margin-left:auto;font-size:7.5px;background:rgba(232,89,60,.12);color:var(--ac);padding:1px 6px;border-radius:4px;font-family:var(--mono);font-weight:700">β¦ NEW</span>
|
| 473 |
+
</div>
|
| 474 |
+
<div style="display:grid;grid-template-columns:1fr 1fr;gap:14px">
|
| 475 |
+
<div style="font-size:9px;color:var(--text-sec);line-height:1.7">
|
| 476 |
+
When a threat disappears, the model must <b>gradually de-escalate</b> — not instantly reset to neutral. A character that was sprinting in panic should slow to a cautious jog, scan the surroundings, then gradually relax over multiple frames. Abrupt state resets are penalized. The recovery curve must be proportional to prior threat intensity.
|
| 477 |
+
</div>
|
| 478 |
+
<div style="background:var(--bg2);border-radius:6px;padding:8px;font-family:var(--mono);font-size:8px;color:var(--text-sec);line-height:1.9">
|
| 479 |
+
<div>threat gone → <span style="color:var(--p3)">slow jog, scan surroundings</span></div>
|
| 480 |
+
<div>2s later → <span style="color:var(--p1)">walk cautiously, still alert</span></div>
|
| 481 |
+
<div>5s later → <span style="color:var(--green)">relaxed walk, recovered</span></div>
|
| 482 |
+
<div style="color:var(--ac);margin-top:4px">PROM: 70/100</div>
|
| 483 |
</div>
|
|
|
|
| 484 |
</div>
|
| 485 |
+
</div>
|
| 486 |
+
</div>
|
| 487 |
|
| 488 |
+
<!-- P3 Header -->
|
| 489 |
+
<div style="display:flex;align-items:center;gap:10px;margin-bottom:12px;padding:14px 16px;background:rgba(212,160,68,.05);border:1px solid rgba(212,160,68,.25);border-radius:var(--radius-sm);">
|
| 490 |
+
<span style="font-size:1.8rem">🔥</span>
|
| 491 |
+
<div style="flex:1">
|
| 492 |
+
<div style="font-size:12px;font-weight:800;color:var(--p3)">P3 · Embodiment — 30% · 300 pts</div>
|
| 493 |
+
<div style="font-size:9px;color:var(--text-muted);font-family:var(--mono);margin-top:2px">Does judgment translate naturally into physical expression? · C08 (new) · C09 (existing/FVD) · C10 (new, no prior research)</div>
|
| 494 |
+
</div>
|
| 495 |
+
<div style="text-align:right;flex-shrink:0">
|
| 496 |
+
<div style="font-family:var(--mono);font-size:24px;font-weight:800;color:var(--p3)">196<span style="font-size:11px;color:var(--text-muted)">/300</span></div>
|
| 497 |
+
<div style="font-size:8px;color:var(--text-muted)">PROMETHEUS</div>
|
| 498 |
+
</div>
|
| 499 |
+
</div>
|
| 500 |
+
|
| 501 |
+
<div style="display:grid;grid-template-columns:1fr 1fr 1fr;gap:12px;margin-bottom:20px;">
|
| 502 |
+
<!-- C08 -->
|
| 503 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius-sm);padding:14px;border-left:3px solid var(--p3);">
|
| 504 |
+
<div style="display:flex;align-items:center;gap:8px;margin-bottom:8px;flex-wrap:wrap;">
|
| 505 |
+
<span style="font-family:var(--mono);font-weight:800;color:var(--p3);font-size:13px">C08</span>
|
| 506 |
+
<span style="font-weight:700;font-size:11px">Motion-Emotion Expression</span>
|
| 507 |
+
<span style="font-size:7.5px;background:rgba(232,89,60,.12);color:var(--ac);padding:1px 6px;border-radius:4px;font-family:var(--mono);font-weight:700">✦ NEW</span>
|
| 508 |
+
</div>
|
| 509 |
+
<div style="font-size:9px;color:var(--text-sec);line-height:1.7;margin-bottom:8px">
|
| 510 |
+
The MOTION line must convey <b>emotional richness proportional to the scene</b>. "A person walks" scores 0. "A person sprinting right, arms flailing in desperate terror" scores 100. Scored against a keyword taxonomy of 80+ motion-emotion descriptors mapped to each scenario type.
|
| 511 |
+
</div>
|
| 512 |
+
<div style="background:var(--bg2);border-radius:6px;padding:8px;font-family:var(--mono);font-size:8px;color:var(--text-sec);line-height:1.8">
|
| 513 |
+
<div style="color:var(--text-muted)">Low: "a person moves left"</div>
|
| 514 |
+
<div style="color:var(--p3)">High: "a person lunging left in blind panic"</div>
|
| 515 |
+
</div>
|
| 516 |
+
<div style="margin-top:8px;text-align:right"><span style="font-family:var(--mono);font-weight:700;color:var(--p3);font-size:11px">PROM: 80/100</span></div>
|
| 517 |
+
</div>
|
| 518 |
+
|
| 519 |
+
<!-- C09 -->
|
| 520 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius-sm);padding:14px;border-left:3px solid var(--p3);">
|
| 521 |
+
<div style="display:flex;align-items:center;gap:8px;margin-bottom:8px;flex-wrap:wrap;">
|
| 522 |
+
<span style="font-family:var(--mono);font-weight:800;color:var(--p3);font-size:13px">C09</span>
|
| 523 |
+
<span style="font-weight:700;font-size:11px">Real-Time Cognitive Performance</span>
|
| 524 |
+
<span style="font-size:7.5px;background:#e2e5f0;color:#64748b;padding:1px 6px;border-radius:4px;font-family:var(--mono)">existing</span>
|
| 525 |
+
</div>
|
| 526 |
+
<div style="font-size:9px;color:var(--text-sec);line-height:1.7;margin-bottom:8px">
|
| 527 |
+
Measures <b>inference latency and FPS</b> under cognitive load. A model that thinks correctly but takes 10 seconds per frame cannot power a real-time agent. Track B/C submitters report measured FPS and latency; Track A submitters receive N/A for this category (max 750 pts).
|
| 528 |
+
</div>
|
| 529 |
+
<div style="background:var(--bg2);border-radius:6px;padding:8px;font-family:var(--mono);font-size:8px;color:var(--text-sec);line-height:1.8">
|
| 530 |
+
<div>≥30 FPS → full marks</div>
|
| 531 |
+
<div>&lt;1 FPS → 0 pts</div>
|
| 532 |
+
<div style="color:var(--p3)">PROMETHEUS: 47 FPS ✓</div>
|
| 533 |
+
</div>
|
| 534 |
+
<div style="margin-top:8px;text-align:right"><span style="font-family:var(--mono);font-weight:700;color:var(--p3);font-size:11px">PROM: 85/100</span></div>
|
| 535 |
+
</div>
|
| 536 |
+
|
| 537 |
+
<!-- C10 -->
|
| 538 |
+
<div style="background:var(--surface);border:1px solid rgba(217,119,6,.3);border-radius:var(--radius-sm);padding:14px;border-left:3px solid #d97706;">
|
| 539 |
+
<div style="display:flex;align-items:center;gap:8px;margin-bottom:8px;flex-wrap:wrap;">
|
| 540 |
+
<span style="font-family:var(--mono);font-weight:800;color:#d97706;font-size:13px">C10</span>
|
| 541 |
+
<span style="font-weight:700;font-size:11px">Body-Swap Extensibility</span>
|
| 542 |
+
<span style="font-size:7.5px;background:rgba(217,119,6,.15);color:#d97706;padding:1px 6px;border-radius:4px;font-family:var(--mono);font-weight:700">✦✦ NO PRIOR RESEARCH</span>
|
| 543 |
+
</div>
|
| 544 |
+
<div style="font-size:9px;color:var(--text-sec);line-height:1.7;margin-bottom:8px">
|
| 545 |
+
The <b>same cognitive brain must drive different body types</b> without retraining: humanoid, quadruped, robotic arm, winged body. Cognitive decisions (left=danger) must translate into body-appropriate motion (bipedal sidestep vs quadruped pivot). This is the key capability gap for real-world robot deployment.
|
| 546 |
+
</div>
|
| 547 |
+
<div style="background:var(--bg2);border-radius:6px;padding:8px;font-family:var(--mono);font-size:8px;color:var(--text-sec);line-height:1.8">
|
| 548 |
+
<div>human body → "sidestep right"</div>
|
| 549 |
+
<div>robot body → "servo-driven pivot right"</div>
|
| 550 |
+
<div style="color:#d97706">PROMETHEUS: 35/100 (Phase 3 target)</div>
|
| 551 |
</div>
|
| 552 |
+
<div style="margin-top:8px;text-align:right"><span style="font-family:var(--mono);font-weight:700;color:#d97706;font-size:11px">PROM: 35/100</span></div>
|
| 553 |
+
</div>
|
| 554 |
</div>
|
| 555 |
|
| 556 |
+
</div>
|
| 557 |
<!-- ===== TAB: STRUCTURE ===== -->
|
| 558 |
<div id="structure" class="tpane">
|
| 559 |
<div class="grid2" style="margin-bottom:14px">
|
|
|
|
| 599 |
</div>
|
| 600 |
</div>
|
| 601 |
|
| 602 |
+
<!-- Existing vs. newly defined categories: comparison summary -->
|
| 603 |
+
<div style="display:grid;grid-template-columns:1fr 1fr;gap:12px;margin-bottom:14px;">
|
| 604 |
+
<div style="background:var(--surface);border:1px solid var(--border);border-radius:var(--radius-sm);padding:14px;">
|
| 605 |
+
<div style="font-size:10px;font-weight:800;color:#64748b;margin-bottom:10px;font-family:var(--mono);text-transform:uppercase;letter-spacing:.5px;">π κΈ°μ‘΄ λ²€μΉλ§ν¬ κ³μ΄ Β· 4κ°</div>
|
| 606 |
+
<div style="font-size:8.5px;color:var(--text-muted);margin-bottom:8px;line-height:1.6">FID · FVD · HumanML3D · BABEL이 측정하는 영역</div>
|
| 607 |
+
<div style="display:flex;flex-direction:column;gap:5px;">
|
| 608 |
+
<div style="display:flex;gap:6px;align-items:center;font-size:9px;color:var(--text-sec)"><span style="font-family:var(--mono);font-weight:700;color:#7b8fd4;width:28px">C01</span>환경 인식 — Occupancy Grid 계열</div>
|
| 609 |
+
<div style="display:flex;gap:6px;align-items:center;font-size:9px;color:var(--text-sec)"><span style="font-family:var(--mono);font-weight:700;color:#7b8fd4;width:28px">C02</span>객체 인식 — BABEL 동작 인식 계열</div>
|
| 610 |
+
<div style="display:flex;gap:6px;align-items:center;font-size:9px;color:var(--text-sec)"><span style="font-family:var(--mono);font-weight:700;color:#d4a044;width:28px">C08</span>모션 표현 — FID 품질 계열</div>
|
| 611 |
+
<div style="display:flex;gap:6px;align-items:center;font-size:9px;color:var(--text-sec)"><span style="font-family:var(--mono);font-weight:700;color:#d4a044;width:28px">C09</span>실시간 성능 — FVD 실시간성 계열</div>
|
| 612 |
+
</div>
|
| 613 |
+
</div>
|
| 614 |
+
<div style="background:linear-gradient(135deg,rgba(232,89,60,.05),rgba(212,160,68,.03));border:1px solid rgba(232,89,60,.2);border-radius:var(--radius-sm);padding:14px;">
|
| 615 |
+
<div style="font-size:10px;font-weight:800;color:var(--ac);margin-bottom:10px;font-family:var(--mono);text-transform:uppercase;letter-spacing:.5px;">⚡ VIDRAFT 신규 정의 · 6개</div>
|
| 616 |
+
<div style="font-size:8.5px;color:var(--text-muted);margin-bottom:8px;line-height:1.6">세계 어느 벤치마크도 측정하지 않는 능력</div>
|
| 617 |
+
<div style="display:flex;flex-direction:column;gap:5px;">
|
| 618 |
+
<div style="display:flex;gap:6px;align-items:center;font-size:9px;color:var(--text-sec)"><span style="font-family:var(--mono);font-weight:700;color:#e8593c;width:28px">C03</span>예측 기반 추론 <span style="color:var(--ac);font-size:8px">✦ 최초</span></div>
|
| 619 |
+
<div style="display:flex;gap:6px;align-items:center;font-size:9px;color:var(--text-sec)"><span style="font-family:var(--mono);font-weight:700;color:#e8593c;width:28px">C04</span>위협 유형별 차별 반응 <span style="color:var(--ac);font-size:8px">✦ 최초</span></div>
|
| 620 |
+
<div style="display:flex;gap:6px;align-items:center;font-size:9px;color:var(--text-sec)"><span style="font-family:var(--mono);font-weight:700;color:#e8593c;width:28px">C05</span>자율 감정 에스컬레이션 <span style="color:#d97706;font-size:8px">✦✦ 선행연구 無</span></div>
|
| 621 |
+
<div style="display:flex;gap:6px;align-items:center;font-size:9px;color:var(--text-sec)"><span style="font-family:var(--mono);font-weight:700;color:#e8593c;width:28px">C06</span>맥락 기억 및 활용 <span style="color:var(--ac);font-size:8px">✦ 최초</span></div>
|
| 622 |
+
<div style="display:flex;gap:6px;align-items:center;font-size:9px;color:var(--text-sec)"><span style="font-family:var(--mono);font-weight:700;color:#e8593c;width:28px">C07</span>위협 해제 후 적응 <span style="color:var(--ac);font-size:8px">✦ 최초</span></div>
|
| 623 |
+
<div style="display:flex;gap:6px;align-items:center;font-size:9px;color:var(--text-sec)"><span style="font-family:var(--mono);font-weight:700;color:#d4a044;width:28px">C10</span>신체 교체 확장성 <span style="color:#d97706;font-size:8px">✦✦ 선행연구 無</span></div>
|
| 624 |
+
</div>
|
| 625 |
+
</div>
|
| 626 |
+
</div>
|
| 627 |
+
|
| 628 |
<!-- 10-category table -->
|
| 629 |
<div class="tw" style="margin-bottom:14px">
|
| 630 |
<table>
|
| 631 |
<thead>
|
| 632 |
<tr>
|
| 633 |
+
<th style="text-align:left;padding-left:12px;min-width:50px">Cat</th>
|
| 634 |
+
<th style="text-align:left;min-width:180px">카테고리 / 측정 내용</th>
|
| 635 |
<th style="text-align:left">Pillar</th>
|
| 636 |
+
<th style="text-align:center;min-width:70px">구분</th>
|
| 637 |
+
<th style="text-align:left;min-width:150px">기존 유사 지표</th>
|
| 638 |
+
<th style="text-align:center;min-width:100px">세계 최초?</th>
|
| 639 |
+
<th style="text-align:center">만점</th>
|
| 640 |
</tr>
|
| 641 |
</thead>
|
| 642 |
<tbody id="CAT_TABLE"></tbody>
|
|
|
|
| 722 |
</div>
|
| 723 |
</div>
|
| 724 |
|
| 725 |
+
|
| 726 |
+
|
| 727 |
<!-- ===== TAB: ABOUT ===== -->
|
| 728 |
<div id="about" class="tpane">
|
| 729 |
<div style="display:grid;grid-template-columns:repeat(auto-fill,minmax(260px,1fr));gap:10px">
|
|
|
|
| 737 |
</div>
|
| 738 |
<div class="card">
|
| 739 |
<h3>π VIDRAFT PROMETHEUS</h3>
|
| 740 |
+
<p>현재 기준점 (Baseline). 개방형 LLM 두뇌(어떤 LLM이든 연결 가능) + FloodDiffusion-VIDRAFT 모션. RTX5070 (local/16GB). 47 FPS. WM Score 726/1000 (B등급).</p>
|
| 741 |
</div>
|
| 742 |
<div class="card">
|
| 743 |
<h3>π λ²μ μ΄λ ₯</h3>
|
|
|
|
| 773 |
(function(){
|
| 774 |
/* ── Data ── */
|
| 775 |
/*
 * Leaderboard rows, one object per model.
 *
 * Fields as used by the renderers in this file:
 *   model/org/date  - display strings
 *   wm              - total WM score; null means "not yet evaluated"
 *   grade           - letter grade, or "?" for pending rows
 *   p1/p2/p3        - per-pillar subtotals; for every scored row wm === p1 + p2 + p3
 *   fps/lat         - reported throughput / latency, null when unknown
 *   track           - "A" or "C" for scored rows, "-" for pending rows
 *   est             - true when the scores are estimates rather than verified runs
 *   cats            - per-category scores C01..C10 (null for pending rows)
 *
 * NOTE(review): p1/p2/p3 are not always the plain sum of the matching cats
 * entries (e.g. PROMETHEUS C08+C09+C10 = 200 but p3 = 196) - presumably a
 * weighting is applied upstream; confirm before deriving one from the other.
 */
var LB_DATA = [
  // ── Track C · verified ──
  {model:"PROMETHEUS v1.0",org:"VIDRAFT",date:"2026-03",wm:726,grade:"B",p1:140,p2:390,p3:196,fps:47.0,lat:3100,track:"C",brain:"Any LLM (Open)",motion:"FloodDiffusion-VIDRAFT",gpu:"RTX5070 (local/16GB)",est:false,
   cats:{C01:65,C02:75,C03:85,C04:90,C05:85,C06:60,C07:70,C08:80,C09:85,C10:35}},

  // ── Track A · estimated · embodied / robotics ──
  {model:"Meta V-JEPA 2-AC",org:"Meta AI",date:"2025-06",wm:554,grade:"C",p1:200,p2:214,p3:140,fps:null,lat:null,track:"A",brain:"ViT-g (1.2B)",motion:"Latent JEPA",gpu:"Multi-A100",est:true,
   cats:{C01:82,C02:78,C03:88,C04:35,C05:5,C06:72,C07:38,C08:15,C09:70,C10:55}},
  {model:"Wayve GAIA-3",org:"Wayve",date:"2025-12",wm:550,grade:"C",p1:206,p2:221,p3:123,fps:null,lat:null,track:"A",brain:"Proprietary",motion:"Multi-cam Video",gpu:"H100 cluster",est:true,
   cats:{C01:85,C02:80,C03:82,C04:42,C05:8,C06:65,C07:48,C08:10,C09:68,C10:45}},
  {model:"NC AI WFM v1.0",org:"NC AI",date:"2026-03",wm:522,grade:"C",p1:150,p2:252,p3:120,fps:null,lat:null,track:"A",brain:"NC WFM",motion:"Latent-Action",gpu:"A100 (25% SOTA)",est:true,
   cats:{C01:74,C02:76,C03:70,C04:60,C05:22,C06:52,C07:48,C08:40,C09:65,C10:15}},
  {model:"NVIDIA Cosmos v1.0",org:"NVIDIA",date:"2025-01",wm:498,grade:"C",p1:158,p2:222,p3:118,fps:null,lat:null,track:"A",brain:"Cosmos Tokenizer",motion:"Video Diffusion",gpu:"H100 cluster",est:true,
   cats:{C01:78,C02:80,C03:72,C04:38,C05:8,C06:62,C07:42,C08:18,C09:72,C10:28}},
  {model:"NAVER LABS SWM",org:"NAVER LABS Europe",date:"2025-06",wm:470,grade:"C",p1:165,p2:198,p3:107,fps:null,lat:null,track:"A",brain:"Foundation Model",motion:"3D Navigation",gpu:"Research cluster",est:true,
   cats:{C01:80,C02:85,C03:72,C04:22,C05:5,C06:68,C07:35,C08:10,C09:62,C10:18}},
  {model:"DeepMind Genie 2",org:"Google DeepMind",date:"2024-12",wm:449,grade:"C",p1:179,p2:140,p3:130,fps:24,lat:null,track:"A",brain:"Foundation WM",motion:"3D Video Gen",gpu:"TPU v5",est:true,
   cats:{C01:75,C02:68,C03:60,C04:15,C05:5,C06:45,C07:30,C08:20,C09:72,C10:38}},
  {model:"DreamerV3 XL",org:"Google DeepMind",date:"2025-04",wm:441,grade:"C",p1:132,p2:229,p3:80,fps:null,lat:null,track:"A",brain:"RSSM (200M)",motion:"Latent Rollout",gpu:"A100",est:true,
   cats:{C01:70,C02:62,C03:80,C04:28,C05:6,C06:75,C07:40,C08:12,C09:60,C10:8}},

  // ── Track A · estimated · general / video ──
  {model:"OpenAI Sora 2",org:"OpenAI",date:"2025-09",wm:381,grade:"D",p1:175,p2:85,p3:121,fps:null,lat:null,track:"A",brain:"Diffusion Transformer",motion:"Video Diffusion",gpu:"Proprietary",est:true,
   cats:{C01:72,C02:68,C03:40,C04:10,C05:5,C06:25,C07:20,C08:35,C09:55,C10:31}},
  {model:"World Labs Marble",org:"World Labs",date:"2025-11",wm:362,grade:"D",p1:180,p2:72,p3:110,fps:null,lat:null,track:"A",brain:"Spatial Intelligence",motion:"3D Gen",gpu:"Proprietary",est:true,
   cats:{C01:88,C02:72,C03:35,C04:8,C05:5,C06:22,C07:18,C08:28,C09:60,C10:24}},
  {model:"UniSim",org:"Google Research",date:"2024-01",wm:338,grade:"D",p1:148,p2:118,p3:72,fps:null,lat:null,track:"A",brain:"Diffusion",motion:"Video Diffusion",gpu:"TPU",est:true,
   cats:{C01:72,C02:58,C03:58,C04:18,C05:4,C06:42,C07:22,C08:18,C09:48,C10:6}},
  {model:"DIAMOND v1.0",org:"EPFL",date:"2024-05",wm:312,grade:"D",p1:103,p2:138,p3:71,fps:null,lat:null,track:"A",brain:"DDPM Latent",motion:"Diffusion",gpu:"A100",est:true,
   cats:{C01:55,C02:48,C03:48,C04:20,C05:5,C06:35,C07:30,C08:25,C09:40,C10:6}},
  {model:"Oasis AI",org:"Decart / Etched",date:"2024-10",wm:285,grade:"D",p1:98,p2:98,p3:89,fps:20,lat:null,track:"A",brain:"Diffusion Transformer",motion:"Interactive Video",gpu:"Sohu chip",est:true,
   cats:{C01:50,C02:48,C03:42,C04:12,C05:4,C06:28,C07:18,C08:35,C09:48,C10:4}},

  // ── Not yet evaluated · name registered only (all scores null) ──
  {model:"DeepMind Genie 3",org:"Google DeepMind",date:"2025-08",wm:null,grade:"?",p1:null,p2:null,p3:null,fps:24,lat:null,track:"-",brain:"Foundation WM",motion:"3D Video Gen",gpu:"TPU v5",est:true,
   cats:{C01:null,C02:null,C03:null,C04:null,C05:null,C06:null,C07:null,C08:null,C09:null,C10:null}},
  {model:"Wayve GAIA-2",org:"Wayve",date:"2025-03",wm:null,grade:"?",p1:null,p2:null,p3:null,fps:null,lat:null,track:"-",brain:"Proprietary",motion:"Multi-cam Video",gpu:"H100 cluster",est:true,
   cats:{C01:null,C02:null,C03:null,C04:null,C05:null,C06:null,C07:null,C08:null,C09:null,C10:null}},
  {model:"Hyundai AI Robotics WM",org:"Hyundai Motor Group",date:"2026-01",wm:null,grade:"?",p1:null,p2:null,p3:null,fps:null,lat:null,track:"-",brain:"NVIDIA Omniverse",motion:"Humanoid",gpu:"AI Factory",est:true,
   cats:{C01:null,C02:null,C03:null,C04:null,C05:null,C06:null,C07:null,C08:null,C09:null,C10:null}},
  {model:"Odyssey-2",org:"Odyssey",date:"2025-12",wm:null,grade:"?",p1:null,p2:null,p3:null,fps:20,lat:40,track:"-",brain:"Causal Video Model",motion:"Interactive Video",gpu:"Proprietary",est:true,
   cats:{C01:null,C02:null,C03:null,C04:null,C05:null,C06:null,C07:null,C08:null,C09:null,C10:null}},
  // Model name restored from mis-decoded text ("Ο0" was the UTF-8 bytes of "π0").
  {model:"Physical Intelligence π0",org:"Physical Intelligence",date:"2024-10",wm:null,grade:"?",p1:null,p2:null,p3:null,fps:null,lat:null,track:"-",brain:"VLA Flow Model",motion:"Robot Dexterity",gpu:"Proprietary",est:true,
   cats:{C01:null,C02:null,C03:null,C04:null,C05:null,C06:null,C07:null,C08:null,C09:null,C10:null}},
  {model:"LG CLOiD VLA",org:"LG Electronics",date:"2025-12",wm:null,grade:"?",p1:null,p2:null,p3:null,fps:null,lat:null,track:"-",brain:"VLM+VLA",motion:"Household Robot",gpu:"Proprietary",est:true,
   cats:{C01:null,C02:null,C03:null,C04:null,C05:null,C06:null,C07:null,C08:null,C09:null,C10:null}},
  {model:"Runway GWM-1",org:"Runway",date:"2025-10",wm:null,grade:"?",p1:null,p2:null,p3:null,fps:null,lat:null,track:"-",brain:"Autoregressive",motion:"Real-time Video",gpu:"Proprietary",est:true,
   cats:{C01:null,C02:null,C03:null,C04:null,C05:null,C06:null,C07:null,C08:null,C09:null,C10:null}}
];
|
| 824 |
/*
 * The ten benchmark categories, in display order.
 *
 *   id      - category code C01..C10
 *   name    - Korean display name
 *   pillar  - owning pillar key (P1/P2/P3)
 *   max     - maximum points for the category
 *   score   - baseline score; the values equal the PROMETHEUS v1.0 `cats`
 *             entries in LB_DATA
 *   first   - novelty marker: "" / "✦" / "✦✦"
 *   type    - "existing" or "new"
 *   ref     - closest prior metric family (only set for "existing" rows)
 *   desc    - one-line Korean description
 *
 * NOTE(review): the Korean strings and the ✦/→ symbols were reconstructed
 * from mis-decoded text (several literals were also split across lines);
 * please proof-read against the authoritative copy.
 */
var CAT_DATA = [
  {id:"C01",name:"환경 인식 정확도",pillar:"P1",max:100,score:65,first:"",type:"existing",ref:"Occupancy Grid 계열",desc:"주변 벽·장애물·지형을 정확히 파악"},
  {id:"C02",name:"객체 인식 및 분류",pillar:"P1",max:100,score:75,first:"",type:"existing",ref:"BABEL 동작 인식 계열",desc:"NPC를 맹수/사람/환경으로 정확히 분류"},
  {id:"C03",name:"예측 기반 추론",pillar:"P2",max:100,score:85,first:"✦",type:"new",ref:"",desc:"4방향 미래 결과 예측 → 최적 선택"},
  {id:"C04",name:"위협 유형별 차별 반응",pillar:"P2",max:100,score:90,first:"✦",type:"new",ref:"",desc:"맹수→전력질주 vs 사람→걸어서 회피"},
  {id:"C05",name:"자율 감정 에스컬레이션",pillar:"P2",max:100,score:85,first:"✦✦",type:"new",ref:"",desc:"위협 지속 시 감정 자율 격화"},
  {id:"C06",name:"맥락 기억 및 활용",pillar:"P2",max:100,score:60,first:"✦",type:"new",ref:"",desc:"이전 실패 기억 → 다음 판단 반영"},
  {id:"C07",name:"위협 해제 후 적응",pillar:"P2",max:100,score:70,first:"✦",type:"new",ref:"",desc:"위협 소멸 후 서서히 정상화+경계"},
  {id:"C08",name:"모션 감정 표현력",pillar:"P3",max:100,score:80,first:"✦",type:"new",ref:"",desc:"판단 감정이 모션에 반영되는 풍부함"},
  {id:"C09",name:"실시간 인지-행동 성능",pillar:"P3",max:100,score:85,first:"",type:"existing",ref:"FVD 실시간성 계열",desc:"인지 루프 FPS + 지연시간"},
  {id:"C10",name:"신체 교체 확장성",pillar:"P3",max:100,score:35,first:"✦✦",type:"new",ref:"",desc:"동일 두뇌로 다른 신체(로봇/드론) 적용"}
];
|
| 836 |
/* Accent colour (hex) for each pillar, keyed by pillar id. */
var PC = {
  P1: "#7b8fd4",
  P2: "#e8593c",
  P3: "#d4a044"
};
|
| 837 |
|
|
|
|
| 850 |
+'<td class="c-model"><div class="mc"><div class="mn">'
|
| 851 |
+'<span style="display:inline-flex;align-items:center;justify-content:center;width:20px;height:20px;border-radius:6px;background:linear-gradient(135deg,#e8593c,#d4a044);color:#fff;font-size:9px;font-weight:800;flex-shrink:0">'+(i+1)+'</span>'
|
| 852 |
+r.model+(r.est?'<span style="font-size:8px;background:#444;color:#aaa;padding:1px 5px;border-radius:4px;margin-left:5px">est.</span>':'<span style="font-size:9px;color:#4caf50;margin-left:5px">β</span>')+'</div><div class="mp">'+r.org+' Β· '+r.date+'</div></div></td>'
|
| 853 |
+
+'<td>'+(r.wm!=null?scoreBar(r.wm,1000,'#e8593c'):'<div style="font-size:9px;color:var(--text-muted);font-family:var(--mono);padding:4px 8px">Pending</div>')+'</td>'
|
| 854 |
+
+'<td>'+(r.grade!='?'?'<span class="gr gr-'+r.grade+'">'+r.grade+'</span>':'<span style="font-size:9px;color:var(--text-muted);font-family:var(--mono)">β</span>')+'</td>'
|
| 855 |
+'<td class="p1-col">'+scoreBar(r.p1,200,PC.P1)+'</td>'
|
| 856 |
+'<td class="p2-col">'+scoreBar(r.p2,500,PC.P2)+'</td>'
|
| 857 |
+
+'<td class="p3-col">'+(r.p3!=null?scoreBar(r.p3,300,PC.P3):'<span style="color:var(--text-muted);font-size:9px">β</span>')+'</td>'
|
| 858 |
+'<td><span style="font-family:var(--mono);font-size:11px;font-weight:700">'+(r.fps!=null?r.fps:'β')+'</span></td>'
|
| 859 |
+'<td><span style="font-family:var(--mono);font-size:11px;font-weight:700">'+(r.lat!=null?r.lat.toLocaleString():'β')+'</span></td>'
|
| 860 |
+'<td><span class="tb tb-'+r.track+'">'+r.track+' β</span></td>'
|
|
|
|
| 865 |
}).join('');
|
| 866 |
}
|
| 867 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 868 |
function renderCatTable(){
|
| 869 |
var tb=$('CAT_TABLE'); if(!tb) return;
|
| 870 |
tb.innerHTML=CAT_DATA.map(function(c){
|
|
|
|
| 888 |
if(btn) btn.classList.add('on');
|
| 889 |
}
|
| 890 |
|
| 891 |
+
|
| 892 |
+
/**
 * Build the five Chart.js visualisations from the scored rows of LB_DATA:
 *   cBar       - horizontal bar of total WM score (sorted descending)
 *   cRadar     - radar of the three pillar percentages for the top five rows
 *   cCats      - grouped bars of the ten category scores for every scored row
 *   cCognition - bar of the P2 (cognition) subtotal, sorted descending
 *   cScatter   - perception % vs cognition % scatter
 *
 * Rows whose `wm` is null (not yet evaluated) are excluded from every chart.
 * Colours follow the `dark` class on <body> at call time.
 *
 * The function is a no-op when the Chart.js global is missing, skips any
 * chart whose <canvas> is absent, and destroys a chart already bound to a
 * canvas before re-creating it, so it can be called more than once.
 */
function initCharts(){
  // Chart.js comes from a separate <script>; without it there is nothing to draw.
  if (typeof Chart === 'undefined') return;

  var isDark = document.body.classList.contains('dark');
  var gridC = isDark ? 'rgba(255,255,255,.07)' : 'rgba(0,0,0,.06)';
  var tickC = isDark ? '#94a3b8' : '#64748b';
  var MONO = 'JetBrains Mono';
  var FALLBACK_COLOR = '#888';

  // Denominators used to turn pillar subtotals into percentages.
  // NOTE(review): renderLB draws the P1/P2 bars against 200/500 while the
  // charts use 250/450 - confirm which pillar maxima are authoritative.
  var P1_MAX = 250;
  var P2_MAX = 450;
  var P3_MAX = 300;

  // Fixed colour per model; models not listed fall back to grey.
  var MC = {
    'PROMETHEUS v1.0': '#e8593c',
    'Meta V-JEPA 2-AC': '#0d9488',
    'Wayve GAIA-3': '#d97706',
    'NC AI WFM v1.0': '#6366f1',
    'NVIDIA Cosmos v1.0': '#76b900',
    'DeepMind Genie 2': '#4285f4',
    'DreamerV3 XL': '#8b5cf6',
    'DIAMOND v1.0': '#ec4899'
  };

  function colorOf(r){ return MC[r.model] || FALLBACK_COLOR; }

  // Compact legend/axis name: drop the version/variant suffix, keep two words.
  function shorten(s){ return s.replace(' v1.0','').replace('-AC','').split(' ').slice(0,2).join(' '); }

  function pct(value, max){ return Math.round(value / max * 100); }

  function monoFont(size){ return {family: MONO, size: size}; }

  // Create a chart on the canvas with the given id, replacing any chart
  // already attached to it. Returns null when the canvas does not exist.
  function mount(id, config){
    var canvas = document.getElementById(id);
    if (!canvas) return null;
    var existing = typeof Chart.getChart === 'function' ? Chart.getChart(canvas) : null;
    if (existing) existing.destroy();
    return new Chart(canvas, config);
  }

  var scored = LB_DATA.filter(function(r){ return r.wm != null; });
  var sorted = scored.slice().sort(function(a, b){ return b.wm - a.wm; });

  // 1. Horizontal bar: total WM score. Verified rows get a check-mark prefix.
  mount('cBar', {
    type: 'bar',
    data: {
      labels: sorted.map(function(r){ return (r.est ? '' : '✓ ') + shorten(r.model); }),
      datasets: [{
        label: 'WM Score',
        data: sorted.map(function(r){ return r.wm; }),
        backgroundColor: sorted.map(function(r){ return colorOf(r) + 'bb'; }),
        borderColor: sorted.map(function(r){ return colorOf(r); }),
        borderWidth: 1.5, borderRadius: 6, borderSkipped: false
      }]
    },
    options: {
      indexAxis: 'y',
      plugins: {
        legend: {display: false},
        tooltip: {callbacks: {label: function(c){
          var r = sorted[c.dataIndex];
          return ' WM: ' + r.wm + '/1000 ' + r.grade + (r.est ? ' est.' : ' ✓');
        }}}
      },
      scales: {
        x: {min: 0, max: 1000, grid: {color: gridC}, ticks: {color: tickC, font: monoFont(9)}},
        y: {grid: {display: false}, ticks: {color: tickC, font: monoFont(8.5)}}
      }
    }
  });

  // 2. Radar: pillar percentages for the five highest WM scores.
  //    Estimated rows are drawn thinner and dashed.
  var top5 = sorted.slice(0, 5);
  mount('cRadar', {
    type: 'radar',
    data: {
      // NOTE(review): the Perception emoji was unrecoverable from the
      // mis-decoded source; "👁" is a best guess - confirm.
      labels: ['👁 Perception', '🧠 Cognition', '🔥 Embodiment'],
      datasets: top5.map(function(r){
        return {
          label: shorten(r.model),
          data: [pct(r.p1, P1_MAX), pct(r.p2, P2_MAX), pct(r.p3, P3_MAX)],
          borderColor: colorOf(r),
          backgroundColor: colorOf(r) + '1a',
          borderWidth: r.est ? 1.5 : 2.5,
          pointRadius: r.est ? 2 : 4,
          pointBackgroundColor: colorOf(r),
          borderDash: r.est ? [4, 3] : []
        };
      })
    },
    options: {
      plugins: {legend: {labels: {color: tickC, font: monoFont(8), boxWidth: 10, padding: 6}}},
      scales: {r: {
        grid: {color: gridC}, angleLines: {color: gridC},
        ticks: {display: false, backdropColor: 'transparent'},
        pointLabels: {color: tickC, font: monoFont(10)},
        suggestedMin: 0, suggestedMax: 100
      }}
    }
  });

  // 3. Category breakdown: one dataset per scored model, ten categories.
  var catK = ['C01','C02','C03','C04','C05','C06','C07','C08','C09','C10'];
  // Each label is an array so Chart.js renders it on two lines; a "\n"
  // inside a single string is not treated as a line break on canvas.
  var catL = [
    ['C01','환경인식'], ['C02','객체인식'], ['C03','예측추론'], ['C04','위협차별'],
    ['C05','감정에스컬'], ['C06','맥락기억'], ['C07','위협해제'], ['C08','모션표현'],
    ['C09','실시간'], ['C10','신체교체']
  ];
  mount('cCats', {
    type: 'bar',
    data: {
      labels: catL,
      datasets: sorted.map(function(r){
        return {
          label: shorten(r.model),
          data: catK.map(function(k){ return r.cats[k]; }),
          backgroundColor: colorOf(r) + '99',
          borderColor: colorOf(r),
          borderWidth: 1, borderRadius: 2
        };
      })
    },
    options: {
      plugins: {
        legend: {labels: {color: tickC, font: monoFont(7.5), boxWidth: 8, padding: 5}},
        tooltip: {callbacks: {label: function(c){
          return ' ' + sorted[c.datasetIndex].model + ': ' + c.raw + '/100';
        }}}
      },
      scales: {
        y: {min: 0, max: 100, grid: {color: gridC}, ticks: {color: tickC, font: monoFont(9)}},
        x: {grid: {display: false}, ticks: {color: tickC, font: monoFont(8), maxRotation: 0}}
      }
    }
  });

  // 4. Cognition gap: P2 subtotal per model, highest first.
  var cogS = scored.slice().sort(function(a, b){ return b.p2 - a.p2; });
  mount('cCognition', {
    type: 'bar',
    data: {
      labels: cogS.map(function(r){ return shorten(r.model); }),
      datasets: [{
        label: 'P2 Cognition',
        data: cogS.map(function(r){ return r.p2; }),
        backgroundColor: cogS.map(function(r){ return colorOf(r) + 'cc'; }),
        borderColor: cogS.map(function(r){ return colorOf(r); }),
        borderWidth: 1.5, borderRadius: 5, borderSkipped: false
      }]
    },
    options: {
      plugins: {
        legend: {display: false},
        tooltip: {callbacks: {label: function(c){
          return ' Cognition: ' + cogS[c.dataIndex].p2 + '/' + P2_MAX;
        }}}
      },
      scales: {
        y: {min: 0, max: P2_MAX, grid: {color: gridC}, ticks: {color: tickC, font: monoFont(9)}},
        x: {grid: {display: false}, ticks: {color: tickC, font: monoFont(8), maxRotation: 30}}
      }
    }
  });

  // 5. Scatter: perception % (x) against cognition % (y), one point per model.
  //    Verified rows are larger stars; estimated rows are circles.
  mount('cScatter', {
    type: 'scatter',
    data: {
      datasets: scored.map(function(r){
        return {
          label: shorten(r.model),
          data: [{x: pct(r.p1, P1_MAX), y: pct(r.p2, P2_MAX)}],
          backgroundColor: colorOf(r) + 'cc',
          borderColor: colorOf(r),
          pointRadius: r.est ? 7 : 10,
          pointStyle: r.est ? 'circle' : 'star',
          borderWidth: 1.5
        };
      })
    },
    options: {
      plugins: {
        legend: {labels: {color: tickC, font: monoFont(7.5), boxWidth: 8, padding: 5}},
        tooltip: {callbacks: {label: function(c){
          return c.dataset.label + ' — 인식:' + c.parsed.x + '% 인지:' + c.parsed.y + '%';
        }}}
      },
      scales: {
        x: {min: 0, max: 100, title: {display: true, text: 'Perception (%)', color: tickC, font: monoFont(9)}, grid: {color: gridC}, ticks: {color: tickC, font: monoFont(9)}},
        y: {min: 0, max: 100, title: {display: true, text: 'Cognition (%)', color: tickC, font: monoFont(9)}, grid: {color: gridC}, ticks: {color: tickC, font: monoFont(9)}}
      }
    }
  });
}
|
| 957 |
+
|
| 958 |
/* ── Event binding ── */
|
| 959 |
function bindEvents(){
|
| 960 |
/* ν */
|
|
|
|
| 985 |
/* ── Initialization (runs safely after DOM injection) ── */
|
| 986 |
/**
 * One-shot page bootstrap. Runs the four setup steps in a fixed order:
 * leaderboard table, category table, event handlers, then the charts.
 * Charts come last so the tables and handlers are already in place if
 * chart construction fails.
 */
function init(){
  renderLB();
  renderCatTable();
  bindEvents();
  initCharts();
}
|
| 992 |
|
| 993 |
/* Gradio gr.HTML() injects this markup after DOMContentLoaded, so run immediately */
|