Spaces:
Running
Running
Sync leaderboard: EOG + EVA 2026-06-10
Browse files
evaAccuracy:
old: Scribe v2.2 Realtime + GPT-5.4 + Eleven Flash v2 (ElevenAgents)=0.67, Nova 3 + GPT-5.4 + Sonic 3=0.5, GPT Realtime 2=0.5
new: Scribe v2.2 Realtime + GPT-5.4 + Eleven Flash v2 (ElevenAgents)=0.67, Grok Voice Think Fast 1.0=0.59, Nova 3 + GPT-5.4 + Sonic 3=0.5
evaExperience:
old: Scribe v2.2 Realtime + Claude Haiku 4.5 + Eleven Flash v2 (ElevenAgents)=0.82, Gemini 3.1 Flash Live=0.59, GPT Realtime 1.5=0.57
new: Scribe v2.2 Realtime + Claude Haiku 4.5 + Eleven Flash v2 (ElevenAgents)=0.82, Gemini 3.1 Flash Live=0.59, Grok Voice Think Fast 1.0=0.57
- data/leaderboard.json +17 -17
data/leaderboard.json
CHANGED
|
@@ -1,15 +1,15 @@
|
|
| 1 |
{
|
| 2 |
-
"updated": "2026-06-
|
| 3 |
"sources": {
|
| 4 |
"eog": {
|
| 5 |
"url": "https://raw.githubusercontent.com/EnterpriseOps-Gym/EnterpriseOps-Gym.github.io/main/script.js",
|
| 6 |
-
"hash": "sha256:
|
| 7 |
-
"fetchedAt": "2026-06-
|
| 8 |
},
|
| 9 |
"eva": {
|
| 10 |
"url": "https://raw.githubusercontent.com/ServiceNow/eva/main/website/src/data/leaderboardStats.json",
|
| 11 |
-
"hash": "sha256:
|
| 12 |
-
"fetchedAt": "2026-06-
|
| 13 |
}
|
| 14 |
},
|
| 15 |
"eog": {
|
|
@@ -71,20 +71,20 @@
|
|
| 71 |
},
|
| 72 |
{
|
| 73 |
"rank": 2,
|
| 74 |
-
"name": "
|
| 75 |
-
"subtitle": "
|
| 76 |
-
"score": 0.
|
| 77 |
-
"ciLower": 0.
|
| 78 |
-
"ciUpper": 0.
|
| 79 |
-
"bar":
|
| 80 |
},
|
| 81 |
{
|
| 82 |
"rank": 3,
|
| 83 |
-
"name": "GPT
|
| 84 |
-
"subtitle": "
|
| 85 |
"score": 0.5,
|
| 86 |
"ciLower": 0.46,
|
| 87 |
-
"ciUpper": 0.
|
| 88 |
"bar": 50
|
| 89 |
}
|
| 90 |
]
|
|
@@ -112,11 +112,11 @@
|
|
| 112 |
},
|
| 113 |
{
|
| 114 |
"rank": 3,
|
| 115 |
-
"name": "
|
| 116 |
-
"subtitle": "
|
| 117 |
"score": 0.57,
|
| 118 |
"ciLower": 0.53,
|
| 119 |
-
"ciUpper": 0.
|
| 120 |
"bar": 57
|
| 121 |
}
|
| 122 |
]
|
|
|
|
| 1 |
{
|
| 2 |
+
"updated": "2026-06-10T18:19:04.013Z",
|
| 3 |
"sources": {
|
| 4 |
"eog": {
|
| 5 |
"url": "https://raw.githubusercontent.com/EnterpriseOps-Gym/EnterpriseOps-Gym.github.io/main/script.js",
|
| 6 |
+
"hash": "sha256:f96e11145e82ffd4bb2654a9e7cf42f5ebd3b10f481aa1027be22a0d3a1badba",
|
| 7 |
+
"fetchedAt": "2026-06-10T18:19:04.012Z"
|
| 8 |
},
|
| 9 |
"eva": {
|
| 10 |
"url": "https://raw.githubusercontent.com/ServiceNow/eva/main/website/src/data/leaderboardStats.json",
|
| 11 |
+
"hash": "sha256:1f7a33021ffea8a3719c24cf31f75cfeff4b0271f77ef8abfd0063099081b288",
|
| 12 |
+
"fetchedAt": "2026-06-10T18:19:04.013Z"
|
| 13 |
}
|
| 14 |
},
|
| 15 |
"eog": {
|
|
|
|
| 71 |
},
|
| 72 |
{
|
| 73 |
"rank": 2,
|
| 74 |
+
"name": "Grok Voice Think Fast 1.0",
|
| 75 |
+
"subtitle": "Grok 路 Speech-to-Speech",
|
| 76 |
+
"score": 0.59,
|
| 77 |
+
"ciLower": 0.54,
|
| 78 |
+
"ciUpper": 0.64,
|
| 79 |
+
"bar": 59
|
| 80 |
},
|
| 81 |
{
|
| 82 |
"rank": 3,
|
| 83 |
+
"name": "Nova 3 + GPT-5.4 + Sonic 3",
|
| 84 |
+
"subtitle": "Mixed Models 路 Cascade",
|
| 85 |
"score": 0.5,
|
| 86 |
"ciLower": 0.46,
|
| 87 |
+
"ciUpper": 0.54,
|
| 88 |
"bar": 50
|
| 89 |
}
|
| 90 |
]
|
|
|
|
| 112 |
},
|
| 113 |
{
|
| 114 |
"rank": 3,
|
| 115 |
+
"name": "Grok Voice Think Fast 1.0",
|
| 116 |
+
"subtitle": "Grok 路 Speech-to-Speech",
|
| 117 |
"score": 0.57,
|
| 118 |
"ciLower": 0.53,
|
| 119 |
+
"ciUpper": 0.61,
|
| 120 |
"bar": 57
|
| 121 |
}
|
| 122 |
]
|