Spaces:
Running
Running
Update benchmarks with LoRA-bev-v9 results (May 2026)
Browse files- index.html +12 -12
index.html
CHANGED
|
@@ -329,7 +329,7 @@ const SECTIONS = [
|
|
| 329 |
{
|
| 330 |
title: "Synonym Recognition",
|
| 331 |
metric: "Recall@5",
|
| 332 |
-
scores: { dish_embed: 0.
|
| 333 |
},
|
| 334 |
{
|
| 335 |
title: "Cuisine Classification (19 cuisines)",
|
|
@@ -346,22 +346,22 @@ const SECTIONS = [
|
|
| 346 |
{
|
| 347 |
title: "Category Search",
|
| 348 |
metric: "NDCG@10",
|
| 349 |
-
scores: { dish_embed: 0.
|
| 350 |
},
|
| 351 |
{
|
| 352 |
title: "Typo-Tolerant Search",
|
| 353 |
metric: "NDCG@10",
|
| 354 |
-
scores: { dish_embed: 0.
|
| 355 |
},
|
| 356 |
{
|
| 357 |
title: "Food Search",
|
| 358 |
metric: "NDCG@10",
|
| 359 |
-
scores: { dish_embed: 0.
|
| 360 |
},
|
| 361 |
{
|
| 362 |
title: "Global Search",
|
| 363 |
metric: "NDCG@10",
|
| 364 |
-
scores: { dish_embed: 0.
|
| 365 |
}
|
| 366 |
]
|
| 367 |
},
|
|
@@ -374,22 +374,22 @@ const SECTIONS = [
|
|
| 374 |
{
|
| 375 |
title: "Indian Cuisine Matching",
|
| 376 |
metric: "F1",
|
| 377 |
-
scores: { dish_embed: 0.
|
| 378 |
},
|
| 379 |
{
|
| 380 |
title: "Cross-Language Matching",
|
| 381 |
metric: "F1",
|
| 382 |
-
scores: { dish_embed: 0.
|
| 383 |
},
|
| 384 |
{
|
| 385 |
title: "Bakery & Dessert Matching",
|
| 386 |
metric: "F1",
|
| 387 |
-
scores: { dish_embed: 0.
|
| 388 |
},
|
| 389 |
{
|
| 390 |
title: "Beverage Matching",
|
| 391 |
metric: "F1",
|
| 392 |
-
scores: { dish_embed: 0.
|
| 393 |
},
|
| 394 |
]
|
| 395 |
},
|
|
@@ -402,19 +402,19 @@ const SECTIONS = [
|
|
| 402 |
title: "Portion Size Sensitivity",
|
| 403 |
metric: "F1",
|
| 404 |
mode: "collapsed",
|
| 405 |
-
scores: { dish_embed: 0.
|
| 406 |
},
|
| 407 |
{
|
| 408 |
title: "Noisy Menu Matching",
|
| 409 |
metric: "F1",
|
| 410 |
mode: "collapsed",
|
| 411 |
-
scores: { dish_embed: 0.
|
| 412 |
},
|
| 413 |
{
|
| 414 |
title: "Bilingual Menu Matching",
|
| 415 |
metric: "F1",
|
| 416 |
mode: "collapsed",
|
| 417 |
-
scores: { dish_embed: 0.
|
| 418 |
},
|
| 419 |
{
|
| 420 |
title: "Embedding Stability",
|
|
|
|
| 329 |
{
|
| 330 |
title: "Synonym Recognition",
|
| 331 |
metric: "Recall@5",
|
| 332 |
+
scores: { dish_embed: 0.835, openai: 0.749, bge_m3: 0.707, qwen3: 0.514, e5_large: 0.661 }
|
| 333 |
},
|
| 334 |
{
|
| 335 |
title: "Cuisine Classification (19 cuisines)",
|
|
|
|
| 346 |
{
|
| 347 |
title: "Category Search",
|
| 348 |
metric: "NDCG@10",
|
| 349 |
+
scores: { dish_embed: 0.856, openai: 0.797, bge_m3: 0.759, qwen3: 0.802, e5_large: 0.799 }
|
| 350 |
},
|
| 351 |
{
|
| 352 |
title: "Typo-Tolerant Search",
|
| 353 |
metric: "NDCG@10",
|
| 354 |
+
scores: { dish_embed: 0.910, openai: 0.884, bge_m3: 0.902, qwen3: 0.892, e5_large: 0.907 }
|
| 355 |
},
|
| 356 |
{
|
| 357 |
title: "Food Search",
|
| 358 |
metric: "NDCG@10",
|
| 359 |
+
scores: { dish_embed: 0.944, openai: 0.925, bge_m3: 0.929, qwen3: 0.935, e5_large: 0.939 }
|
| 360 |
},
|
| 361 |
{
|
| 362 |
title: "Global Search",
|
| 363 |
metric: "NDCG@10",
|
| 364 |
+
scores: { dish_embed: 0.900, openai: 0.839, bge_m3: 0.886, qwen3: 0.875, e5_large: 0.860 }
|
| 365 |
}
|
| 366 |
]
|
| 367 |
},
|
|
|
|
| 374 |
{
|
| 375 |
title: "Indian Cuisine Matching",
|
| 376 |
metric: "F1",
|
| 377 |
+
scores: { dish_embed: 0.919, off_shelf: 0.754 }
|
| 378 |
},
|
| 379 |
{
|
| 380 |
title: "Cross-Language Matching",
|
| 381 |
metric: "F1",
|
| 382 |
+
scores: { dish_embed: 0.844, off_shelf: 0.258 }
|
| 383 |
},
|
| 384 |
{
|
| 385 |
title: "Bakery & Dessert Matching",
|
| 386 |
metric: "F1",
|
| 387 |
+
scores: { dish_embed: 0.783, off_shelf: 0.655 }
|
| 388 |
},
|
| 389 |
{
|
| 390 |
title: "Beverage Matching",
|
| 391 |
metric: "F1",
|
| 392 |
+
scores: { dish_embed: 0.744, off_shelf: 0.648 }
|
| 393 |
},
|
| 394 |
]
|
| 395 |
},
|
|
|
|
| 402 |
title: "Portion Size Sensitivity",
|
| 403 |
metric: "F1",
|
| 404 |
mode: "collapsed",
|
| 405 |
+
scores: { dish_embed: 0.885, off_shelf: 0.082 }
|
| 406 |
},
|
| 407 |
{
|
| 408 |
title: "Noisy Menu Matching",
|
| 409 |
metric: "F1",
|
| 410 |
mode: "collapsed",
|
| 411 |
+
scores: { dish_embed: 0.926, off_shelf: 0.914 }
|
| 412 |
},
|
| 413 |
{
|
| 414 |
title: "Bilingual Menu Matching",
|
| 415 |
metric: "F1",
|
| 416 |
mode: "collapsed",
|
| 417 |
+
scores: { dish_embed: 0.907, off_shelf: 0.879 }
|
| 418 |
},
|
| 419 |
{
|
| 420 |
title: "Embedding Stability",
|