adityapatni committed on
Commit
d77fe58
·
verified ·
1 Parent(s): 9d0d2b8

Update benchmarks with LoRA-bev-v9 results (May 2026)

Browse files
Files changed (1) hide show
  1. index.html +12 -12
index.html CHANGED
@@ -329,7 +329,7 @@ const SECTIONS = [
329
  {
330
  title: "Synonym Recognition",
331
  metric: "Recall@5",
332
- scores: { dish_embed: 0.808, openai: 0.749, bge_m3: 0.707, qwen3: 0.514, e5_large: 0.661 }
333
  },
334
  {
335
  title: "Cuisine Classification (19 cuisines)",
@@ -346,22 +346,22 @@ const SECTIONS = [
346
  {
347
  title: "Category Search",
348
  metric: "NDCG@10",
349
- scores: { dish_embed: 0.828, openai: 0.797, bge_m3: 0.759, qwen3: 0.802, e5_large: 0.799 }
350
  },
351
  {
352
  title: "Typo-Tolerant Search",
353
  metric: "NDCG@10",
354
- scores: { dish_embed: 0.920, openai: 0.884, bge_m3: 0.902, qwen3: 0.892, e5_large: 0.907 }
355
  },
356
  {
357
  title: "Food Search",
358
  metric: "NDCG@10",
359
- scores: { dish_embed: 0.943, openai: 0.925, bge_m3: 0.929, qwen3: 0.935, e5_large: 0.939 }
360
  },
361
  {
362
  title: "Global Search",
363
  metric: "NDCG@10",
364
- scores: { dish_embed: 0.891, openai: 0.839, bge_m3: 0.886, qwen3: 0.875, e5_large: 0.860 }
365
  }
366
  ]
367
  },
@@ -374,22 +374,22 @@ const SECTIONS = [
374
  {
375
  title: "Indian Cuisine Matching",
376
  metric: "F1",
377
- scores: { dish_embed: 0.916, off_shelf: 0.754 }
378
  },
379
  {
380
  title: "Cross-Language Matching",
381
  metric: "F1",
382
- scores: { dish_embed: 0.831, off_shelf: 0.258 }
383
  },
384
  {
385
  title: "Bakery & Dessert Matching",
386
  metric: "F1",
387
- scores: { dish_embed: 0.797, off_shelf: 0.655 }
388
  },
389
  {
390
  title: "Beverage Matching",
391
  metric: "F1",
392
- scores: { dish_embed: 0.747, off_shelf: 0.648 }
393
  },
394
  ]
395
  },
@@ -402,19 +402,19 @@ const SECTIONS = [
402
  title: "Portion Size Sensitivity",
403
  metric: "F1",
404
  mode: "collapsed",
405
- scores: { dish_embed: 0.877, off_shelf: 0.082 }
406
  },
407
  {
408
  title: "Noisy Menu Matching",
409
  metric: "F1",
410
  mode: "collapsed",
411
- scores: { dish_embed: 0.922, off_shelf: 0.914 }
412
  },
413
  {
414
  title: "Bilingual Menu Matching",
415
  metric: "F1",
416
  mode: "collapsed",
417
- scores: { dish_embed: 0.886, off_shelf: 0.879 }
418
  },
419
  {
420
  title: "Embedding Stability",
 
329
  {
330
  title: "Synonym Recognition",
331
  metric: "Recall@5",
332
+ scores: { dish_embed: 0.835, openai: 0.749, bge_m3: 0.707, qwen3: 0.514, e5_large: 0.661 }
333
  },
334
  {
335
  title: "Cuisine Classification (19 cuisines)",
 
346
  {
347
  title: "Category Search",
348
  metric: "NDCG@10",
349
+ scores: { dish_embed: 0.856, openai: 0.797, bge_m3: 0.759, qwen3: 0.802, e5_large: 0.799 }
350
  },
351
  {
352
  title: "Typo-Tolerant Search",
353
  metric: "NDCG@10",
354
+ scores: { dish_embed: 0.910, openai: 0.884, bge_m3: 0.902, qwen3: 0.892, e5_large: 0.907 }
355
  },
356
  {
357
  title: "Food Search",
358
  metric: "NDCG@10",
359
+ scores: { dish_embed: 0.944, openai: 0.925, bge_m3: 0.929, qwen3: 0.935, e5_large: 0.939 }
360
  },
361
  {
362
  title: "Global Search",
363
  metric: "NDCG@10",
364
+ scores: { dish_embed: 0.900, openai: 0.839, bge_m3: 0.886, qwen3: 0.875, e5_large: 0.860 }
365
  }
366
  ]
367
  },
 
374
  {
375
  title: "Indian Cuisine Matching",
376
  metric: "F1",
377
+ scores: { dish_embed: 0.919, off_shelf: 0.754 }
378
  },
379
  {
380
  title: "Cross-Language Matching",
381
  metric: "F1",
382
+ scores: { dish_embed: 0.844, off_shelf: 0.258 }
383
  },
384
  {
385
  title: "Bakery & Dessert Matching",
386
  metric: "F1",
387
+ scores: { dish_embed: 0.783, off_shelf: 0.655 }
388
  },
389
  {
390
  title: "Beverage Matching",
391
  metric: "F1",
392
+ scores: { dish_embed: 0.744, off_shelf: 0.648 }
393
  },
394
  ]
395
  },
 
402
  title: "Portion Size Sensitivity",
403
  metric: "F1",
404
  mode: "collapsed",
405
+ scores: { dish_embed: 0.885, off_shelf: 0.082 }
406
  },
407
  {
408
  title: "Noisy Menu Matching",
409
  metric: "F1",
410
  mode: "collapsed",
411
+ scores: { dish_embed: 0.926, off_shelf: 0.914 }
412
  },
413
  {
414
  title: "Bilingual Menu Matching",
415
  metric: "F1",
416
  mode: "collapsed",
417
+ scores: { dish_embed: 0.907, off_shelf: 0.879 }
418
  },
419
  {
420
  title: "Embedding Stability",