Spaces:
Running
Running
| { | |
| "timestamp": "2026-03-02T22:55:43", | |
| "corpus": { | |
| "main_docs": 1, | |
| "noisy_articles": 50, | |
| "total_queries": 12, | |
| "answerable": 8, | |
| "unanswerable": 4 | |
| }, | |
| "baseline": { | |
| "config": "BASELINE", | |
| "retrieval_metrics": { | |
| "avg_MRR": 1.0, | |
| "avg_P@1": 1.0, | |
| "avg_P@5": 0.825, | |
| "avg_Recall@5": 1.0, | |
| "avg_Noise@5": 0.675, | |
| "avg_latency_ms": 76.2 | |
| }, | |
| "per_query": [ | |
| { | |
| "topic": "Inner planets", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.6, | |
| "latency_ms": 115.22539998986758 | |
| }, | |
| { | |
| "topic": "Jupiter's GRS", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 0.3333333333333333, | |
| "P@5": 0.4, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.8, | |
| "latency_ms": 62.7888000162784 | |
| }, | |
| { | |
| "topic": "Photosynthesis", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.6, | |
| "latency_ms": 79.76240001153201 | |
| }, | |
| { | |
| "topic": "Water cycle", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 0.6666666666666666, | |
| "P@5": 0.4, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.8, | |
| "latency_ms": 72.7103000099305 | |
| }, | |
| { | |
| "topic": "Mars atmosphere", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.6, | |
| "latency_ms": 74.54569998662919 | |
| }, | |
| { | |
| "topic": "Gas giants", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.8, | |
| "latency_ms": 66.27070001559332 | |
| }, | |
| { | |
| "topic": "Earth's ocean", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.4, | |
| "latency_ms": 69.69810000737198 | |
| }, | |
| { | |
| "topic": "Mars moons", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 0.8, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.8, | |
| "latency_ms": 68.9604000071995 | |
| }, | |
| { | |
| "topic": "Mars colonies (UNANS)", | |
| "answerable": false, | |
| "P@1": 0, | |
| "P@3": 0, | |
| "P@5": 0, | |
| "MRR": 0, | |
| "Recall@5": 0, | |
| "Noise@5": 0.8, | |
| "avg_score": 0.7802, | |
| "latency_ms": 65.06809999700636 | |
| }, | |
| { | |
| "topic": "Neptune rings (UNANS)", | |
| "answerable": false, | |
| "P@1": 0, | |
| "P@3": 0, | |
| "P@5": 0, | |
| "MRR": 0, | |
| "Recall@5": 0, | |
| "Noise@5": 0.6, | |
| "avg_score": 0.7181, | |
| "latency_ms": 73.1231999816373 | |
| }, | |
| { | |
| "topic": "Speed of light (UNANS)", | |
| "answerable": false, | |
| "P@1": 0, | |
| "P@3": 0, | |
| "P@5": 0, | |
| "MRR": 0, | |
| "Recall@5": 0, | |
| "Noise@5": 0.6, | |
| "avg_score": 0.8281, | |
| "latency_ms": 68.4973000024911 | |
| }, | |
| { | |
| "topic": "Andromeda planets (UNANS)", | |
| "answerable": false, | |
| "P@1": 0, | |
| "P@3": 0, | |
| "P@5": 0, | |
| "MRR": 0, | |
| "Recall@5": 0, | |
| "Noise@5": 0.6, | |
| "avg_score": 0.7707, | |
| "latency_ms": 69.7150000196416 | |
| } | |
| ] | |
| }, | |
| "improved": { | |
| "config": "IMPROVED", | |
| "retrieval_metrics": { | |
| "avg_MRR": 1.0, | |
| "avg_P@1": 1.0, | |
| "avg_P@5": 0.85, | |
| "avg_Recall@5": 1.0, | |
| "avg_Noise@5": 0.6, | |
| "avg_latency_ms": 414.9 | |
| }, | |
| "per_query": [ | |
| { | |
| "topic": "Inner planets", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.4, | |
| "latency_ms": 2133.6938999884296 | |
| }, | |
| { | |
| "topic": "Jupiter's GRS", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 0.6666666666666666, | |
| "P@5": 0.4, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.6, | |
| "latency_ms": 164.43840001011267 | |
| }, | |
| { | |
| "topic": "Photosynthesis", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.6, | |
| "latency_ms": 175.91029999312013 | |
| }, | |
| { | |
| "topic": "Water cycle", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 0.6666666666666666, | |
| "P@5": 0.4, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.8, | |
| "latency_ms": 175.35750000388362 | |
| }, | |
| { | |
| "topic": "Mars atmosphere", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.4, | |
| "latency_ms": 184.09689998952672 | |
| }, | |
| { | |
| "topic": "Gas giants", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.8, | |
| "latency_ms": 162.61590001522563 | |
| }, | |
| { | |
| "topic": "Earth's ocean", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.6, | |
| "latency_ms": 173.08269999921322 | |
| }, | |
| { | |
| "topic": "Mars moons", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.6, | |
| "latency_ms": 150.08699998725206 | |
| }, | |
| { | |
| "topic": "Mars colonies (UNANS)", | |
| "answerable": false, | |
| "P@1": 0, | |
| "P@3": 0, | |
| "P@5": 0, | |
| "MRR": 0, | |
| "Recall@5": 0, | |
| "Noise@5": 0.4, | |
| "avg_score": -10.4797, | |
| "latency_ms": 169.6016000059899 | |
| }, | |
| { | |
| "topic": "Neptune rings (UNANS)", | |
| "answerable": false, | |
| "P@1": 0, | |
| "P@3": 0, | |
| "P@5": 0, | |
| "MRR": 0, | |
| "Recall@5": 0, | |
| "Noise@5": 0.8, | |
| "avg_score": -7.7276, | |
| "latency_ms": 155.08669998962432 | |
| }, | |
| { | |
| "topic": "Speed of light (UNANS)", | |
| "answerable": false, | |
| "P@1": 0, | |
| "P@3": 0, | |
| "P@5": 0, | |
| "MRR": 0, | |
| "Recall@5": 0, | |
| "Noise@5": 0.8, | |
| "avg_score": -10.7558, | |
| "latency_ms": 151.54829999664798 | |
| }, | |
| { | |
| "topic": "Andromeda planets (UNANS)", | |
| "answerable": false, | |
| "P@1": 0, | |
| "P@3": 0, | |
| "P@5": 0, | |
| "MRR": 0, | |
| "Recall@5": 0, | |
| "Noise@5": 0.4, | |
| "avg_score": -5.8766, | |
| "latency_ms": 173.95070000202395 | |
| } | |
| ] | |
| }, | |
| "improved_expansion": { | |
| "config": "IMPROVED+EXPANSION", | |
| "retrieval_metrics": { | |
| "avg_MRR": 1.0, | |
| "avg_P@1": 1.0, | |
| "avg_P@5": 0.85, | |
| "avg_Recall@5": 1.0, | |
| "avg_Noise@5": 0.575, | |
| "avg_latency_ms": 1397.1 | |
| }, | |
| "per_query": [ | |
| { | |
| "topic": "Inner planets", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.2, | |
| "latency_ms": 1301.3575999939349 | |
| }, | |
| { | |
| "topic": "Jupiter's GRS", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 0.6666666666666666, | |
| "P@5": 0.4, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.6, | |
| "latency_ms": 1181.4564999949653 | |
| }, | |
| { | |
| "topic": "Photosynthesis", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.6, | |
| "latency_ms": 1556.0503999877255 | |
| }, | |
| { | |
| "topic": "Water cycle", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 0.6666666666666666, | |
| "P@5": 0.4, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.8, | |
| "latency_ms": 1384.7440000099596 | |
| }, | |
| { | |
| "topic": "Mars atmosphere", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.4, | |
| "latency_ms": 1248.011999996379 | |
| }, | |
| { | |
| "topic": "Gas giants", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.8, | |
| "latency_ms": 1367.9938999994192 | |
| }, | |
| { | |
| "topic": "Earth's ocean", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.6, | |
| "latency_ms": 1851.1549000104424 | |
| }, | |
| { | |
| "topic": "Mars moons", | |
| "answerable": true, | |
| "P@1": 1.0, | |
| "P@3": 1.0, | |
| "P@5": 1.0, | |
| "MRR": 1.0, | |
| "Recall@5": 1.0, | |
| "Noise@5": 0.6, | |
| "latency_ms": 1286.2794999964535 | |
| }, | |
| { | |
| "topic": "Mars colonies (UNANS)", | |
| "answerable": false, | |
| "P@1": 0, | |
| "P@3": 0, | |
| "P@5": 0, | |
| "MRR": 0, | |
| "Recall@5": 0, | |
| "Noise@5": 0.6, | |
| "avg_score": -10.4877, | |
| "latency_ms": 1852.3111999966204 | |
| }, | |
| { | |
| "topic": "Neptune rings (UNANS)", | |
| "answerable": false, | |
| "P@1": 0, | |
| "P@3": 0, | |
| "P@5": 0, | |
| "MRR": 0, | |
| "Recall@5": 0, | |
| "Noise@5": 0.6, | |
| "avg_score": -8.6497, | |
| "latency_ms": 1130.814600008307 | |
| }, | |
| { | |
| "topic": "Speed of light (UNANS)", | |
| "answerable": false, | |
| "P@1": 0, | |
| "P@3": 0, | |
| "P@5": 0, | |
| "MRR": 0, | |
| "Recall@5": 0, | |
| "Noise@5": 0.8, | |
| "avg_score": -10.7509, | |
| "latency_ms": 1104.37010001624 | |
| }, | |
| { | |
| "topic": "Andromeda planets (UNANS)", | |
| "answerable": false, | |
| "P@1": 0, | |
| "P@3": 0, | |
| "P@5": 0, | |
| "MRR": 0, | |
| "Recall@5": 0, | |
| "Noise@5": 0.4, | |
| "avg_score": -5.8766, | |
| "latency_ms": 1411.4279999921564 | |
| } | |
| ] | |
| }, | |
| "ragas": { | |
| "answer_relevancy": 0.833, | |
| "context_recall": 1.0, | |
| "faithfulness": 0.9688, | |
| "llm_context_precision_without_reference": 0.7431 | |
| } | |
| } |