{ "timestamp": "2026-03-02T22:55:43", "corpus": { "main_docs": 1, "noisy_articles": 50, "total_queries": 12, "answerable": 8, "unanswerable": 4 }, "baseline": { "config": "BASELINE", "retrieval_metrics": { "avg_MRR": 1.0, "avg_P@1": 1.0, "avg_P@5": 0.825, "avg_Recall@5": 1.0, "avg_Noise@5": 0.675, "avg_latency_ms": 76.2 }, "per_query": [ { "topic": "Inner planets", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.6, "latency_ms": 115.22539998986758 }, { "topic": "Jupiter's GRS", "answerable": true, "P@1": 1.0, "P@3": 0.3333333333333333, "P@5": 0.4, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.8, "latency_ms": 62.7888000162784 }, { "topic": "Photosynthesis", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.6, "latency_ms": 79.76240001153201 }, { "topic": "Water cycle", "answerable": true, "P@1": 1.0, "P@3": 0.6666666666666666, "P@5": 0.4, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.8, "latency_ms": 72.7103000099305 }, { "topic": "Mars atmosphere", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.6, "latency_ms": 74.54569998662919 }, { "topic": "Gas giants", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.8, "latency_ms": 66.27070001559332 }, { "topic": "Earth's ocean", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.4, "latency_ms": 69.69810000737198 }, { "topic": "Mars moons", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 0.8, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.8, "latency_ms": 68.9604000071995 }, { "topic": "Mars colonies (UNANS)", "answerable": false, "P@1": 0, "P@3": 0, "P@5": 0, "MRR": 0, "Recall@5": 0, "Noise@5": 0.8, "avg_score": 0.7802, "latency_ms": 65.06809999700636 }, { "topic": "Neptune rings (UNANS)", "answerable": false, "P@1": 0, "P@3": 0, "P@5": 0, "MRR": 0, "Recall@5": 0, "Noise@5": 0.6, "avg_score": 0.7181, "latency_ms": 73.1231999816373 }, { "topic": "Speed of light (UNANS)", "answerable": false, "P@1": 0, "P@3": 0, "P@5": 0, "MRR": 0, "Recall@5": 0, "Noise@5": 0.6, "avg_score": 0.8281, "latency_ms": 68.4973000024911 }, { "topic": "Andromeda planets (UNANS)", "answerable": false, "P@1": 0, "P@3": 0, "P@5": 0, "MRR": 0, "Recall@5": 0, "Noise@5": 0.6, "avg_score": 0.7707, "latency_ms": 69.7150000196416 } ] }, "improved": { "config": "IMPROVED", "retrieval_metrics": { "avg_MRR": 1.0, "avg_P@1": 1.0, "avg_P@5": 0.85, "avg_Recall@5": 1.0, "avg_Noise@5": 0.6, "avg_latency_ms": 414.9 }, "per_query": [ { "topic": "Inner planets", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.4, "latency_ms": 2133.6938999884296 }, { "topic": "Jupiter's GRS", "answerable": true, "P@1": 1.0, "P@3": 0.6666666666666666, "P@5": 0.4, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.6, "latency_ms": 164.43840001011267 }, { "topic": "Photosynthesis", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.6, "latency_ms": 175.91029999312013 }, { "topic": "Water cycle", "answerable": true, "P@1": 1.0, "P@3": 0.6666666666666666, "P@5": 0.4, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.8, "latency_ms": 175.35750000388362 }, { "topic": "Mars atmosphere", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.4, "latency_ms": 184.09689998952672 }, { "topic": "Gas giants", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.8, "latency_ms": 162.61590001522563 }, { "topic": "Earth's ocean", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.6, "latency_ms": 173.08269999921322 }, { "topic": "Mars moons", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.6, "latency_ms": 150.08699998725206 }, { "topic": "Mars colonies (UNANS)", "answerable": false, "P@1": 0, "P@3": 0, "P@5": 0, "MRR": 0, "Recall@5": 0, "Noise@5": 0.4, "avg_score": -10.4797, "latency_ms": 169.6016000059899 }, { "topic": "Neptune rings (UNANS)", "answerable": false, "P@1": 0, "P@3": 0, "P@5": 0, "MRR": 0, "Recall@5": 0, "Noise@5": 0.8, "avg_score": -7.7276, "latency_ms": 155.08669998962432 }, { "topic": "Speed of light (UNANS)", "answerable": false, "P@1": 0, "P@3": 0, "P@5": 0, "MRR": 0, "Recall@5": 0, "Noise@5": 0.8, "avg_score": -10.7558, "latency_ms": 151.54829999664798 }, { "topic": "Andromeda planets (UNANS)", "answerable": false, "P@1": 0, "P@3": 0, "P@5": 0, "MRR": 0, "Recall@5": 0, "Noise@5": 0.4, "avg_score": -5.8766, "latency_ms": 173.95070000202395 } ] }, "improved_expansion": { "config": "IMPROVED+EXPANSION", "retrieval_metrics": { "avg_MRR": 1.0, "avg_P@1": 1.0, "avg_P@5": 0.85, "avg_Recall@5": 1.0, "avg_Noise@5": 0.575, "avg_latency_ms": 1397.1 }, "per_query": [ { "topic": "Inner planets", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.2, "latency_ms": 1301.3575999939349 }, { "topic": "Jupiter's GRS", "answerable": true, "P@1": 1.0, "P@3": 0.6666666666666666, "P@5": 0.4, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.6, "latency_ms": 1181.4564999949653 }, { "topic": "Photosynthesis", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.6, "latency_ms": 1556.0503999877255 }, { "topic": "Water cycle", "answerable": true, "P@1": 1.0, "P@3": 0.6666666666666666, "P@5": 0.4, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.8, "latency_ms": 1384.7440000099596 }, { "topic": "Mars atmosphere", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.4, "latency_ms": 1248.011999996379 }, { "topic": "Gas giants", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.8, "latency_ms": 1367.9938999994192 }, { "topic": "Earth's ocean", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.6, "latency_ms": 1851.1549000104424 }, { "topic": "Mars moons", "answerable": true, "P@1": 1.0, "P@3": 1.0, "P@5": 1.0, "MRR": 1.0, "Recall@5": 1.0, "Noise@5": 0.6, "latency_ms": 1286.2794999964535 }, { "topic": "Mars colonies (UNANS)", "answerable": false, "P@1": 0, "P@3": 0, "P@5": 0, "MRR": 0, "Recall@5": 0, "Noise@5": 0.6, "avg_score": -10.4877, "latency_ms": 1852.3111999966204 }, { "topic": "Neptune rings (UNANS)", "answerable": false, "P@1": 0, "P@3": 0, "P@5": 0, "MRR": 0, "Recall@5": 0, "Noise@5": 0.6, "avg_score": -8.6497, "latency_ms": 1130.814600008307 }, { "topic": "Speed of light (UNANS)", "answerable": false, "P@1": 0, "P@3": 0, "P@5": 0, "MRR": 0, "Recall@5": 0, "Noise@5": 0.8, "avg_score": -10.7509, "latency_ms": 1104.37010001624 }, { "topic": "Andromeda planets (UNANS)", "answerable": false, "P@1": 0, "P@3": 0, "P@5": 0, "MRR": 0, "Recall@5": 0, "Noise@5": 0.4, "avg_score": -5.8766, "latency_ms": 1411.4279999921564 } ] }, "ragas": { "answer_relevancy": 0.833, "context_recall": 1.0, "faithfulness": 0.9688, "llm_context_precision_without_reference": 0.7431 } }