notebook_lm_clone / tmp_eval_results.json
Abhinav Biju
Deploying RAG pipeline changes (excluding binary data)
182e0fa
{
"timestamp": "2026-03-02T22:55:43",
"corpus": {
"main_docs": 1,
"noisy_articles": 50,
"total_queries": 12,
"answerable": 8,
"unanswerable": 4
},
"baseline": {
"config": "BASELINE",
"retrieval_metrics": {
"avg_MRR": 1.0,
"avg_P@1": 1.0,
"avg_P@5": 0.825,
"avg_Recall@5": 1.0,
"avg_Noise@5": 0.675,
"avg_latency_ms": 76.2
},
"per_query": [
{
"topic": "Inner planets",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.6,
"latency_ms": 115.22539998986758
},
{
"topic": "Jupiter's GRS",
"answerable": true,
"P@1": 1.0,
"P@3": 0.3333333333333333,
"P@5": 0.4,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.8,
"latency_ms": 62.7888000162784
},
{
"topic": "Photosynthesis",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.6,
"latency_ms": 79.76240001153201
},
{
"topic": "Water cycle",
"answerable": true,
"P@1": 1.0,
"P@3": 0.6666666666666666,
"P@5": 0.4,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.8,
"latency_ms": 72.7103000099305
},
{
"topic": "Mars atmosphere",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.6,
"latency_ms": 74.54569998662919
},
{
"topic": "Gas giants",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.8,
"latency_ms": 66.27070001559332
},
{
"topic": "Earth's ocean",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.4,
"latency_ms": 69.69810000737198
},
{
"topic": "Mars moons",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 0.8,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.8,
"latency_ms": 68.9604000071995
},
{
"topic": "Mars colonies (UNANS)",
"answerable": false,
"P@1": 0,
"P@3": 0,
"P@5": 0,
"MRR": 0,
"Recall@5": 0,
"Noise@5": 0.8,
"avg_score": 0.7802,
"latency_ms": 65.06809999700636
},
{
"topic": "Neptune rings (UNANS)",
"answerable": false,
"P@1": 0,
"P@3": 0,
"P@5": 0,
"MRR": 0,
"Recall@5": 0,
"Noise@5": 0.6,
"avg_score": 0.7181,
"latency_ms": 73.1231999816373
},
{
"topic": "Speed of light (UNANS)",
"answerable": false,
"P@1": 0,
"P@3": 0,
"P@5": 0,
"MRR": 0,
"Recall@5": 0,
"Noise@5": 0.6,
"avg_score": 0.8281,
"latency_ms": 68.4973000024911
},
{
"topic": "Andromeda planets (UNANS)",
"answerable": false,
"P@1": 0,
"P@3": 0,
"P@5": 0,
"MRR": 0,
"Recall@5": 0,
"Noise@5": 0.6,
"avg_score": 0.7707,
"latency_ms": 69.7150000196416
}
]
},
"improved": {
"config": "IMPROVED",
"retrieval_metrics": {
"avg_MRR": 1.0,
"avg_P@1": 1.0,
"avg_P@5": 0.85,
"avg_Recall@5": 1.0,
"avg_Noise@5": 0.6,
"avg_latency_ms": 414.9
},
"per_query": [
{
"topic": "Inner planets",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.4,
"latency_ms": 2133.6938999884296
},
{
"topic": "Jupiter's GRS",
"answerable": true,
"P@1": 1.0,
"P@3": 0.6666666666666666,
"P@5": 0.4,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.6,
"latency_ms": 164.43840001011267
},
{
"topic": "Photosynthesis",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.6,
"latency_ms": 175.91029999312013
},
{
"topic": "Water cycle",
"answerable": true,
"P@1": 1.0,
"P@3": 0.6666666666666666,
"P@5": 0.4,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.8,
"latency_ms": 175.35750000388362
},
{
"topic": "Mars atmosphere",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.4,
"latency_ms": 184.09689998952672
},
{
"topic": "Gas giants",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.8,
"latency_ms": 162.61590001522563
},
{
"topic": "Earth's ocean",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.6,
"latency_ms": 173.08269999921322
},
{
"topic": "Mars moons",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.6,
"latency_ms": 150.08699998725206
},
{
"topic": "Mars colonies (UNANS)",
"answerable": false,
"P@1": 0,
"P@3": 0,
"P@5": 0,
"MRR": 0,
"Recall@5": 0,
"Noise@5": 0.4,
"avg_score": -10.4797,
"latency_ms": 169.6016000059899
},
{
"topic": "Neptune rings (UNANS)",
"answerable": false,
"P@1": 0,
"P@3": 0,
"P@5": 0,
"MRR": 0,
"Recall@5": 0,
"Noise@5": 0.8,
"avg_score": -7.7276,
"latency_ms": 155.08669998962432
},
{
"topic": "Speed of light (UNANS)",
"answerable": false,
"P@1": 0,
"P@3": 0,
"P@5": 0,
"MRR": 0,
"Recall@5": 0,
"Noise@5": 0.8,
"avg_score": -10.7558,
"latency_ms": 151.54829999664798
},
{
"topic": "Andromeda planets (UNANS)",
"answerable": false,
"P@1": 0,
"P@3": 0,
"P@5": 0,
"MRR": 0,
"Recall@5": 0,
"Noise@5": 0.4,
"avg_score": -5.8766,
"latency_ms": 173.95070000202395
}
]
},
"improved_expansion": {
"config": "IMPROVED+EXPANSION",
"retrieval_metrics": {
"avg_MRR": 1.0,
"avg_P@1": 1.0,
"avg_P@5": 0.85,
"avg_Recall@5": 1.0,
"avg_Noise@5": 0.575,
"avg_latency_ms": 1397.1
},
"per_query": [
{
"topic": "Inner planets",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.2,
"latency_ms": 1301.3575999939349
},
{
"topic": "Jupiter's GRS",
"answerable": true,
"P@1": 1.0,
"P@3": 0.6666666666666666,
"P@5": 0.4,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.6,
"latency_ms": 1181.4564999949653
},
{
"topic": "Photosynthesis",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.6,
"latency_ms": 1556.0503999877255
},
{
"topic": "Water cycle",
"answerable": true,
"P@1": 1.0,
"P@3": 0.6666666666666666,
"P@5": 0.4,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.8,
"latency_ms": 1384.7440000099596
},
{
"topic": "Mars atmosphere",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.4,
"latency_ms": 1248.011999996379
},
{
"topic": "Gas giants",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.8,
"latency_ms": 1367.9938999994192
},
{
"topic": "Earth's ocean",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.6,
"latency_ms": 1851.1549000104424
},
{
"topic": "Mars moons",
"answerable": true,
"P@1": 1.0,
"P@3": 1.0,
"P@5": 1.0,
"MRR": 1.0,
"Recall@5": 1.0,
"Noise@5": 0.6,
"latency_ms": 1286.2794999964535
},
{
"topic": "Mars colonies (UNANS)",
"answerable": false,
"P@1": 0,
"P@3": 0,
"P@5": 0,
"MRR": 0,
"Recall@5": 0,
"Noise@5": 0.6,
"avg_score": -10.4877,
"latency_ms": 1852.3111999966204
},
{
"topic": "Neptune rings (UNANS)",
"answerable": false,
"P@1": 0,
"P@3": 0,
"P@5": 0,
"MRR": 0,
"Recall@5": 0,
"Noise@5": 0.6,
"avg_score": -8.6497,
"latency_ms": 1130.814600008307
},
{
"topic": "Speed of light (UNANS)",
"answerable": false,
"P@1": 0,
"P@3": 0,
"P@5": 0,
"MRR": 0,
"Recall@5": 0,
"Noise@5": 0.8,
"avg_score": -10.7509,
"latency_ms": 1104.37010001624
},
{
"topic": "Andromeda planets (UNANS)",
"answerable": false,
"P@1": 0,
"P@3": 0,
"P@5": 0,
"MRR": 0,
"Recall@5": 0,
"Noise@5": 0.4,
"avg_score": -5.8766,
"latency_ms": 1411.4279999921564
}
]
},
"ragas": {
"answer_relevancy": 0.833,
"context_recall": 1.0,
"faithfulness": 0.9688,
"llm_context_precision_without_reference": 0.7431
}
}