Spaces:
Sleeping
Sleeping
Neural Arun
Identity Expansion: Integrated massive ArunCore documentation and master portfolio summary into live Vector DB
97f4848 | { | |
| "summary": { | |
| "total_questions": 30, | |
| "retrieval_accuracy": "83.33%", | |
| "generation_accuracy": "16.67%" | |
| }, | |
| "details": [ | |
| { | |
| "id": "eval_001", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "RAG Pipelines", | |
| "Autonomous Agents", | |
| "Data Scrapers" | |
| ] | |
| }, | |
| { | |
| "id": "eval_002", | |
| "retrieval": "PASS", | |
| "generation": "PASS", | |
| "missing": [] | |
| }, | |
| { | |
| "id": "eval_003", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Solving High-ROI bottlenecks", | |
| "Building scalable AI systems" | |
| ] | |
| }, | |
| { | |
| "id": "eval_004", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Non-linear path", | |
| "NEET/JEE background" | |
| ] | |
| }, | |
| { | |
| "id": "eval_005", | |
| "retrieval": "PASS", | |
| "generation": "PASS", | |
| "missing": [] | |
| }, | |
| { | |
| "id": "eval_006", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Accelerated independent learning", | |
| "Build-first execution" | |
| ] | |
| }, | |
| { | |
| "id": "eval_007", | |
| "retrieval": "FAIL", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Exact-reference routing" | |
| ] | |
| }, | |
| { | |
| "id": "eval_008", | |
| "retrieval": "FAIL", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Document-aware structural chunking" | |
| ] | |
| }, | |
| { | |
| "id": "eval_009", | |
| "retrieval": "FAIL", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Destroys structural boundary", | |
| "Context loss", | |
| "Section integrity" | |
| ] | |
| }, | |
| { | |
| "id": "eval_010", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Data privacy", | |
| "No cloud exposure for legal docs" | |
| ] | |
| }, | |
| { | |
| "id": "eval_011", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Structured CSV export" | |
| ] | |
| }, | |
| { | |
| "id": "eval_012", | |
| "retrieval": "PASS", | |
| "generation": "PASS", | |
| "missing": [] | |
| }, | |
| { | |
| "id": "eval_013", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Obfuscated CSS classes" | |
| ] | |
| }, | |
| { | |
| "id": "eval_014", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "asyncio.Semaphore", | |
| "Throttling" | |
| ] | |
| }, | |
| { | |
| "id": "eval_015", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Digital twin", | |
| "Tool-calling loop" | |
| ] | |
| }, | |
| { | |
| "id": "eval_016", | |
| "retrieval": "FAIL", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Graceful degradation" | |
| ] | |
| }, | |
| { | |
| "id": "eval_017", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "No code redeployment needed", | |
| "Separation of identity data" | |
| ] | |
| }, | |
| { | |
| "id": "eval_018", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Graceful fallback", | |
| "Returns 'I do not have information regarding this'", | |
| "Zero hallucination" | |
| ] | |
| }, | |
| { | |
| "id": "eval_019", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Democratizing value" | |
| ] | |
| }, | |
| { | |
| "id": "eval_020", | |
| "retrieval": "FAIL", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Daily-use utility" | |
| ] | |
| }, | |
| { | |
| "id": "eval_021", | |
| "retrieval": "PASS", | |
| "generation": "PASS", | |
| "missing": [] | |
| }, | |
| { | |
| "id": "eval_022", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Distributed crawler systems" | |
| ] | |
| }, | |
| { | |
| "id": "eval_023", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Avoids brittle wrappers", | |
| "Engineers robust solutions", | |
| "Systems engineering" | |
| ] | |
| }, | |
| { | |
| "id": "eval_024", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Series-prefix grouping" | |
| ] | |
| }, | |
| { | |
| "id": "eval_025", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "High accuracy over OCR" | |
| ] | |
| }, | |
| { | |
| "id": "eval_026", | |
| "retrieval": "PASS", | |
| "generation": "PASS", | |
| "missing": [] | |
| }, | |
| { | |
| "id": "eval_027", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Strictly minimal" | |
| ] | |
| }, | |
| { | |
| "id": "eval_028", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Polite refusal", | |
| "Out of bounds", | |
| "No hallucination" | |
| ] | |
| }, | |
| { | |
| "id": "eval_029", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Prayagraj, UP, India", | |
| "No exact address provided" | |
| ] | |
| }, | |
| { | |
| "id": "eval_030", | |
| "retrieval": "PASS", | |
| "generation": "FAIL", | |
| "missing": [ | |
| "Backend focused", | |
| "Python, FastAPI", | |
| "AI integrations", | |
| "Does not do frontend/Next.js currently" | |
| ] | |
| } | |
| ] | |
| } |