import pytest import os from rag.vectorstore import build_vectorstore import rag.vectorstore from langchain_core.embeddings import Embeddings from typing import List os.environ["OPENAI_API_KEY"] = "dummy_key" class MockEmbedding(Embeddings): def embed_documents(self, texts: List[str]) -> List[List[float]]: return [[0.0] * 1536 for _ in texts] def embed_query(self, text: str) -> List[float]: return [0.0] * 1536 def test_rag_pipeline_loads_and_retrieves(mocker, tmp_path): kb_file = tmp_path / "knowledge_base.md" kb_file.write_text(""" # AutoStream Pricing & Features ## Pro Plan * $79/month * Unlimited videos * 4K resolution * AI captions included """) mocker.patch('rag.vectorstore.get_embeddings', return_value=MockEmbedding()) vs = build_vectorstore(str(kb_file)) assert vs is not None mocker.patch('rag.retriever.get_vectorstore', return_value=vs) from rag.retriever import retrieve_documents docs = retrieve_documents("What does the Pro plan cost?", k=1) assert len(docs) > 0 assert "AutoStream" in docs[0] or "Pro Plan" in docs[0] or "$79/month" in docs[0]