File size: 1,013 Bytes
cf71c95 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 |
import pytest
import pandas as pd
from langchain.schema import Document
from app.processor import summarize # Adjust this import path as needed
@pytest.fixture
def dummy_pages():
    """Return two sample ``Document`` pages that share one source file.

    The pages carry ``metadata["page"]`` values 1 and 2, in that order, and
    both use ``"sample_paper.pdf"`` as ``metadata["source"]``.
    """
    source_name = "sample_paper.pdf"
    page_texts = (
        "LangChain is a framework for developing LLM-based applications.",
        "It provides utilities for prompt management, chains, and agents.",
    )
    # Page numbers are 1-based and follow the order of the texts above.
    return [
        Document(
            page_content=text,
            metadata={"source": source_name, "page": page_number},
        )
        for page_number, text in enumerate(page_texts, start=1)
    ]
def test_summarize_documents_returns_dataframe(dummy_pages):
    """Check that summarizing the sample pages yields a well-formed DataFrame.

    Verifies that the result is a ``pandas.DataFrame``, that it exposes the
    ``file_name``, ``page_number``, ``chunks`` and ``concise_summary``
    columns, that it has one row per input page, and that the first row's
    ``page_number`` is 1.

    Args:
        dummy_pages: The list of sample ``Document`` pages supplied by the
            ``dummy_pages`` fixture.
    """
    # This module imports `summarize` from app.processor. The earlier call to
    # `summarize_documents` used a name that was never brought into scope and
    # raised NameError before any assertion could run.
    # NOTE(review): if app.processor actually exports `summarize_documents`,
    # change the import at the top of the file instead -- confirm.
    summary_df = summarize(dummy_pages)

    assert isinstance(summary_df, pd.DataFrame)

    # Check every required column at once so a failure names all missing ones.
    expected_columns = {"file_name", "page_number", "chunks", "concise_summary"}
    missing_columns = expected_columns - set(summary_df.columns)
    assert not missing_columns, f"missing columns: {sorted(missing_columns)}"

    assert len(summary_df) == len(dummy_pages)
    assert summary_df["page_number"].iloc[0] == 1
|