# RAG/src/chunking.py
# Hosting-page metadata: uploaded by Rahbarnisa ("Upload 21 files"),
# commit 4321589 (verified), 343 bytes.
from langchain_text_splitters import RecursiveCharacterTextSplitter
def chunk_documents(documents, *, chunk_size=1000, chunk_overlap=200):
    """Split documents into overlapping chunks with a recursive splitter.

    Builds a ``RecursiveCharacterTextSplitter`` and passes ``documents``
    to its ``split_documents`` method.

    Args:
        documents: The documents to split, in whatever form
            ``RecursiveCharacterTextSplitter.split_documents`` accepts
            (presumably LangChain ``Document`` objects; confirm against
            the caller).
        chunk_size: Maximum chunk size handed to the splitter. Defaults
            to 1000, the value that was previously hard-coded.
        chunk_overlap: Overlap between consecutive chunks handed to the
            splitter. Defaults to 200, the value that was previously
            hard-coded.

    Returns:
        The result of ``split_documents(documents)``, unchanged.
    """
    text_splitter = RecursiveCharacterTextSplitter(
        chunk_size=chunk_size,
        chunk_overlap=chunk_overlap,
        # Listed coarse to fine: blank line, newline, period, space, and
        # finally the empty string as the last-resort separator.
        separators=["\n\n", "\n", ".", " ", ""],
    )
    return text_splitter.split_documents(documents)