aitutor / documents /chunker.py
AptlyDigital's picture
Upload 3 files
68e634d verified
from langchain.text_splitter import RecursiveCharacterTextSplitter
class DocumentChunker:
    """Split document text into chunks using a recursive character splitter.

    Thin wrapper around ``RecursiveCharacterTextSplitter``. The configured
    splitter instance is stored on ``self.splitter`` and reused for every
    call to :meth:`chunk_text`.
    """

    def __init__(self, chunk_size=500, chunk_overlap=50):
        """Create the underlying splitter.

        Args:
            chunk_size: Forwarded unchanged as the splitter's ``chunk_size``
                argument (default 500).
            chunk_overlap: Forwarded unchanged as the splitter's
                ``chunk_overlap`` argument (default 50).
        """
        self.splitter = RecursiveCharacterTextSplitter(
            chunk_size=chunk_size,
            chunk_overlap=chunk_overlap,
        )

    def chunk_text(self, text):
        """Split *text* into chunks with the configured splitter.

        Args:
            text: The text to split. ``None`` or an empty string is treated
                as "nothing to chunk".

        Returns:
            An empty list when *text* is ``None`` or empty; otherwise the
            result of ``self.splitter.split_text(text)`` (presumably a list
            of strings -- confirm against the splitter's documentation).
        """
        if not text:
            # Do not hand None/"" to the splitter: there is nothing to split,
            # and a None input would otherwise fail inside third-party code.
            return []
        return self.splitter.split_text(text)