RAG_Project / src /chunking.py
Rahbarnisa's picture
Upload 24 files
9a2d4ec verified
raw
history blame contribute delete
343 Bytes
from langchain_text_splitters import RecursiveCharacterTextSplitter
def chunk_documents(
    documents,
    *,
    chunk_size: int = 1000,
    chunk_overlap: int = 200,
    separators=None,
):
    """Split documents into overlapping chunks.

    The work is delegated to ``RecursiveCharacterTextSplitter``; this
    function only configures the splitter and forwards ``documents`` to
    its ``split_documents`` method.

    Args:
        documents: The documents to split, passed unchanged to
            ``split_documents``.
        chunk_size: Forwarded to the splitter as ``chunk_size``.
            Defaults to 1000.
        chunk_overlap: Forwarded to the splitter as ``chunk_overlap``.
            Defaults to 200.
        separators: Ordered list of separator strings forwarded to the
            splitter. When ``None``, the list
            ``["\\n\\n", "\\n", ".", " ", ""]`` is used.

    Returns:
        Whatever ``split_documents`` returns for the given input.
    """
    if separators is None:
        # Build the default per call so no list object is shared
        # between invocations.
        separators = ["\n\n", "\n", ".", " ", ""]

    text_splitter = RecursiveCharacterTextSplitter(
        chunk_size=chunk_size,
        chunk_overlap=chunk_overlap,
        separators=separators,
    )
    return text_splitter.split_documents(documents)