updated chunk_size and chunk_overlap as they were too small

This commit is contained in:
Peter Morton 2025-06-02 18:41:08 -05:00
parent f0503e7aac
commit fde60f3341

View File

@@ -52,7 +52,7 @@ def load_web_crawl(url):
# docs_list = [item for sublist in docs for item in sublist]
# Initialize a text splitter with specified chunk size and overlap
text_splitter = RecursiveCharacterTextSplitter.from_tiktoken_encoder(
- chunk_size=250, chunk_overlap=0
+ chunk_size=1000, chunk_overlap=200
)
# Split the documents into chunks
return text_splitter.split_documents(docs)