We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent dfb4e31 commit a67faaf Copy full SHA for a67faaf
1 file changed
rabbithole/loader.py
@@ -33,7 +33,7 @@ def load_file(file: UploadedFile) -> list[Document]:
33
Supported file types: PDF
34
:return: List of Document objects
35
"""
36
- text_splitter = TokenTextSplitter(model_name="davinci", chunk_size=2000, chunk_overlap=100)
+ text_splitter = TokenTextSplitter(encoding_name="cl100k_base", chunk_size=1000, chunk_overlap=100)
37
38
# Handle .docx files
39
if file.name.endswith(".docx"):
0 commit comments