File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -43,7 +43,15 @@ def load_file(file: UploadedFile) -> list[Document]:
4343 # Handle .pdf files
4444 elif file .name .endswith (".pdf" ):
4545 temp_file = save_to_temp_file (file )
46- return PyMuPDFLoader (file_path = temp_file ).load_and_split (text_splitter = text_splitter )
46+ pdf_doc = PyMuPDFLoader (file_path = temp_file ).load_and_split (text_splitter = text_splitter )
47+
48+ # Save the extracted PDF text to a temporary file
49+ temp_file = tempfile .NamedTemporaryFile (suffix = ".txt" , delete = False )
50+ temp_file .write ("\n " .join ([page .page_content for page in pdf_doc ]).encode ())
51+ temp_file .close ()
52+
53+ # Load the file using TextLoader
54+ return TextLoader (file_path = temp_file .name , encoding = "utf-8" ).load_and_split (text_splitter = text_splitter )
4755
4856 # Handle .txt files
4957 elif file .name .endswith (".txt" ):
You can’t perform that action at this time.
0 commit comments