Skip to content

Commit 36aa635

Browse files
authored
Merge pull request #4 from punitarani/more-loaders
Add support for docx, txt and images
2 parents f970b99 + 7a7e9b4 commit 36aa635

6 files changed

Lines changed: 429 additions & 38 deletions

File tree

app.py

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -4,8 +4,8 @@
44
from langchain.schema import Document
55

66
from rabbithole import summarize_document
7-
from rabbithole.loader import load_file
8-
from rabbithole.mp3 import SUPPORTED_FILE_TYPES
7+
from rabbithole.loader import load_file, SUPPORTED_IMG_FILE_TYPES
8+
from rabbithole.mp3 import SUPPORTED_AV_FILE_TYPES
99

1010
# Global variables
1111
results = {}
@@ -36,7 +36,9 @@ def run_summarization(document: list[Document], doc_name: str):
3636

3737
st.title("RabbitHole")
3838

39-
uploaded_files = st.file_uploader("Upload content", type=["pdf", *SUPPORTED_FILE_TYPES], accept_multiple_files=True)
39+
uploaded_files = st.file_uploader("Upload content",
40+
type=["docx", "pdf", "txt", *SUPPORTED_IMG_FILE_TYPES, *SUPPORTED_AV_FILE_TYPES],
41+
accept_multiple_files=True)
4042

4143
if st.button("Summarize"):
4244
if not uploaded_files:

packages.txt

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,2 @@
1+
ffmpeg
2+
tesseract

0 commit comments

Comments (0)