mirror of
https://github.com/open-webui/open-webui.git
synced 2025-08-26 13:50:48 +02:00
Merge pull request #1050 from jannikstdl/rag-pdf-ocr
feat: added ocr functionality to the pdf loader
This commit is contained in:
@@ -425,7 +425,7 @@ def get_loader(filename: str, file_content_type: str, file_path: str):
     ]
 
     if file_ext == "pdf":
-        loader = PyPDFLoader(file_path)
+        loader = PyPDFLoader(file_path, extract_images=True)
     elif file_ext == "csv":
         loader = CSVLoader(file_path)
     elif file_ext == "rst":
@@ -34,6 +34,7 @@ pandas
 openpyxl
 pyxlsb
 xlrd
+rapidocr-onnxruntime
 
 faster-whisper
 
Reference in New Issue
Block a user