Update app.py: switch the .pdf loader from MathpixPDFLoader to PyPDFium2Loader
Browse files
app.py
CHANGED
@@ -6,8 +6,7 @@ from langchain.document_loaders import (
|
|
6 |
CSVLoader,
|
7 |
EverNoteLoader,
|
8 |
PDFMinerLoader,
|
9 |
-
|
10 |
-
MathpixPDFLoader,
|
11 |
TextLoader,
|
12 |
UnstructuredEmailLoader,
|
13 |
UnstructuredEPubLoader,
|
@@ -47,8 +46,7 @@ LOADER_MAPPING = {
|
|
47 |
".md": (UnstructuredMarkdownLoader, {}),
|
48 |
".odt": (UnstructuredODTLoader, {}),
|
49 |
#".pdf": (PDFMinerLoader, {}),
|
50 |
-
|
51 |
-
".pdf": (MathpixPDFLoader, {}),
|
52 |
".ppt": (UnstructuredPowerPointLoader, {}),
|
53 |
".pptx": (UnstructuredPowerPointLoader, {}),
|
54 |
".txt": (TextLoader, {"encoding": "utf8"}),
|
|
|
6 |
CSVLoader,
|
7 |
EverNoteLoader,
|
8 |
PDFMinerLoader,
|
9 |
+
PyPDFium2Loader,
|
|
|
10 |
TextLoader,
|
11 |
UnstructuredEmailLoader,
|
12 |
UnstructuredEPubLoader,
|
|
|
46 |
".md": (UnstructuredMarkdownLoader, {}),
|
47 |
".odt": (UnstructuredODTLoader, {}),
|
48 |
#".pdf": (PDFMinerLoader, {}),
|
49 |
+
".pdf": (PyPDFium2Loader, {}),
|
|
|
50 |
".ppt": (UnstructuredPowerPointLoader, {}),
|
51 |
".pptx": (UnstructuredPowerPointLoader, {}),
|
52 |
".txt": (TextLoader, {"encoding": "utf8"}),
|