Fix loader mapping order

This commit is contained in:
Fabio Rossini Sluzala 2023-05-17 22:38:30 -03:00
parent 652401cf29
commit ec126b51d8
No known key found for this signature in database
GPG Key ID: F9D569BBF49F437B

View File

@@ -31,8 +31,8 @@ load_dotenv()
LOADER_MAPPING = { LOADER_MAPPING = {
".csv": (CSVLoader, {}), ".csv": (CSVLoader, {}),
# ".docx": (Docx2txtLoader, {}), # ".docx": (Docx2txtLoader, {}),
".docx": (UnstructuredWordDocumentLoader, {}),
".doc": (UnstructuredWordDocumentLoader, {}), ".doc": (UnstructuredWordDocumentLoader, {}),
".docx": (UnstructuredWordDocumentLoader, {}),
".enex": (EverNoteLoader, {}), ".enex": (EverNoteLoader, {}),
".eml": (UnstructuredEmailLoader, {}), ".eml": (UnstructuredEmailLoader, {}),
".epub": (UnstructuredEPubLoader, {}), ".epub": (UnstructuredEPubLoader, {}),
@@ -40,8 +40,8 @@ LOADER_MAPPING = {
".md": (UnstructuredMarkdownLoader, {}), ".md": (UnstructuredMarkdownLoader, {}),
".odt": (UnstructuredODTLoader, {}), ".odt": (UnstructuredODTLoader, {}),
".pdf": (PDFMinerLoader, {}), ".pdf": (PDFMinerLoader, {}),
".pptx": (UnstructuredPowerPointLoader, {}),
".ppt": (UnstructuredPowerPointLoader, {}), ".ppt": (UnstructuredPowerPointLoader, {}),
".pptx": (UnstructuredPowerPointLoader, {}),
".txt": (TextLoader, {"encoding": "utf8"}), ".txt": (TextLoader, {"encoding": "utf8"}),
# Add more mappings for other file extensions and loaders as needed # Add more mappings for other file extensions and loaders as needed
} }