File tree Expand file tree Collapse file tree 2 files changed +3
-4
lines changed Expand file tree Collapse file tree 2 files changed +3
-4
lines changed Original file line number Diff line number Diff line change 273
273
274
274
DOCUMENT_LOADERS = {
275
275
".pdf" : "PyMuPDFLoader" ,
276
- ".docx" : "UnstructuredWordDocumentLoader" ,
277
- ".doc" : "UnstructuredWordDocumentLoader" ,
276
+ ".docx" : "Docx2txtLoader" ,
278
277
".txt" : "TextLoader" ,
279
278
".enex" : "EverNoteLoader" ,
280
279
".epub" : "UnstructuredEPubLoader" ,
Original file line number Diff line number Diff line change 7
7
from langchain .text_splitter import RecursiveCharacterTextSplitter
8
8
from langchain .document_loaders import (
9
9
PyMuPDFLoader ,
10
- UnstructuredWordDocumentLoader ,
10
+ Docx2txtLoader ,
11
11
TextLoader ,
12
12
EverNoteLoader ,
13
13
UnstructuredEPubLoader ,
@@ -67,7 +67,7 @@ def load_single_document(file_path: Path) -> Document:
67
67
elif file_extension == ".epub" :
68
68
loader = UnstructuredEPubLoader (str (file_path ), mode = "single" , strategy = "fast" )
69
69
elif file_extension == ".docx" :
70
- loader = UnstructuredWordDocumentLoader (str (file_path ), mode = "single" , strategy = "fast" )
70
+ loader = Docx2txtLoader (str (file_path ))
71
71
elif file_extension == ".rtf" :
72
72
loader = UnstructuredRTFLoader (str (file_path ), mode = "single" , strategy = "fast" )
73
73
elif file_extension == ".odt" :
You can’t perform that action at this time.
0 commit comments