Add .doc and .ppt (Word and PowerPoint 97–2003 formats)
This commit is contained in:
		
							parent
							
								
									355b4be7c0
								
							
						
					
					
						commit
						66a9f9cde0
					
				|  | @ -32,6 +32,7 @@ LOADER_MAPPING = { | ||||||
|     ".csv": (CSVLoader, {}), |     ".csv": (CSVLoader, {}), | ||||||
|     # ".docx": (Docx2txtLoader, {}), |     # ".docx": (Docx2txtLoader, {}), | ||||||
|     ".docx": (UnstructuredWordDocumentLoader, {}), |     ".docx": (UnstructuredWordDocumentLoader, {}), | ||||||
|  |     ".doc": (UnstructuredWordDocumentLoader, {}), | ||||||
|     ".enex": (EverNoteLoader, {}), |     ".enex": (EverNoteLoader, {}), | ||||||
|     ".eml": (UnstructuredEmailLoader, {}), |     ".eml": (UnstructuredEmailLoader, {}), | ||||||
|     ".epub": (UnstructuredEPubLoader, {}), |     ".epub": (UnstructuredEPubLoader, {}), | ||||||
|  | @ -40,6 +41,7 @@ LOADER_MAPPING = { | ||||||
|     ".odt": (UnstructuredODTLoader, {}), |     ".odt": (UnstructuredODTLoader, {}), | ||||||
|     ".pdf": (PDFMinerLoader, {}), |     ".pdf": (PDFMinerLoader, {}), | ||||||
|     ".pptx": (UnstructuredPowerPointLoader, {}), |     ".pptx": (UnstructuredPowerPointLoader, {}), | ||||||
|  |     ".ppt": (UnstructuredPowerPointLoader, {}), | ||||||
|     ".txt": (TextLoader, {"encoding": "utf8"}), |     ".txt": (TextLoader, {"encoding": "utf8"}), | ||||||
|     # Add more mappings for other file extensions and loaders as needed |     # Add more mappings for other file extensions and loaders as needed | ||||||
| } | } | ||||||
|  |  | ||||||
		Loading…
	
		Reference in New Issue