from llama_index.readers.file.base import DEFAULT_FILE_EXTRACTOR

# NOTE(review): PptxReader and SimpleDirectoryReader are used below but their
# imports are not visible in this snippet -- confirm they are in scope.

# Build a new mapping instead of aliasing DEFAULT_FILE_EXTRACTOR: calling
# .update() on an alias would insert the ".pptx" entry into the library's
# shared module-level dict, affecting every later user of the default.
file_extractor = {**DEFAULT_FILE_EXTRACTOR, ".pptx": PptxReader()}

# Read "./data" with the extended extension -> reader mapping.
docs = SimpleDirectoryReader("./data", file_extractor=file_extractor).load_data()
# Map the ".xml" extension to an XMLReader instance.
file_extractor = {
    ".xml": XMLReader(),
}

# Construct the directory reader first, then load; `...` is kept as the
# original placeholder for the remaining arguments.
directory_reader = SimpleDirectoryReader(..., file_extractor=file_extractor)
documents = directory_reader.load_data()