feat: change doc_file to docx and update readme (#157)

This commit is contained in:
Sahil Kumar Yadav
2023-07-07 16:18:05 +05:30
committed by GitHub
parent 51adc5c886
commit 0bb3d0afe9
5 changed files with 21 additions and 18 deletions

View File

@@ -1,9 +1,8 @@
from langchain.document_loaders import UnstructuredWordDocumentLoader
from langchain.document_loaders import Docx2txtLoader
class DocFileLoader:
class DocxFileLoader:
def load_data(self, url):
loader = UnstructuredWordDocumentLoader(url)
loader = Docx2txtLoader(url)
output = []
data = loader.load()
content = data[0].page_content