in code/embedding-function/utilities/document_loading/word_document.py [0:0]
def load(self, document_url: str) -> List[SourceDocument]:
    """Load a Word document and return it as a single tagged-text document.

    The file behind ``document_url`` is fetched with
    ``self._download_document`` and parsed with ``Document``. Each paragraph
    becomes one line of output: its text wrapped in the opening and closing
    tags that ``self._get_opening_tag`` / ``self._get_closing_tag`` return
    for the paragraph's style name, followed by a newline.

    Args:
        document_url: Location of the Word document to load.

    Returns:
        A one-element list holding a ``SourceDocument`` whose content is the
        concatenated paragraph lines, with ``source`` set to ``document_url``
        and ``offset`` and ``page_number`` both set to 0.
    """
    document = Document(self._download_document(document_url))

    lines = []
    for paragraph in document.paragraphs:
        # Resolve the style name once; it feeds both tag lookups.
        style_name = paragraph.style.name
        lines.append(
            f"{self._get_opening_tag(style_name)}"
            f"{paragraph.text}"
            f"{self._get_closing_tag(style_name)}\n"
        )

    # Join once instead of growing a string with += on every paragraph.
    return [
        SourceDocument(
            content="".join(lines),
            source=document_url,
            offset=0,
            page_number=0,
        )
    ]