in code/embedding-function/utilities/document_loading/read.py [0:0]
def load(self, document_url: str) -> List[SourceDocument]:
    """Analyze the document at ``document_url`` and wrap the results.

    A new ``AzureFormRecognizerClient`` is created for each call and asked
    to analyze the URL with ``use_layout=False``. Every entry it returns is
    converted into a ``SourceDocument``.

    Args:
        document_url: Location of the document to analyze; also recorded
            as the ``source`` of every resulting ``SourceDocument``.

    Returns:
        One ``SourceDocument`` per entry yielded by the client, in the
        order the client returned them.
    """
    recognizer = AzureFormRecognizerClient()
    analyzed_pages = recognizer.begin_analyze_document_from_url(
        document_url,
        use_layout=False,
    )

    # Each entry is indexed by "page_text", "page_number" and "offset";
    # presumably these are per-page dicts -- confirm against the client.
    result: List[SourceDocument] = []
    for entry in analyzed_pages:
        result.append(
            SourceDocument(
                content=entry["page_text"],
                source=document_url,
                page_number=entry["page_number"],
                offset=entry["offset"],
            )
        )
    return result