from langchain_community.document_loaders import AzureAIDocumentIntelligenceLoader
# Connection settings for the Azure resource. Both values are placeholders
# and must be replaced with the real endpoint and key before running.
endpoint = "https://<myendpoint>.cognitiveservices.azure.com/"
key = "<mykey>"

# Remote PDF handed to the loader by URL rather than as a local file.
url_path = "https://www.posb.com.sg/Resources/posb/docs/deposit/posb_deposits_guide.pdf"

# NOTE(review): the 404 "Resource not found" is raised by the service when
# load() submits the analyze request, not by this script. Presumably the
# endpoint does not belong to a Document Intelligence resource, or the
# resource's region does not serve the API version the installed SDK
# targets -- confirm both in the Azure portal.
loader = AzureAIDocumentIntelligenceLoader(
    api_endpoint=endpoint,
    api_key=key,
    url_path=url_path,
    api_model="prebuilt-layout",
)

# load() drains the loader's lazy_load() generator into a list; this is the
# call that reaches the service's begin_analyze_document operation.
documents = loader.load()
print(documents)
Hi. I'm trying to parse a document with Azure Document Intelligence through the LangChain community document loader. When I call loader.load(), it fails with a 404 "Resource not found" error. Do I need to configure anything extra on the Azure side?
Traceback (most recent call last):
File "/Users/elixander.tan/projects/azure/process_file_2.py", line 16, in <module>
res = obj.load()
^^^^^^^^^^
File "/opt/miniconda3/lib/python3.12/site-packages/langchain_core/document_loaders/base.py", line 30, in load
return list(self.lazy_load())
^^^^^^^^^^^^^^^^^^^^^^
File "/opt/miniconda3/lib/python3.12/site-packages/langchain_community/document_loaders/doc_intelligence.py", line 98, in lazy_load
yield from self.parser.parse_url(self.url_path) # type: ignore[arg-type]
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/opt/miniconda3/lib/python3.12/site-packages/langchain_community/document_loaders/parsers/doc_intelligence.py", line 98, in parse_url
poller = self.client.begin_analyze_document(
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/opt/miniconda3/lib/python3.12/site-packages/azure/core/tracing/decorator.py", line 94, in wrapper_use_tracer
return func(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^
File "/opt/miniconda3/lib/python3.12/site-packages/azure/ai/documentintelligence/_operations/_operations.py", line 3627, in begin_analyze_document
raw_result = self._analyze_document_initial( # type: ignore
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/opt/miniconda3/lib/python3.12/site-packages/azure/ai/documentintelligence/_operations/_operations.py", line 516, in _analyze_document_initial
map_error(status_code=response.status_code, response=response, error_map=error_map)
File "/opt/miniconda3/lib/python3.12/site-packages/azure/core/exceptions.py", line 161, in map_error
raise error
azure.core.exceptions.ResourceNotFoundError: (404) Resource not found
Code: 404