Hi anatolip
I am running the Document Intelligence feature on my files one at a time, and I get the following error on just one of them:
Unable to retrieve continuation token: cannot pickle '_io.BufferedReader' object
An error occurred: (InternalServerError) An unexpected error occurred. Code: InternalServerError Message: An unexpected error occurred. Exception Details: (FailedToSerializeAnalyzeResult) Failed to serialize analyze results, please contact support. Code: FailedToSerializeAnalyzeResult Message: Failed to serialize analyze results, please contact support
Detailed error log is:
File /Library/Frameworks/Python.framework/Versions/3.11/lib/python3.11/site-packages/langchain_community/document_loaders/doc_intelligence.py:82, in AzureAIDocumentIntelligenceLoader.load(self)
     80 def load(self) -> List[Document]:
     81     """Load given path as pages."""
---> 82     return list(self.lazy_load())

File /Library/Frameworks/Python.framework/Versions/3.11/lib/python3.11/site-packages/langchain_community/document_loaders/doc_intelligence.py:90, in AzureAIDocumentIntelligenceLoader.lazy_load(self)
     88 if self.file_path is not None:
     89     blob = Blob.from_path(self.file_path)
---> 90     yield from self.parser.parse(blob)
     91 else:
     92     yield from self.parser.parse_url(self.url_path)

File /Library/Frameworks/Python.framework/Versions/3.11/lib/python3.11/site-packages/langchain_community/document_loaders/base.py:111, in BaseBlobParser.parse(self, blob)
     96 def parse(self, blob: Blob) -> List[Document]:
     97     """Eagerly parse the blob into a document or documents.
     98
     99     This is a convenience method for interactive development environment.
   (...)
    109         List of documents
    110     """
--> 111     return list(self.lazy_parse(blob))

File /Library/Frameworks/Python.framework/Versions/3.11/lib/python3.11/site-packages/langchain_community/document_loaders/parsers/doc_intelligence.py:97, in AzureAIDocumentIntelligenceParser.lazy_parse(self, blob)
     90 with blob.as_bytes_io() as file_obj:
     91     poller = self.client.begin_analyze_document(
     92         self.api_model,
     93         file_obj,
     94         content_type="application/octet-stream",
     95         output_content_format="markdown" if self.mode == "markdown" else "text",
     96     )
---> 97     result = poller.result()
     99 if self.mode in ["single", "markdown"]:
    100     yield from self._generate_docs_single(result)

File /Library/Frameworks/Python.framework/Versions/3.11/lib/python3.11/site-packages/azure/core/polling/_poller.py:251, in LROPoller.result(self, timeout)
    242 def result(self, timeout: Optional[float] = None) -> PollingReturnType_co:
    243     """Return the result of the long running operation, or
    244     the result available after the specified timeout.
    245
   (...)
    249     :raises ~azure.core.exceptions.HttpResponseError: Server problem with the query.
    250     """
--> 251     self.wait(timeout)
    252     return self._polling_method.resource()

File /Library/Frameworks/Python.framework/Versions/3.11/lib/python3.11/site-packages/azure/core/tracing/decorator.py:78, in distributed_trace.<locals>.decorator.<locals>.wrapper_use_tracer(*args, **kwargs)
     76 span_impl_type = settings.tracing_implementation()
     77 if span_impl_type is None:
---> 78     return func(*args, **kwargs)
     80 # Merge span is parameter is set, but only if no explicit parent are passed
     81 if merge_span and not passed_in_parent:

File /Library/Frameworks/Python.framework/Versions/3.11/lib/python3.11/site-packages/azure/core/polling/_poller.py:270, in LROPoller.wait(self, timeout)
    266 self._thread.join(timeout=timeout)
    267 try:
    268     # Let's handle possible None in forgiveness here
    269     # https://github.com/python/mypy/issues/8165
--> 270     raise self._exception # type: ignore
    271 except TypeError: # Was None
    272     pass

File /Library/Frameworks/Python.framework/Versions/3.11/lib/python3.11/site-packages/azure/core/polling/_poller.py:185, in LROPoller._start(self)
    181 """Start the long running operation.
    182 On completion, runs any callbacks.
    183 """
    184 try:
--> 185     self._polling_method.run()
    186 except AzureError as error:
    187     if not error.continuation_token:

File /Library/Frameworks/Python.framework/Versions/3.11/lib/python3.11/site-packages/azure/core/polling/base_polling.py:772, in LROBasePolling.run(self)
    765     raise HttpResponseError(
    766         response=self._pipeline_response.http_response,
    767         message=str(err),
    768         error=err,
    769     ) from err
    771 except OperationFailed as err:
--> 772     raise HttpResponseError(response=self._pipeline_response.http_response, error=err) from err
How can I fix this, and is there any additional information I can provide to help diagnose it? Thanks.
Published Feb 15, 2024
Version 1.0