Spaces:

pikaduck
/

policy-analyser

Sleeping

Sakshi committed on Mar 4

Commit

b099df3

1 Parent(s): 0557bd1

changed ContentFormat to DocumentContentFormat in ocr.py

Files changed (1) hide show

policy_analyser/ocr.py CHANGED Viewed

@@ -7,7 +7,7 @@
 import pymupdf4llm, pymupdf
 from azure.core.credentials import AzureKeyCredential
 from azure.ai.documentintelligence import DocumentIntelligenceClient
-from azure.ai.documentintelligence.models import AnalyzeDocumentRequest, ContentFormat, AnalyzeResult
 from policy_analyser import AZURE_LAYOUT_ENDPOINT, AZURE_LAYOUT_KEY, AZURE_LAYOUT_MODEL
@@ -44,7 +44,7 @@ class AzureDocumentIntelligenceOCR:
             poller = self.client.begin_analyze_document(
                 AZURE_LAYOUT_MODEL,
                 AnalyzeDocumentRequest(bytes_source = file_bytes),
-                output_content_format = ContentFormat.MARKDOWN
             )
             result = poller.result()
             return result.content, None

 import pymupdf4llm, pymupdf
 from azure.core.credentials import AzureKeyCredential
 from azure.ai.documentintelligence import DocumentIntelligenceClient
+from azure.ai.documentintelligence.models import AnalyzeDocumentRequest, DocumentContentFormat, AnalyzeResult
 from policy_analyser import AZURE_LAYOUT_ENDPOINT, AZURE_LAYOUT_KEY, AZURE_LAYOUT_MODEL
             poller = self.client.begin_analyze_document(
                 AZURE_LAYOUT_MODEL,
                 AnalyzeDocumentRequest(bytes_source = file_bytes),
+                output_content_format = DocumentContentFormat.MARKDOWN
             )
             result = poller.result()
             return result.content, None