googleapis
diff --git a/‎docs/dyn/documentai_v1.projects.locations.processors.html
Lines changed: 36 additions & 0 deletions b/‎docs/dyn/documentai_v1.projects.locations.processors.html
Lines changed: 36 additions & 0 deletions
diff --git a/‎docs/dyn/documentai_v1.projects.locations.processors.processorVersions.html
Lines changed: 36 additions & 0 deletions b/‎docs/dyn/documentai_v1.projects.locations.processors.processorVersions.html
Lines changed: 36 additions & 0 deletions
@@ -151,6 +151,22 @@ <h3>Method Details</h3>
       &quot;gcsUriPrefix&quot;: &quot;A String&quot;, # The URI prefix.
     },
   },
+  &quot;processOptions&quot;: { # Options for Process API # Inference-time options for the process API
+    &quot;ocrConfig&quot;: { # Config for Document OCR. # Only applicable to `OCR_PROCESSOR`. Returns error if set on other processor types.
+      &quot;advancedOcrOptions&quot;: [ # A list of advanced OCR options to further fine-tune OCR behavior. Current valid values are: - `legacy_layout`: a heuristic layout detection algorithm, which serves as an alternative to the current ML-based layout detection algorithm. Customers can choose the most suitable layout algorithm based on their situation.
+        &quot;A String&quot;,
+      ],
+      &quot;computeStyleInfo&quot;: True or False, # Turns on the font identification model and returns font style information.
+      &quot;enableImageQualityScores&quot;: True or False, # Enables intelligent document quality scores after OCR. Can help with diagnosing why OCR responses are of poor quality for a given input. Adds additional latency comparable to regular OCR to the process call.
+      &quot;enableNativePdfParsing&quot;: True or False, # Enables special handling for PDFs with existing text information. Results in better text extraction quality in such PDF inputs.
+      &quot;enableSymbol&quot;: True or False, # Includes symbol level OCR information if set to true.
+      &quot;hints&quot;: { # Hints for OCR Engine # Hints for the OCR model.
+        &quot;languageHints&quot;: [ # List of BCP-47 language codes to use for OCR. In most cases, not specifying it yields the best results since it enables automatic language detection. For languages based on the Latin alphabet, setting hints is not needed. In rare cases, when the language of the text in the image is known, setting a hint will help get better results (although it will be a significant hindrance if the hint is wrong).
+          &quot;A String&quot;,
+        ],
+      },
+    },
+  },
   &quot;skipHumanReview&quot;: True or False, # Whether human review should be skipped for this request. Defaults to `false`.
 }
 
@@ -429,6 +445,10 @@ <h3>Method Details</h3>
 
 { # Request message for the ProcessDocument method.
   &quot;fieldMask&quot;: &quot;A String&quot;, # Specifies which fields to include in the ProcessResponse.document output. Only supports top-level document and pages field, so it must be in the form of `{document_field_name}` or `pages.{page_field_name}`.
+  &quot;gcsDocument&quot;: { # Specifies a document stored on Cloud Storage. # A raw document on Google Cloud Storage.
+    &quot;gcsUri&quot;: &quot;A String&quot;, # The Cloud Storage object URI.
+    &quot;mimeType&quot;: &quot;A String&quot;, # An IANA MIME type (RFC6838) of the content.
+  },
   &quot;inlineDocument&quot;: { # Document represents the canonical document resource in Document AI. It is an interchange format that provides insights into documents and allows for collaboration between users and Document AI to iterate and optimize for quality. # An inline document proto.
     &quot;content&quot;: &quot;A String&quot;, # Optional. Inline document content, represented as a stream of bytes. Note: As with all `bytes` fields, protobuffers use a pure binary representation, whereas JSON representations use base64.
     &quot;entities&quot;: [ # A list of entities detected on Document.text. For document shards, entities in this list may cross shard boundaries.
@@ -1275,6 +1295,22 @@ <h3>Method Details</h3>
     ],
     &quot;uri&quot;: &quot;A String&quot;, # Optional. Currently supports Google Cloud Storage URI of the form `gs://bucket_name/object_name`. Object versioning is not supported. For more information, refer to [Google Cloud Storage Request URIs](https://cloud.google.com/storage/docs/reference-uris).
   },
+  &quot;processOptions&quot;: { # Options for Process API # Inference-time options for the process API
+    &quot;ocrConfig&quot;: { # Config for Document OCR. # Only applicable to `OCR_PROCESSOR`. Returns error if set on other processor types.
+      &quot;advancedOcrOptions&quot;: [ # A list of advanced OCR options to further fine-tune OCR behavior. Current valid values are: - `legacy_layout`: a heuristic layout detection algorithm, which serves as an alternative to the current ML-based layout detection algorithm. Customers can choose the most suitable layout algorithm based on their situation.
+        &quot;A String&quot;,
+      ],
+      &quot;computeStyleInfo&quot;: True or False, # Turns on the font identification model and returns font style information.
+      &quot;enableImageQualityScores&quot;: True or False, # Enables intelligent document quality scores after OCR. Can help with diagnosing why OCR responses are of poor quality for a given input. Adds additional latency comparable to regular OCR to the process call.
+      &quot;enableNativePdfParsing&quot;: True or False, # Enables special handling for PDFs with existing text information. Results in better text extraction quality in such PDF inputs.
+      &quot;enableSymbol&quot;: True or False, # Includes symbol level OCR information if set to true.
+      &quot;hints&quot;: { # Hints for OCR Engine # Hints for the OCR model.
+        &quot;languageHints&quot;: [ # List of BCP-47 language codes to use for OCR. In most cases, not specifying it yields the best results since it enables automatic language detection. For languages based on the Latin alphabet, setting hints is not needed. In rare cases, when the language of the text in the image is known, setting a hint will help get better results (although it will be a significant hindrance if the hint is wrong).
+          &quot;A String&quot;,
+        ],
+      },
+    },
+  },
   &quot;rawDocument&quot;: { # Payload message of raw document content (bytes). # A raw document content (bytes).
     &quot;content&quot;: &quot;A String&quot;, # Inline document content.
     &quot;mimeType&quot;: &quot;A String&quot;, # An IANA MIME type (RFC6838) indicating the nature and format of the content.
 
@@ -146,6 +146,22 @@ <h3>Method Details</h3>
       &quot;gcsUriPrefix&quot;: &quot;A String&quot;, # The URI prefix.
     },
   },
+  &quot;processOptions&quot;: { # Options for Process API # Inference-time options for the process API
+    &quot;ocrConfig&quot;: { # Config for Document OCR. # Only applicable to `OCR_PROCESSOR`. Returns error if set on other processor types.
+      &quot;advancedOcrOptions&quot;: [ # A list of advanced OCR options to further fine-tune OCR behavior. Current valid values are: - `legacy_layout`: a heuristic layout detection algorithm, which serves as an alternative to the current ML-based layout detection algorithm. Customers can choose the most suitable layout algorithm based on their situation.
+        &quot;A String&quot;,
+      ],
+      &quot;computeStyleInfo&quot;: True or False, # Turns on the font identification model and returns font style information.
+      &quot;enableImageQualityScores&quot;: True or False, # Enables intelligent document quality scores after OCR. Can help with diagnosing why OCR responses are of poor quality for a given input. Adds additional latency comparable to regular OCR to the process call.
+      &quot;enableNativePdfParsing&quot;: True or False, # Enables special handling for PDFs with existing text information. Results in better text extraction quality in such PDF inputs.
+      &quot;enableSymbol&quot;: True or False, # Includes symbol level OCR information if set to true.
+      &quot;hints&quot;: { # Hints for OCR Engine # Hints for the OCR model.
+        &quot;languageHints&quot;: [ # List of BCP-47 language codes to use for OCR. In most cases, not specifying it yields the best results since it enables automatic language detection. For languages based on the Latin alphabet, setting hints is not needed. In rare cases, when the language of the text in the image is known, setting a hint will help get better results (although it will be a significant hindrance if the hint is wrong).
+          &quot;A String&quot;,
+        ],
+      },
+    },
+  },
   &quot;skipHumanReview&quot;: True or False, # Whether human review should be skipped for this request. Defaults to `false`.
 }
 
@@ -525,6 +541,10 @@ <h3>Method Details</h3>
 
 { # Request message for the ProcessDocument method.
   &quot;fieldMask&quot;: &quot;A String&quot;, # Specifies which fields to include in the ProcessResponse.document output. Only supports top-level document and pages field, so it must be in the form of `{document_field_name}` or `pages.{page_field_name}`.
+  &quot;gcsDocument&quot;: { # Specifies a document stored on Cloud Storage. # A raw document on Google Cloud Storage.
+    &quot;gcsUri&quot;: &quot;A String&quot;, # The Cloud Storage object URI.
+    &quot;mimeType&quot;: &quot;A String&quot;, # An IANA MIME type (RFC6838) of the content.
+  },
   &quot;inlineDocument&quot;: { # Document represents the canonical document resource in Document AI. It is an interchange format that provides insights into documents and allows for collaboration between users and Document AI to iterate and optimize for quality. # An inline document proto.
     &quot;content&quot;: &quot;A String&quot;, # Optional. Inline document content, represented as a stream of bytes. Note: As with all `bytes` fields, protobuffers use a pure binary representation, whereas JSON representations use base64.
     &quot;entities&quot;: [ # A list of entities detected on Document.text. For document shards, entities in this list may cross shard boundaries.
@@ -1371,6 +1391,22 @@ <h3>Method Details</h3>
     ],
     &quot;uri&quot;: &quot;A String&quot;, # Optional. Currently supports Google Cloud Storage URI of the form `gs://bucket_name/object_name`. Object versioning is not supported. For more information, refer to [Google Cloud Storage Request URIs](https://cloud.google.com/storage/docs/reference-uris).
   },
+  &quot;processOptions&quot;: { # Options for Process API # Inference-time options for the process API
+    &quot;ocrConfig&quot;: { # Config for Document OCR. # Only applicable to `OCR_PROCESSOR`. Returns error if set on other processor types.
+      &quot;advancedOcrOptions&quot;: [ # A list of advanced OCR options to further fine-tune OCR behavior. Current valid values are: - `legacy_layout`: a heuristic layout detection algorithm, which serves as an alternative to the current ML-based layout detection algorithm. Customers can choose the most suitable layout algorithm based on their situation.
+        &quot;A String&quot;,
+      ],
+      &quot;computeStyleInfo&quot;: True or False, # Turns on the font identification model and returns font style information.
+      &quot;enableImageQualityScores&quot;: True or False, # Enables intelligent document quality scores after OCR. Can help with diagnosing why OCR responses are of poor quality for a given input. Adds additional latency comparable to regular OCR to the process call.
+      &quot;enableNativePdfParsing&quot;: True or False, # Enables special handling for PDFs with existing text information. Results in better text extraction quality in such PDF inputs.
+      &quot;enableSymbol&quot;: True or False, # Includes symbol level OCR information if set to true.
+      &quot;hints&quot;: { # Hints for OCR Engine # Hints for the OCR model.
+        &quot;languageHints&quot;: [ # List of BCP-47 language codes to use for OCR. In most cases, not specifying it yields the best results since it enables automatic language detection. For languages based on the Latin alphabet, setting hints is not needed. In rare cases, when the language of the text in the image is known, setting a hint will help get better results (although it will be a significant hindrance if the hint is wrong).
+          &quot;A String&quot;,
+        ],
+      },
+    },
+  },
   &quot;rawDocument&quot;: { # Payload message of raw document content (bytes). # A raw document content (bytes).
     &quot;content&quot;: &quot;A String&quot;, # Inline document content.
     &quot;mimeType&quot;: &quot;A String&quot;, # An IANA MIME type (RFC6838) indicating the nature and format of the content.