diff --git a/docs/dyn/discoveryengine_v1alpha.projects.locations.collections.dataStores.html b/docs/dyn/discoveryengine_v1alpha.projects.locations.collections.dataStores.html index 84c5eaf3adb..e870a7b55ae 100644 --- a/docs/dyn/discoveryengine_v1alpha.projects.locations.collections.dataStores.html +++ b/docs/dyn/discoveryengine_v1alpha.projects.locations.collections.dataStores.html @@ -321,14 +321,40 @@
Updates the DocumentProcessingConfig. DocumentProcessingConfig is a singleon resource of DataStore. It's empty when DataStore is created. The first call to this method will set up DocumentProcessingConfig. Args: - name: string, Output only. The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`. (required) + name: string, The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`. (required) body: object, The request body. The object takes the form of: { # A singleton resource of DataStore. It's empty when DataStore is created, which defaults to digital parser. The first call to DataStoreService.UpdateDocumentProcessingConfig method will initialize the config. - "name": "A String", # Output only. The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`. - "ocrConfig": { # The OCR options for parsing documents. # The OCR config. Currently it only applies to PDFs. + "defaultParsingConfig": { # Related configurations applied to a specific type of document parser. # Configurations for default Document parser. If not specified, we will configure it as default DigitalParsingConfig, and the default parsing config will be applied to all file types for Document parsing. + "digitalParsingConfig": { # The digital parsing configurations for documents. # Configurations applied to digital parser. + }, + "layoutParsingConfig": { # The layout parsing configurations for documents. # Configurations applied to layout parser. + }, + "ocrParsingConfig": { # The OCR parsing configurations for documents. # Configurations applied to OCR parser. Currently it only applies to PDFs. + "enhancedDocumentElements": [ # Apply additional enhanced OCR processing to a list of document elements. 
Supported values: * `table`: advanced table parsing model. + "A String", + ], + "useNativeText": True or False, # If true, will use native text instead of OCR text on pages containing native text. + }, + }, + "name": "A String", # The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`. + "ocrConfig": { # The OCR options for parsing documents. # [DEPRECATED] This field is deprecated. To specify OCR parsing config, please specify `ocr_parsing_config` in `default_parsing_config` field. The OCR config. Currently it only applies to PDFs. "enabled": True or False, # Required. If OCR is enabled or not. OCR must be enabled for other OcrConfig options to apply. We will only perform OCR on the first 80 pages of the PDF files. "enhancedDocumentElements": [ # Apply additional enhanced OCR processing to a list of document elements. Supported values: * `table`: advanced table parsing model. "A String", ], "useNativeText": True or False, # If true, will use native text instead of OCR text on pages containing native text. }, + "parsingConfigOverrides": { # Map from file type to override the default parsing configuration based on the file type. Supported keys: * `pdf`: Override parsing config for PDF files, either digital parsing, ocr parsing or layout parsing is supported. * `html`: Override parsing config for HTML files, only digital parsing and/or layout parsing are supported. + "a_key": { # Related configurations applied to a specific type of document parser. + "digitalParsingConfig": { # The digital parsing configurations for documents. # Configurations applied to digital parser. + }, + "layoutParsingConfig": { # The layout parsing configurations for documents. # Configurations applied to layout parser. + }, + "ocrParsingConfig": { # The OCR parsing configurations for documents. # Configurations applied to OCR parser. Currently it only applies to PDFs. 
+ "enhancedDocumentElements": [ # Apply additional enhanced OCR processing to a list of document elements. Supported values: * `table`: advanced table parsing model. + "A String", + ], + "useNativeText": True or False, # If true, will use native text instead of OCR text on pages containing native text. + }, + }, + }, } updateMask: string, Indicates which fields in the provided DocumentProcessingConfig to update. The following are the only supported fields: * DocumentProcessingConfig.ocr_config If not set, all supported fields are updated. @@ -524,14 +576,40 @@diff --git a/docs/dyn/discoveryengine_v1alpha.projects.locations.dataStores.html b/docs/dyn/discoveryengine_v1alpha.projects.locations.dataStores.html index 541218fed3f..33b0b6dc1bc 100644 --- a/docs/dyn/discoveryengine_v1alpha.projects.locations.dataStores.html +++ b/docs/dyn/discoveryengine_v1alpha.projects.locations.dataStores.html @@ -318,14 +318,40 @@Method Details
An object of the form: { # A singleton resource of DataStore. It's empty when DataStore is created, which defaults to digital parser. The first call to DataStoreService.UpdateDocumentProcessingConfig method will initialize the config. - "name": "A String", # Output only. The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`. - "ocrConfig": { # The OCR options for parsing documents. # The OCR config. Currently it only applies to PDFs. + "defaultParsingConfig": { # Related configurations applied to a specific type of document parser. # Configurations for default Document parser. If not specified, we will configure it as default DigitalParsingConfig, and the default parsing config will be applied to all file types for Document parsing. + "digitalParsingConfig": { # The digital parsing configurations for documents. # Configurations applied to digital parser. + }, + "layoutParsingConfig": { # The layout parsing configurations for documents. # Configurations applied to layout parser. + }, + "ocrParsingConfig": { # The OCR parsing configurations for documents. # Configurations applied to OCR parser. Currently it only applies to PDFs. + "enhancedDocumentElements": [ # Apply additional enhanced OCR processing to a list of document elements. Supported values: * `table`: advanced table parsing model. + "A String", + ], + "useNativeText": True or False, # If true, will use native text instead of OCR text on pages containing native text. + }, + }, + "name": "A String", # The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`. + "ocrConfig": { # The OCR options for parsing documents. # [DEPRECATED] This field is deprecated. To specify OCR parsing config, please specify `ocr_parsing_config` in `default_parsing_config` field. The OCR config. Currently it only applies to PDFs. 
"enabled": True or False, # Required. If OCR is enabled or not. OCR must be enabled for other OcrConfig options to apply. We will only perform OCR on the first 80 pages of the PDF files. "enhancedDocumentElements": [ # Apply additional enhanced OCR processing to a list of document elements. Supported values: * `table`: advanced table parsing model. "A String", ], "useNativeText": True or False, # If true, will use native text instead of OCR text on pages containing native text. }, + "parsingConfigOverrides": { # Map from file type to override the default parsing configuration based on the file type. Supported keys: * `pdf`: Override parsing config for PDF files, either digital parsing, ocr parsing or layout parsing is supported. * `html`: Override parsing config for HTML files, only digital parsing and/or layout parsing are supported. + "a_key": { # Related configurations applied to a specific type of document parser. + "digitalParsingConfig": { # The digital parsing configurations for documents. # Configurations applied to digital parser. + }, + "layoutParsingConfig": { # The layout parsing configurations for documents. # Configurations applied to layout parser. + }, + "ocrParsingConfig": { # The OCR parsing configurations for documents. # Configurations applied to OCR parser. Currently it only applies to PDFs. + "enhancedDocumentElements": [ # Apply additional enhanced OCR processing to a list of document elements. Supported values: * `table`: advanced table parsing model. + "A String", + ], + "useNativeText": True or False, # If true, will use native text instead of OCR text on pages containing native text. + }, + }, + }, }
Updates the DocumentProcessingConfig. DocumentProcessingConfig is a singleon resource of DataStore. It's empty when DataStore is created. The first call to this method will set up DocumentProcessingConfig. Args: - name: string, Output only. The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`. (required) + name: string, The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`. (required) body: object, The request body. The object takes the form of: { # A singleton resource of DataStore. It's empty when DataStore is created, which defaults to digital parser. The first call to DataStoreService.UpdateDocumentProcessingConfig method will initialize the config. - "name": "A String", # Output only. The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`. - "ocrConfig": { # The OCR options for parsing documents. # The OCR config. Currently it only applies to PDFs. + "defaultParsingConfig": { # Related configurations applied to a specific type of document parser. # Configurations for default Document parser. If not specified, we will configure it as default DigitalParsingConfig, and the default parsing config will be applied to all file types for Document parsing. + "digitalParsingConfig": { # The digital parsing configurations for documents. # Configurations applied to digital parser. + }, + "layoutParsingConfig": { # The layout parsing configurations for documents. # Configurations applied to layout parser. + }, + "ocrParsingConfig": { # The OCR parsing configurations for documents. # Configurations applied to OCR parser. Currently it only applies to PDFs. + "enhancedDocumentElements": [ # Apply additional enhanced OCR processing to a list of document elements. 
Supported values: * `table`: advanced table parsing model. + "A String", + ], + "useNativeText": True or False, # If true, will use native text instead of OCR text on pages containing native text. + }, + }, + "name": "A String", # The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`. + "ocrConfig": { # The OCR options for parsing documents. # [DEPRECATED] This field is deprecated. To specify OCR parsing config, please specify `ocr_parsing_config` in `default_parsing_config` field. The OCR config. Currently it only applies to PDFs. "enabled": True or False, # Required. If OCR is enabled or not. OCR must be enabled for other OcrConfig options to apply. We will only perform OCR on the first 80 pages of the PDF files. "enhancedDocumentElements": [ # Apply additional enhanced OCR processing to a list of document elements. Supported values: * `table`: advanced table parsing model. "A String", ], "useNativeText": True or False, # If true, will use native text instead of OCR text on pages containing native text. }, + "parsingConfigOverrides": { # Map from file type to override the default parsing configuration based on the file type. Supported keys: * `pdf`: Override parsing config for PDF files, either digital parsing, ocr parsing or layout parsing is supported. * `html`: Override parsing config for HTML files, only digital parsing and/or layout parsing are supported. + "a_key": { # Related configurations applied to a specific type of document parser. + "digitalParsingConfig": { # The digital parsing configurations for documents. # Configurations applied to digital parser. + }, + "layoutParsingConfig": { # The layout parsing configurations for documents. # Configurations applied to layout parser. + }, + "ocrParsingConfig": { # The OCR parsing configurations for documents. # Configurations applied to OCR parser. Currently it only applies to PDFs. 
+ "enhancedDocumentElements": [ # Apply additional enhanced OCR processing to a list of document elements. Supported values: * `table`: advanced table parsing model. + "A String", + ], + "useNativeText": True or False, # If true, will use native text instead of OCR text on pages containing native text. + }, + }, + }, } updateMask: string, Indicates which fields in the provided DocumentProcessingConfig to update. The following are the only supported fields: * DocumentProcessingConfig.ocr_config If not set, all supported fields are updated. @@ -470,14 +522,40 @@diff --git a/googleapiclient/discovery_cache/documents/discoveryengine.v1alpha.json b/googleapiclient/discovery_cache/documents/discoveryengine.v1alpha.json index a52cb44957e..e38e257b392 100644 --- a/googleapiclient/discovery_cache/documents/discoveryengine.v1alpha.json +++ b/googleapiclient/discovery_cache/documents/discoveryengine.v1alpha.json @@ -629,7 +629,7 @@ ], "parameters": { "name": { -"description": "Output only. The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`.", +"description": "The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`.", "location": "path", "pattern": "^projects/[^/]+/locations/[^/]+/collections/[^/]+/dataStores/[^/]+/documentProcessingConfig$", "required": true, @@ -3134,7 +3134,7 @@ ], "parameters": { "name": { -"description": "Output only. The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`.", +"description": "The full resource name of the Document Processing Config. 
Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`.", "location": "path", "pattern": "^projects/[^/]+/locations/[^/]+/dataStores/[^/]+/documentProcessingConfig$", "required": true, @@ -4596,7 +4596,7 @@ } } }, -"revision": "20240123", +"revision": "20240131", "rootUrl": "https://discoveryengine.googleapis.com/", "schemas": { "GoogleApiHttpBody": { @@ -6203,6 +6203,12 @@ }, "type": "object" }, +"GoogleCloudDiscoveryengineV1alphaDigitalParsingConfig": { +"description": "The digital parsing configurations for documents.", +"id": "GoogleCloudDiscoveryengineV1alphaDigitalParsingConfig", +"properties": {}, +"type": "object" +}, "GoogleCloudDiscoveryengineV1alphaDisableAdvancedSiteSearchMetadata": { "description": "Metadata related to the progress of the SiteSearchEngineService.DisableAdvancedSiteSearch operation. This will be returned by the google.longrunning.Operation.metadata field.", "id": "GoogleCloudDiscoveryengineV1alphaDisableAdvancedSiteSearchMetadata", @@ -6335,14 +6341,44 @@ "description": "A singleton resource of DataStore. It's empty when DataStore is created, which defaults to digital parser. The first call to DataStoreService.UpdateDocumentProcessingConfig method will initialize the config.", "id": "GoogleCloudDiscoveryengineV1alphaDocumentProcessingConfig", "properties": { +"defaultParsingConfig": { +"$ref": "GoogleCloudDiscoveryengineV1alphaDocumentProcessingConfigParsingConfig", +"description": "Configurations for default Document parser. If not specified, we will configure it as default DigitalParsingConfig, and the default parsing config will be applied to all file types for Document parsing." +}, "name": { -"description": "Output only. The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`.", -"readOnly": true, +"description": "The full resource name of the Document Processing Config. 
Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`.", "type": "string" }, "ocrConfig": { "$ref": "GoogleCloudDiscoveryengineV1alphaOcrConfig", -"description": "The OCR config. Currently it only applies to PDFs." +"deprecated": true, +"description": "[DEPRECATED] This field is deprecated. To specify OCR parsing config, please specify `ocr_parsing_config` in `default_parsing_config` field. The OCR config. Currently it only applies to PDFs." +}, +"parsingConfigOverrides": { +"additionalProperties": { +"$ref": "GoogleCloudDiscoveryengineV1alphaDocumentProcessingConfigParsingConfig" +}, +"description": "Map from file type to override the default parsing configuration based on the file type. Supported keys: * `pdf`: Override parsing config for PDF files, either digital parsing, ocr parsing or layout parsing is supported. * `html`: Override parsing config for HTML files, only digital parsing and/or layout parsing are supported.", +"type": "object" +} +}, +"type": "object" +}, +"GoogleCloudDiscoveryengineV1alphaDocumentProcessingConfigParsingConfig": { +"description": "Related configurations applied to a specific type of document parser.", +"id": "GoogleCloudDiscoveryengineV1alphaDocumentProcessingConfigParsingConfig", +"properties": { +"digitalParsingConfig": { +"$ref": "GoogleCloudDiscoveryengineV1alphaDigitalParsingConfig", +"description": "Configurations applied to digital parser." +}, +"layoutParsingConfig": { +"$ref": "GoogleCloudDiscoveryengineV1alphaLayoutParsingConfig", +"description": "Configurations applied to layout parser." +}, +"ocrParsingConfig": { +"$ref": "GoogleCloudDiscoveryengineV1alphaOcrParsingConfig", +"description": "Configurations applied to OCR parser. Currently it only applies to PDFs." 
} }, "type": "object" @@ -7248,6 +7284,12 @@ }, "type": "object" }, +"GoogleCloudDiscoveryengineV1alphaLayoutParsingConfig": { +"description": "The layout parsing configurations for documents.", +"id": "GoogleCloudDiscoveryengineV1alphaLayoutParsingConfig", +"properties": {}, +"type": "object" +}, "GoogleCloudDiscoveryengineV1alphaListConversationsResponse": { "description": "Response for ListConversations method.", "id": "GoogleCloudDiscoveryengineV1alphaListConversationsResponse", @@ -7401,6 +7443,7 @@ "type": "object" }, "GoogleCloudDiscoveryengineV1alphaOcrConfig": { +"deprecated": true, "description": "The OCR options for parsing documents.", "id": "GoogleCloudDiscoveryengineV1alphaOcrConfig", "properties": { @@ -7422,6 +7465,24 @@ }, "type": "object" }, +"GoogleCloudDiscoveryengineV1alphaOcrParsingConfig": { +"description": "The OCR parsing configurations for documents.", +"id": "GoogleCloudDiscoveryengineV1alphaOcrParsingConfig", +"properties": { +"enhancedDocumentElements": { +"description": "Apply additional enhanced OCR processing to a list of document elements. 
Supported values: * `table`: advanced table parsing model.", +"items": { +"type": "string" +}, +"type": "array" +}, +"useNativeText": { +"description": "If true, will use native text instead of OCR text on pages containing native text.", +"type": "boolean" +} +}, +"type": "object" +}, "GoogleCloudDiscoveryengineV1alphaPageInfo": { "description": "Detailed page information.", "id": "GoogleCloudDiscoveryengineV1alphaPageInfo", diff --git a/googleapiclient/discovery_cache/documents/discoveryengine.v1beta.json b/googleapiclient/discovery_cache/documents/discoveryengine.v1beta.json index 6256e453021..3969e33d084 100644 --- a/googleapiclient/discovery_cache/documents/discoveryengine.v1beta.json +++ b/googleapiclient/discovery_cache/documents/discoveryengine.v1beta.json @@ -4164,7 +4164,7 @@ } } }, -"revision": "20240123", +"revision": "20240131", "rootUrl": "https://discoveryengine.googleapis.com/", "schemas": { "GoogleApiHttpBody": { @@ -5435,6 +5435,12 @@ }, "type": "object" }, +"GoogleCloudDiscoveryengineV1alphaDigitalParsingConfig": { +"description": "The digital parsing configurations for documents.", +"id": "GoogleCloudDiscoveryengineV1alphaDigitalParsingConfig", +"properties": {}, +"type": "object" +}, "GoogleCloudDiscoveryengineV1alphaDisableAdvancedSiteSearchMetadata": { "description": "Metadata related to the progress of the SiteSearchEngineService.DisableAdvancedSiteSearch operation. This will be returned by the google.longrunning.Operation.metadata field.", "id": "GoogleCloudDiscoveryengineV1alphaDisableAdvancedSiteSearchMetadata", @@ -5462,14 +5468,44 @@ "description": "A singleton resource of DataStore. It's empty when DataStore is created, which defaults to digital parser. 
The first call to DataStoreService.UpdateDocumentProcessingConfig method will initialize the config.", "id": "GoogleCloudDiscoveryengineV1alphaDocumentProcessingConfig", "properties": { +"defaultParsingConfig": { +"$ref": "GoogleCloudDiscoveryengineV1alphaDocumentProcessingConfigParsingConfig", +"description": "Configurations for default Document parser. If not specified, we will configure it as default DigitalParsingConfig, and the default parsing config will be applied to all file types for Document parsing." +}, "name": { -"description": "Output only. The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`.", -"readOnly": true, +"description": "The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`.", "type": "string" }, "ocrConfig": { "$ref": "GoogleCloudDiscoveryengineV1alphaOcrConfig", -"description": "The OCR config. Currently it only applies to PDFs." +"deprecated": true, +"description": "[DEPRECATED] This field is deprecated. To specify OCR parsing config, please specify `ocr_parsing_config` in `default_parsing_config` field. The OCR config. Currently it only applies to PDFs." +}, +"parsingConfigOverrides": { +"additionalProperties": { +"$ref": "GoogleCloudDiscoveryengineV1alphaDocumentProcessingConfigParsingConfig" +}, +"description": "Map from file type to override the default parsing configuration based on the file type. Supported keys: * `pdf`: Override parsing config for PDF files, either digital parsing, ocr parsing or layout parsing is supported. 
* `html`: Override parsing config for HTML files, only digital parsing and/or layout parsing are supported.", +"type": "object" +} +}, +"type": "object" +}, +"GoogleCloudDiscoveryengineV1alphaDocumentProcessingConfigParsingConfig": { +"description": "Related configurations applied to a specific type of document parser.", +"id": "GoogleCloudDiscoveryengineV1alphaDocumentProcessingConfigParsingConfig", +"properties": { +"digitalParsingConfig": { +"$ref": "GoogleCloudDiscoveryengineV1alphaDigitalParsingConfig", +"description": "Configurations applied to digital parser." +}, +"layoutParsingConfig": { +"$ref": "GoogleCloudDiscoveryengineV1alphaLayoutParsingConfig", +"description": "Configurations applied to layout parser." +}, +"ocrParsingConfig": { +"$ref": "GoogleCloudDiscoveryengineV1alphaOcrParsingConfig", +"description": "Configurations applied to OCR parser. Currently it only applies to PDFs." } }, "type": "object" @@ -6098,7 +6134,14 @@ }, "type": "object" }, +"GoogleCloudDiscoveryengineV1alphaLayoutParsingConfig": { +"description": "The layout parsing configurations for documents.", +"id": "GoogleCloudDiscoveryengineV1alphaLayoutParsingConfig", +"properties": {}, +"type": "object" +}, "GoogleCloudDiscoveryengineV1alphaOcrConfig": { +"deprecated": true, "description": "The OCR options for parsing documents.", "id": "GoogleCloudDiscoveryengineV1alphaOcrConfig", "properties": { @@ -6120,6 +6163,24 @@ }, "type": "object" }, +"GoogleCloudDiscoveryengineV1alphaOcrParsingConfig": { +"description": "The OCR parsing configurations for documents.", +"id": "GoogleCloudDiscoveryengineV1alphaOcrParsingConfig", +"properties": { +"enhancedDocumentElements": { +"description": "Apply additional enhanced OCR processing to a list of document elements. 
Supported values: * `table`: advanced table parsing model.", +"items": { +"type": "string" +}, +"type": "array" +}, +"useNativeText": { +"description": "If true, will use native text instead of OCR text on pages containing native text.", +"type": "boolean" +} +}, +"type": "object" +}, "GoogleCloudDiscoveryengineV1alphaPurgeDocumentsMetadata": { "description": "Metadata related to the progress of the PurgeDocuments operation. This will be returned by the google.longrunning.Operation.metadata field.", "id": "GoogleCloudDiscoveryengineV1alphaPurgeDocumentsMetadata",Method Details
An object of the form: { # A singleton resource of DataStore. It's empty when DataStore is created, which defaults to digital parser. The first call to DataStoreService.UpdateDocumentProcessingConfig method will initialize the config. - "name": "A String", # Output only. The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`. - "ocrConfig": { # The OCR options for parsing documents. # The OCR config. Currently it only applies to PDFs. + "defaultParsingConfig": { # Related configurations applied to a specific type of document parser. # Configurations for default Document parser. If not specified, we will configure it as default DigitalParsingConfig, and the default parsing config will be applied to all file types for Document parsing. + "digitalParsingConfig": { # The digital parsing configurations for documents. # Configurations applied to digital parser. + }, + "layoutParsingConfig": { # The layout parsing configurations for documents. # Configurations applied to layout parser. + }, + "ocrParsingConfig": { # The OCR parsing configurations for documents. # Configurations applied to OCR parser. Currently it only applies to PDFs. + "enhancedDocumentElements": [ # Apply additional enhanced OCR processing to a list of document elements. Supported values: * `table`: advanced table parsing model. + "A String", + ], + "useNativeText": True or False, # If true, will use native text instead of OCR text on pages containing native text. + }, + }, + "name": "A String", # The full resource name of the Document Processing Config. Format: `projects/*/locations/*/collections/*/dataStores/*/documentProcessingConfig`. + "ocrConfig": { # The OCR options for parsing documents. # [DEPRECATED] This field is deprecated. To specify OCR parsing config, please specify `ocr_parsing_config` in `default_parsing_config` field. The OCR config. Currently it only applies to PDFs. 
"enabled": True or False, # Required. If OCR is enabled or not. OCR must be enabled for other OcrConfig options to apply. We will only perform OCR on the first 80 pages of the PDF files. "enhancedDocumentElements": [ # Apply additional enhanced OCR processing to a list of document elements. Supported values: * `table`: advanced table parsing model. "A String", ], "useNativeText": True or False, # If true, will use native text instead of OCR text on pages containing native text. }, + "parsingConfigOverrides": { # Map from file type to override the default parsing configuration based on the file type. Supported keys: * `pdf`: Override parsing config for PDF files, either digital parsing, ocr parsing or layout parsing is supported. * `html`: Override parsing config for HTML files, only digital parsing and/or layout parsing are supported. + "a_key": { # Related configurations applied to a specific type of document parser. + "digitalParsingConfig": { # The digital parsing configurations for documents. # Configurations applied to digital parser. + }, + "layoutParsingConfig": { # The layout parsing configurations for documents. # Configurations applied to layout parser. + }, + "ocrParsingConfig": { # The OCR parsing configurations for documents. # Configurations applied to OCR parser. Currently it only applies to PDFs. + "enhancedDocumentElements": [ # Apply additional enhanced OCR processing to a list of document elements. Supported values: * `table`: advanced table parsing model. + "A String", + ], + "useNativeText": True or False, # If true, will use native text instead of OCR text on pages containing native text. + }, + }, + }, }