1. Packages
  2. Packages
  3. Google Cloud (GCP) Classic
  4. API Docs
  5. discoveryengine
  6. getDataStore
Viewing docs for Google Cloud v9.21.0
published on Friday, Apr 24, 2026 by Pulumi
gcp logo
Viewing docs for Google Cloud v9.21.0
published on Friday, Apr 24, 2026 by Pulumi

    Gets an existing Discovery Engine data store by ID or display name. See the official documentation and API.

    Example Usage

    By ID

    import * as pulumi from "@pulumi/pulumi";
    import * as gcp from "@pulumi/gcp";
    
    const example = gcp.discoveryengine.getDataStore({
        dataStoreId: "my-data-store",
    });
    
    import pulumi
    import pulumi_gcp as gcp
    
    example = gcp.discoveryengine.get_data_store(data_store_id="my-data-store")
    
    package main
    
    import (
    	"github.com/pulumi/pulumi-gcp/sdk/v9/go/gcp/discoveryengine"
    	"github.com/pulumi/pulumi/sdk/v3/go/pulumi"
    )
    
    func main() {
    	pulumi.Run(func(ctx *pulumi.Context) error {
    		_, err := discoveryengine.LookupDataStore(ctx, &discoveryengine.LookupDataStoreArgs{
    			DataStoreId: pulumi.StringRef("my-data-store"),
    		}, nil)
    		if err != nil {
    			return err
    		}
    		return nil
    	})
    }
    
    using System.Collections.Generic;
    using System.Linq;
    using Pulumi;
    using Gcp = Pulumi.Gcp;
    
    return await Deployment.RunAsync(() => 
    {
        var example = Gcp.DiscoveryEngine.GetDataStore.Invoke(new()
        {
            DataStoreId = "my-data-store",
        });
    
    });
    
    package generated_program;
    
    import com.pulumi.Context;
    import com.pulumi.Pulumi;
    import com.pulumi.core.Output;
    import com.pulumi.gcp.discoveryengine.DiscoveryengineFunctions;
    import com.pulumi.gcp.discoveryengine.inputs.GetDataStoreArgs;
    import java.util.List;
    import java.util.ArrayList;
    import java.util.Map;
    import java.io.File;
    import java.nio.file.Files;
    import java.nio.file.Paths;
    
    public class App {
        public static void main(String[] args) {
            Pulumi.run(App::stack);
        }
    
        public static void stack(Context ctx) {
            final var example = DiscoveryengineFunctions.getDataStore(GetDataStoreArgs.builder()
                .dataStoreId("my-data-store")
                .build());
    
        }
    }
    
    variables:
      example:
        fn::invoke:
          function: gcp:discoveryengine:getDataStore
          arguments:
            dataStoreId: my-data-store
    

    By display name

    import * as pulumi from "@pulumi/pulumi";
    import * as gcp from "@pulumi/gcp";
    
    const example = gcp.discoveryengine.getDataStore({
        displayName: "My Data Store",
    });
    
    import pulumi
    import pulumi_gcp as gcp
    
    example = gcp.discoveryengine.get_data_store(display_name="My Data Store")
    
    package main
    
    import (
    	"github.com/pulumi/pulumi-gcp/sdk/v9/go/gcp/discoveryengine"
    	"github.com/pulumi/pulumi/sdk/v3/go/pulumi"
    )
    
    func main() {
    	pulumi.Run(func(ctx *pulumi.Context) error {
    		_, err := discoveryengine.LookupDataStore(ctx, &discoveryengine.LookupDataStoreArgs{
    			DisplayName: pulumi.StringRef("My Data Store"),
    		}, nil)
    		if err != nil {
    			return err
    		}
    		return nil
    	})
    }
    
    using System.Collections.Generic;
    using System.Linq;
    using Pulumi;
    using Gcp = Pulumi.Gcp;
    
    return await Deployment.RunAsync(() => 
    {
        var example = Gcp.DiscoveryEngine.GetDataStore.Invoke(new()
        {
            DisplayName = "My Data Store",
        });
    
    });
    
    package generated_program;
    
    import com.pulumi.Context;
    import com.pulumi.Pulumi;
    import com.pulumi.core.Output;
    import com.pulumi.gcp.discoveryengine.DiscoveryengineFunctions;
    import com.pulumi.gcp.discoveryengine.inputs.GetDataStoreArgs;
    import java.util.List;
    import java.util.ArrayList;
    import java.util.Map;
    import java.io.File;
    import java.nio.file.Files;
    import java.nio.file.Paths;
    
    public class App {
        public static void main(String[] args) {
            Pulumi.run(App::stack);
        }
    
        public static void stack(Context ctx) {
            final var example = DiscoveryengineFunctions.getDataStore(GetDataStoreArgs.builder()
                .displayName("My Data Store")
                .build());
    
        }
    }
    
    variables:
      example:
        fn::invoke:
          function: gcp:discoveryengine:getDataStore
          arguments:
            displayName: My Data Store
    

    Using getDataStore

    Two invocation forms are available. The direct form accepts plain arguments and either blocks until the result value is available, or returns a Promise-wrapped result. The output form accepts Input-wrapped arguments and returns an Output-wrapped result.

    function getDataStore(args: GetDataStoreArgs, opts?: InvokeOptions): Promise<GetDataStoreResult>
    function getDataStoreOutput(args: GetDataStoreOutputArgs, opts?: InvokeOptions): Output<GetDataStoreResult>
    def get_data_store(data_store_id: Optional[str] = None,
                       display_name: Optional[str] = None,
                       location: Optional[str] = None,
                       project: Optional[str] = None,
                       opts: Optional[InvokeOptions] = None) -> GetDataStoreResult
    def get_data_store_output(data_store_id: Optional[pulumi.Input[str]] = None,
                       display_name: Optional[pulumi.Input[str]] = None,
                       location: Optional[pulumi.Input[str]] = None,
                       project: Optional[pulumi.Input[str]] = None,
                       opts: Optional[InvokeOptions] = None) -> Output[GetDataStoreResult]
    func LookupDataStore(ctx *Context, args *LookupDataStoreArgs, opts ...InvokeOption) (*LookupDataStoreResult, error)
    func LookupDataStoreOutput(ctx *Context, args *LookupDataStoreOutputArgs, opts ...InvokeOption) LookupDataStoreResultOutput

    > Note: This function is named LookupDataStore in the Go SDK.

    public static class GetDataStore 
    {
        public static Task<GetDataStoreResult> InvokeAsync(GetDataStoreArgs args, InvokeOptions? opts = null)
        public static Output<GetDataStoreResult> Invoke(GetDataStoreInvokeArgs args, InvokeOptions? opts = null)
    }
    public static CompletableFuture<GetDataStoreResult> getDataStorePlain(GetDataStorePlainArgs args, InvokeOptions options)
    public static Output<GetDataStoreResult> getDataStore(GetDataStoreArgs args, InvokeOptions options)
    
    fn::invoke:
      function: gcp:discoveryengine/getDataStore:getDataStore
      arguments:
        # arguments dictionary

    The following arguments are supported:

    DataStoreId string
    The unique id of the data store. Exactly one of dataStoreId or displayName must be provided.
    DisplayName string
    The display name of the data store. Exactly one of dataStoreId or displayName must be provided. Returns an error if multiple data stores share the same display name.
    Location string
    The geographic location where the data store resides. The value can only be one of "global", "us" and "eu". Defaults to global.
    Project string
    The ID of the project to which the resource belongs. If it is not provided, the provider project is used.
    DataStoreId string
    The unique id of the data store. Exactly one of dataStoreId or displayName must be provided.
    DisplayName string
    The display name of the data store. Exactly one of dataStoreId or displayName must be provided. Returns an error if multiple data stores share the same display name.
    Location string
    The geographic location where the data store resides. The value can only be one of "global", "us" and "eu". Defaults to global.
    Project string
    The ID of the project to which the resource belongs. If it is not provided, the provider project is used.
    dataStoreId String
    The unique id of the data store. Exactly one of dataStoreId or displayName must be provided.
    displayName String
    The display name of the data store. Exactly one of dataStoreId or displayName must be provided. Returns an error if multiple data stores share the same display name.
    location String
    The geographic location where the data store resides. The value can only be one of "global", "us" and "eu". Defaults to global.
    project String
    The ID of the project to which the resource belongs. If it is not provided, the provider project is used.
    dataStoreId string
    The unique id of the data store. Exactly one of dataStoreId or displayName must be provided.
    displayName string
    The display name of the data store. Exactly one of dataStoreId or displayName must be provided. Returns an error if multiple data stores share the same display name.
    location string
    The geographic location where the data store resides. The value can only be one of "global", "us" and "eu". Defaults to global.
    project string
    The ID of the project to which the resource belongs. If it is not provided, the provider project is used.
    data_store_id str
    The unique id of the data store. Exactly one of dataStoreId or displayName must be provided.
    display_name str
    The display name of the data store. Exactly one of dataStoreId or displayName must be provided. Returns an error if multiple data stores share the same display name.
    location str
    The geographic location where the data store resides. The value can only be one of "global", "us" and "eu". Defaults to global.
    project str
    The ID of the project to which the resource belongs. If it is not provided, the provider project is used.
    dataStoreId String
    The unique id of the data store. Exactly one of dataStoreId or displayName must be provided.
    displayName String
    The display name of the data store. Exactly one of dataStoreId or displayName must be provided. Returns an error if multiple data stores share the same display name.
    location String
    The geographic location where the data store resides. The value can only be one of "global", "us" and "eu". Defaults to global.
    project String
    The ID of the project to which the resource belongs. If it is not provided, the provider project is used.

    getDataStore Result

    The following output properties are available:

    Supporting Types

    GetDataStoreAdvancedSiteSearchConfig

    DisableAutomaticRefresh bool
    If set true, automatic refresh is disabled for the DataStore.
    DisableInitialIndex bool
    If set true, initial indexing is disabled for the DataStore.
    DisableAutomaticRefresh bool
    If set true, automatic refresh is disabled for the DataStore.
    DisableInitialIndex bool
    If set true, initial indexing is disabled for the DataStore.
    disableAutomaticRefresh Boolean
    If set true, automatic refresh is disabled for the DataStore.
    disableInitialIndex Boolean
    If set true, initial indexing is disabled for the DataStore.
    disableAutomaticRefresh boolean
    If set true, automatic refresh is disabled for the DataStore.
    disableInitialIndex boolean
    If set true, initial indexing is disabled for the DataStore.
    disable_automatic_refresh bool
    If set true, automatic refresh is disabled for the DataStore.
    disable_initial_index bool
    If set true, initial indexing is disabled for the DataStore.
    disableAutomaticRefresh Boolean
    If set true, automatic refresh is disabled for the DataStore.
    disableInitialIndex Boolean
    If set true, initial indexing is disabled for the DataStore.

    GetDataStoreDocumentProcessingConfig

    ChunkingConfigs List<GetDataStoreDocumentProcessingConfigChunkingConfig>
    Whether chunking mode is enabled.
    DefaultParsingConfigs List<GetDataStoreDocumentProcessingConfigDefaultParsingConfig>
    Configurations for default Document parser. If not specified, this resource will be configured to use a default DigitalParsingConfig, and the default parsing config will be applied to all file types for Document parsing.
    Name string
    The full resource name of the Document Processing Config. Format: 'projects/{project}/locations/{location}/collections/{collection_id}/dataStores/{data_store_id}/documentProcessingConfig'.
    ParsingConfigOverrides List<GetDataStoreDocumentProcessingConfigParsingConfigOverride>
    Map from file type to override the default parsing configuration based on the file type. Supported keys:

    • 'pdf': Override parsing config for PDF files; digital parsing, OCR parsing, or layout parsing is supported.
    • 'html': Override parsing config for HTML files; only digital parsing and layout parsing are supported.
    • 'docx': Override parsing config for DOCX files; only digital parsing and layout parsing are supported.
    ChunkingConfigs []GetDataStoreDocumentProcessingConfigChunkingConfig
    Whether chunking mode is enabled.
    DefaultParsingConfigs []GetDataStoreDocumentProcessingConfigDefaultParsingConfig
    Configurations for default Document parser. If not specified, this resource will be configured to use a default DigitalParsingConfig, and the default parsing config will be applied to all file types for Document parsing.
    Name string
    The full resource name of the Document Processing Config. Format: 'projects/{project}/locations/{location}/collections/{collection_id}/dataStores/{data_store_id}/documentProcessingConfig'.
    ParsingConfigOverrides []GetDataStoreDocumentProcessingConfigParsingConfigOverride
    Map from file type to override the default parsing configuration based on the file type. Supported keys:

    • 'pdf': Override parsing config for PDF files; digital parsing, OCR parsing, or layout parsing is supported.
    • 'html': Override parsing config for HTML files; only digital parsing and layout parsing are supported.
    • 'docx': Override parsing config for DOCX files; only digital parsing and layout parsing are supported.
    chunkingConfigs List<GetDataStoreDocumentProcessingConfigChunkingConfig>
    Whether chunking mode is enabled.
    defaultParsingConfigs List<GetDataStoreDocumentProcessingConfigDefaultParsingConfig>
    Configurations for default Document parser. If not specified, this resource will be configured to use a default DigitalParsingConfig, and the default parsing config will be applied to all file types for Document parsing.
    name String
    The full resource name of the Document Processing Config. Format: 'projects/{project}/locations/{location}/collections/{collection_id}/dataStores/{data_store_id}/documentProcessingConfig'.
    parsingConfigOverrides List<GetDataStoreDocumentProcessingConfigParsingConfigOverride>
    Map from file type to override the default parsing configuration based on the file type. Supported keys:

    • 'pdf': Override parsing config for PDF files; digital parsing, OCR parsing, or layout parsing is supported.
    • 'html': Override parsing config for HTML files; only digital parsing and layout parsing are supported.
    • 'docx': Override parsing config for DOCX files; only digital parsing and layout parsing are supported.
    chunkingConfigs GetDataStoreDocumentProcessingConfigChunkingConfig[]
    Whether chunking mode is enabled.
    defaultParsingConfigs GetDataStoreDocumentProcessingConfigDefaultParsingConfig[]
    Configurations for default Document parser. If not specified, this resource will be configured to use a default DigitalParsingConfig, and the default parsing config will be applied to all file types for Document parsing.
    name string
    The full resource name of the Document Processing Config. Format: 'projects/{project}/locations/{location}/collections/{collection_id}/dataStores/{data_store_id}/documentProcessingConfig'.
    parsingConfigOverrides GetDataStoreDocumentProcessingConfigParsingConfigOverride[]
    Map from file type to override the default parsing configuration based on the file type. Supported keys:

    • 'pdf': Override parsing config for PDF files; digital parsing, OCR parsing, or layout parsing is supported.
    • 'html': Override parsing config for HTML files; only digital parsing and layout parsing are supported.
    • 'docx': Override parsing config for DOCX files; only digital parsing and layout parsing are supported.
    chunking_configs Sequence[GetDataStoreDocumentProcessingConfigChunkingConfig]
    Whether chunking mode is enabled.
    default_parsing_configs Sequence[GetDataStoreDocumentProcessingConfigDefaultParsingConfig]
    Configurations for default Document parser. If not specified, this resource will be configured to use a default DigitalParsingConfig, and the default parsing config will be applied to all file types for Document parsing.
    name str
    The full resource name of the Document Processing Config. Format: 'projects/{project}/locations/{location}/collections/{collection_id}/dataStores/{data_store_id}/documentProcessingConfig'.
    parsing_config_overrides Sequence[GetDataStoreDocumentProcessingConfigParsingConfigOverride]
    Map from file type to override the default parsing configuration based on the file type. Supported keys:

    • 'pdf': Override parsing config for PDF files; digital parsing, OCR parsing, or layout parsing is supported.
    • 'html': Override parsing config for HTML files; only digital parsing and layout parsing are supported.
    • 'docx': Override parsing config for DOCX files; only digital parsing and layout parsing are supported.
    chunkingConfigs List<Property Map>
    Whether chunking mode is enabled.
    defaultParsingConfigs List<Property Map>
    Configurations for default Document parser. If not specified, this resource will be configured to use a default DigitalParsingConfig, and the default parsing config will be applied to all file types for Document parsing.
    name String
    The full resource name of the Document Processing Config. Format: 'projects/{project}/locations/{location}/collections/{collection_id}/dataStores/{data_store_id}/documentProcessingConfig'.
    parsingConfigOverrides List<Property Map>
    Map from file type to override the default parsing configuration based on the file type. Supported keys:

    • 'pdf': Override parsing config for PDF files; digital parsing, OCR parsing, or layout parsing is supported.
    • 'html': Override parsing config for HTML files; only digital parsing and layout parsing are supported.
    • 'docx': Override parsing config for DOCX files; only digital parsing and layout parsing are supported.

    GetDataStoreDocumentProcessingConfigChunkingConfig

    layoutBasedChunkingConfigs List<Property Map>
    Configuration for the layout based chunking.

    GetDataStoreDocumentProcessingConfigChunkingConfigLayoutBasedChunkingConfig

    ChunkSize int
    The token size limit for each chunk. Supported values: 100-500 (inclusive). Default value: 500.
    IncludeAncestorHeadings bool
    Whether to append different levels of headings to chunks from the middle of the document to prevent context loss. Default value: False.
    ChunkSize int
    The token size limit for each chunk. Supported values: 100-500 (inclusive). Default value: 500.
    IncludeAncestorHeadings bool
    Whether to append different levels of headings to chunks from the middle of the document to prevent context loss. Default value: False.
    chunkSize Integer
    The token size limit for each chunk. Supported values: 100-500 (inclusive). Default value: 500.
    includeAncestorHeadings Boolean
    Whether to append different levels of headings to chunks from the middle of the document to prevent context loss. Default value: False.
    chunkSize number
    The token size limit for each chunk. Supported values: 100-500 (inclusive). Default value: 500.
    includeAncestorHeadings boolean
    Whether to append different levels of headings to chunks from the middle of the document to prevent context loss. Default value: False.
    chunk_size int
    The token size limit for each chunk. Supported values: 100-500 (inclusive). Default value: 500.
    include_ancestor_headings bool
    Whether to append different levels of headings to chunks from the middle of the document to prevent context loss. Default value: False.
    chunkSize Number
    The token size limit for each chunk. Supported values: 100-500 (inclusive). Default value: 500.
    includeAncestorHeadings Boolean
    Whether to append different levels of headings to chunks from the middle of the document to prevent context loss. Default value: False.

    GetDataStoreDocumentProcessingConfigDefaultParsingConfig

    digitalParsingConfigs List<Property Map>
    Configurations applied to digital parser.
    layoutParsingConfigs List<Property Map>
    Configurations applied to layout parser.
    ocrParsingConfigs List<Property Map>
    Configurations applied to OCR parser. Currently it only applies to PDFs.

    GetDataStoreDocumentProcessingConfigDefaultParsingConfigLayoutParsingConfig

    EnableImageAnnotation bool
    If true, the LLM based annotation is added to the image during parsing.
    EnableTableAnnotation bool
    If true, the LLM based annotation is added to the table during parsing.
    ExcludeHtmlClasses List<string>
    List of HTML classes to exclude from the parsed content.
    ExcludeHtmlElements List<string>
    List of HTML elements to exclude from the parsed content.
    ExcludeHtmlIds List<string>
    List of HTML ids to exclude from the parsed content.
    StructuredContentTypes List<string>
    Contains the required structure types to extract from the document. Supported values: 'shareholder-structure'.
    EnableImageAnnotation bool
    If true, the LLM based annotation is added to the image during parsing.
    EnableTableAnnotation bool
    If true, the LLM based annotation is added to the table during parsing.
    ExcludeHtmlClasses []string
    List of HTML classes to exclude from the parsed content.
    ExcludeHtmlElements []string
    List of HTML elements to exclude from the parsed content.
    ExcludeHtmlIds []string
    List of HTML ids to exclude from the parsed content.
    StructuredContentTypes []string
    Contains the required structure types to extract from the document. Supported values: 'shareholder-structure'.
    enableImageAnnotation Boolean
    If true, the LLM based annotation is added to the image during parsing.
    enableTableAnnotation Boolean
    If true, the LLM based annotation is added to the table during parsing.
    excludeHtmlClasses List<String>
    List of HTML classes to exclude from the parsed content.
    excludeHtmlElements List<String>
    List of HTML elements to exclude from the parsed content.
    excludeHtmlIds List<String>
    List of HTML ids to exclude from the parsed content.
    structuredContentTypes List<String>
    Contains the required structure types to extract from the document. Supported values: 'shareholder-structure'.
    enableImageAnnotation boolean
    If true, the LLM based annotation is added to the image during parsing.
    enableTableAnnotation boolean
    If true, the LLM based annotation is added to the table during parsing.
    excludeHtmlClasses string[]
    List of HTML classes to exclude from the parsed content.
    excludeHtmlElements string[]
    List of HTML elements to exclude from the parsed content.
    excludeHtmlIds string[]
    List of HTML ids to exclude from the parsed content.
    structuredContentTypes string[]
    Contains the required structure types to extract from the document. Supported values: 'shareholder-structure'.
    enable_image_annotation bool
    If true, the LLM based annotation is added to the image during parsing.
    enable_table_annotation bool
    If true, the LLM based annotation is added to the table during parsing.
    exclude_html_classes Sequence[str]
    List of HTML classes to exclude from the parsed content.
    exclude_html_elements Sequence[str]
    List of HTML elements to exclude from the parsed content.
    exclude_html_ids Sequence[str]
    List of HTML ids to exclude from the parsed content.
    structured_content_types Sequence[str]
    Contains the required structure types to extract from the document. Supported values: 'shareholder-structure'.
    enableImageAnnotation Boolean
    If true, the LLM based annotation is added to the image during parsing.
    enableTableAnnotation Boolean
    If true, the LLM based annotation is added to the table during parsing.
    excludeHtmlClasses List<String>
    List of HTML classes to exclude from the parsed content.
    excludeHtmlElements List<String>
    List of HTML elements to exclude from the parsed content.
    excludeHtmlIds List<String>
    List of HTML ids to exclude from the parsed content.
    structuredContentTypes List<String>
    Contains the required structure types to extract from the document. Supported values: 'shareholder-structure'.

    GetDataStoreDocumentProcessingConfigDefaultParsingConfigOcrParsingConfig

    UseNativeText bool
    If true, will use native text instead of OCR text on pages containing native text.
    UseNativeText bool
    If true, will use native text instead of OCR text on pages containing native text.
    useNativeText Boolean
    If true, will use native text instead of OCR text on pages containing native text.
    useNativeText boolean
    If true, will use native text instead of OCR text on pages containing native text.
    use_native_text bool
    If true, will use native text instead of OCR text on pages containing native text.
    useNativeText Boolean
    If true, will use native text instead of OCR text on pages containing native text.

    GetDataStoreDocumentProcessingConfigParsingConfigOverride

    digitalParsingConfigs List<Property Map>
    Configurations applied to digital parser.
    fileType String
    layoutParsingConfigs List<Property Map>
    Configurations applied to layout parser.
    ocrParsingConfigs List<Property Map>
    Configurations applied to OCR parser. Currently it only applies to PDFs.

    GetDataStoreDocumentProcessingConfigParsingConfigOverrideLayoutParsingConfig

    EnableImageAnnotation bool
    If true, the LLM based annotation is added to the image during parsing.
    EnableTableAnnotation bool
    If true, the LLM based annotation is added to the table during parsing.
    ExcludeHtmlClasses List<string>
    List of HTML classes to exclude from the parsed content.
    ExcludeHtmlElements List<string>
    List of HTML elements to exclude from the parsed content.
    ExcludeHtmlIds List<string>
    List of HTML ids to exclude from the parsed content.
    StructuredContentTypes List<string>
    Contains the required structure types to extract from the document. Supported values: 'shareholder-structure'.
    EnableImageAnnotation bool
    If true, the LLM based annotation is added to the image during parsing.
    EnableTableAnnotation bool
    If true, the LLM based annotation is added to the table during parsing.
    ExcludeHtmlClasses []string
    List of HTML classes to exclude from the parsed content.
    ExcludeHtmlElements []string
    List of HTML elements to exclude from the parsed content.
    ExcludeHtmlIds []string
    List of HTML ids to exclude from the parsed content.
    StructuredContentTypes []string
    Contains the required structure types to extract from the document. Supported values: 'shareholder-structure'.
    enableImageAnnotation Boolean
    If true, the LLM based annotation is added to the image during parsing.
    enableTableAnnotation Boolean
    If true, the LLM based annotation is added to the table during parsing.
    excludeHtmlClasses List<String>
    List of HTML classes to exclude from the parsed content.
    excludeHtmlElements List<String>
    List of HTML elements to exclude from the parsed content.
    excludeHtmlIds List<String>
    List of HTML ids to exclude from the parsed content.
    structuredContentTypes List<String>
    Contains the required structure types to extract from the document. Supported values: 'shareholder-structure'.
    enableImageAnnotation boolean
    If true, the LLM based annotation is added to the image during parsing.
    enableTableAnnotation boolean
    If true, the LLM based annotation is added to the table during parsing.
    excludeHtmlClasses string[]
    List of HTML classes to exclude from the parsed content.
    excludeHtmlElements string[]
    List of HTML elements to exclude from the parsed content.
    excludeHtmlIds string[]
    List of HTML ids to exclude from the parsed content.
    structuredContentTypes string[]
    Contains the required structure types to extract from the document. Supported values: 'shareholder-structure'.
    enable_image_annotation bool
    If true, the LLM based annotation is added to the image during parsing.
    enable_table_annotation bool
    If true, the LLM based annotation is added to the table during parsing.
    exclude_html_classes Sequence[str]
    List of HTML classes to exclude from the parsed content.
    exclude_html_elements Sequence[str]
    List of HTML elements to exclude from the parsed content.
    exclude_html_ids Sequence[str]
    List of HTML ids to exclude from the parsed content.
    structured_content_types Sequence[str]
    Contains the required structure types to extract from the document. Supported values: 'shareholder-structure'.
    enableImageAnnotation Boolean
    If true, the LLM based annotation is added to the image during parsing.
    enableTableAnnotation Boolean
    If true, the LLM based annotation is added to the table during parsing.
    excludeHtmlClasses List<String>
    List of HTML classes to exclude from the parsed content.
    excludeHtmlElements List<String>
    List of HTML elements to exclude from the parsed content.
    excludeHtmlIds List<String>
    List of HTML ids to exclude from the parsed content.
    structuredContentTypes List<String>
    Contains the required structure types to extract from the document. Supported values: 'shareholder-structure'.

    GetDataStoreDocumentProcessingConfigParsingConfigOverrideOcrParsingConfig

    UseNativeText bool
    If true, will use native text instead of OCR text on pages containing native text.
    UseNativeText bool
    If true, will use native text instead of OCR text on pages containing native text.
    useNativeText Boolean
    If true, will use native text instead of OCR text on pages containing native text.
    useNativeText boolean
    If true, will use native text instead of OCR text on pages containing native text.
    use_native_text bool
    If true, will use native text instead of OCR text on pages containing native text.
    useNativeText Boolean
    If true, will use native text instead of OCR text on pages containing native text.

    Package Details

    Repository
    Google Cloud (GCP) Classic pulumi/pulumi-gcp
    License
    Apache-2.0
    Notes
    This Pulumi package is based on the google-beta Terraform Provider.
    gcp logo
    Viewing docs for Google Cloud v9.21.0
    published on Friday, Apr 24, 2026 by Pulumi
      Try Pulumi Cloud free. Your team will thank you.