1. Packages
  2. Packages
  3. DataRobot
  4. API Docs
  5. Workload
Viewing docs for DataRobot v0.10.38
published on Friday, May 22, 2026 by DataRobot, Inc.
datarobot logo
Viewing docs for DataRobot v0.10.38
published on Friday, May 22, 2026 by DataRobot, Inc.

    A Workload runs a containerized artifact in the cluster and exposes an inference endpoint.

    Several attributes (including runtime and artifact_id) trigger replacement of the Workload when changed. To avoid downtime during a replacement, set create_before_destroy in the resource lifecycle so that the new Workload is created before the old one is destroyed:

    import * as pulumi from "@pulumi/pulumi";
    
    import pulumi
    
    package main
    
    import (
    	"github.com/pulumi/pulumi/sdk/v3/go/pulumi"
    )
    
    func main() {
    	pulumi.Run(func(ctx *pulumi.Context) error {
    		return nil
    	})
    }
    
    using System.Collections.Generic;
    using System.Linq;
    using Pulumi;
    
    return await Deployment.RunAsync(() => 
    {
    });
    
    package generated_program;
    
    import com.pulumi.Context;
    import com.pulumi.Pulumi;
    import com.pulumi.core.Output;
    import java.util.List;
    import java.util.ArrayList;
    import java.util.Map;
    import java.io.File;
    import java.nio.file.Files;
    import java.nio.file.Paths;
    
    public class App {
        public static void main(String[] args) {
            Pulumi.run(App::stack);
        }
    
        public static void stack(Context ctx) {
        }
    }
    
    {}
    
    Example coming soon!
    

    Create Workload Resource

    Resources are created with functions called constructors. To learn more about declaring and configuring resources, see Resources.

    Constructor syntax

    new Workload(name: string, args: WorkloadArgs, opts?: CustomResourceOptions);
    @overload
    def Workload(resource_name: str,
                 args: WorkloadArgs,
                 opts: Optional[ResourceOptions] = None)
    
    @overload
    def Workload(resource_name: str,
                 opts: Optional[ResourceOptions] = None,
                 artifact_id: Optional[str] = None,
                 runtime: Optional[WorkloadRuntimeArgs] = None,
                 description: Optional[str] = None,
                 importance: Optional[str] = None,
                 name: Optional[str] = None)
    func NewWorkload(ctx *Context, name string, args WorkloadArgs, opts ...ResourceOption) (*Workload, error)
    public Workload(string name, WorkloadArgs args, CustomResourceOptions? opts = null)
    public Workload(String name, WorkloadArgs args)
    public Workload(String name, WorkloadArgs args, CustomResourceOptions options)
    
    type: datarobot:Workload
    properties: # The arguments to resource properties.
    options: # Bag of options to control resource's behavior.
    
    
    resource "datarobot_workload" "name" {
        # resource properties
    }

    Parameters

    name string
    The unique name of the resource.
    args WorkloadArgs
    The arguments to resource properties.
    opts CustomResourceOptions
    Bag of options to control resource's behavior.
    resource_name str
    The unique name of the resource.
    args WorkloadArgs
    The arguments to resource properties.
    opts ResourceOptions
    Bag of options to control resource's behavior.
    ctx Context
    Context object for the current deployment.
    name string
    The unique name of the resource.
    args WorkloadArgs
    The arguments to resource properties.
    opts ResourceOption
    Bag of options to control resource's behavior.
    name string
    The unique name of the resource.
    args WorkloadArgs
    The arguments to resource properties.
    opts CustomResourceOptions
    Bag of options to control resource's behavior.
    name String
    The unique name of the resource.
    args WorkloadArgs
    The arguments to resource properties.
    options CustomResourceOptions
    Bag of options to control resource's behavior.

    Constructor example

    The following reference example uses placeholder values for all input properties.

    var workloadResource = new Datarobot.Workload("workloadResource", new()
    {
        ArtifactId = "string",
        Runtime = new Datarobot.Inputs.WorkloadRuntimeArgs
        {
            ContainerGroups = new[]
            {
                new Datarobot.Inputs.WorkloadRuntimeContainerGroupArgs
                {
                    Autoscaling = new Datarobot.Inputs.WorkloadRuntimeContainerGroupAutoscalingArgs
                    {
                        Policies = new[]
                        {
                            new Datarobot.Inputs.WorkloadRuntimeContainerGroupAutoscalingPolicyArgs
                            {
                                MaxCount = 0,
                                MinCount = 0,
                                ScalingMetric = "string",
                                Target = 0,
                                Priority = 0,
                            },
                        },
                        Enabled = false,
                    },
                    BundleSelectionPolicy = "string",
                    Containers = new[]
                    {
                        new Datarobot.Inputs.WorkloadRuntimeContainerGroupContainerArgs
                        {
                            Name = "string",
                            ResourceAllocation = new Datarobot.Inputs.WorkloadRuntimeContainerGroupContainerResourceAllocationArgs
                            {
                                Cpu = 0,
                                Gpu = 0,
                                GpuMemory = 0,
                                Memory = 0,
                            },
                        },
                    },
                    Name = "string",
                    ReplicaCount = 0,
                    ResourceBundles = new[]
                    {
                        "string",
                    },
                },
            },
        },
        Description = "string",
        Importance = "string",
        Name = "string",
    });
    
    example, err := datarobot.NewWorkload(ctx, "workloadResource", &datarobot.WorkloadArgs{
    	ArtifactId: pulumi.String("string"),
    	Runtime: &datarobot.WorkloadRuntimeArgs{
    		ContainerGroups: datarobot.WorkloadRuntimeContainerGroupArray{
    			&datarobot.WorkloadRuntimeContainerGroupArgs{
    				Autoscaling: &datarobot.WorkloadRuntimeContainerGroupAutoscalingArgs{
    					Policies: datarobot.WorkloadRuntimeContainerGroupAutoscalingPolicyArray{
    						&datarobot.WorkloadRuntimeContainerGroupAutoscalingPolicyArgs{
    							MaxCount:      pulumi.Int(0),
    							MinCount:      pulumi.Int(0),
    							ScalingMetric: pulumi.String("string"),
    							Target:        pulumi.Float64(0),
    							Priority:      pulumi.Int(0),
    						},
    					},
    					Enabled: pulumi.Bool(false),
    				},
    				BundleSelectionPolicy: pulumi.String("string"),
    				Containers: datarobot.WorkloadRuntimeContainerGroupContainerArray{
    					&datarobot.WorkloadRuntimeContainerGroupContainerArgs{
    						Name: pulumi.String("string"),
    						ResourceAllocation: &datarobot.WorkloadRuntimeContainerGroupContainerResourceAllocationArgs{
    							Cpu:       pulumi.Float64(0),
    							Gpu:       pulumi.Float64(0),
    							GpuMemory: pulumi.Int(0),
    							Memory:    pulumi.Int(0),
    						},
    					},
    				},
    				Name:         pulumi.String("string"),
    				ReplicaCount: pulumi.Int(0),
    				ResourceBundles: pulumi.StringArray{
    					pulumi.String("string"),
    				},
    			},
    		},
    	},
    	Description: pulumi.String("string"),
    	Importance:  pulumi.String("string"),
    	Name:        pulumi.String("string"),
    })
    
    resource "datarobot_workload" "workloadResource" {
      artifact_id = "string"
      runtime = {
        container_groups = [{
          "autoscaling" = {
            "policies" = [{
              "maxCount"      = 0
              "minCount"      = 0
              "scalingMetric" = "string"
              "target"        = 0
              "priority"      = 0
            }]
            "enabled" = false
          }
          "bundleSelectionPolicy" = "string"
          "containers" = [{
            "name" = "string"
            "resourceAllocation" = {
              "cpu"       = 0
              "gpu"       = 0
              "gpuMemory" = 0
              "memory"    = 0
            }
          }]
          "name"            = "string"
          "replicaCount"    = 0
          "resourceBundles" = ["string"]
        }]
      }
      description = "string"
      importance  = "string"
      name        = "string"
    }
    
    var workloadResource = new Workload("workloadResource", WorkloadArgs.builder()
        .artifactId("string")
        .runtime(WorkloadRuntimeArgs.builder()
            .containerGroups(WorkloadRuntimeContainerGroupArgs.builder()
                .autoscaling(WorkloadRuntimeContainerGroupAutoscalingArgs.builder()
                    .policies(WorkloadRuntimeContainerGroupAutoscalingPolicyArgs.builder()
                        .maxCount(0)
                        .minCount(0)
                        .scalingMetric("string")
                        .target(0.0)
                        .priority(0)
                        .build())
                    .enabled(false)
                    .build())
                .bundleSelectionPolicy("string")
                .containers(WorkloadRuntimeContainerGroupContainerArgs.builder()
                    .name("string")
                    .resourceAllocation(WorkloadRuntimeContainerGroupContainerResourceAllocationArgs.builder()
                        .cpu(0.0)
                        .gpu(0.0)
                        .gpuMemory(0)
                        .memory(0)
                        .build())
                    .build())
                .name("string")
                .replicaCount(0)
                .resourceBundles("string")
                .build())
            .build())
        .description("string")
        .importance("string")
        .name("string")
        .build());
    
    workload_resource = datarobot.Workload("workloadResource",
        artifact_id="string",
        runtime={
            "container_groups": [{
                "autoscaling": {
                    "policies": [{
                        "max_count": 0,
                        "min_count": 0,
                        "scaling_metric": "string",
                        "target": float(0),
                        "priority": 0,
                    }],
                    "enabled": False,
                },
                "bundle_selection_policy": "string",
                "containers": [{
                    "name": "string",
                    "resource_allocation": {
                        "cpu": float(0),
                        "gpu": float(0),
                        "gpu_memory": 0,
                        "memory": 0,
                    },
                }],
                "name": "string",
                "replica_count": 0,
                "resource_bundles": ["string"],
            }],
        },
        description="string",
        importance="string",
        name="string")
    
    const workloadResource = new datarobot.Workload("workloadResource", {
        artifactId: "string",
        runtime: {
            containerGroups: [{
                autoscaling: {
                    policies: [{
                        maxCount: 0,
                        minCount: 0,
                        scalingMetric: "string",
                        target: 0,
                        priority: 0,
                    }],
                    enabled: false,
                },
                bundleSelectionPolicy: "string",
                containers: [{
                    name: "string",
                    resourceAllocation: {
                        cpu: 0,
                        gpu: 0,
                        gpuMemory: 0,
                        memory: 0,
                    },
                }],
                name: "string",
                replicaCount: 0,
                resourceBundles: ["string"],
            }],
        },
        description: "string",
        importance: "string",
        name: "string",
    });
    
    type: datarobot:Workload
    properties:
        artifactId: string
        description: string
        importance: string
        name: string
        runtime:
            containerGroups:
                - autoscaling:
                    enabled: false
                    policies:
                        - maxCount: 0
                          minCount: 0
                          priority: 0
                          scalingMetric: string
                          target: 0
                  bundleSelectionPolicy: string
                  containers:
                    - name: string
                      resourceAllocation:
                        cpu: 0
                        gpu: 0
                        gpuMemory: 0
                        memory: 0
                  name: string
                  replicaCount: 0
                  resourceBundles:
                    - string
    

    Workload Resource Properties

    To learn more about resource properties and how to use them, see Inputs and Outputs in the Architecture and Concepts docs.

    Inputs

    In Python, inputs that are objects can be passed either as argument classes or as dictionary literals.

    The Workload resource accepts the following input properties:

    ArtifactId string
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    Runtime DataRobotWorkloadRuntime
    Runtime configuration for the Workload.
    Description string
    A human-readable description of the Workload.
    Importance string
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    Name string
    The name of the Workload.
    ArtifactId string
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    Runtime WorkloadRuntimeArgs
    Runtime configuration for the Workload.
    Description string
    A human-readable description of the Workload.
    Importance string
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    Name string
    The name of the Workload.
    artifact_id string
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    runtime object
    Runtime configuration for the Workload.
    description string
    A human-readable description of the Workload.
    importance string
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    name string
    The name of the Workload.
    artifactId String
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    runtime WorkloadRuntime
    Runtime configuration for the Workload.
    description String
    A human-readable description of the Workload.
    importance String
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    name String
    The name of the Workload.
    artifactId string
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    runtime WorkloadRuntime
    Runtime configuration for the Workload.
    description string
    A human-readable description of the Workload.
    importance string
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    name string
    The name of the Workload.
    artifact_id str
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    runtime WorkloadRuntimeArgs
    Runtime configuration for the Workload.
    description str
    A human-readable description of the Workload.
    importance str
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    name str
    The name of the Workload.
    artifactId String
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    runtime Property Map
    Runtime configuration for the Workload.
    description String
    A human-readable description of the Workload.
    importance String
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    name String
    The name of the Workload.

    Outputs

    All input properties are implicitly available as output properties. Additionally, the Workload resource produces the following output properties:

    Endpoint string
    The inference endpoint URL for the Workload.
    Id string
    The provider-assigned unique ID for this managed resource.
    Status string
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.
    Endpoint string
    The inference endpoint URL for the Workload.
    Id string
    The provider-assigned unique ID for this managed resource.
    Status string
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.
    endpoint string
    The inference endpoint URL for the Workload.
    id string
    The provider-assigned unique ID for this managed resource.
    status string
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.
    endpoint String
    The inference endpoint URL for the Workload.
    id String
    The provider-assigned unique ID for this managed resource.
    status String
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.
    endpoint string
    The inference endpoint URL for the Workload.
    id string
    The provider-assigned unique ID for this managed resource.
    status string
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.
    endpoint str
    The inference endpoint URL for the Workload.
    id str
    The provider-assigned unique ID for this managed resource.
    status str
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.
    endpoint String
    The inference endpoint URL for the Workload.
    id String
    The provider-assigned unique ID for this managed resource.
    status String
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.

    Look up Existing Workload Resource

    Get an existing Workload resource’s state with the given name, ID, and optional extra properties used to qualify the lookup.

    public static get(name: string, id: Input<ID>, state?: WorkloadState, opts?: CustomResourceOptions): Workload
    @staticmethod
    def get(resource_name: str,
            id: str,
            opts: Optional[ResourceOptions] = None,
            artifact_id: Optional[str] = None,
            description: Optional[str] = None,
            endpoint: Optional[str] = None,
            importance: Optional[str] = None,
            name: Optional[str] = None,
            runtime: Optional[WorkloadRuntimeArgs] = None,
            status: Optional[str] = None) -> Workload
    func GetWorkload(ctx *Context, name string, id IDInput, state *WorkloadState, opts ...ResourceOption) (*Workload, error)
    public static Workload Get(string name, Input<string> id, WorkloadState? state, CustomResourceOptions? opts = null)
    public static Workload get(String name, Output<String> id, WorkloadState state, CustomResourceOptions options)
    resources:
      _:
        type: datarobot:Workload
        get:
          id: ${id}
    import {
      to = datarobot_workload.example
      id = "${id}"
    }
    
    name
    The unique name of the resulting resource.
    id
    The unique provider ID of the resource to look up.
    state
    Any extra arguments used during the lookup.
    opts
    A bag of options that control this resource's behavior.
    resource_name
    The unique name of the resulting resource.
    id
    The unique provider ID of the resource to look up.
    name
    The unique name of the resulting resource.
    id
    The unique provider ID of the resource to look up.
    state
    Any extra arguments used during the lookup.
    opts
    A bag of options that control this resource's behavior.
    name
    The unique name of the resulting resource.
    id
    The unique provider ID of the resource to look up.
    state
    Any extra arguments used during the lookup.
    opts
    A bag of options that control this resource's behavior.
    name
    The unique name of the resulting resource.
    id
    The unique provider ID of the resource to look up.
    state
    Any extra arguments used during the lookup.
    opts
    A bag of options that control this resource's behavior.
    The following state arguments are supported:
    ArtifactId string
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    Description string
    A human-readable description of the Workload.
    Endpoint string
    The inference endpoint URL for the Workload.
    Importance string
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    Name string
    The name of the Workload.
    Runtime DataRobotWorkloadRuntime
    Runtime configuration for the Workload.
    Status string
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.
    ArtifactId string
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    Description string
    A human-readable description of the Workload.
    Endpoint string
    The inference endpoint URL for the Workload.
    Importance string
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    Name string
    The name of the Workload.
    Runtime WorkloadRuntimeArgs
    Runtime configuration for the Workload.
    Status string
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.
    artifact_id string
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    description string
    A human-readable description of the Workload.
    endpoint string
    The inference endpoint URL for the Workload.
    importance string
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    name string
    The name of the Workload.
    runtime object
    Runtime configuration for the Workload.
    status string
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.
    artifactId String
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    description String
    A human-readable description of the Workload.
    endpoint String
    The inference endpoint URL for the Workload.
    importance String
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    name String
    The name of the Workload.
    runtime WorkloadRuntime
    Runtime configuration for the Workload.
    status String
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.
    artifactId string
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    description string
    A human-readable description of the Workload.
    endpoint string
    The inference endpoint URL for the Workload.
    importance string
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    name string
    The name of the Workload.
    runtime WorkloadRuntime
    Runtime configuration for the Workload.
    status string
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.
    artifact_id str
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    description str
    A human-readable description of the Workload.
    endpoint str
    The inference endpoint URL for the Workload.
    importance str
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    name str
    The name of the Workload.
    runtime WorkloadRuntimeArgs
    Runtime configuration for the Workload.
    status str
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.
    artifactId String
    ID of the Artifact version to deploy. When using datarobot.Artifact, reference datarobot_artifact.<name>.artifact_id (not .id). Changing this value forces a new Workload to be created.
    description String
    A human-readable description of the Workload.
    endpoint String
    The inference endpoint URL for the Workload.
    importance String
    Priority level for the Workload: critical, high, moderate, or low. Defaults to low.
    name String
    The name of the Workload.
    runtime Property Map
    Runtime configuration for the Workload.
    status String
    Current status of the Workload: unknown, submitted, initializing, running, stopping, stopped, or errored.

    Supporting Types

    WorkloadRuntime, WorkloadRuntimeArgs

    ContainerGroups []WorkloadRuntimeContainerGroup
    Per-group runtime configuration.
    container_groups list(object)
    Per-group runtime configuration.
    containerGroups WorkloadRuntimeContainerGroup[]
    Per-group runtime configuration.
    containerGroups List<Property Map>
    Per-group runtime configuration.

    WorkloadRuntimeContainerGroup, WorkloadRuntimeContainerGroupArgs

    Autoscaling DataRobotWorkloadRuntimeContainerGroupAutoscaling
    Autoscaling configuration. When set, takes precedence over replica_count.
    BundleSelectionPolicy string
    How to select among resource_bundles. Defaults to availability.
    Containers List<DataRobotWorkloadRuntimeContainerGroupContainer>
    Per-container resource allocation overrides.
    Name string
    Container group name. This value is assigned by the server and is always `default`.
    ReplicaCount int
    Number of replicas. Cannot be set alongside autoscaling.enabled=true. Set to 0 to explicitly clear it.
    ResourceBundles List<string>
    Ordered list of resource bundle IDs. One is selected at scheduling time.
    Autoscaling WorkloadRuntimeContainerGroupAutoscaling
    Autoscaling configuration. When set, takes precedence over replica_count.
    BundleSelectionPolicy string
    How to select among resource_bundles. Defaults to availability.
    Containers []WorkloadRuntimeContainerGroupContainer
    Per-container resource allocation overrides.
    Name string
    Container group name. This value is assigned by the server and is always `default`.
    ReplicaCount int
    Number of replicas. Cannot be set alongside autoscaling.enabled=true. Set to 0 to explicitly clear it.
    ResourceBundles []string
    Ordered list of resource bundle IDs. One is selected at scheduling time.
    autoscaling object
    Autoscaling configuration. When set, takes precedence over replica_count.
    bundle_selection_policy string
    How to select among resource_bundles. Defaults to availability.
    containers list(object)
    Per-container resource allocation overrides.
    name string
    Container group name. This value is assigned by the server and is always `default`.
    replica_count number
    Number of replicas. Cannot be set alongside autoscaling.enabled=true. Set to 0 to explicitly clear it.
    resource_bundles list(string)
    Ordered list of resource bundle IDs. One is selected at scheduling time.
    autoscaling WorkloadRuntimeContainerGroupAutoscaling
    Autoscaling configuration. When set, takes precedence over replica_count.
    bundleSelectionPolicy String
    How to select among resource_bundles. Defaults to availability.
    containers List<WorkloadRuntimeContainerGroupContainer>
    Per-container resource allocation overrides.
    name String
    Container group name. This value is assigned by the server and is always `default`.
    replicaCount Integer
    Number of replicas. Cannot be set alongside autoscaling.enabled=true. Set to 0 to explicitly clear it.
    resourceBundles List<String>
    Ordered list of resource bundle IDs. One is selected at scheduling time.
    autoscaling WorkloadRuntimeContainerGroupAutoscaling
    Autoscaling configuration. When set, takes precedence over replica_count.
    bundleSelectionPolicy string
    How to select among resource_bundles. Defaults to availability.
    containers WorkloadRuntimeContainerGroupContainer[]
    Per-container resource allocation overrides.
    name string
    Container group name. This value is assigned by the server and is always `default`.
    replicaCount number
    Number of replicas. Cannot be set alongside autoscaling.enabled=true. Set to 0 to explicitly clear it.
    resourceBundles string[]
    Ordered list of resource bundle IDs. One is selected at scheduling time.
    autoscaling WorkloadRuntimeContainerGroupAutoscaling
    Autoscaling configuration. When set, takes precedence over replica_count.
    bundle_selection_policy str
    How to select among resource_bundles. Defaults to availability.
    containers Sequence[WorkloadRuntimeContainerGroupContainer]
    Per-container resource allocation overrides.
    name str
    Container group name. This value is assigned by the server and is always `default`.
    replica_count int
    Number of replicas. Cannot be set alongside autoscaling.enabled=true. Set to 0 to explicitly clear it.
    resource_bundles Sequence[str]
    Ordered list of resource bundle IDs. One is selected at scheduling time.
    autoscaling Property Map
    Autoscaling configuration. When set, takes precedence over replica_count.
    bundleSelectionPolicy String
    How to select among resource_bundles. Defaults to availability.
    containers List<Property Map>
    Per-container resource allocation overrides.
    name String
    Container group name. This value is assigned by the server and is always `default`.
    replicaCount Number
    Number of replicas. Cannot be set alongside autoscaling.enabled=true. Set to 0 to explicitly clear it.
    resourceBundles List<String>
    Ordered list of resource bundle IDs. One is selected at scheduling time.

    WorkloadRuntimeContainerGroupAutoscaling, WorkloadRuntimeContainerGroupAutoscalingArgs

    Policies List<DataRobotWorkloadRuntimeContainerGroupAutoscalingPolicy>
    Scaling policies that define when and how to scale.
    Enabled bool
    Whether autoscaling is enabled. Defaults to true.
    Policies []WorkloadRuntimeContainerGroupAutoscalingPolicy
    Scaling policies that define when and how to scale.
    Enabled bool
    Whether autoscaling is enabled. Defaults to true.
    policies list(object)
    Scaling policies that define when and how to scale.
    enabled bool
    Whether autoscaling is enabled. Defaults to true.
    policies List<WorkloadRuntimeContainerGroupAutoscalingPolicy>
    Scaling policies that define when and how to scale.
    enabled Boolean
    Whether autoscaling is enabled. Defaults to true.
    policies WorkloadRuntimeContainerGroupAutoscalingPolicy[]
    Scaling policies that define when and how to scale.
    enabled boolean
    Whether autoscaling is enabled. Defaults to true.
    policies Sequence[WorkloadRuntimeContainerGroupAutoscalingPolicy]
    Scaling policies that define when and how to scale.
    enabled bool
    Whether autoscaling is enabled. Defaults to true.
    policies List<Property Map>
    Scaling policies that define when and how to scale.
    enabled Boolean
    Whether autoscaling is enabled. Defaults to true.

    WorkloadRuntimeContainerGroupAutoscalingPolicy, WorkloadRuntimeContainerGroupAutoscalingPolicyArgs

    MaxCount int
    Maximum number of replicas.
    MinCount int
    Minimum number of replicas.
    ScalingMetric string
    Metric used for scaling decisions: cpuAverageUtilization, httpRequestsConcurrency, gpuCacheUtilization, or gpuRequestQueueDepth.
    Target double
    Target value for the scaling metric.
    Priority int
    Policy priority when multiple policies are defined.
    MaxCount int
    Maximum number of replicas.
    MinCount int
    Minimum number of replicas.
    ScalingMetric string
    Metric used for scaling decisions: cpuAverageUtilization, httpRequestsConcurrency, gpuCacheUtilization, or gpuRequestQueueDepth.
    Target float64
    Target value for the scaling metric.
    Priority int
    Policy priority when multiple policies are defined.
    max_count number
    Maximum number of replicas.
    min_count number
    Minimum number of replicas.
    scaling_metric string
    Metric used for scaling decisions: cpuAverageUtilization, httpRequestsConcurrency, gpuCacheUtilization, or gpuRequestQueueDepth.
    target number
    Target value for the scaling metric.
    priority number
    Policy priority when multiple policies are defined.
    maxCount Integer
    Maximum number of replicas.
    minCount Integer
    Minimum number of replicas.
    scalingMetric String
    Metric used for scaling decisions: cpuAverageUtilization, httpRequestsConcurrency, gpuCacheUtilization, or gpuRequestQueueDepth.
    target Double
    Target value for the scaling metric.
    priority Integer
    Policy priority when multiple policies are defined.
    maxCount number
    Maximum number of replicas.
    minCount number
    Minimum number of replicas.
    scalingMetric string
    Metric used for scaling decisions: cpuAverageUtilization, httpRequestsConcurrency, gpuCacheUtilization, or gpuRequestQueueDepth.
    target number
    Target value for the scaling metric.
    priority number
    Policy priority when multiple policies are defined.
    max_count int
    Maximum number of replicas.
    min_count int
    Minimum number of replicas.
    scaling_metric str
    Metric used for scaling decisions: cpuAverageUtilization, httpRequestsConcurrency, gpuCacheUtilization, or gpuRequestQueueDepth.
    target float
    Target value for the scaling metric.
    priority int
    Policy priority when multiple policies are defined.
    maxCount Number
    Maximum number of replicas.
    minCount Number
    Minimum number of replicas.
    scalingMetric String
    Metric used for scaling decisions: cpuAverageUtilization, httpRequestsConcurrency, gpuCacheUtilization, or gpuRequestQueueDepth.
    target Number
    Target value for the scaling metric.
    priority Number
    Policy priority when multiple policies are defined.

    WorkloadRuntimeContainerGroupContainer, WorkloadRuntimeContainerGroupContainerArgs

    Name string
    Container name. Must match a container declared in the artifact group.
    ResourceAllocation DataRobotWorkloadRuntimeContainerGroupContainerResourceAllocation
    Resource allocation for this container.
    Name string
    Container name. Must match a container declared in the artifact group.
    ResourceAllocation WorkloadRuntimeContainerGroupContainerResourceAllocation
    Resource allocation for this container.
    name string
    Container name. Must match a container declared in the artifact group.
    resource_allocation object
    Resource allocation for this container.
    name String
    Container name. Must match a container declared in the artifact group.
    resourceAllocation WorkloadRuntimeContainerGroupContainerResourceAllocation
    Resource allocation for this container.
    name string
    Container name. Must match a container declared in the artifact group.
    resourceAllocation WorkloadRuntimeContainerGroupContainerResourceAllocation
    Resource allocation for this container.
    name str
    Container name. Must match a container declared in the artifact group.
    resource_allocation WorkloadRuntimeContainerGroupContainerResourceAllocation
    Resource allocation for this container.
    name String
    Container name. Must match a container declared in the artifact group.
    resourceAllocation Property Map
    Resource allocation for this container.

    WorkloadRuntimeContainerGroupContainerResourceAllocation, WorkloadRuntimeContainerGroupContainerResourceAllocationArgs

    Cpu double
    CPU cores allocated to this container.
    Gpu double
    GPUs allocated to this container.
    GpuMemory int
    GPU VRAM allocated in bytes.
    Memory int
    RAM allocated in bytes.
    Cpu float64
    CPU cores allocated to this container.
    Gpu float64
    GPUs allocated to this container.
    GpuMemory int
    GPU VRAM allocated in bytes.
    Memory int
    RAM allocated in bytes.
    cpu number
    CPU cores allocated to this container.
    gpu number
    GPUs allocated to this container.
    gpu_memory number
    GPU VRAM allocated in bytes.
    memory number
    RAM allocated in bytes.
    cpu Double
    CPU cores allocated to this container.
    gpu Double
    GPUs allocated to this container.
    gpuMemory Integer
    GPU VRAM allocated in bytes.
    memory Integer
    RAM allocated in bytes.
    cpu number
    CPU cores allocated to this container.
    gpu number
    GPUs allocated to this container.
    gpuMemory number
    GPU VRAM allocated in bytes.
    memory number
    RAM allocated in bytes.
    cpu float
    CPU cores allocated to this container.
    gpu float
    GPUs allocated to this container.
    gpu_memory int
    GPU VRAM allocated in bytes.
    memory int
    RAM allocated in bytes.
    cpu Number
    CPU cores allocated to this container.
    gpu Number
    GPUs allocated to this container.
    gpuMemory Number
    GPU VRAM allocated in bytes.
    memory Number
    RAM allocated in bytes.

    Package Details

    Repository
    datarobot datarobot-community/pulumi-datarobot
    License
    Apache-2.0
    Notes
    This Pulumi package is based on the datarobot Terraform Provider.
    datarobot logo
    Viewing docs for DataRobot v0.10.38
    published on Friday, May 22, 2026 by DataRobot, Inc.

      Try Pulumi Cloud free.
      Your team will thank you.

      Start free trial