published on Friday, May 22, 2026 by DataRobot, Inc.
published on Friday, May 22, 2026 by DataRobot, Inc.
A Workload runs a containerized artifact in the cluster and exposes an inference endpoint.
Several attributes (including runtime and artifact_id) trigger replacement when changed. To avoid downtime during replacements, it is recommended to set create_before_destroy in the resource lifecycle:
import * as pulumi from "@pulumi/pulumi";
import pulumi
package main
import (
"github.com/pulumi/pulumi/sdk/v3/go/pulumi"
)
func main() {
pulumi.Run(func(ctx *pulumi.Context) error {
return nil
})
}
using System.Collections.Generic;
using System.Linq;
using Pulumi;
return await Deployment.RunAsync(() =>
{
});
package generated_program;
import com.pulumi.Context;
import com.pulumi.Pulumi;
import com.pulumi.core.Output;
import java.util.List;
import java.util.ArrayList;
import java.util.Map;
import java.io.File;
import java.nio.file.Files;
import java.nio.file.Paths;
public class App {
public static void main(String[] args) {
Pulumi.run(App::stack);
}
public static void stack(Context ctx) {
}
}
{}
Example coming soon!
Create Workload Resource
Resources are created with functions called constructors. To learn more about declaring and configuring resources, see Resources.
Constructor syntax
new Workload(name: string, args: WorkloadArgs, opts?: CustomResourceOptions);
@overload
def Workload(resource_name: str,
args: WorkloadArgs,
opts: Optional[ResourceOptions] = None)
@overload
def Workload(resource_name: str,
opts: Optional[ResourceOptions] = None,
artifact_id: Optional[str] = None,
runtime: Optional[WorkloadRuntimeArgs] = None,
description: Optional[str] = None,
importance: Optional[str] = None,
name: Optional[str] = None)
func NewWorkload(ctx *Context, name string, args WorkloadArgs, opts ...ResourceOption) (*Workload, error)
public Workload(string name, WorkloadArgs args, CustomResourceOptions? opts = null)
public Workload(String name, WorkloadArgs args)
public Workload(String name, WorkloadArgs args, CustomResourceOptions options)
type: datarobot:Workload
properties: # The arguments to resource properties.
options: # Bag of options to control resource's behavior.
resource "datarobot_workload" "name" {
# resource properties
}
Parameters
- name string
- The unique name of the resource.
- args WorkloadArgs
- The arguments to resource properties.
- opts CustomResourceOptions
- Bag of options to control resource's behavior.
- resource_name str
- The unique name of the resource.
- args WorkloadArgs
- The arguments to resource properties.
- opts ResourceOptions
- Bag of options to control resource's behavior.
- ctx Context
- Context object for the current deployment.
- name string
- The unique name of the resource.
- args WorkloadArgs
- The arguments to resource properties.
- opts ResourceOption
- Bag of options to control resource's behavior.
- name string
- The unique name of the resource.
- args WorkloadArgs
- The arguments to resource properties.
- opts CustomResourceOptions
- Bag of options to control resource's behavior.
- name String
- The unique name of the resource.
- args WorkloadArgs
- The arguments to resource properties.
- options CustomResourceOptions
- Bag of options to control resource's behavior.
Constructor example
The following reference example uses placeholder values for all input properties.
var workloadResource = new Datarobot.Workload("workloadResource", new()
{
ArtifactId = "string",
Runtime = new Datarobot.Inputs.WorkloadRuntimeArgs
{
ContainerGroups = new[]
{
new Datarobot.Inputs.WorkloadRuntimeContainerGroupArgs
{
Autoscaling = new Datarobot.Inputs.WorkloadRuntimeContainerGroupAutoscalingArgs
{
Policies = new[]
{
new Datarobot.Inputs.WorkloadRuntimeContainerGroupAutoscalingPolicyArgs
{
MaxCount = 0,
MinCount = 0,
ScalingMetric = "string",
Target = 0,
Priority = 0,
},
},
Enabled = false,
},
BundleSelectionPolicy = "string",
Containers = new[]
{
new Datarobot.Inputs.WorkloadRuntimeContainerGroupContainerArgs
{
Name = "string",
ResourceAllocation = new Datarobot.Inputs.WorkloadRuntimeContainerGroupContainerResourceAllocationArgs
{
Cpu = 0,
Gpu = 0,
GpuMemory = 0,
Memory = 0,
},
},
},
Name = "string",
ReplicaCount = 0,
ResourceBundles = new[]
{
"string",
},
},
},
},
Description = "string",
Importance = "string",
Name = "string",
});
example, err := datarobot.NewWorkload(ctx, "workloadResource", &datarobot.WorkloadArgs{
ArtifactId: pulumi.String("string"),
Runtime: &datarobot.WorkloadRuntimeArgs{
ContainerGroups: datarobot.WorkloadRuntimeContainerGroupArray{
&datarobot.WorkloadRuntimeContainerGroupArgs{
Autoscaling: &datarobot.WorkloadRuntimeContainerGroupAutoscalingArgs{
Policies: datarobot.WorkloadRuntimeContainerGroupAutoscalingPolicyArray{
&datarobot.WorkloadRuntimeContainerGroupAutoscalingPolicyArgs{
MaxCount: pulumi.Int(0),
MinCount: pulumi.Int(0),
ScalingMetric: pulumi.String("string"),
Target: pulumi.Float64(0),
Priority: pulumi.Int(0),
},
},
Enabled: pulumi.Bool(false),
},
BundleSelectionPolicy: pulumi.String("string"),
Containers: datarobot.WorkloadRuntimeContainerGroupContainerArray{
&datarobot.WorkloadRuntimeContainerGroupContainerArgs{
Name: pulumi.String("string"),
ResourceAllocation: &datarobot.WorkloadRuntimeContainerGroupContainerResourceAllocationArgs{
Cpu: pulumi.Float64(0),
Gpu: pulumi.Float64(0),
GpuMemory: pulumi.Int(0),
Memory: pulumi.Int(0),
},
},
},
Name: pulumi.String("string"),
ReplicaCount: pulumi.Int(0),
ResourceBundles: pulumi.StringArray{
pulumi.String("string"),
},
},
},
},
Description: pulumi.String("string"),
Importance: pulumi.String("string"),
Name: pulumi.String("string"),
})
resource "datarobot_workload" "workloadResource" {
artifact_id = "string"
runtime = {
container_groups = [{
"autoscaling" = {
"policies" = [{
"maxCount" = 0
"minCount" = 0
"scalingMetric" = "string"
"target" = 0
"priority" = 0
}]
"enabled" = false
}
"bundleSelectionPolicy" = "string"
"containers" = [{
"name" = "string"
"resourceAllocation" = {
"cpu" = 0
"gpu" = 0
"gpuMemory" = 0
"memory" = 0
}
}]
"name" = "string"
"replicaCount" = 0
"resourceBundles" = ["string"]
}]
}
description = "string"
importance = "string"
name = "string"
}
var workloadResource = new Workload("workloadResource", WorkloadArgs.builder()
.artifactId("string")
.runtime(WorkloadRuntimeArgs.builder()
.containerGroups(WorkloadRuntimeContainerGroupArgs.builder()
.autoscaling(WorkloadRuntimeContainerGroupAutoscalingArgs.builder()
.policies(WorkloadRuntimeContainerGroupAutoscalingPolicyArgs.builder()
.maxCount(0)
.minCount(0)
.scalingMetric("string")
.target(0.0)
.priority(0)
.build())
.enabled(false)
.build())
.bundleSelectionPolicy("string")
.containers(WorkloadRuntimeContainerGroupContainerArgs.builder()
.name("string")
.resourceAllocation(WorkloadRuntimeContainerGroupContainerResourceAllocationArgs.builder()
.cpu(0.0)
.gpu(0.0)
.gpuMemory(0)
.memory(0)
.build())
.build())
.name("string")
.replicaCount(0)
.resourceBundles("string")
.build())
.build())
.description("string")
.importance("string")
.name("string")
.build());
workload_resource = datarobot.Workload("workloadResource",
artifact_id="string",
runtime={
"container_groups": [{
"autoscaling": {
"policies": [{
"max_count": 0,
"min_count": 0,
"scaling_metric": "string",
"target": float(0),
"priority": 0,
}],
"enabled": False,
},
"bundle_selection_policy": "string",
"containers": [{
"name": "string",
"resource_allocation": {
"cpu": float(0),
"gpu": float(0),
"gpu_memory": 0,
"memory": 0,
},
}],
"name": "string",
"replica_count": 0,
"resource_bundles": ["string"],
}],
},
description="string",
importance="string",
name="string")
const workloadResource = new datarobot.Workload("workloadResource", {
artifactId: "string",
runtime: {
containerGroups: [{
autoscaling: {
policies: [{
maxCount: 0,
minCount: 0,
scalingMetric: "string",
target: 0,
priority: 0,
}],
enabled: false,
},
bundleSelectionPolicy: "string",
containers: [{
name: "string",
resourceAllocation: {
cpu: 0,
gpu: 0,
gpuMemory: 0,
memory: 0,
},
}],
name: "string",
replicaCount: 0,
resourceBundles: ["string"],
}],
},
description: "string",
importance: "string",
name: "string",
});
type: datarobot:Workload
properties:
artifactId: string
description: string
importance: string
name: string
runtime:
containerGroups:
- autoscaling:
enabled: false
policies:
- maxCount: 0
minCount: 0
priority: 0
scalingMetric: string
target: 0
bundleSelectionPolicy: string
containers:
- name: string
resourceAllocation:
cpu: 0
gpu: 0
gpuMemory: 0
memory: 0
name: string
replicaCount: 0
resourceBundles:
- string
Workload Resource Properties
To learn more about resource properties and how to use them, see Inputs and Outputs in the Architecture and Concepts docs.
Inputs
In Python, inputs that are objects can be passed either as argument classes or as dictionary literals.
The Workload resource accepts the following input properties:
- ArtifactId string
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- Runtime DataRobotWorkloadRuntime
- Runtime configuration for the Workload.
- Description string
- A human-readable description of the Workload.
- Importance string
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- Name string
- The name of the Workload.
- ArtifactId string
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- Runtime WorkloadRuntimeArgs
- Runtime configuration for the Workload.
- Description string
- A human-readable description of the Workload.
- Importance string
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- Name string
- The name of the Workload.
- artifact_id string
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- runtime object
- Runtime configuration for the Workload.
- description string
- A human-readable description of the Workload.
- importance string
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- name string
- The name of the Workload.
- artifactId String
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- runtime WorkloadRuntime
- Runtime configuration for the Workload.
- description String
- A human-readable description of the Workload.
- importance String
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- name String
- The name of the Workload.
- artifactId string
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- runtime WorkloadRuntime
- Runtime configuration for the Workload.
- description string
- A human-readable description of the Workload.
- importance string
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- name string
- The name of the Workload.
- artifact_id str
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- runtime WorkloadRuntimeArgs
- Runtime configuration for the Workload.
- description str
- A human-readable description of the Workload.
- importance str
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- name str
- The name of the Workload.
- artifactId String
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- runtime Property Map
- Runtime configuration for the Workload.
- description String
- A human-readable description of the Workload.
- importance String
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- name String
- The name of the Workload.
Outputs
All input properties are implicitly available as output properties. Additionally, the Workload resource produces the following output properties:
Look up Existing Workload Resource
Get an existing Workload resource’s state with the given name, ID, and optional extra properties used to qualify the lookup.
public static get(name: string, id: Input<ID>, state?: WorkloadState, opts?: CustomResourceOptions): Workload
@staticmethod
def get(resource_name: str,
id: str,
opts: Optional[ResourceOptions] = None,
artifact_id: Optional[str] = None,
description: Optional[str] = None,
endpoint: Optional[str] = None,
importance: Optional[str] = None,
name: Optional[str] = None,
runtime: Optional[WorkloadRuntimeArgs] = None,
status: Optional[str] = None) -> Workload
func GetWorkload(ctx *Context, name string, id IDInput, state *WorkloadState, opts ...ResourceOption) (*Workload, error)
public static Workload Get(string name, Input<string> id, WorkloadState? state, CustomResourceOptions? opts = null)
public static Workload get(String name, Output<String> id, WorkloadState state, CustomResourceOptions options)
resources:
  _:
    type: datarobot:Workload
    get:
      id: ${id}
import {
to = datarobot_workload.example
id = "${id}"
}
- name
- The unique name of the resulting resource.
- id
- The unique provider ID of the resource to lookup.
- state
- Any extra arguments used during the lookup.
- opts
- A bag of options that control this resource's behavior.
- resource_name
- The unique name of the resulting resource.
- id
- The unique provider ID of the resource to lookup.
- name
- The unique name of the resulting resource.
- id
- The unique provider ID of the resource to lookup.
- state
- Any extra arguments used during the lookup.
- opts
- A bag of options that control this resource's behavior.
- name
- The unique name of the resulting resource.
- id
- The unique provider ID of the resource to lookup.
- state
- Any extra arguments used during the lookup.
- opts
- A bag of options that control this resource's behavior.
- name
- The unique name of the resulting resource.
- id
- The unique provider ID of the resource to lookup.
- state
- Any extra arguments used during the lookup.
- opts
- A bag of options that control this resource's behavior.
- ArtifactId string
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- Description string
- A human-readable description of the Workload.
- Endpoint string
- The inference endpoint URL for the Workload.
- Importance string
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- Name string
- The name of the Workload.
- Runtime DataRobotWorkloadRuntime
- Runtime configuration for the Workload.
- Status string
- Current status of the Workload: `unknown`, `submitted`, `initializing`, `running`, `stopping`, `stopped`, or `errored`.
- ArtifactId string
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- Description string
- A human-readable description of the Workload.
- Endpoint string
- The inference endpoint URL for the Workload.
- Importance string
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- Name string
- The name of the Workload.
- Runtime WorkloadRuntimeArgs
- Runtime configuration for the Workload.
- Status string
- Current status of the Workload: `unknown`, `submitted`, `initializing`, `running`, `stopping`, `stopped`, or `errored`.
- artifact_id string
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- description string
- A human-readable description of the Workload.
- endpoint string
- The inference endpoint URL for the Workload.
- importance string
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- name string
- The name of the Workload.
- runtime object
- Runtime configuration for the Workload.
- status string
- Current status of the Workload: `unknown`, `submitted`, `initializing`, `running`, `stopping`, `stopped`, or `errored`.
- artifactId String
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- description String
- A human-readable description of the Workload.
- endpoint String
- The inference endpoint URL for the Workload.
- importance String
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- name String
- The name of the Workload.
- runtime WorkloadRuntime
- Runtime configuration for the Workload.
- status String
- Current status of the Workload: `unknown`, `submitted`, `initializing`, `running`, `stopping`, `stopped`, or `errored`.
- artifactId string
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- description string
- A human-readable description of the Workload.
- endpoint string
- The inference endpoint URL for the Workload.
- importance string
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- name string
- The name of the Workload.
- runtime WorkloadRuntime
- Runtime configuration for the Workload.
- status string
- Current status of the Workload: `unknown`, `submitted`, `initializing`, `running`, `stopping`, `stopped`, or `errored`.
- artifact_id str
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- description str
- A human-readable description of the Workload.
- endpoint str
- The inference endpoint URL for the Workload.
- importance str
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- name str
- The name of the Workload.
- runtime WorkloadRuntimeArgs
- Runtime configuration for the Workload.
- status str
- Current status of the Workload: `unknown`, `submitted`, `initializing`, `running`, `stopping`, `stopped`, or `errored`.
- artifactId String
- ID of the Artifact version to deploy. When using `datarobot.Artifact`, reference `datarobot_artifact.<name>.artifact_id` (not `.id`). Changing this value forces a new Workload to be created.
- description String
- A human-readable description of the Workload.
- endpoint String
- The inference endpoint URL for the Workload.
- importance String
- Priority level for the Workload: `critical`, `high`, `moderate`, or `low`. Defaults to `low`.
- name String
- The name of the Workload.
- runtime Property Map
- Runtime configuration for the Workload.
- status String
- Current status of the Workload: `unknown`, `submitted`, `initializing`, `running`, `stopping`, `stopped`, or `errored`.
Supporting Types
WorkloadRuntime, WorkloadRuntimeArgs
- ContainerGroups List<DataRobotWorkloadRuntimeContainerGroup>
- Per-group runtime configuration.
- ContainerGroups []WorkloadRuntimeContainerGroup
- Per-group runtime configuration.
- container_groups list(object)
- Per-group runtime configuration.
- containerGroups List<WorkloadRuntimeContainerGroup>
- Per-group runtime configuration.
- containerGroups WorkloadRuntimeContainerGroup[]
- Per-group runtime configuration.
- container_groups Sequence[WorkloadRuntimeContainerGroup]
- Per-group runtime configuration.
- containerGroups List<Property Map>
- Per-group runtime configuration.
WorkloadRuntimeContainerGroup, WorkloadRuntimeContainerGroupArgs
- Autoscaling DataRobotWorkloadRuntimeContainerGroupAutoscaling
- Autoscaling configuration. When set, takes precedence over `replica_count`.
- BundleSelectionPolicy string
- How to select among `resource_bundles`. Defaults to `availability`.
- Containers List<DataRobotWorkloadRuntimeContainerGroupContainer>
- Per-container resource allocation overrides.
- Name string
- Container group name (server-assigned, always `default`).
- ReplicaCount int
- Number of replicas. Cannot be set alongside `autoscaling.enabled=true`. Set to `0` to explicitly clear it.
- ResourceBundles List<string>
- Ordered list of resource bundle IDs. One is selected at scheduling time.
- Autoscaling WorkloadRuntimeContainerGroupAutoscaling
- Autoscaling configuration. When set, takes precedence over `replica_count`.
- BundleSelectionPolicy string
- How to select among `resource_bundles`. Defaults to `availability`.
- Containers []WorkloadRuntimeContainerGroupContainer
- Per-container resource allocation overrides.
- Name string
- Container group name (server-assigned, always `default`).
- ReplicaCount int
- Number of replicas. Cannot be set alongside `autoscaling.enabled=true`. Set to `0` to explicitly clear it.
- ResourceBundles []string
- Ordered list of resource bundle IDs. One is selected at scheduling time.
- autoscaling object
- Autoscaling configuration. When set, takes precedence over `replica_count`.
- bundle_selection_policy string
- How to select among `resource_bundles`. Defaults to `availability`.
- containers list(object)
- Per-container resource allocation overrides.
- name string
- Container group name (server-assigned, always `default`).
- replica_count number
- Number of replicas. Cannot be set alongside `autoscaling.enabled=true`. Set to `0` to explicitly clear it.
- resource_bundles list(string)
- Ordered list of resource bundle IDs. One is selected at scheduling time.
- autoscaling WorkloadRuntimeContainerGroupAutoscaling
- Autoscaling configuration. When set, takes precedence over `replica_count`.
- bundleSelectionPolicy String
- How to select among `resource_bundles`. Defaults to `availability`.
- containers List<WorkloadRuntimeContainerGroupContainer>
- Per-container resource allocation overrides.
- name String
- Container group name (server-assigned, always `default`).
- replicaCount Integer
- Number of replicas. Cannot be set alongside `autoscaling.enabled=true`. Set to `0` to explicitly clear it.
- resourceBundles List<String>
- Ordered list of resource bundle IDs. One is selected at scheduling time.
- autoscaling WorkloadRuntimeContainerGroupAutoscaling
- Autoscaling configuration. When set, takes precedence over `replica_count`.
- bundleSelectionPolicy string
- How to select among `resource_bundles`. Defaults to `availability`.
- containers WorkloadRuntimeContainerGroupContainer[]
- Per-container resource allocation overrides.
- name string
- Container group name (server-assigned, always `default`).
- replicaCount number
- Number of replicas. Cannot be set alongside `autoscaling.enabled=true`. Set to `0` to explicitly clear it.
- resourceBundles string[]
- Ordered list of resource bundle IDs. One is selected at scheduling time.
- autoscaling WorkloadRuntimeContainerGroupAutoscaling
- Autoscaling configuration. When set, takes precedence over `replica_count`.
- bundle_selection_policy str
- How to select among `resource_bundles`. Defaults to `availability`.
- containers Sequence[WorkloadRuntimeContainerGroupContainer]
- Per-container resource allocation overrides.
- name str
- Container group name (server-assigned, always `default`).
- replica_count int
- Number of replicas. Cannot be set alongside `autoscaling.enabled=true`. Set to `0` to explicitly clear it.
- resource_bundles Sequence[str]
- Ordered list of resource bundle IDs. One is selected at scheduling time.
- autoscaling Property Map
- Autoscaling configuration. When set, takes precedence over `replica_count`.
- bundleSelectionPolicy String
- How to select among `resource_bundles`. Defaults to `availability`.
- containers List<Property Map>
- Per-container resource allocation overrides.
- name String
- Container group name (server-assigned, always `default`).
- replicaCount Number
- Number of replicas. Cannot be set alongside `autoscaling.enabled=true`. Set to `0` to explicitly clear it.
- resourceBundles List<String>
- Ordered list of resource bundle IDs. One is selected at scheduling time.
WorkloadRuntimeContainerGroupAutoscaling, WorkloadRuntimeContainerGroupAutoscalingArgs
- Policies List<DataRobotWorkloadRuntimeContainerGroupAutoscalingPolicy>
- Scaling policies that define when and how to scale.
- Enabled bool
- Whether autoscaling is enabled. Defaults to true.
- Policies []WorkloadRuntimeContainerGroupAutoscalingPolicy
- Scaling policies that define when and how to scale.
- Enabled bool
- Whether autoscaling is enabled. Defaults to true.
- policies list(object)
- Scaling policies that define when and how to scale.
- enabled bool
- Whether autoscaling is enabled. Defaults to true.
- policies List<WorkloadRuntimeContainerGroupAutoscalingPolicy>
- Scaling policies that define when and how to scale.
- enabled Boolean
- Whether autoscaling is enabled. Defaults to true.
- policies WorkloadRuntimeContainerGroupAutoscalingPolicy[]
- Scaling policies that define when and how to scale.
- enabled boolean
- Whether autoscaling is enabled. Defaults to true.
- policies Sequence[WorkloadRuntimeContainerGroupAutoscalingPolicy]
- Scaling policies that define when and how to scale.
- enabled bool
- Whether autoscaling is enabled. Defaults to true.
- policies List<Property Map>
- Scaling policies that define when and how to scale.
- enabled Boolean
- Whether autoscaling is enabled. Defaults to true.
WorkloadRuntimeContainerGroupAutoscalingPolicy, WorkloadRuntimeContainerGroupAutoscalingPolicyArgs
- MaxCount int
- Maximum number of replicas.
- MinCount int
- Minimum number of replicas.
- ScalingMetric string
- Metric used for scaling decisions: `cpuAverageUtilization`, `httpRequestsConcurrency`, `gpuCacheUtilization`, or `gpuRequestQueueDepth`.
- Target double
- Target value for the scaling metric.
- Priority int
- Policy priority when multiple policies are defined.
- MaxCount int
- Maximum number of replicas.
- MinCount int
- Minimum number of replicas.
- ScalingMetric string
- Metric used for scaling decisions: `cpuAverageUtilization`, `httpRequestsConcurrency`, `gpuCacheUtilization`, or `gpuRequestQueueDepth`.
- Target float64
- Target value for the scaling metric.
- Priority int
- Policy priority when multiple policies are defined.
- max_count number
- Maximum number of replicas.
- min_count number
- Minimum number of replicas.
- scaling_metric string
- Metric used for scaling decisions: `cpuAverageUtilization`, `httpRequestsConcurrency`, `gpuCacheUtilization`, or `gpuRequestQueueDepth`.
- target number
- Target value for the scaling metric.
- priority number
- Policy priority when multiple policies are defined.
- maxCount Integer
- Maximum number of replicas.
- minCount Integer
- Minimum number of replicas.
- scalingMetric String
- Metric used for scaling decisions: `cpuAverageUtilization`, `httpRequestsConcurrency`, `gpuCacheUtilization`, or `gpuRequestQueueDepth`.
- target Double
- Target value for the scaling metric.
- priority Integer
- Policy priority when multiple policies are defined.
- maxCount number
- Maximum number of replicas.
- minCount number
- Minimum number of replicas.
- scalingMetric string
- Metric used for scaling decisions: `cpuAverageUtilization`, `httpRequestsConcurrency`, `gpuCacheUtilization`, or `gpuRequestQueueDepth`.
- target number
- Target value for the scaling metric.
- priority number
- Policy priority when multiple policies are defined.
- max_count int
- Maximum number of replicas.
- min_count int
- Minimum number of replicas.
- scaling_metric str
- Metric used for scaling decisions: `cpuAverageUtilization`, `httpRequestsConcurrency`, `gpuCacheUtilization`, or `gpuRequestQueueDepth`.
- target float
- Target value for the scaling metric.
- priority int
- Policy priority when multiple policies are defined.
- maxCount Number
- Maximum number of replicas.
- minCount Number
- Minimum number of replicas.
- scalingMetric String
- Metric used for scaling decisions: `cpuAverageUtilization`, `httpRequestsConcurrency`, `gpuCacheUtilization`, or `gpuRequestQueueDepth`.
- target Number
- Target value for the scaling metric.
- priority Number
- Policy priority when multiple policies are defined.
WorkloadRuntimeContainerGroupContainer, WorkloadRuntimeContainerGroupContainerArgs
- Name string
- Container name. Must match a container declared in the artifact group.
- ResourceAllocation DataRobotWorkloadRuntimeContainerGroupContainerResourceAllocation
- Resource allocation for this container.
- Name string
- Container name. Must match a container declared in the artifact group.
- ResourceAllocation WorkloadRuntimeContainerGroupContainerResourceAllocation
- Resource allocation for this container.
- name string
- Container name. Must match a container declared in the artifact group.
- resource_allocation object
- Resource allocation for this container.
- name String
- Container name. Must match a container declared in the artifact group.
- resourceAllocation WorkloadRuntimeContainerGroupContainerResourceAllocation
- Resource allocation for this container.
- name string
- Container name. Must match a container declared in the artifact group.
- resourceAllocation WorkloadRuntimeContainerGroupContainerResourceAllocation
- Resource allocation for this container.
- name str
- Container name. Must match a container declared in the artifact group.
- resource_allocation WorkloadRuntimeContainerGroupContainerResourceAllocation
- Resource allocation for this container.
- name String
- Container name. Must match a container declared in the artifact group.
- resourceAllocation Property Map
- Resource allocation for this container.
WorkloadRuntimeContainerGroupContainerResourceAllocation, WorkloadRuntimeContainerGroupContainerResourceAllocationArgs
- cpu number
- CPU cores allocated to this container.
- gpu number
- GPUs allocated to this container.
- gpu_memory number
- GPU VRAM allocated in bytes.
- memory number
- RAM allocated in bytes.
- cpu float
- CPU cores allocated to this container.
- gpu float
- GPUs allocated to this container.
- gpu_memory int
- GPU VRAM allocated in bytes.
- memory int
- RAM allocated in bytes.
Package Details
- Repository
- datarobot datarobot-community/pulumi-datarobot
- License
- Apache-2.0
- Notes
- This Pulumi package is based on the `datarobot` Terraform Provider.
published on Friday, May 22, 2026 by DataRobot, Inc.