scaleway.inference.Model
Explore with Pulumi AI
The scaleway.inference.Model resource allows you to upload and manage inference models in the Scaleway Inference ecosystem. Once registered, a model can be used in any scaleway.inference.Deployment resource.
Example Usage
Basic
import * as pulumi from "@pulumi/pulumi";
import * as scaleway from "@pulumiverse/scaleway";
const test = new scaleway.inference.Model("test", {
name: "my-awesome-model",
url: "https://huggingface.co/agentica-org/DeepCoder-14B-Preview",
secret: "my-secret-token",
});
import pulumi
import pulumiverse_scaleway as scaleway
test = scaleway.inference.Model("test",
name="my-awesome-model",
url="https://huggingface.co/agentica-org/DeepCoder-14B-Preview",
secret="my-secret-token")
package main
import (
"github.com/pulumi/pulumi/sdk/v3/go/pulumi"
"github.com/pulumiverse/pulumi-scaleway/sdk/go/scaleway/inference"
)
func main() {
pulumi.Run(func(ctx *pulumi.Context) error {
_, err := inference.NewModel(ctx, "test", &inference.ModelArgs{
Name: pulumi.String("my-awesome-model"),
Url: pulumi.String("https://huggingface.co/agentica-org/DeepCoder-14B-Preview"),
Secret: pulumi.String("my-secret-token"),
})
if err != nil {
return err
}
return nil
})
}
using System.Collections.Generic;
using System.Linq;
using Pulumi;
using Scaleway = Pulumiverse.Scaleway;
return await Deployment.RunAsync(() =>
{
var test = new Scaleway.Inference.Model("test", new()
{
Name = "my-awesome-model",
Url = "https://huggingface.co/agentica-org/DeepCoder-14B-Preview",
Secret = "my-secret-token",
});
});
package generated_program;
import com.pulumi.Context;
import com.pulumi.Pulumi;
import com.pulumi.core.Output;
import com.pulumi.scaleway.inference.Model;
import com.pulumi.scaleway.inference.ModelArgs;
import java.util.List;
import java.util.ArrayList;
import java.util.Map;
import java.io.File;
import java.nio.file.Files;
import java.nio.file.Paths;
public class App {
public static void main(String[] args) {
Pulumi.run(App::stack);
}
public static void stack(Context ctx) {
var test = new Model("test", ModelArgs.builder()
.name("my-awesome-model")
.url("https://huggingface.co/agentica-org/DeepCoder-14B-Preview")
.secret("my-secret-token")
.build());
}
}
resources:
test:
type: scaleway:inference:Model
properties:
name: my-awesome-model
url: https://huggingface.co/agentica-org/DeepCoder-14B-Preview
secret: my-secret-token
Deploy your own model on your managed inference
import * as pulumi from "@pulumi/pulumi";
import * as scaleway from "@pulumiverse/scaleway";
const myModel = new scaleway.inference.Model("my_model", {
name: "my-awesome-model",
url: "https://huggingface.co/agentica-org/DeepCoder-14B-Preview",
secret: "my-secret-token",
});
const myDeployment = new scaleway.inference.Deployment("my_deployment", {
name: "test-inference-deployment-basic",
nodeType: "H100",
modelId: myModel.id,
publicEndpoint: {
isEnabled: true,
},
acceptEula: true,
});
import pulumi
import pulumiverse_scaleway as scaleway
my_model = scaleway.inference.Model("my_model",
name="my-awesome-model",
url="https://huggingface.co/agentica-org/DeepCoder-14B-Preview",
secret="my-secret-token")
my_deployment = scaleway.inference.Deployment("my_deployment",
name="test-inference-deployment-basic",
node_type="H100",
model_id=my_model.id,
public_endpoint={
"is_enabled": True,
},
accept_eula=True)
package main
import (
"github.com/pulumi/pulumi/sdk/v3/go/pulumi"
"github.com/pulumiverse/pulumi-scaleway/sdk/go/scaleway/inference"
)
func main() {
pulumi.Run(func(ctx *pulumi.Context) error {
myModel, err := inference.NewModel(ctx, "my_model", &inference.ModelArgs{
Name: pulumi.String("my-awesome-model"),
Url: pulumi.String("https://huggingface.co/agentica-org/DeepCoder-14B-Preview"),
Secret: pulumi.String("my-secret-token"),
})
if err != nil {
return err
}
_, err = inference.NewDeployment(ctx, "my_deployment", &inference.DeploymentArgs{
Name: pulumi.String("test-inference-deployment-basic"),
NodeType: pulumi.String("H100"),
ModelId: myModel.ID(),
PublicEndpoint: &inference.DeploymentPublicEndpointArgs{
IsEnabled: pulumi.Bool(true),
},
AcceptEula: pulumi.Bool(true),
})
if err != nil {
return err
}
return nil
})
}
using System.Collections.Generic;
using System.Linq;
using Pulumi;
using Scaleway = Pulumiverse.Scaleway;
return await Deployment.RunAsync(() =>
{
var myModel = new Scaleway.Inference.Model("my_model", new()
{
Name = "my-awesome-model",
Url = "https://huggingface.co/agentica-org/DeepCoder-14B-Preview",
Secret = "my-secret-token",
});
var myDeployment = new Scaleway.Inference.Deployment("my_deployment", new()
{
Name = "test-inference-deployment-basic",
NodeType = "H100",
ModelId = myModel.Id,
PublicEndpoint = new Scaleway.Inference.Inputs.DeploymentPublicEndpointArgs
{
IsEnabled = true,
},
AcceptEula = true,
});
});
package generated_program;
import com.pulumi.Context;
import com.pulumi.Pulumi;
import com.pulumi.core.Output;
import com.pulumi.scaleway.inference.Model;
import com.pulumi.scaleway.inference.ModelArgs;
import com.pulumi.scaleway.inference.Deployment;
import com.pulumi.scaleway.inference.DeploymentArgs;
import com.pulumi.scaleway.inference.inputs.DeploymentPublicEndpointArgs;
import java.util.List;
import java.util.ArrayList;
import java.util.Map;
import java.io.File;
import java.nio.file.Files;
import java.nio.file.Paths;
public class App {
public static void main(String[] args) {
Pulumi.run(App::stack);
}
public static void stack(Context ctx) {
var myModel = new Model("myModel", ModelArgs.builder()
.name("my-awesome-model")
.url("https://huggingface.co/agentica-org/DeepCoder-14B-Preview")
.secret("my-secret-token")
.build());
var myDeployment = new Deployment("myDeployment", DeploymentArgs.builder()
.name("test-inference-deployment-basic")
.nodeType("H100")
.modelId(myModel.id())
.publicEndpoint(DeploymentPublicEndpointArgs.builder()
.isEnabled(true)
.build())
.acceptEula(true)
.build());
}
}
resources:
myModel:
type: scaleway:inference:Model
name: my_model
properties:
name: my-awesome-model
url: https://huggingface.co/agentica-org/DeepCoder-14B-Preview
secret: my-secret-token
myDeployment:
type: scaleway:inference:Deployment
name: my_deployment
properties:
name: test-inference-deployment-basic
nodeType: H100
modelId: ${myModel.id}
publicEndpoint:
isEnabled: true
acceptEula: true
Create Model Resource
Resources are created with functions called constructors. To learn more about declaring and configuring resources, see Resources.
Constructor syntax
new Model(name: string, args: ModelArgs, opts?: CustomResourceOptions);
@overload
def Model(resource_name: str,
args: ModelArgs,
opts: Optional[ResourceOptions] = None)
@overload
def Model(resource_name: str,
opts: Optional[ResourceOptions] = None,
url: Optional[str] = None,
name: Optional[str] = None,
project_id: Optional[str] = None,
region: Optional[str] = None,
secret: Optional[str] = None)
func NewModel(ctx *Context, name string, args ModelArgs, opts ...ResourceOption) (*Model, error)
public Model(string name, ModelArgs args, CustomResourceOptions? opts = null)
type: scaleway:inference:Model
properties: # The arguments to resource properties.
options: # Bag of options to control resource's behavior.
Parameters
- name string
- The unique name of the resource.
- args ModelArgs
- The arguments to resource properties.
- opts CustomResourceOptions
- Bag of options to control resource's behavior.
- resource_name str
- The unique name of the resource.
- args ModelArgs
- The arguments to resource properties.
- opts ResourceOptions
- Bag of options to control resource's behavior.
- ctx Context
- Context object for the current deployment.
- name string
- The unique name of the resource.
- args ModelArgs
- The arguments to resource properties.
- opts ResourceOption
- Bag of options to control resource's behavior.
- name string
- The unique name of the resource.
- args ModelArgs
- The arguments to resource properties.
- opts CustomResourceOptions
- Bag of options to control resource's behavior.
- name String
- The unique name of the resource.
- args ModelArgs
- The arguments to resource properties.
- options CustomResourceOptions
- Bag of options to control resource's behavior.
Constructor example
The following reference example uses placeholder values for all input properties.
var modelResource = new Scaleway.Inference.Model("modelResource", new()
{
Url = "string",
Name = "string",
ProjectId = "string",
Region = "string",
Secret = "string",
});
example, err := inference.NewModel(ctx, "modelResource", &inference.ModelArgs{
Url: pulumi.String("string"),
Name: pulumi.String("string"),
ProjectId: pulumi.String("string"),
Region: pulumi.String("string"),
Secret: pulumi.String("string"),
})
var modelResource = new Model("modelResource", ModelArgs.builder()
.url("string")
.name("string")
.projectId("string")
.region("string")
.secret("string")
.build());
model_resource = scaleway.inference.Model("modelResource",
url="string",
name="string",
project_id="string",
region="string",
secret="string")
const modelResource = new scaleway.inference.Model("modelResource", {
url: "string",
name: "string",
projectId: "string",
region: "string",
secret: "string",
});
type: scaleway:inference:Model
properties:
name: string
projectId: string
region: string
secret: string
url: string
Model Resource Properties
To learn more about resource properties and how to use them, see Inputs and Outputs in the Architecture and Concepts docs.
Inputs
In Python, inputs that are objects can be passed either as argument classes or as dictionary literals.
The Model resource accepts the following input properties:
- Url string
- The HTTPS source URL from which the model will be downloaded. This is typically a Hugging Face repository URL (e.g., https://huggingface.co/agentica-org/DeepCoder-14B-Preview). The URL must be publicly accessible or require valid credentials supplied via `secret`.
- Name string
- The name of the model. This must be unique within the project.
- ProjectId string
- (Defaults to provider `project_id`) The ID of the project the model is associated with.
- Region string
- (Defaults to provider `region`) The region in which the model is created.
- Secret string
- Authentication token used to pull the model from a private or gated URL (e.g., a Hugging Face access token with read permission).
- Url string
- The HTTPS source URL from which the model will be downloaded. This is typically a Hugging Face repository URL (e.g., https://huggingface.co/agentica-org/DeepCoder-14B-Preview). The URL must be publicly accessible or require valid credentials supplied via `secret`.
- Name string
- The name of the model. This must be unique within the project.
- ProjectId string
- (Defaults to provider `project_id`) The ID of the project the model is associated with.
- Region string
- (Defaults to provider `region`) The region in which the model is created.
- Secret string
- Authentication token used to pull the model from a private or gated URL (e.g., a Hugging Face access token with read permission).
- url String
- The HTTPS source URL from which the model will be downloaded. This is typically a Hugging Face repository URL (e.g., https://huggingface.co/agentica-org/DeepCoder-14B-Preview). The URL must be publicly accessible or require valid credentials supplied via `secret`.
- name String
- The name of the model. This must be unique within the project.
- projectId String
- (Defaults to provider `project_id`) The ID of the project the model is associated with.
- region String
- (Defaults to provider `region`) The region in which the model is created.
- secret String
- Authentication token used to pull the model from a private or gated URL (e.g., a Hugging Face access token with read permission).
- url string
- The HTTPS source URL from which the model will be downloaded. This is typically a Hugging Face repository URL (e.g., https://huggingface.co/agentica-org/DeepCoder-14B-Preview). The URL must be publicly accessible or require valid credentials supplied via `secret`.
- name string
- The name of the model. This must be unique within the project.
- projectId string
- (Defaults to provider `project_id`) The ID of the project the model is associated with.
- region string
- (Defaults to provider `region`) The region in which the model is created.
- secret string
- Authentication token used to pull the model from a private or gated URL (e.g., a Hugging Face access token with read permission).
- url str
- The HTTPS source URL from which the model will be downloaded. This is typically a Hugging Face repository URL (e.g., https://huggingface.co/agentica-org/DeepCoder-14B-Preview). The URL must be publicly accessible or require valid credentials supplied via `secret`.
- name str
- The name of the model. This must be unique within the project.
- project_id str
- (Defaults to provider `project_id`) The ID of the project the model is associated with.
- region str
- (Defaults to provider `region`) The region in which the model is created.
- secret str
- Authentication token used to pull the model from a private or gated URL (e.g., a Hugging Face access token with read permission).
- url String
- The HTTPS source URL from which the model will be downloaded. This is typically a Hugging Face repository URL (e.g., https://huggingface.co/agentica-org/DeepCoder-14B-Preview). The URL must be publicly accessible or require valid credentials supplied via `secret`.
- name String
- The name of the model. This must be unique within the project.
- projectId String
- (Defaults to provider `project_id`) The ID of the project the model is associated with.
- region String
- (Defaults to provider `region`) The region in which the model is created.
- secret String
- Authentication token used to pull the model from a private or gated URL (e.g., a Hugging Face access token with read permission).
Outputs
All input properties are implicitly available as output properties. Additionally, the Model resource produces the following output properties:
- CreatedAt string
- The date and time of the creation of the model.
- Description string
- A textual description of the model (if available).
- HasEula bool
- Whether the model requires end-user license agreement acceptance before use.
- Id string
- The provider-assigned unique ID for this managed resource.
- NodesSupports List<Pulumiverse.Scaleway.Inference.Outputs.ModelNodesSupport>
- List of supported node types and their quantization options. Each entry is a ModelNodesSupport (see Supporting Types).
- ParameterSizeBits int
- Size, in bits, of the model parameters.
- SizeBytes int
- Total size, in bytes, of the model archive.
- Status string
- The current status of the model (e.g., ready, error, etc.).
- Tags List<string>
- Tags associated with the model.
- UpdatedAt string
- The date and time of the last update of the model.
- CreatedAt string
- The date and time of the creation of the model.
- Description string
- A textual description of the model (if available).
- HasEula bool
- Whether the model requires end-user license agreement acceptance before use.
- Id string
- The provider-assigned unique ID for this managed resource.
- NodesSupports []ModelNodesSupport
- List of supported node types and their quantization options. Each entry is a ModelNodesSupport (see Supporting Types).
- ParameterSizeBits int
- Size, in bits, of the model parameters.
- SizeBytes int
- Total size, in bytes, of the model archive.
- Status string
- The current status of the model (e.g., ready, error, etc.).
- Tags []string
- Tags associated with the model.
- UpdatedAt string
- The date and time of the last update of the model.
- createdAt String
- The date and time of the creation of the model.
- description String
- A textual description of the model (if available).
- hasEula Boolean
- Whether the model requires end-user license agreement acceptance before use.
- id String
- The provider-assigned unique ID for this managed resource.
- nodesSupports List<ModelNodesSupport>
- List of supported node types and their quantization options. Each entry is a ModelNodesSupport (see Supporting Types).
- parameterSizeBits Integer
- Size, in bits, of the model parameters.
- sizeBytes Integer
- Total size, in bytes, of the model archive.
- status String
- The current status of the model (e.g., ready, error, etc.).
- tags List<String>
- Tags associated with the model.
- updatedAt String
- The date and time of the last update of the model.
- createdAt string
- The date and time of the creation of the model.
- description string
- A textual description of the model (if available).
- hasEula boolean
- Whether the model requires end-user license agreement acceptance before use.
- id string
- The provider-assigned unique ID for this managed resource.
- nodesSupports ModelNodesSupport[]
- List of supported node types and their quantization options. Each entry is a ModelNodesSupport (see Supporting Types).
- parameterSizeBits number
- Size, in bits, of the model parameters.
- sizeBytes number
- Total size, in bytes, of the model archive.
- status string
- The current status of the model (e.g., ready, error, etc.).
- tags string[]
- Tags associated with the model.
- updatedAt string
- The date and time of the last update of the model.
- created_at str
- The date and time of the creation of the model.
- description str
- A textual description of the model (if available).
- has_eula bool
- Whether the model requires end-user license agreement acceptance before use.
- id str
- The provider-assigned unique ID for this managed resource.
- nodes_supports Sequence[ModelNodesSupport]
- List of supported node types and their quantization options. Each entry is a ModelNodesSupport (see Supporting Types).
- parameter_size_bits int
- Size, in bits, of the model parameters.
- size_bytes int
- Total size, in bytes, of the model archive.
- status str
- The current status of the model (e.g., ready, error, etc.).
- tags Sequence[str]
- Tags associated with the model.
- updated_at str
- The date and time of the last update of the model.
- createdAt String
- The date and time of the creation of the model.
- description String
- A textual description of the model (if available).
- hasEula Boolean
- Whether the model requires end-user license agreement acceptance before use.
- id String
- The provider-assigned unique ID for this managed resource.
- nodesSupports List<Property Map>
- List of supported node types and their quantization options. Each entry is a ModelNodesSupport (see Supporting Types).
- parameterSizeBits Number
- Size, in bits, of the model parameters.
- sizeBytes Number
- Total size, in bytes, of the model archive.
- status String
- The current status of the model (e.g., ready, error, etc.).
- tags List<String>
- Tags associated with the model.
- updatedAt String
- The date and time of the last update of the model.
Look up Existing Model Resource
Get an existing Model resource’s state with the given name, ID, and optional extra properties used to qualify the lookup.
public static get(name: string, id: Input<ID>, state?: ModelState, opts?: CustomResourceOptions): Model
@staticmethod
def get(resource_name: str,
id: str,
opts: Optional[ResourceOptions] = None,
created_at: Optional[str] = None,
description: Optional[str] = None,
has_eula: Optional[bool] = None,
name: Optional[str] = None,
nodes_supports: Optional[Sequence[ModelNodesSupportArgs]] = None,
parameter_size_bits: Optional[int] = None,
project_id: Optional[str] = None,
region: Optional[str] = None,
secret: Optional[str] = None,
size_bytes: Optional[int] = None,
status: Optional[str] = None,
tags: Optional[Sequence[str]] = None,
updated_at: Optional[str] = None,
url: Optional[str] = None) -> Model
func GetModel(ctx *Context, name string, id IDInput, state *ModelState, opts ...ResourceOption) (*Model, error)
public static Model Get(string name, Input<string> id, ModelState? state, CustomResourceOptions? opts = null)
public static Model get(String name, Output<String> id, ModelState state, CustomResourceOptions options)
resources:
  _:
    type: scaleway:inference:Model
    get:
      id: ${id}
- name
- The unique name of the resulting resource.
- id
- The unique provider ID of the resource to lookup.
- state
- Any extra arguments used during the lookup.
- opts
- A bag of options that control this resource's behavior.
- resource_name
- The unique name of the resulting resource.
- id
- The unique provider ID of the resource to lookup.
- name
- The unique name of the resulting resource.
- id
- The unique provider ID of the resource to lookup.
- state
- Any extra arguments used during the lookup.
- opts
- A bag of options that control this resource's behavior.
- name
- The unique name of the resulting resource.
- id
- The unique provider ID of the resource to lookup.
- state
- Any extra arguments used during the lookup.
- opts
- A bag of options that control this resource's behavior.
- name
- The unique name of the resulting resource.
- id
- The unique provider ID of the resource to lookup.
- state
- Any extra arguments used during the lookup.
- opts
- A bag of options that control this resource's behavior.
- CreatedAt string
- The date and time of the creation of the model.
- Description string
- A textual description of the model (if available).
- HasEula bool
- Whether the model requires end-user license agreement acceptance before use.
- Name string
- The name of the model. This must be unique within the project.
- NodesSupports List<Pulumiverse.Scaleway.Inference.Inputs.ModelNodesSupport>
- List of supported node types and their quantization options. Each entry is a ModelNodesSupport (see Supporting Types).
- ParameterSizeBits int
- Size, in bits, of the model parameters.
- ProjectId string
- (Defaults to provider `project_id`) The ID of the project the model is associated with.
- Region string
- (Defaults to provider `region`) The region in which the model is created.
- Secret string
- Authentication token used to pull the model from a private or gated URL (e.g., a Hugging Face access token with read permission).
- SizeBytes int
- Total size, in bytes, of the model archive.
- Status string
- The current status of the model (e.g., ready, error, etc.).
- Tags List<string>
- Tags associated with the model.
- UpdatedAt string
- The date and time of the last update of the model.
- Url string
- The HTTPS source URL from which the model will be downloaded. This is typically a Hugging Face repository URL (e.g., https://huggingface.co/agentica-org/DeepCoder-14B-Preview). The URL must be publicly accessible or require valid credentials supplied via `secret`.
- CreatedAt string
- The date and time of the creation of the model.
- Description string
- A textual description of the model (if available).
- HasEula bool
- Whether the model requires end-user license agreement acceptance before use.
- Name string
- The name of the model. This must be unique within the project.
- NodesSupports []ModelNodesSupportArgs
- List of supported node types and their quantization options. Each entry is a ModelNodesSupport (see Supporting Types).
- ParameterSizeBits int
- Size, in bits, of the model parameters.
- ProjectId string
- (Defaults to provider `project_id`) The ID of the project the model is associated with.
- Region string
- (Defaults to provider `region`) The region in which the model is created.
- Secret string
- Authentication token used to pull the model from a private or gated URL (e.g., a Hugging Face access token with read permission).
- SizeBytes int
- Total size, in bytes, of the model archive.
- Status string
- The current status of the model (e.g., ready, error, etc.).
- Tags []string
- Tags associated with the model.
- UpdatedAt string
- The date and time of the last update of the model.
- Url string
- The HTTPS source URL from which the model will be downloaded. This is typically a Hugging Face repository URL (e.g., https://huggingface.co/agentica-org/DeepCoder-14B-Preview). The URL must be publicly accessible or require valid credentials supplied via `secret`.
- createdAt String
- The date and time of the creation of the model.
- description String
- A textual description of the model (if available).
- hasEula Boolean
- Whether the model requires end-user license agreement acceptance before use.
- name String
- The name of the model. This must be unique within the project.
- nodesSupports List<ModelNodesSupport>
- List of supported node types and their quantization options. Each entry is a ModelNodesSupport (see Supporting Types).
- parameterSizeBits Integer
- Size, in bits, of the model parameters.
- projectId String
- (Defaults to provider `project_id`) The ID of the project the model is associated with.
- region String
- (Defaults to provider `region`) The region in which the model is created.
- secret String
- Authentication token used to pull the model from a private or gated URL (e.g., a Hugging Face access token with read permission).
- sizeBytes Integer
- Total size, in bytes, of the model archive.
- status String
- The current status of the model (e.g., ready, error, etc.).
- tags List<String>
- Tags associated with the model.
- updatedAt String
- The date and time of the last update of the model.
- url String
- The HTTPS source URL from which the model will be downloaded. This is typically a Hugging Face repository URL (e.g., https://huggingface.co/agentica-org/DeepCoder-14B-Preview). The URL must be publicly accessible or require valid credentials supplied via `secret`.
- createdAt string
- The date and time of the creation of the model.
- description string
- A textual description of the model (if available).
- hasEula boolean
- Whether the model requires end-user license agreement acceptance before use.
- name string
- The name of the model. This must be unique within the project.
- nodesSupports ModelNodesSupport[]
- List of supported node types and their quantization options. Each entry is a ModelNodesSupport (see Supporting Types).
- parameterSizeBits number
- Size, in bits, of the model parameters.
- projectId string
- (Defaults to provider `project_id`) The ID of the project the model is associated with.
- region string
- (Defaults to provider `region`) The region in which the model is created.
- secret string
- Authentication token used to pull the model from a private or gated URL (e.g., a Hugging Face access token with read permission).
- sizeBytes number
- Total size, in bytes, of the model archive.
- status string
- The current status of the model (e.g., ready, error, etc.).
- tags string[]
- Tags associated with the model.
- updatedAt string
- The date and time of the last update of the model.
- url string
- The HTTPS source URL from which the model will be downloaded. This is typically a Hugging Face repository URL (e.g., https://huggingface.co/agentica-org/DeepCoder-14B-Preview). The URL must be publicly accessible or require valid credentials supplied via `secret`.
- created_at str
- The date and time of the creation of the model.
- description str
- A textual description of the model (if available).
- has_eula bool
- Whether the model requires end-user license agreement acceptance before use.
- name str
- The name of the model. This must be unique within the project.
- nodes_supports Sequence[ModelNodesSupportArgs]
- List of supported node types and their quantization options. Each entry is a ModelNodesSupport (see Supporting Types).
- parameter_size_bits int
- Size, in bits, of the model parameters.
- project_id str
- (Defaults to provider `project_id`) The ID of the project the model is associated with.
- region str
- (Defaults to provider `region`) The region in which the model is created.
- secret str
- Authentication token used to pull the model from a private or gated URL (e.g., a Hugging Face access token with read permission).
- size_bytes int
- Total size, in bytes, of the model archive.
- status str
- The current status of the model (e.g., ready, error, etc.).
- tags Sequence[str]
- Tags associated with the model.
- updated_at str
- The date and time of the last update of the model.
- url str
- The HTTPS source URL from which the model will be downloaded. This is typically a Hugging Face repository URL (e.g., https://huggingface.co/agentica-org/DeepCoder-14B-Preview). The URL must be publicly accessible or require valid credentials supplied via `secret`.
- createdAt String
- The date and time of the creation of the model.
- description String
- A textual description of the model (if available).
- hasEula Boolean
- Whether the model requires end-user license agreement acceptance before use.
- name String
- The name of the model. This must be unique within the project.
- nodesSupports List<Property Map>
- List of supported node types and their quantization options. Each entry is a ModelNodesSupport (see Supporting Types).
- parameterSizeBits Number
- Size, in bits, of the model parameters.
- projectId String
- (Defaults to provider `project_id`) The ID of the project the model is associated with.
- region String
- (Defaults to provider `region`) The region in which the model is created.
- secret String
- Authentication token used to pull the model from a private or gated URL (e.g., a Hugging Face access token with read permission).
- sizeBytes Number
- Total size, in bytes, of the model archive.
- status String
- The current status of the model (e.g., ready, error, etc.).
- tags List<String>
- Tags associated with the model.
- updatedAt String
- The date and time of the last update of the model.
- url String
- The HTTPS source URL from which the model will be downloaded. This is typically a Hugging Face repository URL (e.g., https://huggingface.co/agentica-org/DeepCoder-14B-Preview). The URL must be publicly accessible or require valid credentials supplied via `secret`.
Supporting Types
ModelNodesSupport, ModelNodesSupportArgs
- NodeTypeName string
- The type of node supported.
- Quantizations List<Pulumiverse.Scaleway.Inference.Inputs.ModelNodesSupportQuantization>
- A list of supported quantization options (see ModelNodesSupportQuantization).
- NodeTypeName string
- The type of node supported.
- Quantizations []ModelNodesSupportQuantization
- A list of supported quantization options (see ModelNodesSupportQuantization).
- nodeTypeName String
- The type of node supported.
- quantizations List<ModelNodesSupportQuantization>
- A list of supported quantization options (see ModelNodesSupportQuantization).
- nodeTypeName string
- The type of node supported.
- quantizations ModelNodesSupportQuantization[]
- A list of supported quantization options (see ModelNodesSupportQuantization).
- node_type_name str
- The type of node supported.
- quantizations Sequence[ModelNodesSupportQuantization]
- A list of supported quantization options (see ModelNodesSupportQuantization).
- nodeTypeName String
- The type of node supported.
- quantizations List<Property Map>
- A list of supported quantization options (see ModelNodesSupportQuantization).
ModelNodesSupportQuantization, ModelNodesSupportQuantizationArgs
- Allowed bool
- Whether this quantization is allowed.
- MaxContextSize int
- Maximum context length supported by this quantization.
- QuantizationBits int
- Number of bits used for quantization (e.g., 8, 16).
- Allowed bool
- Whether this quantization is allowed.
- MaxContextSize int
- Maximum context length supported by this quantization.
- QuantizationBits int
- Number of bits used for quantization (e.g., 8, 16).
- allowed Boolean
- Whether this quantization is allowed.
- maxContextSize Integer
- Maximum context length supported by this quantization.
- quantizationBits Integer
- Number of bits used for quantization (e.g., 8, 16).
- allowed boolean
- Whether this quantization is allowed.
- maxContextSize number
- Maximum context length supported by this quantization.
- quantizationBits number
- Number of bits used for quantization (e.g., 8, 16).
- allowed bool
- Whether this quantization is allowed.
- max_context_size int
- Maximum context length supported by this quantization.
- quantization_bits int
- Number of bits used for quantization (e.g., 8, 16).
- allowed Boolean
- Whether this quantization is allowed.
- maxContextSize Number
- Maximum context length supported by this quantization.
- quantizationBits Number
- Number of bits used for quantization (e.g., 8, 16).
Import
Models can be imported using the `{region}/{id}` format, as shown below:
bash
$ pulumi import scaleway:inference/model:Model my_model fr-par/11111111-1111-1111-1111-111111111111
To learn more about importing existing cloud resources, see Importing resources.
Package Details
- Repository
- scaleway pulumiverse/pulumi-scaleway
- License
- Apache-2.0
- Notes
- This Pulumi package is based on the `scaleway` Terraform Provider.