AWS v6.83.0, Jun 16 25

AWS v6.83.0 published on Monday, Jun 16, 2025 by Pulumi

aws.glue.Job

Explore with Pulumi AI

AWS v6.83.0 published on Monday, Jun 16, 2025 by Pulumi

pulumi/pulumi-aws

Example Usage

Python Glue Job

import * as pulumi from "@pulumi/pulumi";
import * as aws from "@pulumi/aws";

// Trust policy document that lets the AWS Glue service assume the role.
const glueTrustPolicy = JSON.stringify({
    Version: "2012-10-17",
    Statement: [{
        Action: "sts:AssumeRole",
        Effect: "Allow",
        Principal: {
            Service: "glue.amazonaws.com",
        },
    }],
});

// IAM role for Glue jobs
const glueJobRole = new aws.iam.Role("glue_job_role", {
    name: "glue-job-role",
    assumeRolePolicy: glueTrustPolicy,
});

// Default arguments supplied to the ETL job.
const etlDefaultArguments = {
    "--job-language": "python",
    "--continuous-log-logGroup": "/aws-glue/jobs",
    "--enable-continuous-cloudwatch-log": "true",
    "--enable-continuous-log-filter": "true",
    "--enable-metrics": "",
    "--enable-auto-scaling": "true",
};

// Glue ETL job running a Python script from S3.
// NOTE: `example` and `glueScripts` are not declared in this snippet; they
// must be defined elsewhere in the program.
const etlJob = new aws.glue.Job("etl_job", {
    name: "example-etl-job",
    description: "An example Glue ETL job",
    roleArn: glueJobRole.arn,
    glueVersion: "5.0",
    workerType: "G.1X",
    numberOfWorkers: 2,
    executionClass: "STANDARD",
    maxRetries: 0,
    timeout: 2880,
    connections: [example.name],
    command: {
        name: "glueetl",
        pythonVersion: "3",
        scriptLocation: `s3://${glueScripts.bucket}/jobs/etl_job.py`,
    },
    defaultArguments: etlDefaultArguments,
    notificationProperty: {
        notifyDelayAfter: 3,
    },
    executionProperty: {
        maxConcurrentRuns: 1,
    },
    tags: {
        ManagedBy: "AWS",
    },
});

// Upload the local script to the same key the job's scriptLocation points at.
const glueEtlScript = new aws.s3.BucketObjectv2("glue_etl_script", {
    bucket: glueScripts.id,
    key: "jobs/etl_job.py",
    source: new pulumi.asset.FileAsset("jobs/etl_job.py"),
});

import pulumi
import json
import pulumi_aws as aws

# Trust policy document that lets the AWS Glue service assume the role.
glue_trust_policy = json.dumps({
    "Version": "2012-10-17",
    "Statement": [{
        "Action": "sts:AssumeRole",
        "Effect": "Allow",
        "Principal": {
            "Service": "glue.amazonaws.com",
        },
    }],
})

# IAM role for Glue jobs
glue_job_role = aws.iam.Role("glue_job_role",
    name="glue-job-role",
    assume_role_policy=glue_trust_policy)

# Default arguments supplied to the ETL job.
etl_default_arguments = {
    "--job-language": "python",
    "--continuous-log-logGroup": "/aws-glue/jobs",
    "--enable-continuous-cloudwatch-log": "true",
    "--enable-continuous-log-filter": "true",
    "--enable-metrics": "",
    "--enable-auto-scaling": "true",
}

# Glue ETL job running a Python script from S3.
# NOTE: `example` and `glue_scripts` are not defined in this snippet; they
# must be provided elsewhere in the program.
etl_job = aws.glue.Job("etl_job",
    name="example-etl-job",
    description="An example Glue ETL job",
    role_arn=glue_job_role.arn,
    glue_version="5.0",
    worker_type="G.1X",
    number_of_workers=2,
    execution_class="STANDARD",
    max_retries=0,
    timeout=2880,
    connections=[example["name"]],
    command={
        "name": "glueetl",
        "python_version": "3",
        "script_location": f"s3://{glue_scripts['bucket']}/jobs/etl_job.py",
    },
    default_arguments=etl_default_arguments,
    notification_property={
        "notify_delay_after": 3,
    },
    execution_property={
        "max_concurrent_runs": 1,
    },
    tags={
        "ManagedBy": "AWS",
    })

# Upload the local script to the same key the job's script_location points at.
glue_etl_script = aws.s3.BucketObjectv2("glue_etl_script",
    bucket=glue_scripts["id"],
    key="jobs/etl_job.py",
    source=pulumi.FileAsset("jobs/etl_job.py"))

package main

import (
	"encoding/json"
	"fmt"

	"github.com/pulumi/pulumi-aws/sdk/v6/go/aws/glue"
	"github.com/pulumi/pulumi-aws/sdk/v6/go/aws/iam"
	"github.com/pulumi/pulumi-aws/sdk/v6/go/aws/s3"
	"github.com/pulumi/pulumi/sdk/v3/go/pulumi"
)

// main runs the Pulumi program for the Python Glue ETL job example. It
// creates the IAM role, the Glue job, and the S3 object holding the job
// script. Every failure is wrapped with fmt.Errorf so the returned error says
// which step failed; this also puts the snippet's "fmt" import to use, which
// was otherwise unused and made the program fail to compile.
//
// NOTE: example and glueScripts are not declared in this snippet; they must
// be defined elsewhere in the program.
func main() {
	pulumi.Run(func(ctx *pulumi.Context) error {
		// Trust policy allowing the Glue service to assume the job role.
		policyJSON, err := json.Marshal(map[string]interface{}{
			"Version": "2012-10-17",
			"Statement": []map[string]interface{}{
				{
					"Action": "sts:AssumeRole",
					"Effect": "Allow",
					"Principal": map[string]interface{}{
						"Service": "glue.amazonaws.com",
					},
				},
			},
		})
		if err != nil {
			return fmt.Errorf("marshaling assume-role policy: %w", err)
		}
		// IAM role for Glue jobs
		glueJobRole, err := iam.NewRole(ctx, "glue_job_role", &iam.RoleArgs{
			Name:             pulumi.String("glue-job-role"),
			AssumeRolePolicy: pulumi.String(string(policyJSON)),
		})
		if err != nil {
			return fmt.Errorf("creating IAM role glue_job_role: %w", err)
		}
		_, err = glue.NewJob(ctx, "etl_job", &glue.JobArgs{
			Name:            pulumi.String("example-etl-job"),
			Description:     pulumi.String("An example Glue ETL job"),
			RoleArn:         glueJobRole.Arn,
			GlueVersion:     pulumi.String("5.0"),
			MaxRetries:      pulumi.Int(0),
			Timeout:         pulumi.Int(2880),
			NumberOfWorkers: pulumi.Int(2),
			WorkerType:      pulumi.String("G.1X"),
			Connections: pulumi.StringArray{
				example.Name,
			},
			ExecutionClass: pulumi.String("STANDARD"),
			Command: &glue.JobCommandArgs{
				ScriptLocation: pulumi.Sprintf("s3://%v/jobs/etl_job.py", glueScripts.Bucket),
				Name:           pulumi.String("glueetl"),
				PythonVersion:  pulumi.String("3"),
			},
			NotificationProperty: &glue.JobNotificationPropertyArgs{
				NotifyDelayAfter: pulumi.Int(3),
			},
			DefaultArguments: pulumi.StringMap{
				"--job-language":                     pulumi.String("python"),
				"--continuous-log-logGroup":          pulumi.String("/aws-glue/jobs"),
				"--enable-continuous-cloudwatch-log": pulumi.String("true"),
				"--enable-continuous-log-filter":     pulumi.String("true"),
				"--enable-metrics":                   pulumi.String(""),
				"--enable-auto-scaling":              pulumi.String("true"),
			},
			ExecutionProperty: &glue.JobExecutionPropertyArgs{
				MaxConcurrentRuns: pulumi.Int(1),
			},
			Tags: pulumi.StringMap{
				"ManagedBy": pulumi.String("AWS"),
			},
		})
		if err != nil {
			return fmt.Errorf("creating Glue job etl_job: %w", err)
		}
		// Upload the local script to the key the job's ScriptLocation points at.
		_, err = s3.NewBucketObjectv2(ctx, "glue_etl_script", &s3.BucketObjectv2Args{
			Bucket: pulumi.Any(glueScripts.Id),
			Key:    pulumi.String("jobs/etl_job.py"),
			Source: pulumi.NewFileAsset("jobs/etl_job.py"),
		})
		if err != nil {
			return fmt.Errorf("uploading script object glue_etl_script: %w", err)
		}
		return nil
	})
}

using System.Collections.Generic;
using System.Linq;
using System.Text.Json;
using Pulumi;
using Aws = Pulumi.Aws;

return await Deployment.RunAsync(() =>
{
    // Trust policy document that lets the AWS Glue service assume the role.
    var glueTrustPolicy = JsonSerializer.Serialize(new Dictionary<string, object?>
    {
        ["Version"] = "2012-10-17",
        ["Statement"] = new[]
        {
            new Dictionary<string, object?>
            {
                ["Action"] = "sts:AssumeRole",
                ["Effect"] = "Allow",
                ["Principal"] = new Dictionary<string, object?>
                {
                    ["Service"] = "glue.amazonaws.com",
                },
            },
        },
    });

    // IAM role for Glue jobs
    var glueJobRole = new Aws.Iam.Role("glue_job_role", new()
    {
        Name = "glue-job-role",
        AssumeRolePolicy = glueTrustPolicy,
    });

    // Glue ETL job running a Python script from S3.
    // NOTE: `example` and `glueScripts` are not declared in this snippet;
    // they must be defined elsewhere in the program.
    var etlJob = new Aws.Glue.Job("etl_job", new()
    {
        Name = "example-etl-job",
        Description = "An example Glue ETL job",
        RoleArn = glueJobRole.Arn,
        GlueVersion = "5.0",
        WorkerType = "G.1X",
        NumberOfWorkers = 2,
        ExecutionClass = "STANDARD",
        MaxRetries = 0,
        Timeout = 2880,
        Connections = new[]
        {
            example.Name,
        },
        Command = new Aws.Glue.Inputs.JobCommandArgs
        {
            Name = "glueetl",
            PythonVersion = "3",
            ScriptLocation = $"s3://{glueScripts.Bucket}/jobs/etl_job.py",
        },
        DefaultArguments =
        {
            { "--job-language", "python" },
            { "--continuous-log-logGroup", "/aws-glue/jobs" },
            { "--enable-continuous-cloudwatch-log", "true" },
            { "--enable-continuous-log-filter", "true" },
            { "--enable-metrics", "" },
            { "--enable-auto-scaling", "true" },
        },
        NotificationProperty = new Aws.Glue.Inputs.JobNotificationPropertyArgs
        {
            NotifyDelayAfter = 3,
        },
        ExecutionProperty = new Aws.Glue.Inputs.JobExecutionPropertyArgs
        {
            MaxConcurrentRuns = 1,
        },
        Tags =
        {
            { "ManagedBy", "AWS" },
        },
    });

    // Upload the local script to the same key the job's ScriptLocation points at.
    var glueEtlScript = new Aws.S3.BucketObjectv2("glue_etl_script", new()
    {
        Bucket = glueScripts.Id,
        Key = "jobs/etl_job.py",
        Source = new FileAsset("jobs/etl_job.py"),
    });

});

package generated_program;

import com.pulumi.Context;
import com.pulumi.Pulumi;
import com.pulumi.core.Output;
import com.pulumi.aws.iam.Role;
import com.pulumi.aws.iam.RoleArgs;
import com.pulumi.aws.glue.Job;
import com.pulumi.aws.glue.JobArgs;
import com.pulumi.aws.glue.inputs.JobCommandArgs;
import com.pulumi.aws.glue.inputs.JobNotificationPropertyArgs;
import com.pulumi.aws.glue.inputs.JobExecutionPropertyArgs;
import com.pulumi.aws.s3.BucketObjectv2;
import com.pulumi.aws.s3.BucketObjectv2Args;
import com.pulumi.asset.FileAsset;
import static com.pulumi.codegen.internal.Serialization.*;
import java.util.List;
import java.util.ArrayList;
import java.util.Map;
import java.io.File;
import java.nio.file.Files;
import java.nio.file.Paths;

/**
 * Pulumi program for the Python Glue ETL job example: an IAM role, the Glue
 * job itself, and the S3 object that holds the job script.
 */
public class App {
    /** Entry point; hands the stack definition to the Pulumi runtime. */
    public static void main(String[] args) {
        Pulumi.run(App::stack);
    }

    /**
     * Declares the resources of the stack.
     *
     * NOTE: {@code example} and {@code glueScripts} are not declared in this
     * snippet; they must be defined elsewhere in the program.
     */
    public static void stack(Context ctx) {
        // Trust policy document that lets the AWS Glue service assume the role.
        final var glueTrustPolicy = serializeJson(
            jsonObject(
                jsonProperty("Version", "2012-10-17"),
                jsonProperty("Statement", jsonArray(jsonObject(
                    jsonProperty("Action", "sts:AssumeRole"),
                    jsonProperty("Effect", "Allow"),
                    jsonProperty("Principal", jsonObject(
                        jsonProperty("Service", "glue.amazonaws.com")
                    ))
                )))
            ));

        // IAM role for Glue jobs
        var glueJobRole = new Role("glueJobRole", RoleArgs.builder()
            .name("glue-job-role")
            .assumeRolePolicy(glueTrustPolicy)
            .build());

        // Command block: Python 3 "glueetl" script stored in S3.
        final var etlCommand = JobCommandArgs.builder()
            .scriptLocation(String.format("s3://%s/jobs/etl_job.py", glueScripts.bucket()))
            .name("glueetl")
            .pythonVersion("3")
            .build();

        var etlJob = new Job("etlJob", JobArgs.builder()
            .name("example-etl-job")
            .description("An example Glue ETL job")
            .roleArn(glueJobRole.arn())
            .glueVersion("5.0")
            .maxRetries(0)
            .timeout(2880)
            .numberOfWorkers(2)
            .workerType("G.1X")
            .connections(example.name())
            .executionClass("STANDARD")
            .command(etlCommand)
            .notificationProperty(JobNotificationPropertyArgs.builder()
                .notifyDelayAfter(3)
                .build())
            .defaultArguments(Map.ofEntries(
                Map.entry("--job-language", "python"),
                Map.entry("--continuous-log-logGroup", "/aws-glue/jobs"),
                Map.entry("--enable-continuous-cloudwatch-log", "true"),
                Map.entry("--enable-continuous-log-filter", "true"),
                Map.entry("--enable-metrics", ""),
                Map.entry("--enable-auto-scaling", "true")
            ))
            .executionProperty(JobExecutionPropertyArgs.builder()
                .maxConcurrentRuns(1)
                .build())
            .tags(Map.of("ManagedBy", "AWS"))
            .build());

        // Upload the local script to the same key the job's scriptLocation points at.
        var glueEtlScript = new BucketObjectv2("glueEtlScript", BucketObjectv2Args.builder()
            .bucket(glueScripts.id())
            .key("jobs/etl_job.py")
            .source(new FileAsset("jobs/etl_job.py"))
            .build());

    }
}

# Python Glue ETL job example: the Glue job, its IAM role, and the S3 object
# holding the job script.
# NOTE: `example` and `glueScripts` are not declared in this snippet; they
# must be defined elsewhere in the program.
resources:
  etlJob:
    type: aws:glue:Job
    name: etl_job
    properties:
      name: example-etl-job
      description: An example Glue ETL job
      roleArn: ${glueJobRole.arn}
      glueVersion: '5.0'
      maxRetries: 0
      timeout: 2880
      numberOfWorkers: 2
      workerType: G.1X
      connections:
        - ${example.name}
      executionClass: STANDARD
      command:
        scriptLocation: s3://${glueScripts.bucket}/jobs/etl_job.py
        name: glueetl
        pythonVersion: '3'
      notificationProperty:
        notifyDelayAfter: 3
      defaultArguments:
        --job-language: python
        --continuous-log-logGroup: /aws-glue/jobs
        --enable-continuous-cloudwatch-log: 'true'
        --enable-continuous-log-filter: 'true'
        --enable-metrics: ""
        --enable-auto-scaling: 'true'
      executionProperty:
        maxConcurrentRuns: 1
      tags:
        ManagedBy: AWS
  # IAM role for Glue jobs
  glueJobRole:
    type: aws:iam:Role
    name: glue_job_role
    properties:
      name: glue-job-role
      assumeRolePolicy:
        fn::toJSON:
          # Quoted so the policy version stays a string; an unquoted
          # 2012-10-17 is a timestamp to YAML 1.1 resolvers.
          Version: '2012-10-17'
          Statement:
            - Action: sts:AssumeRole
              Effect: Allow
              Principal:
                Service: glue.amazonaws.com
  # Uploads the local script to the key the job's scriptLocation points at.
  glueEtlScript:
    type: aws:s3:BucketObjectv2
    name: glue_etl_script
    properties:
      bucket: ${glueScripts.id}
      key: jobs/etl_job.py
      source:
        fn::FileAsset: jobs/etl_job.py

Python Shell Job

import * as pulumi from "@pulumi/pulumi";
import * as aws from "@pulumi/aws";

// Trust policy document that lets the AWS Glue service assume the role.
const glueTrustPolicy = JSON.stringify({
    Version: "2012-10-17",
    Statement: [{
        Action: "sts:AssumeRole",
        Effect: "Allow",
        Principal: {
            Service: "glue.amazonaws.com",
        },
    }],
});

// IAM role for Glue jobs
const glueJobRole = new aws.iam.Role("glue_job_role", {
    name: "glue-job-role",
    assumeRolePolicy: glueTrustPolicy,
});

// Default arguments supplied to the Python shell job.
const shellDefaultArguments = {
    "--job-language": "python",
    "--continuous-log-logGroup": "/aws-glue/jobs",
    "--enable-continuous-cloudwatch-log": "true",
    "library-set": "analytics",
};

// Glue Python shell job ("pythonshell" command) with a fractional maxCapacity.
// NOTE: `example` and `glueScripts` are not declared in this snippet; they
// must be defined elsewhere in the program.
const pythonShellJob = new aws.glue.Job("python_shell_job", {
    name: "example-python-shell-job",
    description: "An example Python shell job",
    roleArn: glueJobRole.arn,
    maxCapacity: 0.0625,
    maxRetries: 0,
    timeout: 2880,
    connections: [example.name],
    command: {
        name: "pythonshell",
        pythonVersion: "3.9",
        scriptLocation: `s3://${glueScripts.bucket}/jobs/shell_job.py`,
    },
    defaultArguments: shellDefaultArguments,
    executionProperty: {
        maxConcurrentRuns: 1,
    },
    tags: {
        ManagedBy: "AWS",
    },
});

// Upload the local script to the same key the job's scriptLocation points at.
const pythonShellScript = new aws.s3.BucketObjectv2("python_shell_script", {
    bucket: glueScripts.id,
    key: "jobs/shell_job.py",
    source: new pulumi.asset.FileAsset("jobs/shell_job.py"),
});

import pulumi
import json
import pulumi_aws as aws

# Trust policy document that lets the AWS Glue service assume the role.
glue_trust_policy = json.dumps({
    "Version": "2012-10-17",
    "Statement": [{
        "Action": "sts:AssumeRole",
        "Effect": "Allow",
        "Principal": {
            "Service": "glue.amazonaws.com",
        },
    }],
})

# IAM role for Glue jobs
glue_job_role = aws.iam.Role("glue_job_role",
    name="glue-job-role",
    assume_role_policy=glue_trust_policy)

# Default arguments supplied to the Python shell job.
shell_default_arguments = {
    "--job-language": "python",
    "--continuous-log-logGroup": "/aws-glue/jobs",
    "--enable-continuous-cloudwatch-log": "true",
    "library-set": "analytics",
}

# Glue Python shell job ("pythonshell" command) with a fractional max_capacity.
# NOTE: `example` and `glue_scripts` are not defined in this snippet; they
# must be provided elsewhere in the program.
python_shell_job = aws.glue.Job("python_shell_job",
    name="example-python-shell-job",
    description="An example Python shell job",
    role_arn=glue_job_role.arn,
    max_capacity=0.0625,
    max_retries=0,
    timeout=2880,
    connections=[example["name"]],
    command={
        "name": "pythonshell",
        "python_version": "3.9",
        "script_location": f"s3://{glue_scripts['bucket']}/jobs/shell_job.py",
    },
    default_arguments=shell_default_arguments,
    execution_property={
        "max_concurrent_runs": 1,
    },
    tags={
        "ManagedBy": "AWS",
    })

# Upload the local script to the same key the job's script_location points at.
python_shell_script = aws.s3.BucketObjectv2("python_shell_script",
    bucket=glue_scripts["id"],
    key="jobs/shell_job.py",
    source=pulumi.FileAsset("jobs/shell_job.py"))

package main

import (
	"encoding/json"
	"fmt"

	"github.com/pulumi/pulumi-aws/sdk/v6/go/aws/glue"
	"github.com/pulumi/pulumi-aws/sdk/v6/go/aws/iam"
	"github.com/pulumi/pulumi-aws/sdk/v6/go/aws/s3"
	"github.com/pulumi/pulumi/sdk/v3/go/pulumi"
)

// main runs the Pulumi program for the Python shell job example. It creates
// the IAM role, the Glue job, and the S3 object holding the job script. Every
// failure is wrapped with fmt.Errorf so the returned error says which step
// failed; this also puts the snippet's "fmt" import to use, which was
// otherwise unused and made the program fail to compile.
//
// NOTE: example and glueScripts are not declared in this snippet; they must
// be defined elsewhere in the program.
func main() {
	pulumi.Run(func(ctx *pulumi.Context) error {
		// Trust policy allowing the Glue service to assume the job role.
		policyJSON, err := json.Marshal(map[string]interface{}{
			"Version": "2012-10-17",
			"Statement": []map[string]interface{}{
				{
					"Action": "sts:AssumeRole",
					"Effect": "Allow",
					"Principal": map[string]interface{}{
						"Service": "glue.amazonaws.com",
					},
				},
			},
		})
		if err != nil {
			return fmt.Errorf("marshaling assume-role policy: %w", err)
		}
		// IAM role for Glue jobs
		glueJobRole, err := iam.NewRole(ctx, "glue_job_role", &iam.RoleArgs{
			Name:             pulumi.String("glue-job-role"),
			AssumeRolePolicy: pulumi.String(string(policyJSON)),
		})
		if err != nil {
			return fmt.Errorf("creating IAM role glue_job_role: %w", err)
		}
		_, err = glue.NewJob(ctx, "python_shell_job", &glue.JobArgs{
			Name:        pulumi.String("example-python-shell-job"),
			Description: pulumi.String("An example Python shell job"),
			RoleArn:     glueJobRole.Arn,
			MaxCapacity: pulumi.Float64(0.0625),
			MaxRetries:  pulumi.Int(0),
			Timeout:     pulumi.Int(2880),
			Connections: pulumi.StringArray{
				example.Name,
			},
			Command: &glue.JobCommandArgs{
				ScriptLocation: pulumi.Sprintf("s3://%v/jobs/shell_job.py", glueScripts.Bucket),
				Name:           pulumi.String("pythonshell"),
				PythonVersion:  pulumi.String("3.9"),
			},
			DefaultArguments: pulumi.StringMap{
				"--job-language":                     pulumi.String("python"),
				"--continuous-log-logGroup":          pulumi.String("/aws-glue/jobs"),
				"--enable-continuous-cloudwatch-log": pulumi.String("true"),
				"library-set":                        pulumi.String("analytics"),
			},
			ExecutionProperty: &glue.JobExecutionPropertyArgs{
				MaxConcurrentRuns: pulumi.Int(1),
			},
			Tags: pulumi.StringMap{
				"ManagedBy": pulumi.String("AWS"),
			},
		})
		if err != nil {
			return fmt.Errorf("creating Glue job python_shell_job: %w", err)
		}
		// Upload the local script to the key the job's ScriptLocation points at.
		_, err = s3.NewBucketObjectv2(ctx, "python_shell_script", &s3.BucketObjectv2Args{
			Bucket: pulumi.Any(glueScripts.Id),
			Key:    pulumi.String("jobs/shell_job.py"),
			Source: pulumi.NewFileAsset("jobs/shell_job.py"),
		})
		if err != nil {
			return fmt.Errorf("uploading script object python_shell_script: %w", err)
		}
		return nil
	})
}

using System.Collections.Generic;
using System.Linq;
using System.Text.Json;
using Pulumi;
using Aws = Pulumi.Aws;

return await Deployment.RunAsync(() =>
{
    // Trust policy document that lets the AWS Glue service assume the role.
    var glueTrustPolicy = JsonSerializer.Serialize(new Dictionary<string, object?>
    {
        ["Version"] = "2012-10-17",
        ["Statement"] = new[]
        {
            new Dictionary<string, object?>
            {
                ["Action"] = "sts:AssumeRole",
                ["Effect"] = "Allow",
                ["Principal"] = new Dictionary<string, object?>
                {
                    ["Service"] = "glue.amazonaws.com",
                },
            },
        },
    });

    // IAM role for Glue jobs
    var glueJobRole = new Aws.Iam.Role("glue_job_role", new()
    {
        Name = "glue-job-role",
        AssumeRolePolicy = glueTrustPolicy,
    });

    // Glue Python shell job ("pythonshell" command) with a fractional MaxCapacity.
    // NOTE: `example` and `glueScripts` are not declared in this snippet;
    // they must be defined elsewhere in the program.
    var pythonShellJob = new Aws.Glue.Job("python_shell_job", new()
    {
        Name = "example-python-shell-job",
        Description = "An example Python shell job",
        RoleArn = glueJobRole.Arn,
        MaxCapacity = 0.0625,
        MaxRetries = 0,
        Timeout = 2880,
        Connections = new[]
        {
            example.Name,
        },
        Command = new Aws.Glue.Inputs.JobCommandArgs
        {
            Name = "pythonshell",
            PythonVersion = "3.9",
            ScriptLocation = $"s3://{glueScripts.Bucket}/jobs/shell_job.py",
        },
        DefaultArguments =
        {
            { "--job-language", "python" },
            { "--continuous-log-logGroup", "/aws-glue/jobs" },
            { "--enable-continuous-cloudwatch-log", "true" },
            { "library-set", "analytics" },
        },
        ExecutionProperty = new Aws.Glue.Inputs.JobExecutionPropertyArgs
        {
            MaxConcurrentRuns = 1,
        },
        Tags =
        {
            { "ManagedBy", "AWS" },
        },
    });

    // Upload the local script to the same key the job's ScriptLocation points at.
    var pythonShellScript = new Aws.S3.BucketObjectv2("python_shell_script", new()
    {
        Bucket = glueScripts.Id,
        Key = "jobs/shell_job.py",
        Source = new FileAsset("jobs/shell_job.py"),
    });

});

package generated_program;

import com.pulumi.Context;
import com.pulumi.Pulumi;
import com.pulumi.core.Output;
import com.pulumi.aws.iam.Role;
import com.pulumi.aws.iam.RoleArgs;
import com.pulumi.aws.glue.Job;
import com.pulumi.aws.glue.JobArgs;
import com.pulumi.aws.glue.inputs.JobCommandArgs;
import com.pulumi.aws.glue.inputs.JobExecutionPropertyArgs;
import com.pulumi.aws.s3.BucketObjectv2;
import com.pulumi.aws.s3.BucketObjectv2Args;
import com.pulumi.asset.FileAsset;
import static com.pulumi.codegen.internal.Serialization.*;
import java.util.List;
import java.util.ArrayList;
import java.util.Map;
import java.io.File;
import java.nio.file.Files;
import java.nio.file.Paths;

/**
 * Pulumi program for the Python shell job example: an IAM role, the Glue job
 * itself, and the S3 object that holds the job script.
 */
public class App {
    /** Entry point; hands the stack definition to the Pulumi runtime. */
    public static void main(String[] args) {
        Pulumi.run(App::stack);
    }

    /**
     * Declares the resources of the stack.
     *
     * NOTE: {@code example} and {@code glueScripts} are not declared in this
     * snippet; they must be defined elsewhere in the program.
     */
    public static void stack(Context ctx) {
        // Trust policy document that lets the AWS Glue service assume the role.
        final var glueTrustPolicy = serializeJson(
            jsonObject(
                jsonProperty("Version", "2012-10-17"),
                jsonProperty("Statement", jsonArray(jsonObject(
                    jsonProperty("Action", "sts:AssumeRole"),
                    jsonProperty("Effect", "Allow"),
                    jsonProperty("Principal", jsonObject(
                        jsonProperty("Service", "glue.amazonaws.com")
                    ))
                )))
            ));

        // IAM role for Glue jobs
        var glueJobRole = new Role("glueJobRole", RoleArgs.builder()
            .name("glue-job-role")
            .assumeRolePolicy(glueTrustPolicy)
            .build());

        // Command block: Python 3.9 "pythonshell" script stored in S3.
        final var shellCommand = JobCommandArgs.builder()
            .scriptLocation(String.format("s3://%s/jobs/shell_job.py", glueScripts.bucket()))
            .name("pythonshell")
            .pythonVersion("3.9")
            .build();

        var pythonShellJob = new Job("pythonShellJob", JobArgs.builder()
            .name("example-python-shell-job")
            .description("An example Python shell job")
            .roleArn(glueJobRole.arn())
            .maxCapacity(0.0625)
            .maxRetries(0)
            .timeout(2880)
            .connections(example.name())
            .command(shellCommand)
            .defaultArguments(Map.ofEntries(
                Map.entry("--job-language", "python"),
                Map.entry("--continuous-log-logGroup", "/aws-glue/jobs"),
                Map.entry("--enable-continuous-cloudwatch-log", "true"),
                Map.entry("library-set", "analytics")
            ))
            .executionProperty(JobExecutionPropertyArgs.builder()
                .maxConcurrentRuns(1)
                .build())
            .tags(Map.of("ManagedBy", "AWS"))
            .build());

        // Upload the local script to the same key the job's scriptLocation points at.
        var pythonShellScript = new BucketObjectv2("pythonShellScript", BucketObjectv2Args.builder()
            .bucket(glueScripts.id())
            .key("jobs/shell_job.py")
            .source(new FileAsset("jobs/shell_job.py"))
            .build());

    }
}

# Python shell job example: the Glue job, its IAM role, and the S3 object
# holding the job script.
# NOTE: `example` and `glueScripts` are not declared in this snippet; they
# must be defined elsewhere in the program.
resources:
  pythonShellJob:
    type: aws:glue:Job
    name: python_shell_job
    properties:
      name: example-python-shell-job
      description: An example Python shell job
      roleArn: ${glueJobRole.arn}
      # Written as a number, matching the other language examples.
      maxCapacity: 0.0625
      maxRetries: 0
      timeout: 2880
      connections:
        - ${example.name}
      command:
        scriptLocation: s3://${glueScripts.bucket}/jobs/shell_job.py
        name: pythonshell
        pythonVersion: '3.9'
      defaultArguments:
        --job-language: python
        --continuous-log-logGroup: /aws-glue/jobs
        --enable-continuous-cloudwatch-log: 'true'
        library-set: analytics
      executionProperty:
        maxConcurrentRuns: 1
      tags:
        ManagedBy: AWS
  # IAM role for Glue jobs
  glueJobRole:
    type: aws:iam:Role
    name: glue_job_role
    properties:
      name: glue-job-role
      assumeRolePolicy:
        fn::toJSON:
          # Quoted so the policy version stays a string; an unquoted
          # 2012-10-17 is a timestamp to YAML 1.1 resolvers.
          Version: '2012-10-17'
          Statement:
            - Action: sts:AssumeRole
              Effect: Allow
              Principal:
                Service: glue.amazonaws.com
  # Uploads the local script to the key the job's scriptLocation points at.
  pythonShellScript:
    type: aws:s3:BucketObjectv2
    name: python_shell_script
    properties:
      bucket: ${glueScripts.id}
      key: jobs/shell_job.py
      source:
        fn::FileAsset: jobs/shell_job.py

Ray Job

import * as pulumi from "@pulumi/pulumi";
import * as aws from "@pulumi/aws";

// Command block for a Ray job: "glueray" command on the Ray2.4 runtime.
// NOTE: `exampleAwsS3Bucket` and `exampleAwsIamRole` are not declared in this
// snippet; they must be defined elsewhere in the program.
const rayCommand = {
    name: "glueray",
    pythonVersion: "3.9",
    runtime: "Ray2.4",
    scriptLocation: `s3://${exampleAwsS3Bucket.bucket}/example.py`,
};

// Glue Ray job on Z.2X workers.
const example = new aws.glue.Job("example", {
    name: "example",
    roleArn: exampleAwsIamRole.arn,
    glueVersion: "4.0",
    workerType: "Z.2X",
    command: rayCommand,
});

import pulumi
import pulumi_aws as aws

# Command block for a Ray job: "glueray" command on the Ray2.4 runtime.
# NOTE: `example_aws_s3_bucket` and `example_aws_iam_role` are not defined in
# this snippet; they must be provided elsewhere in the program.
ray_command = {
    "name": "glueray",
    "python_version": "3.9",
    "runtime": "Ray2.4",
    "script_location": f"s3://{example_aws_s3_bucket['bucket']}/example.py",
}

# Glue Ray job on Z.2X workers.
example = aws.glue.Job("example",
    name="example",
    role_arn=example_aws_iam_role["arn"],
    glue_version="4.0",
    worker_type="Z.2X",
    command=ray_command)

package main

import (
	"fmt"

	"github.com/pulumi/pulumi-aws/sdk/v6/go/aws/glue"
	"github.com/pulumi/pulumi/sdk/v3/go/pulumi"
)

// main runs the Pulumi program for the Ray job example, declaring a single
// Glue job that uses the "glueray" command. A failure is wrapped with
// fmt.Errorf so the returned error names the failing resource; this also puts
// the snippet's "fmt" import to use, which was otherwise unused and made the
// program fail to compile.
//
// NOTE: exampleAwsIamRole and exampleAwsS3Bucket are not declared in this
// snippet; they must be defined elsewhere in the program.
func main() {
	pulumi.Run(func(ctx *pulumi.Context) error {
		_, err := glue.NewJob(ctx, "example", &glue.JobArgs{
			Name:        pulumi.String("example"),
			RoleArn:     pulumi.Any(exampleAwsIamRole.Arn),
			GlueVersion: pulumi.String("4.0"),
			WorkerType:  pulumi.String("Z.2X"),
			Command: &glue.JobCommandArgs{
				Name:           pulumi.String("glueray"),
				PythonVersion:  pulumi.String("3.9"),
				Runtime:        pulumi.String("Ray2.4"),
				ScriptLocation: pulumi.Sprintf("s3://%v/example.py", exampleAwsS3Bucket.Bucket),
			},
		})
		if err != nil {
			return fmt.Errorf("creating Glue Ray job example: %w", err)
		}
		return nil
	})
}

using System.Collections.Generic;
using System.Linq;
using Pulumi;
using Aws = Pulumi.Aws;

return await Deployment.RunAsync(() =>
{
    // Command block for a Ray job: "glueray" command on the Ray2.4 runtime.
    // NOTE: `exampleAwsS3Bucket` and `exampleAwsIamRole` are not declared in
    // this snippet; they must be defined elsewhere in the program.
    var rayCommand = new Aws.Glue.Inputs.JobCommandArgs
    {
        Name = "glueray",
        PythonVersion = "3.9",
        Runtime = "Ray2.4",
        ScriptLocation = $"s3://{exampleAwsS3Bucket.Bucket}/example.py",
    };

    // Glue Ray job on Z.2X workers.
    var example = new Aws.Glue.Job("example", new()
    {
        Name = "example",
        RoleArn = exampleAwsIamRole.Arn,
        GlueVersion = "4.0",
        WorkerType = "Z.2X",
        Command = rayCommand,
    });

});

package generated_program;

import com.pulumi.Context;
import com.pulumi.Pulumi;
import com.pulumi.core.Output;
import com.pulumi.aws.glue.Job;
import com.pulumi.aws.glue.JobArgs;
import com.pulumi.aws.glue.inputs.JobCommandArgs;
import java.util.List;
import java.util.ArrayList;
import java.util.Map;
import java.io.File;
import java.nio.file.Files;
import java.nio.file.Paths;

/** Pulumi program for the Ray job example: a single Glue job using the "glueray" command. */
public class App {
    /** Entry point; hands the stack definition to the Pulumi runtime. */
    public static void main(String[] args) {
        Pulumi.run(App::stack);
    }

    /**
     * Declares the Glue Ray job.
     *
     * NOTE: {@code exampleAwsIamRole} and {@code exampleAwsS3Bucket} are not
     * declared in this snippet; they must be defined elsewhere in the program.
     */
    public static void stack(Context ctx) {
        // Command block: "glueray" command on the Ray2.4 runtime.
        final var rayCommand = JobCommandArgs.builder()
            .name("glueray")
            .pythonVersion("3.9")
            .runtime("Ray2.4")
            .scriptLocation(String.format("s3://%s/example.py", exampleAwsS3Bucket.bucket()))
            .build();

        var example = new Job("example", JobArgs.builder()
            .name("example")
            .roleArn(exampleAwsIamRole.arn())
            .glueVersion("4.0")
            .workerType("Z.2X")
            .command(rayCommand)
            .build());

    }
}

# Ray job example: a single Glue job using the "glueray" command.
# NOTE: `exampleAwsIamRole` and `exampleAwsS3Bucket` are not declared in this
# snippet; they must be defined elsewhere in the program.
resources:
  example:
    type: aws:glue:Job
    properties:
      name: example
      roleArn: ${exampleAwsIamRole.arn}
      # Quoted so the version is passed as a string rather than a number.
      glueVersion: "4.0"
      workerType: Z.2X
      command:
        name: glueray
        runtime: Ray2.4
        pythonVersion: "3.9"
        scriptLocation: s3://${exampleAwsS3Bucket.bucket}/example.py

Scala Job

import * as pulumi from "@pulumi/pulumi";
import * as aws from "@pulumi/aws";

// Default arguments selecting Scala as the job language.
const scalaDefaultArguments = {
    "--job-language": "scala",
};

// Glue job running a Scala script from S3.
// NOTE: `exampleAwsIamRole` and `exampleAwsS3Bucket` are not declared in this
// snippet; they must be defined elsewhere in the program.
const example = new aws.glue.Job("example", {
    name: "example",
    roleArn: exampleAwsIamRole.arn,
    command: {
        scriptLocation: `s3://${exampleAwsS3Bucket.bucket}/example.scala`,
    },
    defaultArguments: scalaDefaultArguments,
});

import pulumi
import pulumi_aws as aws

# Default arguments selecting Scala as the job language.
scala_default_arguments = {
    "--job-language": "scala",
}

# Glue job running a Scala script from S3.
# NOTE: `example_aws_iam_role` and `example_aws_s3_bucket` are not defined in
# this snippet; they must be provided elsewhere in the program.
example = aws.glue.Job("example",
    name="example",
    role_arn=example_aws_iam_role["arn"],
    command={
        "script_location": f"s3://{example_aws_s3_bucket['bucket']}/example.scala",
    },
    default_arguments=scala_default_arguments)

package main

import (
	"fmt"

	"github.com/pulumi/pulumi-aws/sdk/v6/go/aws/glue"
	"github.com/pulumi/pulumi/sdk/v3/go/pulumi"
)

// main runs the Pulumi program for the Scala job example, declaring a single
// Glue job whose default arguments set "--job-language" to "scala". A failure
// is wrapped with fmt.Errorf so the returned error names the failing
// resource; this also puts the snippet's "fmt" import to use, which was
// otherwise unused and made the program fail to compile.
//
// NOTE: exampleAwsIamRole and exampleAwsS3Bucket are not declared in this
// snippet; they must be defined elsewhere in the program.
func main() {
	pulumi.Run(func(ctx *pulumi.Context) error {
		_, err := glue.NewJob(ctx, "example", &glue.JobArgs{
			Name:    pulumi.String("example"),
			RoleArn: pulumi.Any(exampleAwsIamRole.Arn),
			Command: &glue.JobCommandArgs{
				ScriptLocation: pulumi.Sprintf("s3://%v/example.scala", exampleAwsS3Bucket.Bucket),
			},
			DefaultArguments: pulumi.StringMap{
				"--job-language": pulumi.String("scala"),
			},
		})
		if err != nil {
			return fmt.Errorf("creating Glue Scala job example: %w", err)
		}
		return nil
	})
}

using System.Collections.Generic;
using System.Linq;
using Pulumi;
using Aws = Pulumi.Aws;

return await Deployment.RunAsync(() =>
{
    // Command block pointing at the Scala script in S3.
    // NOTE: `exampleAwsS3Bucket` and `exampleAwsIamRole` are not declared in
    // this snippet; they must be defined elsewhere in the program.
    var scalaCommand = new Aws.Glue.Inputs.JobCommandArgs
    {
        ScriptLocation = $"s3://{exampleAwsS3Bucket.Bucket}/example.scala",
    };

    // Glue job whose default arguments select Scala as the job language.
    var example = new Aws.Glue.Job("example", new()
    {
        Name = "example",
        RoleArn = exampleAwsIamRole.Arn,
        Command = scalaCommand,
        DefaultArguments =
        {
            { "--job-language", "scala" },
        },
    });

});

package generated_program;

import com.pulumi.Context;
import com.pulumi.Pulumi;
import com.pulumi.core.Output;
import com.pulumi.aws.glue.Job;
import com.pulumi.aws.glue.JobArgs;
import com.pulumi.aws.glue.inputs.JobCommandArgs;
import java.util.List;
import java.util.ArrayList;
import java.util.Map;
import java.io.File;
import java.nio.file.Files;
import java.nio.file.Paths;

/** Pulumi program for the Scala job example: a single Glue job running a Scala script. */
public class App {
    /** Entry point; hands the stack definition to the Pulumi runtime. */
    public static void main(String[] args) {
        Pulumi.run(App::stack);
    }

    /**
     * Declares the Glue Scala job.
     *
     * NOTE: {@code exampleAwsIamRole} and {@code exampleAwsS3Bucket} are not
     * declared in this snippet; they must be defined elsewhere in the program.
     */
    public static void stack(Context ctx) {
        // Command block pointing at the Scala script in S3.
        final var scalaCommand = JobCommandArgs.builder()
            .scriptLocation(String.format("s3://%s/example.scala", exampleAwsS3Bucket.bucket()))
            .build();

        var example = new Job("example", JobArgs.builder()
            .name("example")
            .roleArn(exampleAwsIamRole.arn())
            .command(scalaCommand)
            .defaultArguments(Map.of("--job-language", "scala"))
            .build());

    }
}

# Scala job example: a single Glue job whose default arguments select Scala.
# NOTE: `exampleAwsIamRole` and `exampleAwsS3Bucket` are not declared in this
# snippet; they must be defined elsewhere in the program.
resources:
  example:
    type: aws:glue:Job
    properties:
      name: example
      roleArn: ${exampleAwsIamRole.arn}
      defaultArguments:
        --job-language: scala
      command:
        scriptLocation: s3://${exampleAwsS3Bucket.bucket}/example.scala

Streaming Job

import * as pulumi from "@pulumi/pulumi";
import * as aws from "@pulumi/aws";

// Command block for a streaming job ("gluestreaming" command).
// NOTE: `exampleAwsS3Bucket` and `exampleAwsIamRole` are not declared in this
// snippet; they must be defined elsewhere in the program.
const streamingCommand = {
    name: "gluestreaming",
    scriptLocation: `s3://${exampleAwsS3Bucket.bucket}/example.script`,
};

// Glue streaming job.
const example = new aws.glue.Job("example", {
    name: "example streaming job",
    roleArn: exampleAwsIamRole.arn,
    command: streamingCommand,
});

import pulumi
import pulumi_aws as aws

# Command block for a streaming job ("gluestreaming" command).
# NOTE: `example_aws_s3_bucket` and `example_aws_iam_role` are not defined in
# this snippet; they must be provided elsewhere in the program.
streaming_command = {
    "name": "gluestreaming",
    "script_location": f"s3://{example_aws_s3_bucket['bucket']}/example.script",
}

# Glue streaming job.
example = aws.glue.Job("example",
    name="example streaming job",
    role_arn=example_aws_iam_role["arn"],
    command=streaming_command)

package main

import (
	"fmt"

	"github.com/pulumi/pulumi-aws/sdk/v6/go/aws/glue"
	"github.com/pulumi/pulumi/sdk/v3/go/pulumi"
)

// main declares a Glue streaming job named "example streaming job".
//
// exampleAwsIamRole and exampleAwsS3Bucket are not declared in this snippet;
// they are assumed to be defined elsewhere in the program.
func main() {
	pulumi.Run(func(ctx *pulumi.Context) error {
		_, err := glue.NewJob(ctx, "example", &glue.JobArgs{
			Name:    pulumi.String("example streaming job"),
			RoleArn: pulumi.Any(exampleAwsIamRole.Arn),
			Command: &glue.JobCommandArgs{
				// "gluestreaming" is the command name used for the streaming example.
				Name:           pulumi.String("gluestreaming"),
				ScriptLocation: pulumi.Sprintf("s3://%v/example.script", exampleAwsS3Bucket.Bucket),
			},
		})
		if err != nil {
			// Wrap with context. This also puts the program's "fmt" import to
			// use; Go refuses to compile a file with an unused import.
			return fmt.Errorf("creating streaming glue job: %w", err)
		}
		return nil
	})
}

using System.Collections.Generic;
using System.Linq;
using Pulumi;
using Aws = Pulumi.Aws;

return await Deployment.RunAsync(() =>
{
    // Streaming job: the command name "gluestreaming" is what distinguishes it
    // from the other examples. exampleAwsIamRole and exampleAwsS3Bucket are
    // not declared in this snippet.
    var streamingCommand = new Aws.Glue.Inputs.JobCommandArgs
    {
        Name = "gluestreaming",
        ScriptLocation = $"s3://{exampleAwsS3Bucket.Bucket}/example.script",
    };

    var example = new Aws.Glue.Job("example", new Aws.Glue.JobArgs
    {
        Name = "example streaming job",
        RoleArn = exampleAwsIamRole.Arn,
        Command = streamingCommand,
    });
});

package generated_program;

import com.pulumi.Context;
import com.pulumi.Pulumi;
import com.pulumi.core.Output;
import com.pulumi.aws.glue.Job;
import com.pulumi.aws.glue.JobArgs;
import com.pulumi.aws.glue.inputs.JobCommandArgs;
import java.util.List;
import java.util.ArrayList;
import java.util.Map;
import java.io.File;
import java.nio.file.Files;
import java.nio.file.Paths;

public class App {
    public static void main(String[] args) {
        Pulumi.run(App::stack);
    }

    /**
     * Declares a Glue streaming job named "example streaming job".
     *
     * NOTE(review): exampleAwsIamRole and exampleAwsS3Bucket are not declared in
     * this snippet; they are assumed to be defined elsewhere in the program.
     */
    public static void stack(Context ctx) {
        // The command name "gluestreaming" is what distinguishes this example.
        final var streamingCommand = JobCommandArgs.builder()
            .name("gluestreaming")
            .scriptLocation(String.format("s3://%s/example.script", exampleAwsS3Bucket.bucket()))
            .build();

        var example = new Job("example", JobArgs.builder()
            .name("example streaming job")
            .roleArn(exampleAwsIamRole.arn())
            .command(streamingCommand)
            .build());
    }
}

# Glue streaming job named "example streaming job".
# exampleAwsIamRole and exampleAwsS3Bucket are referenced but not declared in this snippet.
resources:
  example:
    type: aws:glue:Job
    properties:
      name: example streaming job
      roleArn: ${exampleAwsIamRole.arn}
      command:
        # The command name "gluestreaming" is what distinguishes this example.
        name: gluestreaming
        scriptLocation: s3://${exampleAwsS3Bucket.bucket}/example.script

Enabling CloudWatch Logs and Metrics

import * as pulumi from "@pulumi/pulumi";
import * as aws from "@pulumi/aws";

// Log group the job's continuous logging is pointed at; retention is 14 days.
const example = new aws.cloudwatch.LogGroup("example", {
    name: "example",
    retentionInDays: 14,
});
// Only the logging/metrics arguments are shown here; other job settings
// (such as roleArn and command) are not set in this snippet.
const loggingArguments = {
    "--continuous-log-logGroup": example.name,
    "--enable-continuous-cloudwatch-log": "true",
    "--enable-continuous-log-filter": "true",
    "--enable-metrics": "",
};
const exampleJob = new aws.glue.Job("example", {defaultArguments: loggingArguments});

import pulumi
import pulumi_aws as aws

# Log group the job's continuous logging is pointed at; retention is 14 days.
example = aws.cloudwatch.LogGroup("example",
    name="example",
    retention_in_days=14)
# Only the logging/metrics arguments are shown here; other job settings
# (such as role_arn and command) are not set in this snippet.
logging_arguments = {
    "--continuous-log-logGroup": example.name,
    "--enable-continuous-cloudwatch-log": "true",
    "--enable-continuous-log-filter": "true",
    "--enable-metrics": "",
}
example_job = aws.glue.Job("example", default_arguments=logging_arguments)

package main

import (
	"github.com/pulumi/pulumi-aws/sdk/v6/go/aws/cloudwatch"
	"github.com/pulumi/pulumi-aws/sdk/v6/go/aws/glue"
	"github.com/pulumi/pulumi/sdk/v3/go/pulumi"
)

// main declares a CloudWatch log group and a Glue job whose default arguments
// reference that log group and switch on continuous logging and metrics.
//
// Only the logging/metrics arguments are shown; other job settings (such as
// RoleArn and Command) are not set in this snippet.
func main() {
	pulumi.Run(func(ctx *pulumi.Context) error {
		// Log group with a 14-day retention period.
		logGroup, err := cloudwatch.NewLogGroup(ctx, "example", &cloudwatch.LogGroupArgs{
			Name:            pulumi.String("example"),
			RetentionInDays: pulumi.Int(14),
		})
		if err != nil {
			return err
		}

		loggingArgs := pulumi.StringMap{
			"--continuous-log-logGroup":          logGroup.Name,
			"--enable-continuous-cloudwatch-log": pulumi.String("true"),
			"--enable-continuous-log-filter":     pulumi.String("true"),
			"--enable-metrics":                   pulumi.String(""),
		}
		_, err = glue.NewJob(ctx, "example", &glue.JobArgs{
			DefaultArguments: loggingArgs,
		})
		// err is nil on success, so it can be returned as-is.
		return err
	})
}

using System.Collections.Generic;
using System.Linq;
using Pulumi;
using Aws = Pulumi.Aws;

return await Deployment.RunAsync(() =>
{
    // Log group the job's continuous logging is pointed at; retention is 14 days.
    var logGroup = new Aws.CloudWatch.LogGroup("example", new Aws.CloudWatch.LogGroupArgs
    {
        Name = "example",
        RetentionInDays = 14,
    });

    // Only the logging/metrics arguments are shown here; other job settings
    // (such as RoleArn and Command) are not set in this snippet.
    var exampleJob = new Aws.Glue.Job("example", new Aws.Glue.JobArgs
    {
        DefaultArguments =
        {
            { "--continuous-log-logGroup", logGroup.Name },
            { "--enable-continuous-cloudwatch-log", "true" },
            { "--enable-continuous-log-filter", "true" },
            { "--enable-metrics", "" },
        },
    });
});

package generated_program;

import com.pulumi.Context;
import com.pulumi.Pulumi;
import com.pulumi.core.Output;
import com.pulumi.aws.cloudwatch.LogGroup;
import com.pulumi.aws.cloudwatch.LogGroupArgs;
import com.pulumi.aws.glue.Job;
import com.pulumi.aws.glue.JobArgs;
import java.util.List;
import java.util.ArrayList;
import java.util.Map;
import java.io.File;
import java.nio.file.Files;
import java.nio.file.Paths;

public class App {
    public static void main(String[] args) {
        Pulumi.run(App::stack);
    }

    /**
     * Declares a CloudWatch log group and a Glue job whose default arguments
     * reference that log group and switch on continuous logging and metrics.
     *
     * Only the logging/metrics arguments are shown; other job settings (such
     * as roleArn and command) are not set in this snippet.
     */
    public static void stack(Context ctx) {
        // Log group with a 14-day retention period.
        var example = new LogGroup("example", LogGroupArgs.builder()
            .name("example")
            .retentionInDays(14)
            .build());

        // Registered as "example" so the resource name matches the other
        // language variants of this example (the Java variable keeps its own name).
        var exampleJob = new Job("example", JobArgs.builder()
            .defaultArguments(Map.ofEntries(
                Map.entry("--continuous-log-logGroup", example.name()),
                Map.entry("--enable-continuous-cloudwatch-log", "true"),
                Map.entry("--enable-continuous-log-filter", "true"),
                Map.entry("--enable-metrics", "")
            ))
            .build());

    }
}

# CloudWatch log group plus a Glue job whose default arguments reference it.
# Only the logging/metrics arguments are shown; other job properties
# (such as roleArn and command) are not set in this snippet.
resources:
  example:
    type: aws:cloudwatch:LogGroup
    properties:
      name: example
      # Retention period of 14 days.
      retentionInDays: 14
  exampleJob:
    type: aws:glue:Job
    # NOTE(review): presumably sets the resource name to "example", as the
    # other language variants do — confirm against the Pulumi YAML reference.
    name: example
    properties:
      defaultArguments:
        --continuous-log-logGroup: ${example.name}
        --enable-continuous-cloudwatch-log: 'true'
        --enable-continuous-log-filter: 'true'
        --enable-metrics: ""

Create Job Resource

Resources are created with functions called constructors. To learn more about declaring and configuring resources, see Resources.

Constructor syntax

new Job(name: string, args: JobArgs, opts?: CustomResourceOptions);

@overload
def Job(resource_name: str,
        args: JobArgs,
        opts: Optional[ResourceOptions] = None)

@overload
def Job(resource_name: str,
        opts: Optional[ResourceOptions] = None,
        command: Optional[JobCommandArgs] = None,
        role_arn: Optional[str] = None,
        execution_property: Optional[JobExecutionPropertyArgs] = None,
        name: Optional[str] = None,
        execution_class: Optional[str] = None,
        default_arguments: Optional[Mapping[str, str]] = None,
        glue_version: Optional[str] = None,
        job_run_queuing_enabled: Optional[bool] = None,
        maintenance_window: Optional[str] = None,
        max_capacity: Optional[float] = None,
        max_retries: Optional[int] = None,
        description: Optional[str] = None,
        non_overridable_arguments: Optional[Mapping[str, str]] = None,
        notification_property: Optional[JobNotificationPropertyArgs] = None,
        number_of_workers: Optional[int] = None,
        connections: Optional[Sequence[str]] = None,
        security_configuration: Optional[str] = None,
        source_control_details: Optional[JobSourceControlDetailsArgs] = None,
        tags: Optional[Mapping[str, str]] = None,
        timeout: Optional[int] = None,
        worker_type: Optional[str] = None)

// NewJob is the Go constructor for the Job resource. args is a pointer, as in
// the Go examples on this page, which pass &glue.JobArgs{...}.
func NewJob(ctx *Context, name string, args *JobArgs, opts ...ResourceOption) (*Job, error)

public Job(string name, JobArgs args, CustomResourceOptions? opts = null)

public Job(String name, JobArgs args)
public Job(String name, JobArgs args, CustomResourceOptions options)

type: aws:glue:Job
properties: # The arguments to resource properties.
options: # Bag of options to control resource's behavior.

Parameters

name string: The unique name of the resource.
args JobArgs: The arguments to resource properties.
opts CustomResourceOptions: Bag of options to control resource's behavior.

resource_name str: The unique name of the resource.
args JobArgs: The arguments to resource properties.
opts ResourceOptions: Bag of options to control resource's behavior.

ctx Context: Context object for the current deployment.
name string: The unique name of the resource.
args JobArgs: The arguments to resource properties.
opts ResourceOption: Bag of options to control resource's behavior.

name string: The unique name of the resource.
args JobArgs: The arguments to resource properties.
opts CustomResourceOptions: Bag of options to control resource's behavior.

name String: The unique name of the resource.
args JobArgs: The arguments to resource properties.
options CustomResourceOptions: Bag of options to control resource's behavior.

Constructor example

The following reference example uses placeholder values for all input properties.

var jobResource = new Aws.Glue.Job("jobResource", new()
{
    Command = new Aws.Glue.Inputs.JobCommandArgs
    {
        ScriptLocation = "string",
        Name = "string",
        PythonVersion = "string",
        Runtime = "string",
    },
    RoleArn = "string",
    ExecutionProperty = new Aws.Glue.Inputs.JobExecutionPropertyArgs
    {
        MaxConcurrentRuns = 0,
    },
    Name = "string",
    ExecutionClass = "string",
    DefaultArguments = 
    {
        { "string", "string" },
    },
    GlueVersion = "string",
    JobRunQueuingEnabled = false,
    MaintenanceWindow = "string",
    MaxCapacity = 0,
    MaxRetries = 0,
    Description = "string",
    NonOverridableArguments = 
    {
        { "string", "string" },
    },
    NotificationProperty = new Aws.Glue.Inputs.JobNotificationPropertyArgs
    {
        NotifyDelayAfter = 0,
    },
    NumberOfWorkers = 0,
    Connections = new[]
    {
        "string",
    },
    SecurityConfiguration = "string",
    SourceControlDetails = new Aws.Glue.Inputs.JobSourceControlDetailsArgs
    {
        AuthStrategy = "string",
        AuthToken = "string",
        Branch = "string",
        Folder = "string",
        LastCommitId = "string",
        Owner = "string",
        Provider = "string",
        Repository = "string",
    },
    Tags = 
    {
        { "string", "string" },
    },
    Timeout = 0,
    WorkerType = "string",
});

example, err := glue.NewJob(ctx, "jobResource", &glue.JobArgs{
	Command: &glue.JobCommandArgs{
		ScriptLocation: pulumi.String("string"),
		Name:           pulumi.String("string"),
		PythonVersion:  pulumi.String("string"),
		Runtime:        pulumi.String("string"),
	},
	RoleArn: pulumi.String("string"),
	ExecutionProperty: &glue.JobExecutionPropertyArgs{
		MaxConcurrentRuns: pulumi.Int(0),
	},
	Name:           pulumi.String("string"),
	ExecutionClass: pulumi.String("string"),
	DefaultArguments: pulumi.StringMap{
		"string": pulumi.String("string"),
	},
	GlueVersion:          pulumi.String("string"),
	JobRunQueuingEnabled: pulumi.Bool(false),
	MaintenanceWindow:    pulumi.String("string"),
	MaxCapacity:          pulumi.Float64(0),
	MaxRetries:           pulumi.Int(0),
	Description:          pulumi.String("string"),
	NonOverridableArguments: pulumi.StringMap{
		"string": pulumi.String("string"),
	},
	NotificationProperty: &glue.JobNotificationPropertyArgs{
		NotifyDelayAfter: pulumi.Int(0),
	},
	NumberOfWorkers: pulumi.Int(0),
	Connections: pulumi.StringArray{
		pulumi.String("string"),
	},
	SecurityConfiguration: pulumi.String("string"),
	SourceControlDetails: &glue.JobSourceControlDetailsArgs{
		AuthStrategy: pulumi.String("string"),
		AuthToken:    pulumi.String("string"),
		Branch:       pulumi.String("string"),
		Folder:       pulumi.String("string"),
		LastCommitId: pulumi.String("string"),
		Owner:        pulumi.String("string"),
		Provider:     pulumi.String("string"),
		Repository:   pulumi.String("string"),
	},
	Tags: pulumi.StringMap{
		"string": pulumi.String("string"),
	},
	Timeout:    pulumi.Int(0),
	WorkerType: pulumi.String("string"),
})

var jobResource = new Job("jobResource", JobArgs.builder()
    .command(JobCommandArgs.builder()
        .scriptLocation("string")
        .name("string")
        .pythonVersion("string")
        .runtime("string")
        .build())
    .roleArn("string")
    .executionProperty(JobExecutionPropertyArgs.builder()
        .maxConcurrentRuns(0)
        .build())
    .name("string")
    .executionClass("string")
    .defaultArguments(Map.of("string", "string"))
    .glueVersion("string")
    .jobRunQueuingEnabled(false)
    .maintenanceWindow("string")
    .maxCapacity(0.0)
    .maxRetries(0)
    .description("string")
    .nonOverridableArguments(Map.of("string", "string"))
    .notificationProperty(JobNotificationPropertyArgs.builder()
        .notifyDelayAfter(0)
        .build())
    .numberOfWorkers(0)
    .connections("string")
    .securityConfiguration("string")
    .sourceControlDetails(JobSourceControlDetailsArgs.builder()
        .authStrategy("string")
        .authToken("string")
        .branch("string")
        .folder("string")
        .lastCommitId("string")
        .owner("string")
        .provider("string")
        .repository("string")
        .build())
    .tags(Map.of("string", "string"))
    .timeout(0)
    .workerType("string")
    .build());

job_resource = aws.glue.Job("jobResource",
    command={
        "script_location": "string",
        "name": "string",
        "python_version": "string",
        "runtime": "string",
    },
    role_arn="string",
    execution_property={
        "max_concurrent_runs": 0,
    },
    name="string",
    execution_class="string",
    default_arguments={
        "string": "string",
    },
    glue_version="string",
    job_run_queuing_enabled=False,
    maintenance_window="string",
    max_capacity=0,
    max_retries=0,
    description="string",
    non_overridable_arguments={
        "string": "string",
    },
    notification_property={
        "notify_delay_after": 0,
    },
    number_of_workers=0,
    connections=["string"],
    security_configuration="string",
    source_control_details={
        "auth_strategy": "string",
        "auth_token": "string",
        "branch": "string",
        "folder": "string",
        "last_commit_id": "string",
        "owner": "string",
        "provider": "string",
        "repository": "string",
    },
    tags={
        "string": "string",
    },
    timeout=0,
    worker_type="string")

const jobResource = new aws.glue.Job("jobResource", {
    command: {
        scriptLocation: "string",
        name: "string",
        pythonVersion: "string",
        runtime: "string",
    },
    roleArn: "string",
    executionProperty: {
        maxConcurrentRuns: 0,
    },
    name: "string",
    executionClass: "string",
    defaultArguments: {
        string: "string",
    },
    glueVersion: "string",
    jobRunQueuingEnabled: false,
    maintenanceWindow: "string",
    maxCapacity: 0,
    maxRetries: 0,
    description: "string",
    nonOverridableArguments: {
        string: "string",
    },
    notificationProperty: {
        notifyDelayAfter: 0,
    },
    numberOfWorkers: 0,
    connections: ["string"],
    securityConfiguration: "string",
    sourceControlDetails: {
        authStrategy: "string",
        authToken: "string",
        branch: "string",
        folder: "string",
        lastCommitId: "string",
        owner: "string",
        provider: "string",
        repository: "string",
    },
    tags: {
        string: "string",
    },
    timeout: 0,
    workerType: "string",
});

type: aws:glue:Job
properties:
    command:
        name: string
        pythonVersion: string
        runtime: string
        scriptLocation: string
    connections:
        - string
    defaultArguments:
        string: string
    description: string
    executionClass: string
    executionProperty:
        maxConcurrentRuns: 0
    glueVersion: string
    jobRunQueuingEnabled: false
    maintenanceWindow: string
    maxCapacity: 0
    maxRetries: 0
    name: string
    nonOverridableArguments:
        string: string
    notificationProperty:
        notifyDelayAfter: 0
    numberOfWorkers: 0
    roleArn: string
    securityConfiguration: string
    sourceControlDetails:
        authStrategy: string
        authToken: string
        branch: string
        folder: string
        lastCommitId: string
        owner: string
        provider: string
        repository: string
    tags:
        string: string
    timeout: 0
    workerType: string

Job Resource Properties

To learn more about resource properties and how to use them, see Inputs and Outputs in the Architecture and Concepts docs.

Inputs

In Python, inputs that are objects can be passed either as argument classes or as dictionary literals.

The Job resource accepts the following input properties:

Command JobCommand

The command of the job. Defined below.

RoleArn string

The ARN of the IAM role associated with this job.

Connections List<string>

The list of connections used for this job.

DefaultArguments Dictionary<string, string>

The map of default arguments for this job. You can specify arguments here that your own job-execution script consumes, as well as arguments that AWS Glue itself consumes. For information about how to specify and consume your own Job arguments, see the Calling AWS Glue APIs in Python topic in the developer guide. For information about the key-value pairs that AWS Glue consumes to set up your job, see the Special Parameters Used by AWS Glue topic in the developer guide.

Description string

Description of the job.

ExecutionClass string

Indicates whether the job is run with a standard or flexible execution class. The standard execution class is ideal for time-sensitive workloads that require fast job startup and dedicated resources. Valid values: FLEX, STANDARD.

ExecutionProperty JobExecutionProperty

Execution property of the job. Defined below.

GlueVersion string

The version of glue to use, for example "1.0". Ray jobs should set this to 4.0 or greater. For information about available versions, see the AWS Glue Release Notes.

JobRunQueuingEnabled bool

Specifies whether job run queuing is enabled for the job runs for this job. A value of true means job run queuing is enabled for the job runs. If false or not populated, the job runs will not be considered for queuing.

MaintenanceWindow string

Specifies the day of the week and hour for the maintenance window for streaming jobs.

MaxCapacity double

The maximum number of AWS Glue data processing units (DPUs) that can be allocated when this job runs. Required when pythonshell is set; accepts either 0.0625 or 1.0. Use number_of_workers and worker_type arguments instead with glue_version 2.0 and above.

MaxRetries int

The maximum number of times to retry this job if it fails.

Name string

The name you assign to this job. It must be unique in your account.

NonOverridableArguments Dictionary<string, string>

Non-overridable arguments for this job, specified as name-value pairs.

NotificationProperty JobNotificationProperty

Notification property of the job. Defined below.

NumberOfWorkers int

The number of workers of a defined workerType that are allocated when a job runs.

SecurityConfiguration string

The name of the Security Configuration to be associated with the job.

SourceControlDetails JobSourceControlDetails

The details for a source control configuration for a job, allowing synchronization of job artifacts to or from a remote repository. Defined below.

Tags Dictionary<string, string>

Key-value map of resource tags. If configured with a provider default_tags configuration block present, tags with matching keys will overwrite those defined at the provider-level.

Timeout int

The job timeout in minutes. The default is 2880 minutes (48 hours) for glueetl and pythonshell jobs, and null (unlimited) for gluestreaming jobs.

WorkerType string

The type of predefined worker that is allocated when a job runs. Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs. Accepts the value Z.2X for Ray jobs.

For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker.
For the G.1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.2X worker type, each worker maps to 2 DPU (8 vCPU, 32 GB of memory, 128 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.4X worker type, each worker maps to 4 DPU (16 vCPUs, 64 GB of memory) with 256GB disk (approximately 235GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.8X worker type, each worker maps to 8 DPU (32 vCPUs, 128 GB of memory) with 512GB disk (approximately 487GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.025X worker type, each worker maps to 0.25 DPU (2 vCPU, 4GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for low volume streaming jobs. Only available for Glue version 3.0.
For the Z.2X worker type, each worker maps to 2 M-DPU (8 vCPU, 64 GB of memory, 128 GB disk), and provides up to 8 Ray workers based on the autoscaler.

Command JobCommandArgs

The command of the job. Defined below.

RoleArn string

The ARN of the IAM role associated with this job.

Connections []string

The list of connections used for this job.

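DefaultArguments map[string]string

The map of default arguments for this job. You can specify arguments here that your own job-execution script consumes, as well as arguments that AWS Glue itself consumes. For information about how to specify and consume your own Job arguments, see the Calling AWS Glue APIs in Python topic in the developer guide. For information about the key-value pairs that AWS Glue consumes to set up your job, see the Special Parameters Used by AWS Glue topic in the developer guide.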

Description string

Description of the job.

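ExecutionClass string

Indicates whether the job is run with a standard or flexible execution class. The standard execution class is ideal for time-sensitive workloads that require fast job startup and dedicated resources. Valid values: FLEX, STANDARD.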

ExecutionProperty JobExecutionPropertyArgs

Execution property of the job. Defined below.

GlueVersion string

The version of glue to use, for example "1.0". Ray jobs should set this to 4.0 or greater. For information about available versions, see the AWS Glue Release Notes.

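JobRunQueuingEnabled bool

Specifies whether job run queuing is enabled for the job runs for this job. A value of true means job run queuing is enabled for the job runs. If false or not populated, the job runs will not be considered for queuing.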

MaintenanceWindow string

Specifies the day of the week and hour for the maintenance window for streaming jobs.

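MaxCapacity float64

The maximum number of AWS Glue data processing units (DPUs) that can be allocated when this job runs. Required when pythonshell is set; accepts either 0.0625 or 1.0. Use number_of_workers and worker_type arguments instead with glue_version 2.0 and above.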

MaxRetries int

The maximum number of times to retry this job if it fails.

Name string

The name you assign to this job. It must be unique in your account.

NonOverridableArguments map[string]string

Non-overridable arguments for this job, specified as name-value pairs.

NotificationProperty JobNotificationPropertyArgs

Notification property of the job. Defined below.

NumberOfWorkers int

The number of workers of a defined workerType that are allocated when a job runs.

SecurityConfiguration string

The name of the Security Configuration to be associated with the job.

SourceControlDetails JobSourceControlDetailsArgs

The details for a source control configuration for a job, allowing synchronization of job artifacts to or from a remote repository. Defined below.

Tags map[string]string

Key-value map of resource tags. If configured with a provider default_tags configuration block present, tags with matching keys will overwrite those defined at the provider-level.

Timeout int

The job timeout in minutes. The default is 2880 minutes (48 hours) for glueetl and pythonshell jobs, and null (unlimited) for gluestreaming jobs.

WorkerType string

The type of predefined worker that is allocated when a job runs. Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs. Accepts the value Z.2X for Ray jobs.

For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker.
For the G.1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.2X worker type, each worker maps to 2 DPU (8 vCPU, 32 GB of memory, 128 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.4X worker type, each worker maps to 4 DPU (16 vCPUs, 64 GB of memory) with 256GB disk (approximately 235GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.8X worker type, each worker maps to 8 DPU (32 vCPUs, 128 GB of memory) with 512GB disk (approximately 487GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.025X worker type, each worker maps to 0.25 DPU (2 vCPU, 4GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for low volume streaming jobs. Only available for Glue version 3.0.
For the Z.2X worker type, each worker maps to 2 M-DPU (8 vCPU, 64 GB of memory, 128 GB disk), and provides up to 8 Ray workers based on the autoscaler.

command JobCommand

The command of the job. Defined below.

roleArn String

The ARN of the IAM role associated with this job.

connections List<String>

The list of connections used for this job.

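defaultArguments Map<String,String>

The map of default arguments for this job. You can specify arguments here that your own job-execution script consumes, as well as arguments that AWS Glue itself consumes. For information about how to specify and consume your own Job arguments, see the Calling AWS Glue APIs in Python topic in the developer guide. For information about the key-value pairs that AWS Glue consumes to set up your job, see the Special Parameters Used by AWS Glue topic in the developer guide.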

description String

Description of the job.

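executionClass String

Indicates whether the job is run with a standard or flexible execution class. The standard execution class is ideal for time-sensitive workloads that require fast job startup and dedicated resources. Valid values: FLEX, STANDARD.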

executionProperty JobExecutionProperty

Execution property of the job. Defined below.

glueVersion String

The version of glue to use, for example "1.0". Ray jobs should set this to 4.0 or greater. For information about available versions, see the AWS Glue Release Notes.

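jobRunQueuingEnabled Boolean

Specifies whether job run queuing is enabled for the job runs for this job. A value of true means job run queuing is enabled for the job runs. If false or not populated, the job runs will not be considered for queuing.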

maintenanceWindow String

Specifies the day of the week and hour for the maintenance window for streaming jobs.

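maxCapacity Double

The maximum number of AWS Glue data processing units (DPUs) that can be allocated when this job runs. Required when pythonshell is set; accepts either 0.0625 or 1.0. Use number_of_workers and worker_type arguments instead with glue_version 2.0 and above.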

maxRetries Integer

The maximum number of times to retry this job if it fails.

name String

The name you assign to this job. It must be unique in your account.

nonOverridableArguments Map<String,String>

Non-overridable arguments for this job, specified as name-value pairs.

notificationProperty JobNotificationProperty

Notification property of the job. Defined below.

numberOfWorkers Integer

The number of workers of a defined workerType that are allocated when a job runs.

securityConfiguration String

The name of the Security Configuration to be associated with the job.

sourceControlDetails JobSourceControlDetails

The details for a source control configuration for a job, allowing synchronization of job artifacts to or from a remote repository. Defined below.

tags Map<String,String>

Key-value map of resource tags. If configured with a provider default_tags configuration block present, tags with matching keys will overwrite those defined at the provider-level.

timeout Integer

The job timeout in minutes. The default is 2880 minutes (48 hours) for glueetl and pythonshell jobs, and null (unlimited) for gluestreaming jobs.

workerType String

The type of predefined worker that is allocated when a job runs. Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs. Accepts the value Z.2X for Ray jobs.

For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker.
For the G.1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.2X worker type, each worker maps to 2 DPU (8 vCPU, 32 GB of memory, 128 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.4X worker type, each worker maps to 4 DPU (16 vCPUs, 64 GB of memory) with 256GB disk (approximately 235GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.8X worker type, each worker maps to 8 DPU (32 vCPUs, 128 GB of memory) with 512GB disk (approximately 487GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.025X worker type, each worker maps to 0.25 DPU (2 vCPU, 4GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for low volume streaming jobs. Only available for Glue version 3.0.
For the Z.2X worker type, each worker maps to 2 M-DPU (8 vCPU, 64 GB of memory, 128 GB disk), and provides up to 8 Ray workers based on the autoscaler.

command JobCommand

The command of the job. Defined below.

roleArn string

The ARN of the IAM role associated with this job.

connections string[]

The list of connections used for this job.

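defaultArguments {[key: string]: string}

The map of default arguments for this job. You can specify arguments here that your own job-execution script consumes, as well as arguments that AWS Glue itself consumes. For information about how to specify and consume your own Job arguments, see the Calling AWS Glue APIs in Python topic in the developer guide. For information about the key-value pairs that AWS Glue consumes to set up your job, see the Special Parameters Used by AWS Glue topic in the developer guide.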

description string

Description of the job.

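executionClass string

Indicates whether the job is run with a standard or flexible execution class. The standard execution class is ideal for time-sensitive workloads that require fast job startup and dedicated resources. Valid values: FLEX, STANDARD.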

executionProperty JobExecutionProperty

Execution property of the job. Defined below.

glueVersion string

The version of glue to use, for example "1.0". Ray jobs should set this to 4.0 or greater. For information about available versions, see the AWS Glue Release Notes.

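jobRunQueuingEnabled boolean

Specifies whether job run queuing is enabled for the job runs for this job. A value of true means job run queuing is enabled for the job runs. If false or not populated, the job runs will not be considered for queuing.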

maintenanceWindow string

Specifies the day of the week and hour for the maintenance window for streaming jobs.

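maxCapacity number

The maximum number of AWS Glue data processing units (DPUs) that can be allocated when this job runs. Required when pythonshell is set; accepts either 0.0625 or 1.0. Use number_of_workers and worker_type arguments instead with glue_version 2.0 and above.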

maxRetries number

The maximum number of times to retry this job if it fails.

name string

The name you assign to this job. It must be unique in your account.

nonOverridableArguments {[key: string]: string}

Non-overridable arguments for this job, specified as name-value pairs.

notificationProperty JobNotificationProperty

Notification property of the job. Defined below.

numberOfWorkers number

The number of workers of a defined workerType that are allocated when a job runs.

securityConfiguration string

The name of the Security Configuration to be associated with the job.

sourceControlDetails JobSourceControlDetails

The details for a source control configuration for a job, allowing synchronization of job artifacts to or from a remote repository. Defined below.

tags {[key: string]: string}

Key-value map of resource tags. If configured with a provider default_tags configuration block present, tags with matching keys will overwrite those defined at the provider-level.

timeout number

The job timeout in minutes. The default is 2880 minutes (48 hours) for glueetl and pythonshell jobs, and null (unlimited) for gluestreaming jobs.

workerType string

The type of predefined worker that is allocated when a job runs. Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs. Accepts the value Z.2X for Ray jobs.

For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker.
For the G.1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.2X worker type, each worker maps to 2 DPU (8 vCPU, 32 GB of memory, 128 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.4X worker type, each worker maps to 4 DPU (16 vCPUs, 64 GB of memory) with 256GB disk (approximately 235GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.8X worker type, each worker maps to 8 DPU (32 vCPUs, 128 GB of memory) with 512GB disk (approximately 487GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.025X worker type, each worker maps to 0.25 DPU (2 vCPU, 4GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for low volume streaming jobs. Only available for Glue version 3.0.
For the Z.2X worker type, each worker maps to 2 M-DPU (8 vCPU, 64 GB of memory, 128 GB disk), and provides up to 8 Ray workers based on the autoscaler.

command JobCommandArgs

The command of the job. Defined below.

role_arn str

The ARN of the IAM role associated with this job.

connections Sequence[str]

The list of connections used for this job.

default_arguments Mapping[str, str]

description str

Description of the job.

execution_class str

execution_property JobExecutionPropertyArgs

Execution property of the job. Defined below.

glue_version str

The version of glue to use, for example "1.0". Ray jobs should set this to 4.0 or greater. For information about available versions, see the AWS Glue Release Notes.

job_run_queuing_enabled bool

maintenance_window str

Specifies the day of the week and hour for the maintenance window for streaming jobs.

max_capacity float

max_retries int

The maximum number of times to retry this job if it fails.

name str

The name you assign to this job. It must be unique in your account.

non_overridable_arguments Mapping[str, str]

Non-overridable arguments for this job, specified as name-value pairs.

notification_property JobNotificationPropertyArgs

Notification property of the job. Defined below.

number_of_workers int

The number of workers of a defined workerType that are allocated when a job runs.

security_configuration str

The name of the Security Configuration to be associated with the job.

source_control_details JobSourceControlDetailsArgs

The details for a source control configuration for a job, allowing synchronization of job artifacts to or from a remote repository. Defined below.

tags Mapping[str, str]

Key-value map of resource tags. If configured with a provider default_tags configuration block present, tags with matching keys will overwrite those defined at the provider-level.

timeout int

The job timeout in minutes. The default is 2880 minutes (48 hours) for glueetl and pythonshell jobs, and null (unlimited) for gluestreaming jobs.

worker_type str

The type of predefined worker that is allocated when a job runs. Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs. Accepts the value Z.2X for Ray jobs.

For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker.
For the G.1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.2X worker type, each worker maps to 2 DPU (8 vCPU, 32 GB of memory, 128 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.4X worker type, each worker maps to 4 DPU (16 vCPUs, 64 GB of memory) with 256GB disk (approximately 235GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.8X worker type, each worker maps to 8 DPU (32 vCPUs, 128 GB of memory) with 512GB disk (approximately 487GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.025X worker type, each worker maps to 0.25 DPU (2 vCPU, 4GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for low volume streaming jobs. Only available for Glue version 3.0.
For the Z.2X worker type, each worker maps to 2 M-DPU (8 vCPU, 64 GB of memory, 128 GB disk), and provides up to 8 Ray workers based on the autoscaler.

command Property Map

The command of the job. Defined below.

roleArn String

The ARN of the IAM role associated with this job.

connections List<String>

The list of connections used for this job.

defaultArguments Map<String>

description String

Description of the job.

executionClass String

executionProperty Property Map

Execution property of the job. Defined below.

glueVersion String

The version of glue to use, for example "1.0". Ray jobs should set this to 4.0 or greater. For information about available versions, see the AWS Glue Release Notes.

jobRunQueuingEnabled Boolean

maintenanceWindow String

Specifies the day of the week and hour for the maintenance window for streaming jobs.

maxCapacity Number

maxRetries Number

The maximum number of times to retry this job if it fails.

name String

The name you assign to this job. It must be unique in your account.

nonOverridableArguments Map<String>

Non-overridable arguments for this job, specified as name-value pairs.

notificationProperty Property Map

Notification property of the job. Defined below.

numberOfWorkers Number

The number of workers of a defined workerType that are allocated when a job runs.

securityConfiguration String

The name of the Security Configuration to be associated with the job.

sourceControlDetails Property Map

The details for a source control configuration for a job, allowing synchronization of job artifacts to or from a remote repository. Defined below.

tags Map<String>

Key-value map of resource tags. If configured with a provider default_tags configuration block present, tags with matching keys will overwrite those defined at the provider-level.

timeout Number

The job timeout in minutes. The default is 2880 minutes (48 hours) for glueetl and pythonshell jobs, and null (unlimited) for gluestreaming jobs.

workerType String

The type of predefined worker that is allocated when a job runs. Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs. Accepts the value Z.2X for Ray jobs.

For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker.
For the G.1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.2X worker type, each worker maps to 2 DPU (8 vCPU, 32 GB of memory, 128 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.4X worker type, each worker maps to 4 DPU (16 vCPUs, 64 GB of memory) with 256GB disk (approximately 235GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.8X worker type, each worker maps to 8 DPU (32 vCPUs, 128 GB of memory) with 512GB disk (approximately 487GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.025X worker type, each worker maps to 0.25 DPU (2 vCPU, 4GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for low volume streaming jobs. Only available for Glue version 3.0.
For the Z.2X worker type, each worker maps to 2 M-DPU (8 vCPU, 64 GB of memory, 128 GB disk), and provides up to 8 Ray workers based on the autoscaler.

Outputs

All input properties are implicitly available as output properties. Additionally, the Job resource produces the following output properties:

Arn string: Amazon Resource Name (ARN) of Glue Job
Id string: The provider-assigned unique ID for this managed resource.
TagsAll Dictionary<string, string>: A map of tags assigned to the resource, including those inherited from the provider default_tags configuration block.
Deprecated: Please use tags instead.

Arn string: Amazon Resource Name (ARN) of Glue Job
Id string: The provider-assigned unique ID for this managed resource.
TagsAll map[string]string: A map of tags assigned to the resource, including those inherited from the provider default_tags configuration block.
Deprecated: Please use tags instead.

arn String: Amazon Resource Name (ARN) of Glue Job
id String: The provider-assigned unique ID for this managed resource.
tagsAll Map<String,String>: A map of tags assigned to the resource, including those inherited from the provider default_tags configuration block.
Deprecated: Please use tags instead.

arn string: Amazon Resource Name (ARN) of Glue Job
id string: The provider-assigned unique ID for this managed resource.
tagsAll {[key: string]: string}: A map of tags assigned to the resource, including those inherited from the provider default_tags configuration block.
Deprecated: Please use tags instead.

arn str: Amazon Resource Name (ARN) of Glue Job
id str: The provider-assigned unique ID for this managed resource.
tags_all Mapping[str, str]: A map of tags assigned to the resource, including those inherited from the provider default_tags configuration block.
Deprecated: Please use tags instead.

arn String: Amazon Resource Name (ARN) of Glue Job
id String: The provider-assigned unique ID for this managed resource.
tagsAll Map<String>: A map of tags assigned to the resource, including those inherited from the provider default_tags configuration block.
Deprecated: Please use tags instead.

Look up Existing Job Resource

Get an existing Job resource’s state with the given name, ID, and optional extra properties used to qualify the lookup.

public static get(name: string, id: Input<ID>, state?: JobState, opts?: CustomResourceOptions): Job

@staticmethod
def get(resource_name: str,
        id: str,
        opts: Optional[ResourceOptions] = None,
        arn: Optional[str] = None,
        command: Optional[JobCommandArgs] = None,
        connections: Optional[Sequence[str]] = None,
        default_arguments: Optional[Mapping[str, str]] = None,
        description: Optional[str] = None,
        execution_class: Optional[str] = None,
        execution_property: Optional[JobExecutionPropertyArgs] = None,
        glue_version: Optional[str] = None,
        job_run_queuing_enabled: Optional[bool] = None,
        maintenance_window: Optional[str] = None,
        max_capacity: Optional[float] = None,
        max_retries: Optional[int] = None,
        name: Optional[str] = None,
        non_overridable_arguments: Optional[Mapping[str, str]] = None,
        notification_property: Optional[JobNotificationPropertyArgs] = None,
        number_of_workers: Optional[int] = None,
        role_arn: Optional[str] = None,
        security_configuration: Optional[str] = None,
        source_control_details: Optional[JobSourceControlDetailsArgs] = None,
        tags: Optional[Mapping[str, str]] = None,
        tags_all: Optional[Mapping[str, str]] = None,
        timeout: Optional[int] = None,
        worker_type: Optional[str] = None) -> Job

func GetJob(ctx *Context, name string, id IDInput, state *JobState, opts ...ResourceOption) (*Job, error)

public static Job Get(string name, Input<string> id, JobState? state, CustomResourceOptions? opts = null)

public static Job get(String name, Output<String> id, JobState state, CustomResourceOptions options)

resources:
  _:
    type: aws:glue:Job
    get:
      id: ${id}

name: The unique name of the resulting resource.
id: The unique provider ID of the resource to lookup.
state: Any extra arguments used during the lookup.
opts: A bag of options that control this resource's behavior.

resource_name: The unique name of the resulting resource.
id: The unique provider ID of the resource to lookup.

name: The unique name of the resulting resource.
id: The unique provider ID of the resource to lookup.
state: Any extra arguments used during the lookup.
opts: A bag of options that control this resource's behavior.

name: The unique name of the resulting resource.
id: The unique provider ID of the resource to lookup.
state: Any extra arguments used during the lookup.
opts: A bag of options that control this resource's behavior.

name: The unique name of the resulting resource.
id: The unique provider ID of the resource to lookup.
state: Any extra arguments used during the lookup.
opts: A bag of options that control this resource's behavior.

The following state arguments are supported:

Arn string

Amazon Resource Name (ARN) of Glue Job

Command JobCommand

The command of the job. Defined below.

Connections List<string>

The list of connections used for this job.

DefaultArguments Dictionary<string, string>

Description string

Description of the job.

ExecutionClass string

ExecutionProperty JobExecutionProperty

Execution property of the job. Defined below.

GlueVersion string

The version of glue to use, for example "1.0". Ray jobs should set this to 4.0 or greater. For information about available versions, see the AWS Glue Release Notes.

JobRunQueuingEnabled bool

MaintenanceWindow string

Specifies the day of the week and hour for the maintenance window for streaming jobs.

MaxCapacity double

MaxRetries int

The maximum number of times to retry this job if it fails.

Name string

The name you assign to this job. It must be unique in your account.

NonOverridableArguments Dictionary<string, string>

Non-overridable arguments for this job, specified as name-value pairs.

NotificationProperty JobNotificationProperty

Notification property of the job. Defined below.

NumberOfWorkers int

The number of workers of a defined workerType that are allocated when a job runs.

RoleArn string

The ARN of the IAM role associated with this job.

SecurityConfiguration string

The name of the Security Configuration to be associated with the job.

SourceControlDetails JobSourceControlDetails

The details for a source control configuration for a job, allowing synchronization of job artifacts to or from a remote repository. Defined below.

Tags Dictionary<string, string>

Key-value map of resource tags. If configured with a provider default_tags configuration block present, tags with matching keys will overwrite those defined at the provider-level.

TagsAll Dictionary<string, string>

A map of tags assigned to the resource, including those inherited from the provider default_tags configuration block.

Deprecated: Please use tags instead.

Timeout int

The job timeout in minutes. The default is 2880 minutes (48 hours) for glueetl and pythonshell jobs, and null (unlimited) for gluestreaming jobs.

WorkerType string

The type of predefined worker that is allocated when a job runs. Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs. Accepts the value Z.2X for Ray jobs.

For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker.
For the G.1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.2X worker type, each worker maps to 2 DPU (8 vCPU, 32 GB of memory, 128 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.4X worker type, each worker maps to 4 DPU (16 vCPUs, 64 GB of memory) with 256GB disk (approximately 235GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.8X worker type, each worker maps to 8 DPU (32 vCPUs, 128 GB of memory) with 512GB disk (approximately 487GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.025X worker type, each worker maps to 0.25 DPU (2 vCPU, 4GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for low volume streaming jobs. Only available for Glue version 3.0.
For the Z.2X worker type, each worker maps to 2 M-DPU (8 vCPU, 64 GB of memory, 128 GB disk), and provides up to 8 Ray workers based on the autoscaler.

Arn string

Amazon Resource Name (ARN) of Glue Job

Command JobCommandArgs

The command of the job. Defined below.

Connections []string

The list of connections used for this job.

DefaultArguments map[string]string

Description string

Description of the job.

ExecutionClass string

ExecutionProperty JobExecutionPropertyArgs

Execution property of the job. Defined below.

GlueVersion string

The version of glue to use, for example "1.0". Ray jobs should set this to 4.0 or greater. For information about available versions, see the AWS Glue Release Notes.

JobRunQueuingEnabled bool

MaintenanceWindow string

Specifies the day of the week and hour for the maintenance window for streaming jobs.

MaxCapacity float64

MaxRetries int

The maximum number of times to retry this job if it fails.

Name string

The name you assign to this job. It must be unique in your account.

NonOverridableArguments map[string]string

Non-overridable arguments for this job, specified as name-value pairs.

NotificationProperty JobNotificationPropertyArgs

Notification property of the job. Defined below.

NumberOfWorkers int

The number of workers of a defined workerType that are allocated when a job runs.

RoleArn string

The ARN of the IAM role associated with this job.

SecurityConfiguration string

The name of the Security Configuration to be associated with the job.

SourceControlDetails JobSourceControlDetailsArgs

The details for a source control configuration for a job, allowing synchronization of job artifacts to or from a remote repository. Defined below.

Tags map[string]string

Key-value map of resource tags. If configured with a provider default_tags configuration block present, tags with matching keys will overwrite those defined at the provider-level.

TagsAll map[string]string

A map of tags assigned to the resource, including those inherited from the provider default_tags configuration block.

Deprecated: Please use tags instead.

Timeout int

The job timeout in minutes. The default is 2880 minutes (48 hours) for glueetl and pythonshell jobs, and null (unlimited) for gluestreaming jobs.

WorkerType string

The type of predefined worker that is allocated when a job runs. Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs. Accepts the value Z.2X for Ray jobs.

For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker.
For the G.1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.2X worker type, each worker maps to 2 DPU (8 vCPU, 32 GB of memory, 128 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.4X worker type, each worker maps to 4 DPU (16 vCPUs, 64 GB of memory) with 256GB disk (approximately 235GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.8X worker type, each worker maps to 8 DPU (32 vCPUs, 128 GB of memory) with 512GB disk (approximately 487GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.025X worker type, each worker maps to 0.25 DPU (2 vCPU, 4GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for low volume streaming jobs. Only available for Glue version 3.0.
For the Z.2X worker type, each worker maps to 2 M-DPU (8 vCPU, 64 GB of memory, 128 GB disk), and provides up to 8 Ray workers based on the autoscaler.

arn String

Amazon Resource Name (ARN) of Glue Job

command JobCommand

The command of the job. Defined below.

connections List<String>

The list of connections used for this job.

defaultArguments Map<String,String>

description String

Description of the job.

executionClass String

executionProperty JobExecutionProperty

Execution property of the job. Defined below.

glueVersion String

The version of glue to use, for example "1.0". Ray jobs should set this to 4.0 or greater. For information about available versions, see the AWS Glue Release Notes.

jobRunQueuingEnabled Boolean

maintenanceWindow String

Specifies the day of the week and hour for the maintenance window for streaming jobs.

maxCapacity Double

maxRetries Integer

The maximum number of times to retry this job if it fails.

name String

The name you assign to this job. It must be unique in your account.

nonOverridableArguments Map<String,String>

Non-overridable arguments for this job, specified as name-value pairs.

notificationProperty JobNotificationProperty

Notification property of the job. Defined below.

numberOfWorkers Integer

The number of workers of a defined workerType that are allocated when a job runs.

roleArn String

The ARN of the IAM role associated with this job.

securityConfiguration String

The name of the Security Configuration to be associated with the job.

sourceControlDetails JobSourceControlDetails

The details for a source control configuration for a job, allowing synchronization of job artifacts to or from a remote repository. Defined below.

tags Map<String,String>

Key-value map of resource tags. If configured with a provider default_tags configuration block present, tags with matching keys will overwrite those defined at the provider-level.

tagsAll Map<String,String>

A map of tags assigned to the resource, including those inherited from the provider default_tags configuration block.

Deprecated: Please use tags instead.

timeout Integer

The job timeout in minutes. The default is 2880 minutes (48 hours) for glueetl and pythonshell jobs, and null (unlimited) for gluestreaming jobs.

workerType String

The type of predefined worker that is allocated when a job runs. Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs. Accepts the value Z.2X for Ray jobs.

For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker.
For the G.1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.2X worker type, each worker maps to 2 DPU (8 vCPU, 32 GB of memory, 128 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.4X worker type, each worker maps to 4 DPU (16 vCPUs, 64 GB of memory) with 256GB disk (approximately 235GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.8X worker type, each worker maps to 8 DPU (32 vCPUs, 128 GB of memory) with 512GB disk (approximately 487GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.025X worker type, each worker maps to 0.25 DPU (2 vCPU, 4GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for low volume streaming jobs. Only available for Glue version 3.0.
For the Z.2X worker type, each worker maps to 2 M-DPU (8 vCPU, 64 GB of memory, 128 GB disk), and provides up to 8 Ray workers based on the autoscaler.

arn string

Amazon Resource Name (ARN) of Glue Job

command JobCommand

The command of the job. Defined below.

connections string[]

The list of connections used for this job.

defaultArguments {[key: string]: string}

description string

Description of the job.

executionClass string

executionProperty JobExecutionProperty

Execution property of the job. Defined below.

glueVersion string

The version of glue to use, for example "1.0". Ray jobs should set this to 4.0 or greater. For information about available versions, see the AWS Glue Release Notes.

jobRunQueuingEnabled boolean

maintenanceWindow string

Specifies the day of the week and hour for the maintenance window for streaming jobs.

maxCapacity number

maxRetries number

The maximum number of times to retry this job if it fails.

name string

The name you assign to this job. It must be unique in your account.

nonOverridableArguments {[key: string]: string}

Non-overridable arguments for this job, specified as name-value pairs.

notificationProperty JobNotificationProperty

Notification property of the job. Defined below.

numberOfWorkers number

The number of workers of a defined workerType that are allocated when a job runs.

roleArn string

The ARN of the IAM role associated with this job.

securityConfiguration string

The name of the Security Configuration to be associated with the job.

sourceControlDetails JobSourceControlDetails

The details for a source control configuration for a job, allowing synchronization of job artifacts to or from a remote repository. Defined below.

tags {[key: string]: string}

Key-value map of resource tags. If configured with a provider default_tags configuration block present, tags with matching keys will overwrite those defined at the provider-level.

tagsAll {[key: string]: string}

A map of tags assigned to the resource, including those inherited from the provider default_tags configuration block.

Deprecated: Please use tags instead.

timeout number

The job timeout in minutes. The default is 2880 minutes (48 hours) for glueetl and pythonshell jobs, and null (unlimited) for gluestreaming jobs.

workerType string

The type of predefined worker that is allocated when a job runs. Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs. Accepts the value Z.2X for Ray jobs.

For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker.
For the G.1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.2X worker type, each worker maps to 2 DPU (8 vCPU, 32 GB of memory, 128 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.4X worker type, each worker maps to 4 DPU (16 vCPUs, 64 GB of memory) with 256GB disk (approximately 235GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.8X worker type, each worker maps to 8 DPU (32 vCPUs, 128 GB of memory) with 512GB disk (approximately 487GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.025X worker type, each worker maps to 0.25 DPU (2 vCPU, 4GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for low volume streaming jobs. Only available for Glue version 3.0.
For the Z.2X worker type, each worker maps to 2 M-DPU (8 vCPU, 64 GB of memory, 128 GB disk), and provides up to 8 Ray workers based on the autoscaler.

arn str

Amazon Resource Name (ARN) of Glue Job

command JobCommandArgs

The command of the job. Defined below.

connections Sequence[str]

The list of connections used for this job.

default_arguments Mapping[str, str]

description str

Description of the job.

execution_class str

execution_property JobExecutionPropertyArgs

Execution property of the job. Defined below.

glue_version str

The version of glue to use, for example "1.0". Ray jobs should set this to 4.0 or greater. For information about available versions, see the AWS Glue Release Notes.

job_run_queuing_enabled bool

maintenance_window str

Specifies the day of the week and hour for the maintenance window for streaming jobs.

max_capacity float

max_retries int

The maximum number of times to retry this job if it fails.

name str

The name you assign to this job. It must be unique in your account.

non_overridable_arguments Mapping[str, str]

Non-overridable arguments for this job, specified as name-value pairs.

notification_property JobNotificationPropertyArgs

Notification property of the job. Defined below.

number_of_workers int

The number of workers of a defined workerType that are allocated when a job runs.

role_arn str

The ARN of the IAM role associated with this job.

security_configuration str

The name of the Security Configuration to be associated with the job.

source_control_details JobSourceControlDetailsArgs

The details for a source control configuration for a job, allowing synchronization of job artifacts to or from a remote repository. Defined below.

tags Mapping[str, str]

Key-value map of resource tags. If configured with a provider default_tags configuration block present, tags with matching keys will overwrite those defined at the provider-level.

tags_all Mapping[str, str]

A map of tags assigned to the resource, including those inherited from the provider default_tags configuration block.

Deprecated: Please use tags instead.

timeout int

The job timeout in minutes. The default is 2880 minutes (48 hours) for glueetl and pythonshell jobs, and null (unlimited) for gluestreaming jobs.

worker_type str

The type of predefined worker that is allocated when a job runs. Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs. Accepts the value Z.2X for Ray jobs.

For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker.
For the G.1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.2X worker type, each worker maps to 2 DPU (8 vCPU, 32 GB of memory, 128 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.4X worker type, each worker maps to 4 DPU (16 vCPUs, 64 GB of memory) with 256GB disk (approximately 235GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.8X worker type, each worker maps to 8 DPU (32 vCPUs, 128 GB of memory) with 512GB disk (approximately 487GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.025X worker type, each worker maps to 0.25 DPU (2 vCPU, 4GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for low volume streaming jobs. Only available for Glue version 3.0.
For the Z.2X worker type, each worker maps to 2 M-DPU (8 vCPU, 64 GB of memory, 128 GB disk), and provides up to 8 Ray workers based on the autoscaler.

arn String

Amazon Resource Name (ARN) of Glue Job

command Property Map

The command of the job. Defined below.

connections List<String>

The list of connections used for this job.

defaultArguments Map<String>

description String

Description of the job.

executionClass String

executionProperty Property Map

Execution property of the job. Defined below.

glueVersion String

The version of glue to use, for example "1.0". Ray jobs should set this to 4.0 or greater. For information about available versions, see the AWS Glue Release Notes.

jobRunQueuingEnabled Boolean

maintenanceWindow String

Specifies the day of the week and hour for the maintenance window for streaming jobs.

maxCapacity Number

maxRetries Number

The maximum number of times to retry this job if it fails.

name String

The name you assign to this job. It must be unique in your account.

nonOverridableArguments Map<String>

Non-overridable arguments for this job, specified as name-value pairs.

notificationProperty Property Map

Notification property of the job. Defined below.

numberOfWorkers Number

The number of workers of a defined workerType that are allocated when a job runs.

roleArn String

The ARN of the IAM role associated with this job.

securityConfiguration String

The name of the Security Configuration to be associated with the job.

sourceControlDetails Property Map

The details for a source control configuration for a job, allowing synchronization of job artifacts to or from a remote repository. Defined below.

tags Map<String>

Key-value map of resource tags. If configured with a provider default_tags configuration block present, tags with matching keys will overwrite those defined at the provider-level.

tagsAll Map<String>

A map of tags assigned to the resource, including those inherited from the provider default_tags configuration block.

Deprecated: Please use tags instead.

timeout Number

The job timeout in minutes. The default is 2880 minutes (48 hours) for glueetl and pythonshell jobs, and null (unlimited) for gluestreaming jobs.

workerType String

The type of predefined worker that is allocated when a job runs. Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs. Accepts the value Z.2X for Ray jobs.

For the Standard worker type, each worker provides 4 vCPU, 16 GB of memory and a 50GB disk, and 2 executors per worker.
For the G.1X worker type, each worker maps to 1 DPU (4 vCPU, 16 GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.2X worker type, each worker maps to 2 DPU (8 vCPU, 32 GB of memory, 128 GB disk), and provides 1 executor per worker. Recommended for memory-intensive jobs.
For the G.4X worker type, each worker maps to 4 DPU (16 vCPUs, 64 GB of memory) with 256GB disk (approximately 235GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.8X worker type, each worker maps to 8 DPU (32 vCPUs, 128 GB of memory) with 512GB disk (approximately 487GB free), and provides 1 executor per worker. Recommended for memory-intensive jobs. Only available for Glue version 3.0. Available AWS Regions: US East (Ohio), US East (N. Virginia), US West (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe (Ireland), and Europe (Stockholm).
For the G.025X worker type, each worker maps to 0.25 DPU (2 vCPU, 4GB of memory, 64 GB disk), and provides 1 executor per worker. Recommended for low volume streaming jobs. Only available for Glue version 3.0.
For the Z.2X worker type, each worker maps to 2 M-DPU (8 vCPU, 64 GB of memory, 128 GB disk), and provides up to 8 Ray workers based on the autoscaler.

Supporting Types

JobCommand, JobCommandArgs

ScriptLocation string: Specifies the S3 path to a script that executes a job.
Name string: The name of the job command. Defaults to glueetl. Use pythonshell for Python Shell Job Type, glueray for Ray Job Type, or gluestreaming for Streaming Job Type. max_capacity needs to be set if pythonshell is chosen.
PythonVersion string: The Python version being used to execute a Python shell job. Allowed values are 2, 3 or 3.9. Version 3 refers to Python 3.11 when glue_version is set to 5.0.
Runtime string: In Ray jobs, runtime is used to specify the versions of Ray, Python and additional libraries available in your environment. This field is not used in other job types. For supported runtime environment values, see Working with Ray jobs in the Glue Developer Guide.

ScriptLocation string: Specifies the S3 path to a script that executes a job.
Name string: The name of the job command. Defaults to glueetl. Use pythonshell for Python Shell Job Type, glueray for Ray Job Type, or gluestreaming for Streaming Job Type. max_capacity needs to be set if pythonshell is chosen.
PythonVersion string: The Python version being used to execute a Python shell job. Allowed values are 2, 3 or 3.9. Version 3 refers to Python 3.11 when glue_version is set to 5.0.
Runtime string: In Ray jobs, runtime is used to specify the versions of Ray, Python and additional libraries available in your environment. This field is not used in other job types. For supported runtime environment values, see Working with Ray jobs in the Glue Developer Guide.

scriptLocation String: Specifies the S3 path to a script that executes a job.
name String: The name of the job command. Defaults to glueetl. Use pythonshell for Python Shell Job Type, glueray for Ray Job Type, or gluestreaming for Streaming Job Type. max_capacity needs to be set if pythonshell is chosen.
pythonVersion String: The Python version being used to execute a Python shell job. Allowed values are 2, 3 or 3.9. Version 3 refers to Python 3.11 when glue_version is set to 5.0.
runtime String: In Ray jobs, runtime is used to specify the versions of Ray, Python and additional libraries available in your environment. This field is not used in other job types. For supported runtime environment values, see Working with Ray jobs in the Glue Developer Guide.

scriptLocation string: Specifies the S3 path to a script that executes a job.
name string: The name of the job command. Defaults to glueetl. Use pythonshell for Python Shell Job Type, glueray for Ray Job Type, or gluestreaming for Streaming Job Type. max_capacity needs to be set if pythonshell is chosen.
pythonVersion string: The Python version being used to execute a Python shell job. Allowed values are 2, 3 or 3.9. Version 3 refers to Python 3.11 when glue_version is set to 5.0.
runtime string: In Ray jobs, runtime is used to specify the versions of Ray, Python and additional libraries available in your environment. This field is not used in other job types. For supported runtime environment values, see Working with Ray jobs in the Glue Developer Guide.

script_location str: Specifies the S3 path to a script that executes a job.
name str: The name of the job command. Defaults to glueetl. Use pythonshell for Python Shell Job Type, glueray for Ray Job Type, or gluestreaming for Streaming Job Type. max_capacity needs to be set if pythonshell is chosen.
python_version str: The Python version being used to execute a Python shell job. Allowed values are 2, 3 or 3.9. Version 3 refers to Python 3.11 when glue_version is set to 5.0.
runtime str: In Ray jobs, runtime is used to specify the versions of Ray, Python and additional libraries available in your environment. This field is not used in other job types. For supported runtime environment values, see Working with Ray jobs in the Glue Developer Guide.

scriptLocation String: Specifies the S3 path to a script that executes a job.
name String: The name of the job command. Defaults to glueetl. Use pythonshell for Python Shell Job Type, glueray for Ray Job Type, or gluestreaming for Streaming Job Type. max_capacity needs to be set if pythonshell is chosen.
pythonVersion String: The Python version being used to execute a Python shell job. Allowed values are 2, 3 or 3.9. Version 3 refers to Python 3.11 when glue_version is set to 5.0.
runtime String: In Ray jobs, runtime is used to specify the versions of Ray, Python and additional libraries available in your environment. This field is not used in other job types. For supported runtime environment values, see Working with Ray jobs in the Glue Developer Guide.

JobExecutionProperty, JobExecutionPropertyArgs

MaxConcurrentRuns int: The maximum number of concurrent runs allowed for a job. The default is 1.

MaxConcurrentRuns int: The maximum number of concurrent runs allowed for a job. The default is 1.

maxConcurrentRuns Integer: The maximum number of concurrent runs allowed for a job. The default is 1.

maxConcurrentRuns number: The maximum number of concurrent runs allowed for a job. The default is 1.

max_concurrent_runs int: The maximum number of concurrent runs allowed for a job. The default is 1.

maxConcurrentRuns Number: The maximum number of concurrent runs allowed for a job. The default is 1.

JobNotificationProperty, JobNotificationPropertyArgs

NotifyDelayAfter int: After a job run starts, the number of minutes to wait before sending a job run delay notification.

NotifyDelayAfter int: After a job run starts, the number of minutes to wait before sending a job run delay notification.

notifyDelayAfter Integer: After a job run starts, the number of minutes to wait before sending a job run delay notification.

notifyDelayAfter number: After a job run starts, the number of minutes to wait before sending a job run delay notification.

notify_delay_after int: After a job run starts, the number of minutes to wait before sending a job run delay notification.

notifyDelayAfter Number: After a job run starts, the number of minutes to wait before sending a job run delay notification.

JobSourceControlDetails, JobSourceControlDetailsArgs

AuthStrategy string: The type of authentication, which can be an authentication token stored in Amazon Web Services Secrets Manager, or a personal access token. Valid values are: PERSONAL_ACCESS_TOKEN and AWS_SECRETS_MANAGER.
AuthToken string: The value of an authorization token.
Branch string: A branch in the remote repository.
Folder string: A folder in the remote repository.
LastCommitId string: The last commit ID for a commit in the remote repository.
Owner string: The owner of the remote repository that contains the job artifacts.
Provider string: The provider for the remote repository. Valid values are: GITHUB, GITLAB, BITBUCKET, and AWS_CODE_COMMIT.
Repository string: The name of the remote repository that contains the job artifacts.

AuthStrategy string: The type of authentication, which can be an authentication token stored in Amazon Web Services Secrets Manager, or a personal access token. Valid values are: PERSONAL_ACCESS_TOKEN and AWS_SECRETS_MANAGER.
AuthToken string: The value of an authorization token.
Branch string: A branch in the remote repository.
Folder string: A folder in the remote repository.
LastCommitId string: The last commit ID for a commit in the remote repository.
Owner string: The owner of the remote repository that contains the job artifacts.
Provider string: The provider for the remote repository. Valid values are: GITHUB, GITLAB, BITBUCKET, and AWS_CODE_COMMIT.
Repository string: The name of the remote repository that contains the job artifacts.

authStrategy String: The type of authentication, which can be an authentication token stored in Amazon Web Services Secrets Manager, or a personal access token. Valid values are: PERSONAL_ACCESS_TOKEN and AWS_SECRETS_MANAGER.
authToken String: The value of an authorization token.
branch String: A branch in the remote repository.
folder String: A folder in the remote repository.
lastCommitId String: The last commit ID for a commit in the remote repository.
owner String: The owner of the remote repository that contains the job artifacts.
provider String: The provider for the remote repository. Valid values are: GITHUB, GITLAB, BITBUCKET, and AWS_CODE_COMMIT.
repository String: The name of the remote repository that contains the job artifacts.

authStrategy string: The type of authentication, which can be an authentication token stored in Amazon Web Services Secrets Manager, or a personal access token. Valid values are: PERSONAL_ACCESS_TOKEN and AWS_SECRETS_MANAGER.
authToken string: The value of an authorization token.
branch string: A branch in the remote repository.
folder string: A folder in the remote repository.
lastCommitId string: The last commit ID for a commit in the remote repository.
owner string: The owner of the remote repository that contains the job artifacts.
provider string: The provider for the remote repository. Valid values are: GITHUB, GITLAB, BITBUCKET, and AWS_CODE_COMMIT.
repository string: The name of the remote repository that contains the job artifacts.

auth_strategy str: The type of authentication, which can be an authentication token stored in Amazon Web Services Secrets Manager, or a personal access token. Valid values are: PERSONAL_ACCESS_TOKEN and AWS_SECRETS_MANAGER.
auth_token str: The value of an authorization token.
branch str: A branch in the remote repository.
folder str: A folder in the remote repository.
last_commit_id str: The last commit ID for a commit in the remote repository.
owner str: The owner of the remote repository that contains the job artifacts.
provider str: The provider for the remote repository. Valid values are: GITHUB, GITLAB, BITBUCKET, and AWS_CODE_COMMIT.
repository str: The name of the remote repository that contains the job artifacts.

authStrategy String: The type of authentication, which can be an authentication token stored in Amazon Web Services Secrets Manager, or a personal access token. Valid values are: PERSONAL_ACCESS_TOKEN and AWS_SECRETS_MANAGER.
authToken String: The value of an authorization token.
branch String: A branch in the remote repository.
folder String: A folder in the remote repository.
lastCommitId String: The last commit ID for a commit in the remote repository.
owner String: The owner of the remote repository that contains the job artifacts.
provider String: The provider for the remote repository. Valid values are: GITHUB, GITLAB, BITBUCKET, and AWS_CODE_COMMIT.
repository String: The name of the remote repository that contains the job artifacts.

Import

Using pulumi import, import Glue Jobs using name. For example:

$ pulumi import aws:glue/job:Job MyJob MyJob

To learn more about importing existing cloud resources, see Importing resources.

Package Details

Repository: AWS Classic pulumi/pulumi-aws
License: Apache-2.0
Notes: This Pulumi package is based on the aws Terraform Provider.

AWS v6.83.0 published on Monday, Jun 16, 2025 by Pulumi

pulumi/pulumi-aws

aws.glue.Job

On this page

On this page

Example Usage

Python Glue Job

Pythonshell Job

Ray Job

Scala Job

Streaming Job

Enabling CloudWatch Logs and Metrics

Create Job Resource

Constructor syntax

Parameters

Constructor example

Job Resource Properties

Inputs

Outputs

Look up Existing Job Resource

Supporting Types

JobCommand, JobCommandArgs

JobExecutionProperty, JobExecutionPropertyArgs

JobNotificationProperty, JobNotificationPropertyArgs

JobSourceControlDetails, JobSourceControlDetailsArgs

Import

Package Details

On this page

On this page