Namespace Pulumi.Aws.Glue

Classes

CatalogDatabase

Provides a Glue Catalog Database Resource. You can refer to the Glue Developer Guide for a full explanation of the Glue Data Catalog functionality.

Example Usage

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares a single Glue catalog database.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        // The first argument is the Pulumi resource name; Name is the catalog database name.
        var awsGlueCatalogDatabase = new Aws.Glue.CatalogDatabase("awsGlueCatalogDatabase", new Aws.Glue.CatalogDatabaseArgs
        {
            Name = "MyCatalogDatabase",
        });
    }
}

CatalogDatabaseArgs

CatalogDatabaseState

CatalogTable

Provides a Glue Catalog Table Resource. You can refer to the Glue Developer Guide for a full explanation of the Glue Data Catalog functionality.

Example Usage

Basic Table

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares a minimal Glue catalog table.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        // Only the owning database name and the table name are supplied.
        var awsGlueCatalogTable = new Aws.Glue.CatalogTable("awsGlueCatalogTable", new Aws.Glue.CatalogTableArgs
        {
            DatabaseName = "MyCatalogDatabase",
            Name = "MyCatalogTable",
        });
    }
}

Parquet Table for Athena

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>
/// Example stack that declares an external, Snappy-compressed Parquet table
/// whose data lives under an S3 prefix.
/// </summary>
class MyStack : Stack
{
    public MyStack()
    {
        var awsGlueCatalogTable = new Aws.Glue.CatalogTable("awsGlueCatalogTable", new Aws.Glue.CatalogTableArgs
        {
            DatabaseName = "MyCatalogDatabase",
            Name = "MyCatalogTable",
            Parameters =
            {
                { "EXTERNAL", "TRUE" },
                { "parquet.compression", "SNAPPY" },
            },
            StorageDescriptor = new Aws.Glue.Inputs.CatalogTableStorageDescriptorArgs
            {
                // Column schema: name/type pairs, optionally with a comment.
                Columns =
                {
                    new Aws.Glue.Inputs.CatalogTableStorageDescriptorColumnArgs
                    {
                        Name = "my_string",
                        Type = "string",
                    },
                    new Aws.Glue.Inputs.CatalogTableStorageDescriptorColumnArgs
                    {
                        Name = "my_double",
                        Type = "double",
                    },
                    new Aws.Glue.Inputs.CatalogTableStorageDescriptorColumnArgs
                    {
                        Comment = "",
                        Name = "my_date",
                        Type = "date",
                    },
                    new Aws.Glue.Inputs.CatalogTableStorageDescriptorColumnArgs
                    {
                        Comment = "",
                        Name = "my_bigint",
                        Type = "bigint",
                    },
                    new Aws.Glue.Inputs.CatalogTableStorageDescriptorColumnArgs
                    {
                        Comment = "",
                        Name = "my_struct",
                        Type = "struct<my_nested_string:string>",
                    },
                },
                InputFormat = "org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat",
                Location = "s3://my-bucket/event-streams/my-stream",
                OutputFormat = "org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat",
                SerDeInfo = new Aws.Glue.Inputs.CatalogTableStorageDescriptorSerDeInfoArgs
                {
                    Name = "my-stream",
                    Parameters =
                    {
                        // Written as a string like the other parameter values in this example;
                        // presumably the map is string-valued — confirm against the Args type.
                        { "serialization.format", "1" },
                    },
                    SerializationLibrary = "org.apache.hadoop.hive.ql.io.parquet.serde.ParquetHiveSerDe",
                },
            },
            TableType = "EXTERNAL_TABLE",
        });
    }
}

CatalogTableArgs

CatalogTableState

Classifier

Provides a Glue Classifier resource.

NOTE: It is only valid to create one type of classifier (csv, grok, JSON, or XML). Changing classifier types will recreate the classifier.

Example Usage

Csv Classifier

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares a Glue classifier configured for CSV data.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        var example = new Aws.Glue.Classifier("example", new Aws.Glue.ClassifierArgs
        {
            CsvClassifier = new Aws.Glue.Inputs.ClassifierCsvClassifierArgs
            {
                AllowSingleColumn = false,
                ContainsHeader = "PRESENT",
                Delimiter = ",",
                DisableValueTrimming = false,
                Header =
                {
                    "example1",
                    "example2",
                },
                // A single-quote character is used as the quote symbol.
                QuoteSymbol = "'",
            },
        });
    }
}

Grok Classifier

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares a Glue classifier configured with a grok pattern.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        var example = new Aws.Glue.Classifier("example", new Aws.Glue.ClassifierArgs
        {
            GrokClassifier = new Aws.Glue.Inputs.ClassifierGrokClassifierArgs
            {
                Classification = "example",
                GrokPattern = "example",
            },
        });
    }
}

JSON Classifier

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares a Glue classifier configured with a JSON path.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        var example = new Aws.Glue.Classifier("example", new Aws.Glue.ClassifierArgs
        {
            JsonClassifier = new Aws.Glue.Inputs.ClassifierJsonClassifierArgs
            {
                JsonPath = "example",
            },
        });
    }
}

XML Classifier

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares a Glue classifier configured for XML data.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        var example = new Aws.Glue.Classifier("example", new Aws.Glue.ClassifierArgs
        {
            XmlClassifier = new Aws.Glue.Inputs.ClassifierXmlClassifierArgs
            {
                Classification = "example",
                RowTag = "example",
            },
        });
    }
}

ClassifierArgs

ClassifierState

Connection

Provides a Glue Connection resource.

Example Usage

Non-VPC Connection

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>
/// Example stack that declares a Glue connection from JDBC connection properties only,
/// with no physical (VPC) connection requirements.
/// </summary>
class MyStack : Stack
{
    public MyStack()
    {
        var example = new Aws.Glue.Connection("example", new Aws.Glue.ConnectionArgs
        {
            // Literal credentials are sample values for illustration only.
            ConnectionProperties =
            {
                { "JDBC_CONNECTION_URL", "jdbc:mysql://example.com/exampledatabase" },
                { "PASSWORD", "examplepassword" },
                { "USERNAME", "exampleusername" },
            },
        });
    }
}

VPC Connection

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>
/// Example stack that declares a Glue connection with physical connection
/// requirements (availability zone, security groups and subnet).
/// </summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): aws_rds_cluster, aws_subnet and aws_security_group are not declared
        // in this example; presumably they stand for resources defined elsewhere — confirm.
        var example = new Aws.Glue.Connection("example", new Aws.Glue.ConnectionArgs
        {
            ConnectionProperties =
            {
                { "JDBC_CONNECTION_URL", $"jdbc:mysql://{aws_rds_cluster.Example.Endpoint}/exampledatabase" },
                { "PASSWORD", "examplepassword" },
                { "USERNAME", "exampleusername" },
            },
            PhysicalConnectionRequirements = new Aws.Glue.Inputs.ConnectionPhysicalConnectionRequirementsArgs
            {
                AvailabilityZone = aws_subnet.Example.Availability_zone,
                SecurityGroupIdList =
                {
                    aws_security_group.Example.Id,
                },
                SubnetId = aws_subnet.Example.Id,
            },
        });
    }
}

ConnectionArgs

ConnectionState

Crawler

Manages a Glue Crawler. More information can be found in the AWS Glue Developer Guide.

Example Usage

DynamoDB Target

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares a Glue crawler with a DynamoDB target.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): aws_glue_catalog_database and aws_iam_role are not declared in this
        // example; presumably they stand for resources defined elsewhere — confirm.
        var example = new Aws.Glue.Crawler("example", new Aws.Glue.CrawlerArgs
        {
            DatabaseName = aws_glue_catalog_database.Example.Name,
            DynamodbTargets =
            {
                new Aws.Glue.Inputs.CrawlerDynamodbTargetArgs
                {
                    Path = "table-name",
                },
            },
            Role = aws_iam_role.Example.Arn,
        });
    }
}

JDBC Target

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares a Glue crawler with a JDBC target.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): aws_glue_catalog_database, aws_glue_connection and aws_iam_role are
        // not declared in this example; presumably resources defined elsewhere — confirm.
        var example = new Aws.Glue.Crawler("example", new Aws.Glue.CrawlerArgs
        {
            DatabaseName = aws_glue_catalog_database.Example.Name,
            JdbcTargets =
            {
                new Aws.Glue.Inputs.CrawlerJdbcTargetArgs
                {
                    ConnectionName = aws_glue_connection.Example.Name,
                    Path = "database-name/%",
                },
            },
            Role = aws_iam_role.Example.Arn,
        });
    }
}

S3 Target

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares a Glue crawler with an S3 target.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): aws_glue_catalog_database, aws_iam_role and aws_s3_bucket are not
        // declared in this example; presumably resources defined elsewhere — confirm.
        var example = new Aws.Glue.Crawler("example", new Aws.Glue.CrawlerArgs
        {
            DatabaseName = aws_glue_catalog_database.Example.Name,
            Role = aws_iam_role.Example.Arn,
            S3Targets =
            {
                new Aws.Glue.Inputs.CrawlerS3TargetArgs
                {
                    // The target path is built from the bucket name.
                    Path = $"s3://{aws_s3_bucket.Example.Bucket}",
                },
            },
        });
    }
}

Catalog Target

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>
/// Example stack that declares a Glue crawler with a catalog target, a JSON
/// configuration document and a schema change policy.
/// </summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): aws_glue_catalog_database, aws_glue_catalog_table and aws_iam_role are
        // not declared in this example; presumably resources defined elsewhere — confirm.
        var example = new Aws.Glue.Crawler("example", new Aws.Glue.CrawlerArgs
        {
            CatalogTargets =
            {
                new Aws.Glue.Inputs.CrawlerCatalogTargetArgs
                {
                    DatabaseName = aws_glue_catalog_database.Example.Name,
                    Tables =
                    {
                        aws_glue_catalog_table.Example.Name,
                    },
                },
            },
            // Verbatim string: doubled quotes are literal quotes, and the continuation
            // lines stay at column 0 so the JSON text itself is unchanged.
            Configuration = @"{
""Version"":1.0,
""Grouping"": {
""TableGroupingPolicy"": ""CombineCompatibleSchemas""
}
}

",
            DatabaseName = aws_glue_catalog_database.Example.Name,
            Role = aws_iam_role.Example.Arn,
            SchemaChangePolicy = new Aws.Glue.Inputs.CrawlerSchemaChangePolicyArgs
            {
                DeleteBehavior = "LOG",
            },
        });
    }
}

CrawlerArgs

CrawlerState

GetScript

GetScriptArgs

GetScriptResult

Job

Provides a Glue Job resource.

Glue functionality, such as monitoring and logging of jobs, is typically managed with the default_arguments argument. See the Special Parameters Used by AWS Glue topic in the Glue developer guide for additional information.

Example Usage

Python Job

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares a Glue job whose script is a Python file in S3.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): aws_s3_bucket and aws_iam_role are not declared in this example;
        // presumably they stand for resources defined elsewhere — confirm.
        var example = new Aws.Glue.Job("example", new Aws.Glue.JobArgs
        {
            Command = new Aws.Glue.Inputs.JobCommandArgs
            {
                ScriptLocation = $"s3://{aws_s3_bucket.Example.Bucket}/example.py",
            },
            RoleArn = aws_iam_role.Example.Arn,
        });
    }
}

Scala Job

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares a Glue job whose script is a Scala file in S3.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): aws_s3_bucket and aws_iam_role are not declared in this example;
        // presumably they stand for resources defined elsewhere — confirm.
        var example = new Aws.Glue.Job("example", new Aws.Glue.JobArgs
        {
            Command = new Aws.Glue.Inputs.JobCommandArgs
            {
                ScriptLocation = $"s3://{aws_s3_bucket.Example.Bucket}/example.scala",
            },
            // The job language is selected through a default argument.
            DefaultArguments =
            {
                { "--job-language", "scala" },
            },
            RoleArn = aws_iam_role.Example.Arn,
        });
    }
}

Enabling CloudWatch Logs and Metrics

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>
/// Example stack that declares a CloudWatch log group and a Glue job whose default
/// arguments point continuous logging at that group and enable metrics.
/// </summary>
class MyStack : Stack
{
    public MyStack()
    {
        var exampleLogGroup = new Aws.CloudWatch.LogGroup("exampleLogGroup", new Aws.CloudWatch.LogGroupArgs
        {
            RetentionInDays = 14,
        });

        // NOTE(review): no Command or RoleArn is set here, unlike the other Job examples;
        // presumably omitted for brevity — confirm before using as-is.
        var exampleJob = new Aws.Glue.Job("exampleJob", new Aws.Glue.JobArgs
        {
            DefaultArguments =
            {
                // The log group name comes from the resource declared above.
                { "--continuous-log-logGroup", exampleLogGroup.Name },
                { "--enable-continuous-cloudwatch-log", "true" },
                { "--enable-continuous-log-filter", "true" },
                { "--enable-metrics", "" },
            },
        });
    }
}

JobArgs

JobState

SecurityConfiguration

Manages a Glue Security Configuration.

Example Usage

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>
/// Example stack that declares a Glue security configuration with CloudWatch and
/// job-bookmark encryption disabled and S3 encryption set to SSE-KMS.
/// </summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): data.Aws_kms_key.Example is not declared in this example;
        // presumably it stands for a KMS key lookup defined elsewhere — confirm.
        var example = new Aws.Glue.SecurityConfiguration("example", new Aws.Glue.SecurityConfigurationArgs
        {
            EncryptionConfiguration = new Aws.Glue.Inputs.SecurityConfigurationEncryptionConfigurationArgs
            {
                CloudwatchEncryption = new Aws.Glue.Inputs.SecurityConfigurationEncryptionConfigurationCloudwatchEncryptionArgs
                {
                    CloudwatchEncryptionMode = "DISABLED",
                },
                JobBookmarksEncryption = new Aws.Glue.Inputs.SecurityConfigurationEncryptionConfigurationJobBookmarksEncryptionArgs
                {
                    JobBookmarksEncryptionMode = "DISABLED",
                },
                S3Encryption = new Aws.Glue.Inputs.SecurityConfigurationEncryptionConfigurationS3EncryptionArgs
                {
                    KmsKeyArn = data.Aws_kms_key.Example.Arn,
                    S3EncryptionMode = "SSE-KMS",
                },
            },
        });
    }
}

SecurityConfigurationArgs

SecurityConfigurationState

Trigger

Manages a Glue Trigger resource.

Example Usage

Conditional Trigger

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>
/// Example stack that declares a conditional Glue trigger: one job is the action,
/// and another job reaching the SUCCEEDED state is the condition.
/// </summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): aws_glue_job is not declared in this example; presumably it
        // stands for job resources defined elsewhere — confirm.
        var example = new Aws.Glue.Trigger("example", new Aws.Glue.TriggerArgs
        {
            Actions =
            {
                new Aws.Glue.Inputs.TriggerActionArgs
                {
                    JobName = aws_glue_job.Example1.Name,
                },
            },
            Predicate = new Aws.Glue.Inputs.TriggerPredicateArgs
            {
                Conditions =
                {
                    new Aws.Glue.Inputs.TriggerPredicateConditionArgs
                    {
                        JobName = aws_glue_job.Example2.Name,
                        State = "SUCCEEDED",
                    },
                },
            },
            Type = "CONDITIONAL",
        });
    }
}

On-Demand Trigger

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares an on-demand Glue trigger with one job action.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): aws_glue_job is not declared in this example; presumably it
        // stands for a job resource defined elsewhere — confirm.
        var example = new Aws.Glue.Trigger("example", new Aws.Glue.TriggerArgs
        {
            Actions =
            {
                new Aws.Glue.Inputs.TriggerActionArgs
                {
                    JobName = aws_glue_job.Example.Name,
                },
            },
            Type = "ON_DEMAND",
        });
    }
}

Scheduled Trigger

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>Example stack that declares a scheduled Glue trigger driven by a cron expression.</summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): aws_glue_job is not declared in this example; presumably it
        // stands for a job resource defined elsewhere — confirm.
        var example = new Aws.Glue.Trigger("example", new Aws.Glue.TriggerArgs
        {
            Actions =
            {
                new Aws.Glue.Inputs.TriggerActionArgs
                {
                    JobName = aws_glue_job.Example.Name,
                },
            },
            Schedule = "cron(15 12 * * ? *)",
            Type = "SCHEDULED",
        });
    }
}

Conditional Trigger with Crawler Action

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>
/// Example stack that declares a conditional Glue trigger whose action is a crawler
/// and whose condition is a job reaching the SUCCEEDED state.
/// </summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): aws_glue_crawler and aws_glue_job are not declared in this example;
        // presumably they stand for resources defined elsewhere — confirm.
        var example = new Aws.Glue.Trigger("example", new Aws.Glue.TriggerArgs
        {
            Actions =
            {
                new Aws.Glue.Inputs.TriggerActionArgs
                {
                    CrawlerName = aws_glue_crawler.Example1.Name,
                },
            },
            Predicate = new Aws.Glue.Inputs.TriggerPredicateArgs
            {
                Conditions =
                {
                    new Aws.Glue.Inputs.TriggerPredicateConditionArgs
                    {
                        JobName = aws_glue_job.Example2.Name,
                        State = "SUCCEEDED",
                    },
                },
            },
            Type = "CONDITIONAL",
        });
    }
}

Conditional Trigger with Crawler Condition

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>
/// Example stack that declares a conditional Glue trigger whose action is a job
/// and whose condition is a crawler reaching the SUCCEEDED crawl state.
/// </summary>
class MyStack : Stack
{
    public MyStack()
    {
        // NOTE(review): aws_glue_job and aws_glue_crawler are not declared in this example;
        // presumably they stand for resources defined elsewhere — confirm.
        var example = new Aws.Glue.Trigger("example", new Aws.Glue.TriggerArgs
        {
            Actions =
            {
                new Aws.Glue.Inputs.TriggerActionArgs
                {
                    JobName = aws_glue_job.Example1.Name,
                },
            },
            Predicate = new Aws.Glue.Inputs.TriggerPredicateArgs
            {
                Conditions =
                {
                    new Aws.Glue.Inputs.TriggerPredicateConditionArgs
                    {
                        CrawlState = "SUCCEEDED",
                        CrawlerName = aws_glue_crawler.Example2.Name,
                    },
                },
            },
            Type = "CONDITIONAL",
        });
    }
}

TriggerArgs

TriggerState

Workflow

Provides a Glue Workflow resource. The workflow graph (DAG) can be built using the aws.glue.Trigger resource. See the example below for creating a graph with four nodes (two triggers and two jobs).

Example Usage

using Pulumi;
using Aws = Pulumi.Aws;

/// <summary>
/// Example stack that declares a Glue workflow and two triggers attached to it:
/// an on-demand trigger that starts "example-job", and a conditional trigger that
/// starts "another-example-job" once "example-job" has succeeded.
/// </summary>
class MyStack : Stack
{
    public MyStack()
    {
        var example = new Aws.Glue.Workflow("example", new Aws.Glue.WorkflowArgs
        {
        });

        // Entry point of the workflow; the jobs are referenced by name only.
        var exampleStart = new Aws.Glue.Trigger("example-start", new Aws.Glue.TriggerArgs
        {
            Actions =
            {
                new Aws.Glue.Inputs.TriggerActionArgs
                {
                    JobName = "example-job",
                },
            },
            Type = "ON_DEMAND",
            WorkflowName = example.Name,
        });

        // Runs the second job after the first one reports SUCCEEDED.
        var exampleInner = new Aws.Glue.Trigger("example-inner", new Aws.Glue.TriggerArgs
        {
            Actions =
            {
                new Aws.Glue.Inputs.TriggerActionArgs
                {
                    JobName = "another-example-job",
                },
            },
            Predicate = new Aws.Glue.Inputs.TriggerPredicateArgs
            {
                Conditions =
                {
                    new Aws.Glue.Inputs.TriggerPredicateConditionArgs
                    {
                        JobName = "example-job",
                        State = "SUCCEEDED",
                    },
                },
            },
            Type = "CONDITIONAL",
            WorkflowName = example.Name,
        });
    }
}