lib/aws-sdk-glue/client.rb in aws-sdk-glue-1.149.0 vs lib/aws-sdk-glue/client.rb in aws-sdk-glue-1.150.0
- old
+ new
@@ -824,10 +824,17 @@
# resp.crawlers[0].targets.iceberg_targets[0].paths[0] #=> String
# resp.crawlers[0].targets.iceberg_targets[0].connection_name #=> String
# resp.crawlers[0].targets.iceberg_targets[0].exclusions #=> Array
# resp.crawlers[0].targets.iceberg_targets[0].exclusions[0] #=> String
# resp.crawlers[0].targets.iceberg_targets[0].maximum_traversal_depth #=> Integer
+ # resp.crawlers[0].targets.hudi_targets #=> Array
+ # resp.crawlers[0].targets.hudi_targets[0].paths #=> Array
+ # resp.crawlers[0].targets.hudi_targets[0].paths[0] #=> String
+ # resp.crawlers[0].targets.hudi_targets[0].connection_name #=> String
+ # resp.crawlers[0].targets.hudi_targets[0].exclusions #=> Array
+ # resp.crawlers[0].targets.hudi_targets[0].exclusions[0] #=> String
+ # resp.crawlers[0].targets.hudi_targets[0].maximum_traversal_depth #=> Integer
# resp.crawlers[0].database_name #=> String
# resp.crawlers[0].description #=> String
# resp.crawlers[0].classifiers #=> Array
# resp.crawlers[0].classifiers[0] #=> String
# resp.crawlers[0].recrawl_policy.recrawl_behavior #=> String, one of "CRAWL_EVERYTHING", "CRAWL_NEW_FOLDERS_ONLY", "CRAWL_EVENT_MODE"
@@ -2793,10 +2800,18 @@
# connection_name: "ConnectionName",
# exclusions: ["Path"],
# maximum_traversal_depth: 1,
# },
# ],
+ # hudi_targets: [
+ # {
+ # paths: ["Path"],
+ # connection_name: "ConnectionName",
+ # exclusions: ["Path"],
+ # maximum_traversal_depth: 1,
+ # },
+ # ],
# },
# schedule: "CronExpression",
# classifiers: ["NameString"],
# table_prefix: "TablePrefix",
# schema_change_policy: {
@@ -3352,33 +3367,54 @@
# The number of workers of a defined `workerType` that are allocated
# when a job runs.
#
# @option params [String] :worker_type
# The type of predefined worker that is allocated when a job runs.
- # Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs.
+ # Accepts a value of G.1X, G.2X, G.4X, G.8X or G.025X for Spark jobs.
# Accepts the value Z.2X for Ray jobs.
#
- # * For the `Standard` worker type, each worker provides 4 vCPU, 16 GB
- # of memory and a 50GB disk, and 2 executors per worker.
+ # * For the `G.1X` worker type, each worker maps to 1 DPU (4 vCPUs, 16
+ # GB of memory) with 84GB disk (approximately 34GB free), and provides
+ # 1 executor per worker. We recommend this worker type for workloads
+ # such as data transforms, joins, and queries, as it offers a scalable
+ # and cost-effective way to run most jobs.
#
- # * For the `G.1X` worker type, each worker maps to 1 DPU (4 vCPU, 16 GB
- # of memory, 64 GB disk), and provides 1 executor per worker. We
- # recommend this worker type for memory-intensive jobs.
+ # * For the `G.2X` worker type, each worker maps to 2 DPU (8 vCPUs, 32
+ # GB of memory) with 128GB disk (approximately 77GB free), and
+ # provides 1 executor per worker. We recommend this worker type for
+ # workloads such as data transforms, joins, and queries, as it offers a
+ # scalable and cost-effective way to run most jobs.
#
- # * For the `G.2X` worker type, each worker maps to 2 DPU (8 vCPU, 32 GB
- # of memory, 128 GB disk), and provides 1 executor per worker. We
- # recommend this worker type for memory-intensive jobs.
+ # * For the `G.4X` worker type, each worker maps to 4 DPU (16 vCPUs, 64
+ # GB of memory) with 256GB disk (approximately 235GB free), and
+ # provides 1 executor per worker. We recommend this worker type for
+ # jobs whose workloads contain your most demanding transforms,
+ # aggregations, joins, and queries. This worker type is available only
+ # for Glue version 3.0 or later Spark ETL jobs in the following Amazon
+ # Web Services Regions: US East (Ohio), US East (N. Virginia), US West
+ # (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia
+ # Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe
+ # (Ireland), and Europe (Stockholm).
#
- # * For the `G.025X` worker type, each worker maps to 0.25 DPU (2 vCPU,
- # 4 GB of memory, 64 GB disk), and provides 1 executor per worker. We
- # recommend this worker type for low volume streaming jobs. This
- # worker type is only available for Glue version 3.0 streaming jobs.
+ # * For the `G.8X` worker type, each worker maps to 8 DPU (32 vCPUs, 128
+ # GB of memory) with 512GB disk (approximately 487GB free), and
+ # provides 1 executor per worker. We recommend this worker type for
+ # jobs whose workloads contain your most demanding transforms,
+ # aggregations, joins, and queries. This worker type is available only
+ # for Glue version 3.0 or later Spark ETL jobs, in the same Amazon Web
+ # Services Regions as supported for the `G.4X` worker type.
#
- # * For the `Z.2X` worker type, each worker maps to 2 M-DPU (8vCPU, 64
- # GB of m emory, 128 GB disk), and provides up to 8 Ray workers based
- # on the autoscaler.
+ # * For the `G.025X` worker type, each worker maps to 0.25 DPU (2 vCPUs,
+ # 4 GB of memory) with 84GB disk (approximately 34GB free), and
+ # provides 1 executor per worker. We recommend this worker type for
+ # low volume streaming jobs. This worker type is only available for
+ # Glue version 3.0 streaming jobs.
#
+ # * For the `Z.2X` worker type, each worker maps to 2 M-DPU (8 vCPUs, 64
+ # GB of memory) with 128 GB disk (approximately 120GB free), and
+ # provides up to 8 Ray workers based on the autoscaler.
+ #
# @option params [Hash<String,Types::CodeGenConfigurationNode>] :code_gen_configuration_nodes
# The representation of a directed acyclic graph on which both the Glue
# Studio visual component and Glue Studio code generation is based.
#
# @option params [String] :execution_class
@@ -4112,29 +4148,49 @@
# @option params [Integer] :number_of_workers
# The number of workers of a defined `WorkerType` to use for the
# session.
#
# @option params [String] :worker_type
- # The type of predefined worker that is allocated to use for the
- # session. Accepts a value of Standard, G.1X, G.2X, or G.025X.
+ # The type of predefined worker that is allocated when a job runs.
+ # Accepts a value of G.1X, G.2X, G.4X, or G.8X for Spark jobs. Accepts
+ # the value Z.2X for Ray notebooks.
#
- # * For the `Standard` worker type, each worker provides 4 vCPU, 16 GB
- # of memory and a 50GB disk, and 2 executors per worker.
+ # * For the `G.1X` worker type, each worker maps to 1 DPU (4 vCPUs, 16
+ # GB of memory) with 84GB disk (approximately 34GB free), and provides
+ # 1 executor per worker. We recommend this worker type for workloads
+ # such as data transforms, joins, and queries, as it offers a scalable
+ # and cost-effective way to run most jobs.
#
- # * For the `G.1X` worker type, each worker maps to 1 DPU (4 vCPU, 16 GB
- # of memory, 64 GB disk), and provides 1 executor per worker. We
- # recommend this worker type for memory-intensive jobs.
+ # * For the `G.2X` worker type, each worker maps to 2 DPU (8 vCPUs, 32
+ # GB of memory) with 128GB disk (approximately 77GB free), and
+ # provides 1 executor per worker. We recommend this worker type for
+ # workloads such as data transforms, joins, and queries, as it offers a
+ # scalable and cost-effective way to run most jobs.
#
- # * For the `G.2X` worker type, each worker maps to 2 DPU (8 vCPU, 32 GB
- # of memory, 128 GB disk), and provides 1 executor per worker. We
- # recommend this worker type for memory-intensive jobs.
+ # * For the `G.4X` worker type, each worker maps to 4 DPU (16 vCPUs, 64
+ # GB of memory) with 256GB disk (approximately 235GB free), and
+ # provides 1 executor per worker. We recommend this worker type for
+ # jobs whose workloads contain your most demanding transforms,
+ # aggregations, joins, and queries. This worker type is available only
+ # for Glue version 3.0 or later Spark ETL jobs in the following Amazon
+ # Web Services Regions: US East (Ohio), US East (N. Virginia), US West
+ # (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia
+ # Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe
+ # (Ireland), and Europe (Stockholm).
#
- # * For the `G.025X` worker type, each worker maps to 0.25 DPU (2 vCPU,
- # 4 GB of memory, 64 GB disk), and provides 1 executor per worker. We
- # recommend this worker type for low volume streaming jobs. This
- # worker type is only available for Glue version 3.0 streaming jobs.
+ # * For the `G.8X` worker type, each worker maps to 8 DPU (32 vCPUs, 128
+ # GB of memory) with 512GB disk (approximately 487GB free), and
+ # provides 1 executor per worker. We recommend this worker type for
+ # jobs whose workloads contain your most demanding transforms,
+ # aggregations, joins, and queries. This worker type is available only
+ # for Glue version 3.0 or later Spark ETL jobs, in the same Amazon Web
+ # Services Regions as supported for the `G.4X` worker type.
#
+ # * For the `Z.2X` worker type, each worker maps to 2 M-DPU (8 vCPUs, 64
+ # GB of memory) with 128 GB disk (approximately 120GB free), and
+ # provides up to 8 Ray workers based on the autoscaler.
+ #
# @option params [String] :security_configuration
# The name of the SecurityConfiguration structure to be used with the
# session
#
# @option params [String] :glue_version
@@ -6040,10 +6096,17 @@
# resp.crawler.targets.iceberg_targets[0].paths[0] #=> String
# resp.crawler.targets.iceberg_targets[0].connection_name #=> String
# resp.crawler.targets.iceberg_targets[0].exclusions #=> Array
# resp.crawler.targets.iceberg_targets[0].exclusions[0] #=> String
# resp.crawler.targets.iceberg_targets[0].maximum_traversal_depth #=> Integer
+ # resp.crawler.targets.hudi_targets #=> Array
+ # resp.crawler.targets.hudi_targets[0].paths #=> Array
+ # resp.crawler.targets.hudi_targets[0].paths[0] #=> String
+ # resp.crawler.targets.hudi_targets[0].connection_name #=> String
+ # resp.crawler.targets.hudi_targets[0].exclusions #=> Array
+ # resp.crawler.targets.hudi_targets[0].exclusions[0] #=> String
+ # resp.crawler.targets.hudi_targets[0].maximum_traversal_depth #=> Integer
# resp.crawler.database_name #=> String
# resp.crawler.description #=> String
# resp.crawler.classifiers #=> Array
# resp.crawler.classifiers[0] #=> String
# resp.crawler.recrawl_policy.recrawl_behavior #=> String, one of "CRAWL_EVERYTHING", "CRAWL_NEW_FOLDERS_ONLY", "CRAWL_EVENT_MODE"
@@ -6194,10 +6257,17 @@
# resp.crawlers[0].targets.iceberg_targets[0].paths[0] #=> String
# resp.crawlers[0].targets.iceberg_targets[0].connection_name #=> String
# resp.crawlers[0].targets.iceberg_targets[0].exclusions #=> Array
# resp.crawlers[0].targets.iceberg_targets[0].exclusions[0] #=> String
# resp.crawlers[0].targets.iceberg_targets[0].maximum_traversal_depth #=> Integer
+ # resp.crawlers[0].targets.hudi_targets #=> Array
+ # resp.crawlers[0].targets.hudi_targets[0].paths #=> Array
+ # resp.crawlers[0].targets.hudi_targets[0].paths[0] #=> String
+ # resp.crawlers[0].targets.hudi_targets[0].connection_name #=> String
+ # resp.crawlers[0].targets.hudi_targets[0].exclusions #=> Array
+ # resp.crawlers[0].targets.hudi_targets[0].exclusions[0] #=> String
+ # resp.crawlers[0].targets.hudi_targets[0].maximum_traversal_depth #=> Integer
# resp.crawlers[0].database_name #=> String
# resp.crawlers[0].description #=> String
# resp.crawlers[0].classifiers #=> Array
# resp.crawlers[0].classifiers[0] #=> String
# resp.crawlers[0].recrawl_policy.recrawl_behavior #=> String, one of "CRAWL_EVERYTHING", "CRAWL_NEW_FOLDERS_ONLY", "CRAWL_EVENT_MODE"
@@ -13929,33 +13999,54 @@
# @option params [Types::NotificationProperty] :notification_property
# Specifies configuration properties of a job run notification.
#
# @option params [String] :worker_type
# The type of predefined worker that is allocated when a job runs.
- # Accepts a value of Standard, G.1X, G.2X, or G.025X for Spark jobs.
+ # Accepts a value of G.1X, G.2X, G.4X, G.8X or G.025X for Spark jobs.
# Accepts the value Z.2X for Ray jobs.
#
- # * For the `Standard` worker type, each worker provides 4 vCPU, 16 GB
- # of memory and a 50GB disk, and 2 executors per worker.
+ # * For the `G.1X` worker type, each worker maps to 1 DPU (4 vCPUs, 16
+ # GB of memory) with 84GB disk (approximately 34GB free), and provides
+ # 1 executor per worker. We recommend this worker type for workloads
+ # such as data transforms, joins, and queries, as it offers a scalable
+ # and cost-effective way to run most jobs.
#
- # * For the `G.1X` worker type, each worker maps to 1 DPU (4 vCPU, 16 GB
- # of memory, 64 GB disk), and provides 1 executor per worker. We
- # recommend this worker type for memory-intensive jobs.
+ # * For the `G.2X` worker type, each worker maps to 2 DPU (8 vCPUs, 32
+ # GB of memory) with 128GB disk (approximately 77GB free), and
+ # provides 1 executor per worker. We recommend this worker type for
+ # workloads such as data transforms, joins, and queries, as it offers a
+ # scalable and cost-effective way to run most jobs.
#
- # * For the `G.2X` worker type, each worker maps to 2 DPU (8 vCPU, 32 GB
- # of memory, 128 GB disk), and provides 1 executor per worker. We
- # recommend this worker type for memory-intensive jobs.
+ # * For the `G.4X` worker type, each worker maps to 4 DPU (16 vCPUs, 64
+ # GB of memory) with 256GB disk (approximately 235GB free), and
+ # provides 1 executor per worker. We recommend this worker type for
+ # jobs whose workloads contain your most demanding transforms,
+ # aggregations, joins, and queries. This worker type is available only
+ # for Glue version 3.0 or later Spark ETL jobs in the following Amazon
+ # Web Services Regions: US East (Ohio), US East (N. Virginia), US West
+ # (Oregon), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia
+ # Pacific (Tokyo), Canada (Central), Europe (Frankfurt), Europe
+ # (Ireland), and Europe (Stockholm).
#
- # * For the `G.025X` worker type, each worker maps to 0.25 DPU (2 vCPU,
- # 4 GB of memory, 64 GB disk), and provides 1 executor per worker. We
- # recommend this worker type for low volume streaming jobs. This
- # worker type is only available for Glue version 3.0 streaming jobs.
+ # * For the `G.8X` worker type, each worker maps to 8 DPU (32 vCPUs, 128
+ # GB of memory) with 512GB disk (approximately 487GB free), and
+ # provides 1 executor per worker. We recommend this worker type for
+ # jobs whose workloads contain your most demanding transforms,
+ # aggregations, joins, and queries. This worker type is available only
+ # for Glue version 3.0 or later Spark ETL jobs, in the same Amazon Web
+ # Services Regions as supported for the `G.4X` worker type.
#
- # * For the `Z.2X` worker type, each worker maps to 2 DPU (8vCPU, 64 GB
- # of m emory, 128 GB disk), and provides up to 8 Ray workers (one per
- # vCPU) based on the autoscaler.
+ # * For the `G.025X` worker type, each worker maps to 0.25 DPU (2 vCPUs,
+ # 4 GB of memory) with 84GB disk (approximately 34GB free), and
+ # provides 1 executor per worker. We recommend this worker type for
+ # low volume streaming jobs. This worker type is only available for
+ # Glue version 3.0 streaming jobs.
#
+ # * For the `Z.2X` worker type, each worker maps to 2 M-DPU (8 vCPUs, 64
+ # GB of memory) with 128 GB disk (approximately 120GB free), and
+ # provides up to 8 Ray workers based on the autoscaler.
+ #
# @option params [Integer] :number_of_workers
# The number of workers of a defined `workerType` that are allocated
# when a job runs.
#
# @option params [String] :execution_class
@@ -14896,10 +14987,18 @@
# connection_name: "ConnectionName",
# exclusions: ["Path"],
# maximum_traversal_depth: 1,
# },
# ],
+ # hudi_targets: [
+ # {
+ # paths: ["Path"],
+ # connection_name: "ConnectionName",
+ # exclusions: ["Path"],
+ # maximum_traversal_depth: 1,
+ # },
+ # ],
# },
# schedule: "CronExpression",
# classifiers: ["NameString"],
# table_prefix: "TablePrefix",
# schema_change_policy: {
@@ -15952,10 +16051,10 @@
operation: config.api.operation(operation_name),
client: self,
params: params,
config: config)
context[:gem_name] = 'aws-sdk-glue'
- context[:gem_version] = '1.149.0'
+ context[:gem_version] = '1.150.0'
Seahorse::Client::Request.new(handlers, context)
end
# @api private
# @deprecated