aws-sdk-glue 1.86.0 → 1.90.0

Sign up to get free protection for your applications and to get access to all the features.
@@ -49,6 +49,7 @@ module Aws::Glue
49
49
  BatchGetTriggersResponse = Shapes::StructureShape.new(name: 'BatchGetTriggersResponse')
50
50
  BatchGetWorkflowsRequest = Shapes::StructureShape.new(name: 'BatchGetWorkflowsRequest')
51
51
  BatchGetWorkflowsResponse = Shapes::StructureShape.new(name: 'BatchGetWorkflowsResponse')
52
+ BatchSize = Shapes::IntegerShape.new(name: 'BatchSize')
52
53
  BatchStopJobRunError = Shapes::StructureShape.new(name: 'BatchStopJobRunError')
53
54
  BatchStopJobRunErrorList = Shapes::ListShape.new(name: 'BatchStopJobRunErrorList')
54
55
  BatchStopJobRunJobRunIdList = Shapes::ListShape.new(name: 'BatchStopJobRunJobRunIdList')
@@ -62,6 +63,7 @@ module Aws::Glue
62
63
  BatchUpdatePartitionRequestEntry = Shapes::StructureShape.new(name: 'BatchUpdatePartitionRequestEntry')
63
64
  BatchUpdatePartitionRequestEntryList = Shapes::ListShape.new(name: 'BatchUpdatePartitionRequestEntryList')
64
65
  BatchUpdatePartitionResponse = Shapes::StructureShape.new(name: 'BatchUpdatePartitionResponse')
66
+ BatchWindow = Shapes::IntegerShape.new(name: 'BatchWindow')
65
67
  BinaryColumnStatisticsData = Shapes::StructureShape.new(name: 'BinaryColumnStatisticsData')
66
68
  Blob = Shapes::BlobShape.new(name: 'Blob')
67
69
  Boolean = Shapes::BooleanShape.new(name: 'Boolean')
@@ -276,6 +278,7 @@ module Aws::Glue
276
278
  ErrorMessageString = Shapes::StringShape.new(name: 'ErrorMessageString')
277
279
  ErrorString = Shapes::StringShape.new(name: 'ErrorString')
278
280
  EvaluationMetrics = Shapes::StructureShape.new(name: 'EvaluationMetrics')
281
+ EventBatchingCondition = Shapes::StructureShape.new(name: 'EventBatchingCondition')
279
282
  ExecutionProperty = Shapes::StructureShape.new(name: 'ExecutionProperty')
280
283
  ExecutionTime = Shapes::IntegerShape.new(name: 'ExecutionTime')
281
284
  ExistCondition = Shapes::StringShape.new(name: 'ExistCondition')
@@ -653,6 +656,7 @@ module Aws::Glue
653
656
  StartTriggerResponse = Shapes::StructureShape.new(name: 'StartTriggerResponse')
654
657
  StartWorkflowRunRequest = Shapes::StructureShape.new(name: 'StartWorkflowRunRequest')
655
658
  StartWorkflowRunResponse = Shapes::StructureShape.new(name: 'StartWorkflowRunResponse')
659
+ StartingEventBatchCondition = Shapes::StructureShape.new(name: 'StartingEventBatchCondition')
656
660
  StopCrawlerRequest = Shapes::StructureShape.new(name: 'StopCrawlerRequest')
657
661
  StopCrawlerResponse = Shapes::StructureShape.new(name: 'StopCrawlerResponse')
658
662
  StopCrawlerScheduleRequest = Shapes::StructureShape.new(name: 'StopCrawlerScheduleRequest')
@@ -1423,6 +1427,7 @@ module Aws::Glue
1423
1427
  CreateTriggerRequest.add_member(:description, Shapes::ShapeRef.new(shape: DescriptionString, location_name: "Description"))
1424
1428
  CreateTriggerRequest.add_member(:start_on_creation, Shapes::ShapeRef.new(shape: BooleanValue, location_name: "StartOnCreation"))
1425
1429
  CreateTriggerRequest.add_member(:tags, Shapes::ShapeRef.new(shape: TagsMap, location_name: "Tags"))
1430
+ CreateTriggerRequest.add_member(:event_batching_condition, Shapes::ShapeRef.new(shape: EventBatchingCondition, location_name: "EventBatchingCondition"))
1426
1431
  CreateTriggerRequest.struct_class = Types::CreateTriggerRequest
1427
1432
 
1428
1433
  CreateTriggerResponse.add_member(:name, Shapes::ShapeRef.new(shape: NameString, location_name: "Name"))
@@ -1740,6 +1745,10 @@ module Aws::Glue
1740
1745
  EvaluationMetrics.add_member(:find_matches_metrics, Shapes::ShapeRef.new(shape: FindMatchesMetrics, location_name: "FindMatchesMetrics"))
1741
1746
  EvaluationMetrics.struct_class = Types::EvaluationMetrics
1742
1747
 
1748
+ EventBatchingCondition.add_member(:batch_size, Shapes::ShapeRef.new(shape: BatchSize, required: true, location_name: "BatchSize"))
1749
+ EventBatchingCondition.add_member(:batch_window, Shapes::ShapeRef.new(shape: BatchWindow, location_name: "BatchWindow"))
1750
+ EventBatchingCondition.struct_class = Types::EventBatchingCondition
1751
+
1743
1752
  ExecutionProperty.add_member(:max_concurrent_runs, Shapes::ShapeRef.new(shape: MaxConcurrentRuns, location_name: "MaxConcurrentRuns"))
1744
1753
  ExecutionProperty.struct_class = Types::ExecutionProperty
1745
1754
 
@@ -2842,6 +2851,7 @@ module Aws::Glue
2842
2851
  S3Target.add_member(:path, Shapes::ShapeRef.new(shape: Path, location_name: "Path"))
2843
2852
  S3Target.add_member(:exclusions, Shapes::ShapeRef.new(shape: PathList, location_name: "Exclusions"))
2844
2853
  S3Target.add_member(:connection_name, Shapes::ShapeRef.new(shape: ConnectionName, location_name: "ConnectionName"))
2854
+ S3Target.add_member(:sample_size, Shapes::ShapeRef.new(shape: NullableInteger, location_name: "SampleSize"))
2845
2855
  S3Target.struct_class = Types::S3Target
2846
2856
 
2847
2857
  S3TargetList.member = Shapes::ShapeRef.new(shape: S3Target)
@@ -3016,6 +3026,10 @@ module Aws::Glue
3016
3026
  StartWorkflowRunResponse.add_member(:run_id, Shapes::ShapeRef.new(shape: IdString, location_name: "RunId"))
3017
3027
  StartWorkflowRunResponse.struct_class = Types::StartWorkflowRunResponse
3018
3028
 
3029
+ StartingEventBatchCondition.add_member(:batch_size, Shapes::ShapeRef.new(shape: NullableInteger, location_name: "BatchSize"))
3030
+ StartingEventBatchCondition.add_member(:batch_window, Shapes::ShapeRef.new(shape: NullableInteger, location_name: "BatchWindow"))
3031
+ StartingEventBatchCondition.struct_class = Types::StartingEventBatchCondition
3032
+
3019
3033
  StopCrawlerRequest.add_member(:name, Shapes::ShapeRef.new(shape: NameString, required: true, location_name: "Name"))
3020
3034
  StopCrawlerRequest.struct_class = Types::StopCrawlerRequest
3021
3035
 
@@ -3201,6 +3215,7 @@ module Aws::Glue
3201
3215
  Trigger.add_member(:schedule, Shapes::ShapeRef.new(shape: GenericString, location_name: "Schedule"))
3202
3216
  Trigger.add_member(:actions, Shapes::ShapeRef.new(shape: ActionList, location_name: "Actions"))
3203
3217
  Trigger.add_member(:predicate, Shapes::ShapeRef.new(shape: Predicate, location_name: "Predicate"))
3218
+ Trigger.add_member(:event_batching_condition, Shapes::ShapeRef.new(shape: EventBatchingCondition, location_name: "EventBatchingCondition"))
3204
3219
  Trigger.struct_class = Types::Trigger
3205
3220
 
3206
3221
  TriggerList.member = Shapes::ShapeRef.new(shape: Trigger)
@@ -3215,6 +3230,7 @@ module Aws::Glue
3215
3230
  TriggerUpdate.add_member(:schedule, Shapes::ShapeRef.new(shape: GenericString, location_name: "Schedule"))
3216
3231
  TriggerUpdate.add_member(:actions, Shapes::ShapeRef.new(shape: ActionList, location_name: "Actions"))
3217
3232
  TriggerUpdate.add_member(:predicate, Shapes::ShapeRef.new(shape: Predicate, location_name: "Predicate"))
3233
+ TriggerUpdate.add_member(:event_batching_condition, Shapes::ShapeRef.new(shape: EventBatchingCondition, location_name: "EventBatchingCondition"))
3218
3234
  TriggerUpdate.struct_class = Types::TriggerUpdate
3219
3235
 
3220
3236
  UntagResourceRequest.add_member(:resource_arn, Shapes::ShapeRef.new(shape: GlueResourceArn, required: true, location_name: "ResourceArn"))
@@ -3461,6 +3477,7 @@ module Aws::Glue
3461
3477
  WorkflowRun.add_member(:error_message, Shapes::ShapeRef.new(shape: ErrorString, location_name: "ErrorMessage"))
3462
3478
  WorkflowRun.add_member(:statistics, Shapes::ShapeRef.new(shape: WorkflowRunStatistics, location_name: "Statistics"))
3463
3479
  WorkflowRun.add_member(:graph, Shapes::ShapeRef.new(shape: WorkflowGraph, location_name: "Graph"))
3480
+ WorkflowRun.add_member(:starting_event_batch_condition, Shapes::ShapeRef.new(shape: StartingEventBatchCondition, location_name: "StartingEventBatchCondition"))
3464
3481
  WorkflowRun.struct_class = Types::WorkflowRun
3465
3482
 
3466
3483
  WorkflowRunProperties.key = Shapes::ShapeRef.new(shape: IdString)
@@ -43,7 +43,7 @@ module Aws::Glue
43
43
  # }
44
44
  #
45
45
  # @!attribute [rw] job_name
46
- # The name of a job to be executed.
46
+ # The name of a job to be run.
47
47
  # @return [String]
48
48
  #
49
49
  # @!attribute [rw] arguments
@@ -51,15 +51,15 @@ module Aws::Glue
51
51
  # they replace the default arguments set in the job definition itself.
52
52
  #
53
53
  # You can specify arguments here that your own job-execution script
54
- # consumes, as well as arguments that AWS Glue itself consumes.
54
+ # consumes, as well as arguments that Glue itself consumes.
55
55
  #
56
56
  # For information about how to specify and consume your own Job
57
- # arguments, see the [Calling AWS Glue APIs in Python][1] topic in the
57
+ # arguments, see the [Calling Glue APIs in Python][1] topic in the
58
58
  # developer guide.
59
59
  #
60
- # For information about the key-value pairs that AWS Glue consumes to
61
- # set up your job, see the [Special Parameters Used by AWS Glue][2]
62
- # topic in the developer guide.
60
+ # For information about the key-value pairs that Glue consumes to set
61
+ # up your job, see the [Special Parameters Used by Glue][2] topic in
62
+ # the developer guide.
63
63
  #
64
64
  #
65
65
  #
@@ -225,7 +225,7 @@ module Aws::Glue
225
225
  #
226
226
  # @!attribute [rw] catalog_id
227
227
  # The ID of the catalog in which the partition is to be created.
228
- # Currently, this should be the AWS account ID.
228
+ # Currently, this should be the Amazon Web Services account ID.
229
229
  # @return [String]
230
230
  #
231
231
  # @!attribute [rw] database_name
@@ -277,7 +277,7 @@ module Aws::Glue
277
277
  #
278
278
  # @!attribute [rw] catalog_id
279
279
  # The ID of the Data Catalog in which the connections reside. If none
280
- # is provided, the AWS account ID is used by default.
280
+ # is provided, the Amazon Web Services account ID is used by default.
281
281
  # @return [String]
282
282
  #
283
283
  # @!attribute [rw] connection_name_list
@@ -328,7 +328,8 @@ module Aws::Glue
328
328
  #
329
329
  # @!attribute [rw] catalog_id
330
330
  # The ID of the Data Catalog where the partition to be deleted
331
- # resides. If none is provided, the AWS account ID is used by default.
331
+ # resides. If none is provided, the Amazon Web Services account ID is
332
+ # used by default.
332
333
  # @return [String]
333
334
  #
334
335
  # @!attribute [rw] database_name
@@ -380,7 +381,7 @@ module Aws::Glue
380
381
  #
381
382
  # @!attribute [rw] catalog_id
382
383
  # The ID of the Data Catalog where the table resides. If none is
383
- # provided, the AWS account ID is used by default.
384
+ # provided, the Amazon Web Services account ID is used by default.
384
385
  # @return [String]
385
386
  #
386
387
  # @!attribute [rw] database_name
@@ -427,7 +428,7 @@ module Aws::Glue
427
428
  #
428
429
  # @!attribute [rw] catalog_id
429
430
  # The ID of the Data Catalog where the tables reside. If none is
430
- # provided, the AWS account ID is used by default.
431
+ # provided, the Amazon Web Services account ID is used by default.
431
432
  # @return [String]
432
433
  #
433
434
  # @!attribute [rw] database_name
@@ -597,7 +598,8 @@ module Aws::Glue
597
598
  #
598
599
  # @!attribute [rw] catalog_id
599
600
  # The ID of the Data Catalog where the partitions in question reside.
600
- # If none is supplied, the AWS account ID is used by default.
601
+ # If none is supplied, the Amazon Web Services account ID is used by
602
+ # default.
601
603
  # @return [String]
602
604
  #
603
605
  # @!attribute [rw] database_name
@@ -906,7 +908,7 @@ module Aws::Glue
906
908
  #
907
909
  # @!attribute [rw] catalog_id
908
910
  # The ID of the catalog in which the partition is to be updated.
909
- # Currently, this should be the AWS account ID.
911
+ # Currently, this should be the Amazon Web Services account ID.
910
912
  # @return [String]
911
913
  #
912
914
  # @!attribute [rw] database_name
@@ -1147,7 +1149,7 @@ module Aws::Glue
1147
1149
  include Aws::Structure
1148
1150
  end
1149
1151
 
1150
- # Specifies a table definition in the AWS Glue Data Catalog.
1152
+ # Specifies a table definition in the Glue Data Catalog.
1151
1153
  #
1152
1154
  # @note When making an API call, you may pass CatalogEntry
1153
1155
  # data as a hash:
@@ -1198,7 +1200,7 @@ module Aws::Glue
1198
1200
  include Aws::Structure
1199
1201
  end
1200
1202
 
1201
- # Specifies an AWS Glue Data Catalog target.
1203
+ # Specifies a Glue Data Catalog target.
1202
1204
  #
1203
1205
  # @note When making an API call, you may pass CatalogTarget
1204
1206
  # data as a hash:
@@ -1229,13 +1231,13 @@ module Aws::Glue
1229
1231
  # data as a hash:
1230
1232
  #
1231
1233
  # {
1232
- # data_format: "AVRO", # required, accepts AVRO
1234
+ # data_format: "AVRO", # required, accepts AVRO, JSON
1233
1235
  # schema_definition: "SchemaDefinitionString", # required
1234
1236
  # }
1235
1237
  #
1236
1238
  # @!attribute [rw] data_format
1237
- # The data format of the schema definition. Currently only `AVRO` is
1238
- # supported.
1239
+ # The data format of the schema definition. Currently `AVRO` and
1240
+ # `JSON` are supported.
1239
1241
  # @return [String]
1240
1242
  #
1241
1243
  # @!attribute [rw] schema_definition
@@ -1273,10 +1275,10 @@ module Aws::Glue
1273
1275
  # classifier creates a schema in the form of a `StructType` object that
1274
1276
  # matches that data format.
1275
1277
  #
1276
- # You can use the standard classifiers that AWS Glue provides, or you
1277
- # can write your own classifiers to best categorize your data sources
1278
- # and specify the appropriate schemas to use for them. A classifier can
1279
- # be a `grok` classifier, an `XML` classifier, a `JSON` classifier, or a
1278
+ # You can use the standard classifiers that Glue provides, or you can
1279
+ # write your own classifiers to best categorize your data sources and
1280
+ # specify the appropriate schemas to use for them. A classifier can be a
1281
+ # `grok` classifier, an `XML` classifier, a `JSON` classifier, or a
1280
1282
  # custom `CSV` classifier, as specified in one of the fields in the
1281
1283
  # `Classifier` object.
1282
1284
  #
@@ -1948,20 +1950,20 @@ module Aws::Glue
1948
1950
  # false.
1949
1951
  #
1950
1952
  # * `CUSTOM_JDBC_CERT` - An Amazon S3 location specifying the
1951
- # customer's root certificate. AWS Glue uses this root certificate
1952
- # to validate the customer’s certificate when connecting to the
1953
- # customer database. AWS Glue only handles X.509 certificates. The
1953
+ # customer's root certificate. Glue uses this root certificate to
1954
+ # validate the customer’s certificate when connecting to the
1955
+ # customer database. Glue only handles X.509 certificates. The
1954
1956
  # certificate provided must be DER-encoded and supplied in Base64
1955
1957
  # encoding PEM format.
1956
1958
  #
1957
1959
  # * `SKIP_CUSTOM_JDBC_CERT_VALIDATION` - By default, this is `false`.
1958
- # AWS Glue validates the Signature algorithm and Subject Public Key
1960
+ # Glue validates the Signature algorithm and Subject Public Key
1959
1961
  # Algorithm for the customer certificate. The only permitted
1960
1962
  # algorithms for the Signature algorithm are SHA256withRSA,
1961
1963
  # SHA384withRSA or SHA512withRSA. For the Subject Public Key
1962
1964
  # Algorithm, the key length must be at least 2048. You can set the
1963
- # value of this property to `true` to skip AWS Glue’s validation of
1964
- # the customer certificate.
1965
+ # value of this property to `true` to skip Glue’s validation of the
1966
+ # customer certificate.
1965
1967
  #
1966
1968
  # * `CUSTOM_JDBC_CERT_STRING` - A custom JDBC certificate string which
1967
1969
  # is used for domain match or distinguished name match to prevent a
@@ -1984,8 +1986,8 @@ module Aws::Glue
1984
1986
  # file (.pem format). The default is an empty string.
1985
1987
  #
1986
1988
  # * `KAFKA_SKIP_CUSTOM_CERT_VALIDATION` - Whether to skip the
1987
- # validation of the CA cert file or not. AWS Glue validates for
1988
- # three algorithms: SHA256withRSA, SHA384withRSA and SHA512withRSA.
1989
+ # validation of the CA cert file or not. Glue validates for three
1990
+ # algorithms: SHA256withRSA, SHA384withRSA and SHA512withRSA.
1989
1991
  # Default value is "false".
1990
1992
  #
1991
1993
  # * `SECRET_ID` - The secret ID used for the secret manager of
@@ -1999,6 +2001,24 @@ module Aws::Glue
1999
2001
  #
2000
2002
  # * `CONNECTOR_CLASS_NAME` - The connector class name for a
2001
2003
  # MARKETPLACE or CUSTOM connection.
2004
+ #
2005
+ # * `KAFKA_CLIENT_KEYSTORE` - The Amazon S3 location of the client
2006
+ # keystore file for Kafka client side authentication (Optional).
2007
+ #
2008
+ # * `KAFKA_CLIENT_KEYSTORE_PASSWORD` - The password to access the
2009
+ # provided keystore (Optional).
2010
+ #
2011
+ # * `KAFKA_CLIENT_KEY_PASSWORD` - A keystore can consist of multiple
2012
+ # keys, so this is the password to access the client key to be used
2013
+ # with the Kafka server side key (Optional).
2014
+ #
2015
+ # * `ENCRYPTED_KAFKA_CLIENT_KEYSTORE_PASSWORD` - The encrypted version
2016
+ # of the Kafka client keystore password (if the user has the Glue
2017
+ # encrypt passwords setting selected).
2018
+ #
2019
+ # * `ENCRYPTED_KAFKA_CLIENT_KEY_PASSWORD` - The encrypted version of
2020
+ # the Kafka client key password (if the user has the Glue encrypt
2021
+ # passwords setting selected).
2002
2022
  # @return [Hash<String,String>]
2003
2023
  #
2004
2024
  # @!attribute [rw] physical_connection_requirements
@@ -2080,12 +2100,12 @@ module Aws::Glue
2080
2100
  # within an Amazon Virtual Private Cloud environment (Amazon VPC).
2081
2101
  #
2082
2102
  # * `MARKETPLACE` - Uses configuration settings contained in a
2083
- # connector purchased from AWS Marketplace to read from and write to
2084
- # data stores that are not natively supported by AWS Glue.
2103
+ # connector purchased from Marketplace to read from and write to
2104
+ # data stores that are not natively supported by Glue.
2085
2105
  #
2086
2106
  # * `CUSTOM` - Uses configuration settings contained in a custom
2087
2107
  # connector to read from and write to data stores that are not
2088
- # natively supported by AWS Glue.
2108
+ # natively supported by Glue.
2089
2109
  #
2090
2110
  # SFTP is not supported.
2091
2111
  # @return [String]
@@ -2123,14 +2143,14 @@ module Aws::Glue
2123
2143
  # enable catalog encryption or only password encryption.
2124
2144
  #
2125
2145
  # When a `CreateConnection` request arrives containing a password, the
2126
- # Data Catalog first encrypts the password using your AWS KMS key. It
2127
- # then encrypts the whole connection object again if catalog encryption
2128
- # is also enabled.
2146
+ # Data Catalog first encrypts the password using your KMS key. It then
2147
+ # encrypts the whole connection object again if catalog encryption is
2148
+ # also enabled.
2129
2149
  #
2130
- # This encryption requires that you set AWS KMS key permissions to
2131
- # enable or restrict access on the password key according to your
2132
- # security requirements. For example, you might want only administrators
2133
- # to have decrypt permission on the password key.
2150
+ # This encryption requires that you set KMS key permissions to enable or
2151
+ # restrict access on the password key according to your security
2152
+ # requirements. For example, you might want only administrators to have
2153
+ # decrypt permission on the password key.
2134
2154
  #
2135
2155
  # @note When making an API call, you may pass ConnectionPasswordEncryption
2136
2156
  # data as a hash:
@@ -2148,11 +2168,11 @@ module Aws::Glue
2148
2168
  # @return [Boolean]
2149
2169
  #
2150
2170
  # @!attribute [rw] aws_kms_key_id
2151
- # An AWS KMS key that is used to encrypt the connection password.
2171
+ # A KMS key that is used to encrypt the connection password.
2152
2172
  #
2153
2173
  # If connection password protection is enabled, the caller of
2154
2174
  # `CreateConnection` and `UpdateConnection` needs at least
2155
- # `kms:Encrypt` permission on the specified AWS KMS key, to encrypt
2175
+ # `kms:Encrypt` permission on the specified KMS key, to encrypt
2156
2176
  # passwords before storing them in the Data Catalog.
2157
2177
  #
2158
2178
  # You can set the decrypt permission to enable or restrict access on
@@ -2230,8 +2250,7 @@ module Aws::Glue
2230
2250
 
2231
2251
  # Specifies a crawler program that examines a data source and uses
2232
2252
  # classifiers to try to determine its schema. If successful, the crawler
2233
- # records metadata concerning the data source in the AWS Glue Data
2234
- # Catalog.
2253
+ # records metadata concerning the data source in the Glue Data Catalog.
2235
2254
  #
2236
2255
  # @!attribute [rw] name
2237
2256
  # The name of the crawler.
@@ -2313,11 +2332,11 @@ module Aws::Glue
2313
2332
  # @!attribute [rw] configuration
2314
2333
  # Crawler configuration information. This versioned JSON string allows
2315
2334
  # users to specify aspects of a crawler's behavior. For more
2316
- # information, see [Configuring a Crawler][1].
2335
+ # information, see [Include and Exclude Patterns][1].
2317
2336
  #
2318
2337
  #
2319
2338
  #
2320
- # [1]: https://docs.aws.amazon.com/glue/latest/dg/crawler-configuration.html
2339
+ # [1]: https://docs.aws.amazon.com/glue/latest/dg/define-crawler.html#crawler-data-stores-exclude
2321
2340
  # @return [String]
2322
2341
  #
2323
2342
  # @!attribute [rw] crawler_security_configuration
@@ -2469,6 +2488,7 @@ module Aws::Glue
2469
2488
  # path: "Path",
2470
2489
  # exclusions: ["Path"],
2471
2490
  # connection_name: "ConnectionName",
2491
+ # sample_size: 1,
2472
2492
  # },
2473
2493
  # ],
2474
2494
  # jdbc_targets: [
@@ -2517,7 +2537,7 @@ module Aws::Glue
2517
2537
  # @return [Array<Types::DynamoDBTarget>]
2518
2538
  #
2519
2539
  # @!attribute [rw] catalog_targets
2520
- # Specifies AWS Glue Data Catalog targets.
2540
+ # Specifies Glue Data Catalog targets.
2521
2541
  # @return [Array<Types::CatalogTarget>]
2522
2542
  #
2523
2543
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/CrawlerTargets AWS API Documentation
@@ -2616,7 +2636,8 @@ module Aws::Glue
2616
2636
  #
2617
2637
  # @!attribute [rw] catalog_id
2618
2638
  # The ID of the Data Catalog in which to create the connection. If
2619
- # none is provided, the AWS account ID is used by default.
2639
+ # none is provided, the Amazon Web Services account ID is used by
2640
+ # default.
2620
2641
  # @return [String]
2621
2642
  #
2622
2643
  # @!attribute [rw] connection_input
@@ -2650,6 +2671,7 @@ module Aws::Glue
2650
2671
  # path: "Path",
2651
2672
  # exclusions: ["Path"],
2652
2673
  # connection_name: "ConnectionName",
2674
+ # sample_size: 1,
2653
2675
  # },
2654
2676
  # ],
2655
2677
  # jdbc_targets: [
@@ -2710,7 +2732,7 @@ module Aws::Glue
2710
2732
  # @return [String]
2711
2733
  #
2712
2734
  # @!attribute [rw] database_name
2713
- # The AWS Glue database where results are written, such as:
2735
+ # The Glue database where results are written, such as:
2714
2736
  # `arn:aws:daylight:us-east-1::database/sometable/*`.
2715
2737
  # @return [String]
2716
2738
  #
@@ -2773,8 +2795,8 @@ module Aws::Glue
2773
2795
  #
2774
2796
  # @!attribute [rw] tags
2775
2797
  # The tags to use with this crawler request. You may use tags to limit
2776
- # access to the crawler. For more information about tags in AWS Glue,
2777
- # see [AWS Tags in AWS Glue][1] in the developer guide.
2798
+ # access to the crawler. For more information about tags in Glue, see
2799
+ # [Amazon Web Services Tags in Glue][1] in the developer guide.
2778
2800
  #
2779
2801
  #
2780
2802
  #
@@ -2895,7 +2917,7 @@ module Aws::Glue
2895
2917
  #
2896
2918
  # @!attribute [rw] catalog_id
2897
2919
  # The ID of the Data Catalog in which to create the database. If none
2898
- # is provided, the AWS account ID is used by default.
2920
+ # is provided, the Amazon Web Services account ID is used by default.
2899
2921
  # @return [String]
2900
2922
  #
2901
2923
  # @!attribute [rw] database_input
@@ -2979,8 +3001,8 @@ module Aws::Glue
2979
3001
  # @return [Array<String>]
2980
3002
  #
2981
3003
  # @!attribute [rw] number_of_nodes
2982
- # The number of AWS Glue Data Processing Units (DPUs) to allocate to
2983
- # this `DevEndpoint`.
3004
+ # The number of Glue Data Processing Units (DPUs) to allocate to this
3005
+ # `DevEndpoint`.
2984
3006
  # @return [Integer]
2985
3007
  #
2986
3008
  # @!attribute [rw] worker_type
@@ -3005,10 +3027,10 @@ module Aws::Glue
3005
3027
  #
3006
3028
  # @!attribute [rw] glue_version
3007
3029
  # Glue version determines the versions of Apache Spark and Python that
3008
- # AWS Glue supports. The Python version indicates the version
3009
- # supported for running your ETL scripts on development endpoints.
3030
+ # Glue supports. The Python version indicates the version supported
3031
+ # for running your ETL scripts on development endpoints.
3010
3032
  #
3011
- # For more information about the available AWS Glue versions and
3033
+ # For more information about the available Glue versions and
3012
3034
  # corresponding Spark and Python versions, see [Glue version][1] in
3013
3035
  # the developer guide.
3014
3036
  #
@@ -3061,8 +3083,8 @@ module Aws::Glue
3061
3083
  #
3062
3084
  # @!attribute [rw] tags
3063
3085
  # The tags to use with this DevEndpoint. You may use tags to limit
3064
- # access to the DevEndpoint. For more information about tags in AWS
3065
- # Glue, see [AWS Tags in AWS Glue][1] in the developer guide.
3086
+ # access to the DevEndpoint. For more information about tags in Glue,
3087
+ # see [Amazon Web Services Tags in Glue][1] in the developer guide.
3066
3088
  #
3067
3089
  #
3068
3090
  #
@@ -3125,8 +3147,8 @@ module Aws::Glue
3125
3147
  # @return [Integer]
3126
3148
  #
3127
3149
  # @!attribute [rw] number_of_nodes
3128
- # The number of AWS Glue Data Processing Units (DPUs) allocated to
3129
- # this DevEndpoint.
3150
+ # The number of Glue Data Processing Units (DPUs) allocated to this
3151
+ # DevEndpoint.
3130
3152
  # @return [Integer]
3131
3153
  #
3132
3154
  # @!attribute [rw] worker_type
@@ -3136,8 +3158,16 @@ module Aws::Glue
3136
3158
  #
3137
3159
  # @!attribute [rw] glue_version
3138
3160
  # Glue version determines the versions of Apache Spark and Python that
3139
- # AWS Glue supports. The Python version indicates the version
3140
- # supported for running your ETL scripts on development endpoints.
3161
+ # Glue supports. The Python version indicates the version supported
3162
+ # for running your ETL scripts on development endpoints.
3163
+ #
3164
+ # For more information about the available Glue versions and
3165
+ # corresponding Spark and Python versions, see [Glue version][1] in
3166
+ # the developer guide.
3167
+ #
3168
+ #
3169
+ #
3170
+ # [1]: https://docs.aws.amazon.com/glue/latest/dg/add-job.html
3141
3171
  # @return [String]
3142
3172
  #
3143
3173
  # @!attribute [rw] number_of_workers
@@ -3184,9 +3214,7 @@ module Aws::Glue
3184
3214
  #
3185
3215
  # * `"--enable-glue-datacatalog": ""`
3186
3216
  #
3187
- # * `"GLUE_PYTHON_VERSION": "3"`
3188
- #
3189
- # * `"GLUE_PYTHON_VERSION": "2"`
3217
+ # ^
3190
3218
  #
3191
3219
  # You can specify a version of Python support for development
3192
3220
  # endpoints by using the `Arguments` parameter in the
@@ -3325,22 +3353,22 @@ module Aws::Glue
3325
3353
  # @return [Types::ExecutionProperty]
3326
3354
  #
3327
3355
  # @!attribute [rw] command
3328
- # The `JobCommand` that executes this job.
3356
+ # The `JobCommand` that runs this job.
3329
3357
  # @return [Types::JobCommand]
3330
3358
  #
3331
3359
  # @!attribute [rw] default_arguments
3332
3360
  # The default arguments for this job.
3333
3361
  #
3334
3362
  # You can specify arguments here that your own job-execution script
3335
- # consumes, as well as arguments that AWS Glue itself consumes.
3363
+ # consumes, as well as arguments that Glue itself consumes.
3336
3364
  #
3337
3365
  # For information about how to specify and consume your own Job
3338
- # arguments, see the [Calling AWS Glue APIs in Python][1] topic in the
3366
+ # arguments, see the [Calling Glue APIs in Python][1] topic in the
3339
3367
  # developer guide.
3340
3368
  #
3341
- # For information about the key-value pairs that AWS Glue consumes to
3342
- # set up your job, see the [Special Parameters Used by AWS Glue][2]
3343
- # topic in the developer guide.
3369
+ # For information about the key-value pairs that Glue consumes to set
3370
+ # up your job, see the [Special Parameters Used by Glue][2] topic in
3371
+ # the developer guide.
3344
3372
  #
3345
3373
  #
3346
3374
  #
@@ -3364,11 +3392,11 @@ module Aws::Glue
3364
3392
  # @!attribute [rw] allocated_capacity
3365
3393
  # This parameter is deprecated. Use `MaxCapacity` instead.
3366
3394
  #
3367
- # The number of AWS Glue data processing units (DPUs) to allocate to
3368
- # this Job. You can allocate from 2 to 100 DPUs; the default is 10. A
3369
- # DPU is a relative measure of processing power that consists of 4
3370
- # vCPUs of compute capacity and 16 GB of memory. For more information,
3371
- # see the [AWS Glue pricing page][1].
3395
+ # The number of Glue data processing units (DPUs) to allocate to this
3396
+ # Job. You can allocate from 2 to 100 DPUs; the default is 10. A DPU
3397
+ # is a relative measure of processing power that consists of 4 vCPUs
3398
+ # of compute capacity and 16 GB of memory. For more information, see
3399
+ # the [Glue pricing page][1].
3372
3400
  #
3373
3401
  #
3374
3402
  #
@@ -3382,11 +3410,11 @@ module Aws::Glue
3382
3410
  # @return [Integer]
3383
3411
  #
3384
3412
  # @!attribute [rw] max_capacity
3385
- # The number of AWS Glue data processing units (DPUs) that can be
3413
+ # For Glue version 1.0 or earlier jobs, using the standard worker
3414
+ # type, the number of Glue data processing units (DPUs) that can be
3386
3415
  # allocated when this job runs. A DPU is a relative measure of
3387
3416
  # processing power that consists of 4 vCPUs of compute capacity and 16
3388
- # GB of memory. For more information, see the [AWS Glue pricing
3389
- # page][1].
3417
+ # GB of memory. For more information, see the [Glue pricing page][1].
3390
3418
  #
3391
3419
  # Do not set `Max Capacity` if using `WorkerType` and
3392
3420
  # `NumberOfWorkers`.
@@ -3404,6 +3432,10 @@ module Aws::Glue
3404
3432
  # 100 DPUs. The default is 10 DPUs. This job type cannot have a
3405
3433
  # fractional DPU allocation.
3406
3434
  #
3435
+ # For Glue version 2.0 jobs, you cannot specify a `Maximum
3436
+ # capacity`. Instead, you should specify a `Worker type` and the
3437
+ # `Number of workers`.
3438
+ #
3407
3439
  #
3408
3440
  #
3409
3441
  # [1]: https://aws.amazon.com/glue/pricing/
@@ -3416,8 +3448,8 @@ module Aws::Glue
3416
3448
  #
3417
3449
  # @!attribute [rw] tags
3418
3450
  # The tags to use with this job. You may use tags to limit access to
3419
- # the job. For more information about tags in AWS Glue, see [AWS Tags
3420
- # in AWS Glue][1] in the developer guide.
3451
+ # the job. For more information about tags in Glue, see [Amazon Web
3452
+ # Services Tags in Glue][1] in the developer guide.
3421
3453
  #
3422
3454
  #
3423
3455
  #
@@ -3430,10 +3462,10 @@ module Aws::Glue
3430
3462
  #
3431
3463
  # @!attribute [rw] glue_version
3432
3464
  # Glue version determines the versions of Apache Spark and Python that
3433
- # AWS Glue supports. The Python version indicates the version
3434
- # supported for jobs of type Spark.
3465
+ # Glue supports. The Python version indicates the version supported
3466
+ # for jobs of type Spark.
3435
3467
  #
3436
- # For more information about the available AWS Glue versions and
3468
+ # For more information about the available Glue versions and
3437
3469
  # corresponding Spark and Python versions, see [Glue version][1] in
3438
3470
  # the developer guide.
3439
3471
  #
@@ -3523,7 +3555,7 @@ module Aws::Glue
3523
3555
  #
3524
3556
  # @!attribute [rw] json_path
3525
3557
  # A `JsonPath` string defining the JSON data for the classifier to
3526
- # classify. AWS Glue supports a subset of JsonPath, as described in
3558
+ # classify. Glue supports a subset of JsonPath, as described in
3527
3559
  # [Writing JsonPath Custom Classifiers][1].
3528
3560
  #
3529
3561
  #
@@ -3592,7 +3624,7 @@ module Aws::Glue
3592
3624
  # @return [String]
3593
3625
  #
3594
3626
  # @!attribute [rw] input_record_tables
3595
- # A list of AWS Glue table definitions used by the transform.
3627
+ # A list of Glue table definitions used by the transform.
3596
3628
  # @return [Array<Types::GlueTable>]
3597
3629
  #
3598
3630
  # @!attribute [rw] parameters
@@ -3602,13 +3634,13 @@ module Aws::Glue
3602
3634
  #
3603
3635
  # @!attribute [rw] role
3604
3636
  # The name or Amazon Resource Name (ARN) of the IAM role with the
3605
- # required permissions. The required permissions include both AWS Glue
3606
- # service role permissions to AWS Glue resources, and Amazon S3
3637
+ # required permissions. The required permissions include both Glue
3638
+ # service role permissions to Glue resources, and Amazon S3
3607
3639
  # permissions required by the transform.
3608
3640
  #
3609
- # * This role needs AWS Glue service role permissions to allow access
3610
- # to resources in AWS Glue. See [Attach a Policy to IAM Users That
3611
- # Access AWS Glue][1].
3641
+ # * This role needs Glue service role permissions to allow access to
3642
+ # resources in Glue. See [Attach a Policy to IAM Users That Access
3643
+ # Glue][1].
3612
3644
  #
3613
3645
  # * This role needs permission to your Amazon Simple Storage Service
3614
3646
  # (Amazon S3) sources, targets, temporary directory, scripts, and
@@ -3620,11 +3652,11 @@ module Aws::Glue
3620
3652
  # @return [String]
3621
3653
  #
3622
3654
  # @!attribute [rw] glue_version
3623
- # This value determines which version of AWS Glue this machine
3624
- # learning transform is compatible with. Glue 1.0 is recommended for
3625
- # most customers. If the value is not set, the Glue compatibility
3626
- # defaults to Glue 0.9. For more information, see [AWS Glue
3627
- # Versions][1] in the developer guide.
3655
+ # This value determines which version of Glue this machine learning
3656
+ # transform is compatible with. Glue 1.0 is recommended for most
3657
+ # customers. If the value is not set, the Glue compatibility defaults
3658
+ # to Glue 0.9. For more information, see [Glue Versions][1] in the
3659
+ # developer guide.
3628
3660
  #
3629
3661
  #
3630
3662
  #
@@ -3632,12 +3664,11 @@ module Aws::Glue
3632
3664
  # @return [String]
3633
3665
  #
3634
3666
  # @!attribute [rw] max_capacity
3635
- # The number of AWS Glue data processing units (DPUs) that are
3636
- # allocated to task runs for this transform. You can allocate from 2
3637
- # to 100 DPUs; the default is 10. A DPU is a relative measure of
3638
- # processing power that consists of 4 vCPUs of compute capacity and 16
3639
- # GB of memory. For more information, see the [AWS Glue pricing
3640
- # page][1].
3667
+ # The number of Glue data processing units (DPUs) that are allocated
3668
+ # to task runs for this transform. You can allocate from 2 to 100
3669
+ # DPUs; the default is 10. A DPU is a relative measure of processing
3670
+ # power that consists of 4 vCPUs of compute capacity and 16 GB of
3671
+ # memory. For more information, see the [Glue pricing page][1].
3641
3672
  #
3642
3673
  # `MaxCapacity` is a mutually exclusive option with `NumberOfWorkers`
3643
3674
  # and `WorkerType`.
@@ -3715,8 +3746,8 @@ module Aws::Glue
3715
3746
  # @!attribute [rw] tags
3716
3747
  # The tags to use with this machine learning transform. You may use
3717
3748
  # tags to limit access to the machine learning transform. For more
3718
- # information about tags in AWS Glue, see [AWS Tags in AWS Glue][1] in
3719
- # the developer guide.
3749
+ # information about tags in Glue, see [Amazon Web Services Tags in
3750
+ # Glue][1] in the developer guide.
3720
3751
  #
3721
3752
  #
3722
3753
  #
@@ -3877,8 +3908,8 @@ module Aws::Glue
3877
3908
  # }
3878
3909
  #
3879
3910
  # @!attribute [rw] catalog_id
3880
- # The AWS account ID of the catalog in which the partition is to be
3881
- # created.
3911
+ # The Amazon Web Services account ID of the catalog in which the
3912
+ # partition is to be created.
3882
3913
  # @return [String]
3883
3914
  #
3884
3915
  # @!attribute [rw] database_name
@@ -3933,8 +3964,8 @@ module Aws::Glue
3933
3964
  # @return [String]
3934
3965
  #
3935
3966
  # @!attribute [rw] tags
3936
- # AWS tags that contain a key value pair and may be searched by
3937
- # console, command line, or API.
3967
+ # Amazon Web Services tags that contain a key value pair and may be
3968
+ # searched by console, command line, or API.
3938
3969
  # @return [Hash<String,String>]
3939
3970
  #
3940
3971
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/CreateRegistryInput AWS API Documentation
@@ -3983,7 +4014,7 @@ module Aws::Glue
3983
4014
  # registry_arn: "GlueResourceArn",
3984
4015
  # },
3985
4016
  # schema_name: "SchemaRegistryNameString", # required
3986
- # data_format: "AVRO", # required, accepts AVRO
4017
+ # data_format: "AVRO", # required, accepts AVRO, JSON
3987
4018
  # compatibility: "NONE", # accepts NONE, DISABLED, BACKWARD, BACKWARD_ALL, FORWARD, FORWARD_ALL, FULL, FULL_ALL
3988
4019
  # description: "DescriptionString",
3989
4020
  # tags: {
@@ -4006,8 +4037,8 @@ module Aws::Glue
4006
4037
  # @return [String]
4007
4038
  #
4008
4039
  # @!attribute [rw] data_format
4009
- # The data format of the schema definition. Currently only `AVRO` is
4010
- # supported.
4040
+ # The data format of the schema definition. Currently `AVRO` and
4041
+ # `JSON` are supported.
4011
4042
  # @return [String]
4012
4043
  #
4013
4044
  # @!attribute [rw] compatibility
@@ -4065,9 +4096,9 @@ module Aws::Glue
4065
4096
  # @return [String]
4066
4097
  #
4067
4098
  # @!attribute [rw] tags
4068
- # AWS tags that contain a key value pair and may be searched by
4069
- # console, command line, or API. If specified, follows the AWS
4070
- # tags-on-create pattern.
4099
+ # Amazon Web Services tags that contain a key value pair and may be
4100
+ # searched by console, command line, or API. If specified, follows the
4101
+ # Amazon Web Services tags-on-create pattern.
4071
4102
  # @return [Hash<String,String>]
4072
4103
  #
4073
4104
  # @!attribute [rw] schema_definition
@@ -4110,8 +4141,8 @@ module Aws::Glue
4110
4141
  # @return [String]
4111
4142
  #
4112
4143
  # @!attribute [rw] data_format
4113
- # The data format of the schema definition. Currently only `AVRO` is
4114
- # supported.
4144
+ # The data format of the schema definition. Currently `AVRO` and
4145
+ # `JSON` are supported.
4115
4146
  # @return [String]
4116
4147
  #
4117
4148
  # @!attribute [rw] compatibility
@@ -4390,7 +4421,7 @@ module Aws::Glue
4390
4421
  #
4391
4422
  # @!attribute [rw] catalog_id
4392
4423
  # The ID of the Data Catalog in which to create the `Table`. If none
4393
- # is supplied, the AWS account ID is used by default.
4424
+ # is supplied, the Amazon Web Services account ID is used by default.
4394
4425
  # @return [String]
4395
4426
  #
4396
4427
  # @!attribute [rw] database_name
@@ -4429,7 +4460,7 @@ module Aws::Glue
4429
4460
  # {
4430
4461
  # name: "NameString", # required
4431
4462
  # workflow_name: "NameString",
4432
- # type: "SCHEDULED", # required, accepts SCHEDULED, CONDITIONAL, ON_DEMAND
4463
+ # type: "SCHEDULED", # required, accepts SCHEDULED, CONDITIONAL, ON_DEMAND, EVENT
4433
4464
  # schedule: "GenericString",
4434
4465
  # predicate: {
4435
4466
  # logical: "AND", # accepts AND, ANY
@@ -4462,6 +4493,10 @@ module Aws::Glue
4462
4493
  # tags: {
4463
4494
  # "TagKey" => "TagValue",
4464
4495
  # },
4496
+ # event_batching_condition: {
4497
+ # batch_size: 1, # required
4498
+ # batch_window: 1,
4499
+ # },
4465
4500
  # }
4466
4501
  #
4467
4502
  # @!attribute [rw] name
@@ -4509,14 +4544,20 @@ module Aws::Glue
4509
4544
  #
4510
4545
  # @!attribute [rw] tags
4511
4546
  # The tags to use with this trigger. You may use tags to limit access
4512
- # to the trigger. For more information about tags in AWS Glue, see
4513
- # [AWS Tags in AWS Glue][1] in the developer guide.
4547
+ # to the trigger. For more information about tags in Glue, see [Amazon
4548
+ # Web Services Tags in Glue][1] in the developer guide.
4514
4549
  #
4515
4550
  #
4516
4551
  #
4517
4552
  # [1]: https://docs.aws.amazon.com/glue/latest/dg/monitor-tags.html
4518
4553
  # @return [Hash<String,String>]
4519
4554
  #
4555
+ # @!attribute [rw] event_batching_condition
4556
+ # Batch condition that must be met (specified number of events
4557
+ # received or batch time window expired) before EventBridge event
4558
+ # trigger fires.
4559
+ # @return [Types::EventBatchingCondition]
4560
+ #
4520
4561
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/CreateTriggerRequest AWS API Documentation
4521
4562
  #
4522
4563
  class CreateTriggerRequest < Struct.new(
@@ -4528,7 +4569,8 @@ module Aws::Glue
4528
4569
  :actions,
4529
4570
  :description,
4530
4571
  :start_on_creation,
4531
- :tags)
4572
+ :tags,
4573
+ :event_batching_condition)
4532
4574
  SENSITIVE = []
4533
4575
  include Aws::Structure
4534
4576
  end
@@ -4567,7 +4609,7 @@ module Aws::Glue
4567
4609
  #
4568
4610
  # @!attribute [rw] catalog_id
4569
4611
  # The ID of the Data Catalog in which to create the function. If none
4570
- # is provided, the AWS account ID is used by default.
4612
+ # is provided, the Amazon Web Services account ID is used by default.
4571
4613
  # @return [String]
4572
4614
  #
4573
4615
  # @!attribute [rw] database_name
@@ -4796,7 +4838,7 @@ module Aws::Glue
4796
4838
  include Aws::Structure
4797
4839
  end
4798
4840
 
4799
- # The AWS Lake Formation principal.
4841
+ # The Lake Formation principal.
4800
4842
  #
4801
4843
  # @note When making an API call, you may pass DataLakePrincipal
4802
4844
  # data as a hash:
@@ -4806,7 +4848,7 @@ module Aws::Glue
4806
4848
  # }
4807
4849
  #
4808
4850
  # @!attribute [rw] data_lake_principal_identifier
4809
- # An identifier for the AWS Lake Formation principal.
4851
+ # An identifier for the Lake Formation principal.
4810
4852
  # @return [String]
4811
4853
  #
4812
4854
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/DataLakePrincipal AWS API Documentation
@@ -5115,7 +5157,8 @@ module Aws::Glue
5115
5157
  #
5116
5158
  # @!attribute [rw] catalog_id
5117
5159
  # The ID of the Data Catalog where the partitions in question reside.
5118
- # If none is supplied, the AWS account ID is used by default.
5160
+ # If none is supplied, the Amazon Web Services account ID is used by
5161
+ # default.
5119
5162
  # @return [String]
5120
5163
  #
5121
5164
  # @!attribute [rw] database_name
@@ -5162,7 +5205,8 @@ module Aws::Glue
5162
5205
  #
5163
5206
  # @!attribute [rw] catalog_id
5164
5207
  # The ID of the Data Catalog where the partitions in question reside.
5165
- # If none is supplied, the AWS account ID is used by default.
5208
+ # If none is supplied, the Amazon Web Services account ID is used by
5209
+ # default.
5166
5210
  # @return [String]
5167
5211
  #
5168
5212
  # @!attribute [rw] database_name
@@ -5202,7 +5246,7 @@ module Aws::Glue
5202
5246
  #
5203
5247
  # @!attribute [rw] catalog_id
5204
5248
  # The ID of the Data Catalog in which the connection resides. If none
5205
- # is provided, the AWS account ID is used by default.
5249
+ # is provided, the Amazon Web Services account ID is used by default.
5206
5250
  # @return [String]
5207
5251
  #
5208
5252
  # @!attribute [rw] connection_name
@@ -5255,7 +5299,7 @@ module Aws::Glue
5255
5299
  #
5256
5300
  # @!attribute [rw] catalog_id
5257
5301
  # The ID of the Data Catalog in which the database resides. If none is
5258
- # provided, the AWS account ID is used by default.
5302
+ # provided, the Amazon Web Services account ID is used by default.
5259
5303
  # @return [String]
5260
5304
  #
5261
5305
  # @!attribute [rw] name
@@ -5416,7 +5460,8 @@ module Aws::Glue
5416
5460
  #
5417
5461
  # @!attribute [rw] catalog_id
5418
5462
  # The ID of the Data Catalog where the partition to be deleted
5419
- # resides. If none is provided, the AWS account ID is used by default.
5463
+ # resides. If none is provided, the Amazon Web Services account ID is
5464
+ # used by default.
5420
5465
  # @return [String]
5421
5466
  #
5422
5467
  # @!attribute [rw] database_name
@@ -5506,8 +5551,7 @@ module Aws::Glue
5506
5551
  # @return [String]
5507
5552
  #
5508
5553
  # @!attribute [rw] resource_arn
5509
- # The ARN of the AWS Glue resource for the resource policy to be
5510
- # deleted.
5554
+ # The ARN of the Glue resource for the resource policy to be deleted.
5511
5555
  # @return [String]
5512
5556
  #
5513
5557
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/DeleteResourcePolicyRequest AWS API Documentation
@@ -5650,7 +5694,7 @@ module Aws::Glue
5650
5694
  #
5651
5695
  # @!attribute [rw] catalog_id
5652
5696
  # The ID of the Data Catalog where the table resides. If none is
5653
- # provided, the AWS account ID is used by default.
5697
+ # provided, the Amazon Web Services account ID is used by default.
5654
5698
  # @return [String]
5655
5699
  #
5656
5700
  # @!attribute [rw] database_name
@@ -5689,7 +5733,7 @@ module Aws::Glue
5689
5733
  #
5690
5734
  # @!attribute [rw] catalog_id
5691
5735
  # The ID of the Data Catalog where the tables reside. If none is
5692
- # provided, the AWS account ID is used by default.
5736
+ # provided, the Amazon Web Services account ID is used by default.
5693
5737
  # @return [String]
5694
5738
  #
5695
5739
  # @!attribute [rw] database_name
@@ -5764,7 +5808,8 @@ module Aws::Glue
5764
5808
  #
5765
5809
  # @!attribute [rw] catalog_id
5766
5810
  # The ID of the Data Catalog where the function to be deleted is
5767
- # located. If none is supplied, the AWS account ID is used by default.
5811
+ # located. If none is supplied, the Amazon Web Services account ID is
5812
+ # used by default.
5768
5813
  # @return [String]
5769
5814
  #
5770
5815
  # @!attribute [rw] database_name
@@ -5886,10 +5931,10 @@ module Aws::Glue
5886
5931
  #
5887
5932
  # @!attribute [rw] glue_version
5888
5933
  # Glue version determines the versions of Apache Spark and Python that
5889
- # AWS Glue supports. The Python version indicates the version
5890
- # supported for running your ETL scripts on development endpoints.
5934
+ # Glue supports. The Python version indicates the version supported
5935
+ # for running your ETL scripts on development endpoints.
5891
5936
  #
5892
- # For more information about the available AWS Glue versions and
5937
+ # For more information about the available Glue versions and
5893
5938
  # corresponding Spark and Python versions, see [Glue version][1] in
5894
5939
  # the developer guide.
5895
5940
  #
@@ -5915,8 +5960,8 @@ module Aws::Glue
5915
5960
  # @return [Integer]
5916
5961
  #
5917
5962
  # @!attribute [rw] number_of_nodes
5918
- # The number of AWS Glue Data Processing Units (DPUs) allocated to
5919
- # this `DevEndpoint`.
5963
+ # The number of Glue Data Processing Units (DPUs) allocated to this
5964
+ # `DevEndpoint`.
5920
5965
  # @return [Integer]
5921
5966
  #
5922
5967
  # @!attribute [rw] availability_zone
@@ -6002,9 +6047,7 @@ module Aws::Glue
6002
6047
  #
6003
6048
  # * `"--enable-glue-datacatalog": ""`
6004
6049
  #
6005
- # * `"GLUE_PYTHON_VERSION": "3"`
6006
- #
6007
- # * `"GLUE_PYTHON_VERSION": "2"`
6050
+ # ^
6008
6051
  #
6009
6052
  # You can specify a version of Python support for development
6010
6053
  # endpoints by using the `Arguments` parameter in the
@@ -6156,9 +6199,9 @@ module Aws::Glue
6156
6199
  #
6157
6200
  # @!attribute [rw] scan_rate
6158
6201
  # The percentage of the configured read capacity units to use by the
6159
- # AWS Glue crawler. Read capacity units is a term defined by DynamoDB,
6160
- # and is a numeric value that acts as rate limiter for the number of
6161
- # reads that can be performed on that table per second.
6202
+ # Glue crawler. Read capacity units is a term defined by DynamoDB, and
6203
+ # is a numeric value that acts as a rate limiter for the number of reads
6204
+ # that can be performed on that table per second.
6162
6205
  #
6163
6206
  # The valid values are null or a value between 0.1 and 1.5. A null
6164
6207
  # value is used when user does not provide a value, and defaults to
@@ -6177,8 +6220,8 @@ module Aws::Glue
6177
6220
  include Aws::Structure
6178
6221
  end
6179
6222
 
6180
- # An edge represents a directed connection between two AWS Glue
6181
- # components that are part of the workflow the edge belongs to.
6223
+ # An edge represents a directed connection between two components on a
6224
+ # workflow graph.
6182
6225
  #
6183
6226
  # @!attribute [rw] source_id
6184
6227
  # The unique ID of the node within the workflow where the edge starts.
@@ -6212,7 +6255,7 @@ module Aws::Glue
6212
6255
  # @return [String]
6213
6256
  #
6214
6257
  # @!attribute [rw] sse_aws_kms_key_id
6215
- # The ID of the AWS KMS key to use for encryption at rest.
6258
+ # The ID of the KMS key to use for encryption at rest.
6216
6259
  # @return [String]
6217
6260
  #
6218
6261
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/EncryptionAtRest AWS API Documentation
@@ -6341,6 +6384,36 @@ module Aws::Glue
6341
6384
  include Aws::Structure
6342
6385
  end
6343
6386
 
6387
+ # Batch condition that must be met (specified number of events received
6388
+ # or batch time window expired) before EventBridge event trigger fires.
6389
+ #
6390
+ # @note When making an API call, you may pass EventBatchingCondition
6391
+ # data as a hash:
6392
+ #
6393
+ # {
6394
+ # batch_size: 1, # required
6395
+ # batch_window: 1,
6396
+ # }
6397
+ #
6398
+ # @!attribute [rw] batch_size
6399
+ # Number of events that must be received from Amazon EventBridge
6400
+ # before EventBridge event trigger fires.
6401
+ # @return [Integer]
6402
+ #
6403
+ # @!attribute [rw] batch_window
6404
+ # Window of time in seconds after which EventBridge event trigger
6405
+ # fires. Window starts when first event is received.
6406
+ # @return [Integer]
6407
+ #
6408
+ # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/EventBatchingCondition AWS API Documentation
6409
+ #
6410
+ class EventBatchingCondition < Struct.new(
6411
+ :batch_size,
6412
+ :batch_window)
6413
+ SENSITIVE = []
6414
+ include Aws::Structure
6415
+ end
6416
+
6344
6417
  # An execution property of a job.
6345
6418
  #
6346
6419
  # @note When making an API call, you may pass ExecutionProperty
@@ -6568,8 +6641,8 @@ module Aws::Glue
6568
6641
  # }
6569
6642
  #
6570
6643
  # @!attribute [rw] catalog_id
6571
- # The ID of the catalog to migrate. Currently, this should be the AWS
6572
- # account ID.
6644
+ # The ID of the catalog to migrate. Currently, this should be the
6645
+ # Amazon Web Services account ID.
6573
6646
  # @return [String]
6574
6647
  #
6575
6648
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/GetCatalogImportStatusRequest AWS API Documentation
@@ -6678,7 +6751,8 @@ module Aws::Glue
6678
6751
  #
6679
6752
  # @!attribute [rw] catalog_id
6680
6753
  # The ID of the Data Catalog where the partitions in question reside.
6681
- # If none is supplied, the AWS account ID is used by default.
6754
+ # If none is supplied, the Amazon Web Services account ID is used by
6755
+ # default.
6682
6756
  # @return [String]
6683
6757
  #
6684
6758
  # @!attribute [rw] database_name
@@ -6738,7 +6812,8 @@ module Aws::Glue
6738
6812
  #
6739
6813
  # @!attribute [rw] catalog_id
6740
6814
  # The ID of the Data Catalog where the partitions in question reside.
6741
- # If none is supplied, the AWS account ID is used by default.
6815
+ # If none is supplied, the Amazon Web Services account ID is used by
6816
+ # default.
6742
6817
  # @return [String]
6743
6818
  #
6744
6819
  # @!attribute [rw] database_name
@@ -6792,7 +6867,7 @@ module Aws::Glue
6792
6867
  #
6793
6868
  # @!attribute [rw] catalog_id
6794
6869
  # The ID of the Data Catalog in which the connection resides. If none
6795
- # is provided, the AWS account ID is used by default.
6870
+ # is provided, the Amazon Web Services account ID is used by default.
6796
6871
  # @return [String]
6797
6872
  #
6798
6873
  # @!attribute [rw] name
@@ -6803,9 +6878,9 @@ module Aws::Glue
6803
6878
  # Allows you to retrieve the connection metadata without returning the
6804
6879
  # password. For instance, the AWS Glue console uses this flag to
6805
6880
  # retrieve the connection, and does not display the password. Set this
6806
- # parameter when the caller might not have permission to use the AWS
6807
- # KMS key to decrypt the password, but it does have permission to
6808
- # access the rest of the connection properties.
6881
+ # parameter when the caller might not have permission to use the KMS
6882
+ # key to decrypt the password, but it does have permission to access
6883
+ # the rest of the connection properties.
6809
6884
  # @return [Boolean]
6810
6885
  #
6811
6886
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/GetConnectionRequest AWS API Documentation
@@ -6875,7 +6950,7 @@ module Aws::Glue
6875
6950
  #
6876
6951
  # @!attribute [rw] catalog_id
6877
6952
  # The ID of the Data Catalog in which the connections reside. If none
6878
- # is provided, the AWS account ID is used by default.
6953
+ # is provided, the Amazon Web Services account ID is used by default.
6879
6954
  # @return [String]
6880
6955
  #
6881
6956
  # @!attribute [rw] filter
@@ -6886,9 +6961,9 @@ module Aws::Glue
6886
6961
  # Allows you to retrieve the connection metadata without returning the
6887
6962
  # password. For instance, the AWS Glue console uses this flag to
6888
6963
  # retrieve the connection, and does not display the password. Set this
6889
- # parameter when the caller might not have permission to use the AWS
6890
- # KMS key to decrypt the password, but it does have permission to
6891
- # access the rest of the connection properties.
6964
+ # parameter when the caller might not have permission to use the KMS
6965
+ # key to decrypt the password, but it does have permission to access
6966
+ # the rest of the connection properties.
6892
6967
  # @return [Boolean]
6893
6968
  #
6894
6969
  # @!attribute [rw] next_token
@@ -7061,7 +7136,8 @@ module Aws::Glue
7061
7136
  #
7062
7137
  # @!attribute [rw] catalog_id
7063
7138
  # The ID of the Data Catalog to retrieve the security configuration
7064
- # for. If none is provided, the AWS account ID is used by default.
7139
+ # for. If none is provided, the Amazon Web Services account ID is used
7140
+ # by default.
7065
7141
  # @return [String]
7066
7142
  #
7067
7143
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/GetDataCatalogEncryptionSettingsRequest AWS API Documentation
@@ -7094,7 +7170,7 @@ module Aws::Glue
7094
7170
  #
7095
7171
  # @!attribute [rw] catalog_id
7096
7172
  # The ID of the Data Catalog in which the database resides. If none is
7097
- # provided, the AWS account ID is used by default.
7173
+ # provided, the Amazon Web Services account ID is used by default.
7098
7174
  # @return [String]
7099
7175
  #
7100
7176
  # @!attribute [rw] name
@@ -7135,7 +7211,8 @@ module Aws::Glue
7135
7211
  #
7136
7212
  # @!attribute [rw] catalog_id
7137
7213
  # The ID of the Data Catalog from which to retrieve `Databases`. If
7138
- # none is provided, the AWS account ID is used by default.
7214
+ # none is provided, the Amazon Web Services account ID is used by
7215
+ # default.
7139
7216
  # @return [String]
7140
7217
  #
7141
7218
  # @!attribute [rw] next_token
@@ -7699,7 +7776,7 @@ module Aws::Glue
7699
7776
  # @return [Time]
7700
7777
  #
7701
7778
  # @!attribute [rw] input_record_tables
7702
- # A list of AWS Glue table definitions used by the transform.
7779
+ # A list of Glue table definitions used by the transform.
7703
7780
  # @return [Array<Types::GlueTable>]
7704
7781
  #
7705
7782
  # @!attribute [rw] parameters
@@ -7726,11 +7803,11 @@ module Aws::Glue
7726
7803
  # @return [String]
7727
7804
  #
7728
7805
  # @!attribute [rw] glue_version
7729
- # This value determines which version of AWS Glue this machine
7730
- # learning transform is compatible with. Glue 1.0 is recommended for
7731
- # most customers. If the value is not set, the Glue compatibility
7732
- # defaults to Glue 0.9. For more information, see [AWS Glue
7733
- # Versions][1] in the developer guide.
7806
+ # This value determines which version of Glue this machine learning
7807
+ # transform is compatible with. Glue 1.0 is recommended for most
7808
+ # customers. If the value is not set, the Glue compatibility defaults
7809
+ # to Glue 0.9. For more information, see [Glue Versions][1] in the
7810
+ # developer guide.
7734
7811
  #
7735
7812
  #
7736
7813
  #
@@ -7738,12 +7815,11 @@ module Aws::Glue
7738
7815
  # @return [String]
7739
7816
  #
7740
7817
  # @!attribute [rw] max_capacity
7741
- # The number of AWS Glue data processing units (DPUs) that are
7742
- # allocated to task runs for this transform. You can allocate from 2
7743
- # to 100 DPUs; the default is 10. A DPU is a relative measure of
7744
- # processing power that consists of 4 vCPUs of compute capacity and 16
7745
- # GB of memory. For more information, see the [AWS Glue pricing
7746
- # page][1].
7818
+ # The number of Glue data processing units (DPUs) that are allocated
7819
+ # to task runs for this transform. You can allocate from 2 to 100
7820
+ # DPUs; the default is 10. A DPU is a relative measure of processing
7821
+ # power that consists of 4 vCPUs of compute capacity and 16 GB of
7822
+ # memory. For more information, see the [Glue pricing page][1].
7747
7823
  #
7748
7824
  # When the `WorkerType` field is set to a value other than `Standard`,
7749
7825
  # the `MaxCapacity` field is set automatically and becomes read-only.
@@ -8030,7 +8106,8 @@ module Aws::Glue
8030
8106
  #
8031
8107
  # @!attribute [rw] catalog_id
8032
8108
  # The ID of the Data Catalog where the partition in question resides.
8033
- # If none is provided, the AWS account ID is used by default.
8109
+ # If none is provided, the Amazon Web Services account ID is used by
8110
+ # default.
8034
8111
  # @return [String]
8035
8112
  #
8036
8113
  # @!attribute [rw] database_name
@@ -8087,7 +8164,8 @@ module Aws::Glue
8087
8164
  #
8088
8165
  # @!attribute [rw] catalog_id
8089
8166
  # The ID of the Data Catalog where the partitions in question reside.
8090
- # If none is provided, the AWS account ID is used by default.
8167
+ # If none is provided, the Amazon Web Services account ID is used by
8168
+ # default.
8091
8169
  # @return [String]
8092
8170
  #
8093
8171
  # @!attribute [rw] database_name
@@ -8182,7 +8260,7 @@ module Aws::Glue
8182
8260
  #
8183
8261
  # * `decimal`
8184
8262
  #
8185
- # If an invalid type is encountered, an exception is thrown.
8263
+ # If a type is encountered that is not valid, an exception is thrown.
8186
8264
  #
8187
8265
  # The following list shows the valid operators on each type. When you
8188
8266
  # define a crawler, the `partitionKey` type is created as a `STRING`,
@@ -8323,7 +8401,7 @@ module Aws::Glue
8323
8401
  # Currently, these key-value pairs are supported:
8324
8402
  #
8325
8403
  # * `inferSchema`  —  Specifies whether to set `inferSchema` to true
8326
- # or false for the default script generated by an AWS Glue job. For
8404
+ # or false for the default script generated by a Glue job. For
8327
8405
  # example, to set `inferSchema` to true, pass the following key
8328
8406
  # value pair:
8329
8407
  #
@@ -8472,10 +8550,10 @@ module Aws::Glue
8472
8550
  # }
8473
8551
  #
8474
8552
  # @!attribute [rw] resource_arn
8475
- # The ARN of the AWS Glue resource for which to retrieve the resource
8553
+ # The ARN of the Glue resource for which to retrieve the resource
8476
8554
  # policy. If not supplied, the Data Catalog resource policy is
8477
8555
  # returned. Use `GetResourcePolicies` to view all existing resource
8478
- # policies. For more information see [Specifying AWS Glue Resource
8556
+ # policies. For more information see [Specifying Glue Resource
8479
8557
  # ARNs][1].
8480
8558
  #
8481
8559
  #
@@ -8563,8 +8641,8 @@ module Aws::Glue
8563
8641
  # @return [String]
8564
8642
  #
8565
8643
  # @!attribute [rw] data_format
8566
- # The data format of the schema definition. Currently only `AVRO` is
8567
- # supported.
8644
+ # The data format of the schema definition. Currently only `AVRO` and
8645
+ # `JSON` are supported.
8568
8646
  # @return [String]
8569
8647
  #
8570
8648
  # @!attribute [rw] status
@@ -8639,8 +8717,8 @@ module Aws::Glue
8639
8717
  # @return [String]
8640
8718
  #
8641
8719
  # @!attribute [rw] data_format
8642
- # The data format of the schema definition. Currently only `AVRO` is
8643
- # supported.
8720
+ # The data format of the schema definition. Currently `AVRO` and
8721
+ # `JSON` are supported.
8644
8722
  # @return [String]
8645
8723
  #
8646
8724
  # @!attribute [rw] compatibility
@@ -8751,8 +8829,8 @@ module Aws::Glue
8751
8829
  # @return [String]
8752
8830
  #
8753
8831
  # @!attribute [rw] data_format
8754
- # The data format of the schema definition. Currently only `AVRO` is
8755
- # supported.
8832
+ # The data format of the schema definition. Currently `AVRO` and
8833
+ # `JSON` are supported.
8756
8834
  # @return [String]
8757
8835
  #
8758
8836
  # @!attribute [rw] schema_arn
@@ -8936,7 +9014,7 @@ module Aws::Glue
8936
9014
  #
8937
9015
  # @!attribute [rw] catalog_id
8938
9016
  # The ID of the Data Catalog where the table resides. If none is
8939
- # provided, the AWS account ID is used by default.
9017
+ # provided, the Amazon Web Services account ID is used by default.
8940
9018
  # @return [String]
8941
9019
  #
8942
9020
  # @!attribute [rw] database_name
@@ -8983,7 +9061,7 @@ module Aws::Glue
8983
9061
  #
8984
9062
  # @!attribute [rw] catalog_id
8985
9063
  # The ID of the Data Catalog where the tables reside. If none is
8986
- # provided, the AWS account ID is used by default.
9064
+ # provided, the Amazon Web Services account ID is used by default.
8987
9065
  # @return [String]
8988
9066
  #
8989
9067
  # @!attribute [rw] database_name
@@ -9038,7 +9116,7 @@ module Aws::Glue
9038
9116
  #
9039
9117
  # @!attribute [rw] catalog_id
9040
9118
  # The ID of the Data Catalog where the tables reside. If none is
9041
- # provided, the AWS account ID is used by default.
9119
+ # provided, the Amazon Web Services account ID is used by default.
9042
9120
  # @return [String]
9043
9121
  #
9044
9122
  # @!attribute [rw] database_name
@@ -9103,7 +9181,7 @@ module Aws::Glue
9103
9181
  #
9104
9182
  # @!attribute [rw] catalog_id
9105
9183
  # The ID of the Data Catalog where the tables reside. If none is
9106
- # provided, the AWS account ID is used by default.
9184
+ # provided, the Amazon Web Services account ID is used by default.
9107
9185
  # @return [String]
9108
9186
  #
9109
9187
  # @!attribute [rw] database_name
@@ -9279,7 +9357,8 @@ module Aws::Glue
9279
9357
  #
9280
9358
  # @!attribute [rw] catalog_id
9281
9359
  # The ID of the Data Catalog where the function to be retrieved is
9282
- # located. If none is provided, the AWS account ID is used by default.
9360
+ # located. If none is provided, the Amazon Web Services account ID is
9361
+ # used by default.
9283
9362
  # @return [String]
9284
9363
  #
9285
9364
  # @!attribute [rw] database_name
@@ -9325,7 +9404,8 @@ module Aws::Glue
9325
9404
  #
9326
9405
  # @!attribute [rw] catalog_id
9327
9406
  # The ID of the Data Catalog where the functions to be retrieved are
9328
- # located. If none is provided, the AWS account ID is used by default.
9407
+ # located. If none is provided, the Amazon Web Services account ID is
9408
+ # used by default.
9329
9409
  # @return [String]
9330
9410
  #
9331
9411
  # @!attribute [rw] database_name
@@ -9593,8 +9673,8 @@ module Aws::Glue
9593
9673
  include Aws::Structure
9594
9674
  end
9595
9675
 
9596
- # The database and table in the AWS Glue Data Catalog that is used for
9597
- # input or output data.
9676
+ # The database and table in the Glue Data Catalog that is used for input
9677
+ # or output data.
9598
9678
  #
9599
9679
  # @note When making an API call, you may pass GlueTable
9600
9680
  # data as a hash:
@@ -9607,19 +9687,19 @@ module Aws::Glue
9607
9687
  # }
9608
9688
  #
9609
9689
  # @!attribute [rw] database_name
9610
- # A database name in the AWS Glue Data Catalog.
9690
+ # A database name in the Glue Data Catalog.
9611
9691
  # @return [String]
9612
9692
  #
9613
9693
  # @!attribute [rw] table_name
9614
- # A table name in the AWS Glue Data Catalog.
9694
+ # A table name in the Glue Data Catalog.
9615
9695
  # @return [String]
9616
9696
  #
9617
9697
  # @!attribute [rw] catalog_id
9618
- # A unique identifier for the AWS Glue Data Catalog.
9698
+ # A unique identifier for the Glue Data Catalog.
9619
9699
  # @return [String]
9620
9700
  #
9621
9701
  # @!attribute [rw] connection_name
9622
- # The name of the connection to the AWS Glue Data Catalog.
9702
+ # The name of the connection to the Glue Data Catalog.
9623
9703
  # @return [String]
9624
9704
  #
9625
9705
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/GlueTable AWS API Documentation
@@ -9725,8 +9805,8 @@ module Aws::Glue
9725
9805
  # }
9726
9806
  #
9727
9807
  # @!attribute [rw] catalog_id
9728
- # The ID of the catalog to import. Currently, this should be the AWS
9729
- # account ID.
9808
+ # The ID of the catalog to import. Currently, this should be the
9809
+ # Amazon Web Services account ID.
9730
9810
  # @return [String]
9731
9811
  #
9732
9812
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/ImportCatalogToGlueRequest AWS API Documentation
@@ -9860,22 +9940,22 @@ module Aws::Glue
9860
9940
  # @return [Types::ExecutionProperty]
9861
9941
  #
9862
9942
  # @!attribute [rw] command
9863
- # The `JobCommand` that executes this job.
9943
+ # The `JobCommand` that runs this job.
9864
9944
  # @return [Types::JobCommand]
9865
9945
  #
9866
9946
  # @!attribute [rw] default_arguments
9867
9947
  # The default arguments for this job, specified as name-value pairs.
9868
9948
  #
9869
9949
  # You can specify arguments here that your own job-execution script
9870
- # consumes, as well as arguments that AWS Glue itself consumes.
9950
+ # consumes, as well as arguments that Glue itself consumes.
9871
9951
  #
9872
9952
  # For information about how to specify and consume your own Job
9873
- # arguments, see the [Calling AWS Glue APIs in Python][1] topic in the
9953
+ # arguments, see the [Calling Glue APIs in Python][1] topic in the
9874
9954
  # developer guide.
9875
9955
  #
9876
- # For information about the key-value pairs that AWS Glue consumes to
9877
- # set up your job, see the [Special Parameters Used by AWS Glue][2]
9878
- # topic in the developer guide.
9956
+ # For information about the key-value pairs that Glue consumes to set
9957
+ # up your job, see the [Special Parameters Used by Glue][2] topic in
9958
+ # the developer guide.
9879
9959
  #
9880
9960
  #
9881
9961
  #
@@ -9899,11 +9979,11 @@ module Aws::Glue
9899
9979
  # @!attribute [rw] allocated_capacity
9900
9980
  # This field is deprecated. Use `MaxCapacity` instead.
9901
9981
  #
9902
- # The number of AWS Glue data processing units (DPUs) allocated to
9903
- # runs of this job. You can allocate from 2 to 100 DPUs; the default
9904
- # is 10. A DPU is a relative measure of processing power that consists
9905
- # of 4 vCPUs of compute capacity and 16 GB of memory. For more
9906
- # information, see the [AWS Glue pricing page][1].
9982
+ # The number of Glue data processing units (DPUs) allocated to runs of
9983
+ # this job. You can allocate from 2 to 100 DPUs; the default is 10. A
9984
+ # DPU is a relative measure of processing power that consists of 4
9985
+ # vCPUs of compute capacity and 16 GB of memory. For more information,
9986
+ # see the [Glue pricing page][1].
9907
9987
  #
9908
9988
  #
9909
9989
  #
@@ -9919,11 +9999,11 @@ module Aws::Glue
9919
9999
  # @return [Integer]
9920
10000
  #
9921
10001
  # @!attribute [rw] max_capacity
9922
- # The number of AWS Glue data processing units (DPUs) that can be
10002
+ # For Glue version 1.0 or earlier jobs, using the standard worker
10003
+ # type, the number of Glue data processing units (DPUs) that can be
9923
10004
  # allocated when this job runs. A DPU is a relative measure of
9924
10005
  # processing power that consists of 4 vCPUs of compute capacity and 16
9925
- # GB of memory. For more information, see the [AWS Glue pricing
9926
- # page][1].
10006
+ # GB of memory. For more information, see the [Glue pricing page][1].
9927
10007
  #
9928
10008
  # Do not set `Max Capacity` if using `WorkerType` and
9929
10009
  # `NumberOfWorkers`.
@@ -9942,6 +10022,10 @@ module Aws::Glue
9942
10022
  # 100 DPUs. The default is 10 DPUs. This job type cannot have a
9943
10023
  # fractional DPU allocation.
9944
10024
  #
10025
+ # For Glue version 2.0 jobs, you cannot specify a `Maximum
10026
+ # capacity`. Instead, you should specify a `Worker type` and the
10027
+ # `Number of workers`.
10028
+ #
9945
10029
  #
9946
10030
  #
9947
10031
  # [1]: https://aws.amazon.com/glue/pricing/
@@ -9982,10 +10066,10 @@ module Aws::Glue
9982
10066
  #
9983
10067
  # @!attribute [rw] glue_version
9984
10068
  # Glue version determines the versions of Apache Spark and Python that
9985
- # AWS Glue supports. The Python version indicates the version
9986
- # supported for jobs of type Spark.
10069
+ # Glue supports. The Python version indicates the version supported
10070
+ # for jobs of type Spark.
9987
10071
  #
9988
- # For more information about the available AWS Glue versions and
10072
+ # For more information about the available Glue versions and
9989
10073
  # corresponding Spark and Python versions, see [Glue version][1] in
9990
10074
  # the developer guide.
9991
10075
  #
@@ -10096,7 +10180,7 @@ module Aws::Glue
10096
10180
  include Aws::Structure
10097
10181
  end
10098
10182
 
10099
- # Specifies code executed when a job is run.
10183
+ # Specifies code that runs when a job is run.
10100
10184
  #
10101
10185
  # @note When making an API call, you may pass JobCommand
10102
10186
  # data as a hash:
@@ -10115,11 +10199,11 @@ module Aws::Glue
10115
10199
  #
10116
10200
  # @!attribute [rw] script_location
10117
10201
  # Specifies the Amazon Simple Storage Service (Amazon S3) path to a
10118
- # script that executes a job.
10202
+ # script that runs a job.
10119
10203
  # @return [String]
10120
10204
  #
10121
10205
  # @!attribute [rw] python_version
10122
- # The Python version being used to execute a Python shell job. Allowed
10206
+ # The Python version being used to run a Python shell job. Allowed
10123
10207
  # values are 2 or 3.
10124
10208
  # @return [String]
10125
10209
  #
@@ -10184,8 +10268,8 @@ module Aws::Glue
10184
10268
  #
10185
10269
  # @!attribute [rw] job_run_state
10186
10270
  # The current state of the job run. For more information about the
10187
- # statuses of jobs that have terminated abnormally, see [AWS Glue Job
10188
- # Run Statuses][1].
10271
+ # statuses of jobs that have terminated abnormally, see [Glue Job Run
10272
+ # Statuses][1].
10189
10273
  #
10190
10274
  #
10191
10275
  #
@@ -10197,15 +10281,15 @@ module Aws::Glue
10197
10281
  # replace the default arguments set in the job definition itself.
10198
10282
  #
10199
10283
  # You can specify arguments here that your own job-execution script
10200
- # consumes, as well as arguments that AWS Glue itself consumes.
10284
+ # consumes, as well as arguments that Glue itself consumes.
10201
10285
  #
10202
10286
  # For information about how to specify and consume your own job
10203
- # arguments, see the [Calling AWS Glue APIs in Python][1] topic in the
10287
+ # arguments, see the [Calling Glue APIs in Python][1] topic in the
10204
10288
  # developer guide.
10205
10289
  #
10206
- # For information about the key-value pairs that AWS Glue consumes to
10207
- # set up your job, see the [Special Parameters Used by AWS Glue][2]
10208
- # topic in the developer guide.
10290
+ # For information about the key-value pairs that Glue consumes to set
10291
+ # up your job, see the [Special Parameters Used by Glue][2] topic in
10292
+ # the developer guide.
10209
10293
  #
10210
10294
  #
10211
10295
  #
@@ -10224,11 +10308,11 @@ module Aws::Glue
10224
10308
  # @!attribute [rw] allocated_capacity
10225
10309
  # This field is deprecated. Use `MaxCapacity` instead.
10226
10310
  #
10227
- # The number of AWS Glue data processing units (DPUs) allocated to
10228
- # this JobRun. From 2 to 100 DPUs can be allocated; the default is 10.
10229
- # A DPU is a relative measure of processing power that consists of 4
10311
+ # The number of Glue data processing units (DPUs) allocated to this
10312
+ # JobRun. From 2 to 100 DPUs can be allocated; the default is 10. A
10313
+ # DPU is a relative measure of processing power that consists of 4
10230
10314
  # vCPUs of compute capacity and 16 GB of memory. For more information,
10231
- # see the [AWS Glue pricing page][1].
10315
+ # see the [Glue pricing page][1].
10232
10316
  #
10233
10317
  #
10234
10318
  #
@@ -10247,11 +10331,10 @@ module Aws::Glue
10247
10331
  # @return [Integer]
10248
10332
  #
10249
10333
  # @!attribute [rw] max_capacity
10250
- # The number of AWS Glue data processing units (DPUs) that can be
10334
+ # The number of Glue data processing units (DPUs) that can be
10251
10335
  # allocated when this job runs. A DPU is a relative measure of
10252
10336
  # processing power that consists of 4 vCPUs of compute capacity and 16
10253
- # GB of memory. For more information, see the [AWS Glue pricing
10254
- # page][1].
10337
+ # GB of memory. For more information, see the [Glue pricing page][1].
10255
10338
  #
10256
10339
  # Do not set `Max Capacity` if using `WorkerType` and
10257
10340
  # `NumberOfWorkers`.
@@ -10270,7 +10353,7 @@ module Aws::Glue
10270
10353
  #
10271
10354
  #
10272
10355
  #
10273
- # [1]: https://docs.aws.amazon.com/https:/aws.amazon.com/glue/pricing/
10356
+ # [1]: https://aws.amazon.com/glue/pricing/
10274
10357
  # @return [Float]
10275
10358
  #
10276
10359
  # @!attribute [rw] worker_type
@@ -10302,7 +10385,7 @@ module Aws::Glue
10302
10385
  #
10303
10386
  # @!attribute [rw] log_group_name
10304
10387
  # The name of the log group for secure logging that can be server-side
10305
- # encrypted in Amazon CloudWatch using AWS KMS. This name can be
10388
+ # encrypted in Amazon CloudWatch using KMS. This name can be
10306
10389
  # `/aws-glue/jobs/`, in which case the default encryption is `NONE`.
10307
10390
  # If you add a role name and `SecurityConfiguration` name (in other
10308
10391
  # words,
@@ -10316,10 +10399,10 @@ module Aws::Glue
10316
10399
  #
10317
10400
  # @!attribute [rw] glue_version
10318
10401
  # Glue version determines the versions of Apache Spark and Python that
10319
- # AWS Glue supports. The Python version indicates the version
10320
- # supported for jobs of type Spark.
10402
+ # Glue supports. The Python version indicates the version supported
10403
+ # for jobs of type Spark.
10321
10404
  #
10322
- # For more information about the available AWS Glue versions and
10405
+ # For more information about the available Glue versions and
10323
10406
  # corresponding Spark and Python versions, see [Glue version][1] in
10324
10407
  # the developer guide.
10325
10408
  #
@@ -10419,22 +10502,22 @@ module Aws::Glue
10419
10502
  # @return [Types::ExecutionProperty]
10420
10503
  #
10421
10504
  # @!attribute [rw] command
10422
- # The `JobCommand` that executes this job (required).
10505
+ # The `JobCommand` that runs this job (required).
10423
10506
  # @return [Types::JobCommand]
10424
10507
  #
10425
10508
  # @!attribute [rw] default_arguments
10426
10509
  # The default arguments for this job.
10427
10510
  #
10428
10511
  # You can specify arguments here that your own job-execution script
10429
- # consumes, as well as arguments that AWS Glue itself consumes.
10512
+ # consumes, as well as arguments that Glue itself consumes.
10430
10513
  #
10431
10514
  # For information about how to specify and consume your own Job
10432
- # arguments, see the [Calling AWS Glue APIs in Python][1] topic in the
10515
+ # arguments, see the [Calling Glue APIs in Python][1] topic in the
10433
10516
  # developer guide.
10434
10517
  #
10435
- # For information about the key-value pairs that AWS Glue consumes to
10436
- # set up your job, see the [Special Parameters Used by AWS Glue][2]
10437
- # topic in the developer guide.
10518
+ # For information about the key-value pairs that Glue consumes to set
10519
+ # up your job, see the [Special Parameters Used by Glue][2] topic in
10520
+ # the developer guide.
10438
10521
  #
10439
10522
  #
10440
10523
  #
@@ -10458,11 +10541,11 @@ module Aws::Glue
10458
10541
  # @!attribute [rw] allocated_capacity
10459
10542
  # This field is deprecated. Use `MaxCapacity` instead.
10460
10543
  #
10461
- # The number of AWS Glue data processing units (DPUs) to allocate to
10462
- # this job. You can allocate from 2 to 100 DPUs; the default is 10. A
10463
- # DPU is a relative measure of processing power that consists of 4
10464
- # vCPUs of compute capacity and 16 GB of memory. For more information,
10465
- # see the [AWS Glue pricing page][1].
10544
+ # The number of Glue data processing units (DPUs) to allocate to this
10545
+ # job. You can allocate from 2 to 100 DPUs; the default is 10. A DPU
10546
+ # is a relative measure of processing power that consists of 4 vCPUs
10547
+ # of compute capacity and 16 GB of memory. For more information, see
10548
+ # the [Glue pricing page][1].
10466
10549
  #
10467
10550
  #
10468
10551
  #
@@ -10476,11 +10559,11 @@ module Aws::Glue
10476
10559
  # @return [Integer]
10477
10560
  #
10478
10561
  # @!attribute [rw] max_capacity
10479
- # The number of AWS Glue data processing units (DPUs) that can be
10562
+ # For Glue version 1.0 or earlier jobs, using the standard worker
10563
+ # type, the number of Glue data processing units (DPUs) that can be
10480
10564
  # allocated when this job runs. A DPU is a relative measure of
10481
10565
  # processing power that consists of 4 vCPUs of compute capacity and 16
10482
- # GB of memory. For more information, see the [AWS Glue pricing
10483
- # page][1].
10566
+ # GB of memory. For more information, see the [Glue pricing page][1].
10484
10567
  #
10485
10568
  # Do not set `Max Capacity` if using `WorkerType` and
10486
10569
  # `NumberOfWorkers`.
@@ -10498,6 +10581,10 @@ module Aws::Glue
10498
10581
  # 100 DPUs. The default is 10 DPUs. This job type cannot have a
10499
10582
  # fractional DPU allocation.
10500
10583
  #
10584
+ # For Glue version 2.0 jobs, you cannot specify a `Maximum
10585
+ # capacity`. Instead, you should specify a `Worker type` and the
10586
+ # `Number of workers`.
10587
+ #
10501
10588
  #
10502
10589
  #
10503
10590
  # [1]: https://aws.amazon.com/glue/pricing/
@@ -10538,10 +10625,10 @@ module Aws::Glue
10538
10625
  #
10539
10626
  # @!attribute [rw] glue_version
10540
10627
  # Glue version determines the versions of Apache Spark and Python that
10541
- # AWS Glue supports. The Python version indicates the version
10542
- # supported for jobs of type Spark.
10628
+ # Glue supports. The Python version indicates the version supported
10629
+ # for jobs of type Spark.
10543
10630
  #
10544
- # For more information about the available AWS Glue versions and
10631
+ # For more information about the available Glue versions and
10545
10632
  # corresponding Spark and Python versions, see [Glue version][1] in
10546
10633
  # the developer guide.
10547
10634
  #
@@ -10594,7 +10681,7 @@ module Aws::Glue
10594
10681
  #
10595
10682
  # @!attribute [rw] json_path
10596
10683
  # A `JsonPath` string defining the JSON data for the classifier to
10597
- # classify. AWS Glue supports a subset of JsonPath, as described in
10684
+ # classify. Glue supports a subset of JsonPath, as described in
10598
10685
  # [Writing JsonPath Custom Classifiers][1].
10599
10686
  #
10600
10687
  #
@@ -11342,7 +11429,7 @@ module Aws::Glue
11342
11429
  # @return [Time]
11343
11430
  #
11344
11431
  # @!attribute [rw] input_record_tables
11345
- # A list of AWS Glue table definitions used by the transform.
11432
+ # A list of Glue table definitions used by the transform.
11346
11433
  # @return [Array<Types::GlueTable>]
11347
11434
  #
11348
11435
  # @!attribute [rw] parameters
@@ -11358,9 +11445,9 @@ module Aws::Glue
11358
11445
  # @return [Types::EvaluationMetrics]
11359
11446
  #
11360
11447
  # @!attribute [rw] label_count
11361
- # A count identifier for the labeling files generated by AWS Glue for
11362
- # this transform. As you create a better transform, you can
11363
- # iteratively download, label, and upload the labeling file.
11448
+ # A count identifier for the labeling files generated by Glue for this
11449
+ # transform. As you create a better transform, you can iteratively
11450
+ # download, label, and upload the labeling file.
11364
11451
  # @return [Integer]
11365
11452
  #
11366
11453
  # @!attribute [rw] schema
@@ -11371,13 +11458,13 @@ module Aws::Glue
11371
11458
  #
11372
11459
  # @!attribute [rw] role
11373
11460
  # The name or Amazon Resource Name (ARN) of the IAM role with the
11374
- # required permissions. The required permissions include both AWS Glue
11375
- # service role permissions to AWS Glue resources, and Amazon S3
11461
+ # required permissions. The required permissions include both Glue
11462
+ # service role permissions to Glue resources, and Amazon S3
11376
11463
  # permissions required by the transform.
11377
11464
  #
11378
- # * This role needs AWS Glue service role permissions to allow access
11379
- # to resources in AWS Glue. See [Attach a Policy to IAM Users That
11380
- # Access AWS Glue][1].
11465
+ # * This role needs Glue service role permissions to allow access to
11466
+ # resources in Glue. See [Attach a Policy to IAM Users That Access
11467
+ # Glue][1].
11381
11468
  #
11382
11469
  # * This role needs permission to your Amazon Simple Storage Service
11383
11470
  # (Amazon S3) sources, targets, temporary directory, scripts, and
@@ -11389,11 +11476,11 @@ module Aws::Glue
11389
11476
  # @return [String]
11390
11477
  #
11391
11478
  # @!attribute [rw] glue_version
11392
- # This value determines which version of AWS Glue this machine
11393
- # learning transform is compatible with. Glue 1.0 is recommended for
11394
- # most customers. If the value is not set, the Glue compatibility
11395
- # defaults to Glue 0.9. For more information, see [AWS Glue
11396
- # Versions][1] in the developer guide.
11479
+ # This value determines which version of Glue this machine learning
11480
+ # transform is compatible with. Glue 1.0 is recommended for most
11481
+ # customers. If the value is not set, the Glue compatibility defaults
11482
+ # to Glue 0.9. For more information, see [Glue Versions][1] in the
11483
+ # developer guide.
11397
11484
  #
11398
11485
  #
11399
11486
  #
@@ -11401,12 +11488,11 @@ module Aws::Glue
11401
11488
  # @return [String]
11402
11489
  #
11403
11490
  # @!attribute [rw] max_capacity
11404
- # The number of AWS Glue data processing units (DPUs) that are
11405
- # allocated to task runs for this transform. You can allocate from 2
11406
- # to 100 DPUs; the default is 10. A DPU is a relative measure of
11407
- # processing power that consists of 4 vCPUs of compute capacity and 16
11408
- # GB of memory. For more information, see the [AWS Glue pricing
11409
- # page][1].
11491
+ # The number of Glue data processing units (DPUs) that are allocated
11492
+ # to task runs for this transform. You can allocate from 2 to 100
11493
+ # DPUs; the default is 10. A DPU is a relative measure of processing
11494
+ # power that consists of 4 vCPUs of compute capacity and 16 GB of
11495
+ # memory. For more information, see the [Glue pricing page][1].
11410
11496
  #
11411
11497
  # `MaxCapacity` is a mutually exclusive option with `NumberOfWorkers`
11412
11498
  # and `WorkerType`.
@@ -11537,8 +11623,8 @@ module Aws::Glue
11537
11623
  #
11538
11624
  # * DISABLED: encryption is disabled
11539
11625
  #
11540
- # * SSEKMS: use of server-side encryption with AWS Key Management
11541
- # Service (SSE-KMS) for user data stored in Amazon S3.
11626
+ # * SSEKMS: use of server-side encryption with Key Management Service
11627
+ # (SSE-KMS) for user data stored in Amazon S3.
11542
11628
  # @return [String]
11543
11629
  #
11544
11630
  # @!attribute [rw] kms_key_id
@@ -11711,15 +11797,15 @@ module Aws::Glue
11711
11797
  include Aws::Structure
11712
11798
  end
11713
11799
 
11714
- # A node represents an AWS Glue component such as a trigger, or job,
11715
- # etc., that is part of a workflow.
11800
+ # A node represents a Glue component (trigger, crawler, or job) on a
11801
+ # workflow graph.
11716
11802
  #
11717
11803
  # @!attribute [rw] type
11718
- # The type of AWS Glue component represented by the node.
11804
+ # The type of Glue component represented by the node.
11719
11805
  # @return [String]
11720
11806
  #
11721
11807
  # @!attribute [rw] name
11722
- # The name of the AWS Glue component represented by the node.
11808
+ # The name of the Glue component represented by the node.
11723
11809
  # @return [String]
11724
11810
  #
11725
11811
  # @!attribute [rw] unique_id
@@ -12051,8 +12137,8 @@ module Aws::Glue
12051
12137
  #
12052
12138
  # The values for the keys for the new partition must be passed as an
12053
12139
  # array of String objects that must be ordered in the same order as
12054
- # the partition keys appearing in the Amazon S3 prefix. Otherwise AWS
12055
- # Glue will add the values to the wrong keys.
12140
+ # the partition keys appearing in the Amazon S3 prefix. Otherwise Glue
12141
+ # will add the values to the wrong keys.
12056
12142
  # @return [Array<String>]
12057
12143
  #
12058
12144
  # @!attribute [rw] last_access_time
@@ -12279,7 +12365,8 @@ module Aws::Glue
12279
12365
  #
12280
12366
  # @!attribute [rw] catalog_id
12281
12367
  # The ID of the Data Catalog to set the security configuration for. If
12282
- # none is provided, the AWS account ID is used by default.
12368
+ # none is provided, the Amazon Web Services account ID is used by
12369
+ # default.
12283
12370
  # @return [String]
12284
12371
  #
12285
12372
  # @!attribute [rw] data_catalog_encryption_settings
@@ -12338,7 +12425,7 @@ module Aws::Glue
12338
12425
  #
12339
12426
  # * By directly updating the resource policy with `PutResourcePolicy`
12340
12427
  #
12341
- # * By using the **Grant permissions** command on the AWS Management
12428
+ # * By using the **Grant permissions** command on the Management
12342
12429
  # Console.
12343
12430
  #
12344
12431
  # Must be set to `'TRUE'` if you have already used the Management
@@ -12593,8 +12680,8 @@ module Aws::Glue
12593
12680
  # When crawling an Amazon S3 data source after the first crawl is
12594
12681
  # complete, specifies whether to crawl the entire dataset again or to
12595
12682
  # crawl only folders that were added since the last crawler run. For
12596
- # more information, see [Incremental Crawls in AWS Glue][1] in the
12597
- # developer guide.
12683
+ # more information, see [Incremental Crawls in Glue][1] in the developer
12684
+ # guide.
12598
12685
  #
12599
12686
  #
12600
12687
  #
@@ -13018,6 +13105,7 @@ module Aws::Glue
13018
13105
  # path: "Path",
13019
13106
  # exclusions: ["Path"],
13020
13107
  # connection_name: "ConnectionName",
13108
+ # sample_size: 1,
13021
13109
  # }
13022
13110
  #
13023
13111
  # @!attribute [rw] path
@@ -13039,12 +13127,19 @@ module Aws::Glue
13039
13127
  # (Amazon VPC).
13040
13128
  # @return [String]
13041
13129
  #
13130
+ # @!attribute [rw] sample_size
13131
+ # Sets the number of files in each leaf folder to be crawled when
13132
+ # crawling sample files in a dataset. If not set, all the files are
13133
+ # crawled. A valid value is an integer between 1 and 249.
13134
+ # @return [Integer]
13135
+ #
13042
13136
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/S3Target AWS API Documentation
13043
13137
  #
13044
13138
  class S3Target < Struct.new(
13045
13139
  :path,
13046
13140
  :exclusions,
13047
- :connection_name)
13141
+ :connection_name,
13142
+ :sample_size)
13048
13143
  SENSITIVE = []
13049
13144
  include Aws::Structure
13050
13145
  end
@@ -13172,7 +13267,7 @@ module Aws::Glue
13172
13267
  include Aws::Structure
13173
13268
  end
13174
13269
 
13175
- # The unique ID of the schema in the AWS Glue schema registry.
13270
+ # The unique ID of the schema in the Glue schema registry.
13176
13271
  #
13177
13272
  # @note When making an API call, you may pass SchemaId
13178
13273
  # data as a hash:
@@ -13251,8 +13346,7 @@ module Aws::Glue
13251
13346
  include Aws::Structure
13252
13347
  end
13253
13348
 
13254
- # An object that references a schema stored in the AWS Glue Schema
13255
- # Registry.
13349
+ # An object that references a schema stored in the Glue Schema Registry.
13256
13350
  #
13257
13351
  # @note When making an API call, you may pass SchemaReference
13258
13352
  # data as a hash:
@@ -13506,7 +13600,7 @@ module Aws::Glue
13506
13600
  end
13507
13601
 
13508
13602
  # Defines a non-overlapping region of a table's partitions, allowing
13509
- # multiple requests to be executed in parallel.
13603
+ # multiple requests to be run in parallel.
13510
13604
  #
13511
13605
  # @note When making an API call, you may pass Segment
13512
13606
  # data as a hash:
@@ -13797,15 +13891,15 @@ module Aws::Glue
13797
13891
  # replace the default arguments set in the job definition itself.
13798
13892
  #
13799
13893
  # You can specify arguments here that your own job-execution script
13800
- # consumes, as well as arguments that AWS Glue itself consumes.
13894
+ # consumes, as well as arguments that Glue itself consumes.
13801
13895
  #
13802
13896
  # For information about how to specify and consume your own Job
13803
- # arguments, see the [Calling AWS Glue APIs in Python][1] topic in the
13897
+ # arguments, see the [Calling Glue APIs in Python][1] topic in the
13804
13898
  # developer guide.
13805
13899
  #
13806
- # For information about the key-value pairs that AWS Glue consumes to
13807
- # set up your job, see the [Special Parameters Used by AWS Glue][2]
13808
- # topic in the developer guide.
13900
+ # For information about the key-value pairs that Glue consumes to set
13901
+ # up your job, see the [Special Parameters Used by Glue][2] topic in
13902
+ # the developer guide.
13809
13903
  #
13810
13904
  #
13811
13905
  #
@@ -13816,15 +13910,15 @@ module Aws::Glue
13816
13910
  # @!attribute [rw] allocated_capacity
13817
13911
  # This field is deprecated. Use `MaxCapacity` instead.
13818
13912
  #
13819
- # The number of AWS Glue data processing units (DPUs) to allocate to
13820
- # this JobRun. From 2 to 100 DPUs can be allocated; the default is 10.
13821
- # A DPU is a relative measure of processing power that consists of 4
13913
+ # The number of Glue data processing units (DPUs) to allocate to this
13914
+ # JobRun. From 2 to 100 DPUs can be allocated; the default is 10. A
13915
+ # DPU is a relative measure of processing power that consists of 4
13822
13916
  # vCPUs of compute capacity and 16 GB of memory. For more information,
13823
- # see the [AWS Glue pricing page][1].
13917
+ # see the [Glue pricing page][1].
13824
13918
  #
13825
13919
  #
13826
13920
  #
13827
- # [1]: https://docs.aws.amazon.com/https:/aws.amazon.com/glue/pricing/
13921
+ # [1]: https://aws.amazon.com/glue/pricing/
13828
13922
  # @return [Integer]
13829
13923
  #
13830
13924
  # @!attribute [rw] timeout
@@ -13835,11 +13929,10 @@ module Aws::Glue
13835
13929
  # @return [Integer]
13836
13930
  #
13837
13931
  # @!attribute [rw] max_capacity
13838
- # The number of AWS Glue data processing units (DPUs) that can be
13932
+ # The number of Glue data processing units (DPUs) that can be
13839
13933
  # allocated when this job runs. A DPU is a relative measure of
13840
13934
  # processing power that consists of 4 vCPUs of compute capacity and 16
13841
- # GB of memory. For more information, see the [AWS Glue pricing
13842
- # page][1].
13935
+ # GB of memory. For more information, see the [Glue pricing page][1].
13843
13936
  #
13844
13937
  # Do not set `Max Capacity` if using `WorkerType` and
13845
13938
  # `NumberOfWorkers`.
@@ -13858,7 +13951,7 @@ module Aws::Glue
13858
13951
  #
13859
13952
  #
13860
13953
  #
13861
- # [1]: https://docs.aws.amazon.com/https:/aws.amazon.com/glue/pricing/
13954
+ # [1]: https://aws.amazon.com/glue/pricing/
13862
13955
  # @return [Float]
13863
13956
  #
13864
13957
  # @!attribute [rw] security_configuration
@@ -14052,6 +14145,28 @@ module Aws::Glue
14052
14145
  include Aws::Structure
14053
14146
  end
14054
14147
 
14148
+ # The batch condition that started the workflow run. Either the number
14149
+ # of events specified by the batch size arrived, in which case the BatchSize
14150
+ # member is non-zero, or the batch window expired, in which case the
14151
+ # BatchWindow member is non-zero.
14152
+ #
14153
+ # @!attribute [rw] batch_size
14154
+ # Number of events in the batch.
14155
+ # @return [Integer]
14156
+ #
14157
+ # @!attribute [rw] batch_window
14158
+ # Duration of the batch window in seconds.
14159
+ # @return [Integer]
14160
+ #
14161
+ # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/StartingEventBatchCondition AWS API Documentation
14162
+ #
14163
+ class StartingEventBatchCondition < Struct.new(
14164
+ :batch_size,
14165
+ :batch_window)
14166
+ SENSITIVE = []
14167
+ include Aws::Structure
14168
+ end
14169
+
14055
14170
  # @note When making an API call, you may pass StopCrawlerRequest
14056
14171
  # data as a hash:
14057
14172
  #
@@ -14271,7 +14386,7 @@ module Aws::Glue
14271
14386
  # @return [Boolean]
14272
14387
  #
14273
14388
  # @!attribute [rw] schema_reference
14274
- # An object that references a schema stored in the AWS Glue Schema
14389
+ # An object that references a schema stored in the Glue Schema
14275
14390
  # Registry.
14276
14391
  #
14277
14392
  # When creating a table, you can pass an empty list of columns for the
@@ -14418,8 +14533,7 @@ module Aws::Glue
14418
14533
  # @return [String]
14419
14534
  #
14420
14535
  # @!attribute [rw] is_registered_with_lake_formation
14421
- # Indicates whether the table has been registered with AWS Lake
14422
- # Formation.
14536
+ # Indicates whether the table has been registered with Lake Formation.
14423
14537
  # @return [Boolean]
14424
14538
  #
14425
14539
  # @!attribute [rw] target_table
@@ -14737,9 +14851,9 @@ module Aws::Glue
14737
14851
  # }
14738
14852
  #
14739
14853
  # @!attribute [rw] resource_arn
14740
- # The ARN of the AWS Glue resource to which to add the tags. For more
14741
- # information about AWS Glue resource ARNs, see the [AWS Glue ARN
14742
- # string pattern][1].
14854
+ # The ARN of the Glue resource to which to add the tags. For more
14855
+ # information about Glue resource ARNs, see the [Glue ARN string
14856
+ # pattern][1].
14743
14857
  #
14744
14858
  #
14745
14859
  #
@@ -15004,11 +15118,11 @@ module Aws::Glue
15004
15118
  # @return [String]
15005
15119
  #
15006
15120
  # @!attribute [rw] glue_version
15007
- # This value determines which version of AWS Glue this machine
15008
- # learning transform is compatible with. Glue 1.0 is recommended for
15009
- # most customers. If the value is not set, the Glue compatibility
15010
- # defaults to Glue 0.9. For more information, see [AWS Glue
15011
- # Versions][1] in the developer guide.
15121
+ # This value determines which version of Glue this machine learning
15122
+ # transform is compatible with. Glue 1.0 is recommended for most
15123
+ # customers. If the value is not set, the Glue compatibility defaults
15124
+ # to Glue 0.9. For more information, see [Glue Versions][1] in the
15125
+ # developer guide.
15012
15126
  #
15013
15127
  #
15014
15128
  #
@@ -15169,6 +15283,12 @@ module Aws::Glue
15169
15283
  # The predicate of this trigger, which defines when it will fire.
15170
15284
  # @return [Types::Predicate]
15171
15285
  #
15286
+ # @!attribute [rw] event_batching_condition
15287
+ # Batch condition that must be met (specified number of events
15288
+ # received or batch time window expired) before the EventBridge event
15289
+ # trigger fires.
15290
+ # @return [Types::EventBatchingCondition]
15291
+ #
15172
15292
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/Trigger AWS API Documentation
15173
15293
  #
15174
15294
  class Trigger < Struct.new(
@@ -15180,7 +15300,8 @@ module Aws::Glue
15180
15300
  :description,
15181
15301
  :schedule,
15182
15302
  :actions,
15183
- :predicate)
15303
+ :predicate,
15304
+ :event_batching_condition)
15184
15305
  SENSITIVE = []
15185
15306
  include Aws::Structure
15186
15307
  end
@@ -15236,6 +15357,10 @@ module Aws::Glue
15236
15357
  # },
15237
15358
  # ],
15238
15359
  # },
15360
+ # event_batching_condition: {
15361
+ # batch_size: 1, # required
15362
+ # batch_window: 1,
15363
+ # },
15239
15364
  # }
15240
15365
  #
15241
15366
  # @!attribute [rw] name
@@ -15264,6 +15389,12 @@ module Aws::Glue
15264
15389
  # The predicate of this trigger, which defines when it will fire.
15265
15390
  # @return [Types::Predicate]
15266
15391
  #
15392
+ # @!attribute [rw] event_batching_condition
15393
+ # Batch condition that must be met (specified number of events
15394
+ # received or batch time window expired) before the EventBridge event
15395
+ # trigger fires.
15396
+ # @return [Types::EventBatchingCondition]
15397
+ #
15267
15398
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/TriggerUpdate AWS API Documentation
15268
15399
  #
15269
15400
  class TriggerUpdate < Struct.new(
@@ -15271,7 +15402,8 @@ module Aws::Glue
15271
15402
  :description,
15272
15403
  :schedule,
15273
15404
  :actions,
15274
- :predicate)
15405
+ :predicate,
15406
+ :event_batching_condition)
15275
15407
  SENSITIVE = []
15276
15408
  include Aws::Structure
15277
15409
  end
@@ -15435,7 +15567,8 @@ module Aws::Glue
15435
15567
  #
15436
15568
  # @!attribute [rw] catalog_id
15437
15569
  # The ID of the Data Catalog where the partitions in question reside.
15438
- # If none is supplied, the AWS account ID is used by default.
15570
+ # If none is supplied, the Amazon Web Services account ID is used by
15571
+ # default.
15439
15572
  # @return [String]
15440
15573
  #
15441
15574
  # @!attribute [rw] database_name
@@ -15545,7 +15678,8 @@ module Aws::Glue
15545
15678
  #
15546
15679
  # @!attribute [rw] catalog_id
15547
15680
  # The ID of the Data Catalog where the partitions in question reside.
15548
- # If none is supplied, the AWS account ID is used by default.
15681
+ # If none is supplied, the Amazon Web Services account ID is used by
15682
+ # default.
15549
15683
  # @return [String]
15550
15684
  #
15551
15685
  # @!attribute [rw] database_name
@@ -15607,7 +15741,7 @@ module Aws::Glue
15607
15741
  #
15608
15742
  # @!attribute [rw] catalog_id
15609
15743
  # The ID of the Data Catalog in which the connection resides. If none
15610
- # is provided, the AWS account ID is used by default.
15744
+ # is provided, the Amazon Web Services account ID is used by default.
15611
15745
  # @return [String]
15612
15746
  #
15613
15747
  # @!attribute [rw] name
@@ -15647,6 +15781,7 @@ module Aws::Glue
15647
15781
  # path: "Path",
15648
15782
  # exclusions: ["Path"],
15649
15783
  # connection_name: "ConnectionName",
15784
+ # sample_size: 1,
15650
15785
  # },
15651
15786
  # ],
15652
15787
  # jdbc_targets: [
@@ -15704,7 +15839,7 @@ module Aws::Glue
15704
15839
  # @return [String]
15705
15840
  #
15706
15841
  # @!attribute [rw] database_name
15707
- # The AWS Glue database where results are stored, such as:
15842
+ # The Glue database where results are stored, such as:
15708
15843
  # `arn:aws:daylight:us-east-1::database/sometable/*`.
15709
15844
  # @return [String]
15710
15845
  #
@@ -15915,7 +16050,8 @@ module Aws::Glue
15915
16050
  #
15916
16051
  # @!attribute [rw] catalog_id
15917
16052
  # The ID of the Data Catalog in which the metadata database resides.
15918
- # If none is provided, the AWS account ID is used by default.
16053
+ # If none is provided, the Amazon Web Services account ID is used by
16054
+ # default.
15919
16055
  # @return [String]
15920
16056
  #
15921
16057
  # @!attribute [rw] name
@@ -15999,9 +16135,7 @@ module Aws::Glue
15999
16135
  #
16000
16136
  # * `"--enable-glue-datacatalog": ""`
16001
16137
  #
16002
- # * `"GLUE_PYTHON_VERSION": "3"`
16003
- #
16004
- # * `"GLUE_PYTHON_VERSION": "2"`
16138
+ # ^
16005
16139
  #
16006
16140
  # You can specify a version of Python support for development
16007
16141
  # endpoints by using the `Arguments` parameter in the
@@ -16154,7 +16288,7 @@ module Aws::Glue
16154
16288
  #
16155
16289
  # @!attribute [rw] json_path
16156
16290
  # A `JsonPath` string defining the JSON data for the classifier to
16157
- # classify. AWS Glue supports a subset of JsonPath, as described in
16291
+ # classify. Glue supports a subset of JsonPath, as described in
16158
16292
  # [Writing JsonPath Custom Classifiers][1].
16159
16293
  #
16160
16294
  #
@@ -16220,11 +16354,11 @@ module Aws::Glue
16220
16354
  # @return [String]
16221
16355
  #
16222
16356
  # @!attribute [rw] glue_version
16223
- # This value determines which version of AWS Glue this machine
16224
- # learning transform is compatible with. Glue 1.0 is recommended for
16225
- # most customers. If the value is not set, the Glue compatibility
16226
- # defaults to Glue 0.9. For more information, see [AWS Glue
16227
- # Versions][1] in the developer guide.
16357
+ # This value determines which version of Glue this machine learning
16358
+ # transform is compatible with. Glue 1.0 is recommended for most
16359
+ # customers. If the value is not set, the Glue compatibility defaults
16360
+ # to Glue 0.9. For more information, see [Glue Versions][1] in the
16361
+ # developer guide.
16228
16362
  #
16229
16363
  #
16230
16364
  #
@@ -16232,12 +16366,11 @@ module Aws::Glue
16232
16366
  # @return [String]
16233
16367
  #
16234
16368
  # @!attribute [rw] max_capacity
16235
- # The number of AWS Glue data processing units (DPUs) that are
16236
- # allocated to task runs for this transform. You can allocate from 2
16237
- # to 100 DPUs; the default is 10. A DPU is a relative measure of
16238
- # processing power that consists of 4 vCPUs of compute capacity and 16
16239
- # GB of memory. For more information, see the [AWS Glue pricing
16240
- # page][1].
16369
+ # The number of Glue data processing units (DPUs) that are allocated
16370
+ # to task runs for this transform. You can allocate from 2 to 100
16371
+ # DPUs; the default is 10. A DPU is a relative measure of processing
16372
+ # power that consists of 4 vCPUs of compute capacity and 16 GB of
16373
+ # memory. For more information, see the [Glue pricing page][1].
16241
16374
  #
16242
16375
  # When the `WorkerType` field is set to a value other than `Standard`,
16243
16376
  # the `MaxCapacity` field is set automatically and becomes read-only.
@@ -16379,7 +16512,8 @@ module Aws::Glue
16379
16512
  #
16380
16513
  # @!attribute [rw] catalog_id
16381
16514
  # The ID of the Data Catalog where the partition to be updated
16382
- # resides. If none is provided, the AWS account ID is used by default.
16515
+ # resides. If none is provided, the Amazon Web Services account ID is
16516
+ # used by default.
16383
16517
  # @return [String]
16384
16518
  #
16385
16519
  # @!attribute [rw] database_name
@@ -16632,7 +16766,7 @@ module Aws::Glue
16632
16766
  #
16633
16767
  # @!attribute [rw] catalog_id
16634
16768
  # The ID of the Data Catalog where the table resides. If none is
16635
- # provided, the AWS account ID is used by default.
16769
+ # provided, the Amazon Web Services account ID is used by default.
16636
16770
  # @return [String]
16637
16771
  #
16638
16772
  # @!attribute [rw] database_name
@@ -16701,6 +16835,10 @@ module Aws::Glue
16701
16835
  # },
16702
16836
  # ],
16703
16837
  # },
16838
+ # event_batching_condition: {
16839
+ # batch_size: 1, # required
16840
+ # batch_window: 1,
16841
+ # },
16704
16842
  # },
16705
16843
  # }
16706
16844
  #
@@ -16756,7 +16894,8 @@ module Aws::Glue
16756
16894
  #
16757
16895
  # @!attribute [rw] catalog_id
16758
16896
  # The ID of the Data Catalog where the function to be updated is
16759
- # located. If none is provided, the AWS account ID is used by default.
16897
+ # located. If none is provided, the Amazon Web Services account ID is
16898
+ # used by default.
16760
16899
  # @return [String]
16761
16900
  #
16762
16901
  # @!attribute [rw] database_name
@@ -17010,11 +17149,12 @@ module Aws::Glue
17010
17149
  include Aws::Structure
17011
17150
  end
17012
17151
 
17013
- # A workflow represents a flow in which AWS Glue components should be
17014
- # executed to complete a logical task.
17152
+ # A workflow is a collection of multiple dependent Glue jobs and
17153
+ # crawlers that are run to complete a complex ETL task. A workflow
17154
+ # manages the execution and monitoring of all its jobs and crawlers.
17015
17155
  #
17016
17156
  # @!attribute [rw] name
17017
- # The name of the workflow representing the flow.
17157
+ # The name of the workflow.
17018
17158
  # @return [String]
17019
17159
  #
17020
17160
  # @!attribute [rw] description
@@ -17023,7 +17163,9 @@ module Aws::Glue
17023
17163
  #
17024
17164
  # @!attribute [rw] default_run_properties
17025
17165
  # A collection of properties to be used as part of each execution of
17026
- # the workflow.
17166
+ # the workflow. The run properties are made available to each job in
17167
+ # the workflow. A job can modify the properties for the next jobs in
17168
+ # the flow.
17027
17169
  # @return [Hash<String,String>]
17028
17170
  #
17029
17171
  # @!attribute [rw] created_on
@@ -17039,9 +17181,8 @@ module Aws::Glue
17039
17181
  # @return [Types::WorkflowRun]
17040
17182
  #
17041
17183
  # @!attribute [rw] graph
17042
- # The graph representing all the AWS Glue components that belong to
17043
- # the workflow as nodes and directed connections between them as
17044
- # edges.
17184
+ # The graph representing all the Glue components that belong to the
17185
+ # workflow as nodes and directed connections between them as edges.
17045
17186
  # @return [Types::WorkflowGraph]
17046
17187
  #
17047
17188
  # @!attribute [rw] max_concurrent_runs
@@ -17068,12 +17209,12 @@ module Aws::Glue
17068
17209
  end
17069
17210
 
17070
17211
  # A workflow graph represents the complete workflow containing all the
17071
- # AWS Glue components present in the workflow and all the directed
17212
+ # Glue components present in the workflow and all the directed
17072
17213
  # connections between them.
17073
17214
  #
17074
17215
  # @!attribute [rw] nodes
17075
- # A list of the the AWS Glue components belong to the workflow
17076
- # represented as nodes.
17216
+ # A list of the Glue components that belong to the workflow represented
17217
+ # as nodes.
17077
17218
  # @return [Array<Types::Node>]
17078
17219
  #
17079
17220
  # @!attribute [rw] edges
@@ -17094,7 +17235,7 @@ module Aws::Glue
17094
17235
  # information.
17095
17236
  #
17096
17237
  # @!attribute [rw] name
17097
- # Name of the workflow that was executed.
17238
+ # Name of the workflow that was run.
17098
17239
  # @return [String]
17099
17240
  #
17100
17241
  # @!attribute [rw] workflow_run_id
@@ -17132,11 +17273,14 @@ module Aws::Glue
17132
17273
  # @return [Types::WorkflowRunStatistics]
17133
17274
  #
17134
17275
  # @!attribute [rw] graph
17135
- # The graph representing all the AWS Glue components that belong to
17136
- # the workflow as nodes and directed connections between them as
17137
- # edges.
17276
+ # The graph representing all the Glue components that belong to the
17277
+ # workflow as nodes and directed connections between them as edges.
17138
17278
  # @return [Types::WorkflowGraph]
17139
17279
  #
17280
+ # @!attribute [rw] starting_event_batch_condition
17281
+ # The batch condition that started the workflow run.
17282
+ # @return [Types::StartingEventBatchCondition]
17283
+ #
17140
17284
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/WorkflowRun AWS API Documentation
17141
17285
  #
17142
17286
  class WorkflowRun < Struct.new(
@@ -17149,7 +17293,8 @@ module Aws::Glue
17149
17293
  :status,
17150
17294
  :error_message,
17151
17295
  :statistics,
17152
- :graph)
17296
+ :graph,
17297
+ :starting_event_batch_condition)
17153
17298
  SENSITIVE = []
17154
17299
  include Aws::Structure
17155
17300
  end