aws-sdk-glue 1.30.0 → 1.31.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/aws-sdk-glue.rb +1 -1
- data/lib/aws-sdk-glue/client.rb +66 -40
- data/lib/aws-sdk-glue/client_api.rb +13 -1
- data/lib/aws-sdk-glue/types.rb +152 -98
- metadata +3 -3
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: a3ab46dc47fbdce4c17150278a67b3327e176412
|
4
|
+
data.tar.gz: 24e2830fd80a69476b8d18b0a897b44d4ae32807
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 1f5e3a7c53fdacfd78a80d0da29b1790a757a6abc305ee1db26df840e53aa23e4a4f71b0802aca31ed3fe26cbad565365cda01fc3695ed40a6fd35e8b71bcd02
|
7
|
+
data.tar.gz: 2c04a04f83c6517eab1ebc68e56619a4ccc29cd72a1bf124ed3fc8599a677316d0bd24abf48432cde65c89d495098fb950931d0f8afffa5321e0fe5545446dcb
|
data/lib/aws-sdk-glue.rb
CHANGED
data/lib/aws-sdk-glue/client.rb
CHANGED
@@ -552,7 +552,7 @@ module Aws::Glue
|
|
552
552
|
# permission conditions that uses tags.
|
553
553
|
#
|
554
554
|
# @option params [required, Array<String>] :crawler_names
|
555
|
-
# A list of crawler names, which
|
555
|
+
# A list of crawler names, which might be the names returned from the
|
556
556
|
# `ListCrawlers` operation.
|
557
557
|
#
|
558
558
|
# @return [Types::BatchGetCrawlersResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
@@ -582,6 +582,10 @@ module Aws::Glue
|
|
582
582
|
# resp.crawlers[0].targets.jdbc_targets[0].exclusions[0] #=> String
|
583
583
|
# resp.crawlers[0].targets.dynamo_db_targets #=> Array
|
584
584
|
# resp.crawlers[0].targets.dynamo_db_targets[0].path #=> String
|
585
|
+
# resp.crawlers[0].targets.catalog_targets #=> Array
|
586
|
+
# resp.crawlers[0].targets.catalog_targets[0].database_name #=> String
|
587
|
+
# resp.crawlers[0].targets.catalog_targets[0].tables #=> Array
|
588
|
+
# resp.crawlers[0].targets.catalog_targets[0].tables[0] #=> String
|
585
589
|
# resp.crawlers[0].database_name #=> String
|
586
590
|
# resp.crawlers[0].description #=> String
|
587
591
|
# resp.crawlers[0].classifiers #=> Array
|
@@ -914,7 +918,7 @@ module Aws::Glue
|
|
914
918
|
req.send_request(options)
|
915
919
|
end
|
916
920
|
|
917
|
-
# Creates a classifier in the user's account. This
|
921
|
+
# Creates a classifier in the user's account. This can be a
|
918
922
|
# `GrokClassifier`, an `XMLClassifier`, a `JsonClassifier`, or a
|
919
923
|
# `CsvClassifier`, depending on which field of the request is present.
|
920
924
|
#
|
@@ -1012,17 +1016,17 @@ module Aws::Glue
|
|
1012
1016
|
|
1013
1017
|
# Creates a new crawler with specified targets, role, configuration, and
|
1014
1018
|
# optional schedule. At least one crawl target must be specified, in the
|
1015
|
-
#
|
1019
|
+
# `s3Targets` field, the `jdbcTargets` field, or the `DynamoDBTargets`
|
1016
1020
|
# field.
|
1017
1021
|
#
|
1018
1022
|
# @option params [required, String] :name
|
1019
1023
|
# Name of the new crawler.
|
1020
1024
|
#
|
1021
1025
|
# @option params [required, String] :role
|
1022
|
-
# The IAM role
|
1023
|
-
# customer resources.
|
1026
|
+
# The IAM role or Amazon Resource Name (ARN) of an IAM role used by the
|
1027
|
+
# new crawler to access customer resources.
|
1024
1028
|
#
|
1025
|
-
# @option params [required, String] :database_name
|
1029
|
+
# @option params [String] :database_name
|
1026
1030
|
# The AWS Glue database where results are written, such as:
|
1027
1031
|
# `arn:aws:daylight:us-east-1::database/sometable/*`.
|
1028
1032
|
#
|
@@ -1033,9 +1037,10 @@ module Aws::Glue
|
|
1033
1037
|
# A list of collection of targets to crawl.
|
1034
1038
|
#
|
1035
1039
|
# @option params [String] :schedule
|
1036
|
-
# A `cron` expression used to specify the schedule
|
1037
|
-
# Schedules for Jobs and Crawlers][1]. For
|
1038
|
-
# every day at 12:15 UTC,
|
1040
|
+
# A `cron` expression used to specify the schedule. For more
|
1041
|
+
# information, see [Time-Based Schedules for Jobs and Crawlers][1]. For
|
1042
|
+
# example, to run something every day at 12:15 UTC, specify `cron(15 12
|
1043
|
+
# * * ? *)`.
|
1039
1044
|
#
|
1040
1045
|
#
|
1041
1046
|
#
|
@@ -1051,11 +1056,11 @@ module Aws::Glue
|
|
1051
1056
|
# The table prefix used for catalog tables that are created.
|
1052
1057
|
#
|
1053
1058
|
# @option params [Types::SchemaChangePolicy] :schema_change_policy
|
1054
|
-
#
|
1059
|
+
# The policy for the crawler's update and deletion behavior.
|
1055
1060
|
#
|
1056
1061
|
# @option params [String] :configuration
|
1057
|
-
#
|
1058
|
-
# users to specify aspects of a crawler's behavior. For more
|
1062
|
+
# The crawler configuration information. This versioned JSON string
|
1063
|
+
# allows users to specify aspects of a crawler's behavior. For more
|
1059
1064
|
# information, see [Configuring a Crawler][1].
|
1060
1065
|
#
|
1061
1066
|
#
|
@@ -1063,13 +1068,13 @@ module Aws::Glue
|
|
1063
1068
|
# [1]: http://docs.aws.amazon.com/glue/latest/dg/crawler-configuration.html
|
1064
1069
|
#
|
1065
1070
|
# @option params [String] :crawler_security_configuration
|
1066
|
-
# The name of the SecurityConfiguration structure to be used by this
|
1067
|
-
#
|
1071
|
+
# The name of the `SecurityConfiguration` structure to be used by this
|
1072
|
+
# crawler.
|
1068
1073
|
#
|
1069
1074
|
# @option params [Hash<String,String>] :tags
|
1070
|
-
# The tags to use with this crawler request. You
|
1071
|
-
# access to the crawler. For more information
|
1072
|
-
#
|
1075
|
+
# The tags to use with this crawler request. You can use tags to limit
|
1076
|
+
# access to the crawler. For more information, see [AWS Tags in AWS
|
1077
|
+
# Glue][1].
|
1073
1078
|
#
|
1074
1079
|
#
|
1075
1080
|
#
|
@@ -1082,7 +1087,7 @@ module Aws::Glue
|
|
1082
1087
|
# resp = client.create_crawler({
|
1083
1088
|
# name: "NameString", # required
|
1084
1089
|
# role: "Role", # required
|
1085
|
-
# database_name: "DatabaseName", # required
|
1090
|
+
# database_name: "DatabaseName",
|
1086
1091
|
# description: "DescriptionString",
|
1087
1092
|
# targets: { # required
|
1088
1093
|
# s3_targets: [
|
@@ -1103,6 +1108,12 @@ module Aws::Glue
|
|
1103
1108
|
# path: "Path",
|
1104
1109
|
# },
|
1105
1110
|
# ],
|
1111
|
+
# catalog_targets: [
|
1112
|
+
# {
|
1113
|
+
# database_name: "NameString", # required
|
1114
|
+
# tables: ["NameString"], # required
|
1115
|
+
# },
|
1116
|
+
# ],
|
1106
1117
|
# },
|
1107
1118
|
# schedule: "CronExpression",
|
1108
1119
|
# classifiers: ["NameString"],
|
@@ -1950,11 +1961,11 @@ module Aws::Glue
|
|
1950
1961
|
req.send_request(options)
|
1951
1962
|
end
|
1952
1963
|
|
1953
|
-
# Removes a specified crawler from the Data Catalog, unless the
|
1954
|
-
# state is `RUNNING`.
|
1964
|
+
# Removes a specified crawler from the AWS Glue Data Catalog, unless the
|
1965
|
+
# crawler state is `RUNNING`.
|
1955
1966
|
#
|
1956
1967
|
# @option params [required, String] :name
|
1957
|
-
#
|
1968
|
+
# The name of the crawler to remove.
|
1958
1969
|
#
|
1959
1970
|
# @return [Struct] Returns an empty {Seahorse::Client::Response response}.
|
1960
1971
|
#
|
@@ -2380,7 +2391,7 @@ module Aws::Glue
|
|
2380
2391
|
# Lists all classifier objects in the Data Catalog.
|
2381
2392
|
#
|
2382
2393
|
# @option params [Integer] :max_results
|
2383
|
-
#
|
2394
|
+
# The size of the list to return (optional).
|
2384
2395
|
#
|
2385
2396
|
# @option params [String] :next_token
|
2386
2397
|
# An optional continuation token.
|
@@ -2567,7 +2578,7 @@ module Aws::Glue
|
|
2567
2578
|
# Retrieves metadata for a specified crawler.
|
2568
2579
|
#
|
2569
2580
|
# @option params [required, String] :name
|
2570
|
-
#
|
2581
|
+
# The name of the crawler to retrieve metadata for.
|
2571
2582
|
#
|
2572
2583
|
# @return [Types::GetCrawlerResponse] Returns a {Seahorse::Client::Response response} object which responds to the following methods:
|
2573
2584
|
#
|
@@ -2594,6 +2605,10 @@ module Aws::Glue
|
|
2594
2605
|
# resp.crawler.targets.jdbc_targets[0].exclusions[0] #=> String
|
2595
2606
|
# resp.crawler.targets.dynamo_db_targets #=> Array
|
2596
2607
|
# resp.crawler.targets.dynamo_db_targets[0].path #=> String
|
2608
|
+
# resp.crawler.targets.catalog_targets #=> Array
|
2609
|
+
# resp.crawler.targets.catalog_targets[0].database_name #=> String
|
2610
|
+
# resp.crawler.targets.catalog_targets[0].tables #=> Array
|
2611
|
+
# resp.crawler.targets.catalog_targets[0].tables[0] #=> String
|
2597
2612
|
# resp.crawler.database_name #=> String
|
2598
2613
|
# resp.crawler.description #=> String
|
2599
2614
|
# resp.crawler.classifiers #=> Array
|
@@ -2708,6 +2723,10 @@ module Aws::Glue
|
|
2708
2723
|
# resp.crawlers[0].targets.jdbc_targets[0].exclusions[0] #=> String
|
2709
2724
|
# resp.crawlers[0].targets.dynamo_db_targets #=> Array
|
2710
2725
|
# resp.crawlers[0].targets.dynamo_db_targets[0].path #=> String
|
2726
|
+
# resp.crawlers[0].targets.catalog_targets #=> Array
|
2727
|
+
# resp.crawlers[0].targets.catalog_targets[0].database_name #=> String
|
2728
|
+
# resp.crawlers[0].targets.catalog_targets[0].tables #=> Array
|
2729
|
+
# resp.crawlers[0].targets.catalog_targets[0].tables[0] #=> String
|
2711
2730
|
# resp.crawlers[0].database_name #=> String
|
2712
2731
|
# resp.crawlers[0].description #=> String
|
2713
2732
|
# resp.crawlers[0].classifiers #=> Array
|
@@ -3591,7 +3610,7 @@ module Aws::Glue
|
|
3591
3610
|
# The target tables.
|
3592
3611
|
#
|
3593
3612
|
# @option params [Types::Location] :location
|
3594
|
-
#
|
3613
|
+
# The parameters for the mapping.
|
3595
3614
|
#
|
3596
3615
|
# @option params [String] :language
|
3597
3616
|
# The programming language of the code to perform the mapping.
|
@@ -5169,8 +5188,8 @@ module Aws::Glue
|
|
5169
5188
|
# Name of the new crawler.
|
5170
5189
|
#
|
5171
5190
|
# @option params [String] :role
|
5172
|
-
# The IAM role
|
5173
|
-
# customer resources.
|
5191
|
+
# The IAM role or Amazon Resource Name (ARN) of an IAM role that is used
|
5192
|
+
# by the new crawler to access customer resources.
|
5174
5193
|
#
|
5175
5194
|
# @option params [String] :database_name
|
5176
5195
|
# The AWS Glue database where results are stored, such as:
|
@@ -5183,9 +5202,10 @@ module Aws::Glue
|
|
5183
5202
|
# A list of targets to crawl.
|
5184
5203
|
#
|
5185
5204
|
# @option params [String] :schedule
|
5186
|
-
# A `cron` expression used to specify the schedule
|
5187
|
-
# Schedules for Jobs and Crawlers][1]. For
|
5188
|
-
# every day at 12:15 UTC,
|
5205
|
+
# A `cron` expression used to specify the schedule. For more
|
5206
|
+
# information, see [Time-Based Schedules for Jobs and Crawlers][1]. For
|
5207
|
+
# example, to run something every day at 12:15 UTC, specify `cron(15 12
|
5208
|
+
# * * ? *)`.
|
5189
5209
|
#
|
5190
5210
|
#
|
5191
5211
|
#
|
@@ -5201,11 +5221,11 @@ module Aws::Glue
|
|
5201
5221
|
# The table prefix used for catalog tables that are created.
|
5202
5222
|
#
|
5203
5223
|
# @option params [Types::SchemaChangePolicy] :schema_change_policy
|
5204
|
-
#
|
5224
|
+
# The policy for the crawler's update and deletion behavior.
|
5205
5225
|
#
|
5206
5226
|
# @option params [String] :configuration
|
5207
|
-
#
|
5208
|
-
# users to specify aspects of a crawler's behavior. For more
|
5227
|
+
# The crawler configuration information. This versioned JSON string
|
5228
|
+
# allows users to specify aspects of a crawler's behavior. For more
|
5209
5229
|
# information, see [Configuring a Crawler][1].
|
5210
5230
|
#
|
5211
5231
|
#
|
@@ -5213,8 +5233,8 @@ module Aws::Glue
|
|
5213
5233
|
# [1]: http://docs.aws.amazon.com/glue/latest/dg/crawler-configuration.html
|
5214
5234
|
#
|
5215
5235
|
# @option params [String] :crawler_security_configuration
|
5216
|
-
# The name of the SecurityConfiguration structure to be used by this
|
5217
|
-
#
|
5236
|
+
# The name of the `SecurityConfiguration` structure to be used by this
|
5237
|
+
# crawler.
|
5218
5238
|
#
|
5219
5239
|
# @return [Struct] Returns an empty {Seahorse::Client::Response response}.
|
5220
5240
|
#
|
@@ -5244,6 +5264,12 @@ module Aws::Glue
|
|
5244
5264
|
# path: "Path",
|
5245
5265
|
# },
|
5246
5266
|
# ],
|
5267
|
+
# catalog_targets: [
|
5268
|
+
# {
|
5269
|
+
# database_name: "NameString", # required
|
5270
|
+
# tables: ["NameString"], # required
|
5271
|
+
# },
|
5272
|
+
# ],
|
5247
5273
|
# },
|
5248
5274
|
# schedule: "CronExpression",
|
5249
5275
|
# classifiers: ["NameString"],
|
@@ -5268,13 +5294,13 @@ module Aws::Glue
|
|
5268
5294
|
# Updates the schedule of a crawler using a `cron` expression.
|
5269
5295
|
#
|
5270
5296
|
# @option params [required, String] :crawler_name
|
5271
|
-
#
|
5297
|
+
# The name of the crawler whose schedule to update.
|
5272
5298
|
#
|
5273
5299
|
# @option params [String] :schedule
|
5274
|
-
# The updated `cron` expression used to specify the schedule
|
5275
|
-
# [Time-Based Schedules for Jobs and Crawlers][1]. For
|
5276
|
-
# something every day at 12:15 UTC,
|
5277
|
-
# *)`.
|
5300
|
+
# The updated `cron` expression used to specify the schedule. For more
|
5301
|
+
# information, see [Time-Based Schedules for Jobs and Crawlers][1]. For
|
5302
|
+
# example, to run something every day at 12:15 UTC, specify `cron(15 12
|
5303
|
+
# * * ? *)`.
|
5278
5304
|
#
|
5279
5305
|
#
|
5280
5306
|
#
|
@@ -5776,7 +5802,7 @@ module Aws::Glue
|
|
5776
5802
|
params: params,
|
5777
5803
|
config: config)
|
5778
5804
|
context[:gem_name] = 'aws-sdk-glue'
|
5779
|
-
context[:gem_version] = '1.30.0'
|
5805
|
+
context[:gem_version] = '1.31.0'
|
5780
5806
|
Seahorse::Client::Request.new(handlers, context)
|
5781
5807
|
end
|
5782
5808
|
|
@@ -56,6 +56,9 @@ module Aws::Glue
|
|
56
56
|
CatalogEntry = Shapes::StructureShape.new(name: 'CatalogEntry')
|
57
57
|
CatalogIdString = Shapes::StringShape.new(name: 'CatalogIdString')
|
58
58
|
CatalogImportStatus = Shapes::StructureShape.new(name: 'CatalogImportStatus')
|
59
|
+
CatalogTablesList = Shapes::ListShape.new(name: 'CatalogTablesList')
|
60
|
+
CatalogTarget = Shapes::StructureShape.new(name: 'CatalogTarget')
|
61
|
+
CatalogTargetList = Shapes::ListShape.new(name: 'CatalogTargetList')
|
59
62
|
Classification = Shapes::StringShape.new(name: 'Classification')
|
60
63
|
Classifier = Shapes::StructureShape.new(name: 'Classifier')
|
61
64
|
ClassifierList = Shapes::ListShape.new(name: 'ClassifierList')
|
@@ -615,6 +618,14 @@ module Aws::Glue
|
|
615
618
|
CatalogImportStatus.add_member(:imported_by, Shapes::ShapeRef.new(shape: NameString, location_name: "ImportedBy"))
|
616
619
|
CatalogImportStatus.struct_class = Types::CatalogImportStatus
|
617
620
|
|
621
|
+
CatalogTablesList.member = Shapes::ShapeRef.new(shape: NameString)
|
622
|
+
|
623
|
+
CatalogTarget.add_member(:database_name, Shapes::ShapeRef.new(shape: NameString, required: true, location_name: "DatabaseName"))
|
624
|
+
CatalogTarget.add_member(:tables, Shapes::ShapeRef.new(shape: CatalogTablesList, required: true, location_name: "Tables"))
|
625
|
+
CatalogTarget.struct_class = Types::CatalogTarget
|
626
|
+
|
627
|
+
CatalogTargetList.member = Shapes::ShapeRef.new(shape: CatalogTarget)
|
628
|
+
|
618
629
|
Classifier.add_member(:grok_classifier, Shapes::ShapeRef.new(shape: GrokClassifier, location_name: "GrokClassifier"))
|
619
630
|
Classifier.add_member(:xml_classifier, Shapes::ShapeRef.new(shape: XMLClassifier, location_name: "XMLClassifier"))
|
620
631
|
Classifier.add_member(:json_classifier, Shapes::ShapeRef.new(shape: JsonClassifier, location_name: "JsonClassifier"))
|
@@ -732,6 +743,7 @@ module Aws::Glue
|
|
732
743
|
CrawlerTargets.add_member(:s3_targets, Shapes::ShapeRef.new(shape: S3TargetList, location_name: "S3Targets"))
|
733
744
|
CrawlerTargets.add_member(:jdbc_targets, Shapes::ShapeRef.new(shape: JdbcTargetList, location_name: "JdbcTargets"))
|
734
745
|
CrawlerTargets.add_member(:dynamo_db_targets, Shapes::ShapeRef.new(shape: DynamoDBTargetList, location_name: "DynamoDBTargets"))
|
746
|
+
CrawlerTargets.add_member(:catalog_targets, Shapes::ShapeRef.new(shape: CatalogTargetList, location_name: "CatalogTargets"))
|
735
747
|
CrawlerTargets.struct_class = Types::CrawlerTargets
|
736
748
|
|
737
749
|
CreateClassifierRequest.add_member(:grok_classifier, Shapes::ShapeRef.new(shape: CreateGrokClassifierRequest, location_name: "GrokClassifier"))
|
@@ -750,7 +762,7 @@ module Aws::Glue
|
|
750
762
|
|
751
763
|
CreateCrawlerRequest.add_member(:name, Shapes::ShapeRef.new(shape: NameString, required: true, location_name: "Name"))
|
752
764
|
CreateCrawlerRequest.add_member(:role, Shapes::ShapeRef.new(shape: Role, required: true, location_name: "Role"))
|
753
|
-
CreateCrawlerRequest.add_member(:database_name, Shapes::ShapeRef.new(shape: DatabaseName, required: true, location_name: "DatabaseName"))
|
765
|
+
CreateCrawlerRequest.add_member(:database_name, Shapes::ShapeRef.new(shape: DatabaseName, location_name: "DatabaseName"))
|
754
766
|
CreateCrawlerRequest.add_member(:description, Shapes::ShapeRef.new(shape: DescriptionString, location_name: "Description"))
|
755
767
|
CreateCrawlerRequest.add_member(:targets, Shapes::ShapeRef.new(shape: CrawlerTargets, required: true, location_name: "Targets"))
|
756
768
|
CreateCrawlerRequest.add_member(:schedule, Shapes::ShapeRef.new(shape: CronExpression, location_name: "Schedule"))
|
data/lib/aws-sdk-glue/types.rb
CHANGED
@@ -378,7 +378,7 @@ module Aws::Glue
|
|
378
378
|
# }
|
379
379
|
#
|
380
380
|
# @!attribute [rw] crawler_names
|
381
|
-
# A list of crawler names, which
|
381
|
+
# A list of crawler names, which might be the names returned from the
|
382
382
|
# `ListCrawlers` operation.
|
383
383
|
# @return [Array<String>]
|
384
384
|
#
|
@@ -394,7 +394,7 @@ module Aws::Glue
|
|
394
394
|
# @return [Array<Types::Crawler>]
|
395
395
|
#
|
396
396
|
# @!attribute [rw] crawlers_not_found
|
397
|
-
# A list of names of crawlers not found.
|
397
|
+
# A list of names of crawlers that were not found.
|
398
398
|
# @return [Array<String>]
|
399
399
|
#
|
400
400
|
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/BatchGetCrawlersResponse AWS API Documentation
|
@@ -653,7 +653,7 @@ module Aws::Glue
|
|
653
653
|
include Aws::Structure
|
654
654
|
end
|
655
655
|
|
656
|
-
# Specifies a table definition in the Data Catalog.
|
656
|
+
# Specifies a table definition in the AWS Glue Data Catalog.
|
657
657
|
#
|
658
658
|
# @note When making an API call, you may pass CatalogEntry
|
659
659
|
# data as a hash:
|
@@ -702,32 +702,58 @@ module Aws::Glue
|
|
702
702
|
include Aws::Structure
|
703
703
|
end
|
704
704
|
|
705
|
+
# Specifies an AWS Glue Data Catalog target.
|
706
|
+
#
|
707
|
+
# @note When making an API call, you may pass CatalogTarget
|
708
|
+
# data as a hash:
|
709
|
+
#
|
710
|
+
# {
|
711
|
+
# database_name: "NameString", # required
|
712
|
+
# tables: ["NameString"], # required
|
713
|
+
# }
|
714
|
+
#
|
715
|
+
# @!attribute [rw] database_name
|
716
|
+
# The name of the database to be synchronized.
|
717
|
+
# @return [String]
|
718
|
+
#
|
719
|
+
# @!attribute [rw] tables
|
720
|
+
# A list of the tables to be synchronized.
|
721
|
+
# @return [Array<String>]
|
722
|
+
#
|
723
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/CatalogTarget AWS API Documentation
|
724
|
+
#
|
725
|
+
class CatalogTarget < Struct.new(
|
726
|
+
:database_name,
|
727
|
+
:tables)
|
728
|
+
include Aws::Structure
|
729
|
+
end
|
730
|
+
|
705
731
|
# Classifiers are triggered during a crawl task. A classifier checks
|
706
|
-
# whether a given file is in a format it can handle
|
732
|
+
# whether a given file is in a format it can handle. If it is, the
|
707
733
|
# classifier creates a schema in the form of a `StructType` object that
|
708
734
|
# matches that data format.
|
709
735
|
#
|
710
|
-
# You can use the standard classifiers that AWS Glue
|
736
|
+
# You can use the standard classifiers that AWS Glue provides, or you
|
711
737
|
# can write your own classifiers to best categorize your data sources
|
712
738
|
# and specify the appropriate schemas to use for them. A classifier can
|
713
739
|
# be a `grok` classifier, an `XML` classifier, a `JSON` classifier, or a
|
714
|
-
# custom `CSV` classifier as specified in one of the fields in the
|
740
|
+
# custom `CSV` classifier, as specified in one of the fields in the
|
715
741
|
# `Classifier` object.
|
716
742
|
#
|
717
743
|
# @!attribute [rw] grok_classifier
|
718
|
-
# A `
|
744
|
+
# A classifier that uses `grok`.
|
719
745
|
# @return [Types::GrokClassifier]
|
720
746
|
#
|
721
747
|
# @!attribute [rw] xml_classifier
|
722
|
-
#
|
748
|
+
# A classifier for XML content.
|
723
749
|
# @return [Types::XMLClassifier]
|
724
750
|
#
|
725
751
|
# @!attribute [rw] json_classifier
|
726
|
-
# A
|
752
|
+
# A classifier for JSON content.
|
727
753
|
# @return [Types::JsonClassifier]
|
728
754
|
#
|
729
755
|
# @!attribute [rw] csv_classifier
|
730
|
-
# A
|
756
|
+
# A classifier for comma-separated values (CSV).
|
731
757
|
# @return [Types::CsvClassifier]
|
732
758
|
#
|
733
759
|
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/Classifier AWS API Documentation
|
@@ -821,7 +847,7 @@ module Aws::Glue
|
|
821
847
|
# @return [String]
|
822
848
|
#
|
823
849
|
# @!attribute [rw] node_type
|
824
|
-
# The type of node this is.
|
850
|
+
# The type of node that this is.
|
825
851
|
# @return [String]
|
826
852
|
#
|
827
853
|
# @!attribute [rw] args
|
@@ -1169,12 +1195,13 @@ module Aws::Glue
|
|
1169
1195
|
# Catalog.
|
1170
1196
|
#
|
1171
1197
|
# @!attribute [rw] name
|
1172
|
-
# The crawler
|
1198
|
+
# The name of the crawler.
|
1173
1199
|
# @return [String]
|
1174
1200
|
#
|
1175
1201
|
# @!attribute [rw] role
|
1176
|
-
# The
|
1177
|
-
# resources, such as
|
1202
|
+
# The Amazon Resource Name (ARN) of an IAM role that's used to access
|
1203
|
+
# customer resources, such as Amazon Simple Storage Service (Amazon
|
1204
|
+
# S3) data.
|
1178
1205
|
# @return [String]
|
1179
1206
|
#
|
1180
1207
|
# @!attribute [rw] targets
|
@@ -1182,7 +1209,7 @@ module Aws::Glue
|
|
1182
1209
|
# @return [Types::CrawlerTargets]
|
1183
1210
|
#
|
1184
1211
|
# @!attribute [rw] database_name
|
1185
|
-
# The database
|
1212
|
+
# The name of the database in which the crawler's output is stored.
|
1186
1213
|
# @return [String]
|
1187
1214
|
#
|
1188
1215
|
# @!attribute [rw] description
|
@@ -1190,12 +1217,13 @@ module Aws::Glue
|
|
1190
1217
|
# @return [String]
|
1191
1218
|
#
|
1192
1219
|
# @!attribute [rw] classifiers
|
1193
|
-
# A list of
|
1220
|
+
# A list of UTF-8 strings that specify the custom classifiers that are
|
1221
|
+
# associated with the crawler.
|
1194
1222
|
# @return [Array<String>]
|
1195
1223
|
#
|
1196
1224
|
# @!attribute [rw] schema_change_policy
|
1197
|
-
#
|
1198
|
-
#
|
1225
|
+
# The policy that specifies update and delete behaviors for the
|
1226
|
+
# crawler.
|
1199
1227
|
# @return [Types::SchemaChangePolicy]
|
1200
1228
|
#
|
1201
1229
|
# @!attribute [rw] state
|
@@ -1217,11 +1245,11 @@ module Aws::Glue
|
|
1217
1245
|
# @return [Integer]
|
1218
1246
|
#
|
1219
1247
|
# @!attribute [rw] creation_time
|
1220
|
-
# The time
|
1248
|
+
# The time that the crawler was created.
|
1221
1249
|
# @return [Time]
|
1222
1250
|
#
|
1223
1251
|
# @!attribute [rw] last_updated
|
1224
|
-
# The time the crawler was last updated.
|
1252
|
+
# The time that the crawler was last updated.
|
1225
1253
|
# @return [Time]
|
1226
1254
|
#
|
1227
1255
|
# @!attribute [rw] last_crawl
|
@@ -1244,8 +1272,8 @@ module Aws::Glue
|
|
1244
1272
|
# @return [String]
|
1245
1273
|
#
|
1246
1274
|
# @!attribute [rw] crawler_security_configuration
|
1247
|
-
# The name of the SecurityConfiguration structure to be used by this
|
1248
|
-
#
|
1275
|
+
# The name of the `SecurityConfiguration` structure to be used by this
|
1276
|
+
# crawler.
|
1249
1277
|
# @return [String]
|
1250
1278
|
#
|
1251
1279
|
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/Crawler AWS API Documentation
|
@@ -1344,10 +1372,16 @@ module Aws::Glue
|
|
1344
1372
|
# path: "Path",
|
1345
1373
|
# },
|
1346
1374
|
# ],
|
1375
|
+
# catalog_targets: [
|
1376
|
+
# {
|
1377
|
+
# database_name: "NameString", # required
|
1378
|
+
# tables: ["NameString"], # required
|
1379
|
+
# },
|
1380
|
+
# ],
|
1347
1381
|
# }
|
1348
1382
|
#
|
1349
1383
|
# @!attribute [rw] s3_targets
|
1350
|
-
# Specifies Amazon S3 targets.
|
1384
|
+
# Specifies Amazon Simple Storage Service (Amazon S3) targets.
|
1351
1385
|
# @return [Array<Types::S3Target>]
|
1352
1386
|
#
|
1353
1387
|
# @!attribute [rw] jdbc_targets
|
@@ -1355,15 +1389,20 @@ module Aws::Glue
|
|
1355
1389
|
# @return [Array<Types::JdbcTarget>]
|
1356
1390
|
#
|
1357
1391
|
# @!attribute [rw] dynamo_db_targets
|
1358
|
-
# Specifies DynamoDB targets.
|
1392
|
+
# Specifies Amazon DynamoDB targets.
|
1359
1393
|
# @return [Array<Types::DynamoDBTarget>]
|
1360
1394
|
#
|
1395
|
+
# @!attribute [rw] catalog_targets
|
1396
|
+
# Specifies AWS Glue Data Catalog targets.
|
1397
|
+
# @return [Array<Types::CatalogTarget>]
|
1398
|
+
#
|
1361
1399
|
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/CrawlerTargets AWS API Documentation
|
1362
1400
|
#
|
1363
1401
|
class CrawlerTargets < Struct.new(
|
1364
1402
|
:s3_targets,
|
1365
1403
|
:jdbc_targets,
|
1366
|
-
:dynamo_db_targets)
|
1404
|
+
:dynamo_db_targets,
|
1405
|
+
:catalog_targets)
|
1367
1406
|
include Aws::Structure
|
1368
1407
|
end
|
1369
1408
|
|
@@ -1475,7 +1514,7 @@ module Aws::Glue
|
|
1475
1514
|
# {
|
1476
1515
|
# name: "NameString", # required
|
1477
1516
|
# role: "Role", # required
|
1478
|
-
# database_name: "DatabaseName", # required
|
1517
|
+
# database_name: "DatabaseName",
|
1479
1518
|
# description: "DescriptionString",
|
1480
1519
|
# targets: { # required
|
1481
1520
|
# s3_targets: [
|
@@ -1496,6 +1535,12 @@ module Aws::Glue
|
|
1496
1535
|
# path: "Path",
|
1497
1536
|
# },
|
1498
1537
|
# ],
|
1538
|
+
# catalog_targets: [
|
1539
|
+
# {
|
1540
|
+
# database_name: "NameString", # required
|
1541
|
+
# tables: ["NameString"], # required
|
1542
|
+
# },
|
1543
|
+
# ],
|
1499
1544
|
# },
|
1500
1545
|
# schedule: "CronExpression",
|
1501
1546
|
# classifiers: ["NameString"],
|
@@ -1516,8 +1561,8 @@ module Aws::Glue
|
|
1516
1561
|
# @return [String]
|
1517
1562
|
#
|
1518
1563
|
# @!attribute [rw] role
|
1519
|
-
# The IAM role
|
1520
|
-
# access customer resources.
|
1564
|
+
# The IAM role or Amazon Resource Name (ARN) of an IAM role used by
|
1565
|
+
# the new crawler to access customer resources.
|
1521
1566
|
# @return [String]
|
1522
1567
|
#
|
1523
1568
|
# @!attribute [rw] database_name
|
@@ -1534,9 +1579,10 @@ module Aws::Glue
|
|
1534
1579
|
# @return [Types::CrawlerTargets]
|
1535
1580
|
#
|
1536
1581
|
# @!attribute [rw] schedule
|
1537
|
-
# A `cron` expression used to specify the schedule
|
1538
|
-
# Schedules for Jobs and Crawlers][1].
|
1539
|
-
# every day at 12:15 UTC,
|
1582
|
+
# A `cron` expression used to specify the schedule. For more
|
1583
|
+
# information, see [Time-Based Schedules for Jobs and Crawlers][1].
|
1584
|
+
# For example, to run something every day at 12:15 UTC, specify
|
1585
|
+
# `cron(15 12 * * ? *)`.
|
1540
1586
|
#
|
1541
1587
|
#
|
1542
1588
|
#
|
@@ -1555,12 +1601,12 @@ module Aws::Glue
|
|
1555
1601
|
# @return [String]
|
1556
1602
|
#
|
1557
1603
|
# @!attribute [rw] schema_change_policy
|
1558
|
-
#
|
1604
|
+
# The policy for the crawler's update and deletion behavior.
|
1559
1605
|
# @return [Types::SchemaChangePolicy]
|
1560
1606
|
#
|
1561
1607
|
# @!attribute [rw] configuration
|
1562
|
-
#
|
1563
|
-
# users to specify aspects of a crawler's behavior. For more
|
1608
|
+
# The crawler configuration information. This versioned JSON string
|
1609
|
+
# allows users to specify aspects of a crawler's behavior. For more
|
1564
1610
|
# information, see [Configuring a Crawler][1].
|
1565
1611
|
#
|
1566
1612
|
#
|
@@ -1569,14 +1615,14 @@ module Aws::Glue
|
|
1569
1615
|
# @return [String]
|
1570
1616
|
#
|
1571
1617
|
# @!attribute [rw] crawler_security_configuration
|
1572
|
-
# The name of the SecurityConfiguration structure to be used by this
|
1573
|
-
#
|
1618
|
+
# The name of the `SecurityConfiguration` structure to be used by this
|
1619
|
+
# crawler.
|
1574
1620
|
# @return [String]
|
1575
1621
|
#
|
1576
1622
|
# @!attribute [rw] tags
|
1577
|
-
# The tags to use with this crawler request. You
|
1578
|
-
# access to the crawler. For more information
|
1579
|
-
#
|
1623
|
+
# The tags to use with this crawler request. You can use tags to limit
|
1624
|
+
# access to the crawler. For more information, see [AWS Tags in AWS
|
1625
|
+
# Glue][1].
|
1580
1626
|
#
|
1581
1627
|
#
|
1582
1628
|
#
|
@@ -2179,7 +2225,7 @@ module Aws::Glue
|
|
2179
2225
|
#
|
2180
2226
|
# @!attribute [rw] json_path
|
2181
2227
|
# A `JsonPath` string defining the JSON data for the classifier to
|
2182
|
-
# classify. AWS Glue supports a subset of JsonPath
|
2228
|
+
# classify. AWS Glue supports a subset of `JsonPath`, as described in
|
2183
2229
|
# [Writing JsonPath Custom Classifiers][1].
|
2184
2230
|
#
|
2185
2231
|
#
|
@@ -2679,11 +2725,11 @@ module Aws::Glue
|
|
2679
2725
|
#
|
2680
2726
|
# @!attribute [rw] row_tag
|
2681
2727
|
# The XML tag designating the element that contains each record in an
|
2682
|
-
# XML document being parsed.
|
2683
|
-
#
|
2684
|
-
#
|
2685
|
-
#
|
2686
|
-
#
|
2728
|
+
# XML document being parsed. This can't identify a self-closing
|
2729
|
+
# element (closed by `/>`). An empty row element that contains only
|
2730
|
+
# attributes can be parsed as long as it ends with a closing tag (for
|
2731
|
+
# example, `<row item_a="A" item_b="B"></row>` is okay, but `<row
|
2732
|
+
# item_a="A" item_b="B" />` is not).
|
2687
2733
|
# @return [String]
|
2688
2734
|
#
|
2689
2735
|
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/CreateXMLClassifierRequest AWS API Documentation
|
@@ -2702,11 +2748,11 @@ module Aws::Glue
|
|
2702
2748
|
# @return [String]
|
2703
2749
|
#
|
2704
2750
|
# @!attribute [rw] creation_time
|
2705
|
-
# The time this classifier was registered.
|
2751
|
+
# The time that this classifier was registered.
|
2706
2752
|
# @return [Time]
|
2707
2753
|
#
|
2708
2754
|
# @!attribute [rw] last_updated
|
2709
|
-
# The time this classifier was last updated.
|
2755
|
+
# The time that this classifier was last updated.
|
2710
2756
|
# @return [Time]
|
2711
2757
|
#
|
2712
2758
|
# @!attribute [rw] version
|
@@ -2720,7 +2766,7 @@ module Aws::Glue
|
|
2720
2766
|
#
|
2721
2767
|
# @!attribute [rw] quote_symbol
|
2722
2768
|
# A custom symbol to denote what combines content into a single column
|
2723
|
-
# value.
|
2769
|
+
# value. It must be different from the column delimiter.
|
2724
2770
|
# @return [String]
|
2725
2771
|
#
|
2726
2772
|
# @!attribute [rw] contains_header
|
@@ -2733,7 +2779,7 @@ module Aws::Glue
|
|
2733
2779
|
#
|
2734
2780
|
# @!attribute [rw] disable_value_trimming
|
2735
2781
|
# Specifies not to trim values before identifying the type of column
|
2736
|
-
# values. The default value is true
|
2782
|
+
# values. The default value is `true`.
|
2737
2783
|
# @return [Boolean]
|
2738
2784
|
#
|
2739
2785
|
# @!attribute [rw] allow_single_column
|
@@ -2930,7 +2976,7 @@ module Aws::Glue
|
|
2930
2976
|
# }
|
2931
2977
|
#
|
2932
2978
|
# @!attribute [rw] name
|
2933
|
-
#
|
2979
|
+
# The name of the crawler to remove.
|
2934
2980
|
# @return [String]
|
2935
2981
|
#
|
2936
2982
|
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/DeleteCrawlerRequest AWS API Documentation
|
@@ -3452,7 +3498,7 @@ module Aws::Glue
|
|
3452
3498
|
include Aws::Structure
|
3453
3499
|
end
|
3454
3500
|
|
3455
|
-
# Specifies
|
3501
|
+
# Specifies an Amazon DynamoDB table to crawl.
|
3456
3502
|
#
|
3457
3503
|
# @note When making an API call, you may pass DynamoDBTarget
|
3458
3504
|
# data as a hash:
|
@@ -3649,7 +3695,7 @@ module Aws::Glue
|
|
3649
3695
|
# }
|
3650
3696
|
#
|
3651
3697
|
# @!attribute [rw] max_results
|
3652
|
-
#
|
3698
|
+
# The size of the list to return (optional).
|
3653
3699
|
# @return [Integer]
|
3654
3700
|
#
|
3655
3701
|
# @!attribute [rw] next_token
|
@@ -3879,7 +3925,7 @@ module Aws::Glue
|
|
3879
3925
|
# }
|
3880
3926
|
#
|
3881
3927
|
# @!attribute [rw] name
|
3882
|
-
#
|
3928
|
+
# The name of the crawler to retrieve metadata for.
|
3883
3929
|
# @return [String]
|
3884
3930
|
#
|
3885
3931
|
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/GetCrawlerRequest AWS API Documentation
|
@@ -4668,7 +4714,7 @@ module Aws::Glue
|
|
4668
4714
|
# @return [Array<Types::CatalogEntry>]
|
4669
4715
|
#
|
4670
4716
|
# @!attribute [rw] location
|
4671
|
-
#
|
4717
|
+
# The parameters for the mapping.
|
4672
4718
|
# @return [Types::Location]
|
4673
4719
|
#
|
4674
4720
|
# @!attribute [rw] language
|
@@ -4691,7 +4737,7 @@ module Aws::Glue
|
|
4691
4737
|
# @return [String]
|
4692
4738
|
#
|
4693
4739
|
# @!attribute [rw] scala_code
|
4694
|
-
# Scala code to perform the mapping.
|
4740
|
+
# The Scala code to perform the mapping.
|
4695
4741
|
# @return [String]
|
4696
4742
|
#
|
4697
4743
|
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/GetPlanResponse AWS API Documentation
|
@@ -5247,11 +5293,11 @@ module Aws::Glue
|
|
5247
5293
|
# @return [String]
|
5248
5294
|
#
|
5249
5295
|
# @!attribute [rw] creation_time
|
5250
|
-
# The time this classifier was registered.
|
5296
|
+
# The time that this classifier was registered.
|
5251
5297
|
# @return [Time]
|
5252
5298
|
#
|
5253
5299
|
# @!attribute [rw] last_updated
|
5254
|
-
# The time this classifier was last updated.
|
5300
|
+
# The time that this classifier was last updated.
|
5255
5301
|
# @return [Time]
|
5256
5302
|
#
|
5257
5303
|
# @!attribute [rw] version
|
@@ -5261,7 +5307,7 @@ module Aws::Glue
|
|
5261
5307
|
# @!attribute [rw] grok_pattern
|
5262
5308
|
# The grok pattern applied to a data store by this classifier. For
|
5263
5309
|
# more information, see built-in patterns in [Writing Custom
|
5264
|
-
#
|
5310
|
+
# Classifiers][1].
|
5265
5311
|
#
|
5266
5312
|
#
|
5267
5313
|
#
|
@@ -5270,7 +5316,7 @@ module Aws::Glue
|
|
5270
5316
|
#
|
5271
5317
|
# @!attribute [rw] custom_patterns
|
5272
5318
|
# Optional custom grok patterns defined by this classifier. For more
|
5273
|
-
# information, see custom patterns in [Writing Custom
|
5319
|
+
# information, see custom patterns in [Writing Custom Classifiers][1].
|
5274
5320
|
#
|
5275
5321
|
#
|
5276
5322
|
#
|
@@ -5982,11 +6028,11 @@ module Aws::Glue
|
|
5982
6028
|
# @return [String]
|
5983
6029
|
#
|
5984
6030
|
# @!attribute [rw] creation_time
|
5985
|
-
# The time this classifier was registered.
|
6031
|
+
# The time that this classifier was registered.
|
5986
6032
|
# @return [Time]
|
5987
6033
|
#
|
5988
6034
|
# @!attribute [rw] last_updated
|
5989
|
-
# The time this classifier was last updated.
|
6035
|
+
# The time that this classifier was last updated.
|
5990
6036
|
# @return [Time]
|
5991
6037
|
#
|
5992
6038
|
# @!attribute [rw] version
|
@@ -5995,7 +6041,7 @@ module Aws::Glue
|
|
5995
6041
|
#
|
5996
6042
|
# @!attribute [rw] json_path
|
5997
6043
|
# A `JsonPath` string defining the JSON data for the classifier to
|
5998
|
-
# classify. AWS Glue supports a subset of JsonPath
|
6044
|
+
# classify. AWS Glue supports a subset of `JsonPath`, as described in
|
5999
6045
|
# [Writing JsonPath Custom Classifiers][1].
|
6000
6046
|
#
|
6001
6047
|
#
|
@@ -6294,11 +6340,11 @@ module Aws::Glue
|
|
6294
6340
|
# @return [Array<Types::CodeGenNodeArg>]
|
6295
6341
|
#
|
6296
6342
|
# @!attribute [rw] s3
|
6297
|
-
# An Amazon S3 location.
|
6343
|
+
# An Amazon Simple Storage Service (Amazon S3) location.
|
6298
6344
|
# @return [Array<Types::CodeGenNodeArg>]
|
6299
6345
|
#
|
6300
6346
|
# @!attribute [rw] dynamo_db
|
6301
|
-
#
|
6347
|
+
# An Amazon DynamoDB table location.
|
6302
6348
|
# @return [Array<Types::CodeGenNodeArg>]
|
6303
6349
|
#
|
6304
6350
|
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/Location AWS API Documentation
|
@@ -6839,7 +6885,7 @@ module Aws::Glue
|
|
6839
6885
|
include Aws::Structure
|
6840
6886
|
end
|
6841
6887
|
|
6842
|
-
# Specifies a data store in Amazon S3.
|
6888
|
+
# Specifies a data store in Amazon Simple Storage Service (Amazon S3).
|
6843
6889
|
#
|
6844
6890
|
# @note When making an API call, you may pass S3Target
|
6845
6891
|
# data as a hash:
|
@@ -6873,9 +6919,10 @@ module Aws::Glue
|
|
6873
6919
|
# A scheduling object using a `cron` statement to schedule an event.
|
6874
6920
|
#
|
6875
6921
|
# @!attribute [rw] schedule_expression
|
6876
|
-
# A `cron` expression used to specify the schedule
|
6877
|
-
# Schedules for Jobs and Crawlers][1].
|
6878
|
-
# every day at 12:15 UTC,
|
6922
|
+
# A `cron` expression used to specify the schedule. For more
|
6923
|
+
# information, see [Time-Based Schedules for Jobs and Crawlers][1].
|
6924
|
+
# For example, to run something every day at 12:15 UTC, specify
|
6925
|
+
# `cron(15 12 * * ? *)`.
|
6879
6926
|
#
|
6880
6927
|
#
|
6881
6928
|
#
|
@@ -6894,7 +6941,7 @@ module Aws::Glue
|
|
6894
6941
|
include Aws::Structure
|
6895
6942
|
end
|
6896
6943
|
|
6897
|
-
#
|
6944
|
+
# A policy that specifies update and deletion behaviors for the crawler.
|
6898
6945
|
#
|
6899
6946
|
# @note When making an API call, you may pass SchemaChangePolicy
|
6900
6947
|
# data as a hash:
|
@@ -8098,6 +8145,12 @@ module Aws::Glue
|
|
8098
8145
|
# path: "Path",
|
8099
8146
|
# },
|
8100
8147
|
# ],
|
8148
|
+
# catalog_targets: [
|
8149
|
+
# {
|
8150
|
+
# database_name: "NameString", # required
|
8151
|
+
# tables: ["NameString"], # required
|
8152
|
+
# },
|
8153
|
+
# ],
|
8101
8154
|
# },
|
8102
8155
|
# schedule: "CronExpression",
|
8103
8156
|
# classifiers: ["NameString"],
|
@@ -8115,8 +8168,8 @@ module Aws::Glue
|
|
8115
8168
|
# @return [String]
|
8116
8169
|
#
|
8117
8170
|
# @!attribute [rw] role
|
8118
|
-
# The IAM role
|
8119
|
-
# access customer resources.
|
8171
|
+
# The IAM role or Amazon Resource Name (ARN) of an IAM role that is
|
8172
|
+
# used by the new crawler to access customer resources.
|
8120
8173
|
# @return [String]
|
8121
8174
|
#
|
8122
8175
|
# @!attribute [rw] database_name
|
@@ -8133,9 +8186,10 @@ module Aws::Glue
|
|
8133
8186
|
# @return [Types::CrawlerTargets]
|
8134
8187
|
#
|
8135
8188
|
# @!attribute [rw] schedule
|
8136
|
-
# A `cron` expression used to specify the schedule
|
8137
|
-
# Schedules for Jobs and Crawlers][1].
|
8138
|
-
# every day at 12:15 UTC,
|
8189
|
+
# A `cron` expression used to specify the schedule. For more
|
8190
|
+
# information, see [Time-Based Schedules for Jobs and Crawlers][1].
|
8191
|
+
# For example, to run something every day at 12:15 UTC, specify
|
8192
|
+
# `cron(15 12 * * ? *)`.
|
8139
8193
|
#
|
8140
8194
|
#
|
8141
8195
|
#
|
@@ -8154,12 +8208,12 @@ module Aws::Glue
|
|
8154
8208
|
# @return [String]
|
8155
8209
|
#
|
8156
8210
|
# @!attribute [rw] schema_change_policy
|
8157
|
-
#
|
8211
|
+
# The policy for the crawler's update and deletion behavior.
|
8158
8212
|
# @return [Types::SchemaChangePolicy]
|
8159
8213
|
#
|
8160
8214
|
# @!attribute [rw] configuration
|
8161
|
-
#
|
8162
|
-
# users to specify aspects of a crawler's behavior. For more
|
8215
|
+
# The crawler configuration information. This versioned JSON string
|
8216
|
+
# allows users to specify aspects of a crawler's behavior. For more
|
8163
8217
|
# information, see [Configuring a Crawler][1].
|
8164
8218
|
#
|
8165
8219
|
#
|
@@ -8168,8 +8222,8 @@ module Aws::Glue
|
|
8168
8222
|
# @return [String]
|
8169
8223
|
#
|
8170
8224
|
# @!attribute [rw] crawler_security_configuration
|
8171
|
-
# The name of the SecurityConfiguration structure to be used by this
|
8172
|
-
#
|
8225
|
+
# The name of the `SecurityConfiguration` structure to be used by this
|
8226
|
+
# crawler.
|
8173
8227
|
# @return [String]
|
8174
8228
|
#
|
8175
8229
|
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/UpdateCrawlerRequest AWS API Documentation
|
@@ -8202,14 +8256,14 @@ module Aws::Glue
|
|
8202
8256
|
# }
|
8203
8257
|
#
|
8204
8258
|
# @!attribute [rw] crawler_name
|
8205
|
-
#
|
8259
|
+
# The name of the crawler whose schedule to update.
|
8206
8260
|
# @return [String]
|
8207
8261
|
#
|
8208
8262
|
# @!attribute [rw] schedule
|
8209
|
-
# The updated `cron` expression used to specify the schedule
|
8210
|
-
# [Time-Based Schedules for Jobs and Crawlers][1].
|
8211
|
-
# something every day at 12:15 UTC,
|
8212
|
-
# ? *)`.
|
8263
|
+
# The updated `cron` expression used to specify the schedule. For more
|
8264
|
+
# information, see [Time-Based Schedules for Jobs and Crawlers][1].
|
8265
|
+
# For example, to run something every day at 12:15 UTC, specify
|
8266
|
+
# `cron(15 12 * * ? *)`.
|
8213
8267
|
#
|
8214
8268
|
#
|
8215
8269
|
#
|
@@ -8254,7 +8308,7 @@ module Aws::Glue
|
|
8254
8308
|
#
|
8255
8309
|
# @!attribute [rw] quote_symbol
|
8256
8310
|
# A custom symbol to denote what combines content into a single column
|
8257
|
-
# value.
|
8311
|
+
# value. It must be different from the column delimiter.
|
8258
8312
|
# @return [String]
|
8259
8313
|
#
|
8260
8314
|
# @!attribute [rw] contains_header
|
@@ -8521,7 +8575,7 @@ module Aws::Glue
|
|
8521
8575
|
#
|
8522
8576
|
# @!attribute [rw] json_path
|
8523
8577
|
# A `JsonPath` string defining the JSON data for the classifier to
|
8524
|
-
# classify. AWS Glue supports a subset of JsonPath
|
8578
|
+
# classify. AWS Glue supports a subset of `JsonPath`, as described in
|
8525
8579
|
# [Writing JsonPath Custom Classifiers][1].
|
8526
8580
|
#
|
8527
8581
|
#
|
@@ -8872,11 +8926,11 @@ module Aws::Glue
|
|
8872
8926
|
#
|
8873
8927
|
# @!attribute [rw] row_tag
|
8874
8928
|
# The XML tag designating the element that contains each record in an
|
8875
|
-
# XML document being parsed.
|
8876
|
-
#
|
8877
|
-
#
|
8878
|
-
#
|
8879
|
-
#
|
8929
|
+
# XML document being parsed. This cannot identify a self-closing
|
8930
|
+
# element (closed by `/>`). An empty row element that contains only
|
8931
|
+
# attributes can be parsed as long as it ends with a closing tag (for
|
8932
|
+
# example, `<row item_a="A" item_b="B"></row>` is okay, but `<row
|
8933
|
+
# item_a="A" item_b="B" />` is not).
|
8880
8934
|
# @return [String]
|
8881
8935
|
#
|
8882
8936
|
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/UpdateXMLClassifierRequest AWS API Documentation
|
@@ -8987,11 +9041,11 @@ module Aws::Glue
|
|
8987
9041
|
# @return [String]
|
8988
9042
|
#
|
8989
9043
|
# @!attribute [rw] creation_time
|
8990
|
-
# The time this classifier was registered.
|
9044
|
+
# The time that this classifier was registered.
|
8991
9045
|
# @return [Time]
|
8992
9046
|
#
|
8993
9047
|
# @!attribute [rw] last_updated
|
8994
|
-
# The time this classifier was last updated.
|
9048
|
+
# The time that this classifier was last updated.
|
8995
9049
|
# @return [Time]
|
8996
9050
|
#
|
8997
9051
|
# @!attribute [rw] version
|
@@ -9000,11 +9054,11 @@ module Aws::Glue
|
|
9000
9054
|
#
|
9001
9055
|
# @!attribute [rw] row_tag
|
9002
9056
|
# The XML tag designating the element that contains each record in an
|
9003
|
-
# XML document being parsed.
|
9004
|
-
#
|
9005
|
-
#
|
9006
|
-
#
|
9007
|
-
#
|
9057
|
+
# XML document being parsed. This can't identify a self-closing
|
9058
|
+
# element (closed by `/>`). An empty row element that contains only
|
9059
|
+
# attributes can be parsed as long as it ends with a closing tag (for
|
9060
|
+
# example, `<row item_a="A" item_b="B"></row>` is okay, but `<row
|
9061
|
+
# item_a="A" item_b="B" />` is not).
|
9008
9062
|
# @return [String]
|
9009
9063
|
#
|
9010
9064
|
# @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/XMLClassifier AWS API Documentation
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: aws-sdk-glue
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.30.0
|
4
|
+
version: 1.31.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Amazon Web Services
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2019-
|
11
|
+
date: 2019-05-10 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: aws-sdk-core
|
@@ -59,7 +59,7 @@ files:
|
|
59
59
|
- lib/aws-sdk-glue/errors.rb
|
60
60
|
- lib/aws-sdk-glue/resource.rb
|
61
61
|
- lib/aws-sdk-glue/types.rb
|
62
|
-
homepage:
|
62
|
+
homepage: https://github.com/aws/aws-sdk-ruby
|
63
63
|
licenses:
|
64
64
|
- Apache-2.0
|
65
65
|
metadata:
|