aws-sdk-gluedatabrew 1.15.0 → 1.19.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/CHANGELOG.md +20 -0
- data/VERSION +1 -1
- data/lib/aws-sdk-gluedatabrew/client.rb +404 -9
- data/lib/aws-sdk-gluedatabrew/client_api.rb +207 -1
- data/lib/aws-sdk-gluedatabrew/types.rb +845 -22
- data/lib/aws-sdk-gluedatabrew.rb +1 -1
- metadata +4 -4
@@ -23,6 +23,30 @@ module Aws::GlueDataBrew
|
|
23
23
|
include Aws::Structure
|
24
24
|
end
|
25
25
|
|
26
|
+
# Configuration of statistics that are allowed to be run on columns that
|
27
|
+
# contain detected entities. When undefined, no statistics will be
|
28
|
+
# computed on columns that contain detected entities.
|
29
|
+
#
|
30
|
+
# @note When making an API call, you may pass AllowedStatistics
|
31
|
+
# data as a hash:
|
32
|
+
#
|
33
|
+
# {
|
34
|
+
# statistics: ["Statistic"], # required
|
35
|
+
# }
|
36
|
+
#
|
37
|
+
# @!attribute [rw] statistics
|
38
|
+
# One or more column statistics to allow for columns that contain
|
39
|
+
# detected entities.
|
40
|
+
# @return [Array<String>]
|
41
|
+
#
|
42
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/AllowedStatistics AWS API Documentation
|
43
|
+
#
|
44
|
+
class AllowedStatistics < Struct.new(
|
45
|
+
:statistics)
|
46
|
+
SENSITIVE = []
|
47
|
+
include Aws::Structure
|
48
|
+
end
|
49
|
+
|
26
50
|
# @note When making an API call, you may pass BatchDeleteRecipeVersionRequest
|
27
51
|
# data as a hash:
|
28
52
|
#
|
@@ -228,6 +252,7 @@ module Aws::GlueDataBrew
|
|
228
252
|
# s3_input_definition: {
|
229
253
|
# bucket: "Bucket", # required
|
230
254
|
# key: "Key",
|
255
|
+
# bucket_owner: "BucketOwner",
|
231
256
|
# },
|
232
257
|
# data_catalog_input_definition: {
|
233
258
|
# catalog_id: "CatalogId",
|
@@ -236,15 +261,21 @@ module Aws::GlueDataBrew
|
|
236
261
|
# temp_directory: {
|
237
262
|
# bucket: "Bucket", # required
|
238
263
|
# key: "Key",
|
264
|
+
# bucket_owner: "BucketOwner",
|
239
265
|
# },
|
240
266
|
# },
|
241
267
|
# database_input_definition: {
|
242
268
|
# glue_connection_name: "GlueConnectionName", # required
|
243
|
-
# database_table_name: "DatabaseTableName",
|
269
|
+
# database_table_name: "DatabaseTableName",
|
244
270
|
# temp_directory: {
|
245
271
|
# bucket: "Bucket", # required
|
246
272
|
# key: "Key",
|
273
|
+
# bucket_owner: "BucketOwner",
|
247
274
|
# },
|
275
|
+
# query_string: "QueryString",
|
276
|
+
# },
|
277
|
+
# metadata: {
|
278
|
+
# source_arn: "Arn",
|
248
279
|
# },
|
249
280
|
# },
|
250
281
|
# path_options: {
|
@@ -351,6 +382,7 @@ module Aws::GlueDataBrew
|
|
351
382
|
# output_location: { # required
|
352
383
|
# bucket: "Bucket", # required
|
353
384
|
# key: "Key",
|
385
|
+
# bucket_owner: "BucketOwner",
|
354
386
|
# },
|
355
387
|
# configuration: {
|
356
388
|
# dataset_statistics_configuration: {
|
@@ -391,7 +423,21 @@ module Aws::GlueDataBrew
|
|
391
423
|
# },
|
392
424
|
# },
|
393
425
|
# ],
|
426
|
+
# entity_detector_configuration: {
|
427
|
+
# entity_types: ["EntityType"], # required
|
428
|
+
# allowed_statistics: [
|
429
|
+
# {
|
430
|
+
# statistics: ["Statistic"], # required
|
431
|
+
# },
|
432
|
+
# ],
|
433
|
+
# },
|
394
434
|
# },
|
435
|
+
# validation_configurations: [
|
436
|
+
# {
|
437
|
+
# ruleset_arn: "Arn", # required
|
438
|
+
# validation_mode: "CHECK_ALL", # accepts CHECK_ALL
|
439
|
+
# },
|
440
|
+
# ],
|
395
441
|
# role_arn: "Arn", # required
|
396
442
|
# tags: {
|
397
443
|
# "TagKey" => "TagValue",
|
@@ -442,8 +488,9 @@ module Aws::GlueDataBrew
|
|
442
488
|
# @return [Integer]
|
443
489
|
#
|
444
490
|
# @!attribute [rw] output_location
|
445
|
-
# Represents an Amazon S3 location (bucket name
|
446
|
-
# DataBrew can read input data, or write output from
|
491
|
+
# Represents an Amazon S3 location (bucket name, bucket owner, and
|
492
|
+
# object key) where DataBrew can read input data, or write output from
|
493
|
+
# a job.
|
447
494
|
# @return [Types::S3Location]
|
448
495
|
#
|
449
496
|
# @!attribute [rw] configuration
|
@@ -453,6 +500,11 @@ module Aws::GlueDataBrew
|
|
453
500
|
# settings.
|
454
501
|
# @return [Types::ProfileConfiguration]
|
455
502
|
#
|
503
|
+
# @!attribute [rw] validation_configurations
|
504
|
+
# List of validation configurations that are applied to the profile
|
505
|
+
# job.
|
506
|
+
# @return [Array<Types::ValidationConfiguration>]
|
507
|
+
#
|
456
508
|
# @!attribute [rw] role_arn
|
457
509
|
# The Amazon Resource Name (ARN) of the Identity and Access Management
|
458
510
|
# (IAM) role to be assumed when DataBrew runs the job.
|
@@ -487,6 +539,7 @@ module Aws::GlueDataBrew
|
|
487
539
|
:max_retries,
|
488
540
|
:output_location,
|
489
541
|
:configuration,
|
542
|
+
:validation_configurations,
|
490
543
|
:role_arn,
|
491
544
|
:tags,
|
492
545
|
:timeout,
|
@@ -595,6 +648,7 @@ module Aws::GlueDataBrew
|
|
595
648
|
# location: { # required
|
596
649
|
# bucket: "Bucket", # required
|
597
650
|
# key: "Key",
|
651
|
+
# bucket_owner: "BucketOwner",
|
598
652
|
# },
|
599
653
|
# overwrite: false,
|
600
654
|
# format_options: {
|
@@ -613,12 +667,14 @@ module Aws::GlueDataBrew
|
|
613
667
|
# location: { # required
|
614
668
|
# bucket: "Bucket", # required
|
615
669
|
# key: "Key",
|
670
|
+
# bucket_owner: "BucketOwner",
|
616
671
|
# },
|
617
672
|
# },
|
618
673
|
# database_options: {
|
619
674
|
# temp_directory: {
|
620
675
|
# bucket: "Bucket", # required
|
621
676
|
# key: "Key",
|
677
|
+
# bucket_owner: "BucketOwner",
|
622
678
|
# },
|
623
679
|
# table_name: "DatabaseTableName", # required
|
624
680
|
# },
|
@@ -632,6 +688,7 @@ module Aws::GlueDataBrew
|
|
632
688
|
# temp_directory: {
|
633
689
|
# bucket: "Bucket", # required
|
634
690
|
# key: "Key",
|
691
|
+
# bucket_owner: "BucketOwner",
|
635
692
|
# },
|
636
693
|
# table_name: "DatabaseTableName", # required
|
637
694
|
# },
|
@@ -829,6 +886,86 @@ module Aws::GlueDataBrew
|
|
829
886
|
include Aws::Structure
|
830
887
|
end
|
831
888
|
|
889
|
+
# @note When making an API call, you may pass CreateRulesetRequest
|
890
|
+
# data as a hash:
|
891
|
+
#
|
892
|
+
# {
|
893
|
+
# name: "RulesetName", # required
|
894
|
+
# description: "RulesetDescription",
|
895
|
+
# target_arn: "Arn", # required
|
896
|
+
# rules: [ # required
|
897
|
+
# {
|
898
|
+
# name: "RuleName", # required
|
899
|
+
# disabled: false,
|
900
|
+
# check_expression: "Expression", # required
|
901
|
+
# substitution_map: {
|
902
|
+
# "ValueReference" => "ConditionValue",
|
903
|
+
# },
|
904
|
+
# threshold: {
|
905
|
+
# value: 1.0, # required
|
906
|
+
# type: "GREATER_THAN_OR_EQUAL", # accepts GREATER_THAN_OR_EQUAL, LESS_THAN_OR_EQUAL, GREATER_THAN, LESS_THAN
|
907
|
+
# unit: "COUNT", # accepts COUNT, PERCENTAGE
|
908
|
+
# },
|
909
|
+
# column_selectors: [
|
910
|
+
# {
|
911
|
+
# regex: "ColumnName",
|
912
|
+
# name: "ColumnName",
|
913
|
+
# },
|
914
|
+
# ],
|
915
|
+
# },
|
916
|
+
# ],
|
917
|
+
# tags: {
|
918
|
+
# "TagKey" => "TagValue",
|
919
|
+
# },
|
920
|
+
# }
|
921
|
+
#
|
922
|
+
# @!attribute [rw] name
|
923
|
+
# The name of the ruleset to be created. Valid characters are
|
924
|
+
# alphanumeric (A-Z, a-z, 0-9), hyphen (-), period (.), and space.
|
925
|
+
# @return [String]
|
926
|
+
#
|
927
|
+
# @!attribute [rw] description
|
928
|
+
# The description of the ruleset.
|
929
|
+
# @return [String]
|
930
|
+
#
|
931
|
+
# @!attribute [rw] target_arn
|
932
|
+
# The Amazon Resource Name (ARN) of a resource (dataset) that the
|
933
|
+
# ruleset is associated with.
|
934
|
+
# @return [String]
|
935
|
+
#
|
936
|
+
# @!attribute [rw] rules
|
937
|
+
# A list of rules that are defined with the ruleset. A rule includes
|
938
|
+
# one or more checks to be validated on a DataBrew dataset.
|
939
|
+
# @return [Array<Types::Rule>]
|
940
|
+
#
|
941
|
+
# @!attribute [rw] tags
|
942
|
+
# Metadata tags to apply to the ruleset.
|
943
|
+
# @return [Hash<String,String>]
|
944
|
+
#
|
945
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/CreateRulesetRequest AWS API Documentation
|
946
|
+
#
|
947
|
+
class CreateRulesetRequest < Struct.new(
|
948
|
+
:name,
|
949
|
+
:description,
|
950
|
+
:target_arn,
|
951
|
+
:rules,
|
952
|
+
:tags)
|
953
|
+
SENSITIVE = []
|
954
|
+
include Aws::Structure
|
955
|
+
end
|
956
|
+
|
957
|
+
# @!attribute [rw] name
|
958
|
+
# The unique name of the created ruleset.
|
959
|
+
# @return [String]
|
960
|
+
#
|
961
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/CreateRulesetResponse AWS API Documentation
|
962
|
+
#
|
963
|
+
class CreateRulesetResponse < Struct.new(
|
964
|
+
:name)
|
965
|
+
SENSITIVE = []
|
966
|
+
include Aws::Structure
|
967
|
+
end
|
968
|
+
|
832
969
|
# @note When making an API call, you may pass CreateScheduleRequest
|
833
970
|
# data as a hash:
|
834
971
|
#
|
@@ -955,6 +1092,7 @@ module Aws::GlueDataBrew
|
|
955
1092
|
# temp_directory: {
|
956
1093
|
# bucket: "Bucket", # required
|
957
1094
|
# key: "Key",
|
1095
|
+
# bucket_owner: "BucketOwner",
|
958
1096
|
# },
|
959
1097
|
# }
|
960
1098
|
#
|
@@ -1002,12 +1140,14 @@ module Aws::GlueDataBrew
|
|
1002
1140
|
# location: { # required
|
1003
1141
|
# bucket: "Bucket", # required
|
1004
1142
|
# key: "Key",
|
1143
|
+
# bucket_owner: "BucketOwner",
|
1005
1144
|
# },
|
1006
1145
|
# },
|
1007
1146
|
# database_options: {
|
1008
1147
|
# temp_directory: {
|
1009
1148
|
# bucket: "Bucket", # required
|
1010
1149
|
# key: "Key",
|
1150
|
+
# bucket_owner: "BucketOwner",
|
1011
1151
|
# },
|
1012
1152
|
# table_name: "DatabaseTableName", # required
|
1013
1153
|
# },
|
@@ -1063,11 +1203,13 @@ module Aws::GlueDataBrew
|
|
1063
1203
|
#
|
1064
1204
|
# {
|
1065
1205
|
# glue_connection_name: "GlueConnectionName", # required
|
1066
|
-
# database_table_name: "DatabaseTableName",
|
1206
|
+
# database_table_name: "DatabaseTableName",
|
1067
1207
|
# temp_directory: {
|
1068
1208
|
# bucket: "Bucket", # required
|
1069
1209
|
# key: "Key",
|
1210
|
+
# bucket_owner: "BucketOwner",
|
1070
1211
|
# },
|
1212
|
+
# query_string: "QueryString",
|
1071
1213
|
# }
|
1072
1214
|
#
|
1073
1215
|
# @!attribute [rw] glue_connection_name
|
@@ -1080,16 +1222,23 @@ module Aws::GlueDataBrew
|
|
1080
1222
|
# @return [String]
|
1081
1223
|
#
|
1082
1224
|
# @!attribute [rw] temp_directory
|
1083
|
-
# Represents an Amazon S3 location (bucket name
|
1084
|
-
# DataBrew can read input data, or write output from
|
1225
|
+
# Represents an Amazon S3 location (bucket name, bucket owner, and
|
1226
|
+
# object key) where DataBrew can read input data, or write output from
|
1227
|
+
# a job.
|
1085
1228
|
# @return [Types::S3Location]
|
1086
1229
|
#
|
1230
|
+
# @!attribute [rw] query_string
|
1231
|
+
# Custom SQL to run against the provided Glue connection. This SQL
|
1232
|
+
# will be used as the input for DataBrew projects and jobs.
|
1233
|
+
# @return [String]
|
1234
|
+
#
|
1087
1235
|
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/DatabaseInputDefinition AWS API Documentation
|
1088
1236
|
#
|
1089
1237
|
class DatabaseInputDefinition < Struct.new(
|
1090
1238
|
:glue_connection_name,
|
1091
1239
|
:database_table_name,
|
1092
|
-
:temp_directory
|
1240
|
+
:temp_directory,
|
1241
|
+
:query_string)
|
1093
1242
|
SENSITIVE = []
|
1094
1243
|
include Aws::Structure
|
1095
1244
|
end
|
@@ -1106,6 +1255,7 @@ module Aws::GlueDataBrew
|
|
1106
1255
|
# temp_directory: {
|
1107
1256
|
# bucket: "Bucket", # required
|
1108
1257
|
# key: "Key",
|
1258
|
+
# bucket_owner: "BucketOwner",
|
1109
1259
|
# },
|
1110
1260
|
# table_name: "DatabaseTableName", # required
|
1111
1261
|
# },
|
@@ -1147,6 +1297,7 @@ module Aws::GlueDataBrew
|
|
1147
1297
|
# temp_directory: {
|
1148
1298
|
# bucket: "Bucket", # required
|
1149
1299
|
# key: "Key",
|
1300
|
+
# bucket_owner: "BucketOwner",
|
1150
1301
|
# },
|
1151
1302
|
# table_name: "DatabaseTableName", # required
|
1152
1303
|
# }
|
@@ -1489,6 +1640,37 @@ module Aws::GlueDataBrew
|
|
1489
1640
|
include Aws::Structure
|
1490
1641
|
end
|
1491
1642
|
|
1643
|
+
# @note When making an API call, you may pass DeleteRulesetRequest
|
1644
|
+
# data as a hash:
|
1645
|
+
#
|
1646
|
+
# {
|
1647
|
+
# name: "RulesetName", # required
|
1648
|
+
# }
|
1649
|
+
#
|
1650
|
+
# @!attribute [rw] name
|
1651
|
+
# The name of the ruleset to be deleted.
|
1652
|
+
# @return [String]
|
1653
|
+
#
|
1654
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/DeleteRulesetRequest AWS API Documentation
|
1655
|
+
#
|
1656
|
+
class DeleteRulesetRequest < Struct.new(
|
1657
|
+
:name)
|
1658
|
+
SENSITIVE = []
|
1659
|
+
include Aws::Structure
|
1660
|
+
end
|
1661
|
+
|
1662
|
+
# @!attribute [rw] name
|
1663
|
+
# The name of the deleted ruleset.
|
1664
|
+
# @return [String]
|
1665
|
+
#
|
1666
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/DeleteRulesetResponse AWS API Documentation
|
1667
|
+
#
|
1668
|
+
class DeleteRulesetResponse < Struct.new(
|
1669
|
+
:name)
|
1670
|
+
SENSITIVE = []
|
1671
|
+
include Aws::Structure
|
1672
|
+
end
|
1673
|
+
|
1492
1674
|
# @note When making an API call, you may pass DeleteScheduleRequest
|
1493
1675
|
# data as a hash:
|
1494
1676
|
#
|
@@ -1718,6 +1900,11 @@ module Aws::GlueDataBrew
|
|
1718
1900
|
# settings.
|
1719
1901
|
# @return [Types::ProfileConfiguration]
|
1720
1902
|
#
|
1903
|
+
# @!attribute [rw] validation_configurations
|
1904
|
+
# List of validation configurations that are applied to the profile
|
1905
|
+
# job.
|
1906
|
+
# @return [Array<Types::ValidationConfiguration>]
|
1907
|
+
#
|
1721
1908
|
# @!attribute [rw] recipe_reference
|
1722
1909
|
# Represents the name and version of a DataBrew recipe.
|
1723
1910
|
# @return [Types::RecipeReference]
|
@@ -1765,6 +1952,7 @@ module Aws::GlueDataBrew
|
|
1765
1952
|
:database_outputs,
|
1766
1953
|
:project_name,
|
1767
1954
|
:profile_configuration,
|
1955
|
+
:validation_configurations,
|
1768
1956
|
:recipe_reference,
|
1769
1957
|
:resource_arn,
|
1770
1958
|
:role_arn,
|
@@ -1833,6 +2021,11 @@ module Aws::GlueDataBrew
|
|
1833
2021
|
# settings.
|
1834
2022
|
# @return [Types::ProfileConfiguration]
|
1835
2023
|
#
|
2024
|
+
# @!attribute [rw] validation_configurations
|
2025
|
+
# List of validation configurations that are applied to the profile
|
2026
|
+
# job.
|
2027
|
+
# @return [Array<Types::ValidationConfiguration>]
|
2028
|
+
#
|
1836
2029
|
# @!attribute [rw] run_id
|
1837
2030
|
# The unique identifier of the job run.
|
1838
2031
|
# @return [String]
|
@@ -1894,6 +2087,7 @@ module Aws::GlueDataBrew
|
|
1894
2087
|
:execution_time,
|
1895
2088
|
:job_name,
|
1896
2089
|
:profile_configuration,
|
2090
|
+
:validation_configurations,
|
1897
2091
|
:run_id,
|
1898
2092
|
:state,
|
1899
2093
|
:log_subscription,
|
@@ -2116,6 +2310,85 @@ module Aws::GlueDataBrew
|
|
2116
2310
|
include Aws::Structure
|
2117
2311
|
end
|
2118
2312
|
|
2313
|
+
# @note When making an API call, you may pass DescribeRulesetRequest
|
2314
|
+
# data as a hash:
|
2315
|
+
#
|
2316
|
+
# {
|
2317
|
+
# name: "RulesetName", # required
|
2318
|
+
# }
|
2319
|
+
#
|
2320
|
+
# @!attribute [rw] name
|
2321
|
+
# The name of the ruleset to be described.
|
2322
|
+
# @return [String]
|
2323
|
+
#
|
2324
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/DescribeRulesetRequest AWS API Documentation
|
2325
|
+
#
|
2326
|
+
class DescribeRulesetRequest < Struct.new(
|
2327
|
+
:name)
|
2328
|
+
SENSITIVE = []
|
2329
|
+
include Aws::Structure
|
2330
|
+
end
|
2331
|
+
|
2332
|
+
# @!attribute [rw] name
|
2333
|
+
# The name of the ruleset.
|
2334
|
+
# @return [String]
|
2335
|
+
#
|
2336
|
+
# @!attribute [rw] description
|
2337
|
+
# The description of the ruleset.
|
2338
|
+
# @return [String]
|
2339
|
+
#
|
2340
|
+
# @!attribute [rw] target_arn
|
2341
|
+
# The Amazon Resource Name (ARN) of a resource (dataset) that the
|
2342
|
+
# ruleset is associated with.
|
2343
|
+
# @return [String]
|
2344
|
+
#
|
2345
|
+
# @!attribute [rw] rules
|
2346
|
+
# A list of rules that are defined with the ruleset. A rule includes
|
2347
|
+
# one or more checks to be validated on a DataBrew dataset.
|
2348
|
+
# @return [Array<Types::Rule>]
|
2349
|
+
#
|
2350
|
+
# @!attribute [rw] create_date
|
2351
|
+
# The date and time that the ruleset was created.
|
2352
|
+
# @return [Time]
|
2353
|
+
#
|
2354
|
+
# @!attribute [rw] created_by
|
2355
|
+
# The Amazon Resource Name (ARN) of the user who created the ruleset.
|
2356
|
+
# @return [String]
|
2357
|
+
#
|
2358
|
+
# @!attribute [rw] last_modified_by
|
2359
|
+
# The Amazon Resource Name (ARN) of the user who last modified the
|
2360
|
+
# ruleset.
|
2361
|
+
# @return [String]
|
2362
|
+
#
|
2363
|
+
# @!attribute [rw] last_modified_date
|
2364
|
+
# The modification date and time of the ruleset.
|
2365
|
+
# @return [Time]
|
2366
|
+
#
|
2367
|
+
# @!attribute [rw] resource_arn
|
2368
|
+
# The Amazon Resource Name (ARN) for the ruleset.
|
2369
|
+
# @return [String]
|
2370
|
+
#
|
2371
|
+
# @!attribute [rw] tags
|
2372
|
+
# Metadata tags that have been applied to the ruleset.
|
2373
|
+
# @return [Hash<String,String>]
|
2374
|
+
#
|
2375
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/DescribeRulesetResponse AWS API Documentation
|
2376
|
+
#
|
2377
|
+
class DescribeRulesetResponse < Struct.new(
|
2378
|
+
:name,
|
2379
|
+
:description,
|
2380
|
+
:target_arn,
|
2381
|
+
:rules,
|
2382
|
+
:create_date,
|
2383
|
+
:created_by,
|
2384
|
+
:last_modified_by,
|
2385
|
+
:last_modified_date,
|
2386
|
+
:resource_arn,
|
2387
|
+
:tags)
|
2388
|
+
SENSITIVE = []
|
2389
|
+
include Aws::Structure
|
2390
|
+
end
|
2391
|
+
|
2119
2392
|
# @note When making an API call, you may pass DescribeScheduleRequest
|
2120
2393
|
# data as a hash:
|
2121
2394
|
#
|
@@ -2195,6 +2468,81 @@ module Aws::GlueDataBrew
|
|
2195
2468
|
include Aws::Structure
|
2196
2469
|
end
|
2197
2470
|
|
2471
|
+
# Configuration of entity detection for a profile job. When undefined,
|
2472
|
+
# entity detection is disabled.
|
2473
|
+
#
|
2474
|
+
# @note When making an API call, you may pass EntityDetectorConfiguration
|
2475
|
+
# data as a hash:
|
2476
|
+
#
|
2477
|
+
# {
|
2478
|
+
# entity_types: ["EntityType"], # required
|
2479
|
+
# allowed_statistics: [
|
2480
|
+
# {
|
2481
|
+
# statistics: ["Statistic"], # required
|
2482
|
+
# },
|
2483
|
+
# ],
|
2484
|
+
# }
|
2485
|
+
#
|
2486
|
+
# @!attribute [rw] entity_types
|
2487
|
+
# Entity types to detect. Can be any of the following:
|
2488
|
+
#
|
2489
|
+
# * USA\_SSN
|
2490
|
+
#
|
2491
|
+
# * EMAIL
|
2492
|
+
#
|
2493
|
+
# * USA\_ITIN
|
2494
|
+
#
|
2495
|
+
# * USA\_PASSPORT\_NUMBER
|
2496
|
+
#
|
2497
|
+
# * PHONE\_NUMBER
|
2498
|
+
#
|
2499
|
+
# * USA\_DRIVING\_LICENSE
|
2500
|
+
#
|
2501
|
+
# * BANK\_ACCOUNT
|
2502
|
+
#
|
2503
|
+
# * CREDIT\_CARD
|
2504
|
+
#
|
2505
|
+
# * IP\_ADDRESS
|
2506
|
+
#
|
2507
|
+
# * MAC\_ADDRESS
|
2508
|
+
#
|
2509
|
+
# * USA\_DEA\_NUMBER
|
2510
|
+
#
|
2511
|
+
# * USA\_HCPCS\_CODE
|
2512
|
+
#
|
2513
|
+
# * USA\_NATIONAL\_PROVIDER\_IDENTIFIER
|
2514
|
+
#
|
2515
|
+
# * USA\_NATIONAL\_DRUG\_CODE
|
2516
|
+
#
|
2517
|
+
# * USA\_HEALTH\_INSURANCE\_CLAIM\_NUMBER
|
2518
|
+
#
|
2519
|
+
# * USA\_MEDICARE\_BENEFICIARY\_IDENTIFIER
|
2520
|
+
#
|
2521
|
+
# * USA\_CPT\_CODE
|
2522
|
+
#
|
2523
|
+
# * PERSON\_NAME
|
2524
|
+
#
|
2525
|
+
# * DATE
|
2526
|
+
#
|
2527
|
+
# The Entity type group USA\_ALL is also supported, and includes all
|
2528
|
+
# of the above entity types except PERSON\_NAME and DATE.
|
2529
|
+
# @return [Array<String>]
|
2530
|
+
#
|
2531
|
+
# @!attribute [rw] allowed_statistics
|
2532
|
+
# Configuration of statistics that are allowed to be run on columns
|
2533
|
+
# that contain detected entities. When undefined, no statistics will
|
2534
|
+
# be computed on columns that contain detected entities.
|
2535
|
+
# @return [Array<Types::AllowedStatistics>]
|
2536
|
+
#
|
2537
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/EntityDetectorConfiguration AWS API Documentation
|
2538
|
+
#
|
2539
|
+
class EntityDetectorConfiguration < Struct.new(
|
2540
|
+
:entity_types,
|
2541
|
+
:allowed_statistics)
|
2542
|
+
SENSITIVE = []
|
2543
|
+
include Aws::Structure
|
2544
|
+
end
|
2545
|
+
|
2198
2546
|
# Represents a set of options that define how DataBrew will interpret a
|
2199
2547
|
# Microsoft Excel file when creating a dataset from that file.
|
2200
2548
|
#
|
@@ -2277,7 +2625,7 @@ module Aws::GlueDataBrew
|
|
2277
2625
|
#
|
2278
2626
|
#
|
2279
2627
|
#
|
2280
|
-
# [1]: https://docs
|
2628
|
+
# [1]: https://docs.aws.amazon.com/databrew/latest/dg/datasets.multiple-files.html#conditions.for.dynamic.datasets
|
2281
2629
|
#
|
2282
2630
|
# @note When making an API call, you may pass FilterExpression
|
2283
2631
|
# data as a hash:
|
@@ -2365,6 +2713,7 @@ module Aws::GlueDataBrew
|
|
2365
2713
|
# s3_input_definition: {
|
2366
2714
|
# bucket: "Bucket", # required
|
2367
2715
|
# key: "Key",
|
2716
|
+
# bucket_owner: "BucketOwner",
|
2368
2717
|
# },
|
2369
2718
|
# data_catalog_input_definition: {
|
2370
2719
|
# catalog_id: "CatalogId",
|
@@ -2373,15 +2722,21 @@ module Aws::GlueDataBrew
|
|
2373
2722
|
# temp_directory: {
|
2374
2723
|
# bucket: "Bucket", # required
|
2375
2724
|
# key: "Key",
|
2725
|
+
# bucket_owner: "BucketOwner",
|
2376
2726
|
# },
|
2377
2727
|
# },
|
2378
2728
|
# database_input_definition: {
|
2379
2729
|
# glue_connection_name: "GlueConnectionName", # required
|
2380
|
-
# database_table_name: "DatabaseTableName",
|
2730
|
+
# database_table_name: "DatabaseTableName",
|
2381
2731
|
# temp_directory: {
|
2382
2732
|
# bucket: "Bucket", # required
|
2383
2733
|
# key: "Key",
|
2734
|
+
# bucket_owner: "BucketOwner",
|
2384
2735
|
# },
|
2736
|
+
# query_string: "QueryString",
|
2737
|
+
# },
|
2738
|
+
# metadata: {
|
2739
|
+
# source_arn: "Arn",
|
2385
2740
|
# },
|
2386
2741
|
# }
|
2387
2742
|
#
|
@@ -2397,12 +2752,18 @@ module Aws::GlueDataBrew
|
|
2397
2752
|
# Connection information for dataset input files stored in a database.
|
2398
2753
|
# @return [Types::DatabaseInputDefinition]
|
2399
2754
|
#
|
2755
|
+
# @!attribute [rw] metadata
|
2756
|
+
# Contains additional resource information needed for specific
|
2757
|
+
# datasets.
|
2758
|
+
# @return [Types::Metadata]
|
2759
|
+
#
|
2400
2760
|
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/Input AWS API Documentation
|
2401
2761
|
#
|
2402
2762
|
class Input < Struct.new(
|
2403
2763
|
:s3_input_definition,
|
2404
2764
|
:data_catalog_input_definition,
|
2405
|
-
:database_input_definition
|
2765
|
+
:database_input_definition,
|
2766
|
+
:metadata)
|
2406
2767
|
SENSITIVE = []
|
2407
2768
|
include Aws::Structure
|
2408
2769
|
end
|
@@ -2540,6 +2901,11 @@ module Aws::GlueDataBrew
|
|
2540
2901
|
# parameter.
|
2541
2902
|
# @return [Types::JobSample]
|
2542
2903
|
#
|
2904
|
+
# @!attribute [rw] validation_configurations
|
2905
|
+
# List of validation configurations that are applied to the profile
|
2906
|
+
# job.
|
2907
|
+
# @return [Array<Types::ValidationConfiguration>]
|
2908
|
+
#
|
2543
2909
|
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/Job AWS API Documentation
|
2544
2910
|
#
|
2545
2911
|
class Job < Struct.new(
|
@@ -2565,7 +2931,8 @@ module Aws::GlueDataBrew
|
|
2565
2931
|
:role_arn,
|
2566
2932
|
:timeout,
|
2567
2933
|
:tags,
|
2568
|
-
:job_sample
|
2934
|
+
:job_sample,
|
2935
|
+
:validation_configurations)
|
2569
2936
|
SENSITIVE = []
|
2570
2937
|
include Aws::Structure
|
2571
2938
|
end
|
@@ -2650,6 +3017,11 @@ module Aws::GlueDataBrew
|
|
2650
3017
|
# parameter.
|
2651
3018
|
# @return [Types::JobSample]
|
2652
3019
|
#
|
3020
|
+
# @!attribute [rw] validation_configurations
|
3021
|
+
# List of validation configurations that are applied to the profile
|
3022
|
+
# job run.
|
3023
|
+
# @return [Array<Types::ValidationConfiguration>]
|
3024
|
+
#
|
2653
3025
|
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/JobRun AWS API Documentation
|
2654
3026
|
#
|
2655
3027
|
class JobRun < Struct.new(
|
@@ -2669,7 +3041,8 @@ module Aws::GlueDataBrew
|
|
2669
3041
|
:recipe_reference,
|
2670
3042
|
:started_by,
|
2671
3043
|
:started_on,
|
2672
|
-
:job_sample
|
3044
|
+
:job_sample,
|
3045
|
+
:validation_configurations)
|
2673
3046
|
SENSITIVE = []
|
2674
3047
|
include Aws::Structure
|
2675
3048
|
end
|
@@ -3041,6 +3414,60 @@ module Aws::GlueDataBrew
|
|
3041
3414
|
include Aws::Structure
|
3042
3415
|
end
|
3043
3416
|
|
3417
|
+
# @note When making an API call, you may pass ListRulesetsRequest
|
3418
|
+
# data as a hash:
|
3419
|
+
#
|
3420
|
+
# {
|
3421
|
+
# target_arn: "Arn",
|
3422
|
+
# max_results: 1,
|
3423
|
+
# next_token: "NextToken",
|
3424
|
+
# }
|
3425
|
+
#
|
3426
|
+
# @!attribute [rw] target_arn
|
3427
|
+
# The Amazon Resource Name (ARN) of a resource (dataset). Using this
|
3428
|
+
# parameter indicates to return only those rulesets that are
|
3429
|
+
# associated with the specified resource.
|
3430
|
+
# @return [String]
|
3431
|
+
#
|
3432
|
+
# @!attribute [rw] max_results
|
3433
|
+
# The maximum number of results to return in this request.
|
3434
|
+
# @return [Integer]
|
3435
|
+
#
|
3436
|
+
# @!attribute [rw] next_token
|
3437
|
+
# A token generated by DataBrew that specifies where to continue
|
3438
|
+
# pagination if a previous request was truncated. To get the next set
|
3439
|
+
# of pages, pass in the NextToken value from the response object of
|
3440
|
+
# the previous page call.
|
3441
|
+
# @return [String]
|
3442
|
+
#
|
3443
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/ListRulesetsRequest AWS API Documentation
|
3444
|
+
#
|
3445
|
+
class ListRulesetsRequest < Struct.new(
|
3446
|
+
:target_arn,
|
3447
|
+
:max_results,
|
3448
|
+
:next_token)
|
3449
|
+
SENSITIVE = []
|
3450
|
+
include Aws::Structure
|
3451
|
+
end
|
3452
|
+
|
3453
|
+
# @!attribute [rw] rulesets
|
3454
|
+
# A list of RulesetItem. RulesetItem contains metadata of a ruleset.
|
3455
|
+
# @return [Array<Types::RulesetItem>]
|
3456
|
+
#
|
3457
|
+
# @!attribute [rw] next_token
|
3458
|
+
# A token that you can use in a subsequent call to retrieve the next
|
3459
|
+
# set of results.
|
3460
|
+
# @return [String]
|
3461
|
+
#
|
3462
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/ListRulesetsResponse AWS API Documentation
|
3463
|
+
#
|
3464
|
+
class ListRulesetsResponse < Struct.new(
|
3465
|
+
:rulesets,
|
3466
|
+
:next_token)
|
3467
|
+
SENSITIVE = []
|
3468
|
+
include Aws::Structure
|
3469
|
+
end
|
3470
|
+
|
3044
3471
|
# @note When making an API call, you may pass ListSchedulesRequest
|
3045
3472
|
# data as a hash:
|
3046
3473
|
#
|
@@ -3123,6 +3550,28 @@ module Aws::GlueDataBrew
|
|
3123
3550
|
include Aws::Structure
|
3124
3551
|
end
|
3125
3552
|
|
3553
|
+
# Contains additional resource information needed for specific datasets.
|
3554
|
+
#
|
3555
|
+
# @note When making an API call, you may pass Metadata
|
3556
|
+
# data as a hash:
|
3557
|
+
#
|
3558
|
+
# {
|
3559
|
+
# source_arn: "Arn",
|
3560
|
+
# }
|
3561
|
+
#
|
3562
|
+
# @!attribute [rw] source_arn
|
3563
|
+
# The Amazon Resource Name (ARN) associated with the dataset.
|
3564
|
+
# Currently, DataBrew only supports ARNs from Amazon AppFlow.
|
3565
|
+
# @return [String]
|
3566
|
+
#
|
3567
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/Metadata AWS API Documentation
|
3568
|
+
#
|
3569
|
+
class Metadata < Struct.new(
|
3570
|
+
:source_arn)
|
3571
|
+
SENSITIVE = []
|
3572
|
+
include Aws::Structure
|
3573
|
+
end
|
3574
|
+
|
3126
3575
|
# Represents options that specify how and where in Amazon S3 DataBrew
|
3127
3576
|
# writes the output generated by recipe jobs or profile jobs.
|
3128
3577
|
#
|
@@ -3136,6 +3585,7 @@ module Aws::GlueDataBrew
|
|
3136
3585
|
# location: { # required
|
3137
3586
|
# bucket: "Bucket", # required
|
3138
3587
|
# key: "Key",
|
3588
|
+
# bucket_owner: "BucketOwner",
|
3139
3589
|
# },
|
3140
3590
|
# overwrite: false,
|
3141
3591
|
# format_options: {
|
@@ -3321,6 +3771,14 @@ module Aws::GlueDataBrew
|
|
3321
3771
|
# },
|
3322
3772
|
# },
|
3323
3773
|
# ],
|
3774
|
+
# entity_detector_configuration: {
|
3775
|
+
# entity_types: ["EntityType"], # required
|
3776
|
+
# allowed_statistics: [
|
3777
|
+
# {
|
3778
|
+
# statistics: ["Statistic"], # required
|
3779
|
+
# },
|
3780
|
+
# ],
|
3781
|
+
# },
|
3324
3782
|
# }
|
3325
3783
|
#
|
3326
3784
|
# @!attribute [rw] dataset_statistics_configuration
|
@@ -3344,12 +3802,18 @@ module Aws::GlueDataBrew
|
|
3344
3802
|
# profile all supported columns and run all supported evaluations.
|
3345
3803
|
# @return [Array<Types::ColumnStatisticsConfiguration>]
|
3346
3804
|
#
|
3805
|
+
# @!attribute [rw] entity_detector_configuration
|
3806
|
+
# Configuration of entity detection for a profile job. When undefined,
|
3807
|
+
# entity detection is disabled.
|
3808
|
+
# @return [Types::EntityDetectorConfiguration]
|
3809
|
+
#
|
3347
3810
|
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/ProfileConfiguration AWS API Documentation
|
3348
3811
|
#
|
3349
3812
|
class ProfileConfiguration < Struct.new(
|
3350
3813
|
:dataset_statistics_configuration,
|
3351
3814
|
:profile_columns,
|
3352
|
-
:column_statistics_configurations
|
3815
|
+
:column_statistics_configurations,
|
3816
|
+
:entity_detector_configuration)
|
3353
3817
|
SENSITIVE = []
|
3354
3818
|
include Aws::Structure
|
3355
3819
|
end
|
@@ -3708,8 +4172,167 @@ module Aws::GlueDataBrew
|
|
3708
4172
|
include Aws::Structure
|
3709
4173
|
end
|
3710
4174
|
|
3711
|
-
# Represents
|
3712
|
-
#
|
4175
|
+
# Represents a single data quality requirement that should be validated
|
4176
|
+
# in the scope of this dataset.
|
4177
|
+
#
|
4178
|
+
# @note When making an API call, you may pass Rule
|
4179
|
+
# data as a hash:
|
4180
|
+
#
|
4181
|
+
# {
|
4182
|
+
# name: "RuleName", # required
|
4183
|
+
# disabled: false,
|
4184
|
+
# check_expression: "Expression", # required
|
4185
|
+
# substitution_map: {
|
4186
|
+
# "ValueReference" => "ConditionValue",
|
4187
|
+
# },
|
4188
|
+
# threshold: {
|
4189
|
+
# value: 1.0, # required
|
4190
|
+
# type: "GREATER_THAN_OR_EQUAL", # accepts GREATER_THAN_OR_EQUAL, LESS_THAN_OR_EQUAL, GREATER_THAN, LESS_THAN
|
4191
|
+
# unit: "COUNT", # accepts COUNT, PERCENTAGE
|
4192
|
+
# },
|
4193
|
+
# column_selectors: [
|
4194
|
+
# {
|
4195
|
+
# regex: "ColumnName",
|
4196
|
+
# name: "ColumnName",
|
4197
|
+
# },
|
4198
|
+
# ],
|
4199
|
+
# }
|
4200
|
+
#
|
4201
|
+
# @!attribute [rw] name
|
4202
|
+
# The name of the rule.
|
4203
|
+
# @return [String]
|
4204
|
+
#
|
4205
|
+
# @!attribute [rw] disabled
|
4206
|
+
# A value that specifies whether the rule is disabled. Once a rule is
|
4207
|
+
# disabled, a profile job will not validate it during a job run.
|
4208
|
+
# Default value is false.
|
4209
|
+
# @return [Boolean]
|
4210
|
+
#
|
4211
|
+
# @!attribute [rw] check_expression
|
4212
|
+
# The expression which includes column references, condition names
|
4213
|
+
# followed by variable references, possibly grouped and combined with
|
4214
|
+
# other conditions. For example, `(:col1 starts_with :prefix1 or :col1
|
4215
|
+
# starts_with :prefix2) and (:col1 ends_with :suffix1 or :col1
|
4216
|
+
# ends_with :suffix2)`. Column and value references are substitution
|
4217
|
+
# variables that should start with the ':' symbol. Depending on the
|
4218
|
+
# context, substitution variables' values can be either an actual
|
4219
|
+
# value or a column name. These values are defined in the
|
4220
|
+
# SubstitutionMap. If a CheckExpression starts with a column
|
4221
|
+
# reference, then ColumnSelectors in the rule should be null. If
|
4222
|
+
# ColumnSelectors has been defined, then there should be no column
|
4223
|
+
# reference in the left side of a condition, for example, `is_between
|
4224
|
+
# :val1 and :val2`.
|
4225
|
+
#
|
4226
|
+
# For more information, see [Available checks][1].
|
4227
|
+
#
|
4228
|
+
#
|
4229
|
+
#
|
4230
|
+
# [1]: https://docs.aws.amazon.com/databrew/latest/dg/profile.data-quality-available-checks.html
|
4231
|
+
# @return [String]
|
4232
|
+
#
|
4233
|
+
# @!attribute [rw] substitution_map
|
4234
|
+
# The map of substitution variable names to their values used in a
|
4235
|
+
# check expression. Variable names should start with a ':' (colon).
|
4236
|
+
# Variable values can either be actual values or column names. To
|
4237
|
+
# differentiate between the two, column names should be enclosed in
|
4238
|
+
# backticks, for example, `` ":col1": "`Column A`". ``
|
4239
|
+
# @return [Hash<String,String>]
|
4240
|
+
#
|
4241
|
+
# @!attribute [rw] threshold
|
4242
|
+
# The threshold used with a non-aggregate check expression.
|
4243
|
+
# Non-aggregate check expressions will be applied to each row in a
|
4244
|
+
# specific column, and the threshold will be used to determine whether
|
4245
|
+
# the validation succeeds.
|
4246
|
+
# @return [Types::Threshold]
|
4247
|
+
#
|
4248
|
+
# @!attribute [rw] column_selectors
|
4249
|
+
# List of column selectors. Selectors can be used to select columns
|
4250
|
+
# using a name or regular expression from the dataset. Rule will be
|
4251
|
+
# applied to selected columns.
|
4252
|
+
# @return [Array<Types::ColumnSelector>]
|
4253
|
+
#
|
4254
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/Rule AWS API Documentation
|
4255
|
+
#
|
4256
|
+
class Rule < Struct.new(
|
4257
|
+
:name,
|
4258
|
+
:disabled,
|
4259
|
+
:check_expression,
|
4260
|
+
:substitution_map,
|
4261
|
+
:threshold,
|
4262
|
+
:column_selectors)
|
4263
|
+
SENSITIVE = []
|
4264
|
+
include Aws::Structure
|
4265
|
+
end
|
4266
|
+
|
4267
|
+
# Contains metadata about the ruleset.
|
4268
|
+
#
|
4269
|
+
# @!attribute [rw] account_id
|
4270
|
+
# The ID of the Amazon Web Services account that owns the ruleset.
|
4271
|
+
# @return [String]
|
4272
|
+
#
|
4273
|
+
# @!attribute [rw] created_by
|
4274
|
+
# The Amazon Resource Name (ARN) of the user who created the ruleset.
|
4275
|
+
# @return [String]
|
4276
|
+
#
|
4277
|
+
# @!attribute [rw] create_date
|
4278
|
+
# The date and time that the ruleset was created.
|
4279
|
+
# @return [Time]
|
4280
|
+
#
|
4281
|
+
# @!attribute [rw] description
|
4282
|
+
# The description of the ruleset.
|
4283
|
+
# @return [String]
|
4284
|
+
#
|
4285
|
+
# @!attribute [rw] last_modified_by
|
4286
|
+
# The Amazon Resource Name (ARN) of the user who last modified the
|
4287
|
+
# ruleset.
|
4288
|
+
# @return [String]
|
4289
|
+
#
|
4290
|
+
# @!attribute [rw] last_modified_date
|
4291
|
+
# The modification date and time of the ruleset.
|
4292
|
+
# @return [Time]
|
4293
|
+
#
|
4294
|
+
# @!attribute [rw] name
|
4295
|
+
# The name of the ruleset.
|
4296
|
+
# @return [String]
|
4297
|
+
#
|
4298
|
+
# @!attribute [rw] resource_arn
|
4299
|
+
# The Amazon Resource Name (ARN) for the ruleset.
|
4300
|
+
# @return [String]
|
4301
|
+
#
|
4302
|
+
# @!attribute [rw] rule_count
|
4303
|
+
# The number of rules that are defined in the ruleset.
|
4304
|
+
# @return [Integer]
|
4305
|
+
#
|
4306
|
+
# @!attribute [rw] tags
|
4307
|
+
# Metadata tags that have been applied to the ruleset.
|
4308
|
+
# @return [Hash<String,String>]
|
4309
|
+
#
|
4310
|
+
# @!attribute [rw] target_arn
|
4311
|
+
# The Amazon Resource Name (ARN) of a resource (dataset) that the
|
4312
|
+
# ruleset is associated with.
|
4313
|
+
# @return [String]
|
4314
|
+
#
|
4315
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/RulesetItem AWS API Documentation
|
4316
|
+
#
|
4317
|
+
class RulesetItem < Struct.new(
|
4318
|
+
:account_id,
|
4319
|
+
:created_by,
|
4320
|
+
:create_date,
|
4321
|
+
:description,
|
4322
|
+
:last_modified_by,
|
4323
|
+
:last_modified_date,
|
4324
|
+
:name,
|
4325
|
+
:resource_arn,
|
4326
|
+
:rule_count,
|
4327
|
+
:tags,
|
4328
|
+
:target_arn)
|
4329
|
+
SENSITIVE = []
|
4330
|
+
include Aws::Structure
|
4331
|
+
end
|
4332
|
+
|
4333
|
+
# Represents an Amazon S3 location (bucket name, bucket owner, and
|
4334
|
+
# object key) where DataBrew can read input data, or write output from a
|
4335
|
+
# job.
|
3713
4336
|
#
|
3714
4337
|
# @note When making an API call, you may pass S3Location
|
3715
4338
|
# data as a hash:
|
@@ -3717,6 +4340,7 @@ module Aws::GlueDataBrew
|
|
3717
4340
|
# {
|
3718
4341
|
# bucket: "Bucket", # required
|
3719
4342
|
# key: "Key",
|
4343
|
+
# bucket_owner: "BucketOwner",
|
3720
4344
|
# }
|
3721
4345
|
#
|
3722
4346
|
# @!attribute [rw] bucket
|
@@ -3727,11 +4351,16 @@ module Aws::GlueDataBrew
|
|
3727
4351
|
# The unique name of the object in the bucket.
|
3728
4352
|
# @return [String]
|
3729
4353
|
#
|
4354
|
+
# @!attribute [rw] bucket_owner
|
4355
|
+
# The Amazon Web Services account ID of the bucket owner.
|
4356
|
+
# @return [String]
|
4357
|
+
#
|
3730
4358
|
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/S3Location AWS API Documentation
|
3731
4359
|
#
|
3732
4360
|
class S3Location < Struct.new(
|
3733
4361
|
:bucket,
|
3734
|
-
:key
|
4362
|
+
:key,
|
4363
|
+
:bucket_owner)
|
3735
4364
|
SENSITIVE = []
|
3736
4365
|
include Aws::Structure
|
3737
4366
|
end
|
@@ -3746,6 +4375,7 @@ module Aws::GlueDataBrew
|
|
3746
4375
|
# location: { # required
|
3747
4376
|
# bucket: "Bucket", # required
|
3748
4377
|
# key: "Key",
|
4378
|
+
# bucket_owner: "BucketOwner",
|
3749
4379
|
# },
|
3750
4380
|
# }
|
3751
4381
|
#
|
@@ -3882,6 +4512,9 @@ module Aws::GlueDataBrew
|
|
3882
4512
|
# start_column_index: 1, # required
|
3883
4513
|
# column_range: 1,
|
3884
4514
|
# hidden_columns: ["ColumnName"],
|
4515
|
+
# start_row_index: 1,
|
4516
|
+
# row_range: 1,
|
4517
|
+
# analytics: "ENABLE", # accepts ENABLE, DISABLE
|
3885
4518
|
# },
|
3886
4519
|
# }
|
3887
4520
|
#
|
@@ -3923,7 +4556,7 @@ module Aws::GlueDataBrew
|
|
3923
4556
|
:step_index,
|
3924
4557
|
:client_session_id,
|
3925
4558
|
:view_frame)
|
3926
|
-
SENSITIVE = []
|
4559
|
+
SENSITIVE = [:client_session_id]
|
3927
4560
|
include Aws::Structure
|
3928
4561
|
end
|
3929
4562
|
|
@@ -4032,7 +4665,7 @@ module Aws::GlueDataBrew
|
|
4032
4665
|
class StartProjectSessionResponse < Struct.new(
|
4033
4666
|
:name,
|
4034
4667
|
:client_session_id)
|
4035
|
-
SENSITIVE = []
|
4668
|
+
SENSITIVE = [:client_session_id]
|
4036
4669
|
include Aws::Structure
|
4037
4670
|
end
|
4038
4671
|
|
@@ -4172,6 +4805,44 @@ module Aws::GlueDataBrew
|
|
4172
4805
|
#
|
4173
4806
|
class TagResourceResponse < Aws::EmptyStructure; end
|
4174
4807
|
|
4808
|
+
# The threshold used with a non-aggregate check expression. The
|
4809
|
+
# non-aggregate check expression will be applied to each row in a
|
4810
|
+
# specific column. Then the threshold will be used to determine whether
|
4811
|
+
# the validation succeeds.
|
4812
|
+
#
|
4813
|
+
# @note When making an API call, you may pass Threshold
|
4814
|
+
# data as a hash:
|
4815
|
+
#
|
4816
|
+
# {
|
4817
|
+
# value: 1.0, # required
|
4818
|
+
# type: "GREATER_THAN_OR_EQUAL", # accepts GREATER_THAN_OR_EQUAL, LESS_THAN_OR_EQUAL, GREATER_THAN, LESS_THAN
|
4819
|
+
# unit: "COUNT", # accepts COUNT, PERCENTAGE
|
4820
|
+
# }
|
4821
|
+
#
|
4822
|
+
# @!attribute [rw] value
|
4823
|
+
# The value of a threshold.
|
4824
|
+
# @return [Float]
|
4825
|
+
#
|
4826
|
+
# @!attribute [rw] type
|
4827
|
+
# The type of a threshold. Used for comparison of an actual count of
|
4828
|
+
# rows that satisfy the rule to the threshold value.
|
4829
|
+
# @return [String]
|
4830
|
+
#
|
4831
|
+
# @!attribute [rw] unit
|
4832
|
+
# Unit of threshold value. Can be either a COUNT or PERCENTAGE of the
|
4833
|
+
# full sample size used for validation.
|
4834
|
+
# @return [String]
|
4835
|
+
#
|
4836
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/Threshold AWS API Documentation
|
4837
|
+
#
|
4838
|
+
class Threshold < Struct.new(
|
4839
|
+
:value,
|
4840
|
+
:type,
|
4841
|
+
:unit)
|
4842
|
+
SENSITIVE = []
|
4843
|
+
include Aws::Structure
|
4844
|
+
end
|
4845
|
+
|
4175
4846
|
# @note When making an API call, you may pass UntagResourceRequest
|
4176
4847
|
# data as a hash:
|
4177
4848
|
#
|
@@ -4226,6 +4897,7 @@ module Aws::GlueDataBrew
|
|
4226
4897
|
# s3_input_definition: {
|
4227
4898
|
# bucket: "Bucket", # required
|
4228
4899
|
# key: "Key",
|
4900
|
+
# bucket_owner: "BucketOwner",
|
4229
4901
|
# },
|
4230
4902
|
# data_catalog_input_definition: {
|
4231
4903
|
# catalog_id: "CatalogId",
|
@@ -4234,15 +4906,21 @@ module Aws::GlueDataBrew
|
|
4234
4906
|
# temp_directory: {
|
4235
4907
|
# bucket: "Bucket", # required
|
4236
4908
|
# key: "Key",
|
4909
|
+
# bucket_owner: "BucketOwner",
|
4237
4910
|
# },
|
4238
4911
|
# },
|
4239
4912
|
# database_input_definition: {
|
4240
4913
|
# glue_connection_name: "GlueConnectionName", # required
|
4241
|
-
# database_table_name: "DatabaseTableName",
|
4914
|
+
# database_table_name: "DatabaseTableName",
|
4242
4915
|
# temp_directory: {
|
4243
4916
|
# bucket: "Bucket", # required
|
4244
4917
|
# key: "Key",
|
4918
|
+
# bucket_owner: "BucketOwner",
|
4245
4919
|
# },
|
4920
|
+
# query_string: "QueryString",
|
4921
|
+
# },
|
4922
|
+
# metadata: {
|
4923
|
+
# source_arn: "Arn",
|
4246
4924
|
# },
|
4247
4925
|
# },
|
4248
4926
|
# path_options: {
|
@@ -4369,6 +5047,14 @@ module Aws::GlueDataBrew
|
|
4369
5047
|
# },
|
4370
5048
|
# },
|
4371
5049
|
# ],
|
5050
|
+
# entity_detector_configuration: {
|
5051
|
+
# entity_types: ["EntityType"], # required
|
5052
|
+
# allowed_statistics: [
|
5053
|
+
# {
|
5054
|
+
# statistics: ["Statistic"], # required
|
5055
|
+
# },
|
5056
|
+
# ],
|
5057
|
+
# },
|
4372
5058
|
# },
|
4373
5059
|
# encryption_key_arn: "EncryptionKeyArn",
|
4374
5060
|
# encryption_mode: "SSE-KMS", # accepts SSE-KMS, SSE-S3
|
@@ -4379,7 +5065,14 @@ module Aws::GlueDataBrew
|
|
4379
5065
|
# output_location: { # required
|
4380
5066
|
# bucket: "Bucket", # required
|
4381
5067
|
# key: "Key",
|
5068
|
+
# bucket_owner: "BucketOwner",
|
4382
5069
|
# },
|
5070
|
+
# validation_configurations: [
|
5071
|
+
# {
|
5072
|
+
# ruleset_arn: "Arn", # required
|
5073
|
+
# validation_mode: "CHECK_ALL", # accepts CHECK_ALL
|
5074
|
+
# },
|
5075
|
+
# ],
|
4383
5076
|
# role_arn: "Arn", # required
|
4384
5077
|
# timeout: 1,
|
4385
5078
|
# job_sample: {
|
@@ -4428,10 +5121,16 @@ module Aws::GlueDataBrew
|
|
4428
5121
|
# @return [Integer]
|
4429
5122
|
#
|
4430
5123
|
# @!attribute [rw] output_location
|
4431
|
-
# Represents an Amazon S3 location (bucket name
|
4432
|
-
# DataBrew can read input data, or write output from
|
5124
|
+
# Represents an Amazon S3 location (bucket name, bucket owner, and
|
5125
|
+
# object key) where DataBrew can read input data, or write output from
|
5126
|
+
# a job.
|
4433
5127
|
# @return [Types::S3Location]
|
4434
5128
|
#
|
5129
|
+
# @!attribute [rw] validation_configurations
|
5130
|
+
# List of validation configurations that are applied to the profile
|
5131
|
+
# job.
|
5132
|
+
# @return [Array<Types::ValidationConfiguration>]
|
5133
|
+
#
|
4435
5134
|
# @!attribute [rw] role_arn
|
4436
5135
|
# The Amazon Resource Name (ARN) of the Identity and Access Management
|
4437
5136
|
# (IAM) role to be assumed when DataBrew runs the job.
|
@@ -4461,6 +5160,7 @@ module Aws::GlueDataBrew
|
|
4461
5160
|
:max_capacity,
|
4462
5161
|
:max_retries,
|
4463
5162
|
:output_location,
|
5163
|
+
:validation_configurations,
|
4464
5164
|
:role_arn,
|
4465
5165
|
:timeout,
|
4466
5166
|
:job_sample)
|
@@ -4551,6 +5251,7 @@ module Aws::GlueDataBrew
|
|
4551
5251
|
# location: { # required
|
4552
5252
|
# bucket: "Bucket", # required
|
4553
5253
|
# key: "Key",
|
5254
|
+
# bucket_owner: "BucketOwner",
|
4554
5255
|
# },
|
4555
5256
|
# overwrite: false,
|
4556
5257
|
# format_options: {
|
@@ -4569,12 +5270,14 @@ module Aws::GlueDataBrew
|
|
4569
5270
|
# location: { # required
|
4570
5271
|
# bucket: "Bucket", # required
|
4571
5272
|
# key: "Key",
|
5273
|
+
# bucket_owner: "BucketOwner",
|
4572
5274
|
# },
|
4573
5275
|
# },
|
4574
5276
|
# database_options: {
|
4575
5277
|
# temp_directory: {
|
4576
5278
|
# bucket: "Bucket", # required
|
4577
5279
|
# key: "Key",
|
5280
|
+
# bucket_owner: "BucketOwner",
|
4578
5281
|
# },
|
4579
5282
|
# table_name: "DatabaseTableName", # required
|
4580
5283
|
# },
|
@@ -4588,6 +5291,7 @@ module Aws::GlueDataBrew
|
|
4588
5291
|
# temp_directory: {
|
4589
5292
|
# bucket: "Bucket", # required
|
4590
5293
|
# key: "Key",
|
5294
|
+
# bucket_owner: "BucketOwner",
|
4591
5295
|
# },
|
4592
5296
|
# table_name: "DatabaseTableName", # required
|
4593
5297
|
# },
|
@@ -4746,6 +5450,70 @@ module Aws::GlueDataBrew
|
|
4746
5450
|
include Aws::Structure
|
4747
5451
|
end
|
4748
5452
|
|
5453
|
+
# @note When making an API call, you may pass UpdateRulesetRequest
|
5454
|
+
# data as a hash:
|
5455
|
+
#
|
5456
|
+
# {
|
5457
|
+
# name: "RulesetName", # required
|
5458
|
+
# description: "RulesetDescription",
|
5459
|
+
# rules: [ # required
|
5460
|
+
# {
|
5461
|
+
# name: "RuleName", # required
|
5462
|
+
# disabled: false,
|
5463
|
+
# check_expression: "Expression", # required
|
5464
|
+
# substitution_map: {
|
5465
|
+
# "ValueReference" => "ConditionValue",
|
5466
|
+
# },
|
5467
|
+
# threshold: {
|
5468
|
+
# value: 1.0, # required
|
5469
|
+
# type: "GREATER_THAN_OR_EQUAL", # accepts GREATER_THAN_OR_EQUAL, LESS_THAN_OR_EQUAL, GREATER_THAN, LESS_THAN
|
5470
|
+
# unit: "COUNT", # accepts COUNT, PERCENTAGE
|
5471
|
+
# },
|
5472
|
+
# column_selectors: [
|
5473
|
+
# {
|
5474
|
+
# regex: "ColumnName",
|
5475
|
+
# name: "ColumnName",
|
5476
|
+
# },
|
5477
|
+
# ],
|
5478
|
+
# },
|
5479
|
+
# ],
|
5480
|
+
# }
|
5481
|
+
#
|
5482
|
+
# @!attribute [rw] name
|
5483
|
+
# The name of the ruleset to be updated.
|
5484
|
+
# @return [String]
|
5485
|
+
#
|
5486
|
+
# @!attribute [rw] description
|
5487
|
+
# The description of the ruleset.
|
5488
|
+
# @return [String]
|
5489
|
+
#
|
5490
|
+
# @!attribute [rw] rules
|
5491
|
+
# A list of rules that are defined with the ruleset. A rule includes
|
5492
|
+
# one or more checks to be validated on a DataBrew dataset.
|
5493
|
+
# @return [Array<Types::Rule>]
|
5494
|
+
#
|
5495
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/UpdateRulesetRequest AWS API Documentation
|
5496
|
+
#
|
5497
|
+
class UpdateRulesetRequest < Struct.new(
|
5498
|
+
:name,
|
5499
|
+
:description,
|
5500
|
+
:rules)
|
5501
|
+
SENSITIVE = []
|
5502
|
+
include Aws::Structure
|
5503
|
+
end
|
5504
|
+
|
5505
|
+
# @!attribute [rw] name
|
5506
|
+
# The name of the updated ruleset.
|
5507
|
+
# @return [String]
|
5508
|
+
#
|
5509
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/UpdateRulesetResponse AWS API Documentation
|
5510
|
+
#
|
5511
|
+
class UpdateRulesetResponse < Struct.new(
|
5512
|
+
:name)
|
5513
|
+
SENSITIVE = []
|
5514
|
+
include Aws::Structure
|
5515
|
+
end
|
5516
|
+
|
4749
5517
|
# @note When making an API call, you may pass UpdateScheduleRequest
|
4750
5518
|
# data as a hash:
|
4751
5519
|
#
|
@@ -4795,6 +5563,40 @@ module Aws::GlueDataBrew
|
|
4795
5563
|
include Aws::Structure
|
4796
5564
|
end
|
4797
5565
|
|
5566
|
+
# Configuration for data quality validation. Used to select the Rulesets
|
5567
|
+
# and Validation Mode to be used in the profile job. When
|
5568
|
+
# ValidationConfiguration is null, the profile job will run without data
|
5569
|
+
# quality validation.
|
5570
|
+
#
|
5571
|
+
# @note When making an API call, you may pass ValidationConfiguration
|
5572
|
+
# data as a hash:
|
5573
|
+
#
|
5574
|
+
# {
|
5575
|
+
# ruleset_arn: "Arn", # required
|
5576
|
+
# validation_mode: "CHECK_ALL", # accepts CHECK_ALL
|
5577
|
+
# }
|
5578
|
+
#
|
5579
|
+
# @!attribute [rw] ruleset_arn
|
5580
|
+
# The Amazon Resource Name (ARN) for the ruleset to be validated in
|
5581
|
+
# the profile job. The TargetArn of the selected ruleset should be the
|
5582
|
+
# same as the Amazon Resource Name (ARN) of the dataset that is
|
5583
|
+
# associated with the profile job.
|
5584
|
+
# @return [String]
|
5585
|
+
#
|
5586
|
+
# @!attribute [rw] validation_mode
|
5587
|
+
# Mode of data quality validation. Default mode is “CHECK\_ALL” which
|
5588
|
+
# verifies all rules defined in the selected ruleset.
|
5589
|
+
# @return [String]
|
5590
|
+
#
|
5591
|
+
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/ValidationConfiguration AWS API Documentation
|
5592
|
+
#
|
5593
|
+
class ValidationConfiguration < Struct.new(
|
5594
|
+
:ruleset_arn,
|
5595
|
+
:validation_mode)
|
5596
|
+
SENSITIVE = []
|
5597
|
+
include Aws::Structure
|
5598
|
+
end
|
5599
|
+
|
4798
5600
|
# The input parameters for this request failed validation.
|
4799
5601
|
#
|
4800
5602
|
# @!attribute [rw] message
|
@@ -4817,6 +5619,9 @@ module Aws::GlueDataBrew
|
|
4817
5619
|
# start_column_index: 1, # required
|
4818
5620
|
# column_range: 1,
|
4819
5621
|
# hidden_columns: ["ColumnName"],
|
5622
|
+
# start_row_index: 1,
|
5623
|
+
# row_range: 1,
|
5624
|
+
# analytics: "ENABLE", # accepts ENABLE, DISABLE
|
4820
5625
|
# }
|
4821
5626
|
#
|
4822
5627
|
# @!attribute [rw] start_column_index
|
@@ -4834,12 +5639,30 @@ module Aws::GlueDataBrew
|
|
4834
5639
|
# A list of columns to hide in the view frame.
|
4835
5640
|
# @return [Array<String>]
|
4836
5641
|
#
|
5642
|
+
# @!attribute [rw] start_row_index
|
5643
|
+
# The starting index for the range of rows to return in the view
|
5644
|
+
# frame.
|
5645
|
+
# @return [Integer]
|
5646
|
+
#
|
5647
|
+
# @!attribute [rw] row_range
|
5648
|
+
# The number of rows to include in the view frame, beginning with the
|
5649
|
+
# `StartRowIndex` value.
|
5650
|
+
# @return [Integer]
|
5651
|
+
#
|
5652
|
+
# @!attribute [rw] analytics
|
5653
|
+
# Controls if analytics computation is enabled or disabled. Enabled by
|
5654
|
+
# default.
|
5655
|
+
# @return [String]
|
5656
|
+
#
|
4837
5657
|
# @see http://docs.aws.amazon.com/goto/WebAPI/databrew-2017-07-25/ViewFrame AWS API Documentation
|
4838
5658
|
#
|
4839
5659
|
class ViewFrame < Struct.new(
|
4840
5660
|
:start_column_index,
|
4841
5661
|
:column_range,
|
4842
|
-
:hidden_columns
|
5662
|
+
:hidden_columns,
|
5663
|
+
:start_row_index,
|
5664
|
+
:row_range,
|
5665
|
+
:analytics)
|
4843
5666
|
SENSITIVE = []
|
4844
5667
|
include Aws::Structure
|
4845
5668
|
end
|