aws-sdk-glue 1.1.0 → 1.2.0

Sign up to get free protection for your applications and to get access to all the features.
@@ -466,21 +466,29 @@ module Aws::Glue
466
466
  include Aws::Structure
467
467
  end
468
468
 
469
- # Classifiers are written in Python and triggered during a Crawl Task.
470
- # You can write your own Classifiers to best categorize your data
469
+ # Classifiers are written in Python and triggered during a crawl task.
470
+ # You can write your own classifiers to best categorize your data
471
471
  # sources and specify the appropriate schemas to use for them. A
472
- # Classifier first checks whether a given file is in a format it can
473
- # handle, and then, if so, creates a schema in the form of a
472
+ # classifier checks whether a given file is in a format it can handle,
473
+ # and if it is, the classifier creates a schema in the form of a
474
474
  # `StructType` object that matches that data format.
475
475
  #
476
+ # A classifier can be either a `grok` classifier or an XML classifier,
477
+ # specified in one or the other field of the `Classifier` object.
478
+ #
476
479
  # @!attribute [rw] grok_classifier
477
- # A GrokClassifier object.
480
+ # A `GrokClassifier` object.
478
481
  # @return [Types::GrokClassifier]
479
482
  #
483
+ # @!attribute [rw] xml_classifier
484
+ # An `XMLClassifier` object.
485
+ # @return [Types::XMLClassifier]
486
+ #
480
487
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/Classifier AWS API Documentation
481
488
  #
482
489
  class Classifier < Struct.new(
483
- :grok_classifier)
490
+ :grok_classifier,
491
+ :xml_classifier)
484
492
  include Aws::Structure
485
493
  end
486
494
 
@@ -792,15 +800,16 @@ module Aws::Glue
792
800
 
793
801
  # Specifies a crawler program that examines a data source and uses
794
802
  # classifiers to try to determine its schema. If successful, the crawler
795
- # records metatdata concerning the data source in the Data Catalog.
803
+ # records metadata concerning the data source in the AWS Glue Data
804
+ # Catalog.
796
805
  #
797
806
  # @!attribute [rw] name
798
- # The `Crawler` name.
807
+ # The crawler name.
799
808
  # @return [String]
800
809
  #
801
810
  # @!attribute [rw] role
802
811
  # The IAM role (or ARN of an IAM role) used to access customer
803
- # resources such as data in S3.
812
+ # resources, such as data in Amazon S3.
804
813
  # @return [String]
805
814
  #
806
815
  # @!attribute [rw] targets
@@ -808,46 +817,46 @@ module Aws::Glue
808
817
  # @return [Types::CrawlerTargets]
809
818
  #
810
819
  # @!attribute [rw] database_name
811
- # The `Database` where this Crawler's output should be stored.
820
+ # The database where metadata is written by this crawler.
812
821
  # @return [String]
813
822
  #
814
823
  # @!attribute [rw] description
815
- # A description of this Crawler and where it should be used.
824
+ # A description of the crawler.
816
825
  # @return [String]
817
826
  #
818
827
  # @!attribute [rw] classifiers
819
- # A list of custom `Classifier`s associated with this Crawler.
828
+ # A list of custom classifiers associated with the crawler.
820
829
  # @return [Array<String>]
821
830
  #
822
831
  # @!attribute [rw] schema_change_policy
823
- # Sets policy for the crawler's update and delete behavior.
832
+ # Sets the behavior when the crawler finds a changed or deleted
833
+ # object.
824
834
  # @return [Types::SchemaChangePolicy]
825
835
  #
826
836
  # @!attribute [rw] state
827
- # Indicates whether this Crawler is running, or whether a run is
837
+ # Indicates whether the crawler is running, or whether a run is
828
838
  # pending.
829
839
  # @return [String]
830
840
  #
831
841
  # @!attribute [rw] table_prefix
832
- # The table prefix used for catalog tables created.
842
+ # The prefix added to the names of tables that are created.
833
843
  # @return [String]
834
844
  #
835
845
  # @!attribute [rw] schedule
836
- # A `Schedule` object that specifies the schedule on which this
837
- # Crawler is to be run.
846
+ # For scheduled crawlers, the schedule when the crawler runs.
838
847
  # @return [Types::Schedule]
839
848
  #
840
849
  # @!attribute [rw] crawl_elapsed_time
841
- # If this Crawler is running, contains the total time elapsed since
842
- # the last crawl began.
850
+ # If the crawler is running, contains the total time elapsed since the
851
+ # last crawl began.
843
852
  # @return [Integer]
844
853
  #
845
854
  # @!attribute [rw] creation_time
846
- # The time when the Crawler was created.
855
+ # The time when the crawler was created.
847
856
  # @return [Time]
848
857
  #
849
858
  # @!attribute [rw] last_updated
850
- # The time the Crawler was last updated.
859
+ # The time the crawler was last updated.
851
860
  # @return [Time]
852
861
  #
853
862
  # @!attribute [rw] last_crawl
@@ -856,9 +865,20 @@ module Aws::Glue
856
865
  # @return [Types::LastCrawlInfo]
857
866
  #
858
867
  # @!attribute [rw] version
859
- # The version of the Crawler.
868
+ # The version of the crawler.
860
869
  # @return [Integer]
861
870
  #
871
+ # @!attribute [rw] configuration
872
+ # Crawler configuration information. This versioned JSON string allows
873
+ # users to specify aspects of a crawler's behavior.
874
+ #
875
+ # You can use this field to force partitions to inherit metadata such
876
+ # as classification, input format, output format, serde information,
877
+ # and schema from their parent table, rather than detect this
878
+ # information separately for each partition. Use the following JSON
879
+ # string to specify that behavior:
880
+ # @return [String]
881
+ #
862
882
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/Crawler AWS API Documentation
863
883
  #
864
884
  class Crawler < Struct.new(
@@ -876,7 +896,8 @@ module Aws::Glue
876
896
  :creation_time,
877
897
  :last_updated,
878
898
  :last_crawl,
879
- :version)
899
+ :version,
900
+ :configuration)
880
901
  include Aws::Structure
881
902
  end
882
903
 
@@ -891,7 +912,8 @@ module Aws::Glue
891
912
  # @return [Float]
892
913
  #
893
914
  # @!attribute [rw] still_estimating
894
- # True if the crawler is estimating its
915
+ # True if the crawler is still estimating how long it will take to
916
+ # complete this run.
895
917
  # @return [Boolean]
896
918
  #
897
919
  # @!attribute [rw] last_runtime_seconds
@@ -903,15 +925,15 @@ module Aws::Glue
903
925
  # @return [Float]
904
926
  #
905
927
  # @!attribute [rw] tables_created
906
- # A list of the tables created by this crawler.
928
+ # The number of tables created by this crawler.
907
929
  # @return [Integer]
908
930
  #
909
931
  # @!attribute [rw] tables_updated
910
- # A list of the tables created by this crawler.
932
+ # The number of tables updated by this crawler.
911
933
  # @return [Integer]
912
934
  #
913
935
  # @!attribute [rw] tables_deleted
914
- # A list of the tables deleted by this crawler.
936
+ # The number of tables deleted by this crawler.
915
937
  # @return [Integer]
916
938
  #
917
939
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/CrawlerMetrics AWS API Documentation
@@ -928,7 +950,7 @@ module Aws::Glue
928
950
  include Aws::Structure
929
951
  end
930
952
 
931
- # Specifies crawler targets.
953
+ # Specifies data stores to crawl.
932
954
  #
933
955
  # @note When making an API call, you may pass CrawlerTargets
934
956
  # data as a hash:
@@ -950,7 +972,7 @@ module Aws::Glue
950
972
  # }
951
973
  #
952
974
  # @!attribute [rw] s3_targets
953
- # Specifies targets in AWS S3.
975
+ # Specifies Amazon S3 targets.
954
976
  # @return [Array<Types::S3Target>]
955
977
  #
956
978
  # @!attribute [rw] jdbc_targets
@@ -975,16 +997,26 @@ module Aws::Glue
975
997
  # grok_pattern: "GrokPattern", # required
976
998
  # custom_patterns: "CustomPatterns",
977
999
  # },
1000
+ # xml_classifier: {
1001
+ # classification: "Classification", # required
1002
+ # name: "NameString", # required
1003
+ # row_tag: "RowTag",
1004
+ # },
978
1005
  # }
979
1006
  #
980
1007
  # @!attribute [rw] grok_classifier
981
- # A grok classifier to create.
1008
+ # A `GrokClassifier` object specifying the classifier to create.
982
1009
  # @return [Types::CreateGrokClassifierRequest]
983
1010
  #
1011
+ # @!attribute [rw] xml_classifier
1012
+ # An `XMLClassifier` object specifying the classifier to create.
1013
+ # @return [Types::CreateXMLClassifierRequest]
1014
+ #
984
1015
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/CreateClassifierRequest AWS API Documentation
985
1016
  #
986
1017
  class CreateClassifierRequest < Struct.new(
987
- :grok_classifier)
1018
+ :grok_classifier,
1019
+ :xml_classifier)
988
1020
  include Aws::Structure
989
1021
  end
990
1022
 
@@ -1039,7 +1071,7 @@ module Aws::Glue
1039
1071
  #
1040
1072
  # {
1041
1073
  # name: "NameString", # required
1042
- # role: "RoleArn", # required
1074
+ # role: "Role", # required
1043
1075
  # database_name: "DatabaseName", # required
1044
1076
  # description: "DescriptionString",
1045
1077
  # targets: { # required
@@ -1064,24 +1096,25 @@ module Aws::Glue
1064
1096
  # update_behavior: "LOG", # accepts LOG, UPDATE_IN_DATABASE
1065
1097
  # delete_behavior: "LOG", # accepts LOG, DELETE_FROM_DATABASE, DEPRECATE_IN_DATABASE
1066
1098
  # },
1099
+ # configuration: "CrawlerConfiguration",
1067
1100
  # }
1068
1101
  #
1069
1102
  # @!attribute [rw] name
1070
- # Name of the new `Crawler`.
1103
+ # Name of the new crawler.
1071
1104
  # @return [String]
1072
1105
  #
1073
1106
  # @!attribute [rw] role
1074
- # The IAM role (or ARN of an IAM role) used by the new `Crawler` to
1107
+ # The IAM role (or ARN of an IAM role) used by the new crawler to
1075
1108
  # access customer resources.
1076
1109
  # @return [String]
1077
1110
  #
1078
1111
  # @!attribute [rw] database_name
1079
- # The Glue `Database` where results will be stored, such as:
1112
+ # The AWS Glue database where results are written, such as:
1080
1113
  # `arn:aws:daylight:us-east-1::database/sometable/*`.
1081
1114
  # @return [String]
1082
1115
  #
1083
1116
  # @!attribute [rw] description
1084
- # A description of the new `Crawler`.
1117
+ # A description of the new crawler.
1085
1118
  # @return [String]
1086
1119
  #
1087
1120
  # @!attribute [rw] targets
@@ -1099,20 +1132,30 @@ module Aws::Glue
1099
1132
  # @return [String]
1100
1133
  #
1101
1134
  # @!attribute [rw] classifiers
1102
- # A list of custom `Classifier` names that the user has registered. By
1135
+ # A list of custom classifiers that the user has registered. By
1103
1136
  # default, all AWS classifiers are included in a crawl, but these
1104
1137
  # custom classifiers always override the default classifiers for a
1105
1138
  # given classification.
1106
1139
  # @return [Array<String>]
1107
1140
  #
1108
1141
  # @!attribute [rw] table_prefix
1109
- # The table prefix used for catalog tables created.
1142
+ # The table prefix used for catalog tables that are created.
1110
1143
  # @return [String]
1111
1144
  #
1112
1145
  # @!attribute [rw] schema_change_policy
1113
1146
  # Policy for the crawler's update and deletion behavior.
1114
1147
  # @return [Types::SchemaChangePolicy]
1115
1148
  #
1149
+ # @!attribute [rw] configuration
1150
+ # Crawler configuration information. This versioned JSON string allows
1151
+ # users to specify aspects of a crawler's behavior.
1152
+ #
1153
+ # You can use this field to force partitions to inherit metadata such
1154
+ # as classification, input format, output format, serde information,
1155
+ # and schema from their parent table, rather than detect this
1156
+ # information separately for each partition.
1157
+ # @return [String]
1158
+ #
1116
1159
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/CreateCrawlerRequest AWS API Documentation
1117
1160
  #
1118
1161
  class CreateCrawlerRequest < Struct.new(
@@ -1124,7 +1167,8 @@ module Aws::Glue
1124
1167
  :schedule,
1125
1168
  :classifiers,
1126
1169
  :table_prefix,
1127
- :schema_change_policy)
1170
+ :schema_change_policy,
1171
+ :configuration)
1128
1172
  include Aws::Structure
1129
1173
  end
1130
1174
 
@@ -1321,7 +1365,7 @@ module Aws::Glue
1321
1365
  include Aws::Structure
1322
1366
  end
1323
1367
 
1324
- # Specifies a Grok classifier for CreateClassifier to create.
1368
+ # Specifies a `grok` classifier for `CreateClassifier` to create.
1325
1369
  #
1326
1370
  # @note When making an API call, you may pass CreateGrokClassifierRequest
1327
1371
  # data as a hash:
@@ -1334,12 +1378,12 @@ module Aws::Glue
1334
1378
  # }
1335
1379
  #
1336
1380
  # @!attribute [rw] classification
1337
- # The type of result that the classifier matches, such as Twitter
1338
- # Json, Omniture logs, Cloudwatch logs, and so forth.
1381
+ # An identifier of the data format that the classifier matches, such
1382
+ # as Twitter, JSON, Omniture logs, Amazon CloudWatch Logs, and so on.
1339
1383
  # @return [String]
1340
1384
  #
1341
1385
  # @!attribute [rw] name
1342
- # The name of the new Classifier.
1386
+ # The name of the new classifier.
1343
1387
  # @return [String]
1344
1388
  #
1345
1389
  # @!attribute [rw] grok_pattern
@@ -1347,7 +1391,7 @@ module Aws::Glue
1347
1391
  # @return [String]
1348
1392
  #
1349
1393
  # @!attribute [rw] custom_patterns
1350
- # Custom grok patterns used by this classifier.
1394
+ # Optional custom grok patterns used by this classifier.
1351
1395
  # @return [String]
1352
1396
  #
1353
1397
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/CreateGrokClassifierRequest AWS API Documentation
@@ -1819,6 +1863,41 @@ module Aws::Glue
1819
1863
  #
1820
1864
  class CreateUserDefinedFunctionResponse < Aws::EmptyStructure; end
1821
1865
 
1866
+ # Specifies an XML classifier for `CreateClassifier` to create.
1867
+ #
1868
+ # @note When making an API call, you may pass CreateXMLClassifierRequest
1869
+ # data as a hash:
1870
+ #
1871
+ # {
1872
+ # classification: "Classification", # required
1873
+ # name: "NameString", # required
1874
+ # row_tag: "RowTag",
1875
+ # }
1876
+ #
1877
+ # @!attribute [rw] classification
1878
+ # An identifier of the data format that the classifier matches.
1879
+ # @return [String]
1880
+ #
1881
+ # @!attribute [rw] name
1882
+ # The name of the classifier.
1883
+ # @return [String]
1884
+ #
1885
+ # @!attribute [rw] row_tag
1886
+ # The XML tag designating the element that contains each record in an
1887
+ # XML document being parsed. Note that this cannot be an empty
1888
+ # element. It must contain child elements representing fields in the
1889
+ # record.
1890
+ # @return [String]
1891
+ #
1892
+ # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/CreateXMLClassifierRequest AWS API Documentation
1893
+ #
1894
+ class CreateXMLClassifierRequest < Struct.new(
1895
+ :classification,
1896
+ :name,
1897
+ :row_tag)
1898
+ include Aws::Structure
1899
+ end
1900
+
1822
1901
  # The `Database` object represents a logical grouping of tables that may
1823
1902
  # reside in a Hive metastore or an RDBMS.
1824
1903
  #
@@ -1903,7 +1982,7 @@ module Aws::Glue
1903
1982
  # }
1904
1983
  #
1905
1984
  # @!attribute [rw] name
1906
- # Name of the `Classifier` to remove.
1985
+ # Name of the classifier to remove.
1907
1986
  # @return [String]
1908
1987
  #
1909
1988
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/DeleteClassifierRequest AWS API Documentation
@@ -1954,7 +2033,7 @@ module Aws::Glue
1954
2033
  # }
1955
2034
  #
1956
2035
  # @!attribute [rw] name
1957
- # Name of the `Crawler` to remove.
2036
+ # Name of the crawler to remove.
1958
2037
  # @return [String]
1959
2038
  #
1960
2039
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/DeleteCrawlerRequest AWS API Documentation
@@ -2419,7 +2498,7 @@ module Aws::Glue
2419
2498
  # }
2420
2499
  #
2421
2500
  # @!attribute [rw] name
2422
- # Name of the `Classifier` to retrieve.
2501
+ # Name of the classifier to retrieve.
2423
2502
  # @return [String]
2424
2503
  #
2425
2504
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/GetClassifierRequest AWS API Documentation
@@ -2430,7 +2509,7 @@ module Aws::Glue
2430
2509
  end
2431
2510
 
2432
2511
  # @!attribute [rw] classifier
2433
- # The requested `Classifier`.
2512
+ # The requested classifier.
2434
2513
  # @return [Types::Classifier]
2435
2514
  #
2436
2515
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/GetClassifierResponse AWS API Documentation
@@ -2465,7 +2544,7 @@ module Aws::Glue
2465
2544
  end
2466
2545
 
2467
2546
  # @!attribute [rw] classifiers
2468
- # The requested list of `Classifier` objects.
2547
+ # The requested list of classifier objects.
2469
2548
  # @return [Array<Types::Classifier>]
2470
2549
  #
2471
2550
  # @!attribute [rw] next_token
@@ -2657,7 +2736,7 @@ module Aws::Glue
2657
2736
  # }
2658
2737
  #
2659
2738
  # @!attribute [rw] name
2660
- # Name of the `Crawler` to retrieve metadata for.
2739
+ # Name of the crawler to retrieve metadata for.
2661
2740
  # @return [String]
2662
2741
  #
2663
2742
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/GetCrawlerRequest AWS API Documentation
@@ -2668,7 +2747,7 @@ module Aws::Glue
2668
2747
  end
2669
2748
 
2670
2749
  # @!attribute [rw] crawler
2671
- # The metadata for the specified `Crawler`.
2750
+ # The metadata for the specified crawler.
2672
2751
  # @return [Types::Crawler]
2673
2752
  #
2674
2753
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/GetCrawlerResponse AWS API Documentation
@@ -2687,7 +2766,7 @@ module Aws::Glue
2687
2766
  # }
2688
2767
  #
2689
2768
  # @!attribute [rw] max_results
2690
- # The number of Crawlers to return on each call.
2769
+ # The number of crawlers to return on each call.
2691
2770
  # @return [Integer]
2692
2771
  #
2693
2772
  # @!attribute [rw] next_token
@@ -2703,7 +2782,7 @@ module Aws::Glue
2703
2782
  end
2704
2783
 
2705
2784
  # @!attribute [rw] crawlers
2706
- # A list of `Crawler` metadata.
2785
+ # A list of crawler metadata.
2707
2786
  # @return [Array<Types::Crawler>]
2708
2787
  #
2709
2788
  # @!attribute [rw] next_token
@@ -3321,7 +3400,7 @@ module Aws::Glue
3321
3400
  end
3322
3401
 
3323
3402
  # @!attribute [rw] python_script
3324
- # A python script to perform the mapping.
3403
+ # A Python script to perform the mapping.
3325
3404
  # @return [String]
3326
3405
  #
3327
3406
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/GetPlanResponse AWS API Documentation
@@ -3674,15 +3753,15 @@ module Aws::Glue
3674
3753
  include Aws::Structure
3675
3754
  end
3676
3755
 
3677
- # A classifier that uses `grok`.
3756
+ # A classifier that uses `grok` patterns.
3678
3757
  #
3679
3758
  # @!attribute [rw] name
3680
3759
  # The name of the classifier.
3681
3760
  # @return [String]
3682
3761
  #
3683
3762
  # @!attribute [rw] classification
3684
- # The data form that the classifier matches, such as Twitter, JSON,
3685
- # Omniture Logs, and so forth.
3763
+ # An identifier of the data format that the classifier matches, such
3764
+ # as Twitter, JSON, Omniture logs, and so on.
3686
3765
  # @return [String]
3687
3766
  #
3688
3767
  # @!attribute [rw] creation_time
@@ -3698,11 +3777,22 @@ module Aws::Glue
3698
3777
  # @return [Integer]
3699
3778
  #
3700
3779
  # @!attribute [rw] grok_pattern
3701
- # The grok pattern used by this classifier.
3780
+ # The grok pattern applied to a data store by this classifier. For
3781
+ # more information, see built-in patterns in [Writing Custom
3782
+ # Classifiers][1].
3783
+ #
3784
+ #
3785
+ #
3786
+ # [1]: http://docs.aws.amazon.com/glue/latest/dg/custom-classifier.html
3702
3787
  # @return [String]
3703
3788
  #
3704
3789
  # @!attribute [rw] custom_patterns
3705
- # Custom grok patterns used by this classifier.
3790
+ # Optional custom grok patterns defined by this classifier. For more
3791
+ # information, see custom patterns in [Writing Custom Classifiers][1].
3792
+ #
3793
+ #
3794
+ #
3795
+ # [1]: http://docs.aws.amazon.com/glue/latest/dg/custom-classifier.html
3706
3796
  # @return [String]
3707
3797
  #
3708
3798
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/GrokClassifier AWS API Documentation
@@ -3741,7 +3831,7 @@ module Aws::Glue
3741
3831
  #
3742
3832
  class ImportCatalogToGlueResponse < Aws::EmptyStructure; end
3743
3833
 
3744
- # Specifies a JDBC target for a crawl.
3834
+ # Specifies a JDBC data store to crawl.
3745
3835
  #
3746
3836
  # @note When making an API call, you may pass JdbcTarget
3747
3837
  # data as a hash:
@@ -3753,7 +3843,7 @@ module Aws::Glue
3753
3843
  # }
3754
3844
  #
3755
3845
  # @!attribute [rw] connection_name
3756
- # The name of the connection to use for the JDBC target.
3846
+ # The name of the connection to use to connect to the JDBC target.
3757
3847
  # @return [String]
3758
3848
  #
3759
3849
  # @!attribute [rw] path
@@ -3761,7 +3851,12 @@ module Aws::Glue
3761
3851
  # @return [String]
3762
3852
  #
3763
3853
  # @!attribute [rw] exclusions
3764
- # A list of items to exclude from the crawl.
3854
+ # A list of glob patterns used to exclude items from the crawl. For more
3855
+ # information, see [Catalog Tables with a Crawler][1].
3856
+ #
3857
+ #
3858
+ #
3859
+ # [1]: http://docs.aws.amazon.com/glue/latest/dg/add-crawler.html
3765
3860
  # @return [Array<String>]
3766
3861
  #
3767
3862
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/JdbcTarget AWS API Documentation
@@ -4059,7 +4154,7 @@ module Aws::Glue
4059
4154
  # @return [String]
4060
4155
  #
4061
4156
  # @!attribute [rw] error_message
4062
- # Error information about the last crawl, if an error occurred.
4157
+ # If an error occurred, the error information about the last crawl.
4063
4158
  # @return [String]
4064
4159
  #
4065
4160
  # @!attribute [rw] log_group
@@ -4117,7 +4212,7 @@ module Aws::Glue
4117
4212
  # @return [Array<Types::CodeGenNodeArg>]
4118
4213
  #
4119
4214
  # @!attribute [rw] s3
4120
- # An AWS S3 location.
4215
+ # An Amazon S3 location.
4121
4216
  # @return [Array<Types::CodeGenNodeArg>]
4122
4217
  #
4123
4218
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/Location AWS API Documentation
@@ -4517,7 +4612,7 @@ module Aws::Glue
4517
4612
  include Aws::Structure
4518
4613
  end
4519
4614
 
4520
- # Specifies a crawler target in AWS S3.
4615
+ # Specifies a data store in Amazon S3.
4521
4616
  #
4522
4617
  # @note When making an API call, you may pass S3Target
4523
4618
  # data as a hash:
@@ -4528,11 +4623,16 @@ module Aws::Glue
4528
4623
  # }
4529
4624
  #
4530
4625
  # @!attribute [rw] path
4531
- # The path to the S3 target.
4626
+ # The path to the Amazon S3 target.
4532
4627
  # @return [String]
4533
4628
  #
4534
4629
  # @!attribute [rw] exclusions
4535
- # A list of S3 objects to exclude from the crawl.
4630
+ # A list of glob patterns used to exclude items from the crawl. For more
4631
+ # information, see [Catalog Tables with a Crawler][1].
4632
+ #
4633
+ #
4634
+ #
4635
+ # [1]: http://docs.aws.amazon.com/glue/latest/dg/add-crawler.html
4536
4636
  # @return [Array<String>]
4537
4637
  #
4538
4638
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/S3Target AWS API Documentation
@@ -4578,11 +4678,11 @@ module Aws::Glue
4578
4678
  # }
4579
4679
  #
4580
4680
  # @!attribute [rw] update_behavior
4581
- # The update behavior.
4681
+ # The update behavior when the crawler finds a changed schema.
4582
4682
  # @return [String]
4583
4683
  #
4584
4684
  # @!attribute [rw] delete_behavior
4585
- # The deletion behavior.
4685
+ # The deletion behavior when the crawler finds a deleted object.
4586
4686
  # @return [String]
4587
4687
  #
4588
4688
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/SchemaChangePolicy AWS API Documentation
@@ -4703,7 +4803,7 @@ module Aws::Glue
4703
4803
  # }
4704
4804
  #
4705
4805
  # @!attribute [rw] name
4706
- # Name of the `Crawler` to start.
4806
+ # Name of the crawler to start.
4707
4807
  # @return [String]
4708
4808
  #
4709
4809
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/StartCrawlerRequest AWS API Documentation
@@ -4825,7 +4925,7 @@ module Aws::Glue
4825
4925
  # }
4826
4926
  #
4827
4927
  # @!attribute [rw] name
4828
- # Name of the `Crawler` to stop.
4928
+ # Name of the crawler to stop.
4829
4929
  # @return [String]
4830
4930
  #
4831
4931
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/StopCrawlerRequest AWS API Documentation
@@ -5403,16 +5503,26 @@ module Aws::Glue
5403
5503
  # grok_pattern: "GrokPattern",
5404
5504
  # custom_patterns: "CustomPatterns",
5405
5505
  # },
5506
+ # xml_classifier: {
5507
+ # name: "NameString", # required
5508
+ # classification: "Classification",
5509
+ # row_tag: "RowTag",
5510
+ # },
5406
5511
  # }
5407
5512
  #
5408
5513
  # @!attribute [rw] grok_classifier
5409
5514
  # A `GrokClassifier` object with updated fields.
5410
5515
  # @return [Types::UpdateGrokClassifierRequest]
5411
5516
  #
5517
+ # @!attribute [rw] xml_classifier
5518
+ # An `XMLClassifier` object with updated fields.
5519
+ # @return [Types::UpdateXMLClassifierRequest]
5520
+ #
5412
5521
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/UpdateClassifierRequest AWS API Documentation
5413
5522
  #
5414
5523
  class UpdateClassifierRequest < Struct.new(
5415
- :grok_classifier)
5524
+ :grok_classifier,
5525
+ :xml_classifier)
5416
5526
  include Aws::Structure
5417
5527
  end
5418
5528
 
@@ -5474,7 +5584,7 @@ module Aws::Glue
5474
5584
  #
5475
5585
  # {
5476
5586
  # name: "NameString", # required
5477
- # role: "RoleArn",
5587
+ # role: "Role",
5478
5588
  # database_name: "DatabaseName",
5479
5589
  # description: "DescriptionStringRemovable",
5480
5590
  # targets: {
@@ -5499,28 +5609,29 @@ module Aws::Glue
5499
5609
  # update_behavior: "LOG", # accepts LOG, UPDATE_IN_DATABASE
5500
5610
  # delete_behavior: "LOG", # accepts LOG, DELETE_FROM_DATABASE, DEPRECATE_IN_DATABASE
5501
5611
  # },
5612
+ # configuration: "CrawlerConfiguration",
5502
5613
  # }
5503
5614
  #
5504
5615
  # @!attribute [rw] name
5505
- # Name of the new `Crawler`.
5616
+ # Name of the new crawler.
5506
5617
  # @return [String]
5507
5618
  #
5508
5619
  # @!attribute [rw] role
5509
- # The IAM role (or ARN of an IAM role) used by the new `Crawler` to
5620
+ # The IAM role (or ARN of an IAM role) used by the new crawler to
5510
5621
  # access customer resources.
5511
5622
  # @return [String]
5512
5623
  #
5513
5624
  # @!attribute [rw] database_name
5514
- # The Glue `Database` where results will be stored, such as:
5625
+ # The AWS Glue database where results are stored, such as:
5515
5626
  # `arn:aws:daylight:us-east-1::database/sometable/*`.
5516
5627
  # @return [String]
5517
5628
  #
5518
5629
  # @!attribute [rw] description
5519
- # A description of the new `Crawler`.
5630
+ # A description of the new crawler.
5520
5631
  # @return [String]
5521
5632
  #
5522
5633
  # @!attribute [rw] targets
5523
- # A list of collection of targets to crawl.
5634
+ # A list of targets to crawl.
5524
5635
  # @return [Types::CrawlerTargets]
5525
5636
  #
5526
5637
  # @!attribute [rw] schedule
@@ -5534,20 +5645,31 @@ module Aws::Glue
5534
5645
  # @return [String]
5535
5646
  #
5536
5647
  # @!attribute [rw] classifiers
5537
- # A list of custom `Classifier` names that the user has registered. By
5538
- # default, all AWS classifiers are included in a crawl, but these
5539
- # custom classifiers always override the default classifiers for a
5540
- # given classification.
5648
+ # A list of custom classifiers that the user has registered. By
5649
+ # default, all classifiers are included in a crawl, but these custom
5650
+ # classifiers always override the default classifiers for a given
5651
+ # classification.
5541
5652
  # @return [Array<String>]
5542
5653
  #
5543
5654
  # @!attribute [rw] table_prefix
5544
- # The table prefix used for catalog tables created.
5655
+ # The table prefix used for catalog tables that are created.
5545
5656
  # @return [String]
5546
5657
  #
5547
5658
  # @!attribute [rw] schema_change_policy
5548
5659
  # Policy for the crawler's update and deletion behavior.
5549
5660
  # @return [Types::SchemaChangePolicy]
5550
5661
  #
5662
+ # @!attribute [rw] configuration
5663
+ # Crawler configuration information. This versioned JSON string allows
5664
+ # users to specify aspects of a crawler's behavior.
5665
+ #
5666
+ # You can use this field to force partitions to inherit metadata such
5667
+ # as classification, input format, output format, serde information,
5668
+ # and schema from their parent table, rather than detect this
5669
+ # information separately for each partition. Use the following JSON
5670
+ # string to specify that behavior:
5671
+ # @return [String]
5672
+ #
5551
5673
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/UpdateCrawlerRequest AWS API Documentation
5552
5674
  #
5553
5675
  class UpdateCrawlerRequest < Struct.new(
@@ -5559,7 +5681,8 @@ module Aws::Glue
5559
5681
  :schedule,
5560
5682
  :classifiers,
5561
5683
  :table_prefix,
5562
- :schema_change_policy)
5684
+ :schema_change_policy,
5685
+ :configuration)
5563
5686
  include Aws::Structure
5564
5687
  end
5565
5688
 
@@ -5689,7 +5812,8 @@ module Aws::Glue
5689
5812
  #
5690
5813
  class UpdateDevEndpointResponse < Aws::EmptyStructure; end
5691
5814
 
5692
- # Specifies a Grok classifier to update when passed to UpdateClassifier.
5815
+ # Specifies a grok classifier to update when passed to
5816
+ # `UpdateClassifier`.
5693
5817
  #
5694
5818
  # @note When making an API call, you may pass UpdateGrokClassifierRequest
5695
5819
  # data as a hash:
@@ -5706,8 +5830,8 @@ module Aws::Glue
5706
5830
  # @return [String]
5707
5831
  #
5708
5832
  # @!attribute [rw] classification
5709
- # The type of result that the classifier matches, such as Twitter
5710
- # Json, Omniture logs, Cloudwatch logs, and so forth.
5833
+ # An identifier of the data format that the classifier matches, such
5834
+ # as Twitter, JSON, Omniture logs, Amazon CloudWatch Logs, and so on.
5711
5835
  # @return [String]
5712
5836
  #
5713
5837
  # @!attribute [rw] grok_pattern
@@ -5715,7 +5839,7 @@ module Aws::Glue
5715
5839
  # @return [String]
5716
5840
  #
5717
5841
  # @!attribute [rw] custom_patterns
5718
- # Custom grok patterns used by this classifier.
5842
+ # Optional custom grok patterns used by this classifier.
5719
5843
  # @return [String]
5720
5844
  #
5721
5845
  # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/UpdateGrokClassifierRequest AWS API Documentation
@@ -6082,6 +6206,41 @@ module Aws::Glue
6082
6206
  #
6083
6207
  class UpdateUserDefinedFunctionResponse < Aws::EmptyStructure; end
6084
6208
 
6209
+ # Specifies an XML classifier to be updated.
6210
+ #
6211
+ # @note When making an API call, you may pass UpdateXMLClassifierRequest
6212
+ # data as a hash:
6213
+ #
6214
+ # {
6215
+ # name: "NameString", # required
6216
+ # classification: "Classification",
6217
+ # row_tag: "RowTag",
6218
+ # }
6219
+ #
6220
+ # @!attribute [rw] name
6221
+ # The name of the classifier.
6222
+ # @return [String]
6223
+ #
6224
+ # @!attribute [rw] classification
6225
+ # An identifier of the data format that the classifier matches.
6226
+ # @return [String]
6227
+ #
6228
+ # @!attribute [rw] row_tag
6229
+ # The XML tag designating the element that contains each record in an
6230
+ # XML document being parsed. Note that this cannot be an empty
6231
+ # element. It must contain child elements representing fields in the
6232
+ # record.
6233
+ # @return [String]
6234
+ #
6235
+ # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/UpdateXMLClassifierRequest AWS API Documentation
6236
+ #
6237
+ class UpdateXMLClassifierRequest < Struct.new(
6238
+ :name,
6239
+ :classification,
6240
+ :row_tag)
6241
+ include Aws::Structure
6242
+ end
6243
+
6085
6244
  # Represents the equivalent of a Hive user-defined function (`UDF`)
6086
6245
  # definition.
6087
6246
  #
@@ -6170,5 +6329,46 @@ module Aws::Glue
6170
6329
  include Aws::Structure
6171
6330
  end
6172
6331
 
6332
+ # A classifier for `XML` content.
6333
+ #
6334
+ # @!attribute [rw] name
6335
+ # The name of the classifier.
6336
+ # @return [String]
6337
+ #
6338
+ # @!attribute [rw] classification
6339
+ # An identifier of the data format that the classifier matches.
6340
+ # @return [String]
6341
+ #
6342
+ # @!attribute [rw] creation_time
6343
+ # The time this classifier was registered.
6344
+ # @return [Time]
6345
+ #
6346
+ # @!attribute [rw] last_updated
6347
+ # The time this classifier was last updated.
6348
+ # @return [Time]
6349
+ #
6350
+ # @!attribute [rw] version
6351
+ # The version of this classifier.
6352
+ # @return [Integer]
6353
+ #
6354
+ # @!attribute [rw] row_tag
6355
+ # The XML tag designating the element that contains each record in an
6356
+ # XML document being parsed. Note that this cannot be an empty
6357
+ # element. It must contain child elements representing fields in the
6358
+ # record.
6359
+ # @return [String]
6360
+ #
6361
+ # @see http://docs.aws.amazon.com/goto/WebAPI/glue-2017-03-31/XMLClassifier AWS API Documentation
6362
+ #
6363
+ class XMLClassifier < Struct.new(
6364
+ :name,
6365
+ :classification,
6366
+ :creation_time,
6367
+ :last_updated,
6368
+ :version,
6369
+ :row_tag)
6370
+ include Aws::Structure
6371
+ end
6372
+
6173
6373
  end
6174
6374
  end