aws-sdk-comprehend 1.67.0 → 1.68.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 98cca79ad616409a627fb408bf9d57dde00f6ae9f610d0b2347cb53172595630
4
- data.tar.gz: 37bf33b746207ed09a41855ec47bac27e7bf7d9618ef40927f7ad89234d2d4ab
3
+ metadata.gz: 2795339a1b5ff7154a977a6f4921117728519249538628c2e430ff0439de0778
4
+ data.tar.gz: 91f757f8d8a73726513ba2a7b526c5991ff24ea62cc072938a85395cfd96b431
5
5
  SHA512:
6
- metadata.gz: ee8117be4044e5ded7fd37ff794c2de556a4f47beec32abee11ffb61a9f7a82ea440c21cec9f1ab7389ad67a8ede376e975cb2b54bf0065e2e224c0ba005aa04
7
- data.tar.gz: ff0b87b8396361b18eaf86b3b907b99e20ca83f1777216fa1446dfe6debac2f6ac769e50d066d0c47474472e408d404a85277ad9224db88833303b00148d1eb0
6
+ metadata.gz: 460952c4bc9f3eee19662f76e4421bf4105807f1c6d0e54e9efea4c501201d382652a87dc5e1a01613e1105c6b5250c0f494015545e5d88f33d2eacef57deeaa
7
+ data.tar.gz: da511f2b66c64df9893d055713dc490716ec475a9050d7b2214fd2a82243a8ec073a04d300418bd14264e8673ab5836dd2ddf77aa48546a0d31947a9c06063b5
data/CHANGELOG.md CHANGED
@@ -1,6 +1,11 @@
1
1
  Unreleased Changes
2
2
  ------------------
3
3
 
4
+ 1.68.0 (2023-04-19)
5
+ ------------------
6
+
7
+ * Feature - This release supports native document models for custom classification, in addition to plain-text models. You train native document models using documents (PDF, Word, images) in their native format.
8
+
4
9
  1.67.0 (2023-03-24)
5
10
  ------------------
6
11
 
data/VERSION CHANGED
@@ -1 +1 @@
1
- 1.67.0
1
+ 1.68.0
@@ -765,6 +765,7 @@ module Aws::Comprehend
765
765
  # * {Types::ClassifyDocumentResponse#document_metadata #document_metadata} => Types::DocumentMetadata
766
766
  # * {Types::ClassifyDocumentResponse#document_type #document_type} => Array<Types::DocumentTypeListItem>
767
767
  # * {Types::ClassifyDocumentResponse#errors #errors} => Array<Types::ErrorsListItem>
768
+ # * {Types::ClassifyDocumentResponse#warnings #warnings} => Array<Types::WarningsListItem>
768
769
  #
769
770
  # @example Request syntax with placeholder values
770
771
  #
@@ -800,6 +801,10 @@ module Aws::Comprehend
800
801
  # resp.errors[0].page #=> Integer
801
802
  # resp.errors[0].error_code #=> String, one of "TEXTRACT_BAD_PAGE", "TEXTRACT_PROVISIONED_THROUGHPUT_EXCEEDED", "PAGE_CHARACTERS_EXCEEDED", "PAGE_SIZE_EXCEEDED", "INTERNAL_SERVER_ERROR"
802
803
  # resp.errors[0].error_message #=> String
804
+ # resp.warnings #=> Array
805
+ # resp.warnings[0].page #=> Integer
806
+ # resp.warnings[0].warn_code #=> String, one of "INFERENCING_PLAINTEXT_WITH_NATIVE_TRAINED_MODEL", "INFERENCING_NATIVE_DOCUMENT_WITH_PLAINTEXT_TRAINED_MODEL"
807
+ # resp.warnings[0].warn_message #=> String
803
808
  #
804
809
  # @see http://docs.aws.amazon.com/goto/WebAPI/comprehend-2017-11-27/ClassifyDocument AWS API Documentation
805
810
  #
@@ -947,14 +952,13 @@ module Aws::Comprehend
947
952
 
948
953
  # Creates a new document classifier that you can use to categorize
949
954
  # documents. To create a classifier, you provide a set of training
950
- # documents that labeled with the categories that you want to use. After
951
- # the classifier is trained you can use it to categorize a set of
952
- # labeled documents into the categories. For more information, see
953
- # [Document Classification][1] in the Comprehend Developer Guide.
955
+ # documents that are labeled with the categories that you want to use.
956
+ # For more information, see [Training classifier models][1] in the
957
+ # Comprehend Developer Guide.
954
958
  #
955
959
  #
956
960
  #
957
- # [1]: https://docs.aws.amazon.com/comprehend/latest/dg/how-document-classification.html
961
+ # [1]: https://docs.aws.amazon.com/comprehend/latest/dg/training-classifier-model.html
958
962
  #
959
963
  # @option params [required, String] :document_classifier_name
960
964
  # The name of the document classifier.
@@ -980,8 +984,9 @@ module Aws::Comprehend
980
984
  # Specifies the format and location of the input data for the job.
981
985
  #
982
986
  # @option params [Types::DocumentClassifierOutputDataConfig] :output_data_config
983
- # Enables the addition of output results configuration parameters for
984
- # custom classifier jobs.
987
+ # Specifies the location for the output files from a custom classifier
988
+ # job. This parameter is required for a request that creates a native
989
+ # classifier model.
985
990
  #
986
991
  # @option params [String] :client_request_token
987
992
  # A unique identifier for the request. If you don't set the client
@@ -1082,6 +1087,16 @@ module Aws::Comprehend
1082
1087
  # document_type: "PLAIN_TEXT_DOCUMENT", # accepts PLAIN_TEXT_DOCUMENT, SEMI_STRUCTURED_DOCUMENT
1083
1088
  # },
1084
1089
  # ],
1090
+ # document_type: "PLAIN_TEXT_DOCUMENT", # accepts PLAIN_TEXT_DOCUMENT, SEMI_STRUCTURED_DOCUMENT
1091
+ # documents: {
1092
+ # s3_uri: "S3Uri", # required
1093
+ # test_s3_uri: "S3Uri",
1094
+ # },
1095
+ # document_reader_config: {
1096
+ # document_read_action: "TEXTRACT_DETECT_DOCUMENT_TEXT", # required, accepts TEXTRACT_DETECT_DOCUMENT_TEXT, TEXTRACT_ANALYZE_DOCUMENT
1097
+ # document_read_mode: "SERVICE_DEFAULT", # accepts SERVICE_DEFAULT, FORCE_DOCUMENT_READ_ACTION
1098
+ # feature_types: ["TABLES"], # accepts TABLES, FORMS
1099
+ # },
1085
1100
  # },
1086
1101
  # output_data_config: {
1087
1102
  # s3_uri: "S3Uri",
@@ -1760,6 +1775,13 @@ module Aws::Comprehend
1760
1775
  # resp.document_classifier_properties.input_data_config.augmented_manifests[0].annotation_data_s3_uri #=> String
1761
1776
  # resp.document_classifier_properties.input_data_config.augmented_manifests[0].source_documents_s3_uri #=> String
1762
1777
  # resp.document_classifier_properties.input_data_config.augmented_manifests[0].document_type #=> String, one of "PLAIN_TEXT_DOCUMENT", "SEMI_STRUCTURED_DOCUMENT"
1778
+ # resp.document_classifier_properties.input_data_config.document_type #=> String, one of "PLAIN_TEXT_DOCUMENT", "SEMI_STRUCTURED_DOCUMENT"
1779
+ # resp.document_classifier_properties.input_data_config.documents.s3_uri #=> String
1780
+ # resp.document_classifier_properties.input_data_config.documents.test_s3_uri #=> String
1781
+ # resp.document_classifier_properties.input_data_config.document_reader_config.document_read_action #=> String, one of "TEXTRACT_DETECT_DOCUMENT_TEXT", "TEXTRACT_ANALYZE_DOCUMENT"
1782
+ # resp.document_classifier_properties.input_data_config.document_reader_config.document_read_mode #=> String, one of "SERVICE_DEFAULT", "FORCE_DOCUMENT_READ_ACTION"
1783
+ # resp.document_classifier_properties.input_data_config.document_reader_config.feature_types #=> Array
1784
+ # resp.document_classifier_properties.input_data_config.document_reader_config.feature_types[0] #=> String, one of "TABLES", "FORMS"
1763
1785
  # resp.document_classifier_properties.output_data_config.s3_uri #=> String
1764
1786
  # resp.document_classifier_properties.output_data_config.kms_key_id #=> String
1765
1787
  # resp.document_classifier_properties.output_data_config.flywheel_stats_s3_prefix #=> String
@@ -3201,6 +3223,13 @@ module Aws::Comprehend
3201
3223
  # resp.document_classifier_properties_list[0].input_data_config.augmented_manifests[0].annotation_data_s3_uri #=> String
3202
3224
  # resp.document_classifier_properties_list[0].input_data_config.augmented_manifests[0].source_documents_s3_uri #=> String
3203
3225
  # resp.document_classifier_properties_list[0].input_data_config.augmented_manifests[0].document_type #=> String, one of "PLAIN_TEXT_DOCUMENT", "SEMI_STRUCTURED_DOCUMENT"
3226
+ # resp.document_classifier_properties_list[0].input_data_config.document_type #=> String, one of "PLAIN_TEXT_DOCUMENT", "SEMI_STRUCTURED_DOCUMENT"
3227
+ # resp.document_classifier_properties_list[0].input_data_config.documents.s3_uri #=> String
3228
+ # resp.document_classifier_properties_list[0].input_data_config.documents.test_s3_uri #=> String
3229
+ # resp.document_classifier_properties_list[0].input_data_config.document_reader_config.document_read_action #=> String, one of "TEXTRACT_DETECT_DOCUMENT_TEXT", "TEXTRACT_ANALYZE_DOCUMENT"
3230
+ # resp.document_classifier_properties_list[0].input_data_config.document_reader_config.document_read_mode #=> String, one of "SERVICE_DEFAULT", "FORCE_DOCUMENT_READ_ACTION"
3231
+ # resp.document_classifier_properties_list[0].input_data_config.document_reader_config.feature_types #=> Array
3232
+ # resp.document_classifier_properties_list[0].input_data_config.document_reader_config.feature_types[0] #=> String, one of "TABLES", "FORMS"
3204
3233
  # resp.document_classifier_properties_list[0].output_data_config.s3_uri #=> String
3205
3234
  # resp.document_classifier_properties_list[0].output_data_config.kms_key_id #=> String
3206
3235
  # resp.document_classifier_properties_list[0].output_data_config.flywheel_stats_s3_prefix #=> String
@@ -5786,7 +5815,7 @@ module Aws::Comprehend
5786
5815
  params: params,
5787
5816
  config: config)
5788
5817
  context[:gem_name] = 'aws-sdk-comprehend'
5789
- context[:gem_version] = '1.67.0'
5818
+ context[:gem_version] = '1.68.0'
5790
5819
  Seahorse::Client::Request.new(handlers, context)
5791
5820
  end
5792
5821
 
@@ -151,6 +151,8 @@ module Aws::Comprehend
151
151
  DocumentClassifierArn = Shapes::StringShape.new(name: 'DocumentClassifierArn')
152
152
  DocumentClassifierAugmentedManifestsList = Shapes::ListShape.new(name: 'DocumentClassifierAugmentedManifestsList')
153
153
  DocumentClassifierDataFormat = Shapes::StringShape.new(name: 'DocumentClassifierDataFormat')
154
+ DocumentClassifierDocumentTypeFormat = Shapes::StringShape.new(name: 'DocumentClassifierDocumentTypeFormat')
155
+ DocumentClassifierDocuments = Shapes::StructureShape.new(name: 'DocumentClassifierDocuments')
154
156
  DocumentClassifierEndpointArn = Shapes::StringShape.new(name: 'DocumentClassifierEndpointArn')
155
157
  DocumentClassifierFilter = Shapes::StructureShape.new(name: 'DocumentClassifierFilter')
156
158
  DocumentClassifierInputDataConfig = Shapes::StructureShape.new(name: 'DocumentClassifierInputDataConfig')
@@ -305,6 +307,7 @@ module Aws::Comprehend
305
307
  ListOfRelationships = Shapes::ListShape.new(name: 'ListOfRelationships')
306
308
  ListOfSyntaxTokens = Shapes::ListShape.new(name: 'ListOfSyntaxTokens')
307
309
  ListOfTargetedSentimentEntities = Shapes::ListShape.new(name: 'ListOfTargetedSentimentEntities')
310
+ ListOfWarnings = Shapes::ListShape.new(name: 'ListOfWarnings')
308
311
  ListPiiEntitiesDetectionJobsRequest = Shapes::StructureShape.new(name: 'ListPiiEntitiesDetectionJobsRequest')
309
312
  ListPiiEntitiesDetectionJobsResponse = Shapes::StructureShape.new(name: 'ListPiiEntitiesDetectionJobsResponse')
310
313
  ListSentimentDetectionJobsRequest = Shapes::StructureShape.new(name: 'ListSentimentDetectionJobsRequest')
@@ -324,6 +327,7 @@ module Aws::Comprehend
324
327
  NumberOfTopicsInteger = Shapes::IntegerShape.new(name: 'NumberOfTopicsInteger')
325
328
  OutputDataConfig = Shapes::StructureShape.new(name: 'OutputDataConfig')
326
329
  PageBasedErrorCode = Shapes::StringShape.new(name: 'PageBasedErrorCode')
330
+ PageBasedWarningCode = Shapes::StringShape.new(name: 'PageBasedWarningCode')
327
331
  PartOfSpeechTag = Shapes::StructureShape.new(name: 'PartOfSpeechTag')
328
332
  PartOfSpeechTagType = Shapes::StringShape.new(name: 'PartOfSpeechTagType')
329
333
  PiiEntitiesDetectionJobFilter = Shapes::StructureShape.new(name: 'PiiEntitiesDetectionJobFilter')
@@ -434,6 +438,7 @@ module Aws::Comprehend
434
438
  UpdateFlywheelResponse = Shapes::StructureShape.new(name: 'UpdateFlywheelResponse')
435
439
  VersionName = Shapes::StringShape.new(name: 'VersionName')
436
440
  VpcConfig = Shapes::StructureShape.new(name: 'VpcConfig')
441
+ WarningsListItem = Shapes::StructureShape.new(name: 'WarningsListItem')
437
442
 
438
443
  AttributeNamesList.member = Shapes::ShapeRef.new(shape: AttributeNamesListItem)
439
444
 
@@ -579,6 +584,7 @@ module Aws::Comprehend
579
584
  ClassifyDocumentResponse.add_member(:document_metadata, Shapes::ShapeRef.new(shape: DocumentMetadata, location_name: "DocumentMetadata"))
580
585
  ClassifyDocumentResponse.add_member(:document_type, Shapes::ShapeRef.new(shape: ListOfDocumentType, location_name: "DocumentType"))
581
586
  ClassifyDocumentResponse.add_member(:errors, Shapes::ShapeRef.new(shape: ListOfErrors, location_name: "Errors"))
587
+ ClassifyDocumentResponse.add_member(:warnings, Shapes::ShapeRef.new(shape: ListOfWarnings, location_name: "Warnings"))
582
588
  ClassifyDocumentResponse.struct_class = Types::ClassifyDocumentResponse
583
589
 
584
590
  ConcurrentModificationException.add_member(:message, Shapes::ShapeRef.new(shape: String, location_name: "Message"))
@@ -944,6 +950,10 @@ module Aws::Comprehend
944
950
 
945
951
  DocumentClassifierAugmentedManifestsList.member = Shapes::ShapeRef.new(shape: AugmentedManifestsListItem)
946
952
 
953
+ DocumentClassifierDocuments.add_member(:s3_uri, Shapes::ShapeRef.new(shape: S3Uri, required: true, location_name: "S3Uri"))
954
+ DocumentClassifierDocuments.add_member(:test_s3_uri, Shapes::ShapeRef.new(shape: S3Uri, location_name: "TestS3Uri"))
955
+ DocumentClassifierDocuments.struct_class = Types::DocumentClassifierDocuments
956
+
947
957
  DocumentClassifierFilter.add_member(:status, Shapes::ShapeRef.new(shape: ModelStatus, location_name: "Status"))
948
958
  DocumentClassifierFilter.add_member(:document_classifier_name, Shapes::ShapeRef.new(shape: ComprehendArnName, location_name: "DocumentClassifierName"))
949
959
  DocumentClassifierFilter.add_member(:submit_time_before, Shapes::ShapeRef.new(shape: Timestamp, location_name: "SubmitTimeBefore"))
@@ -955,6 +965,9 @@ module Aws::Comprehend
955
965
  DocumentClassifierInputDataConfig.add_member(:test_s3_uri, Shapes::ShapeRef.new(shape: S3Uri, location_name: "TestS3Uri"))
956
966
  DocumentClassifierInputDataConfig.add_member(:label_delimiter, Shapes::ShapeRef.new(shape: LabelDelimiter, location_name: "LabelDelimiter"))
957
967
  DocumentClassifierInputDataConfig.add_member(:augmented_manifests, Shapes::ShapeRef.new(shape: DocumentClassifierAugmentedManifestsList, location_name: "AugmentedManifests"))
968
+ DocumentClassifierInputDataConfig.add_member(:document_type, Shapes::ShapeRef.new(shape: DocumentClassifierDocumentTypeFormat, location_name: "DocumentType"))
969
+ DocumentClassifierInputDataConfig.add_member(:documents, Shapes::ShapeRef.new(shape: DocumentClassifierDocuments, location_name: "Documents"))
970
+ DocumentClassifierInputDataConfig.add_member(:document_reader_config, Shapes::ShapeRef.new(shape: DocumentReaderConfig, location_name: "DocumentReaderConfig"))
958
971
  DocumentClassifierInputDataConfig.struct_class = Types::DocumentClassifierInputDataConfig
959
972
 
960
973
  DocumentClassifierOutputDataConfig.add_member(:s3_uri, Shapes::ShapeRef.new(shape: S3Uri, location_name: "S3Uri"))
@@ -1518,6 +1531,8 @@ module Aws::Comprehend
1518
1531
 
1519
1532
  ListOfTargetedSentimentEntities.member = Shapes::ShapeRef.new(shape: TargetedSentimentEntity)
1520
1533
 
1534
+ ListOfWarnings.member = Shapes::ShapeRef.new(shape: WarningsListItem)
1535
+
1521
1536
  ListPiiEntitiesDetectionJobsRequest.add_member(:filter, Shapes::ShapeRef.new(shape: PiiEntitiesDetectionJobFilter, location_name: "Filter"))
1522
1537
  ListPiiEntitiesDetectionJobsRequest.add_member(:next_token, Shapes::ShapeRef.new(shape: String, location_name: "NextToken"))
1523
1538
  ListPiiEntitiesDetectionJobsRequest.add_member(:max_results, Shapes::ShapeRef.new(shape: MaxResultsInteger, location_name: "MaxResults"))
@@ -2026,6 +2041,11 @@ module Aws::Comprehend
2026
2041
  VpcConfig.add_member(:subnets, Shapes::ShapeRef.new(shape: Subnets, required: true, location_name: "Subnets"))
2027
2042
  VpcConfig.struct_class = Types::VpcConfig
2028
2043
 
2044
+ WarningsListItem.add_member(:page, Shapes::ShapeRef.new(shape: Integer, location_name: "Page"))
2045
+ WarningsListItem.add_member(:warn_code, Shapes::ShapeRef.new(shape: PageBasedWarningCode, location_name: "WarnCode"))
2046
+ WarningsListItem.add_member(:warn_message, Shapes::ShapeRef.new(shape: String, location_name: "WarnMessage"))
2047
+ WarningsListItem.struct_class = Types::WarningsListItem
2048
+
2029
2049
 
2030
2050
  # @api private
2031
2051
  API = Seahorse::Model::Api.new.tap do |api|
@@ -2924,6 +2944,7 @@ module Aws::Comprehend
2924
2944
  o.errors << Shapes::ShapeRef.new(shape: ResourceUnavailableException)
2925
2945
  o.errors << Shapes::ShapeRef.new(shape: KmsKeyValidationException)
2926
2946
  o.errors << Shapes::ShapeRef.new(shape: TooManyTagsException)
2947
+ o.errors << Shapes::ShapeRef.new(shape: ResourceInUseException)
2927
2948
  o.errors << Shapes::ShapeRef.new(shape: InternalServerException)
2928
2949
  end)
2929
2950
 
@@ -2937,6 +2958,7 @@ module Aws::Comprehend
2937
2958
  o.errors << Shapes::ShapeRef.new(shape: TooManyRequestsException)
2938
2959
  o.errors << Shapes::ShapeRef.new(shape: KmsKeyValidationException)
2939
2960
  o.errors << Shapes::ShapeRef.new(shape: TooManyTagsException)
2961
+ o.errors << Shapes::ShapeRef.new(shape: ResourceInUseException)
2940
2962
  o.errors << Shapes::ShapeRef.new(shape: InternalServerException)
2941
2963
  end)
2942
2964
 
@@ -2952,6 +2974,7 @@ module Aws::Comprehend
2952
2974
  o.errors << Shapes::ShapeRef.new(shape: ResourceUnavailableException)
2953
2975
  o.errors << Shapes::ShapeRef.new(shape: KmsKeyValidationException)
2954
2976
  o.errors << Shapes::ShapeRef.new(shape: TooManyTagsException)
2977
+ o.errors << Shapes::ShapeRef.new(shape: ResourceInUseException)
2955
2978
  o.errors << Shapes::ShapeRef.new(shape: InternalServerException)
2956
2979
  end)
2957
2980
 
@@ -2965,6 +2988,7 @@ module Aws::Comprehend
2965
2988
  o.errors << Shapes::ShapeRef.new(shape: TooManyRequestsException)
2966
2989
  o.errors << Shapes::ShapeRef.new(shape: KmsKeyValidationException)
2967
2990
  o.errors << Shapes::ShapeRef.new(shape: TooManyTagsException)
2991
+ o.errors << Shapes::ShapeRef.new(shape: ResourceInUseException)
2968
2992
  o.errors << Shapes::ShapeRef.new(shape: InternalServerException)
2969
2993
  end)
2970
2994
 
@@ -2991,6 +3015,7 @@ module Aws::Comprehend
2991
3015
  o.errors << Shapes::ShapeRef.new(shape: TooManyRequestsException)
2992
3016
  o.errors << Shapes::ShapeRef.new(shape: KmsKeyValidationException)
2993
3017
  o.errors << Shapes::ShapeRef.new(shape: TooManyTagsException)
3018
+ o.errors << Shapes::ShapeRef.new(shape: ResourceInUseException)
2994
3019
  o.errors << Shapes::ShapeRef.new(shape: InternalServerException)
2995
3020
  end)
2996
3021
 
@@ -3004,6 +3029,7 @@ module Aws::Comprehend
3004
3029
  o.errors << Shapes::ShapeRef.new(shape: TooManyRequestsException)
3005
3030
  o.errors << Shapes::ShapeRef.new(shape: KmsKeyValidationException)
3006
3031
  o.errors << Shapes::ShapeRef.new(shape: TooManyTagsException)
3032
+ o.errors << Shapes::ShapeRef.new(shape: ResourceInUseException)
3007
3033
  o.errors << Shapes::ShapeRef.new(shape: InternalServerException)
3008
3034
  end)
3009
3035
 
@@ -3017,6 +3043,7 @@ module Aws::Comprehend
3017
3043
  o.errors << Shapes::ShapeRef.new(shape: TooManyRequestsException)
3018
3044
  o.errors << Shapes::ShapeRef.new(shape: KmsKeyValidationException)
3019
3045
  o.errors << Shapes::ShapeRef.new(shape: TooManyTagsException)
3046
+ o.errors << Shapes::ShapeRef.new(shape: ResourceInUseException)
3020
3047
  o.errors << Shapes::ShapeRef.new(shape: InternalServerException)
3021
3048
  end)
3022
3049
 
@@ -3030,6 +3057,7 @@ module Aws::Comprehend
3030
3057
  o.errors << Shapes::ShapeRef.new(shape: TooManyRequestsException)
3031
3058
  o.errors << Shapes::ShapeRef.new(shape: KmsKeyValidationException)
3032
3059
  o.errors << Shapes::ShapeRef.new(shape: TooManyTagsException)
3060
+ o.errors << Shapes::ShapeRef.new(shape: ResourceInUseException)
3033
3061
  o.errors << Shapes::ShapeRef.new(shape: InternalServerException)
3034
3062
  end)
3035
3063
 
@@ -3043,6 +3071,7 @@ module Aws::Comprehend
3043
3071
  o.errors << Shapes::ShapeRef.new(shape: TooManyRequestsException)
3044
3072
  o.errors << Shapes::ShapeRef.new(shape: KmsKeyValidationException)
3045
3073
  o.errors << Shapes::ShapeRef.new(shape: TooManyTagsException)
3074
+ o.errors << Shapes::ShapeRef.new(shape: ResourceInUseException)
3046
3075
  o.errors << Shapes::ShapeRef.new(shape: InternalServerException)
3047
3076
  end)
3048
3077
 
@@ -856,6 +856,16 @@ module Aws::Comprehend
856
856
  # errors.
857
857
  # @return [Array<Types::ErrorsListItem>]
858
858
  #
859
+ # @!attribute [rw] warnings
860
+ # Warnings detected while processing the input document. The response
861
+ # includes a warning if there is a mismatch between the input document
862
+ # type and the model type associated with the endpoint that you
863
+ # specified. The response can also include warnings for individual
864
+ # pages that have a mismatch.
865
+ #
866
+ # The field is empty if the system generated no warnings.
867
+ # @return [Array<Types::WarningsListItem>]
868
+ #
859
869
  # @see http://docs.aws.amazon.com/goto/WebAPI/comprehend-2017-11-27/ClassifyDocumentResponse AWS API Documentation
860
870
  #
861
871
  class ClassifyDocumentResponse < Struct.new(
@@ -863,7 +873,8 @@ module Aws::Comprehend
863
873
  :labels,
864
874
  :document_metadata,
865
875
  :document_type,
866
- :errors)
876
+ :errors,
877
+ :warnings)
867
878
  SENSITIVE = []
868
879
  include Aws::Structure
869
880
  end
@@ -1004,8 +1015,9 @@ module Aws::Comprehend
1004
1015
  # @return [Types::DocumentClassifierInputDataConfig]
1005
1016
  #
1006
1017
  # @!attribute [rw] output_data_config
1007
- # Enables the addition of output results configuration parameters for
1008
- # custom classifier jobs.
1018
+ # Specifies the location for the output files from a custom classifier
1019
+ # job. This parameter is required for a request that creates a native
1020
+ # classifier model.
1009
1021
  # @return [Types::DocumentClassifierOutputDataConfig]
1010
1022
  #
1011
1023
  # @!attribute [rw] client_request_token
@@ -2830,6 +2842,29 @@ module Aws::Comprehend
2830
2842
  include Aws::Structure
2831
2843
  end
2832
2844
 
2845
+ # The location of the training documents. This parameter is required in
2846
+ # a request to create a native classifier model.
2847
+ #
2848
+ # @!attribute [rw] s3_uri
2849
+ # The S3 URI location of the training documents specified in the S3Uri
2850
+ # CSV file.
2851
+ # @return [String]
2852
+ #
2853
+ # @!attribute [rw] test_s3_uri
2854
+ # The S3 URI location of the test documents included in the TestS3Uri
2855
+ # CSV file. This field is not required if you do not specify a test
2856
+ # CSV file.
2857
+ # @return [String]
2858
+ #
2859
+ # @see http://docs.aws.amazon.com/goto/WebAPI/comprehend-2017-11-27/DocumentClassifierDocuments AWS API Documentation
2860
+ #
2861
+ class DocumentClassifierDocuments < Struct.new(
2862
+ :s3_uri,
2863
+ :test_s3_uri)
2864
+ SENSITIVE = []
2865
+ include Aws::Structure
2866
+ end
2867
+
2833
2868
  # Provides information for filtering a list of document classifiers. You
2834
2869
  # can only specify one filtering parameter in a request. For more
2835
2870
  # information, see the `ListDocumentClassifiers` operation.
@@ -2936,6 +2971,45 @@ module Aws::Comprehend
2936
2971
  # `AUGMENTED_MANIFEST`.
2937
2972
  # @return [Array<Types::AugmentedManifestsListItem>]
2938
2973
  #
2974
+ # @!attribute [rw] document_type
2975
+ # The type of input documents for training the model. Provide
2976
+ # plain-text documents to create a plain-text model, and provide
2977
+ # semi-structured documents to create a native model.
2978
+ # @return [String]
2979
+ #
2980
+ # @!attribute [rw] documents
2981
+ # The S3 location of the training documents. This parameter is
2982
+ # required in a request to create a native classifier model.
2983
+ # @return [Types::DocumentClassifierDocuments]
2984
+ #
2985
+ # @!attribute [rw] document_reader_config
2986
+ # Provides configuration parameters to override the default actions
2987
+ # for extracting text from PDF documents and image files.
2988
+ #
2989
+ # By default, Amazon Comprehend performs the following actions to
2990
+ # extract text from files, based on the input file type:
2991
+ #
2992
+ # * **Word files** - Amazon Comprehend parser extracts the text.
2993
+ #
2994
+ # * **Digital PDF files** - Amazon Comprehend parser extracts the
2995
+ # text.
2996
+ #
2997
+ # * **Image files and scanned PDF files** - Amazon Comprehend uses the
2998
+ # Amazon Textract `DetectDocumentText` API to extract the text.
2999
+ #
3000
+ # `DocumentReaderConfig` does not apply to plain text files or Word
3001
+ # files.
3002
+ #
3003
+ # For image files and PDF documents, you can override these default
3004
+ # actions using the fields listed below. For more information, see [
3005
+ # Setting text extraction options][1] in the Comprehend Developer
3006
+ # Guide.
3007
+ #
3008
+ #
3009
+ #
3010
+ # [1]: https://docs.aws.amazon.com/comprehend/latest/dg/idp-set-textract-options.html
3011
+ # @return [Types::DocumentReaderConfig]
3012
+ #
2939
3013
  # @see http://docs.aws.amazon.com/goto/WebAPI/comprehend-2017-11-27/DocumentClassifierInputDataConfig AWS API Documentation
2940
3014
  #
2941
3015
  class DocumentClassifierInputDataConfig < Struct.new(
@@ -2943,20 +3017,24 @@ module Aws::Comprehend
2943
3017
  :s3_uri,
2944
3018
  :test_s3_uri,
2945
3019
  :label_delimiter,
2946
- :augmented_manifests)
3020
+ :augmented_manifests,
3021
+ :document_type,
3022
+ :documents,
3023
+ :document_reader_config)
2947
3024
  SENSITIVE = []
2948
3025
  include Aws::Structure
2949
3026
  end
2950
3027
 
2951
- # Provides output results configuration parameters for custom classifier
2952
- # jobs.
3028
+ # Provide the location for output data from a custom classifier job.
3029
+ # This field is mandatory if you are training a native classifier model.
2953
3030
  #
2954
3031
  # @!attribute [rw] s3_uri
2955
3032
  # When you use the `OutputDataConfig` object while creating a custom
2956
3033
  # classifier, you specify the Amazon S3 location where you want to
2957
- # write the confusion matrix. The URI must be in the same Region as
2958
- # the API endpoint that you are calling. The location is used as the
2959
- # prefix for the actual location of this output file.
3034
+ # write the confusion matrix and other output files. The URI must be
3035
+ # in the same Region as the API endpoint that you are calling. The
3036
+ # location is used as the prefix for the actual location of this
3037
+ # output file.
2960
3038
  #
2961
3039
  # When the custom classifier job is finished, the service creates the
2962
3040
  # output file in a directory specific to the job. The `S3Uri` field
@@ -3009,9 +3087,13 @@ module Aws::Comprehend
3009
3087
  #
3010
3088
  # @!attribute [rw] status
3011
3089
  # The status of the document classifier. If the status is `TRAINED`
3012
- # the classifier is ready to use. If the status is `FAILED` you can
3013
- # see additional information about why the classifier wasn't trained
3014
- # in the `Message` field.
3090
+ # the classifier is ready to use. If the status is
3091
+ # `TRAINED_WITH_WARNINGS` the classifier training succeeded, but you
3092
+ # should review the warnings returned in the
3093
+ # `CreateDocumentClassifier` response.
3094
+ #
3095
+ # If the status is `FAILED` you can see additional information about
3096
+ # why the classifier wasn't trained in the `Message` field.
3015
3097
  # @return [String]
3016
3098
  #
3017
3099
  # @!attribute [rw] message
@@ -3241,11 +3323,11 @@ module Aws::Comprehend
3241
3323
  #
3242
3324
  # For image files and PDF documents, you can override these default
3243
3325
  # actions using the fields listed below. For more information, see [
3244
- # Setting text extraction options][1].
3326
+ # Setting text extraction options][1] in the Comprehend Developer Guide.
3245
3327
  #
3246
3328
  #
3247
3329
  #
3248
- # [1]: https://docs.aws.amazon.com/comprehend/latest/dg/detecting-cer.html#detecting-cer-pdf
3330
+ # [1]: https://docs.aws.amazon.com/comprehend/latest/dg/idp-set-textract-options.html
3249
3331
  #
3250
3332
  # @!attribute [rw] document_read_action
3251
3333
  # This field defines the Amazon Textract API operation that Amazon
@@ -8731,5 +8813,36 @@ module Aws::Comprehend
8731
8813
  include Aws::Structure
8732
8814
  end
8733
8815
 
8816
+ # The system identified one of the following warnings while processing
8817
+ # the input document:
8818
+ #
8819
+ # * The document to classify is plain text, but the classifier is a
8820
+ # native model.
8821
+ #
8822
+ # * The document to classify is semi-structured, but the classifier is a
8823
+ # plain-text model.
8824
+ #
8825
+ # @!attribute [rw] page
8826
+ # Page number in the input document.
8827
+ # @return [Integer]
8828
+ #
8829
+ # @!attribute [rw] warn_code
8830
+ # The type of warning.
8831
+ # @return [String]
8832
+ #
8833
+ # @!attribute [rw] warn_message
8834
+ # Text message associated with the warning.
8835
+ # @return [String]
8836
+ #
8837
+ # @see http://docs.aws.amazon.com/goto/WebAPI/comprehend-2017-11-27/WarningsListItem AWS API Documentation
8838
+ #
8839
+ class WarningsListItem < Struct.new(
8840
+ :page,
8841
+ :warn_code,
8842
+ :warn_message)
8843
+ SENSITIVE = []
8844
+ include Aws::Structure
8845
+ end
8846
+
8734
8847
  end
8735
8848
  end
@@ -52,6 +52,6 @@ require_relative 'aws-sdk-comprehend/customizations'
52
52
  # @!group service
53
53
  module Aws::Comprehend
54
54
 
55
- GEM_VERSION = '1.67.0'
55
+ GEM_VERSION = '1.68.0'
56
56
 
57
57
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: aws-sdk-comprehend
3
3
  version: !ruby/object:Gem::Version
4
- version: 1.67.0
4
+ version: 1.68.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Amazon Web Services
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2023-03-24 00:00:00.000000000 Z
11
+ date: 2023-04-19 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: aws-sdk-core