@cdklabs/cdk-appmod-catalog-blueprints 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (105)
  1. package/.jsii +8644 -0
  2. package/LICENSE +202 -0
  3. package/README.md +212 -0
  4. package/lib/document-processing/agentic-document-processing.d.ts +16 -0
  5. package/lib/document-processing/agentic-document-processing.js +90 -0
  6. package/lib/document-processing/base-document-processing.d.ts +189 -0
  7. package/lib/document-processing/base-document-processing.js +509 -0
  8. package/lib/document-processing/bedrock-document-processing.d.ts +167 -0
  9. package/lib/document-processing/bedrock-document-processing.js +297 -0
  10. package/lib/document-processing/index.d.ts +3 -0
  11. package/lib/document-processing/index.js +20 -0
  12. package/lib/document-processing/resources/default-bedrock-invoke/index.py +63 -0
  13. package/lib/document-processing/resources/default-bedrock-invoke/requirements.txt +4 -0
  14. package/lib/document-processing/resources/default-doc-retrieval-lambda/index.mjs +92 -0
  15. package/lib/document-processing/resources/default-doc-retrieval-lambda/package.json +10 -0
  16. package/lib/document-processing/resources/default-error-handler/index.js +46 -0
  17. package/lib/document-processing/resources/default-error-handler/package.json +4 -0
  18. package/lib/document-processing/resources/default-image-processor/classifier.mjs +665 -0
  19. package/lib/document-processing/resources/default-image-processor/extractors.mjs +465 -0
  20. package/lib/document-processing/resources/default-image-processor/index.mjs +143 -0
  21. package/lib/document-processing/resources/default-image-processor/package-lock.json +12 -0
  22. package/lib/document-processing/resources/default-image-processor/package.json +4 -0
  23. package/lib/document-processing/resources/default-image-validator/index.mjs +76 -0
  24. package/lib/document-processing/resources/default-image-validator/package-lock.json +154 -0
  25. package/lib/document-processing/resources/default-image-validator/package.json +7 -0
  26. package/lib/document-processing/resources/default-pdf-processor/index.js +46 -0
  27. package/lib/document-processing/resources/default-pdf-validator/index.js +36 -0
  28. package/lib/document-processing/resources/default-sqs-consumer/index.py +111 -0
  29. package/lib/document-processing/resources/default-sqs-consumer/requirements.txt +4 -0
  30. package/lib/document-processing/resources/default-sqs-consumer/sample_payload.json +20 -0
  31. package/lib/document-processing/resources/default-sqs-consumer/sample_payload_multi.json +24 -0
  32. package/lib/document-processing/resources/default-strands-agent/index.py +111 -0
  33. package/lib/document-processing/resources/default-strands-agent/requirements.txt +6 -0
  34. package/lib/document-processing/tests/agentic-document-processing-nag.test.d.ts +1 -0
  35. package/lib/document-processing/tests/agentic-document-processing-nag.test.js +107 -0
  36. package/lib/document-processing/tests/agentic-document-processing.test.d.ts +1 -0
  37. package/lib/document-processing/tests/agentic-document-processing.test.js +125 -0
  38. package/lib/document-processing/tests/bedrock-document-processing-nag.test.d.ts +1 -0
  39. package/lib/document-processing/tests/bedrock-document-processing-nag.test.js +101 -0
  40. package/lib/document-processing/tests/bedrock-document-processing.test.d.ts +1 -0
  41. package/lib/document-processing/tests/bedrock-document-processing.test.js +79 -0
  42. package/lib/framework/custom-resource/default-runtimes.d.ts +21 -0
  43. package/lib/framework/custom-resource/default-runtimes.js +34 -0
  44. package/lib/framework/custom-resource/index.d.ts +1 -0
  45. package/lib/framework/custom-resource/index.js +18 -0
  46. package/lib/framework/foundation/access-log.d.ts +69 -0
  47. package/lib/framework/foundation/access-log.js +121 -0
  48. package/lib/framework/foundation/eventbridge-broker.d.ts +18 -0
  49. package/lib/framework/foundation/eventbridge-broker.js +42 -0
  50. package/lib/framework/foundation/index.d.ts +3 -0
  51. package/lib/framework/foundation/index.js +20 -0
  52. package/lib/framework/foundation/network.d.ts +19 -0
  53. package/lib/framework/foundation/network.js +83 -0
  54. package/lib/framework/index.d.ts +2 -0
  55. package/lib/framework/index.js +19 -0
  56. package/lib/framework/quickstart/base-quickstart.d.ts +30 -0
  57. package/lib/framework/quickstart/base-quickstart.js +30 -0
  58. package/lib/index.d.ts +4 -0
  59. package/lib/index.js +21 -0
  60. package/lib/tsconfig.tsbuildinfo +1 -0
  61. package/lib/utilities/cdk-nag-config.d.ts +42 -0
  62. package/lib/utilities/cdk-nag-config.js +194 -0
  63. package/lib/utilities/data-loader-lambda/index.py +282 -0
  64. package/lib/utilities/data-loader-lambda/requirements.txt +3 -0
  65. package/lib/utilities/data-loader.d.ts +173 -0
  66. package/lib/utilities/data-loader.js +447 -0
  67. package/lib/utilities/index.d.ts +3 -0
  68. package/lib/utilities/index.js +20 -0
  69. package/lib/utilities/lambda-iam-utils.d.ts +145 -0
  70. package/lib/utilities/lambda-iam-utils.js +235 -0
  71. package/lib/utilities/lambda_layers/data-masking/layer-construct.d.ts +42 -0
  72. package/lib/utilities/lambda_layers/data-masking/layer-construct.js +53 -0
  73. package/lib/utilities/lambda_layers/data-masking/layer-construct.ts +88 -0
  74. package/lib/utilities/observability/bedrock-observability.d.ts +18 -0
  75. package/lib/utilities/observability/bedrock-observability.js +131 -0
  76. package/lib/utilities/observability/cloudfront-distribution-observability-property-injector.d.ts +6 -0
  77. package/lib/utilities/observability/cloudfront-distribution-observability-property-injector.js +22 -0
  78. package/lib/utilities/observability/index.d.ts +6 -0
  79. package/lib/utilities/observability/index.js +25 -0
  80. package/lib/utilities/observability/lambda-observability-property-injector.d.ts +8 -0
  81. package/lib/utilities/observability/lambda-observability-property-injector.js +43 -0
  82. package/lib/utilities/observability/log-group-data-protection-props.d.ts +19 -0
  83. package/lib/utilities/observability/log-group-data-protection-props.js +5 -0
  84. package/lib/utilities/observability/observability.d.ts +83 -0
  85. package/lib/utilities/observability/observability.js +278 -0
  86. package/lib/utilities/observability/observable.d.ts +32 -0
  87. package/lib/utilities/observability/observable.js +3 -0
  88. package/lib/utilities/observability/powertools-config.d.ts +3 -0
  89. package/lib/utilities/observability/powertools-config.js +25 -0
  90. package/lib/utilities/observability/resources/bedrock-manage-logging-configuration/index.py +27 -0
  91. package/lib/utilities/observability/state-machine-observability-property-injector.d.ts +8 -0
  92. package/lib/utilities/observability/state-machine-observability-property-injector.js +49 -0
  93. package/lib/utilities/tests/data-loader-nag.test.d.ts +1 -0
  94. package/lib/utilities/tests/data-loader-nag.test.js +432 -0
  95. package/lib/utilities/tests/data-loader.test.d.ts +1 -0
  96. package/lib/utilities/tests/data-loader.test.js +284 -0
  97. package/lib/webapp/frontend-construct.d.ts +136 -0
  98. package/lib/webapp/frontend-construct.js +253 -0
  99. package/lib/webapp/index.d.ts +1 -0
  100. package/lib/webapp/index.js +18 -0
  101. package/lib/webapp/tests/frontend-construct-nag.test.d.ts +1 -0
  102. package/lib/webapp/tests/frontend-construct-nag.test.js +266 -0
  103. package/lib/webapp/tests/frontend-construct.test.d.ts +1 -0
  104. package/lib/webapp/tests/frontend-construct.test.js +385 -0
  105. package/package.json +183 -0
@@ -0,0 +1,167 @@
1
+ import { Duration } from 'aws-cdk-lib';
2
+ import { FoundationModelIdentifier } from 'aws-cdk-lib/aws-bedrock';
3
+ import { Role } from 'aws-cdk-lib/aws-iam';
4
+ import { Function } from 'aws-cdk-lib/aws-lambda';
5
+ import { StateMachine } from 'aws-cdk-lib/aws-stepfunctions';
6
+ import { Construct } from 'constructs';
7
+ import { BaseDocumentProcessing, BaseDocumentProcessingProps, DocumentProcessingStepType } from './base-document-processing';
8
+ /**
9
+ * Configuration properties for BedrockDocumentProcessing construct.
10
+ * Extends BaseDocumentProcessingProps with Bedrock-specific options.
11
+ */
12
+ export interface BedrockDocumentProcessingProps extends BaseDocumentProcessingProps {
13
+ /**
14
+ * Bedrock foundation model for document classification step.
15
+ * @default FoundationModelIdentifier.ANTHROPIC_CLAUDE_3_7_SONNET_20250219_V1_0
16
+ */
17
+ readonly classificationModelId?: FoundationModelIdentifier;
18
+ /**
19
+ * Bedrock foundation model for document extraction step.
20
+ * @default FoundationModelIdentifier.ANTHROPIC_CLAUDE_3_7_SONNET_20250219_V1_0
21
+ */
22
+ readonly processingModelId?: FoundationModelIdentifier;
23
+ /**
24
+ * Custom prompt template for document classification.
25
+ * Must include placeholder for document content.
26
+ * @default DEFAULT_CLASSIFICATION_PROMPT
27
+ */
28
+ readonly classificationPrompt?: string;
29
+ /**
30
+ * Custom prompt template for document extraction.
31
+ * Must include placeholder for document content and classification result.
32
+ * @default DEFAULT_PROCESSING_PROMPT
33
+ */
34
+ readonly processingPrompt?: string;
35
+ /**
36
+ * Optional Lambda function for document enrichment step.
37
+ * If provided, will be invoked after extraction with workflow state.
38
+ */
39
+ readonly enrichmentLambdaFunction?: Function;
40
+ /**
41
+ * Optional Lambda function for post-processing step.
42
+ * If provided, will be invoked after enrichment with workflow state.
43
+ */
44
+ readonly postProcessingLambdaFunction?: Function;
45
+ /**
46
+ * Timeout for the Lambda functions backing individual workflow steps (classification, extraction, etc.).
47
+ * @default Duration.minutes(5)
48
+ */
49
+ readonly stepTimeouts?: Duration;
50
+ /**
51
+ * Enable cross-region inference for Bedrock models to improve availability and performance.
52
+ * When enabled, uses inference profiles instead of direct model invocation.
53
+ * @default false
54
+ */
55
+ readonly useCrossRegionInference?: boolean;
56
+ /**
57
+ * Prefix for cross-region inference configuration.
58
+ * Only used when useCrossRegionInference is true.
59
+ * @default BedrockCrossRegionInferencePrefix.US
60
+ */
61
+ readonly crossRegionInferencePrefix?: BedrockCrossRegionInferencePrefix;
62
+ }
63
+ /**
64
+ * Cross-region inference prefix options for Bedrock models.
65
+ * Used to configure inference profiles for improved availability and performance.
66
+ */
67
+ export declare enum BedrockCrossRegionInferencePrefix {
68
+ /** US-based cross-region inference profile */
69
+ US = "us",
70
+ /** EU-based cross-region inference profile */
71
+ EU = "eu"
72
+ }
73
+ /**
74
+ * Document processing workflow powered by Amazon Bedrock foundation models.
75
+ *
76
+ * Extends BaseDocumentProcessing to provide AI-powered document classification and extraction
77
+ * using Amazon Bedrock foundation models. This implementation offers:
78
+ *
79
+ * ## Key Features
80
+ * - **AI-Powered Classification**: Uses Claude 3.7 Sonnet (configurable) to classify document types
81
+ * - **Intelligent Extraction**: Extracts structured data from documents using foundation models
82
+ * - **Cross-Region Inference**: Optional support for improved availability via inference profiles
83
+ * - **Flexible Processing**: Optional enrichment and post-processing Lambda functions
84
+ * - **Cost Optimized**: Configurable timeouts and model selection for cost control
85
+ *
86
+ * ## Processing Workflow
87
+ * S3 Upload → Classification (Bedrock) → Extraction (Bedrock) → [Enrichment] → [Post-Processing] → Results
88
+ *
89
+ * ## Default Models
90
+ * - Classification: Claude 3.7 Sonnet (anthropic.claude-3-7-sonnet-20250219-v1:0)
91
+ * - Extraction: Claude 3.7 Sonnet (anthropic.claude-3-7-sonnet-20250219-v1:0)
92
+ *
93
+ * ## Prompt Templates
94
+ * The construct uses default prompts that can be customized:
95
+ * - **Classification**: Analyzes document and returns JSON with documentClassification field
96
+ * - **Extraction**: Uses classification result to extract entities in structured JSON format
97
+ *
98
+ * ## Cross-Region Inference
99
+ * When enabled, uses Bedrock inference profiles for improved availability:
100
+ * - US prefix: Routes to US-based regions for lower latency
101
+ * - EU prefix: Routes to EU-based regions for data residency compliance
102
+ */
103
+ export declare class BedrockDocumentProcessing extends BaseDocumentProcessing {
104
+ protected static readonly DEFAULT_CLASSIFICATION_MODEL_ID: FoundationModelIdentifier;
105
+ protected static readonly DEFAULT_PROCESSING_MODEL_ID: FoundationModelIdentifier;
106
+ protected static readonly DEFAULT_CLASSIFICATION_PROMPT = "\n Analyze the document below, and classify the type of document it is (eg. INVOICE, IDENTITY_DOCUMENT, RECEIPT, etc). The result should be in JSON and should follow the following structure (only respond in JSON with the following structure and do not use markdown to indicate the json, just output plain old json with nothing else):\n\n {\n documentClassification: <CLASSIFICATION>\n }\n\n Attached document is as follows:\n\n ";
107
+ protected static readonly DEFAULT_PROCESSING_PROMPT = "\n The document below has been classified as [ACTUAL_CLASSIFICATION]. Extract important entities from the document and return the result as JSON following the structure below (only respond in JSON with the following structure and do not use markdown to indicate the json, just output plain old json with nothing else):\n\n {\n documentClassification: <CLASSIFICATION>,\n result: {\n entities: [\n {\n type: <TYPE OF ENTITY>\n value: <VALUE OF ENTITY>\n },\n ...\n ]\n }\n }\n\n Attached document is as follows:\n\n ";
108
+ /** Configuration properties specific to Bedrock document processing */
109
+ protected readonly bedrockDocumentProcessingProps: BedrockDocumentProcessingProps;
110
+ /** Cross-region inference prefix for Bedrock model routing */
111
+ protected readonly crossRegionInferencePrefix: BedrockCrossRegionInferencePrefix;
112
+ /** The Step Functions state machine that orchestrates the document processing workflow */
113
+ readonly stateMachine: StateMachine;
114
+ /**
115
+ * Creates a new BedrockDocumentProcessing construct.
116
+ *
117
+ * Initializes the Bedrock-powered document processing pipeline with AI classification
118
+ * and extraction capabilities. Creates Lambda functions with appropriate IAM roles
119
+ * for Bedrock model invocation and S3 access.
120
+ *
121
+ * @param scope - The scope in which to define this construct
122
+ * @param id - The scoped construct ID. Must be unique within the scope.
123
+ * @param props - Configuration properties for the Bedrock document processing pipeline
124
+ */
125
+ constructor(scope: Construct, id: string, props: BedrockDocumentProcessingProps);
126
+ /**
127
+ * Implements the document classification step using Amazon Bedrock.
128
+ *
129
+ * Creates a Lambda function that invokes the configured Bedrock model to classify
130
+ * the document type. The function reads the document from S3 and sends it to
131
+ * Bedrock with the classification prompt.
132
+ *
133
+ * @returns LambdaInvoke task configured for document classification
134
+ */
135
+ protected classificationStep(): DocumentProcessingStepType;
136
+ /**
137
+ * Implements the document extraction step using Amazon Bedrock.
138
+ *
139
+ * Creates a Lambda function that invokes the configured Bedrock model to extract
140
+ * structured data from the document. Uses the classification result from the
141
+ * previous step to provide context for more accurate extraction.
142
+ *
143
+ * @returns LambdaInvoke task configured for document extraction
144
+ */
145
+ protected processingStep(): DocumentProcessingStepType;
146
+ protected generateLambdaRoleForBedrock(fmModel: FoundationModelIdentifier, id: string): Role;
147
+ /**
148
+ * Implements the optional document enrichment step.
149
+ *
150
+ * If an enrichment Lambda function is provided in the props, creates a LambdaInvoke
151
+ * task to perform additional processing on the extracted data. This step is useful
152
+ * for data validation, transformation, or integration with external systems.
153
+ *
154
+ * @returns LambdaInvoke task for enrichment, or undefined to skip this step
155
+ */
156
+ protected enrichmentStep(): DocumentProcessingStepType | undefined;
157
+ /**
158
+ * Implements the optional post-processing step.
159
+ *
160
+ * If a post-processing Lambda function is provided in the props, creates a LambdaInvoke
161
+ * task to perform final processing on the workflow results. This step is useful for
162
+ * data formatting, notifications, or integration with downstream systems.
163
+ *
164
+ * @returns LambdaInvoke task for post-processing, or undefined to skip this step
165
+ */
166
+ protected postProcessingStep(): DocumentProcessingStepType | undefined;
167
+ }
@@ -0,0 +1,297 @@
1
+ "use strict";
2
+ var _a;
3
+ Object.defineProperty(exports, "__esModule", { value: true });
4
+ exports.BedrockDocumentProcessing = exports.BedrockCrossRegionInferencePrefix = void 0;
5
+ const JSII_RTTI_SYMBOL_1 = Symbol.for("jsii.rtti");
6
+ // Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
7
+ // SPDX-License-Identifier: Apache-2.0
8
+ const path = require("path");
9
+ const aws_lambda_python_alpha_1 = require("@aws-cdk/aws-lambda-python-alpha");
10
+ const aws_cdk_lib_1 = require("aws-cdk-lib");
11
+ const aws_bedrock_1 = require("aws-cdk-lib/aws-bedrock");
12
+ const aws_ec2_1 = require("aws-cdk-lib/aws-ec2");
13
+ const aws_iam_1 = require("aws-cdk-lib/aws-iam");
14
+ const aws_lambda_1 = require("aws-cdk-lib/aws-lambda");
15
+ const aws_stepfunctions_tasks_1 = require("aws-cdk-lib/aws-stepfunctions-tasks");
16
+ const base_document_processing_1 = require("./base-document-processing");
17
+ const framework_1 = require("../framework");
18
+ const utilities_1 = require("../utilities");
19
+ const powertools_config_1 = require("../utilities/observability/powertools-config");
20
+ /**
21
+ * Cross-region inference prefix options for Bedrock models.
22
+ * Used to configure inference profiles for improved availability and performance.
23
+ */
24
+ var BedrockCrossRegionInferencePrefix; // compiled enum: populated by the immediately-invoked function below
25
+ (function (BedrockCrossRegionInferencePrefix) {
26
+ /** US-based cross-region inference profile */
27
+ BedrockCrossRegionInferencePrefix["US"] = "us";
28
+ /** EU-based cross-region inference profile */
29
+ BedrockCrossRegionInferencePrefix["EU"] = "eu";
30
+ })(BedrockCrossRegionInferencePrefix || (exports.BedrockCrossRegionInferencePrefix = BedrockCrossRegionInferencePrefix = {})); // on first run creates the object and publishes it on exports in the same expression
31
+ /**
32
+ * Document processing workflow powered by Amazon Bedrock foundation models.
33
+ *
34
+ * Extends BaseDocumentProcessing to provide AI-powered document classification and extraction
35
+ * using Amazon Bedrock foundation models. This implementation offers:
36
+ *
37
+ * ## Key Features
38
+ * - **AI-Powered Classification**: Uses Claude 3.7 Sonnet (configurable) to classify document types
39
+ * - **Intelligent Extraction**: Extracts structured data from documents using foundation models
40
+ * - **Cross-Region Inference**: Optional support for improved availability via inference profiles
41
+ * - **Flexible Processing**: Optional enrichment and post-processing Lambda functions
42
+ * - **Cost Optimized**: Configurable timeouts and model selection for cost control
43
+ *
44
+ * ## Processing Workflow
45
+ * S3 Upload → Classification (Bedrock) → Extraction (Bedrock) → [Enrichment] → [Post-Processing] → Results
46
+ *
47
+ * ## Default Models
48
+ * - Classification: Claude 3.7 Sonnet (anthropic.claude-3-7-sonnet-20250219-v1:0)
49
+ * - Extraction: Claude 3.7 Sonnet (anthropic.claude-3-7-sonnet-20250219-v1:0)
50
+ *
51
+ * ## Prompt Templates
52
+ * The construct uses default prompts that can be customized:
53
+ * - **Classification**: Analyzes document and returns JSON with documentClassification field
54
+ * - **Extraction**: Uses classification result to extract entities in structured JSON format
55
+ *
56
+ * ## Cross-Region Inference
57
+ * When enabled, uses Bedrock inference profiles for improved availability:
58
+ * - US prefix: Routes to US-based regions for lower latency
59
+ * - EU prefix: Routes to EU-based regions for data residency compliance
60
+ */
61
+ class BedrockDocumentProcessing extends base_document_processing_1.BaseDocumentProcessing {
62
+ /**
63
+ * Creates a new BedrockDocumentProcessing construct.
64
+ *
65
+ * Initializes the Bedrock-powered document processing pipeline with AI classification
66
+ * and extraction capabilities. Creates Lambda functions with appropriate IAM roles
67
+ * for Bedrock model invocation and S3 access.
68
+ *
69
+ * @param scope - The scope in which to define this construct
70
+ * @param id - The scoped construct ID. Must be unique within the scope.
71
+ * @param props - Configuration properties for the Bedrock document processing pipeline
72
+ */
73
+ constructor(scope, id, props) {
74
+ super(scope, id, props);
75
+ if (props.network) { // only when the caller supplied a network
76
+ props.network.createServiceEndpoint('vpce-bedrock', aws_ec2_1.InterfaceVpcEndpointAwsService.BEDROCK); // request a Bedrock interface endpoint on that network
77
+ props.network.createServiceEndpoint('vpce-bedrock-runtime', aws_ec2_1.InterfaceVpcEndpointAwsService.BEDROCK_RUNTIME); // and one for the Bedrock runtime service
78
+ }
79
+ this.bedrockDocumentProcessingProps = props; // read by classificationStep/processingStep/enrichmentStep/postProcessingStep
80
+ this.crossRegionInferencePrefix = props.crossRegionInferencePrefix || BedrockCrossRegionInferencePrefix.US; // falls back to the US prefix
81
+ this.stateMachine = this.handleStateMachineCreation('bedrock-document-processing-workflow'); // NOTE(review): presumably invokes the step methods, hence the two fields above are assigned first — confirm in the base class
82
+ }
83
+ /**
84
+ * Implements the document classification step using Amazon Bedrock.
85
+ *
86
+ * Creates a Lambda function that invokes the configured Bedrock model to classify
87
+ * the document type. The function reads the document from S3 and sends it to
88
+ * Bedrock with the classification prompt.
89
+ *
90
+ * @returns LambdaInvoke task configured for document classification
91
+ */
92
+ classificationStep() { // builds the classification Lambda and returns the LambdaInvoke task that calls it
93
+ const prompt = this.bedrockDocumentProcessingProps.classificationPrompt || BedrockDocumentProcessing.DEFAULT_CLASSIFICATION_PROMPT; // caller-supplied prompt, else the class default
94
+ const fmModel = this.bedrockDocumentProcessingProps.classificationModelId || BedrockDocumentProcessing.DEFAULT_CLASSIFICATION_MODEL_ID; // caller-supplied model, else the class default
95
+ const adjustedModelId = this.bedrockDocumentProcessingProps.useCrossRegionInference ? `${this.crossRegionInferencePrefix}.${fmModel.modelId}` : fmModel.modelId; // "<prefix>.<modelId>" only when cross-region inference is enabled
96
+ const role = this.generateLambdaRoleForBedrock(fmModel, 'ClassificationLambdaRole'); // role is built from the un-prefixed model identifier
97
+ const { region, account } = aws_cdk_lib_1.Stack.of(this);
98
+ const generatedLogPermissions = utilities_1.LambdaIamUtils.createLogsPermissions({ // yields uniqueFunctionName and policyStatements, both used below
99
+ account,
100
+ functionName: 'bedrock-idp-classification',
101
+ region,
102
+ scope: this,
103
+ });
104
+ this.encryptionKey.grantEncryptDecrypt(role); // same key is passed as environmentEncryption below
105
+ if (this.bucketEncryptionKey) { // bucket key may be absent
106
+ this.bucketEncryptionKey.grantEncryptDecrypt(role);
107
+ }
108
+ const bedrockFunction = new aws_lambda_python_alpha_1.PythonFunction(this, 'BedrockClassificationFunction', {
109
+ functionName: generatedLogPermissions.uniqueFunctionName,
110
+ architecture: aws_lambda_1.Architecture.X86_64,
111
+ runtime: framework_1.DefaultRuntimes.PYTHON,
112
+ entry: path.join(__dirname, 'resources/default-bedrock-invoke'), // same handler directory as the processing step; INVOKE_TYPE below distinguishes the two
113
+ role,
114
+ memorySize: 512,
115
+ timeout: this.bedrockDocumentProcessingProps.stepTimeouts || aws_cdk_lib_1.Duration.minutes(5), // stepTimeouts is applied as the Lambda timeout; 5 minutes when unset
116
+ environment: {
117
+ MODEL_ID: adjustedModelId,
118
+ PROMPT: prompt,
119
+ INVOKE_TYPE: 'classification',
120
+ ...powertools_config_1.PowertoolsConfig.generateDefaultLambdaConfig(this.bedrockDocumentProcessingProps.enableObservability, this.metricNamespace, this.metricServiceName), // spread last, so any key it returns with the same name overrides the three above
121
+ },
122
+ environmentEncryption: this.encryptionKey,
123
+ vpc: this.bedrockDocumentProcessingProps.network ? this.bedrockDocumentProcessingProps.network.vpc : undefined, // VPC placement only when a network was supplied
124
+ vpcSubnets: this.bedrockDocumentProcessingProps.network ? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection() : undefined,
125
+ });
126
+ for (const statement of generatedLogPermissions.policyStatements) { // attach the generated log permissions to the function's role
127
+ bedrockFunction.role?.addToPrincipalPolicy(statement);
128
+ }
129
+ if (this.bedrockDocumentProcessingProps.network) { // VPC permissions are added only for VPC-attached functions
130
+ bedrockFunction.role?.addToPrincipalPolicy(utilities_1.LambdaIamUtils.generateLambdaVPCPermissions());
131
+ }
132
+ return new aws_stepfunctions_tasks_1.LambdaInvoke(this, 'ClassificationStep', {
133
+ lambdaFunction: bedrockFunction,
134
+ resultPath: '$.classificationResult', // task result is written under this path of the workflow state
135
+ resultSelector: {
136
+ 'documentClassification.$': '$.Payload.documentClassification', // keep only documentClassification from the Lambda payload
137
+ },
138
+ });
139
+ }
140
+ /**
141
+ * Implements the document extraction step using Amazon Bedrock.
142
+ *
143
+ * Creates a Lambda function that invokes the configured Bedrock model to extract
144
+ * structured data from the document. Uses the classification result from the
145
+ * previous step to provide context for more accurate extraction.
146
+ *
147
+ * @returns LambdaInvoke task configured for document extraction
148
+ */
149
+ processingStep() { // builds the extraction Lambda and returns the LambdaInvoke task that calls it
150
+ const prompt = this.bedrockDocumentProcessingProps.processingPrompt || BedrockDocumentProcessing.DEFAULT_PROCESSING_PROMPT; // caller-supplied prompt, else the class default
151
+ const fmModel = this.bedrockDocumentProcessingProps.processingModelId || BedrockDocumentProcessing.DEFAULT_PROCESSING_MODEL_ID; // caller-supplied model, else the class default
152
+ const adjustedModelId = this.bedrockDocumentProcessingProps.useCrossRegionInference ? `${this.crossRegionInferencePrefix}.${fmModel.modelId}` : fmModel.modelId; // "<prefix>.<modelId>" only when cross-region inference is enabled
153
+ const role = this.generateLambdaRoleForBedrock(fmModel, 'ProcessingLambdaRole'); // role is built from the un-prefixed model identifier
154
+ const { region, account } = aws_cdk_lib_1.Stack.of(this);
155
+ const generatedLogPermissions = utilities_1.LambdaIamUtils.createLogsPermissions({ // yields uniqueFunctionName and policyStatements, both used below
156
+ account,
157
+ functionName: 'bedrock-idp-processing',
158
+ region,
159
+ scope: this,
160
+ });
161
+ this.encryptionKey.grantEncryptDecrypt(role); // same key is passed as environmentEncryption below
162
+ if (this.bucketEncryptionKey) { // bucket key may be absent
163
+ this.bucketEncryptionKey.grantEncryptDecrypt(role);
164
+ }
165
+ const bedrockFunction = new aws_lambda_python_alpha_1.PythonFunction(this, 'BedrockExtractionFunction', {
166
+ functionName: generatedLogPermissions.uniqueFunctionName,
167
+ runtime: framework_1.DefaultRuntimes.PYTHON,
168
+ architecture: aws_lambda_1.Architecture.X86_64,
169
+ entry: path.join(__dirname, 'resources/default-bedrock-invoke'), // same handler directory as the classification step; INVOKE_TYPE below distinguishes the two
170
+ role,
171
+ memorySize: 512,
172
+ timeout: this.bedrockDocumentProcessingProps.stepTimeouts || aws_cdk_lib_1.Duration.minutes(5), // stepTimeouts is applied as the Lambda timeout; 5 minutes when unset
173
+ environment: {
174
+ MODEL_ID: adjustedModelId,
175
+ PROMPT: prompt,
176
+ INVOKE_TYPE: 'processing',
177
+ ...powertools_config_1.PowertoolsConfig.generateDefaultLambdaConfig(this.bedrockDocumentProcessingProps.enableObservability, this.metricNamespace, this.metricServiceName), // spread last, so any key it returns with the same name overrides the three above
178
+ },
179
+ environmentEncryption: this.encryptionKey,
180
+ vpc: this.bedrockDocumentProcessingProps.network ? this.bedrockDocumentProcessingProps.network.vpc : undefined, // VPC placement only when a network was supplied
181
+ vpcSubnets: this.bedrockDocumentProcessingProps.network ? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection() : undefined,
182
+ });
183
+ for (const statement of generatedLogPermissions.policyStatements) { // attach the generated log permissions to the function's role
184
+ bedrockFunction.role?.addToPrincipalPolicy(statement);
185
+ }
186
+ if (this.bedrockDocumentProcessingProps.network) { // VPC permissions are added only for VPC-attached functions
187
+ bedrockFunction.role?.addToPrincipalPolicy(utilities_1.LambdaIamUtils.generateLambdaVPCPermissions());
188
+ }
189
+ return new aws_stepfunctions_tasks_1.LambdaInvoke(this, 'ProcessingStep', {
190
+ lambdaFunction: bedrockFunction,
191
+ resultPath: '$.processingResult', // task result is written under this path of the workflow state
192
+ resultSelector: {
193
+ 'documentClassification.$': '$.Payload.documentClassification', // keep the classification echoed by the Lambda
194
+ 'result.$': '$.Payload.result', // and the extracted result
195
+ },
196
+ });
197
+ }
198
+ generateLambdaRoleForBedrock(fmModel, id) {
199
+ const { region, account } = aws_cdk_lib_1.Stack.of(this);
200
+ return new aws_iam_1.Role(this, id, {
201
+ assumedBy: new aws_iam_1.ServicePrincipal('lambda.amazonaws.com'),
202
+ inlinePolicies: {
203
+ BedrockInvokePolicy: new aws_iam_1.PolicyDocument({
204
+ statements: [
205
+ new aws_iam_1.PolicyStatement({
206
+ effect: aws_iam_1.Effect.ALLOW,
207
+ actions: ['s3:GetObject'],
208
+ resources: [`${this.bucket.bucketArn}/*`],
209
+ }),
210
+ new aws_iam_1.PolicyStatement({
211
+ effect: aws_iam_1.Effect.ALLOW,
212
+ actions: [
213
+ 'bedrock:InvokeModel',
214
+ 'bedrock:InvokeModelWithResponseStream',
215
+ ],
216
+ resources: [
217
+ `arn:aws:bedrock:*::foundation-model/${fmModel.modelId}`,
218
+ `arn:aws:bedrock:${region}:${account}:inference-profile/${this.crossRegionInferencePrefix}.${fmModel.modelId}`,
219
+ ],
220
+ }),
221
+ ],
222
+ }),
223
+ },
224
+ });
225
+ }
226
+ /**
227
+ * Implements the optional document enrichment step.
228
+ *
229
+ * If an enrichment Lambda function is provided in the props, creates a LambdaInvoke
230
+ * task to perform additional processing on the extracted data. This step is useful
231
+ * for data validation, transformation, or integration with external systems.
232
+ *
233
+ * @returns LambdaInvoke task for enrichment, or undefined to skip this step
234
+ */
235
+ enrichmentStep() {
236
+ if (!this.bedrockDocumentProcessingProps.enrichmentLambdaFunction) {
237
+ return undefined;
238
+ }
239
+ return new aws_stepfunctions_tasks_1.LambdaInvoke(this, 'EnrichmentStep', {
240
+ lambdaFunction: this.bedrockDocumentProcessingProps.enrichmentLambdaFunction,
241
+ resultPath: '$.enrichedResult',
242
+ });
243
+ }
244
+ /**
245
+ * Implements the optional post-processing step.
246
+ *
247
+ * If a post-processing Lambda function is provided in the props, creates a LambdaInvoke
248
+ * task to perform final processing on the workflow results. This step is useful for
249
+ * data formatting, notifications, or integration with downstream systems.
250
+ *
251
+ * @returns LambdaInvoke task for post-processing, or undefined to skip this step
252
+ */
253
+ postProcessingStep() {
254
+ if (!this.bedrockDocumentProcessingProps.postProcessingLambdaFunction) {
255
+ return undefined;
256
+ }
257
+ return new aws_stepfunctions_tasks_1.LambdaInvoke(this, 'PostProcessingStep', {
258
+ lambdaFunction: this.bedrockDocumentProcessingProps.postProcessingLambdaFunction,
259
+ resultPath: '$.postProcessedResult',
260
+ });
261
+ }
262
+ }
263
+ exports.BedrockDocumentProcessing = BedrockDocumentProcessing;
264
+ _a = JSII_RTTI_SYMBOL_1;
265
+ BedrockDocumentProcessing[_a] = { fqn: "@cdklabs/cdk-appmod-catalog-blueprints.BedrockDocumentProcessing", version: "1.0.0" };
266
+ BedrockDocumentProcessing.DEFAULT_CLASSIFICATION_MODEL_ID = aws_bedrock_1.FoundationModelIdentifier.ANTHROPIC_CLAUDE_3_7_SONNET_20250219_V1_0;
267
+ BedrockDocumentProcessing.DEFAULT_PROCESSING_MODEL_ID = aws_bedrock_1.FoundationModelIdentifier.ANTHROPIC_CLAUDE_3_7_SONNET_20250219_V1_0;
268
+ BedrockDocumentProcessing.DEFAULT_CLASSIFICATION_PROMPT = `
269
+ Analyze the document below, and classify the type of document it is (eg. INVOICE, IDENTITY_DOCUMENT, RECEIPT, etc). The result should be in JSON and should follow the following structure (only respond in JSON with the following structure and do not use markdown to indicate the json, just output plain old json with nothing else):
270
+
271
+ {
272
+ documentClassification: <CLASSIFICATION>
273
+ }
274
+
275
+ Attached document is as follows:
276
+
277
+ `;
278
+ BedrockDocumentProcessing.DEFAULT_PROCESSING_PROMPT = `
279
+ The document below has been classified as [ACTUAL_CLASSIFICATION]. Extract important entities from the document and return the result as JSON following the structure below (only respond in JSON with the following structure and do not use markdown to indicate the json, just output plain old json with nothing else):
280
+
281
+ {
282
+ documentClassification: <CLASSIFICATION>,
283
+ result: {
284
+ entities: [
285
+ {
286
+ type: <TYPE OF ENTITY>
287
+ value: <VALUE OF ENTITY>
288
+ },
289
+ ...
290
+ ]
291
+ }
292
+ }
293
+
294
+ Attached document is as follows:
295
+
296
+ `;
297
+ //# sourceMappingURL=data:application/json;base64,
@@ -0,0 +1,3 @@
1
+ export * from './base-document-processing';
2
+ export * from './bedrock-document-processing';
3
+ export * from './agentic-document-processing';
@@ -0,0 +1,20 @@
1
// Compiled CommonJS barrel: re-exports every named export of the three
// document-processing modules required at the bottom of this file.
+ "use strict";
2
// __createBinding(o, m, k, k2): expose m[k] on o under the name k2 (k2 defaults to k).
// An existing helper on `this` is reused when present.
// With Object.create available, m's own property descriptor is kept only when it
// is an accessor on a module flagged __esModule, or a data property that is
// neither writable nor configurable. In every other case (including no
// descriptor at all) an enumerable getter returning m[k] is installed, so the
// binding reads through to m on each access.
+ var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
3
+ if (k2 === undefined) k2 = k;
4
+ var desc = Object.getOwnPropertyDescriptor(m, k);
5
+ if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) {
6
+ desc = { enumerable: true, get: function() { return m[k]; } };
7
+ }
8
+ Object.defineProperty(o, k2, desc);
9
// Fallback when Object.create is unavailable: copy the current value by assignment.
+ }) : (function(o, m, k, k2) {
10
+ if (k2 === undefined) k2 = k;
11
+ o[k2] = m[k];
12
+ }));
13
// __exportStar(m, exports): bind every enumerable property of m onto exports,
// skipping "default" and any name exports already owns, so earlier re-exports
// take precedence over later ones.
+ var __exportStar = (this && this.__exportStar) || function(m, exports) {
14
+ for (var p in m) if (p !== "default" && !Object.prototype.hasOwnProperty.call(exports, p)) __createBinding(exports, m, p);
15
+ };
16
// Flag this module as a transpiled ES module.
+ Object.defineProperty(exports, "__esModule", { value: true });
17
+ __exportStar(require("./base-document-processing"), exports);
18
+ __exportStar(require("./bedrock-document-processing"), exports);
19
+ __exportStar(require("./agentic-document-processing"), exports);
20
+ //# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoiaW5kZXguanMiLCJzb3VyY2VSb290IjoiIiwic291cmNlcyI6WyIuLi8uLi91c2UtY2FzZXMvZG9jdW1lbnQtcHJvY2Vzc2luZy9pbmRleC50cyJdLCJuYW1lcyI6W10sIm1hcHBpbmdzIjoiOzs7Ozs7Ozs7Ozs7Ozs7O0FBQUEsNkRBQTJDO0FBQzNDLGdFQUE4QztBQUM5QyxnRUFBOEMiLCJzb3VyY2VzQ29udGVudCI6WyJleHBvcnQgKiBmcm9tICcuL2Jhc2UtZG9jdW1lbnQtcHJvY2Vzc2luZyc7XG5leHBvcnQgKiBmcm9tICcuL2JlZHJvY2stZG9jdW1lbnQtcHJvY2Vzc2luZyc7XG5leHBvcnQgKiBmcm9tICcuL2FnZW50aWMtZG9jdW1lbnQtcHJvY2Vzc2luZyc7Il19
@@ -0,0 +1,63 @@
1
+ import json
2
+ import os
3
+ import boto3
4
+ import base64
5
+ from aws_lambda_powertools import Metrics, Tracer
6
+ from aws_lambda_powertools.metrics import MetricUnit
7
+
8
+ s3 = boto3.client('s3')
9
+ bedrock = boto3.client('bedrock-runtime')
10
+ metrics = Metrics()
11
+ tracer = Tracer()
12
+
13
def _parse_model_json(text):
    """Parse the model's text reply as JSON, tolerating a Markdown code fence.

    The prompts ask for bare JSON, but a reply wrapped in a fence
    (three backticks, optionally followed by ``json``) is unwrapped first.

    Raises:
        json.JSONDecodeError: if the (unwrapped) text is not valid JSON.
    """
    cleaned = text.strip()
    if cleaned.startswith("```"):
        # Drop the opening fence line, then everything from the closing fence on.
        cleaned = cleaned.split("\n", 1)[1] if "\n" in cleaned else ""
        cleaned = cleaned.rsplit("```", 1)[0]
    return json.loads(cleaned)


@metrics.log_metrics
@tracer.capture_lambda_handler
def handler(event, context):
    """Send one S3 document to a Bedrock model and return its JSON answer.

    Event keys read:
        bucket, key: S3 location of the document (jpg, jpeg, png or pdf).
        documentId: recorded as a tracer annotation.
        classificationResult (optional): when present, its
            ``documentClassification`` value replaces the literal
            ``[ACTUAL_CLASSIFICATION]`` placeholder in the prompt.

    Environment variables read:
        INVOKE_TYPE: recorded as a tracer annotation and a metric dimension.
        PROMPT: prompt text sent ahead of the document.
        MODEL_ID: Bedrock model identifier passed to ``invoke_model``.

    Returns:
        The JSON value parsed from the text of the first content item in
        the model response.

    Raises:
        ValueError: if the key's extension is not a supported file type.
        json.JSONDecodeError: if the model's reply is not valid JSON.
    """
    # Function-scope import keeps this block self-contained.
    import tempfile

    bucket = event['bucket']
    key = event['key']
    invoke_type = os.environ["INVOKE_TYPE"]
    tracer.put_annotation(key="invoke_type", value=invoke_type)
    tracer.put_annotation(key="documentId", value=event["documentId"])
    metrics.add_dimension(name="invoke_type", value=invoke_type)

    # Check file type
    ext = key.lower().split('.')[-1]
    if ext not in ['jpg', 'jpeg', 'png', 'pdf']:
        raise ValueError(f"Unsupported file type: {ext}")

    media_type = {'jpg': 'image/jpeg', 'jpeg': 'image/jpeg', 'png': 'image/png', 'pdf': 'application/pdf'}[ext]

    # Download into a per-invocation scratch directory that is removed on exit.
    # /tmp persists across warm invocations, so files left behind would
    # accumulate in the function's ephemeral storage.
    with tempfile.TemporaryDirectory(dir="/tmp") as workdir:
        local_path = os.path.join(workdir, key.split('/')[-1])
        s3.download_file(bucket, key, local_path)

        # Read and encode file
        with open(local_path, 'rb') as f:
            file_data = base64.b64encode(f.read()).decode('utf-8')

    # Format prompt if classification result exists
    prompt = os.environ['PROMPT']
    if 'classificationResult' in event:
        classification = event['classificationResult']['documentClassification']
        prompt = prompt.replace("[ACTUAL_CLASSIFICATION]", classification)

    # Build content based on file type: PDFs go as a document part, images as an image part
    attachment_type = 'document' if ext == 'pdf' else 'image'
    content = [
        {'type': 'text', 'text': prompt},
        {'type': attachment_type, 'source': {'type': 'base64', 'media_type': media_type, 'data': file_data}},
    ]

    # Invoke Bedrock
    response = bedrock.invoke_model(
        modelId=os.environ['MODEL_ID'],
        body=json.dumps({
            'anthropic_version': 'bedrock-2023-05-31',
            'max_tokens': 1000,
            'messages': [{'role': 'user', 'content': content}]
        })
    )

    response_payload = response['body'].read()
    metrics.add_metric(name="SuccessfulInvocation", unit=MetricUnit.Count, value=1)
    return _parse_model_json(json.loads(response_payload)["content"][0]["text"])
@@ -0,0 +1,4 @@
1
+ boto3>=1.26.0
2
+ aws-lambda-powertools
3
+ urllib3>=1.26.0,<2.0.0
4
+ aws-xray-sdk