@cdklabs/cdk-appmod-catalog-blueprints 1.4.1 → 1.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.jsii +2579 -194
- package/lib/document-processing/adapter/adapter.d.ts +4 -2
- package/lib/document-processing/adapter/adapter.js +1 -1
- package/lib/document-processing/adapter/queued-s3-adapter.d.ts +9 -2
- package/lib/document-processing/adapter/queued-s3-adapter.js +29 -15
- package/lib/document-processing/agentic-document-processing.d.ts +4 -0
- package/lib/document-processing/agentic-document-processing.js +20 -10
- package/lib/document-processing/base-document-processing.d.ts +54 -2
- package/lib/document-processing/base-document-processing.js +136 -82
- package/lib/document-processing/bedrock-document-processing.d.ts +202 -2
- package/lib/document-processing/bedrock-document-processing.js +717 -77
- package/lib/document-processing/chunking-config.d.ts +614 -0
- package/lib/document-processing/chunking-config.js +5 -0
- package/lib/document-processing/default-document-processing-config.js +1 -1
- package/lib/document-processing/index.d.ts +1 -0
- package/lib/document-processing/index.js +2 -1
- package/lib/document-processing/resources/aggregation/handler.py +567 -0
- package/lib/document-processing/resources/aggregation/requirements.txt +7 -0
- package/lib/document-processing/resources/aggregation/test_handler.py +362 -0
- package/lib/document-processing/resources/cleanup/handler.py +276 -0
- package/lib/document-processing/resources/cleanup/requirements.txt +5 -0
- package/lib/document-processing/resources/cleanup/test_handler.py +436 -0
- package/lib/document-processing/resources/default-bedrock-invoke/index.py +85 -3
- package/lib/document-processing/resources/default-bedrock-invoke/test_index.py +622 -0
- package/lib/document-processing/resources/pdf-chunking/README.md +313 -0
- package/lib/document-processing/resources/pdf-chunking/chunking_strategies.py +460 -0
- package/lib/document-processing/resources/pdf-chunking/error_handling.py +491 -0
- package/lib/document-processing/resources/pdf-chunking/handler.py +958 -0
- package/lib/document-processing/resources/pdf-chunking/metrics.py +435 -0
- package/lib/document-processing/resources/pdf-chunking/requirements.txt +3 -0
- package/lib/document-processing/resources/pdf-chunking/strategy_selection.py +420 -0
- package/lib/document-processing/resources/pdf-chunking/structured_logging.py +457 -0
- package/lib/document-processing/resources/pdf-chunking/test_chunking_strategies.py +353 -0
- package/lib/document-processing/resources/pdf-chunking/test_error_handling.py +487 -0
- package/lib/document-processing/resources/pdf-chunking/test_handler.py +609 -0
- package/lib/document-processing/resources/pdf-chunking/test_integration.py +694 -0
- package/lib/document-processing/resources/pdf-chunking/test_metrics.py +532 -0
- package/lib/document-processing/resources/pdf-chunking/test_strategy_selection.py +471 -0
- package/lib/document-processing/resources/pdf-chunking/test_structured_logging.py +449 -0
- package/lib/document-processing/resources/pdf-chunking/test_token_estimation.py +374 -0
- package/lib/document-processing/resources/pdf-chunking/token_estimation.py +189 -0
- package/lib/document-processing/tests/agentic-document-processing-nag.test.js +4 -3
- package/lib/document-processing/tests/agentic-document-processing.test.js +488 -4
- package/lib/document-processing/tests/base-document-processing-nag.test.js +9 -2
- package/lib/document-processing/tests/base-document-processing-schema.test.d.ts +1 -0
- package/lib/document-processing/tests/base-document-processing-schema.test.js +337 -0
- package/lib/document-processing/tests/base-document-processing.test.js +114 -8
- package/lib/document-processing/tests/bedrock-document-processing-chunking-nag.test.d.ts +1 -0
- package/lib/document-processing/tests/bedrock-document-processing-chunking-nag.test.js +382 -0
- package/lib/document-processing/tests/bedrock-document-processing-nag.test.js +4 -3
- package/lib/document-processing/tests/bedrock-document-processing-security.test.d.ts +1 -0
- package/lib/document-processing/tests/bedrock-document-processing-security.test.js +389 -0
- package/lib/document-processing/tests/bedrock-document-processing.test.js +808 -8
- package/lib/document-processing/tests/chunking-config.test.d.ts +1 -0
- package/lib/document-processing/tests/chunking-config.test.js +238 -0
- package/lib/document-processing/tests/queued-s3-adapter-nag.test.js +9 -2
- package/lib/document-processing/tests/queued-s3-adapter.test.js +17 -6
- package/lib/framework/agents/base-agent.js +1 -1
- package/lib/framework/agents/batch-agent.js +1 -1
- package/lib/framework/agents/default-agent-config.js +1 -1
- package/lib/framework/bedrock/bedrock.js +1 -1
- package/lib/framework/custom-resource/default-runtimes.js +1 -1
- package/lib/framework/foundation/access-log.js +1 -1
- package/lib/framework/foundation/eventbridge-broker.js +1 -1
- package/lib/framework/foundation/network.d.ts +4 -2
- package/lib/framework/foundation/network.js +52 -41
- package/lib/framework/tests/access-log.test.js +5 -2
- package/lib/framework/tests/batch-agent.test.js +5 -2
- package/lib/framework/tests/bedrock.test.js +5 -2
- package/lib/framework/tests/eventbridge-broker.test.js +5 -2
- package/lib/framework/tests/framework-nag.test.js +26 -7
- package/lib/framework/tests/network.test.js +30 -2
- package/lib/tsconfig.tsbuildinfo +1 -1
- package/lib/utilities/data-loader.js +1 -1
- package/lib/utilities/lambda-iam-utils.js +1 -1
- package/lib/utilities/observability/cloudfront-distribution-observability-property-injector.js +1 -1
- package/lib/utilities/observability/default-observability-config.js +1 -1
- package/lib/utilities/observability/lambda-observability-property-injector.js +1 -1
- package/lib/utilities/observability/log-group-data-protection-utils.js +1 -1
- package/lib/utilities/observability/powertools-config.d.ts +10 -1
- package/lib/utilities/observability/powertools-config.js +19 -3
- package/lib/utilities/observability/state-machine-observability-property-injector.js +1 -1
- package/lib/utilities/test-utils.d.ts +43 -0
- package/lib/utilities/test-utils.js +56 -0
- package/lib/utilities/tests/data-loader-nag.test.js +3 -2
- package/lib/utilities/tests/data-loader.test.js +3 -2
- package/lib/webapp/frontend-construct.js +1 -1
- package/lib/webapp/tests/frontend-construct-nag.test.js +3 -2
- package/lib/webapp/tests/frontend-construct.test.js +3 -2
- package/package.json +6 -5
- package/lib/document-processing/resources/default-error-handler/index.js +0 -46
- package/lib/document-processing/resources/default-pdf-processor/index.js +0 -46
- package/lib/document-processing/resources/default-pdf-validator/index.js +0 -36
|
@@ -11,6 +11,7 @@ const aws_cdk_lib_1 = require("aws-cdk-lib");
|
|
|
11
11
|
const aws_ec2_1 = require("aws-cdk-lib/aws-ec2");
|
|
12
12
|
const aws_iam_1 = require("aws-cdk-lib/aws-iam");
|
|
13
13
|
const aws_lambda_1 = require("aws-cdk-lib/aws-lambda");
|
|
14
|
+
const aws_stepfunctions_1 = require("aws-cdk-lib/aws-stepfunctions");
|
|
14
15
|
const aws_stepfunctions_tasks_1 = require("aws-cdk-lib/aws-stepfunctions-tasks");
|
|
15
16
|
const base_document_processing_1 = require("./base-document-processing");
|
|
16
17
|
const framework_1 = require("../framework");
|
|
@@ -58,9 +59,24 @@ class BedrockDocumentProcessing extends base_document_processing_1.BaseDocumentP
|
|
|
58
59
|
* @param scope - The scope in which to define this construct
|
|
59
60
|
* @param id - The scoped construct ID. Must be unique within the scope.
|
|
60
61
|
* @param props - Configuration properties for the Bedrock document processing pipeline
|
|
62
|
+
* @throws Error if chunking configuration is invalid
|
|
61
63
|
*/
|
|
62
64
|
constructor(scope, id, props) {
|
|
63
65
|
super(scope, id, props);
|
|
66
|
+
/** Counter for generating unique classification step IDs */
|
|
67
|
+
this._classificationStepCounter = 0;
|
|
68
|
+
/** Counter for generating unique processing step IDs */
|
|
69
|
+
this._processingStepCounter = 0;
|
|
70
|
+
/** Counter for generating unique aggregation step IDs */
|
|
71
|
+
this._aggregationStepCounter = 0;
|
|
72
|
+
/** Counter for generating unique enrichment step IDs */
|
|
73
|
+
this._enrichmentStepCounter = 0;
|
|
74
|
+
/** Counter for generating unique post-processing step IDs */
|
|
75
|
+
this._postProcessingStepCounter = 0;
|
|
76
|
+
// Validate chunking configuration if provided
|
|
77
|
+
if (props.enableChunking && props.chunkingConfig) {
|
|
78
|
+
this.validateChunkingConfig(props.chunkingConfig);
|
|
79
|
+
}
|
|
64
80
|
if (props.network) {
|
|
65
81
|
props.network.createServiceEndpoint('vpce-bedrock', aws_ec2_1.InterfaceVpcEndpointAwsService.BEDROCK);
|
|
66
82
|
props.network.createServiceEndpoint('vpce-bedrock-runtime', aws_ec2_1.InterfaceVpcEndpointAwsService.BEDROCK_RUNTIME);
|
|
@@ -68,6 +84,77 @@ class BedrockDocumentProcessing extends base_document_processing_1.BaseDocumentP
|
|
|
68
84
|
this.bedrockDocumentProcessingProps = props;
|
|
69
85
|
this.stateMachine = this.handleStateMachineCreation('bedrock-document-processing-workflow');
|
|
70
86
|
}
|
|
87
|
+
/**
|
|
88
|
+
* Validates the chunking configuration parameters.
|
|
89
|
+
*
|
|
90
|
+
* Ensures that:
|
|
91
|
+
* - Chunk size is greater than 0
|
|
92
|
+
* - Overlap is non-negative and less than chunk size
|
|
93
|
+
* - Thresholds are greater than 0
|
|
94
|
+
* - Max concurrency is greater than 0
|
|
95
|
+
* - Min success threshold is between 0 and 1
|
|
96
|
+
*
|
|
97
|
+
* @param config - The chunking configuration to validate
|
|
98
|
+
* @throws Error if any configuration parameter is invalid
|
|
99
|
+
*/
|
|
100
|
+
validateChunkingConfig(config) {
|
|
101
|
+
// Validate chunk size (for fixed-pages strategy)
|
|
102
|
+
if (config.chunkSize !== undefined) {
|
|
103
|
+
if (config.chunkSize <= 0) {
|
|
104
|
+
throw new Error('ChunkingConfig validation error: chunkSize must be greater than 0');
|
|
105
|
+
}
|
|
106
|
+
}
|
|
107
|
+
// Validate overlap pages (for fixed-pages strategy)
|
|
108
|
+
if (config.overlapPages !== undefined) {
|
|
109
|
+
if (config.overlapPages < 0) {
|
|
110
|
+
throw new Error('ChunkingConfig validation error: overlapPages must be non-negative');
|
|
111
|
+
}
|
|
112
|
+
const effectiveChunkSize = config.chunkSize || 50; // default chunk size
|
|
113
|
+
if (config.overlapPages >= effectiveChunkSize) {
|
|
114
|
+
throw new Error('ChunkingConfig validation error: overlapPages must be less than chunkSize');
|
|
115
|
+
}
|
|
116
|
+
}
|
|
117
|
+
// Validate page threshold
|
|
118
|
+
if (config.pageThreshold !== undefined && config.pageThreshold <= 0) {
|
|
119
|
+
throw new Error('ChunkingConfig validation error: pageThreshold must be greater than 0');
|
|
120
|
+
}
|
|
121
|
+
// Validate token threshold
|
|
122
|
+
if (config.tokenThreshold !== undefined && config.tokenThreshold <= 0) {
|
|
123
|
+
throw new Error('ChunkingConfig validation error: tokenThreshold must be greater than 0');
|
|
124
|
+
}
|
|
125
|
+
// Validate max tokens per chunk (for token-based strategy)
|
|
126
|
+
if (config.maxTokensPerChunk !== undefined && config.maxTokensPerChunk <= 0) {
|
|
127
|
+
throw new Error('ChunkingConfig validation error: maxTokensPerChunk must be greater than 0');
|
|
128
|
+
}
|
|
129
|
+
// Validate overlap tokens (for token-based and hybrid strategies)
|
|
130
|
+
if (config.overlapTokens !== undefined) {
|
|
131
|
+
if (config.overlapTokens < 0) {
|
|
132
|
+
throw new Error('ChunkingConfig validation error: overlapTokens must be non-negative');
|
|
133
|
+
}
|
|
134
|
+
const effectiveMaxTokens = config.maxTokensPerChunk || 100000; // default max tokens
|
|
135
|
+
if (config.overlapTokens >= effectiveMaxTokens) {
|
|
136
|
+
throw new Error('ChunkingConfig validation error: overlapTokens must be less than maxTokensPerChunk');
|
|
137
|
+
}
|
|
138
|
+
}
|
|
139
|
+
// Validate max pages per chunk (for hybrid strategy)
|
|
140
|
+
if (config.maxPagesPerChunk !== undefined && config.maxPagesPerChunk <= 0) {
|
|
141
|
+
throw new Error('ChunkingConfig validation error: maxPagesPerChunk must be greater than 0');
|
|
142
|
+
}
|
|
143
|
+
// Validate target tokens per chunk (for hybrid strategy)
|
|
144
|
+
if (config.targetTokensPerChunk !== undefined && config.targetTokensPerChunk <= 0) {
|
|
145
|
+
throw new Error('ChunkingConfig validation error: targetTokensPerChunk must be greater than 0');
|
|
146
|
+
}
|
|
147
|
+
// Validate max concurrency
|
|
148
|
+
if (config.maxConcurrency !== undefined && config.maxConcurrency <= 0) {
|
|
149
|
+
throw new Error('ChunkingConfig validation error: maxConcurrency must be greater than 0');
|
|
150
|
+
}
|
|
151
|
+
// Validate min success threshold
|
|
152
|
+
if (config.minSuccessThreshold !== undefined) {
|
|
153
|
+
if (config.minSuccessThreshold < 0 || config.minSuccessThreshold > 1) {
|
|
154
|
+
throw new Error('ChunkingConfig validation error: minSuccessThreshold must be between 0 and 1');
|
|
155
|
+
}
|
|
156
|
+
}
|
|
157
|
+
}
|
|
71
158
|
/**
|
|
72
159
|
* Implements the document classification step using Amazon Bedrock.
|
|
73
160
|
*
|
|
@@ -75,47 +162,60 @@ class BedrockDocumentProcessing extends base_document_processing_1.BaseDocumentP
|
|
|
75
162
|
* the document type. The function reads the document from S3 and sends it to
|
|
76
163
|
* Bedrock with the classification prompt.
|
|
77
164
|
*
|
|
165
|
+
* This method caches the Lambda function to avoid creating duplicate resources,
|
|
166
|
+
* but creates a new LambdaInvoke task each time to allow proper state chaining.
|
|
167
|
+
*
|
|
78
168
|
* @returns LambdaInvoke task configured for document classification
|
|
79
169
|
*/
|
|
80
170
|
classificationStep() {
|
|
81
|
-
|
|
82
|
-
|
|
83
|
-
|
|
84
|
-
|
|
85
|
-
|
|
86
|
-
account
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
|
|
90
|
-
|
|
91
|
-
|
|
92
|
-
|
|
93
|
-
|
|
94
|
-
|
|
95
|
-
|
|
96
|
-
|
|
97
|
-
|
|
98
|
-
|
|
99
|
-
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
|
|
112
|
-
|
|
113
|
-
|
|
114
|
-
|
|
115
|
-
|
|
171
|
+
// Create Lambda function only once
|
|
172
|
+
if (!this._classificationFunction) {
|
|
173
|
+
const prompt = this.bedrockDocumentProcessingProps.classificationPrompt || BedrockDocumentProcessing.DEFAULT_CLASSIFICATION_PROMPT;
|
|
174
|
+
const adjustedModelId = bedrock_1.BedrockModelUtils.deriveActualModelId(this.bedrockDocumentProcessingProps.classificationBedrockModel);
|
|
175
|
+
const role = this.generateLambdaRoleForBedrock('ClassificationLambdaRole', this.bedrockDocumentProcessingProps.classificationBedrockModel);
|
|
176
|
+
const { region, account } = aws_cdk_lib_1.Stack.of(this);
|
|
177
|
+
const generatedLogPermissions = utilities_1.LambdaIamUtils.createLogsPermissions({
|
|
178
|
+
account,
|
|
179
|
+
functionName: 'bedrock-idp-classification',
|
|
180
|
+
region,
|
|
181
|
+
scope: this,
|
|
182
|
+
enableObservability: this.bedrockDocumentProcessingProps.enableObservability,
|
|
183
|
+
});
|
|
184
|
+
this.encryptionKey.grantEncryptDecrypt(role);
|
|
185
|
+
this._classificationFunction = new aws_lambda_python_alpha_1.PythonFunction(this, 'BedrockClassificationFunction', {
|
|
186
|
+
functionName: generatedLogPermissions.uniqueFunctionName,
|
|
187
|
+
architecture: aws_lambda_1.Architecture.X86_64,
|
|
188
|
+
runtime: framework_1.DefaultRuntimes.PYTHON,
|
|
189
|
+
entry: path.join(__dirname, 'resources/default-bedrock-invoke'),
|
|
190
|
+
role,
|
|
191
|
+
memorySize: 512,
|
|
192
|
+
timeout: this.bedrockDocumentProcessingProps.stepTimeouts || aws_cdk_lib_1.Duration.minutes(5),
|
|
193
|
+
environment: {
|
|
194
|
+
MODEL_ID: adjustedModelId,
|
|
195
|
+
PROMPT: prompt,
|
|
196
|
+
INVOKE_TYPE: 'classification',
|
|
197
|
+
...powertools_config_1.PowertoolsConfig.generateDefaultLambdaConfig(this.bedrockDocumentProcessingProps.enableObservability, this.metricNamespace, this.metricServiceName),
|
|
198
|
+
},
|
|
199
|
+
environmentEncryption: this.encryptionKey,
|
|
200
|
+
vpc: this.bedrockDocumentProcessingProps.network
|
|
201
|
+
? this.bedrockDocumentProcessingProps.network.vpc
|
|
202
|
+
: undefined,
|
|
203
|
+
vpcSubnets: this.bedrockDocumentProcessingProps.network
|
|
204
|
+
? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection()
|
|
205
|
+
: undefined,
|
|
206
|
+
});
|
|
207
|
+
for (const statement of generatedLogPermissions.policyStatements) {
|
|
208
|
+
this._classificationFunction.role?.addToPrincipalPolicy(statement);
|
|
209
|
+
}
|
|
210
|
+
if (this.bedrockDocumentProcessingProps.network) {
|
|
211
|
+
this._classificationFunction.role?.addToPrincipalPolicy(utilities_1.LambdaIamUtils.generateLambdaVPCPermissions());
|
|
212
|
+
}
|
|
116
213
|
}
|
|
117
|
-
|
|
118
|
-
|
|
214
|
+
// Always create a new LambdaInvoke task to allow proper state chaining
|
|
215
|
+
const stepId = `ClassificationStep-${this._classificationStepCounter}`;
|
|
216
|
+
this._classificationStepCounter++;
|
|
217
|
+
return new aws_stepfunctions_tasks_1.LambdaInvoke(this, stepId, {
|
|
218
|
+
lambdaFunction: this._classificationFunction,
|
|
119
219
|
resultPath: '$.classificationResult',
|
|
120
220
|
resultSelector: {
|
|
121
221
|
'documentClassification.$': '$.Payload.documentClassification',
|
|
@@ -129,46 +229,59 @@ class BedrockDocumentProcessing extends base_document_processing_1.BaseDocumentP
|
|
|
129
229
|
* structured data from the document. Uses the classification result from the
|
|
130
230
|
* previous step to provide context for more accurate extraction.
|
|
131
231
|
*
|
|
232
|
+
* This method caches the Lambda function to avoid creating duplicate resources,
|
|
233
|
+
* but creates a new LambdaInvoke task each time to allow proper state chaining.
|
|
234
|
+
*
|
|
132
235
|
* @returns LambdaInvoke task configured for document extraction
|
|
133
236
|
*/
|
|
134
237
|
processingStep() {
|
|
135
|
-
|
|
136
|
-
|
|
137
|
-
|
|
138
|
-
|
|
139
|
-
|
|
140
|
-
account
|
|
141
|
-
|
|
142
|
-
|
|
143
|
-
|
|
144
|
-
|
|
145
|
-
|
|
146
|
-
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
|
|
153
|
-
|
|
154
|
-
|
|
155
|
-
|
|
156
|
-
|
|
157
|
-
|
|
158
|
-
|
|
159
|
-
|
|
160
|
-
|
|
161
|
-
|
|
162
|
-
|
|
163
|
-
|
|
164
|
-
|
|
165
|
-
|
|
166
|
-
|
|
167
|
-
|
|
168
|
-
|
|
238
|
+
// Create Lambda function only once
|
|
239
|
+
if (!this._processingFunction) {
|
|
240
|
+
const prompt = this.bedrockDocumentProcessingProps.processingPrompt || BedrockDocumentProcessing.DEFAULT_PROCESSING_PROMPT;
|
|
241
|
+
const adjustedModelId = bedrock_1.BedrockModelUtils.deriveActualModelId(this.bedrockDocumentProcessingProps.processingBedrockModel);
|
|
242
|
+
const role = this.generateLambdaRoleForBedrock('ProcessingLambdaRole', this.bedrockDocumentProcessingProps.processingBedrockModel);
|
|
243
|
+
const { region, account } = aws_cdk_lib_1.Stack.of(this);
|
|
244
|
+
const generatedLogPermissions = utilities_1.LambdaIamUtils.createLogsPermissions({
|
|
245
|
+
account,
|
|
246
|
+
functionName: 'bedrock-idp-processing',
|
|
247
|
+
region,
|
|
248
|
+
scope: this,
|
|
249
|
+
});
|
|
250
|
+
this.encryptionKey.grantEncryptDecrypt(role);
|
|
251
|
+
this._processingFunction = new aws_lambda_python_alpha_1.PythonFunction(this, 'BedrockExtractionFunction', {
|
|
252
|
+
functionName: generatedLogPermissions.uniqueFunctionName,
|
|
253
|
+
runtime: framework_1.DefaultRuntimes.PYTHON,
|
|
254
|
+
architecture: aws_lambda_1.Architecture.X86_64,
|
|
255
|
+
entry: path.join(__dirname, 'resources/default-bedrock-invoke'),
|
|
256
|
+
role,
|
|
257
|
+
memorySize: 512,
|
|
258
|
+
timeout: this.bedrockDocumentProcessingProps.stepTimeouts || aws_cdk_lib_1.Duration.minutes(5),
|
|
259
|
+
environment: {
|
|
260
|
+
MODEL_ID: adjustedModelId,
|
|
261
|
+
PROMPT: prompt,
|
|
262
|
+
INVOKE_TYPE: 'processing',
|
|
263
|
+
...powertools_config_1.PowertoolsConfig.generateDefaultLambdaConfig(this.bedrockDocumentProcessingProps.enableObservability, this.metricNamespace, this.metricServiceName),
|
|
264
|
+
},
|
|
265
|
+
environmentEncryption: this.encryptionKey,
|
|
266
|
+
vpc: this.bedrockDocumentProcessingProps.network
|
|
267
|
+
? this.bedrockDocumentProcessingProps.network.vpc
|
|
268
|
+
: undefined,
|
|
269
|
+
vpcSubnets: this.bedrockDocumentProcessingProps.network
|
|
270
|
+
? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection()
|
|
271
|
+
: undefined,
|
|
272
|
+
});
|
|
273
|
+
for (const statement of generatedLogPermissions.policyStatements) {
|
|
274
|
+
this._processingFunction.role?.addToPrincipalPolicy(statement);
|
|
275
|
+
}
|
|
276
|
+
if (this.bedrockDocumentProcessingProps.network) {
|
|
277
|
+
this._processingFunction.role?.addToPrincipalPolicy(utilities_1.LambdaIamUtils.generateLambdaVPCPermissions());
|
|
278
|
+
}
|
|
169
279
|
}
|
|
170
|
-
|
|
171
|
-
|
|
280
|
+
// Always create a new LambdaInvoke task to allow proper state chaining
|
|
281
|
+
const stepId = `ProcessingStep-${this._processingStepCounter}`;
|
|
282
|
+
this._processingStepCounter++;
|
|
283
|
+
return new aws_stepfunctions_tasks_1.LambdaInvoke(this, stepId, {
|
|
284
|
+
lambdaFunction: this._processingFunction,
|
|
172
285
|
resultPath: '$.processingResult',
|
|
173
286
|
resultSelector: {
|
|
174
287
|
'documentClassification.$': '$.Payload.documentClassification',
|
|
@@ -182,6 +295,7 @@ class BedrockDocumentProcessing extends base_document_processing_1.BaseDocumentP
|
|
|
182
295
|
inlinePolicies: {
|
|
183
296
|
BedrockInvokePolicy: new aws_iam_1.PolicyDocument({
|
|
184
297
|
statements: [
|
|
298
|
+
// S3 read-only access for document retrieval - least privilege
|
|
185
299
|
...this.ingressAdapter.generateAdapterIAMPolicies(),
|
|
186
300
|
bedrock_1.BedrockModelUtils.generateModelIAMPermissions(this, model),
|
|
187
301
|
],
|
|
@@ -202,9 +316,13 @@ class BedrockDocumentProcessing extends base_document_processing_1.BaseDocumentP
|
|
|
202
316
|
if (!this.bedrockDocumentProcessingProps.enrichmentLambdaFunction) {
|
|
203
317
|
return undefined;
|
|
204
318
|
}
|
|
205
|
-
|
|
319
|
+
const stepId = `EnrichmentStep-${this._enrichmentStepCounter}`;
|
|
320
|
+
this._enrichmentStepCounter++;
|
|
321
|
+
return new aws_stepfunctions_tasks_1.LambdaInvoke(this, stepId, {
|
|
206
322
|
lambdaFunction: this.bedrockDocumentProcessingProps.enrichmentLambdaFunction,
|
|
207
323
|
resultPath: '$.enrichedResult',
|
|
324
|
+
outputPath: '$',
|
|
325
|
+
payloadResponseOnly: true,
|
|
208
326
|
});
|
|
209
327
|
}
|
|
210
328
|
/**
|
|
@@ -220,15 +338,515 @@ class BedrockDocumentProcessing extends base_document_processing_1.BaseDocumentP
|
|
|
220
338
|
if (!this.bedrockDocumentProcessingProps.postProcessingLambdaFunction) {
|
|
221
339
|
return undefined;
|
|
222
340
|
}
|
|
223
|
-
|
|
341
|
+
const stepId = `PostProcessingStep-${this._postProcessingStepCounter}`;
|
|
342
|
+
this._postProcessingStepCounter++;
|
|
343
|
+
return new aws_stepfunctions_tasks_1.LambdaInvoke(this, stepId, {
|
|
224
344
|
lambdaFunction: this.bedrockDocumentProcessingProps.postProcessingLambdaFunction,
|
|
225
345
|
resultPath: '$.postProcessedResult',
|
|
346
|
+
outputPath: '$',
|
|
347
|
+
payloadResponseOnly: true,
|
|
226
348
|
});
|
|
227
349
|
}
|
|
350
|
+
/**
|
|
351
|
+
* Implements the optional preprocessing step for PDF chunking.
|
|
352
|
+
*
|
|
353
|
+
* When chunking is enabled, creates a Lambda function that analyzes PDFs and
|
|
354
|
+
* splits large documents into manageable chunks. The function:
|
|
355
|
+
* 1. Analyzes the PDF to determine page count and token estimates
|
|
356
|
+
* 2. Decides if chunking is needed based on configured thresholds
|
|
357
|
+
* 3. If chunking is needed, splits the PDF and uploads chunks to S3
|
|
358
|
+
*
|
|
359
|
+
* @returns LambdaInvoke task for PDF analysis and chunking, or undefined if chunking is disabled
|
|
360
|
+
*/
|
|
361
|
+
preprocessingStep() {
|
|
362
|
+
// Only enable chunking if explicitly configured
|
|
363
|
+
if (!this.bedrockDocumentProcessingProps.enableChunking) {
|
|
364
|
+
return undefined;
|
|
365
|
+
}
|
|
366
|
+
const { region, account } = aws_cdk_lib_1.Stack.of(this);
|
|
367
|
+
const chunkingConfig = this.bedrockDocumentProcessingProps.chunkingConfig || {};
|
|
368
|
+
// Create IAM role for chunking Lambda with least privilege permissions
|
|
369
|
+
// Chunking Lambda needs: GetObject (read raw PDFs), PutObject (write chunks)
|
|
370
|
+
const role = new aws_iam_1.Role(this, 'ChunkingLambdaRole', {
|
|
371
|
+
assumedBy: new aws_iam_1.ServicePrincipal('lambda.amazonaws.com'),
|
|
372
|
+
inlinePolicies: {
|
|
373
|
+
ChunkingPolicy: new aws_iam_1.PolicyDocument({
|
|
374
|
+
statements: [
|
|
375
|
+
...this.ingressAdapter.generateAdapterIAMPolicies(),
|
|
376
|
+
],
|
|
377
|
+
}),
|
|
378
|
+
},
|
|
379
|
+
});
|
|
380
|
+
const generatedLogPermissions = utilities_1.LambdaIamUtils.createLogsPermissions({
|
|
381
|
+
account,
|
|
382
|
+
functionName: 'bedrock-idp-chunking',
|
|
383
|
+
region,
|
|
384
|
+
scope: this,
|
|
385
|
+
enableObservability: this.bedrockDocumentProcessingProps.enableObservability,
|
|
386
|
+
});
|
|
387
|
+
this.encryptionKey.grantEncryptDecrypt(role);
|
|
388
|
+
// Create PDF Analysis & Chunking Lambda
|
|
389
|
+
const chunkingLambda = new aws_lambda_python_alpha_1.PythonFunction(this, 'PDFChunkingFunction', {
|
|
390
|
+
functionName: generatedLogPermissions.uniqueFunctionName,
|
|
391
|
+
entry: path.join(__dirname, 'resources/pdf-chunking'),
|
|
392
|
+
index: 'handler.py',
|
|
393
|
+
handler: 'handler',
|
|
394
|
+
runtime: framework_1.DefaultRuntimes.PYTHON,
|
|
395
|
+
architecture: aws_lambda_1.Architecture.X86_64,
|
|
396
|
+
role,
|
|
397
|
+
memorySize: 2048,
|
|
398
|
+
timeout: aws_cdk_lib_1.Duration.minutes(10),
|
|
399
|
+
environment: {
|
|
400
|
+
CHUNKING_STRATEGY: chunkingConfig.strategy || 'hybrid',
|
|
401
|
+
PAGE_THRESHOLD: String(chunkingConfig.pageThreshold || 100),
|
|
402
|
+
TOKEN_THRESHOLD: String(chunkingConfig.tokenThreshold || 150000),
|
|
403
|
+
CHUNK_SIZE: String(chunkingConfig.chunkSize || 50),
|
|
404
|
+
OVERLAP_PAGES: String(chunkingConfig.overlapPages || 5),
|
|
405
|
+
MAX_TOKENS_PER_CHUNK: String(chunkingConfig.maxTokensPerChunk || 100000),
|
|
406
|
+
OVERLAP_TOKENS: String(chunkingConfig.overlapTokens || 5000),
|
|
407
|
+
TARGET_TOKENS_PER_CHUNK: String(chunkingConfig.targetTokensPerChunk || 80000),
|
|
408
|
+
MAX_PAGES_PER_CHUNK: String(chunkingConfig.maxPagesPerChunk || 99),
|
|
409
|
+
...powertools_config_1.PowertoolsConfig.generateDefaultLambdaConfig(this.bedrockDocumentProcessingProps.enableObservability, this.metricNamespace, this.metricServiceName),
|
|
410
|
+
},
|
|
411
|
+
environmentEncryption: this.encryptionKey,
|
|
412
|
+
vpc: this.bedrockDocumentProcessingProps.network
|
|
413
|
+
? this.bedrockDocumentProcessingProps.network.vpc
|
|
414
|
+
: undefined,
|
|
415
|
+
vpcSubnets: this.bedrockDocumentProcessingProps.network
|
|
416
|
+
? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection()
|
|
417
|
+
: undefined,
|
|
418
|
+
});
|
|
419
|
+
for (const statement of generatedLogPermissions.policyStatements) {
|
|
420
|
+
chunkingLambda.role?.addToPrincipalPolicy(statement);
|
|
421
|
+
}
|
|
422
|
+
if (this.bedrockDocumentProcessingProps.network) {
|
|
423
|
+
chunkingLambda.role?.addToPrincipalPolicy(utilities_1.LambdaIamUtils.generateLambdaVPCPermissions());
|
|
424
|
+
}
|
|
425
|
+
return new aws_stepfunctions_tasks_1.LambdaInvoke(this, 'PDFAnalysisAndChunking', {
|
|
426
|
+
lambdaFunction: chunkingLambda,
|
|
427
|
+
resultPath: '$.chunkingResult',
|
|
428
|
+
resultSelector: {
|
|
429
|
+
'requiresChunking.$': '$.Payload.requiresChunking',
|
|
430
|
+
'tokenAnalysis.$': '$.Payload.tokenAnalysis',
|
|
431
|
+
'strategy.$': '$.Payload.strategy',
|
|
432
|
+
'chunks.$': '$.Payload.chunks',
|
|
433
|
+
},
|
|
434
|
+
});
|
|
435
|
+
}
|
|
436
|
+
/**
|
|
437
|
+
* Provides additional metadata fields for chunking to be stored in DynamoDB.
|
|
438
|
+
*
|
|
439
|
+
* When chunking is enabled, adds fields for:
|
|
440
|
+
* - ChunkingEnabled: string representation of boolean flag
|
|
441
|
+
* - ChunkingStrategy: strategy used (fixed-pages, token-based, hybrid)
|
|
442
|
+
* - TokenAnalysis: JSON string with token analysis results
|
|
443
|
+
* - ChunkMetadata: JSON string array with chunk information
|
|
444
|
+
*
|
|
445
|
+
* @returns Record of DynamoDB attribute values for chunking metadata
|
|
446
|
+
*/
|
|
447
|
+
preprocessingMetadata() {
|
|
448
|
+
if (!this.bedrockDocumentProcessingProps.enableChunking) {
|
|
449
|
+
return {};
|
|
450
|
+
}
|
|
451
|
+
return {
|
|
452
|
+
ChunkingEnabled: aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.stringAt('States.Format(\'{}\', $.chunkingResult.requiresChunking)')),
|
|
453
|
+
ChunkingStrategy: aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.stringAt('$.chunkingResult.strategy')),
|
|
454
|
+
TokenAnalysis: aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.jsonToString(aws_stepfunctions_1.JsonPath.objectAt('$.chunkingResult.tokenAnalysis'))),
|
|
455
|
+
ChunkMetadata: aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.jsonToString(aws_stepfunctions_1.JsonPath.objectAt('$.chunkingResult.chunks'))),
|
|
456
|
+
};
|
|
457
|
+
}
|
|
458
|
+
/**
|
|
459
|
+
* Creates the processing workflow with conditional branching for chunked documents.
|
|
460
|
+
*
|
|
461
|
+
* When chunking is enabled, creates a Choice State that:
|
|
462
|
+
* - Routes to chunked processing flow if document was chunked
|
|
463
|
+
* - Routes to standard processing flow if document was not chunked
|
|
464
|
+
*
|
|
465
|
+
* When chunking is disabled, returns the standard processing workflow.
|
|
466
|
+
*
|
|
467
|
+
* @returns Step Functions chain for processing the document
|
|
468
|
+
*/
|
|
469
|
+
createProcessingWorkflow() {
|
|
470
|
+
// If chunking is not enabled, use standard workflow
|
|
471
|
+
if (!this.bedrockDocumentProcessingProps.enableChunking) {
|
|
472
|
+
return this.createStandardProcessingWorkflow();
|
|
473
|
+
}
|
|
474
|
+
// Create Choice State to check if chunking was applied
|
|
475
|
+
const choiceState = new aws_stepfunctions_1.Choice(this, 'CheckIfChunked');
|
|
476
|
+
choiceState
|
|
477
|
+
.when(aws_stepfunctions_1.Condition.booleanEquals('$.chunkingResult.requiresChunking', true), this.createChunkedProcessingFlow())
|
|
478
|
+
.otherwise(
|
|
479
|
+
// Pass 'Standard' prefix to avoid construct ID collisions with chunked flow
|
|
480
|
+
this.createStandardProcessingWorkflow('Standard'));
|
|
481
|
+
return choiceState;
|
|
482
|
+
}
|
|
483
|
+
/**
|
|
484
|
+
* Creates the chunked processing flow for large documents.
|
|
485
|
+
*
|
|
486
|
+
* This flow:
|
|
487
|
+
* 1. Uses a Map State to process each chunk in parallel (or sequentially)
|
|
488
|
+
* 2. Each chunk goes through classification and processing
|
|
489
|
+
* 3. Results are aggregated using the aggregation Lambda
|
|
490
|
+
* 4. DynamoDB is updated with the aggregated result
|
|
491
|
+
* 5. Temporary chunks are cleaned up from S3
|
|
492
|
+
*
|
|
493
|
+
* @returns Step Functions chain for chunked document processing
|
|
494
|
+
*/
|
|
495
|
+
createChunkedProcessingFlow() {
|
|
496
|
+
const chunkingConfig = this.bedrockDocumentProcessingProps.chunkingConfig || {};
|
|
497
|
+
const maxConcurrency = chunkingConfig.processingMode === 'sequential'
|
|
498
|
+
? 1
|
|
499
|
+
: (chunkingConfig.maxConcurrency || 10);
|
|
500
|
+
// Create Map State for processing chunks
|
|
501
|
+
const mapState = new aws_stepfunctions_1.Map(this, 'ProcessChunks', {
|
|
502
|
+
itemsPath: '$.chunkingResult.chunks',
|
|
503
|
+
maxConcurrency,
|
|
504
|
+
parameters: {
|
|
505
|
+
'documentId.$': '$.documentId',
|
|
506
|
+
'chunk.$': '$$.Map.Item.Value',
|
|
507
|
+
'chunkIndex.$': '$$.Map.Item.Index',
|
|
508
|
+
'totalChunks.$': 'States.ArrayLength($.chunkingResult.chunks)',
|
|
509
|
+
// Override content to point to the chunk PDF, not the original document
|
|
510
|
+
'content': {
|
|
511
|
+
'location': 's3',
|
|
512
|
+
'bucket.$': '$$.Map.Item.Value.bucket',
|
|
513
|
+
'key.$': '$$.Map.Item.Value.key',
|
|
514
|
+
'filename.$': '$.content.filename',
|
|
515
|
+
},
|
|
516
|
+
'contentType.$': '$.contentType',
|
|
517
|
+
},
|
|
518
|
+
resultPath: '$.chunkResults',
|
|
519
|
+
});
|
|
520
|
+
// Define per-chunk processing: classification → processing
|
|
521
|
+
const chunkClassification = this.classificationStep();
|
|
522
|
+
const chunkProcessing = this.processingStep();
|
|
523
|
+
mapState.itemProcessor(chunkClassification.next(chunkProcessing));
|
|
524
|
+
// Create aggregation step (Lambda invoke only, normalization added separately)
|
|
525
|
+
const aggregationLambdaStep = this.createAggregationStep();
|
|
526
|
+
// Add a Pass state to normalize the aggregated result for downstream compatibility
|
|
527
|
+
// This copies aggregatedResult to processingResult so enrichment/post-processing
|
|
528
|
+
// see a consistent structure regardless of whether chunking was used
|
|
529
|
+
const normalizeState = new aws_stepfunctions_1.Pass(this, 'NormalizeAggregatedResult', {
|
|
530
|
+
parameters: {
|
|
531
|
+
'documentId.$': '$.documentId',
|
|
532
|
+
'contentType.$': '$.contentType',
|
|
533
|
+
'content.$': '$.content',
|
|
534
|
+
'chunkingResult.$': '$.chunkingResult',
|
|
535
|
+
'chunkResults.$': '$.chunkResults',
|
|
536
|
+
'aggregatedResult.$': '$.aggregatedResult',
|
|
537
|
+
// Copy aggregated result to processingResult for downstream compatibility
|
|
538
|
+
'processingResult': {
|
|
539
|
+
'result.$': '$.aggregatedResult.result',
|
|
540
|
+
},
|
|
541
|
+
// Also set classificationResult from the first successful chunk for consistency
|
|
542
|
+
'classificationResult.$': '$.chunkResults[0].classificationResult',
|
|
543
|
+
},
|
|
544
|
+
});
|
|
545
|
+
// Create DynamoDB update step for aggregated result
|
|
546
|
+
const updateAggregatedResultStep = this.createUpdateAggregatedResultStep();
|
|
547
|
+
// Create cleanup step
|
|
548
|
+
const cleanupStep = this.createCleanupStep();
|
|
549
|
+
// Create move to processed chain with 'Chunked' prefix to avoid ID collisions
|
|
550
|
+
const moveToProcessed = this.ingressAdapter.createSuccessChain(this, 'Chunked');
|
|
551
|
+
// Create error handler for aggregation failures
|
|
552
|
+
const aggregationErrorHandler = this.createAggregationErrorHandler();
|
|
553
|
+
// Get optional enrichment and post-processing steps
|
|
554
|
+
const enrichmentStep = this.enrichmentStep();
|
|
555
|
+
const postProcessingStep = this.postProcessingStep();
|
|
556
|
+
// Build the final chain after aggregation
|
|
557
|
+
// Chain: Map State → Aggregation → DynamoDB Update → [Enrichment] → [PostProcessing] → Cleanup → Move to Processed
|
|
558
|
+
let finalChain = cleanupStep
|
|
559
|
+
.addRetry({
|
|
560
|
+
errors: ['Lambda.ServiceException', 'Lambda.TooManyRequestsException'],
|
|
561
|
+
interval: aws_cdk_lib_1.Duration.seconds(2),
|
|
562
|
+
maxAttempts: 3,
|
|
563
|
+
backoffRate: 2,
|
|
564
|
+
})
|
|
565
|
+
.next(moveToProcessed);
|
|
566
|
+
// Add post-processing if provided (insert before cleanup)
|
|
567
|
+
if (postProcessingStep) {
|
|
568
|
+
const postProcessingErrorHandler = new aws_stepfunctions_tasks_1.DynamoUpdateItem(this, 'ChunkedPostProcessingFailDDBUpdate', {
|
|
569
|
+
table: this.documentProcessingTable,
|
|
570
|
+
key: {
|
|
571
|
+
DocumentId: aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.stringAt('$.documentId')),
|
|
572
|
+
},
|
|
573
|
+
updateExpression: 'SET WorkflowStatus = :newStatus',
|
|
574
|
+
expressionAttributeValues: {
|
|
575
|
+
':newStatus': aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString('post-processing-failure'),
|
|
576
|
+
},
|
|
577
|
+
resultPath: aws_stepfunctions_1.JsonPath.DISCARD,
|
|
578
|
+
}).next(this.ingressAdapter.createFailedChain(this, 'ChunkedPostProc'));
|
|
579
|
+
finalChain = postProcessingStep
|
|
580
|
+
.addCatch(postProcessingErrorHandler, {
|
|
581
|
+
resultPath: aws_stepfunctions_1.JsonPath.DISCARD,
|
|
582
|
+
})
|
|
583
|
+
.next(new aws_stepfunctions_tasks_1.DynamoUpdateItem(this, 'ChunkedPostProcessingSuccessUpdate', {
|
|
584
|
+
table: this.documentProcessingTable,
|
|
585
|
+
key: {
|
|
586
|
+
DocumentId: aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.stringAt('$.documentId')),
|
|
587
|
+
},
|
|
588
|
+
updateExpression: 'SET WorkflowStatus = :newStatus, PostProcessingResult = :postProcessingResult',
|
|
589
|
+
expressionAttributeValues: {
|
|
590
|
+
':newStatus': aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString('post-processing-complete'),
|
|
591
|
+
':postProcessingResult': aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.jsonToString(aws_stepfunctions_1.JsonPath.objectAt('$.postProcessedResult'))),
|
|
592
|
+
},
|
|
593
|
+
resultPath: aws_stepfunctions_1.JsonPath.DISCARD,
|
|
594
|
+
}).next(finalChain));
|
|
595
|
+
}
|
|
596
|
+
// Add enrichment if provided (insert before post-processing or cleanup)
|
|
597
|
+
if (enrichmentStep) {
|
|
598
|
+
const enrichmentErrorHandler = new aws_stepfunctions_tasks_1.DynamoUpdateItem(this, 'ChunkedEnrichmentFailDDBUpdate', {
|
|
599
|
+
table: this.documentProcessingTable,
|
|
600
|
+
key: {
|
|
601
|
+
DocumentId: aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.stringAt('$.documentId')),
|
|
602
|
+
},
|
|
603
|
+
updateExpression: 'SET WorkflowStatus = :newStatus',
|
|
604
|
+
expressionAttributeValues: {
|
|
605
|
+
':newStatus': aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString('enrichment-failure'),
|
|
606
|
+
},
|
|
607
|
+
resultPath: aws_stepfunctions_1.JsonPath.DISCARD,
|
|
608
|
+
}).next(this.ingressAdapter.createFailedChain(this, 'ChunkedEnrich'));
|
|
609
|
+
finalChain = enrichmentStep
|
|
610
|
+
.addCatch(enrichmentErrorHandler, {
|
|
611
|
+
resultPath: aws_stepfunctions_1.JsonPath.DISCARD,
|
|
612
|
+
})
|
|
613
|
+
.next(new aws_stepfunctions_tasks_1.DynamoUpdateItem(this, 'ChunkedEnrichmentSuccessUpdate', {
|
|
614
|
+
table: this.documentProcessingTable,
|
|
615
|
+
key: {
|
|
616
|
+
DocumentId: aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.stringAt('$.documentId')),
|
|
617
|
+
},
|
|
618
|
+
updateExpression: 'SET WorkflowStatus = :newStatus, EnrichmentResult = :enrichmentResult',
|
|
619
|
+
expressionAttributeValues: {
|
|
620
|
+
':newStatus': postProcessingStep
|
|
621
|
+
? aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString('enrichment-complete')
|
|
622
|
+
: aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString('complete'),
|
|
623
|
+
':enrichmentResult': aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.jsonToString(aws_stepfunctions_1.JsonPath.objectAt('$.enrichedResult'))),
|
|
624
|
+
},
|
|
625
|
+
resultPath: aws_stepfunctions_1.JsonPath.DISCARD,
|
|
626
|
+
}).next(finalChain));
|
|
627
|
+
}
|
|
628
|
+
// Chain: Map State → Aggregation → Normalize → DynamoDB Update → [Enrichment] → [PostProcessing] → Cleanup → Move to Processed
|
|
629
|
+
return mapState
|
|
630
|
+
.addCatch(aggregationErrorHandler, {
|
|
631
|
+
resultPath: '$.error',
|
|
632
|
+
})
|
|
633
|
+
.next(aggregationLambdaStep
|
|
634
|
+
.addCatch(aggregationErrorHandler, {
|
|
635
|
+
resultPath: '$.error',
|
|
636
|
+
})
|
|
637
|
+
.addRetry({
|
|
638
|
+
errors: ['Lambda.ServiceException', 'Lambda.TooManyRequestsException'],
|
|
639
|
+
interval: aws_cdk_lib_1.Duration.seconds(2),
|
|
640
|
+
maxAttempts: 3,
|
|
641
|
+
backoffRate: 2,
|
|
642
|
+
})
|
|
643
|
+
.next(normalizeState.next(updateAggregatedResultStep
|
|
644
|
+
.addRetry({
|
|
645
|
+
errors: ['DynamoDB.ProvisionedThroughputExceededException'],
|
|
646
|
+
interval: aws_cdk_lib_1.Duration.seconds(1),
|
|
647
|
+
maxAttempts: 3,
|
|
648
|
+
backoffRate: 2,
|
|
649
|
+
})
|
|
650
|
+
.next(finalChain))));
|
|
651
|
+
}
|
|
652
|
+
/**
|
|
653
|
+
* Creates the aggregation step for combining chunk results using Bedrock.
|
|
654
|
+
*
|
|
655
|
+
* Uses the same Bedrock invoke Lambda pattern as the processing step but with
|
|
656
|
+
* a different prompt designed for aggregating multiple chunk results.
|
|
657
|
+
* The chunk processing results are passed as text data to the model.
|
|
658
|
+
*
|
|
659
|
+
* @returns LambdaInvoke task for result aggregation
|
|
660
|
+
*/
|
|
661
|
+
createAggregationStep() {
|
|
662
|
+
// Create Lambda function only once (reuses bedrock-invoke pattern)
|
|
663
|
+
if (!this._aggregationFunction) {
|
|
664
|
+
const prompt = this.bedrockDocumentProcessingProps.aggregationPrompt || BedrockDocumentProcessing.DEFAULT_AGGREGATION_PROMPT;
|
|
665
|
+
const adjustedModelId = bedrock_1.BedrockModelUtils.deriveActualModelId(this.bedrockDocumentProcessingProps.processingBedrockModel);
|
|
666
|
+
const role = this.generateLambdaRoleForBedrock('AggregationLambdaRole', this.bedrockDocumentProcessingProps.processingBedrockModel);
|
|
667
|
+
const { region, account } = aws_cdk_lib_1.Stack.of(this);
|
|
668
|
+
const generatedLogPermissions = utilities_1.LambdaIamUtils.createLogsPermissions({
|
|
669
|
+
account,
|
|
670
|
+
functionName: 'bedrock-idp-aggregation',
|
|
671
|
+
region,
|
|
672
|
+
scope: this,
|
|
673
|
+
enableObservability: this.bedrockDocumentProcessingProps.enableObservability,
|
|
674
|
+
});
|
|
675
|
+
this.encryptionKey.grantEncryptDecrypt(role);
|
|
676
|
+
this._aggregationFunction = new aws_lambda_python_alpha_1.PythonFunction(this, 'BedrockAggregationFunction', {
|
|
677
|
+
functionName: generatedLogPermissions.uniqueFunctionName,
|
|
678
|
+
architecture: aws_lambda_1.Architecture.X86_64,
|
|
679
|
+
runtime: framework_1.DefaultRuntimes.PYTHON,
|
|
680
|
+
entry: path.join(__dirname, 'resources/default-bedrock-invoke'),
|
|
681
|
+
role,
|
|
682
|
+
memorySize: 1024,
|
|
683
|
+
timeout: this.bedrockDocumentProcessingProps.stepTimeouts || aws_cdk_lib_1.Duration.minutes(5),
|
|
684
|
+
environment: {
|
|
685
|
+
MODEL_ID: adjustedModelId,
|
|
686
|
+
PROMPT: prompt,
|
|
687
|
+
INVOKE_TYPE: 'aggregation',
|
|
688
|
+
INVOKE_MAX_TOKENS: '64000', // Aggregation may need more tokens for merged output
|
|
689
|
+
...powertools_config_1.PowertoolsConfig.generateDefaultLambdaConfig(this.bedrockDocumentProcessingProps.enableObservability, this.metricNamespace, this.metricServiceName),
|
|
690
|
+
},
|
|
691
|
+
environmentEncryption: this.encryptionKey,
|
|
692
|
+
vpc: this.bedrockDocumentProcessingProps.network
|
|
693
|
+
? this.bedrockDocumentProcessingProps.network.vpc
|
|
694
|
+
: undefined,
|
|
695
|
+
vpcSubnets: this.bedrockDocumentProcessingProps.network
|
|
696
|
+
? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection()
|
|
697
|
+
: undefined,
|
|
698
|
+
});
|
|
699
|
+
for (const statement of generatedLogPermissions.policyStatements) {
|
|
700
|
+
this._aggregationFunction.role?.addToPrincipalPolicy(statement);
|
|
701
|
+
}
|
|
702
|
+
if (this.bedrockDocumentProcessingProps.network) {
|
|
703
|
+
this._aggregationFunction.role?.addToPrincipalPolicy(utilities_1.LambdaIamUtils.generateLambdaVPCPermissions());
|
|
704
|
+
}
|
|
705
|
+
}
|
|
706
|
+
// Always create a new LambdaInvoke task to allow proper state chaining
|
|
707
|
+
const stepId = `AggregationStep-${this._aggregationStepCounter}`;
|
|
708
|
+
this._aggregationStepCounter++;
|
|
709
|
+
// Pass chunk results as data content - the Lambda will format them for Bedrock
|
|
710
|
+
return new aws_stepfunctions_tasks_1.LambdaInvoke(this, stepId, {
|
|
711
|
+
lambdaFunction: this._aggregationFunction,
|
|
712
|
+
payload: aws_stepfunctions_1.TaskInput.fromObject({
|
|
713
|
+
'documentId.$': '$.documentId',
|
|
714
|
+
'contentType': 'data',
|
|
715
|
+
'content': {
|
|
716
|
+
// Pass the chunk results as JSON string for the Lambda to process
|
|
717
|
+
'data.$': 'States.JsonToString($.chunkResults)',
|
|
718
|
+
},
|
|
719
|
+
}),
|
|
720
|
+
// Store in both aggregatedResult AND processingResult for consistency with non-chunked flow
|
|
721
|
+
// This allows enrichment/post-processing steps to use $.processingResult regardless of chunking
|
|
722
|
+
resultPath: '$.aggregatedResult',
|
|
723
|
+
resultSelector: {
|
|
724
|
+
'result.$': '$.Payload.result',
|
|
725
|
+
},
|
|
726
|
+
});
|
|
727
|
+
}
|
|
728
|
+
/**
|
|
729
|
+
* Creates the DynamoDB update step for storing aggregated results.
|
|
730
|
+
*
|
|
731
|
+
* Updates the document record with:
|
|
732
|
+
* - AggregatedResult: JSON string with classification, entities, and summary
|
|
733
|
+
* - WorkflowStatus: 'complete'
|
|
734
|
+
*
|
|
735
|
+
* @returns DynamoUpdateItem task for storing aggregated results
|
|
736
|
+
*/
|
|
737
|
+
createUpdateAggregatedResultStep() {
|
|
738
|
+
return new aws_stepfunctions_tasks_1.DynamoUpdateItem(this, 'StoreAggregatedResult', {
|
|
739
|
+
table: this.documentProcessingTable,
|
|
740
|
+
key: {
|
|
741
|
+
DocumentId: aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.stringAt('$.documentId')),
|
|
742
|
+
},
|
|
743
|
+
updateExpression: 'SET AggregatedResult = :result, WorkflowStatus = :status',
|
|
744
|
+
expressionAttributeValues: {
|
|
745
|
+
':result': aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.jsonToString(aws_stepfunctions_1.JsonPath.objectAt('$.aggregatedResult'))),
|
|
746
|
+
':status': aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString('complete'),
|
|
747
|
+
},
|
|
748
|
+
resultPath: aws_stepfunctions_1.JsonPath.DISCARD,
|
|
749
|
+
});
|
|
750
|
+
}
|
|
751
|
+
/**
|
|
752
|
+
* Creates the cleanup Lambda step for removing temporary chunk files.
|
|
753
|
+
*
|
|
754
|
+
* The cleanup Lambda:
|
|
755
|
+
* - Deletes all chunk files from S3 chunks/ prefix
|
|
756
|
+
* - Uses batch delete for efficiency (up to 1000 objects per request)
|
|
757
|
+
* - Logs errors but doesn't fail the workflow
|
|
758
|
+
*
|
|
759
|
+
* @returns LambdaInvoke task for chunk cleanup
|
|
760
|
+
*/
|
|
761
|
+
createCleanupStep() {
|
|
762
|
+
// Create Lambda function only once
|
|
763
|
+
if (!this._cleanupFunction) {
|
|
764
|
+
const { region, account } = aws_cdk_lib_1.Stack.of(this);
|
|
765
|
+
const role = new aws_iam_1.Role(this, 'CleanupLambdaRole', {
|
|
766
|
+
assumedBy: new aws_iam_1.ServicePrincipal('lambda.amazonaws.com'),
|
|
767
|
+
inlinePolicies: {
|
|
768
|
+
CleanupPolicy: new aws_iam_1.PolicyDocument({
|
|
769
|
+
statements: [
|
|
770
|
+
// S3 access for deleting chunks only - least privilege
|
|
771
|
+
...this.ingressAdapter.generateAdapterIAMPolicies(['s3:DeleteObject'], true),
|
|
772
|
+
],
|
|
773
|
+
}),
|
|
774
|
+
},
|
|
775
|
+
});
|
|
776
|
+
const generatedLogPermissions = utilities_1.LambdaIamUtils.createLogsPermissions({
|
|
777
|
+
account,
|
|
778
|
+
functionName: 'bedrock-idp-cleanup',
|
|
779
|
+
region,
|
|
780
|
+
scope: this,
|
|
781
|
+
enableObservability: this.bedrockDocumentProcessingProps.enableObservability,
|
|
782
|
+
});
|
|
783
|
+
this.encryptionKey.grantEncryptDecrypt(role);
|
|
784
|
+
this._cleanupFunction = new aws_lambda_python_alpha_1.PythonFunction(this, 'CleanupFunction', {
|
|
785
|
+
functionName: generatedLogPermissions.uniqueFunctionName,
|
|
786
|
+
entry: path.join(__dirname, 'resources/cleanup'),
|
|
787
|
+
index: 'handler.py',
|
|
788
|
+
handler: 'handler',
|
|
789
|
+
runtime: framework_1.DefaultRuntimes.PYTHON,
|
|
790
|
+
architecture: aws_lambda_1.Architecture.X86_64,
|
|
791
|
+
role,
|
|
792
|
+
memorySize: 512,
|
|
793
|
+
timeout: aws_cdk_lib_1.Duration.minutes(5),
|
|
794
|
+
environment: {
|
|
795
|
+
...powertools_config_1.PowertoolsConfig.generateDefaultLambdaConfig(this.bedrockDocumentProcessingProps.enableObservability, this.metricNamespace, this.metricServiceName),
|
|
796
|
+
},
|
|
797
|
+
environmentEncryption: this.encryptionKey,
|
|
798
|
+
vpc: this.bedrockDocumentProcessingProps.network
|
|
799
|
+
? this.bedrockDocumentProcessingProps.network.vpc
|
|
800
|
+
: undefined,
|
|
801
|
+
vpcSubnets: this.bedrockDocumentProcessingProps.network
|
|
802
|
+
? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection()
|
|
803
|
+
: undefined,
|
|
804
|
+
});
|
|
805
|
+
for (const statement of generatedLogPermissions.policyStatements) {
|
|
806
|
+
this._cleanupFunction.role?.addToPrincipalPolicy(statement);
|
|
807
|
+
}
|
|
808
|
+
if (this.bedrockDocumentProcessingProps.network) {
|
|
809
|
+
this._cleanupFunction.role?.addToPrincipalPolicy(utilities_1.LambdaIamUtils.generateLambdaVPCPermissions());
|
|
810
|
+
}
|
|
811
|
+
}
|
|
812
|
+
return new aws_stepfunctions_tasks_1.LambdaInvoke(this, 'CleanupChunks', {
|
|
813
|
+
lambdaFunction: this._cleanupFunction,
|
|
814
|
+
payload: aws_stepfunctions_1.TaskInput.fromObject({
|
|
815
|
+
'documentId.$': '$.documentId',
|
|
816
|
+
'chunks.$': '$.chunkingResult.chunks',
|
|
817
|
+
}),
|
|
818
|
+
resultPath: aws_stepfunctions_1.JsonPath.DISCARD,
|
|
819
|
+
});
|
|
820
|
+
}
|
|
821
|
+
/**
|
|
822
|
+
* Creates the error handler for aggregation failures.
|
|
823
|
+
*
|
|
824
|
+
* When aggregation fails:
|
|
825
|
+
* - Updates DynamoDB with 'aggregation-failure' status
|
|
826
|
+
* - Moves document to failed/ prefix
|
|
827
|
+
*
|
|
828
|
+
* @returns Step Functions chain for handling aggregation errors
|
|
829
|
+
*/
|
|
830
|
+
createAggregationErrorHandler() {
|
|
831
|
+
const updateFailureStatus = new aws_stepfunctions_tasks_1.DynamoUpdateItem(this, 'AggregationFailDDBUpdate', {
|
|
832
|
+
table: this.documentProcessingTable,
|
|
833
|
+
key: {
|
|
834
|
+
DocumentId: aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString(aws_stepfunctions_1.JsonPath.stringAt('$.documentId')),
|
|
835
|
+
},
|
|
836
|
+
updateExpression: 'SET WorkflowStatus = :newStatus',
|
|
837
|
+
expressionAttributeValues: {
|
|
838
|
+
':newStatus': aws_stepfunctions_tasks_1.DynamoAttributeValue.fromString('aggregation-failure'),
|
|
839
|
+
},
|
|
840
|
+
resultPath: aws_stepfunctions_1.JsonPath.DISCARD,
|
|
841
|
+
});
|
|
842
|
+
// Use 'Chunked' prefix to avoid ID collisions with standard workflow
|
|
843
|
+
const moveToFailed = this.ingressAdapter.createFailedChain(this, 'Chunked');
|
|
844
|
+
return updateFailureStatus.next(moveToFailed);
|
|
845
|
+
}
|
|
228
846
|
}
|
|
229
847
|
exports.BedrockDocumentProcessing = BedrockDocumentProcessing;
|
|
230
848
|
_a = JSII_RTTI_SYMBOL_1;
|
|
231
|
-
BedrockDocumentProcessing[_a] = { fqn: "@cdklabs/cdk-appmod-catalog-blueprints.BedrockDocumentProcessing", version: "1.
|
|
849
|
+
BedrockDocumentProcessing[_a] = { fqn: "@cdklabs/cdk-appmod-catalog-blueprints.BedrockDocumentProcessing", version: "1.6.0" };
|
|
232
850
|
BedrockDocumentProcessing.DEFAULT_CLASSIFICATION_PROMPT = `
|
|
233
851
|
Analyze the document below, and classify the type of document it is (eg. INVOICE, IDENTITY_DOCUMENT, RECEIPT, etc). The result should be in JSON and should follow the following structure (only respond in JSON with the following structure and do not use markdown to indicate the json, just output plain old json with nothing else):
|
|
234
852
|
|
|
@@ -258,4 +876,26 @@ BedrockDocumentProcessing.DEFAULT_PROCESSING_PROMPT = `
|
|
|
258
876
|
Attached document is as follows:
|
|
259
877
|
|
|
260
878
|
`;
|
|
261
|
-
//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"bedrock-document-processing.js","sourceRoot":"","sources":["../../use-cases/document-processing/bedrock-document-processing.ts"],"names":[],"mappings":";;;;;AAAA,qEAAqE;AACrE,sCAAsC;AAEtC,6BAA6B;AAC7B,8EAAkE;AAClE,6CAA8C;AAC9C,iDAAqE;AACrE,iDAA6E;AAC7E,uDAAgE;AAEhE,iFAAmE;AAEnE,yEAA6H;AAC7H,4CAA+C;AAC/C,kDAA4E;AAC5E,4CAA8C;AAC9C,oFAAgF;AA6ChF;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA6BG;AACH,MAAa,yBAA0B,SAAQ,iDAAsB;IAqCnE;;;;;;;;;;OAUG;IACH,YAAY,KAAgB,EAAE,EAAU,EAAE,KAAqC;QAC7E,KAAK,CAAC,KAAK,EAAE,EAAE,EAAE,KAAK,CAAC,CAAC;QACxB,IAAI,KAAK,CAAC,OAAO,EAAE,CAAC;YAClB,KAAK,CAAC,OAAO,CAAC,qBAAqB,CAAC,cAAc,EAAE,wCAA8B,CAAC,OAAO,CAAC,CAAC;YAC5F,KAAK,CAAC,OAAO,CAAC,qBAAqB,CAAC,sBAAsB,EAAE,wCAA8B,CAAC,eAAe,CAAC,CAAC;QAC9G,CAAC;QAED,IAAI,CAAC,8BAA8B,GAAG,KAAK,CAAC;QAC5C,IAAI,CAAC,YAAY,GAAG,IAAI,CAAC,0BAA0B,CAAC,sCAAsC,CAAC,CAAC;IAC9F,CAAC;IAED;;;;;;;;OAQG;IACO,kBAAkB;QAC1B,MAAM,MAAM,GAAG,IAAI,CAAC,8BAA8B,CAAC,oBAAoB,IAAI,yBAAyB,CAAC,6BAA6B,CAAC;QACnI,MAAM,eAAe,GAAG,2BAAiB,CAAC,mBAAmB,CAAC,IAAI,CAAC,8BAA8B,CAAC,0BAA0B,CAAC,CAAC;QAC9H,MAAM,IAAI,GAAG,IAAI,CAAC,4BAA4B,CAAC,0BAA0B,EAAE,IAAI,CAAC,8BAA8B,CAAC,0BAA0B,CAAC,CAAC;QAC3I,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE,GAAG,mBAAK,CAAC,EAAE,CAAC,IAAI,CAAC,CAAC;QAC3C,MAAM,uBAAuB,GAAG,0BAAc,CAAC,qBAAqB,CAAC;YACnE,OAAO;YACP,YAAY,EAAE,4BAA4B;YAC1C,MAAM;YACN,KAAK,EAAE,IAAI;YACX,mBAAmB,EAAE,IAAI,CAAC,8BAA8B,CAAC,mBAAmB;SAC7E,CAAC,CAAC;QAEH,IAAI,CAAC,aAAa,CAAC,mBAAmB,CAAC,IAAI,CAAC,CAAC;QAE7C,MAAM,eAAe,GAAG,IAAI,wCAAc,CAAC,IAAI,EAAE,+BAA+B,EAAE;YAChF,YAAY,EAAE,uBAAuB,CAAC,kBAAkB;YACxD,YAAY,EAAE,yBAAY,CAAC,MAAM;YACjC,OAAO,EAAE,2BAAe,CAAC,MAAM;YAC/B,KAAK,EAAE,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,kCAAkC,CAAC;YAC/D,IAAI;YACJ,UAAU,EAAE,GAAG;YACf,OAAO,EAAE,IAAI,CAAC,8BAA8B,CAAC,YAAY,IAAI,sBAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;YAChF,WAAW,EAAE;gBACX,QAAQ,EAAE,eAAe;gBACzB,MAAM,EAAE,MAAM;gBACd,WAAW,EAAE,gBAAgB;gBAC7B,GAAG,oCAAgB,CAAC,2BAA2B,CAC7C,IAAI,CAAC,8BAA8B,CAAC,mBAAmB,EACvD,IAAI,CAAC,eAAe,EACpB,IAAI,CAAC,iBAAiB,CACvB;aACF;YACD,qBAAqB,EAAE,IAAI,CAAC,aAAa;YACzC,GAAG,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC,SAAS;YAC9G,UAAU,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,0BAA0B,EAAE,CAAC,CAAC,CAAC,SAAS;SAC/I,CAAC,CAAC;QAEH,KAAK,MAAM,SAAS,IAAI,uBAAuB,CAAC,gBAAgB,EAAE,CAAC;YACjE,eAAe,CAAC,IAAI,EAAE,oBAAoB,CAAC,SAAS,CAAC,CAAC;QACxD,CAAC;QAED,IAAI,IAAI,CAAC,8BAA8B,CAAC,OAAO,EAAE,CAAC;YAChD,eAAe,CAAC,IAAI,EAAE,oBAAoB,CAAC,0BAAc,CAAC,4BAA4B,EAAE,CAAC,CAAC;QAC5F,CAAC;QAED,OAAO,IAAI,sCAAY,CAAC,IAAI,EAAE,oBAAoB,EAAE;YAClD,cAAc,EAAE,eAAe;YAC/B,UAAU,EAAE,wBAAwB;YACpC,cAAc,EAAE;gBACd,0BAA0B,EAAE,kCAAkC;aAC/D;SACF,CAAC,CAAC;IACL,CAAC;IAED;;;;;;;;OAQG;IACO,cAAc;QACtB,MAAM,MAAM,GAAG,IAAI,CAAC,8BAA8B,CAAC,gBAAgB,IAAI,yBAAyB,CAAC,yBAAyB,CAAC;QAC3H,MAAM,eAAe,GAAG,2BAAiB,CAAC,mBAAmB,CAAC,IAAI,CAAC,8BAA8B,CAAC,sBAAsB,CAAC,CAAC;QAC1H,MAAM,IAAI,GAAG,IAAI,CAAC,4BAA4B,CAAC,sBAAsB,EAAE,IAAI,CAAC,8BAA8B,CAAC,sBAAsB,CAAC,CAAC;QACnI,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE,GAAG,mBAAK,CAAC,EAAE,CAAC,IAAI,CAAC,CAAC;QAE3C,MAAM,uBAAuB,GAAG,0BAAc,CAAC,qBAAqB,CAAC;YACnE,OAAO;YACP,YAAY,EAAE,wBAAwB;YACtC,MAAM;YACN,KAAK,EAAE,IAAI;SACZ,CAAC,CAAC;QACH,IAAI,CAAC,aAAa,CAAC,mBAAmB,CAAC,IAAI,CAAC,CAAC;QAC7C,MAAM,eAAe,GAAG,IAAI,wCAAc,CAAC,IAAI,EAAE,2BAA2B,EAAE;YAC5E,YAAY,EAAE,uBAAuB,CAAC,kBAAkB;YACxD,OAAO,EAAE,2BAAe,CAAC,MAAM;YAC/B,YAAY,EAAE,yBAAY,CAAC,MAAM;YACjC,KAAK,EAAE,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,kCAAkC,CAAC;YAC/D,IAAI;YACJ,UAAU,EAAE,GAAG;YACf,OAAO,EAAE,IAAI,CAAC,8BAA8B,CAAC,YAAY,IAAI,sBAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;YAChF,WAAW,EAAE;gBACX,QAAQ,EAAE,eAAe;gBACzB,MAAM,EAAE,MAAM;gBACd,WAAW,EAAE,YAAY;gBACzB,GAAG,oCAAgB,CAAC,2BAA2B,CAC7C,IAAI,CAAC,8BAA8B,CAAC,mBAAmB,EACvD,IAAI,CAAC,eAAe,EACpB,IAAI,CAAC,iBAAiB,CACvB;aACF;YACD,qBAAqB,EAAE,IAAI,CAAC,aAAa;YACzC,GAAG,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC,SAAS;YAC9G,UAAU,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,0BAA0B,EAAE,CAAC,CAAC,CAAC,SAAS;SAC/I,CAAC,CAAC;QAEH,KAAK,MAAM,SAAS,IAAI,uBAAuB,CAAC,gBAAgB,EAAE,CAAC;YACjE,eAAe,CAAC,IAAI,EAAE,oBAAoB,CAAC,SAAS,CAAC,CAAC;QACxD,CAAC;QAED,IAAI,IAAI,CAAC,8BAA8B,CAAC,OAAO,EAAE,CAAC;YAChD,eAAe,CAAC,IAAI,EAAE,oBAAoB,CAAC,0BAAc,CAAC,4BAA4B,EAAE,CAAC,CAAC;QAC5F,CAAC;QAED,OAAO,IAAI,sCAAY,CAAC,IAAI,EAAE,gBAAgB,EAAE;YAC9C,cAAc,EAAE,eAAe;YAC/B,UAAU,EAAE,oBAAoB;YAChC,cAAc,EAAE;gBACd,0BAA0B,EAAE,kCAAkC;gBAC9D,UAAU,EAAE,kBAAkB;aAC/B;SACF,CAAC,CAAC;IACL,CAAC;IAES,4BAA4B,CAAC,EAAU,EAAE,KAAyB;QAC1E,OAAO,IAAI,cAAI,CAAC,IAAI,EAAE,EAAE,EAAE;YACxB,SAAS,EAAE,IAAI,0BAAgB,CAAC,sBAAsB,CAAC;YACvD,cAAc,EAAE;gBACd,mBAAmB,EAAE,IAAI,wBAAc,CAAC;oBACtC,UAAU,EAAE;wBACV,GAAG,IAAI,CAAC,cAAc,CAAC,0BAA0B,EAAE;wBACnD,2BAAiB,CAAC,2BAA2B,CAAC,IAAI,EAAE,KAAK,CAAC;qBAC3D;iBACF,CAAC;aACH;SACF,CAAC,CAAC;IACL,CAAC;IAED;;;;;;;;OAQG;IACO,cAAc;QACtB,IAAI,CAAC,IAAI,CAAC,8BAA8B,CAAC,wBAAwB,EAAE,CAAC;YAClE,OAAO,SAAS,CAAC;QACnB,CAAC;QAED,OAAO,IAAI,sCAAY,CAAC,IAAI,EAAE,gBAAgB,EAAE;YAC9C,cAAc,EAAE,IAAI,CAAC,8BAA8B,CAAC,wBAAwB;YAC5E,UAAU,EAAE,kBAAkB;SAC/B,CAAC,CAAC;IACL,CAAC;IAED;;;;;;;;OAQG;IACO,kBAAkB;QAC1B,IAAI,CAAC,IAAI,CAAC,8BAA8B,CAAC,4BAA4B,EAAE,CAAC;YACtE,OAAO,SAAS,CAAC;QACnB,CAAC;QAED,OAAO,IAAI,sCAAY,CAAC,IAAI,EAAE,oBAAoB,EAAE;YAClD,cAAc,EAAE,IAAI,CAAC,8BAA8B,CAAC,4BAA4B;YAChF,UAAU,EAAE,uBAAuB;SACpC,CAAC,CAAC;IACL,CAAC;;AA9OH,8DA+OC;;;AA9O2B,uDAA6B,GAAG;;;;;;;;;GASzD,CAAC;AAEwB,mDAAyB,GAAG;;;;;;;;;;;;;;;;;;GAkBrD,CAAC","sourcesContent":["// Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.\n// SPDX-License-Identifier: Apache-2.0\n\nimport * as path from 'path';\nimport { PythonFunction } from '@aws-cdk/aws-lambda-python-alpha';\nimport { Duration, Stack } from 'aws-cdk-lib';\nimport { InterfaceVpcEndpointAwsService } from 'aws-cdk-lib/aws-ec2';\nimport { Role, ServicePrincipal, PolicyDocument } from 'aws-cdk-lib/aws-iam';\nimport { Function, Architecture } from 'aws-cdk-lib/aws-lambda';\nimport { StateMachine } from 'aws-cdk-lib/aws-stepfunctions';\nimport { LambdaInvoke } from 'aws-cdk-lib/aws-stepfunctions-tasks';\nimport { Construct } from 'constructs';\nimport { BaseDocumentProcessing, BaseDocumentProcessingProps, DocumentProcessingStepType } from './base-document-processing';\nimport { DefaultRuntimes } from '../framework';\nimport { BedrockModelProps, BedrockModelUtils } from '../framework/bedrock';\nimport { LambdaIamUtils } from '../utilities';\nimport { PowertoolsConfig } from '../utilities/observability/powertools-config';\n\n/**\n * Configuration properties for BedrockDocumentProcessing construct.\n * Extends BaseDocumentProcessingProps with Bedrock-specific options.\n */\nexport interface BedrockDocumentProcessingProps extends BaseDocumentProcessingProps {\n  /**\n   * Bedrock foundation model for document classification step.\n   */\n  readonly classificationBedrockModel?: BedrockModelProps;\n\n  /**\n   * Bedrock foundation model for document extraction step.\n   */\n  readonly processingBedrockModel?: BedrockModelProps;\n  /**\n   * Custom prompt template for document classification.\n   * Must include placeholder for document content.\n   * @default DEFAULT_CLASSIFICATION_PROMPT\n   */\n  readonly classificationPrompt?: string;\n  /**\n   * Custom prompt template for document extraction.\n   * Must include placeholder for document content and classification result.\n   * @default DEFAULT_EXTRACTION_PROMPT\n   */\n  readonly processingPrompt?: string;\n  /**\n   * Optional Lambda function for document enrichment step.\n   * If provided, will be invoked after extraction with workflow state.\n   */\n  readonly enrichmentLambdaFunction?: Function;\n  /**\n   * Optional Lambda function for post-processing step.\n   * If provided, will be invoked after enrichment with workflow state.\n   */\n  readonly postProcessingLambdaFunction?: Function;\n  /**\n   * Timeout for individual Step Functions tasks (classification, extraction, etc.).\n   * @default Duration.minutes(5)\n   */\n  readonly stepTimeouts?: Duration;\n}\n\n/**\n * Document processing workflow powered by Amazon Bedrock foundation models.\n *\n * Extends BaseDocumentProcessing to provide AI-powered document classification and extraction\n * using Amazon Bedrock foundation models. This implementation offers:\n *\n * ## Key Features\n * - **AI-Powered Classification**: Uses Claude 3.7 Sonnet (configurable) to classify document types\n * - **Intelligent Extraction**: Extracts structured data from documents using foundation models\n * - **Cross-Region Inference**: Optional support for improved availability via inference profiles\n * - **Flexible Processing**: Optional enrichment and post-processing Lambda functions\n * - **Cost Optimized**: Configurable timeouts and model selection for cost control\n *\n * ## Processing Workflow\n * S3 Upload → Classification (Bedrock) → Extraction (Bedrock) → [Enrichment] → [Post-Processing] → Results\n *\n * ## Default Models\n * - Classification: Claude 3.7 Sonnet (anthropic.claude-3-7-sonnet-20250219-v1:0)\n * - Extraction: Claude 3.7 Sonnet (anthropic.claude-3-7-sonnet-20250219-v1:0)\n *\n * ## Prompt Templates\n * The construct uses default prompts that can be customized:\n * - **Classification**: Analyzes document and returns JSON with documentClassification field\n * - **Extraction**: Uses classification result to extract entities in structured JSON format\n *\n * ## Cross-Region Inference\n * When enabled, uses Bedrock inference profiles for improved availability:\n * - US prefix: Routes to US-based regions for lower latency\n * - EU prefix: Routes to EU-based regions for data residency compliance\n */\nexport class BedrockDocumentProcessing extends BaseDocumentProcessing {\n  protected static readonly DEFAULT_CLASSIFICATION_PROMPT = `\n  Analyze the document below, and classify the type of document it is (eg. INVOICE, IDENTITY_DOCUMENT, RECEIPT, etc). The result should be in JSON and should follow the following structure (only respond in JSON with the following structure and do not use markdown to indicate the json, just output plain old json with nothing else):\n\n  {\n      documentClassification: <CLASSIFICATION>\n  }\n\n  Attached document is as follows:\n\n  `;\n\n  protected static readonly DEFAULT_PROCESSING_PROMPT = `\n  The document below has been classified as [ACTUAL_CLASSIFICATION]. Extract important entities from the document and return the result as JSON following the structure below (only respond in JSON with the following structure and do not use markdown to indicate the json, just output plain old json with nothing else):\n\n  {\n      documentClassification: <CLASSIFICATION>,\n      result: {\n        entities: [\n            {\n                type: <TYPE OF ENTITY>\n                value: <VALUE OF ENTITY>\n            },\n            ...\n        ]\n      }\n  }\n\n  Attached document is as follows:\n\n  `;\n\n  /** Configuration properties specific to Bedrock document processing */\n  protected readonly bedrockDocumentProcessingProps: BedrockDocumentProcessingProps;\n  /** The Step Functions state machine that orchestrates the document processing workflow */\n  readonly stateMachine: StateMachine;\n\n  /**\n   * Creates a new BedrockDocumentProcessing construct.\n   *\n   * Initializes the Bedrock-powered document processing pipeline with AI classification\n   * and extraction capabilities. Creates Lambda functions with appropriate IAM roles\n   * for Bedrock model invocation and S3 access.\n   *\n   * @param scope - The scope in which to define this construct\n   * @param id - The scoped construct ID. Must be unique within the scope.\n   * @param props - Configuration properties for the Bedrock document processing pipeline\n   */\n  constructor(scope: Construct, id: string, props: BedrockDocumentProcessingProps) {\n    super(scope, id, props);\n    if (props.network) {\n      props.network.createServiceEndpoint('vpce-bedrock', InterfaceVpcEndpointAwsService.BEDROCK);\n      props.network.createServiceEndpoint('vpce-bedrock-runtime', InterfaceVpcEndpointAwsService.BEDROCK_RUNTIME);\n    }\n\n    this.bedrockDocumentProcessingProps = props;\n    this.stateMachine = this.handleStateMachineCreation('bedrock-document-processing-workflow');\n  }\n\n  /**\n   * Implements the document classification step using Amazon Bedrock.\n   *\n   * Creates a Lambda function that invokes the configured Bedrock model to classify\n   * the document type. The function reads the document from S3 and sends it to\n   * Bedrock with the classification prompt.\n   *\n   * @returns LambdaInvoke task configured for document classification\n   */\n  protected classificationStep(): DocumentProcessingStepType {\n    const prompt = this.bedrockDocumentProcessingProps.classificationPrompt || BedrockDocumentProcessing.DEFAULT_CLASSIFICATION_PROMPT;\n    const adjustedModelId = BedrockModelUtils.deriveActualModelId(this.bedrockDocumentProcessingProps.classificationBedrockModel);\n    const role = this.generateLambdaRoleForBedrock('ClassificationLambdaRole', this.bedrockDocumentProcessingProps.classificationBedrockModel);\n    const { region, account } = Stack.of(this);\n    const generatedLogPermissions = LambdaIamUtils.createLogsPermissions({\n      account,\n      functionName: 'bedrock-idp-classification',\n      region,\n      scope: this,\n      enableObservability: this.bedrockDocumentProcessingProps.enableObservability,\n    });\n\n    this.encryptionKey.grantEncryptDecrypt(role);\n\n    const bedrockFunction = new PythonFunction(this, 'BedrockClassificationFunction', {\n      functionName: generatedLogPermissions.uniqueFunctionName,\n      architecture: Architecture.X86_64,\n      runtime: DefaultRuntimes.PYTHON,\n      entry: path.join(__dirname, 'resources/default-bedrock-invoke'),\n      role,\n      memorySize: 512,\n      timeout: this.bedrockDocumentProcessingProps.stepTimeouts || Duration.minutes(5),\n      environment: {\n        MODEL_ID: adjustedModelId,\n        PROMPT: prompt,\n        INVOKE_TYPE: 'classification',\n        ...PowertoolsConfig.generateDefaultLambdaConfig(\n          this.bedrockDocumentProcessingProps.enableObservability,\n          this.metricNamespace,\n          this.metricServiceName,\n        ),\n      },\n      environmentEncryption: this.encryptionKey,\n      vpc: this.bedrockDocumentProcessingProps.network ? this.bedrockDocumentProcessingProps.network.vpc : undefined,\n      vpcSubnets: this.bedrockDocumentProcessingProps.network ? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection() : undefined,\n    });\n\n    for (const statement of generatedLogPermissions.policyStatements) {\n      bedrockFunction.role?.addToPrincipalPolicy(statement);\n    }\n\n    if (this.bedrockDocumentProcessingProps.network) {\n      bedrockFunction.role?.addToPrincipalPolicy(LambdaIamUtils.generateLambdaVPCPermissions());\n    }\n\n    return new LambdaInvoke(this, 'ClassificationStep', {\n      lambdaFunction: bedrockFunction,\n      resultPath: '$.classificationResult',\n      resultSelector: {\n        'documentClassification.$': '$.Payload.documentClassification',\n      },\n    });\n  }\n\n  /**\n   * Implements the document extraction step using Amazon Bedrock.\n   *\n   * Creates a Lambda function that invokes the configured Bedrock model to extract\n   * structured data from the document. Uses the classification result from the\n   * previous step to provide context for more accurate extraction.\n   *\n   * @returns LambdaInvoke task configured for document extraction\n   */\n  protected processingStep(): DocumentProcessingStepType {\n    const prompt = this.bedrockDocumentProcessingProps.processingPrompt || BedrockDocumentProcessing.DEFAULT_PROCESSING_PROMPT;\n    const adjustedModelId = BedrockModelUtils.deriveActualModelId(this.bedrockDocumentProcessingProps.processingBedrockModel);\n    const role = this.generateLambdaRoleForBedrock('ProcessingLambdaRole', this.bedrockDocumentProcessingProps.processingBedrockModel);\n    const { region, account } = Stack.of(this);\n\n    const generatedLogPermissions = LambdaIamUtils.createLogsPermissions({\n      account,\n      functionName: 'bedrock-idp-processing',\n      region,\n      scope: this,\n    });\n    this.encryptionKey.grantEncryptDecrypt(role);\n    const bedrockFunction = new PythonFunction(this, 'BedrockExtractionFunction', {\n      functionName: generatedLogPermissions.uniqueFunctionName,\n      runtime: DefaultRuntimes.PYTHON,\n      architecture: Architecture.X86_64,\n      entry: path.join(__dirname, 'resources/default-bedrock-invoke'),\n      role,\n      memorySize: 512,\n      timeout: this.bedrockDocumentProcessingProps.stepTimeouts || Duration.minutes(5),\n      environment: {\n        MODEL_ID: adjustedModelId,\n        PROMPT: prompt,\n        INVOKE_TYPE: 'processing',\n        ...PowertoolsConfig.generateDefaultLambdaConfig(\n          this.bedrockDocumentProcessingProps.enableObservability,\n          this.metricNamespace,\n          this.metricServiceName,\n        ),\n      },\n      environmentEncryption: this.encryptionKey,\n      vpc: this.bedrockDocumentProcessingProps.network ? this.bedrockDocumentProcessingProps.network.vpc : undefined,\n      vpcSubnets: this.bedrockDocumentProcessingProps.network ? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection() : undefined,\n    });\n\n    for (const statement of generatedLogPermissions.policyStatements) {\n      bedrockFunction.role?.addToPrincipalPolicy(statement);\n    }\n\n    if (this.bedrockDocumentProcessingProps.network) {\n      bedrockFunction.role?.addToPrincipalPolicy(LambdaIamUtils.generateLambdaVPCPermissions());\n    }\n\n    return new LambdaInvoke(this, 'ProcessingStep', {\n      lambdaFunction: bedrockFunction,\n      resultPath: '$.processingResult',\n      resultSelector: {\n        'documentClassification.$': '$.Payload.documentClassification',\n        'result.$': '$.Payload.result',\n      },\n    });\n  }\n\n  protected generateLambdaRoleForBedrock(id: string, model?: BedrockModelProps) {\n    return new Role(this, id, {\n      assumedBy: new ServicePrincipal('lambda.amazonaws.com'),\n      inlinePolicies: {\n        BedrockInvokePolicy: new PolicyDocument({\n          statements: [\n            ...this.ingressAdapter.generateAdapterIAMPolicies(),\n            BedrockModelUtils.generateModelIAMPermissions(this, model),\n          ],\n        }),\n      },\n    });\n  }\n\n  /**\n   * Implements the optional document enrichment step.\n   *\n   * If an enrichment Lambda function is provided in the props, creates a LambdaInvoke\n   * task to perform additional processing on the extracted data. This step is useful\n   * for data validation, transformation, or integration with external systems.\n   *\n   * @returns LambdaInvoke task for enrichment, or undefined to skip this step\n   */\n  protected enrichmentStep(): DocumentProcessingStepType | undefined {\n    if (!this.bedrockDocumentProcessingProps.enrichmentLambdaFunction) {\n      return undefined;\n    }\n\n    return new LambdaInvoke(this, 'EnrichmentStep', {\n      lambdaFunction: this.bedrockDocumentProcessingProps.enrichmentLambdaFunction,\n      resultPath: '$.enrichedResult',\n    });\n  }\n\n  /**\n   * Implements the optional post-processing step.\n   *\n   * If a post-processing Lambda function is provided in the props, creates a LambdaInvoke\n   * task to perform final processing on the workflow results. This step is useful for\n   * data formatting, notifications, or integration with downstream systems.\n   *\n   * @returns LambdaInvoke task for post-processing, or undefined to skip this step\n   */\n  protected postProcessingStep(): DocumentProcessingStepType | undefined {\n    if (!this.bedrockDocumentProcessingProps.postProcessingLambdaFunction) {\n      return undefined;\n    }\n\n    return new LambdaInvoke(this, 'PostProcessingStep', {\n      lambdaFunction: this.bedrockDocumentProcessingProps.postProcessingLambdaFunction,\n      resultPath: '$.postProcessedResult',\n    });\n  }\n}"]}
|
|
879
|
+
BedrockDocumentProcessing.DEFAULT_AGGREGATION_PROMPT = `
|
|
880
|
+
You are given the processing results from multiple chunks of a large document that was split for processing.
|
|
881
|
+
Your task is to synthesize these chunk results into a single, coherent final result.
|
|
882
|
+
|
|
883
|
+
Instructions:
|
|
884
|
+
1. Review all the chunk results provided below
|
|
885
|
+
2. Merge and deduplicate any overlapping information (chunks may have overlapping pages)
|
|
886
|
+
3. Synthesize the information into a unified, coherent result
|
|
887
|
+
4. Maintain the same output format as the individual chunk results
|
|
888
|
+
5. If the chunks contain summaries, create a comprehensive summary that covers all sections
|
|
889
|
+
6. If the chunks contain entities, deduplicate and consolidate them
|
|
890
|
+
7. Preserve important details from each chunk while avoiding redundancy
|
|
891
|
+
|
|
892
|
+
Return the result as JSON (only respond in JSON without markdown formatting):
|
|
893
|
+
|
|
894
|
+
{
|
|
895
|
+
"result": <SYNTHESIZED_RESULT>
|
|
896
|
+
}
|
|
897
|
+
|
|
898
|
+
The chunk results to aggregate are as follows:
|
|
899
|
+
|
|
900
|
+
`;
|
|
901
|
+
//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"bedrock-document-processing.js","sourceRoot":"","sources":["../../use-cases/document-processing/bedrock-document-processing.ts"],"names":[],"mappings":";;;;;AAAA,qEAAqE;AACrE,sCAAsC;AAEtC,6BAA6B;AAC7B,8EAAkE;AAClE,6CAA8C;AAC9C,iDAAqE;AACrE,iDAA6E;AAC7E,uDAAgE;AAChE,qEAA8G;AAC9G,iFAA2G;AAE3G,yEAA6H;AAE7H,4CAA+C;AAC/C,kDAA4E;AAC5E,4CAA8C;AAC9C,oFAAgF;AAoHhF;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA6BG;AACH,MAAa,yBAA0B,SAAQ,iDAAsB;IA+EnE;;;;;;;;;;;OAWG;IACH,YAAY,KAAgB,EAAE,EAAU,EAAE,KAAqC;QAC7E,KAAK,CAAC,KAAK,EAAE,EAAE,EAAE,KAAK,CAAC,CAAC;QA7B1B,4DAA4D;QACpD,+BAA0B,GAAG,CAAC,CAAC;QACvC,wDAAwD;QAChD,2BAAsB,GAAG,CAAC,CAAC;QAGnC,yDAAyD;QACjD,4BAAuB,GAAG,CAAC,CAAC;QAGpC,wDAAwD;QAChD,2BAAsB,GAAG,CAAC,CAAC;QACnC,6DAA6D;QACrD,+BAA0B,GAAG,CAAC,CAAC;QAkBrC,8CAA8C;QAC9C,IAAI,KAAK,CAAC,cAAc,IAAI,KAAK,CAAC,cAAc,EAAE,CAAC;YACjD,IAAI,CAAC,sBAAsB,CAAC,KAAK,CAAC,cAAc,CAAC,CAAC;QACpD,CAAC;QAED,IAAI,KAAK,CAAC,OAAO,EAAE,CAAC;YAClB,KAAK,CAAC,OAAO,CAAC,qBAAqB,CAAC,cAAc,EAAE,wCAA8B,CAAC,OAAO,CAAC,CAAC;YAC5F,KAAK,CAAC,OAAO,CAAC,qBAAqB,CAAC,sBAAsB,EAAE,wCAA8B,CAAC,eAAe,CAAC,CAAC;QAC9G,CAAC;QAED,IAAI,CAAC,8BAA8B,GAAG,KAAK,CAAC;QAC5C,IAAI,CAAC,YAAY,GAAG,IAAI,CAAC,0BAA0B,CAAC,sCAAsC,CAAC,CAAC;IAC9F,CAAC;IAED;;;;;;;;;;;;OAYG;IACK,sBAAsB,CAAC,MAAsB;QACnD,iDAAiD;QACjD,IAAI,MAAM,CAAC,SAAS,KAAK,SAAS,EAAE,CAAC;YACnC,IAAI,MAAM,CAAC,SAAS,IAAI,CAAC,EAAE,CAAC;gBAC1B,MAAM,IAAI,KAAK,CAAC,mEAAmE,CAAC,CAAC;YACvF,CAAC;QACH,CAAC;QAED,oDAAoD;QACpD,IAAI,MAAM,CAAC,YAAY,KAAK,SAAS,EAAE,CAAC;YACtC,IAAI,MAAM,CAAC,YAAY,GAAG,CAAC,EAAE,CAAC;gBAC5B,MAAM,IAAI,KAAK,CAAC,oEAAoE,CAAC,CAAC;YACxF,CAAC;YACD,MAAM,kBAAkB,GAAG,MAAM,CAAC,SAAS,IAAI,EAAE,CAAC,CAAC,qBAAqB;YACxE,IAAI,MAAM,CAAC,YAAY,IAAI,kBAAkB,EAAE,CAAC;gBAC9C,MAAM,IAAI,KAAK,CAAC,2EAA2E,CAAC,CAAC;YAC/F,CAAC;QACH,CAAC;QAED,0BAA0B;QAC1B,IAAI,MAAM,CAAC,aAAa,KAAK,SAAS,IAAI,MAAM,CAAC,aAAa,IAAI,CAAC,EAAE,CAAC;YACpE,MAAM,IAAI,KAAK,CAAC,uEAAuE,CAAC,CAAC;QAC3F,CAAC;QAED,2BAA2B;QAC3B,IAAI,MAAM,CAAC,cAAc,KAAK,SAAS,IAAI,MAAM,CAAC,cAAc,IAAI,CAAC,EAAE,CAAC;YACtE,MAAM,IAAI,KAAK,CAAC,wEAAwE,CAAC,CAAC;QAC5F,CAAC;QAED,2DAA2D;QAC3D,IAAI,MAAM,CAAC,iBAAiB,KAAK,SAAS,IAAI,MAAM,CAAC,iBAAiB,IAAI,CAAC,EAAE,CAAC;YAC5E,MAAM,IAAI,KAAK,CAAC,2EAA2E,CAAC,CAAC;QAC/F,CAAC;QAED,kEAAkE;QAClE,IAAI,MAAM,CAAC,aAAa,KAAK,SAAS,EAAE,CAAC;YACvC,IAAI,MAAM,CAAC,aAAa,GAAG,CAAC,EAAE,CAAC;gBAC7B,MAAM,IAAI,KAAK,CAAC,qEAAqE,CAAC,CAAC;YACzF,CAAC;YACD,MAAM,kBAAkB,GAAG,MAAM,CAAC,iBAAiB,IAAI,MAAM,CAAC,CAAC,qBAAqB;YACpF,IAAI,MAAM,CAAC,aAAa,IAAI,kBAAkB,EAAE,CAAC;gBAC/C,MAAM,IAAI,KAAK,CAAC,oFAAoF,CAAC,CAAC;YACxG,CAAC;QACH,CAAC;QAED,qDAAqD;QACrD,IAAI,MAAM,CAAC,gBAAgB,KAAK,SAAS,IAAI,MAAM,CAAC,gBAAgB,IAAI,CAAC,EAAE,CAAC;YAC1E,MAAM,IAAI,KAAK,CAAC,0EAA0E,CAAC,CAAC;QAC9F,CAAC;QAED,yDAAyD;QACzD,IAAI,MAAM,CAAC,oBAAoB,KAAK,SAAS,IAAI,MAAM,CAAC,oBAAoB,IAAI,CAAC,EAAE,CAAC;YAClF,MAAM,IAAI,KAAK,CAAC,8EAA8E,CAAC,CAAC;QAClG,CAAC;QAED,2BAA2B;QAC3B,IAAI,MAAM,CAAC,cAAc,KAAK,SAAS,IAAI,MAAM,CAAC,cAAc,IAAI,CAAC,EAAE,CAAC;YACtE,MAAM,IAAI,KAAK,CAAC,wEAAwE,CAAC,CAAC;QAC5F,CAAC;QAED,iCAAiC;QACjC,IAAI,MAAM,CAAC,mBAAmB,KAAK,SAAS,EAAE,CAAC;YAC7C,IAAI,MAAM,CAAC,mBAAmB,GAAG,CAAC,IAAI,MAAM,CAAC,mBAAmB,GAAG,CAAC,EAAE,CAAC;gBACrE,MAAM,IAAI,KAAK,CAAC,8EAA8E,CAAC,CAAC;YAClG,CAAC;QACH,CAAC;IACH,CAAC;IAED;;;;;;;;;;;OAWG;IACO,kBAAkB;QAC1B,mCAAmC;QACnC,IAAI,CAAC,IAAI,CAAC,uBAAuB,EAAE,CAAC;YAClC,MAAM,MAAM,GAAG,IAAI,CAAC,8BAA8B,CAAC,oBAAoB,IAAI,yBAAyB,CAAC,6BAA6B,CAAC;YACnI,MAAM,eAAe,GAAG,2BAAiB,CAAC,mBAAmB,CAAC,IAAI,CAAC,8BAA8B,CAAC,0BAA0B,CAAC,CAAC;YAC9H,MAAM,IAAI,GAAG,IAAI,CAAC,4BAA4B,CAAC,0BAA0B,EAAE,IAAI,CAAC,8BAA8B,CAAC,0BAA0B,CAAC,CAAC;YAC3I,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE,GAAG,mBAAK,CAAC,EAAE,CAAC,IAAI,CAAC,CAAC;YAC3C,MAAM,uBAAuB,GAAG,0BAAc,CAAC,qBAAqB,CAAC;gBACnE,OAAO;gBACP,YAAY,EAAE,4BAA4B;gBAC1C,MAAM;gBACN,KAAK,EAAE,IAAI;gBACX,mBAAmB,EAAE,IAAI,CAAC,8BAA8B,CAAC,mBAAmB;aAC7E,CAAC,CAAC;YAEH,IAAI,CAAC,aAAa,CAAC,mBAAmB,CAAC,IAAI,CAAC,CAAC;YAE7C,IAAI,CAAC,uBAAuB,GAAG,IAAI,wCAAc,CAAC,IAAI,EAAE,+BAA+B,EAAE;gBACvF,YAAY,EAAE,uBAAuB,CAAC,kBAAkB;gBACxD,YAAY,EAAE,yBAAY,CAAC,MAAM;gBACjC,OAAO,EAAE,2BAAe,CAAC,MAAM;gBAC/B,KAAK,EAAE,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,kCAAkC,CAAC;gBAC/D,IAAI;gBACJ,UAAU,EAAE,GAAG;gBACf,OAAO,EAAE,IAAI,CAAC,8BAA8B,CAAC,YAAY,IAAI,sBAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;gBAChF,WAAW,EAAE;oBACX,QAAQ,EAAE,eAAe;oBACzB,MAAM,EAAE,MAAM;oBACd,WAAW,EAAE,gBAAgB;oBAC7B,GAAG,oCAAgB,CAAC,2BAA2B,CAC7C,IAAI,CAAC,8BAA8B,CAAC,mBAAmB,EACvD,IAAI,CAAC,eAAe,EACpB,IAAI,CAAC,iBAAiB,CACvB;iBACF;gBACD,qBAAqB,EAAE,IAAI,CAAC,aAAa;gBACzC,GAAG,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO;oBAC9C,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,GAAG;oBACjD,CAAC,CAAC,SAAS;gBACb,UAAU,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO;oBACrD,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,0BAA0B,EAAE;oBAC1E,CAAC,CAAC,SAAS;aACd,CAAC,CAAC;YAEH,KAAK,MAAM,SAAS,IAAI,uBAAuB,CAAC,gBAAgB,EAAE,CAAC;gBACjE,IAAI,CAAC,uBAAuB,CAAC,IAAI,EAAE,oBAAoB,CAAC,SAAS,CAAC,CAAC;YACrE,CAAC;YAED,IAAI,IAAI,CAAC,8BAA8B,CAAC,OAAO,EAAE,CAAC;gBAChD,IAAI,CAAC,uBAAuB,CAAC,IAAI,EAAE,oBAAoB,CAAC,0BAAc,CAAC,4BAA4B,EAAE,CAAC,CAAC;YACzG,CAAC;QACH,CAAC;QAED,uEAAuE;QACvE,MAAM,MAAM,GAAG,sBAAsB,IAAI,CAAC,0BAA0B,EAAE,CAAC;QACvE,IAAI,CAAC,0BAA0B,EAAE,CAAC;QAElC,OAAO,IAAI,sCAAY,CAAC,IAAI,EAAE,MAAM,EAAE;YACpC,cAAc,EAAE,IAAI,CAAC,uBAAuB;YAC5C,UAAU,EAAE,wBAAwB;YACpC,cAAc,EAAE;gBACd,0BAA0B,EAAE,kCAAkC;aAC/D;SACF,CAAC,CAAC;IACL,CAAC;IAED;;;;;;;;;;;OAWG;IACO,cAAc;QACtB,mCAAmC;QACnC,IAAI,CAAC,IAAI,CAAC,mBAAmB,EAAE,CAAC;YAC9B,MAAM,MAAM,GAAG,IAAI,CAAC,8BAA8B,CAAC,gBAAgB,IAAI,yBAAyB,CAAC,yBAAyB,CAAC;YAC3H,MAAM,eAAe,GAAG,2BAAiB,CAAC,mBAAmB,CAAC,IAAI,CAAC,8BAA8B,CAAC,sBAAsB,CAAC,CAAC;YAC1H,MAAM,IAAI,GAAG,IAAI,CAAC,4BAA4B,CAAC,sBAAsB,EAAE,IAAI,CAAC,8BAA8B,CAAC,sBAAsB,CAAC,CAAC;YACnI,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE,GAAG,mBAAK,CAAC,EAAE,CAAC,IAAI,CAAC,CAAC;YAE3C,MAAM,uBAAuB,GAAG,0BAAc,CAAC,qBAAqB,CAAC;gBACnE,OAAO;gBACP,YAAY,EAAE,wBAAwB;gBACtC,MAAM;gBACN,KAAK,EAAE,IAAI;aACZ,CAAC,CAAC;YACH,IAAI,CAAC,aAAa,CAAC,mBAAmB,CAAC,IAAI,CAAC,CAAC;YAC7C,IAAI,CAAC,mBAAmB,GAAG,IAAI,wCAAc,CAAC,IAAI,EAAE,2BAA2B,EAAE;gBAC/E,YAAY,EAAE,uBAAuB,CAAC,kBAAkB;gBACxD,OAAO,EAAE,2BAAe,CAAC,MAAM;gBAC/B,YAAY,EAAE,yBAAY,CAAC,MAAM;gBACjC,KAAK,EAAE,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,kCAAkC,CAAC;gBAC/D,IAAI;gBACJ,UAAU,EAAE,GAAG;gBACf,OAAO,EAAE,IAAI,CAAC,8BAA8B,CAAC,YAAY,IAAI,sBAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;gBAChF,WAAW,EAAE;oBACX,QAAQ,EAAE,eAAe;oBACzB,MAAM,EAAE,MAAM;oBACd,WAAW,EAAE,YAAY;oBACzB,GAAG,oCAAgB,CAAC,2BAA2B,CAC7C,IAAI,CAAC,8BAA8B,CAAC,mBAAmB,EACvD,IAAI,CAAC,eAAe,EACpB,IAAI,CAAC,iBAAiB,CACvB;iBACF;gBACD,qBAAqB,EAAE,IAAI,CAAC,aAAa;gBACzC,GAAG,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO;oBAC9C,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,GAAG;oBACjD,CAAC,CAAC,SAAS;gBACb,UAAU,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO;oBACrD,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,0BAA0B,EAAE;oBAC1E,CAAC,CAAC,SAAS;aACd,CAAC,CAAC;YAEH,KAAK,MAAM,SAAS,IAAI,uBAAuB,CAAC,gBAAgB,EAAE,CAAC;gBACjE,IAAI,CAAC,mBAAmB,CAAC,IAAI,EAAE,oBAAoB,CAAC,SAAS,CAAC,CAAC;YACjE,CAAC;YAED,IAAI,IAAI,CAAC,8BAA8B,CAAC,OAAO,EAAE,CAAC;gBAChD,IAAI,CAAC,mBAAmB,CAAC,IAAI,EAAE,oBAAoB,CAAC,0BAAc,CAAC,4BAA4B,EAAE,CAAC,CAAC;YACrG,CAAC;QACH,CAAC;QAED,uEAAuE;QACvE,MAAM,MAAM,GAAG,kBAAkB,IAAI,CAAC,sBAAsB,EAAE,CAAC;QAC/D,IAAI,CAAC,sBAAsB,EAAE,CAAC;QAE9B,OAAO,IAAI,sCAAY,CAAC,IAAI,EAAE,MAAM,EAAE;YACpC,cAAc,EAAE,IAAI,CAAC,mBAAmB;YACxC,UAAU,EAAE,oBAAoB;YAChC,cAAc,EAAE;gBACd,0BAA0B,EAAE,kCAAkC;gBAC9D,UAAU,EAAE,kBAAkB;aAC/B;SACF,CAAC,CAAC;IACL,CAAC;IAES,4BAA4B,CAAC,EAAU,EAAE,KAAyB;QAC1E,OAAO,IAAI,cAAI,CAAC,IAAI,EAAE,EAAE,EAAE;YACxB,SAAS,EAAE,IAAI,0BAAgB,CAAC,sBAAsB,CAAC;YACvD,cAAc,EAAE;gBACd,mBAAmB,EAAE,IAAI,wBAAc,CAAC;oBACtC,UAAU,EAAE;wBACV,+DAA+D;wBAC/D,GAAG,IAAI,CAAC,cAAc,CAAC,0BAA0B,EAAE;wBACnD,2BAAiB,CAAC,2BAA2B,CAAC,IAAI,EAAE,KAAK,CAAC;qBAC3D;iBACF,CAAC;aACH;SACF,CAAC,CAAC;IACL,CAAC;IAED;;;;;;;;OAQG;IACO,cAAc;QACtB,IAAI,CAAC,IAAI,CAAC,8BAA8B,CAAC,wBAAwB,EAAE,CAAC;YAClE,OAAO,SAAS,CAAC;QACnB,CAAC;QAED,MAAM,MAAM,GAAG,kBAAkB,IAAI,CAAC,sBAAsB,EAAE,CAAC;QAC/D,IAAI,CAAC,sBAAsB,EAAE,CAAC;QAE9B,OAAO,IAAI,sCAAY,CAAC,IAAI,EAAE,MAAM,EAAE;YACpC,cAAc,EAAE,IAAI,CAAC,8BAA8B,CAAC,wBAAwB;YAC5E,UAAU,EAAE,kBAAkB;YAC9B,UAAU,EAAE,GAAG;YACf,mBAAmB,EAAE,IAAI;SAC1B,CAAC,CAAC;IACL,CAAC;IAED;;;;;;;;OAQG;IACO,kBAAkB;QAC1B,IAAI,CAAC,IAAI,CAAC,8BAA8B,CAAC,4BAA4B,EAAE,CAAC;YACtE,OAAO,SAAS,CAAC;QACnB,CAAC;QAED,MAAM,MAAM,GAAG,sBAAsB,IAAI,CAAC,0BAA0B,EAAE,CAAC;QACvE,IAAI,CAAC,0BAA0B,EAAE,CAAC;QAElC,OAAO,IAAI,sCAAY,CAAC,IAAI,EAAE,MAAM,EAAE;YACpC,cAAc,EAAE,IAAI,CAAC,8BAA8B,CAAC,4BAA4B;YAChF,UAAU,EAAE,uBAAuB;YACnC,UAAU,EAAE,GAAG;YACf,mBAAmB,EAAE,IAAI;SAC1B,CAAC,CAAC;IACL,CAAC;IAGD;;;;;;;;;;OAUG;IACO,iBAAiB;QACzB,gDAAgD;QAChD,IAAI,CAAC,IAAI,CAAC,8BAA8B,CAAC,cAAc,EAAE,CAAC;YACxD,OAAO,SAAS,CAAC;QACnB,CAAC;QAED,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE,GAAG,mBAAK,CAAC,EAAE,CAAC,IAAI,CAAC,CAAC;QAC3C,MAAM,cAAc,GAAG,IAAI,CAAC,8BAA8B,CAAC,cAAc,IAAI,EAAE,CAAC;QAEhF,uEAAuE;QACvE,6EAA6E;QAC7E,MAAM,IAAI,GAAG,IAAI,cAAI,CAAC,IAAI,EAAE,oBAAoB,EAAE;YAChD,SAAS,EAAE,IAAI,0BAAgB,CAAC,sBAAsB,CAAC;YACvD,cAAc,EAAE;gBACd,cAAc,EAAE,IAAI,wBAAc,CAAC;oBACjC,UAAU,EAAE;wBACV,GAAG,IAAI,CAAC,cAAc,CAAC,0BAA0B,EAAE;qBACpD;iBACF,CAAC;aACH;SACF,CAAC,CAAC;QAEH,MAAM,uBAAuB,GAAG,0BAAc,CAAC,qBAAqB,CAAC;YACnE,OAAO;YACP,YAAY,EAAE,sBAAsB;YACpC,MAAM;YACN,KAAK,EAAE,IAAI;YACX,mBAAmB,EAAE,IAAI,CAAC,8BAA8B,CAAC,mBAAmB;SAC7E,CAAC,CAAC;QAEH,IAAI,CAAC,aAAa,CAAC,mBAAmB,CAAC,IAAI,CAAC,CAAC;QAE7C,wCAAwC;QACxC,MAAM,cAAc,GAAG,IAAI,wCAAc,CAAC,IAAI,EAAE,qBAAqB,EAAE;YACrE,YAAY,EAAE,uBAAuB,CAAC,kBAAkB;YACxD,KAAK,EAAE,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,wBAAwB,CAAC;YACrD,KAAK,EAAE,YAAY;YACnB,OAAO,EAAE,SAAS;YAClB,OAAO,EAAE,2BAAe,CAAC,MAAM;YAC/B,YAAY,EAAE,yBAAY,CAAC,MAAM;YACjC,IAAI;YACJ,UAAU,EAAE,IAAI;YAChB,OAAO,EAAE,sBAAQ,CAAC,OAAO,CAAC,EAAE,CAAC;YAC7B,WAAW,EAAE;gBACX,iBAAiB,EAAE,cAAc,CAAC,QAAQ,IAAI,QAAQ;gBACtD,cAAc,EAAE,MAAM,CAAC,cAAc,CAAC,aAAa,IAAI,GAAG,CAAC;gBAC3D,eAAe,EAAE,MAAM,CAAC,cAAc,CAAC,cAAc,IAAI,MAAM,CAAC;gBAChE,UAAU,EAAE,MAAM,CAAC,cAAc,CAAC,SAAS,IAAI,EAAE,CAAC;gBAClD,aAAa,EAAE,MAAM,CAAC,cAAc,CAAC,YAAY,IAAI,CAAC,CAAC;gBACvD,oBAAoB,EAAE,MAAM,CAAC,cAAc,CAAC,iBAAiB,IAAI,MAAM,CAAC;gBACxE,cAAc,EAAE,MAAM,CAAC,cAAc,CAAC,aAAa,IAAI,IAAI,CAAC;gBAC5D,uBAAuB,EAAE,MAAM,CAAC,cAAc,CAAC,oBAAoB,IAAI,KAAK,CAAC;gBAC7E,mBAAmB,EAAE,MAAM,CAAC,cAAc,CAAC,gBAAgB,IAAI,EAAE,CAAC;gBAClE,GAAG,oCAAgB,CAAC,2BAA2B,CAC7C,IAAI,CAAC,8BAA8B,CAAC,mBAAmB,EACvD,IAAI,CAAC,eAAe,EACpB,IAAI,CAAC,iBAAiB,CACvB;aACF;YACD,qBAAqB,EAAE,IAAI,CAAC,aAAa;YACzC,GAAG,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO;gBAC9C,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,GAAG;gBACjD,CAAC,CAAC,SAAS;YACb,UAAU,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO;gBACrD,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,0BAA0B,EAAE;gBAC1E,CAAC,CAAC,SAAS;SACd,CAAC,CAAC;QAEH,KAAK,MAAM,SAAS,IAAI,uBAAuB,CAAC,gBAAgB,EAAE,CAAC;YACjE,cAAc,CAAC,IAAI,EAAE,oBAAoB,CAAC,SAAS,CAAC,CAAC;QACvD,CAAC;QAED,IAAI,IAAI,CAAC,8BAA8B,CAAC,OAAO,EAAE,CAAC;YAChD,cAAc,CAAC,IAAI,EAAE,oBAAoB,CAAC,0BAAc,CAAC,4BAA4B,EAAE,CAAC,CAAC;QAC3F,CAAC;QAED,OAAO,IAAI,sCAAY,CAAC,IAAI,EAAE,wBAAwB,EAAE;YACtD,cAAc,EAAE,cAAc;YAC9B,UAAU,EAAE,kBAAkB;YAC9B,cAAc,EAAE;gBACd,oBAAoB,EAAE,4BAA4B;gBAClD,iBAAiB,EAAE,yBAAyB;gBAC5C,YAAY,EAAE,oBAAoB;gBAClC,UAAU,EAAE,kBAAkB;aAC/B;SACF,CAAC,CAAC;IACL,CAAC;IAED;;;;;;;;;;OAUG;IACO,qBAAqB;QAC7B,IAAI,CAAC,IAAI,CAAC,8BAA8B,CAAC,cAAc,EAAE,CAAC;YACxD,OAAO,EAAE,CAAC;QACZ,CAAC;QAED,OAAO;YACL,eAAe,EAAE,8CAAoB,CAAC,UAAU,CAC9C,4BAAQ,CAAC,QAAQ,CAAC,0DAA0D,CAAC,CAC9E;YACD,gBAAgB,EAAE,8CAAoB,CAAC,UAAU,CAC/C,4BAAQ,CAAC,QAAQ,CAAC,2BAA2B,CAAC,CAC/C;YACD,aAAa,EAAE,8CAAoB,CAAC,UAAU,CAC5C,4BAAQ,CAAC,YAAY,CAAC,4BAAQ,CAAC,QAAQ,CAAC,gCAAgC,CAAC,CAAC,CAC3E;YACD,aAAa,EAAE,8CAAoB,CAAC,UAAU,CAC5C,4BAAQ,CAAC,YAAY,CAAC,4BAAQ,CAAC,QAAQ,CAAC,yBAAyB,CAAC,CAAC,CACpE;SACF,CAAC;IACJ,CAAC;IAED;;;;;;;;;;OAUG;IACO,wBAAwB;QAChC,oDAAoD;QACpD,IAAI,CAAC,IAAI,CAAC,8BAA8B,CAAC,cAAc,EAAE,CAAC;YACxD,OAAO,IAAI,CAAC,gCAAgC,EAAE,CAAC;QACjD,CAAC;QAED,uDAAuD;QACvD,MAAM,WAAW,GAAG,IAAI,0BAAM,CAAC,IAAI,EAAE,gBAAgB,CAAC,CAAC;QAEvD,WAAW;aACR,IAAI,CACH,6BAAS,CAAC,aAAa,CAAC,mCAAmC,EAAE,IAAI,CAAC,EAClE,IAAI,CAAC,2BAA2B,EAAE,CACnC;aACA,SAAS;QACR,4EAA4E;QAC5E,IAAI,CAAC,gCAAgC,CAAC,UAAU,CAAC,CAClD,CAAC;QAEJ,OAAO,WAAW,CAAC;IACrB,CAAC;IAGD;;;;;;;;;;;OAWG;IACK,2BAA2B;QACjC,MAAM,cAAc,GAAG,IAAI,CAAC,8BAA8B,CAAC,cAAc,IAAI,EAAE,CAAC;QAChF,MAAM,cAAc,GAAG,cAAc,CAAC,cAAc,KAAK,YAAY;YACnE,CAAC,CAAC,CAAC;YACH,CAAC,CAAC,CAAC,cAAc,CAAC,cAAc,IAAI,EAAE,CAAC,CAAC;QAE1C,yCAAyC;QACzC,MAAM,QAAQ,GAAG,IAAI,uBAAG,CAAC,IAAI,EAAE,eAAe,EAAE;YAC9C,SAAS,EAAE,yBAAyB;YACpC,cAAc;YACd,UAAU,EAAE;gBACV,cAAc,EAAE,cAAc;gBAC9B,SAAS,EAAE,mBAAmB;gBAC9B,cAAc,EAAE,mBAAmB;gBACnC,eAAe,EAAE,6CAA6C;gBAC9D,wEAAwE;gBACxE,SAAS,EAAE;oBACT,UAAU,EAAE,IAAI;oBAChB,UAAU,EAAE,0BAA0B;oBACtC,OAAO,EAAE,uBAAuB;oBAChC,YAAY,EAAE,oBAAoB;iBACnC;gBACD,eAAe,EAAE,eAAe;aACjC;YACD,UAAU,EAAE,gBAAgB;SAC7B,CAAC,CAAC;QAEH,2DAA2D;QAC3D,MAAM,mBAAmB,GAAG,IAAI,CAAC,kBAAkB,EAAE,CAAC;QACtD,MAAM,eAAe,GAAG,IAAI,CAAC,cAAc,EAAE,CAAC;QAE9C,QAAQ,CAAC,aAAa,CACpB,mBAAmB,CAAC,IAAI,CAAC,eAAe,CAAC,CAC1C,CAAC;QAEF,+EAA+E;QAC/E,MAAM,qBAAqB,GAAG,IAAI,CAAC,qBAAqB,EAAE,CAAC;QAE3D,mFAAmF;QACnF,iFAAiF;QACjF,qEAAqE;QACrE,MAAM,cAAc,GAAG,IAAI,wBAAI,CAAC,IAAI,EAAE,2BAA2B,EAAE;YACjE,UAAU,EAAE;gBACV,cAAc,EAAE,cAAc;gBAC9B,eAAe,EAAE,eAAe;gBAChC,WAAW,EAAE,WAAW;gBACxB,kBAAkB,EAAE,kBAAkB;gBACtC,gBAAgB,EAAE,gBAAgB;gBAClC,oBAAoB,EAAE,oBAAoB;gBAC1C,0EAA0E;gBAC1E,kBAAkB,EAAE;oBAClB,UAAU,EAAE,2BAA2B;iBACxC;gBACD,gFAAgF;gBAChF,wBAAwB,EAAE,wCAAwC;aACnE;SACF,CAAC,CAAC;QAEH,oDAAoD;QACpD,MAAM,0BAA0B,GAAG,IAAI,CAAC,gCAAgC,EAAE,CAAC;QAE3E,sBAAsB;QACtB,MAAM,WAAW,GAAG,IAAI,CAAC,iBAAiB,EAAE,CAAC;QAE7C,8EAA8E;QAC9E,MAAM,eAAe,GAAG,IAAI,CAAC,cAAc,CAAC,kBAAkB,CAAC,IAAI,EAAE,SAAS,CAAC,CAAC;QAEhF,gDAAgD;QAChD,MAAM,uBAAuB,GAAG,IAAI,CAAC,6BAA6B,EAAE,CAAC;QAErE,oDAAoD;QACpD,MAAM,cAAc,GAAG,IAAI,CAAC,cAAc,EAAE,CAAC;QAC7C,MAAM,kBAAkB,GAAG,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAErD,0CAA0C;QAC1C,mHAAmH;QACnH,IAAI,UAAU,GAAe,WAAW;aACrC,QAAQ,CAAC;YACR,MAAM,EAAE,CAAC,yBAAyB,EAAE,iCAAiC,CAAC;YACtE,QAAQ,EAAE,sBAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;YAC7B,WAAW,EAAE,CAAC;YACd,WAAW,EAAE,CAAC;SACf,CAAC;aACD,IAAI,CAAC,eAAe,CAAC,CAAC;QAEzB,0DAA0D;QAC1D,IAAI,kBAAkB,EAAE,CAAC;YACvB,MAAM,0BAA0B,GAAG,IAAI,0CAAgB,CAAC,IAAI,EAAE,oCAAoC,EAAE;gBAClG,KAAK,EAAE,IAAI,CAAC,uBAAuB;gBACnC,GAAG,EAAE;oBACH,UAAU,EAAE,8CAAoB,CAAC,UAAU,CAAC,4BAAQ,CAAC,QAAQ,CAAC,cAAc,CAAC,CAAC;iBAC/E;gBACD,gBAAgB,EAAE,iCAAiC;gBACnD,yBAAyB,EAAE;oBACzB,YAAY,EAAE,8CAAoB,CAAC,UAAU,CAAC,yBAAyB,CAAC;iBACzE;gBACD,UAAU,EAAE,4BAAQ,CAAC,OAAO;aAC7B,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,cAAc,CAAC,iBAAiB,CAAC,IAAI,EAAE,iBAAiB,CAAC,CAAC,CAAC;YAExE,UAAU,GAAG,kBAAkB;iBAC5B,QAAQ,CAAC,0BAA0B,EAAE;gBACpC,UAAU,EAAE,4BAAQ,CAAC,OAAO;aAC7B,CAAC;iBACD,IAAI,CACH,IAAI,0CAAgB,CAAC,IAAI,EAAE,oCAAoC,EAAE;gBAC/D,KAAK,EAAE,IAAI,CAAC,uBAAuB;gBACnC,GAAG,EAAE;oBACH,UAAU,EAAE,8CAAoB,CAAC,UAAU,CAAC,4BAAQ,CAAC,QAAQ,CAAC,cAAc,CAAC,CAAC;iBAC/E;gBACD,gBAAgB,EAAE,+EAA+E;gBACjG,yBAAyB,EAAE;oBACzB,YAAY,EAAE,8CAAoB,CAAC,UAAU,CAAC,0BAA0B,CAAC;oBACzE,uBAAuB,EAAE,8CAAoB,CAAC,UAAU,CAAC,4BAAQ,CAAC,YAAY,CAAC,4BAAQ,CAAC,QAAQ,CAAC,uBAAuB,CAAC,CAAC,CAAC;iBAC5H;gBACD,UAAU,EAAE,4BAAQ,CAAC,OAAO;aAC7B,CAAC,CAAC,IAAI,CAAC,UAAU,CAAC,CACpB,CAAC;QACN,CAAC;QAED,wEAAwE;QACxE,IAAI,cAAc,EAAE,CAAC;YACnB,MAAM,sBAAsB,GAAG,IAAI,0CAAgB,CAAC,IAAI,EAAE,gCAAgC,EAAE;gBAC1F,KAAK,EAAE,IAAI,CAAC,uBAAuB;gBACnC,GAAG,EAAE;oBACH,UAAU,EAAE,8CAAoB,CAAC,UAAU,CAAC,4BAAQ,CAAC,QAAQ,CAAC,cAAc,CAAC,CAAC;iBAC/E;gBACD,gBAAgB,EAAE,iCAAiC;gBACnD,yBAAyB,EAAE;oBACzB,YAAY,EAAE,8CAAoB,CAAC,UAAU,CAAC,oBAAoB,CAAC;iBACpE;gBACD,UAAU,EAAE,4BAAQ,CAAC,OAAO;aAC7B,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,cAAc,CAAC,iBAAiB,CAAC,IAAI,EAAE,eAAe,CAAC,CAAC,CAAC;YAEtE,UAAU,GAAG,cAAc;iBACxB,QAAQ,CAAC,sBAAsB,EAAE;gBAChC,UAAU,EAAE,4BAAQ,CAAC,OAAO;aAC7B,CAAC;iBACD,IAAI,CACH,IAAI,0CAAgB,CAAC,IAAI,EAAE,gCAAgC,EAAE;gBAC3D,KAAK,EAAE,IAAI,CAAC,uBAAuB;gBACnC,GAAG,EAAE;oBACH,UAAU,EAAE,8CAAoB,CAAC,UAAU,CAAC,4BAAQ,CAAC,QAAQ,CAAC,cAAc,CAAC,CAAC;iBAC/E;gBACD,gBAAgB,EAAE,uEAAuE;gBACzF,yBAAyB,EAAE;oBACzB,YAAY,EAAE,kBAAkB;wBAC9B,CAAC,CAAC,8CAAoB,CAAC,UAAU,CAAC,qBAAqB,CAAC;wBACxD,CAAC,CAAC,8CAAoB,CAAC,UAAU,CAAC,UAAU,CAAC;oBAC/C,mBAAmB,EAAE,8CAAoB,CAAC,UAAU,CAAC,4BAAQ,CAAC,YAAY,CAAC,4BAAQ,CAAC,QAAQ,CAAC,kBAAkB,CAAC,CAAC,CAAC;iBACnH;gBACD,UAAU,EAAE,4BAAQ,CAAC,OAAO;aAC7B,CAAC,CAAC,IAAI,CAAC,UAAU,CAAC,CACpB,CAAC;QACN,CAAC;QAED,+HAA+H;QAC/H,OAAO,QAAQ;aACZ,QAAQ,CAAC,uBAAuB,EAAE;YACjC,UAAU,EAAE,SAAS;SACtB,CAAC;aACD,IAAI,CACH,qBAAqB;aAClB,QAAQ,CAAC,uBAAuB,EAAE;YACjC,UAAU,EAAE,SAAS;SACtB,CAAC;aACD,QAAQ,CAAC;YACR,MAAM,EAAE,CAAC,yBAAyB,EAAE,iCAAiC,CAAC;YACtE,QAAQ,EAAE,sBAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;YAC7B,WAAW,EAAE,CAAC;YACd,WAAW,EAAE,CAAC;SACf,CAAC;aACD,IAAI,CACH,cAAc,CAAC,IAAI,CACjB,0BAA0B;aACvB,QAAQ,CAAC;YACR,MAAM,EAAE,CAAC,iDAAiD,CAAC;YAC3D,QAAQ,EAAE,sBAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;YAC7B,WAAW,EAAE,CAAC;YACd,WAAW,EAAE,CAAC;SACf,CAAC;aACD,IAAI,CAAC,UAAU,CAAC,CACpB,CACF,CACJ,CAAC;IACN,CAAC;IAED;;;;;;;;OAQG;IACK,qBAAqB;QAC3B,mEAAmE;QACnE,IAAI,CAAC,IAAI,CAAC,oBAAoB,EAAE,CAAC;YAC/B,MAAM,MAAM,GAAG,IAAI,CAAC,8BAA8B,CAAC,iBAAiB,IAAI,yBAAyB,CAAC,0BAA0B,CAAC;YAC7H,MAAM,eAAe,GAAG,2BAAiB,CAAC,mBAAmB,CAAC,IAAI,CAAC,8BAA8B,CAAC,sBAAsB,CAAC,CAAC;YAC1H,MAAM,IAAI,GAAG,IAAI,CAAC,4BAA4B,CAAC,uBAAuB,EAAE,IAAI,CAAC,8BAA8B,CAAC,sBAAsB,CAAC,CAAC;YACpI,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE,GAAG,mBAAK,CAAC,EAAE,CAAC,IAAI,CAAC,CAAC;YAE3C,MAAM,uBAAuB,GAAG,0BAAc,CAAC,qBAAqB,CAAC;gBACnE,OAAO;gBACP,YAAY,EAAE,yBAAyB;gBACvC,MAAM;gBACN,KAAK,EAAE,IAAI;gBACX,mBAAmB,EAAE,IAAI,CAAC,8BAA8B,CAAC,mBAAmB;aAC7E,CAAC,CAAC;YAEH,IAAI,CAAC,aAAa,CAAC,mBAAmB,CAAC,IAAI,CAAC,CAAC;YAE7C,IAAI,CAAC,oBAAoB,GAAG,IAAI,wCAAc,CAAC,IAAI,EAAE,4BAA4B,EAAE;gBACjF,YAAY,EAAE,uBAAuB,CAAC,kBAAkB;gBACxD,YAAY,EAAE,yBAAY,CAAC,MAAM;gBACjC,OAAO,EAAE,2BAAe,CAAC,MAAM;gBAC/B,KAAK,EAAE,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,kCAAkC,CAAC;gBAC/D,IAAI;gBACJ,UAAU,EAAE,IAAI;gBAChB,OAAO,EAAE,IAAI,CAAC,8BAA8B,CAAC,YAAY,IAAI,sBAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;gBAChF,WAAW,EAAE;oBACX,QAAQ,EAAE,eAAe;oBACzB,MAAM,EAAE,MAAM;oBACd,WAAW,EAAE,aAAa;oBAC1B,iBAAiB,EAAE,OAAO,EAAE,qDAAqD;oBACjF,GAAG,oCAAgB,CAAC,2BAA2B,CAC7C,IAAI,CAAC,8BAA8B,CAAC,mBAAmB,EACvD,IAAI,CAAC,eAAe,EACpB,IAAI,CAAC,iBAAiB,CACvB;iBACF;gBACD,qBAAqB,EAAE,IAAI,CAAC,aAAa;gBACzC,GAAG,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO;oBAC9C,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,GAAG;oBACjD,CAAC,CAAC,SAAS;gBACb,UAAU,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO;oBACrD,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,0BAA0B,EAAE;oBAC1E,CAAC,CAAC,SAAS;aACd,CAAC,CAAC;YAEH,KAAK,MAAM,SAAS,IAAI,uBAAuB,CAAC,gBAAgB,EAAE,CAAC;gBACjE,IAAI,CAAC,oBAAoB,CAAC,IAAI,EAAE,oBAAoB,CAAC,SAAS,CAAC,CAAC;YAClE,CAAC;YAED,IAAI,IAAI,CAAC,8BAA8B,CAAC,OAAO,EAAE,CAAC;gBAChD,IAAI,CAAC,oBAAoB,CAAC,IAAI,EAAE,oBAAoB,CAAC,0BAAc,CAAC,4BAA4B,EAAE,CAAC,CAAC;YACtG,CAAC;QACH,CAAC;QAED,uEAAuE;QACvE,MAAM,MAAM,GAAG,mBAAmB,IAAI,CAAC,uBAAuB,EAAE,CAAC;QACjE,IAAI,CAAC,uBAAuB,EAAE,CAAC;QAE/B,+EAA+E;QAC/E,OAAO,IAAI,sCAAY,CAAC,IAAI,EAAE,MAAM,EAAE;YACpC,cAAc,EAAE,IAAI,CAAC,oBAAoB;YACzC,OAAO,EAAE,6BAAS,CAAC,UAAU,CAAC;gBAC5B,cAAc,EAAE,cAAc;gBAC9B,aAAa,EAAE,MAAM;gBACrB,SAAS,EAAE;oBACT,kEAAkE;oBAClE,QAAQ,EAAE,qCAAqC;iBAChD;aACF,CAAC;YACF,4FAA4F;YAC5F,gGAAgG;YAChG,UAAU,EAAE,oBAAoB;YAChC,cAAc,EAAE;gBACd,UAAU,EAAE,kBAAkB;aAC/B;SACF,CAAC,CAAC;IACL,CAAC;IAED;;;;;;;;OAQG;IACK,gCAAgC;QACtC,OAAO,IAAI,0CAAgB,CAAC,IAAI,EAAE,uBAAuB,EAAE;YACzD,KAAK,EAAE,IAAI,CAAC,uBAAuB;YACnC,GAAG,EAAE;gBACH,UAAU,EAAE,8CAAoB,CAAC,UAAU,CAAC,4BAAQ,CAAC,QAAQ,CAAC,cAAc,CAAC,CAAC;aAC/E;YACD,gBAAgB,EAAE,0DAA0D;YAC5E,yBAAyB,EAAE;gBACzB,SAAS,EAAE,8CAAoB,CAAC,UAAU,CACxC,4BAAQ,CAAC,YAAY,CAAC,4BAAQ,CAAC,QAAQ,CAAC,oBAAoB,CAAC,CAAC,CAC/D;gBACD,SAAS,EAAE,8CAAoB,CAAC,UAAU,CAAC,UAAU,CAAC;aACvD;YACD,UAAU,EAAE,4BAAQ,CAAC,OAAO;SAC7B,CAAC,CAAC;IACL,CAAC;IAED;;;;;;;;;OASG;IACK,iBAAiB;QACvB,mCAAmC;QACnC,IAAI,CAAC,IAAI,CAAC,gBAAgB,EAAE,CAAC;YAC3B,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE,GAAG,mBAAK,CAAC,EAAE,CAAC,IAAI,CAAC,CAAC;YAE3C,MAAM,IAAI,GAAG,IAAI,cAAI,CAAC,IAAI,EAAE,mBAAmB,EAAE;gBAC/C,SAAS,EAAE,IAAI,0BAAgB,CAAC,sBAAsB,CAAC;gBACvD,cAAc,EAAE;oBACd,aAAa,EAAE,IAAI,wBAAc,CAAC;wBAChC,UAAU,EAAE;4BACV,uDAAuD;4BACvD,GAAG,IAAI,CAAC,cAAc,CAAC,0BAA0B,CAAC,CAAC,iBAAiB,CAAC,EAAE,IAAI,CAAC;yBAC7E;qBACF,CAAC;iBACH;aACF,CAAC,CAAC;YAEH,MAAM,uBAAuB,GAAG,0BAAc,CAAC,qBAAqB,CAAC;gBACnE,OAAO;gBACP,YAAY,EAAE,qBAAqB;gBACnC,MAAM;gBACN,KAAK,EAAE,IAAI;gBACX,mBAAmB,EAAE,IAAI,CAAC,8BAA8B,CAAC,mBAAmB;aAC7E,CAAC,CAAC;YAEH,IAAI,CAAC,aAAa,CAAC,mBAAmB,CAAC,IAAI,CAAC,CAAC;YAE7C,IAAI,CAAC,gBAAgB,GAAG,IAAI,wCAAc,CAAC,IAAI,EAAE,iBAAiB,EAAE;gBAClE,YAAY,EAAE,uBAAuB,CAAC,kBAAkB;gBACxD,KAAK,EAAE,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,mBAAmB,CAAC;gBAChD,KAAK,EAAE,YAAY;gBACnB,OAAO,EAAE,SAAS;gBAClB,OAAO,EAAE,2BAAe,CAAC,MAAM;gBAC/B,YAAY,EAAE,yBAAY,CAAC,MAAM;gBACjC,IAAI;gBACJ,UAAU,EAAE,GAAG;gBACf,OAAO,EAAE,sBAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;gBAC5B,WAAW,EAAE;oBACX,GAAG,oCAAgB,CAAC,2BAA2B,CAC7C,IAAI,CAAC,8BAA8B,CAAC,mBAAmB,EACvD,IAAI,CAAC,eAAe,EACpB,IAAI,CAAC,iBAAiB,CACvB;iBACF;gBACD,qBAAqB,EAAE,IAAI,CAAC,aAAa;gBACzC,GAAG,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO;oBAC9C,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,GAAG;oBACjD,CAAC,CAAC,SAAS;gBACb,UAAU,EAAE,IAAI,CAAC,8BAA8B,CAAC,OAAO;oBACrD,CAAC,CAAC,IAAI,CAAC,8BAA8B,CAAC,OAAO,CAAC,0BAA0B,EAAE;oBAC1E,CAAC,CAAC,SAAS;aACd,CAAC,CAAC;YAEH,KAAK,MAAM,SAAS,IAAI,uBAAuB,CAAC,gBAAgB,EAAE,CAAC;gBACjE,IAAI,CAAC,gBAAgB,CAAC,IAAI,EAAE,oBAAoB,CAAC,SAAS,CAAC,CAAC;YAC9D,CAAC;YAED,IAAI,IAAI,CAAC,8BAA8B,CAAC,OAAO,EAAE,CAAC;gBAChD,IAAI,CAAC,gBAAgB,CAAC,IAAI,EAAE,oBAAoB,CAAC,0BAAc,CAAC,4BAA4B,EAAE,CAAC,CAAC;YAClG,CAAC;QACH,CAAC;QAED,OAAO,IAAI,sCAAY,CAAC,IAAI,EAAE,eAAe,EAAE;YAC7C,cAAc,EAAE,IAAI,CAAC,gBAAgB;YACrC,OAAO,EAAE,6BAAS,CAAC,UAAU,CAAC;gBAC5B,cAAc,EAAE,cAAc;gBAC9B,UAAU,EAAE,yBAAyB;aACtC,CAAC;YACF,UAAU,EAAE,4BAAQ,CAAC,OAAO;SAC7B,CAAC,CAAC;IACL,CAAC;IAED;;;;;;;;OAQG;IACK,6BAA6B;QACnC,MAAM,mBAAmB,GAAG,IAAI,0CAAgB,CAAC,IAAI,EAAE,0BAA0B,EAAE;YACjF,KAAK,EAAE,IAAI,CAAC,uBAAuB;YACnC,GAAG,EAAE;gBACH,UAAU,EAAE,8CAAoB,CAAC,UAAU,CAAC,4BAAQ,CAAC,QAAQ,CAAC,cAAc,CAAC,CAAC;aAC/E;YACD,gBAAgB,EAAE,iCAAiC;YACnD,yBAAyB,EAAE;gBACzB,YAAY,EAAE,8CAAoB,CAAC,UAAU,CAAC,qBAAqB,CAAC;aACrE;YACD,UAAU,EAAE,4BAAQ,CAAC,OAAO;SAC7B,CAAC,CAAC;QAEH,qEAAqE;QACrE,MAAM,YAAY,GAAG,IAAI,CAAC,cAAc,CAAC,iBAAiB,CAAC,IAAI,EAAE,SAAS,CAAC,CAAC;QAE5E,OAAO,mBAAmB,CAAC,IAAI,CAAC,YAAY,CAAC,CAAC;IAChD,CAAC;;AAn+BH,8DAo+BC;;;AAn+B2B,uDAA6B,GAAG;;;;;;;;;GASzD,AATsD,CASrD;AAEwB,mDAAyB,GAAG;;;;;;;;;;;;;;;;;;GAkBrD,AAlBkD,CAkBjD;AAEwB,oDAA0B,GAAG;;;;;;;;;;;;;;;;;;;;;GAqBtD,AArBmD,CAqBlD","sourcesContent":["// Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.\n// SPDX-License-Identifier: Apache-2.0\n\nimport * as path from 'path';\nimport { PythonFunction } from '@aws-cdk/aws-lambda-python-alpha';\nimport { Duration, Stack } from 'aws-cdk-lib';\nimport { InterfaceVpcEndpointAwsService } from 'aws-cdk-lib/aws-ec2';\nimport { Role, ServicePrincipal, PolicyDocument } from 'aws-cdk-lib/aws-iam';\nimport { Function, Architecture } from 'aws-cdk-lib/aws-lambda';\nimport { IChainable, Choice, Condition, Map, JsonPath, TaskInput, Pass } from 'aws-cdk-lib/aws-stepfunctions';\nimport { DynamoAttributeValue, DynamoUpdateItem, LambdaInvoke } from 'aws-cdk-lib/aws-stepfunctions-tasks';\nimport { Construct } from 'constructs';\nimport { BaseDocumentProcessing, BaseDocumentProcessingProps, DocumentProcessingStepType } from './base-document-processing';\nimport { ChunkingConfig } from './chunking-config';\nimport { DefaultRuntimes } from '../framework';\nimport { BedrockModelProps, BedrockModelUtils } from '../framework/bedrock';\nimport { LambdaIamUtils } from '../utilities';\nimport { PowertoolsConfig } from '../utilities/observability/powertools-config';\n\n/**\n * Configuration properties for BedrockDocumentProcessing construct.\n * Extends BaseDocumentProcessingProps with Bedrock-specific options.\n */\nexport interface BedrockDocumentProcessingProps extends BaseDocumentProcessingProps {\n  /**\n   * Bedrock foundation model for document classification step.\n   */\n  readonly classificationBedrockModel?: BedrockModelProps;\n\n  /**\n   * Bedrock foundation model for document extraction step.\n   */\n  readonly processingBedrockModel?: BedrockModelProps;\n  /**\n   * Custom prompt template for document classification.\n   * Must include placeholder for document content.\n   * @default DEFAULT_CLASSIFICATION_PROMPT\n   */\n  readonly classificationPrompt?: string;\n  /**\n   * Custom prompt template for document extraction.\n   * Must include placeholder for document content and classification result.\n   * @default DEFAULT_EXTRACTION_PROMPT\n   */\n  readonly processingPrompt?: string;\n  /**\n   * Optional Lambda function for document enrichment step.\n   * If provided, will be invoked after extraction with workflow state.\n   */\n  readonly enrichmentLambdaFunction?: Function;\n  /**\n   * Optional Lambda function for post-processing step.\n   * If provided, will be invoked after enrichment with workflow state.\n   */\n  readonly postProcessingLambdaFunction?: Function;\n  /**\n   * Timeout for individual Step Functions tasks (classification, extraction, etc.).\n   * @default Duration.minutes(5)\n   */\n  readonly stepTimeouts?: Duration;\n\n  /**\n   * Custom prompt template for aggregating results from multiple chunks.\n   * Used when chunking is enabled to merge processing results from all chunks\n   * into a single coherent result.\n   *\n   * The prompt receives the concatenated processing results from all chunks\n   * and should instruct the model to synthesize them into a unified output.\n   *\n   * @default DEFAULT_AGGREGATION_PROMPT\n   */\n  readonly aggregationPrompt?: string;\n\n  /**\n   * Enable PDF chunking for large documents.\n   *\n   * When enabled, documents exceeding configured thresholds will be automatically\n   * split into chunks, processed in parallel or sequentially, and results aggregated.\n   *\n   * This feature is useful for:\n   * - Processing large PDFs (>100 pages)\n   * - Handling documents that exceed Bedrock token limits (~200K tokens)\n   * - Improving processing reliability for complex documents\n   * - Processing documents with variable content density\n   *\n   * The chunking workflow:\n   * 1. Analyzes PDF to determine page count and estimate token count\n   * 2. Decides if chunking is needed based on configured thresholds\n   * 3. If chunking is needed, splits PDF into chunks and uploads to S3\n   * 4. Processes each chunk through classification and extraction\n   * 5. Aggregates results using majority voting for classification\n   * 6. Deduplicates entities across chunks\n   * 7. Cleans up temporary chunk files from S3\n   *\n   * @default false\n   */\n  readonly enableChunking?: boolean;\n\n  /**\n   * Configuration for PDF chunking behavior.\n   *\n   * Only applies when `enableChunking` is true. Allows customization of:\n   * - **Chunking strategy**: How documents are split (fixed-pages, token-based, or hybrid)\n   * - **Thresholds**: When to trigger chunking based on page count or token count\n   * - **Chunk size and overlap**: Control chunk boundaries and context preservation\n   * - **Processing mode**: Parallel (faster) or sequential (cost-optimized)\n   * - **Aggregation strategy**: How to combine results from multiple chunks\n   *\n   * ## Default Configuration\n   *\n   * If not provided, uses sensible defaults optimized for most use cases:\n   * - Strategy: `'hybrid'` (recommended - balances token and page limits)\n   * - Page threshold: 100 pages\n   * - Token threshold: 150,000 tokens\n   * - Processing mode: `'parallel'`\n   * - Max concurrency: 10\n   * - Aggregation strategy: `'majority-vote'`\n   *\n   * ## Strategy Comparison\n   *\n   * | Strategy | Best For | Pros | Cons |\n   * |----------|----------|------|------|\n   * | `hybrid` | Most documents | Balances token/page limits | Slightly more complex |\n   * | `token-based` | Variable density | Respects model limits | Slower analysis |\n   * | `fixed-pages` | Uniform density | Simple, fast | May exceed token limits |\n   *\n   * @default undefined (uses default configuration when enableChunking is true)\n   *\n   * @see {@link ChunkingConfig} for detailed configuration options\n   */\n  readonly chunkingConfig?: ChunkingConfig;\n}\n\n/**\n * Document processing workflow powered by Amazon Bedrock foundation models.\n *\n * Extends BaseDocumentProcessing to provide AI-powered document classification and extraction\n * using Amazon Bedrock foundation models. This implementation offers:\n *\n * ## Key Features\n * - **AI-Powered Classification**: Uses Claude 3.7 Sonnet (configurable) to classify document types\n * - **Intelligent Extraction**: Extracts structured data from documents using foundation models\n * - **Cross-Region Inference**: Optional support for improved availability via inference profiles\n * - **Flexible Processing**: Optional enrichment and post-processing Lambda functions\n * - **Cost Optimized**: Configurable timeouts and model selection for cost control\n *\n * ## Processing Workflow\n * S3 Upload → Classification (Bedrock) → Extraction (Bedrock) → [Enrichment] → [Post-Processing] → Results\n *\n * ## Default Models\n * - Classification: Claude 3.7 Sonnet (anthropic.claude-3-7-sonnet-20250219-v1:0)\n * - Extraction: Claude 3.7 Sonnet (anthropic.claude-3-7-sonnet-20250219-v1:0)\n *\n * ## Prompt Templates\n * The construct uses default prompts that can be customized:\n * - **Classification**: Analyzes document and returns JSON with documentClassification field\n * - **Extraction**: Uses classification result to extract entities in structured JSON format\n *\n * ## Cross-Region Inference\n * When enabled, uses Bedrock inference profiles for improved availability:\n * - US prefix: Routes to US-based regions for lower latency\n * - EU prefix: Routes to EU-based regions for data residency compliance\n */\nexport class BedrockDocumentProcessing extends BaseDocumentProcessing {\n  protected static readonly DEFAULT_CLASSIFICATION_PROMPT = `\n  Analyze the document below, and classify the type of document it is (eg. INVOICE, IDENTITY_DOCUMENT, RECEIPT, etc). The result should be in JSON and should follow the following structure (only respond in JSON with the following structure and do not use markdown to indicate the json, just output plain old json with nothing else):\n\n  {\n      documentClassification: <CLASSIFICATION>\n  }\n\n  Attached document is as follows:\n\n  `;\n\n  protected static readonly DEFAULT_PROCESSING_PROMPT = `\n  The document below has been classified as [ACTUAL_CLASSIFICATION]. Extract important entities from the document and return the result as JSON following the structure below (only respond in JSON with the following structure and do not use markdown to indicate the json, just output plain old json with nothing else):\n\n  {\n      documentClassification: <CLASSIFICATION>,\n      result: {\n        entities: [\n            {\n                type: <TYPE OF ENTITY>\n                value: <VALUE OF ENTITY>\n            },\n            ...\n        ]\n      }\n  }\n\n  Attached document is as follows:\n\n  `;\n\n  protected static readonly DEFAULT_AGGREGATION_PROMPT = `\n  You are given the processing results from multiple chunks of a large document that was split for processing.\n  Your task is to synthesize these chunk results into a single, coherent final result.\n\n  Instructions:\n  1. Review all the chunk results provided below\n  2. Merge and deduplicate any overlapping information (chunks may have overlapping pages)\n  3. Synthesize the information into a unified, coherent result\n  4. Maintain the same output format as the individual chunk results\n  5. If the chunks contain summaries, create a comprehensive summary that covers all sections\n  6. If the chunks contain entities, deduplicate and consolidate them\n  7. Preserve important details from each chunk while avoiding redundancy\n\n  Return the result as JSON (only respond in JSON without markdown formatting):\n\n  {\n      \"result\": <SYNTHESIZED_RESULT>\n  }\n\n  The chunk results to aggregate are as follows:\n\n  `;\n\n  /** Configuration properties specific to Bedrock document processing */\n  protected readonly bedrockDocumentProcessingProps: BedrockDocumentProcessingProps;\n  /** The Step Functions state machine that orchestrates the document processing workflow */\n  readonly stateMachine;\n  /** Cached classification Lambda function to avoid duplicate resource creation */\n  private _classificationFunction?: Function;\n  /** Cached processing Lambda function to avoid duplicate resource creation */\n  private _processingFunction?: Function;\n  /** Counter for generating unique classification step IDs */\n  private _classificationStepCounter = 0;\n  /** Counter for generating unique processing step IDs */\n  private _processingStepCounter = 0;\n  /** Cached aggregation Lambda function to avoid duplicate resource creation */\n  private _aggregationFunction?: Function;\n  /** Counter for generating unique aggregation step IDs */\n  private _aggregationStepCounter = 0;\n  /** Cached cleanup Lambda function to avoid duplicate resource creation */\n  private _cleanupFunction?: Function;\n  /** Counter for generating unique enrichment step IDs */\n  private _enrichmentStepCounter = 0;\n  /** Counter for generating unique post-processing step IDs */\n  private _postProcessingStepCounter = 0;\n\n\n  /**\n   * Creates a new BedrockDocumentProcessing construct.\n   *\n   * Initializes the Bedrock-powered document processing pipeline with AI classification\n   * and extraction capabilities. Creates Lambda functions with appropriate IAM roles\n   * for Bedrock model invocation and S3 access.\n   *\n   * @param scope - The scope in which to define this construct\n   * @param id - The scoped construct ID. Must be unique within the scope.\n   * @param props - Configuration properties for the Bedrock document processing pipeline\n   * @throws Error if chunking configuration is invalid\n   */\n  constructor(scope: Construct, id: string, props: BedrockDocumentProcessingProps) {\n    super(scope, id, props);\n\n    // Validate chunking configuration if provided\n    if (props.enableChunking && props.chunkingConfig) {\n      this.validateChunkingConfig(props.chunkingConfig);\n    }\n\n    if (props.network) {\n      props.network.createServiceEndpoint('vpce-bedrock', InterfaceVpcEndpointAwsService.BEDROCK);\n      props.network.createServiceEndpoint('vpce-bedrock-runtime', InterfaceVpcEndpointAwsService.BEDROCK_RUNTIME);\n    }\n\n    this.bedrockDocumentProcessingProps = props;\n    this.stateMachine = this.handleStateMachineCreation('bedrock-document-processing-workflow');\n  }\n\n  /**\n   * Validates the chunking configuration parameters.\n   *\n   * Ensures that:\n   * - Chunk size is greater than 0\n   * - Overlap is non-negative and less than chunk size\n   * - Thresholds are greater than 0\n   * - Max concurrency is greater than 0\n   * - Min success threshold is between 0 and 1\n   *\n   * @param config - The chunking configuration to validate\n   * @throws Error if any configuration parameter is invalid\n   */\n  private validateChunkingConfig(config: ChunkingConfig): void {\n    // Validate chunk size (for fixed-pages strategy)\n    if (config.chunkSize !== undefined) {\n      if (config.chunkSize <= 0) {\n        throw new Error('ChunkingConfig validation error: chunkSize must be greater than 0');\n      }\n    }\n\n    // Validate overlap pages (for fixed-pages strategy)\n    if (config.overlapPages !== undefined) {\n      if (config.overlapPages < 0) {\n        throw new Error('ChunkingConfig validation error: overlapPages must be non-negative');\n      }\n      const effectiveChunkSize = config.chunkSize || 50; // default chunk size\n      if (config.overlapPages >= effectiveChunkSize) {\n        throw new Error('ChunkingConfig validation error: overlapPages must be less than chunkSize');\n      }\n    }\n\n    // Validate page threshold\n    if (config.pageThreshold !== undefined && config.pageThreshold <= 0) {\n      throw new Error('ChunkingConfig validation error: pageThreshold must be greater than 0');\n    }\n\n    // Validate token threshold\n    if (config.tokenThreshold !== undefined && config.tokenThreshold <= 0) {\n      throw new Error('ChunkingConfig validation error: tokenThreshold must be greater than 0');\n    }\n\n    // Validate max tokens per chunk (for token-based strategy)\n    if (config.maxTokensPerChunk !== undefined && config.maxTokensPerChunk <= 0) {\n      throw new Error('ChunkingConfig validation error: maxTokensPerChunk must be greater than 0');\n    }\n\n    // Validate overlap tokens (for token-based and hybrid strategies)\n    if (config.overlapTokens !== undefined) {\n      if (config.overlapTokens < 0) {\n        throw new Error('ChunkingConfig validation error: overlapTokens must be non-negative');\n      }\n      const effectiveMaxTokens = config.maxTokensPerChunk || 100000; // default max tokens\n      if (config.overlapTokens >= effectiveMaxTokens) {\n        throw new Error('ChunkingConfig validation error: overlapTokens must be less than maxTokensPerChunk');\n      }\n    }\n\n    // Validate max pages per chunk (for hybrid strategy)\n    if (config.maxPagesPerChunk !== undefined && config.maxPagesPerChunk <= 0) {\n      throw new Error('ChunkingConfig validation error: maxPagesPerChunk must be greater than 0');\n    }\n\n    // Validate target tokens per chunk (for hybrid strategy)\n    if (config.targetTokensPerChunk !== undefined && config.targetTokensPerChunk <= 0) {\n      throw new Error('ChunkingConfig validation error: targetTokensPerChunk must be greater than 0');\n    }\n\n    // Validate max concurrency\n    if (config.maxConcurrency !== undefined && config.maxConcurrency <= 0) {\n      throw new Error('ChunkingConfig validation error: maxConcurrency must be greater than 0');\n    }\n\n    // Validate min success threshold\n    if (config.minSuccessThreshold !== undefined) {\n      if (config.minSuccessThreshold < 0 || config.minSuccessThreshold > 1) {\n        throw new Error('ChunkingConfig validation error: minSuccessThreshold must be between 0 and 1');\n      }\n    }\n  }\n\n  /**\n   * Implements the document classification step using Amazon Bedrock.\n   *\n   * Creates a Lambda function that invokes the configured Bedrock model to classify\n   * the document type. The function reads the document from S3 and sends it to\n   * Bedrock with the classification prompt.\n   *\n   * This method caches the Lambda function to avoid creating duplicate resources,\n   * but creates a new LambdaInvoke task each time to allow proper state chaining.\n   *\n   * @returns LambdaInvoke task configured for document classification\n   */\n  protected classificationStep(): DocumentProcessingStepType {\n    // Create Lambda function only once\n    if (!this._classificationFunction) {\n      const prompt = this.bedrockDocumentProcessingProps.classificationPrompt || BedrockDocumentProcessing.DEFAULT_CLASSIFICATION_PROMPT;\n      const adjustedModelId = BedrockModelUtils.deriveActualModelId(this.bedrockDocumentProcessingProps.classificationBedrockModel);\n      const role = this.generateLambdaRoleForBedrock('ClassificationLambdaRole', this.bedrockDocumentProcessingProps.classificationBedrockModel);\n      const { region, account } = Stack.of(this);\n      const generatedLogPermissions = LambdaIamUtils.createLogsPermissions({\n        account,\n        functionName: 'bedrock-idp-classification',\n        region,\n        scope: this,\n        enableObservability: this.bedrockDocumentProcessingProps.enableObservability,\n      });\n\n      this.encryptionKey.grantEncryptDecrypt(role);\n\n      this._classificationFunction = new PythonFunction(this, 'BedrockClassificationFunction', {\n        functionName: generatedLogPermissions.uniqueFunctionName,\n        architecture: Architecture.X86_64,\n        runtime: DefaultRuntimes.PYTHON,\n        entry: path.join(__dirname, 'resources/default-bedrock-invoke'),\n        role,\n        memorySize: 512,\n        timeout: this.bedrockDocumentProcessingProps.stepTimeouts || Duration.minutes(5),\n        environment: {\n          MODEL_ID: adjustedModelId,\n          PROMPT: prompt,\n          INVOKE_TYPE: 'classification',\n          ...PowertoolsConfig.generateDefaultLambdaConfig(\n            this.bedrockDocumentProcessingProps.enableObservability,\n            this.metricNamespace,\n            this.metricServiceName,\n          ),\n        },\n        environmentEncryption: this.encryptionKey,\n        vpc: this.bedrockDocumentProcessingProps.network\n          ? this.bedrockDocumentProcessingProps.network.vpc\n          : undefined,\n        vpcSubnets: this.bedrockDocumentProcessingProps.network\n          ? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection()\n          : undefined,\n      });\n\n      for (const statement of generatedLogPermissions.policyStatements) {\n        this._classificationFunction.role?.addToPrincipalPolicy(statement);\n      }\n\n      if (this.bedrockDocumentProcessingProps.network) {\n        this._classificationFunction.role?.addToPrincipalPolicy(LambdaIamUtils.generateLambdaVPCPermissions());\n      }\n    }\n\n    // Always create a new LambdaInvoke task to allow proper state chaining\n    const stepId = `ClassificationStep-${this._classificationStepCounter}`;\n    this._classificationStepCounter++;\n\n    return new LambdaInvoke(this, stepId, {\n      lambdaFunction: this._classificationFunction,\n      resultPath: '$.classificationResult',\n      resultSelector: {\n        'documentClassification.$': '$.Payload.documentClassification',\n      },\n    });\n  }\n\n  /**\n   * Implements the document extraction step using Amazon Bedrock.\n   *\n   * Creates a Lambda function that invokes the configured Bedrock model to extract\n   * structured data from the document. Uses the classification result from the\n   * previous step to provide context for more accurate extraction.\n   *\n   * This method caches the Lambda function to avoid creating duplicate resources,\n   * but creates a new LambdaInvoke task each time to allow proper state chaining.\n   *\n   * @returns LambdaInvoke task configured for document extraction\n   */\n  protected processingStep(): DocumentProcessingStepType {\n    // Create Lambda function only once\n    if (!this._processingFunction) {\n      const prompt = this.bedrockDocumentProcessingProps.processingPrompt || BedrockDocumentProcessing.DEFAULT_PROCESSING_PROMPT;\n      const adjustedModelId = BedrockModelUtils.deriveActualModelId(this.bedrockDocumentProcessingProps.processingBedrockModel);\n      const role = this.generateLambdaRoleForBedrock('ProcessingLambdaRole', this.bedrockDocumentProcessingProps.processingBedrockModel);\n      const { region, account } = Stack.of(this);\n\n      const generatedLogPermissions = LambdaIamUtils.createLogsPermissions({\n        account,\n        functionName: 'bedrock-idp-processing',\n        region,\n        scope: this,\n      });\n      this.encryptionKey.grantEncryptDecrypt(role);\n      this._processingFunction = new PythonFunction(this, 'BedrockExtractionFunction', {\n        functionName: generatedLogPermissions.uniqueFunctionName,\n        runtime: DefaultRuntimes.PYTHON,\n        architecture: Architecture.X86_64,\n        entry: path.join(__dirname, 'resources/default-bedrock-invoke'),\n        role,\n        memorySize: 512,\n        timeout: this.bedrockDocumentProcessingProps.stepTimeouts || Duration.minutes(5),\n        environment: {\n          MODEL_ID: adjustedModelId,\n          PROMPT: prompt,\n          INVOKE_TYPE: 'processing',\n          ...PowertoolsConfig.generateDefaultLambdaConfig(\n            this.bedrockDocumentProcessingProps.enableObservability,\n            this.metricNamespace,\n            this.metricServiceName,\n          ),\n        },\n        environmentEncryption: this.encryptionKey,\n        vpc: this.bedrockDocumentProcessingProps.network\n          ? this.bedrockDocumentProcessingProps.network.vpc\n          : undefined,\n        vpcSubnets: this.bedrockDocumentProcessingProps.network\n          ? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection()\n          : undefined,\n      });\n\n      for (const statement of generatedLogPermissions.policyStatements) {\n        this._processingFunction.role?.addToPrincipalPolicy(statement);\n      }\n\n      if (this.bedrockDocumentProcessingProps.network) {\n        this._processingFunction.role?.addToPrincipalPolicy(LambdaIamUtils.generateLambdaVPCPermissions());\n      }\n    }\n\n    // Always create a new LambdaInvoke task to allow proper state chaining\n    const stepId = `ProcessingStep-${this._processingStepCounter}`;\n    this._processingStepCounter++;\n\n    return new LambdaInvoke(this, stepId, {\n      lambdaFunction: this._processingFunction,\n      resultPath: '$.processingResult',\n      resultSelector: {\n        'documentClassification.$': '$.Payload.documentClassification',\n        'result.$': '$.Payload.result',\n      },\n    });\n  }\n\n  protected generateLambdaRoleForBedrock(id: string, model?: BedrockModelProps) {\n    return new Role(this, id, {\n      assumedBy: new ServicePrincipal('lambda.amazonaws.com'),\n      inlinePolicies: {\n        BedrockInvokePolicy: new PolicyDocument({\n          statements: [\n            // S3 read-only access for document retrieval - least privilege\n            ...this.ingressAdapter.generateAdapterIAMPolicies(),\n            BedrockModelUtils.generateModelIAMPermissions(this, model),\n          ],\n        }),\n      },\n    });\n  }\n\n  /**\n   * Implements the optional document enrichment step.\n   *\n   * If an enrichment Lambda function is provided in the props, creates a LambdaInvoke\n   * task to perform additional processing on the extracted data. This step is useful\n   * for data validation, transformation, or integration with external systems.\n   *\n   * @returns LambdaInvoke task for enrichment, or undefined to skip this step\n   */\n  protected enrichmentStep(): DocumentProcessingStepType | undefined {\n    if (!this.bedrockDocumentProcessingProps.enrichmentLambdaFunction) {\n      return undefined;\n    }\n\n    const stepId = `EnrichmentStep-${this._enrichmentStepCounter}`;\n    this._enrichmentStepCounter++;\n\n    return new LambdaInvoke(this, stepId, {\n      lambdaFunction: this.bedrockDocumentProcessingProps.enrichmentLambdaFunction,\n      resultPath: '$.enrichedResult',\n      outputPath: '$',\n      payloadResponseOnly: true,\n    });\n  }\n\n  /**\n   * Implements the optional post-processing step.\n   *\n   * If a post-processing Lambda function is provided in the props, creates a LambdaInvoke\n   * task to perform final processing on the workflow results. This step is useful for\n   * data formatting, notifications, or integration with downstream systems.\n   *\n   * @returns LambdaInvoke task for post-processing, or undefined to skip this step\n   */\n  protected postProcessingStep(): DocumentProcessingStepType | undefined {\n    if (!this.bedrockDocumentProcessingProps.postProcessingLambdaFunction) {\n      return undefined;\n    }\n\n    const stepId = `PostProcessingStep-${this._postProcessingStepCounter}`;\n    this._postProcessingStepCounter++;\n\n    return new LambdaInvoke(this, stepId, {\n      lambdaFunction: this.bedrockDocumentProcessingProps.postProcessingLambdaFunction,\n      resultPath: '$.postProcessedResult',\n      outputPath: '$',\n      payloadResponseOnly: true,\n    });\n  }\n\n\n  /**\n   * Implements the optional preprocessing step for PDF chunking.\n   *\n   * When chunking is enabled, creates a Lambda function that analyzes PDFs and\n   * splits large documents into manageable chunks. The function:\n   * 1. Analyzes the PDF to determine page count and token estimates\n   * 2. Decides if chunking is needed based on configured thresholds\n   * 3. If chunking is needed, splits the PDF and uploads chunks to S3\n   *\n   * @returns LambdaInvoke task for PDF analysis and chunking, or undefined if chunking is disabled\n   */\n  protected preprocessingStep(): DocumentProcessingStepType | undefined {\n    // Only enable chunking if explicitly configured\n    if (!this.bedrockDocumentProcessingProps.enableChunking) {\n      return undefined;\n    }\n\n    const { region, account } = Stack.of(this);\n    const chunkingConfig = this.bedrockDocumentProcessingProps.chunkingConfig || {};\n\n    // Create IAM role for chunking Lambda with least privilege permissions\n    // Chunking Lambda needs: GetObject (read raw PDFs), PutObject (write chunks)\n    const role = new Role(this, 'ChunkingLambdaRole', {\n      assumedBy: new ServicePrincipal('lambda.amazonaws.com'),\n      inlinePolicies: {\n        ChunkingPolicy: new PolicyDocument({\n          statements: [\n            ...this.ingressAdapter.generateAdapterIAMPolicies(),\n          ],\n        }),\n      },\n    });\n\n    const generatedLogPermissions = LambdaIamUtils.createLogsPermissions({\n      account,\n      functionName: 'bedrock-idp-chunking',\n      region,\n      scope: this,\n      enableObservability: this.bedrockDocumentProcessingProps.enableObservability,\n    });\n\n    this.encryptionKey.grantEncryptDecrypt(role);\n\n    // Create PDF Analysis & Chunking Lambda\n    const chunkingLambda = new PythonFunction(this, 'PDFChunkingFunction', {\n      functionName: generatedLogPermissions.uniqueFunctionName,\n      entry: path.join(__dirname, 'resources/pdf-chunking'),\n      index: 'handler.py',\n      handler: 'handler',\n      runtime: DefaultRuntimes.PYTHON,\n      architecture: Architecture.X86_64,\n      role,\n      memorySize: 2048,\n      timeout: Duration.minutes(10),\n      environment: {\n        CHUNKING_STRATEGY: chunkingConfig.strategy || 'hybrid',\n        PAGE_THRESHOLD: String(chunkingConfig.pageThreshold || 100),\n        TOKEN_THRESHOLD: String(chunkingConfig.tokenThreshold || 150000),\n        CHUNK_SIZE: String(chunkingConfig.chunkSize || 50),\n        OVERLAP_PAGES: String(chunkingConfig.overlapPages || 5),\n        MAX_TOKENS_PER_CHUNK: String(chunkingConfig.maxTokensPerChunk || 100000),\n        OVERLAP_TOKENS: String(chunkingConfig.overlapTokens || 5000),\n        TARGET_TOKENS_PER_CHUNK: String(chunkingConfig.targetTokensPerChunk || 80000),\n        MAX_PAGES_PER_CHUNK: String(chunkingConfig.maxPagesPerChunk || 99),\n        ...PowertoolsConfig.generateDefaultLambdaConfig(\n          this.bedrockDocumentProcessingProps.enableObservability,\n          this.metricNamespace,\n          this.metricServiceName,\n        ),\n      },\n      environmentEncryption: this.encryptionKey,\n      vpc: this.bedrockDocumentProcessingProps.network\n        ? this.bedrockDocumentProcessingProps.network.vpc\n        : undefined,\n      vpcSubnets: this.bedrockDocumentProcessingProps.network\n        ? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection()\n        : undefined,\n    });\n\n    for (const statement of generatedLogPermissions.policyStatements) {\n      chunkingLambda.role?.addToPrincipalPolicy(statement);\n    }\n\n    if (this.bedrockDocumentProcessingProps.network) {\n      chunkingLambda.role?.addToPrincipalPolicy(LambdaIamUtils.generateLambdaVPCPermissions());\n    }\n\n    return new LambdaInvoke(this, 'PDFAnalysisAndChunking', {\n      lambdaFunction: chunkingLambda,\n      resultPath: '$.chunkingResult',\n      resultSelector: {\n        'requiresChunking.$': '$.Payload.requiresChunking',\n        'tokenAnalysis.$': '$.Payload.tokenAnalysis',\n        'strategy.$': '$.Payload.strategy',\n        'chunks.$': '$.Payload.chunks',\n      },\n    });\n  }\n\n  /**\n   * Provides additional metadata fields for chunking to be stored in DynamoDB.\n   *\n   * When chunking is enabled, adds fields for:\n   * - ChunkingEnabled: string representation of boolean flag\n   * - ChunkingStrategy: strategy used (fixed-pages, token-based, hybrid)\n   * - TokenAnalysis: JSON string with token analysis results\n   * - ChunkMetadata: JSON string array with chunk information\n   *\n   * @returns Record of DynamoDB attribute values for chunking metadata\n   */\n  protected preprocessingMetadata(): Record<string, DynamoAttributeValue> {\n    if (!this.bedrockDocumentProcessingProps.enableChunking) {\n      return {};\n    }\n\n    return {\n      ChunkingEnabled: DynamoAttributeValue.fromString(\n        JsonPath.stringAt('States.Format(\\'{}\\', $.chunkingResult.requiresChunking)'),\n      ),\n      ChunkingStrategy: DynamoAttributeValue.fromString(\n        JsonPath.stringAt('$.chunkingResult.strategy'),\n      ),\n      TokenAnalysis: DynamoAttributeValue.fromString(\n        JsonPath.jsonToString(JsonPath.objectAt('$.chunkingResult.tokenAnalysis')),\n      ),\n      ChunkMetadata: DynamoAttributeValue.fromString(\n        JsonPath.jsonToString(JsonPath.objectAt('$.chunkingResult.chunks')),\n      ),\n    };\n  }\n\n  /**\n   * Creates the processing workflow with conditional branching for chunked documents.\n   *\n   * When chunking is enabled, creates a Choice State that:\n   * - Routes to chunked processing flow if document was chunked\n   * - Routes to standard processing flow if document was not chunked\n   *\n   * When chunking is disabled, returns the standard processing workflow.\n   *\n   * @returns Step Functions chain for processing the document\n   */\n  protected createProcessingWorkflow(): IChainable {\n    // If chunking is not enabled, use standard workflow\n    if (!this.bedrockDocumentProcessingProps.enableChunking) {\n      return this.createStandardProcessingWorkflow();\n    }\n\n    // Create Choice State to check if chunking was applied\n    const choiceState = new Choice(this, 'CheckIfChunked');\n\n    choiceState\n      .when(\n        Condition.booleanEquals('$.chunkingResult.requiresChunking', true),\n        this.createChunkedProcessingFlow(),\n      )\n      .otherwise(\n        // Pass 'Standard' prefix to avoid construct ID collisions with chunked flow\n        this.createStandardProcessingWorkflow('Standard'),\n      );\n\n    return choiceState;\n  }\n\n\n  /**\n   * Creates the chunked processing flow for large documents.\n   *\n   * This flow:\n   * 1. Uses a Map State to process each chunk in parallel (or sequentially)\n   * 2. Each chunk goes through classification and processing\n   * 3. Results are aggregated using the aggregation Lambda\n   * 4. DynamoDB is updated with the aggregated result\n   * 5. Temporary chunks are cleaned up from S3\n   *\n   * @returns Step Functions chain for chunked document processing\n   */\n  private createChunkedProcessingFlow(): IChainable {\n    const chunkingConfig = this.bedrockDocumentProcessingProps.chunkingConfig || {};\n    const maxConcurrency = chunkingConfig.processingMode === 'sequential'\n      ? 1\n      : (chunkingConfig.maxConcurrency || 10);\n\n    // Create Map State for processing chunks\n    const mapState = new Map(this, 'ProcessChunks', {\n      itemsPath: '$.chunkingResult.chunks',\n      maxConcurrency,\n      parameters: {\n        'documentId.$': '$.documentId',\n        'chunk.$': '$$.Map.Item.Value',\n        'chunkIndex.$': '$$.Map.Item.Index',\n        'totalChunks.$': 'States.ArrayLength($.chunkingResult.chunks)',\n        // Override content to point to the chunk PDF, not the original document\n        'content': {\n          'location': 's3',\n          'bucket.$': '$$.Map.Item.Value.bucket',\n          'key.$': '$$.Map.Item.Value.key',\n          'filename.$': '$.content.filename',\n        },\n        'contentType.$': '$.contentType',\n      },\n      resultPath: '$.chunkResults',\n    });\n\n    // Define per-chunk processing: classification → processing\n    const chunkClassification = this.classificationStep();\n    const chunkProcessing = this.processingStep();\n\n    mapState.itemProcessor(\n      chunkClassification.next(chunkProcessing),\n    );\n\n    // Create aggregation step (Lambda invoke only, normalization added separately)\n    const aggregationLambdaStep = this.createAggregationStep();\n\n    // Add a Pass state to normalize the aggregated result for downstream compatibility\n    // This copies aggregatedResult to processingResult so enrichment/post-processing\n    // see a consistent structure regardless of whether chunking was used\n    const normalizeState = new Pass(this, 'NormalizeAggregatedResult', {\n      parameters: {\n        'documentId.$': '$.documentId',\n        'contentType.$': '$.contentType',\n        'content.$': '$.content',\n        'chunkingResult.$': '$.chunkingResult',\n        'chunkResults.$': '$.chunkResults',\n        'aggregatedResult.$': '$.aggregatedResult',\n        // Copy aggregated result to processingResult for downstream compatibility\n        'processingResult': {\n          'result.$': '$.aggregatedResult.result',\n        },\n        // Also set classificationResult from the first successful chunk for consistency\n        'classificationResult.$': '$.chunkResults[0].classificationResult',\n      },\n    });\n\n    // Create DynamoDB update step for aggregated result\n    const updateAggregatedResultStep = this.createUpdateAggregatedResultStep();\n\n    // Create cleanup step\n    const cleanupStep = this.createCleanupStep();\n\n    // Create move to processed chain with 'Chunked' prefix to avoid ID collisions\n    const moveToProcessed = this.ingressAdapter.createSuccessChain(this, 'Chunked');\n\n    // Create error handler for aggregation failures\n    const aggregationErrorHandler = this.createAggregationErrorHandler();\n\n    // Get optional enrichment and post-processing steps\n    const enrichmentStep = this.enrichmentStep();\n    const postProcessingStep = this.postProcessingStep();\n\n    // Build the final chain after aggregation\n    // Chain: Map State → Aggregation → DynamoDB Update → [Enrichment] → [PostProcessing] → Cleanup → Move to Processed\n    let finalChain: IChainable = cleanupStep\n      .addRetry({\n        errors: ['Lambda.ServiceException', 'Lambda.TooManyRequestsException'],\n        interval: Duration.seconds(2),\n        maxAttempts: 3,\n        backoffRate: 2,\n      })\n      .next(moveToProcessed);\n\n    // Add post-processing if provided (insert before cleanup)\n    if (postProcessingStep) {\n      const postProcessingErrorHandler = new DynamoUpdateItem(this, 'ChunkedPostProcessingFailDDBUpdate', {\n        table: this.documentProcessingTable,\n        key: {\n          DocumentId: DynamoAttributeValue.fromString(JsonPath.stringAt('$.documentId')),\n        },\n        updateExpression: 'SET WorkflowStatus = :newStatus',\n        expressionAttributeValues: {\n          ':newStatus': DynamoAttributeValue.fromString('post-processing-failure'),\n        },\n        resultPath: JsonPath.DISCARD,\n      }).next(this.ingressAdapter.createFailedChain(this, 'ChunkedPostProc'));\n\n      finalChain = postProcessingStep\n        .addCatch(postProcessingErrorHandler, {\n          resultPath: JsonPath.DISCARD,\n        })\n        .next(\n          new DynamoUpdateItem(this, 'ChunkedPostProcessingSuccessUpdate', {\n            table: this.documentProcessingTable,\n            key: {\n              DocumentId: DynamoAttributeValue.fromString(JsonPath.stringAt('$.documentId')),\n            },\n            updateExpression: 'SET WorkflowStatus = :newStatus, PostProcessingResult = :postProcessingResult',\n            expressionAttributeValues: {\n              ':newStatus': DynamoAttributeValue.fromString('post-processing-complete'),\n              ':postProcessingResult': DynamoAttributeValue.fromString(JsonPath.jsonToString(JsonPath.objectAt('$.postProcessedResult'))),\n            },\n            resultPath: JsonPath.DISCARD,\n          }).next(finalChain),\n        );\n    }\n\n    // Add enrichment if provided (insert before post-processing or cleanup)\n    if (enrichmentStep) {\n      const enrichmentErrorHandler = new DynamoUpdateItem(this, 'ChunkedEnrichmentFailDDBUpdate', {\n        table: this.documentProcessingTable,\n        key: {\n          DocumentId: DynamoAttributeValue.fromString(JsonPath.stringAt('$.documentId')),\n        },\n        updateExpression: 'SET WorkflowStatus = :newStatus',\n        expressionAttributeValues: {\n          ':newStatus': DynamoAttributeValue.fromString('enrichment-failure'),\n        },\n        resultPath: JsonPath.DISCARD,\n      }).next(this.ingressAdapter.createFailedChain(this, 'ChunkedEnrich'));\n\n      finalChain = enrichmentStep\n        .addCatch(enrichmentErrorHandler, {\n          resultPath: JsonPath.DISCARD,\n        })\n        .next(\n          new DynamoUpdateItem(this, 'ChunkedEnrichmentSuccessUpdate', {\n            table: this.documentProcessingTable,\n            key: {\n              DocumentId: DynamoAttributeValue.fromString(JsonPath.stringAt('$.documentId')),\n            },\n            updateExpression: 'SET WorkflowStatus = :newStatus, EnrichmentResult = :enrichmentResult',\n            expressionAttributeValues: {\n              ':newStatus': postProcessingStep\n                ? DynamoAttributeValue.fromString('enrichment-complete')\n                : DynamoAttributeValue.fromString('complete'),\n              ':enrichmentResult': DynamoAttributeValue.fromString(JsonPath.jsonToString(JsonPath.objectAt('$.enrichedResult'))),\n            },\n            resultPath: JsonPath.DISCARD,\n          }).next(finalChain),\n        );\n    }\n\n    // Chain: Map State → Aggregation → Normalize → DynamoDB Update → [Enrichment] → [PostProcessing] → Cleanup → Move to Processed\n    return mapState\n      .addCatch(aggregationErrorHandler, {\n        resultPath: '$.error',\n      })\n      .next(\n        aggregationLambdaStep\n          .addCatch(aggregationErrorHandler, {\n            resultPath: '$.error',\n          })\n          .addRetry({\n            errors: ['Lambda.ServiceException', 'Lambda.TooManyRequestsException'],\n            interval: Duration.seconds(2),\n            maxAttempts: 3,\n            backoffRate: 2,\n          })\n          .next(\n            normalizeState.next(\n              updateAggregatedResultStep\n                .addRetry({\n                  errors: ['DynamoDB.ProvisionedThroughputExceededException'],\n                  interval: Duration.seconds(1),\n                  maxAttempts: 3,\n                  backoffRate: 2,\n                })\n                .next(finalChain),\n            ),\n          ),\n      );\n  }\n\n  /**\n   * Creates the aggregation step for combining chunk results using Bedrock.\n   *\n   * Uses the same Bedrock invoke Lambda pattern as the processing step but with\n   * a different prompt designed for aggregating multiple chunk results.\n   * The chunk processing results are passed as text data to the model.\n   *\n   * @returns LambdaInvoke task for result aggregation\n   */\n  private createAggregationStep(): LambdaInvoke {\n    // Create Lambda function only once (reuses bedrock-invoke pattern)\n    if (!this._aggregationFunction) {\n      const prompt = this.bedrockDocumentProcessingProps.aggregationPrompt || BedrockDocumentProcessing.DEFAULT_AGGREGATION_PROMPT;\n      const adjustedModelId = BedrockModelUtils.deriveActualModelId(this.bedrockDocumentProcessingProps.processingBedrockModel);\n      const role = this.generateLambdaRoleForBedrock('AggregationLambdaRole', this.bedrockDocumentProcessingProps.processingBedrockModel);\n      const { region, account } = Stack.of(this);\n\n      const generatedLogPermissions = LambdaIamUtils.createLogsPermissions({\n        account,\n        functionName: 'bedrock-idp-aggregation',\n        region,\n        scope: this,\n        enableObservability: this.bedrockDocumentProcessingProps.enableObservability,\n      });\n\n      this.encryptionKey.grantEncryptDecrypt(role);\n\n      this._aggregationFunction = new PythonFunction(this, 'BedrockAggregationFunction', {\n        functionName: generatedLogPermissions.uniqueFunctionName,\n        architecture: Architecture.X86_64,\n        runtime: DefaultRuntimes.PYTHON,\n        entry: path.join(__dirname, 'resources/default-bedrock-invoke'),\n        role,\n        memorySize: 1024,\n        timeout: this.bedrockDocumentProcessingProps.stepTimeouts || Duration.minutes(5),\n        environment: {\n          MODEL_ID: adjustedModelId,\n          PROMPT: prompt,\n          INVOKE_TYPE: 'aggregation',\n          INVOKE_MAX_TOKENS: '64000', // Aggregation may need more tokens for merged output\n          ...PowertoolsConfig.generateDefaultLambdaConfig(\n            this.bedrockDocumentProcessingProps.enableObservability,\n            this.metricNamespace,\n            this.metricServiceName,\n          ),\n        },\n        environmentEncryption: this.encryptionKey,\n        vpc: this.bedrockDocumentProcessingProps.network\n          ? this.bedrockDocumentProcessingProps.network.vpc\n          : undefined,\n        vpcSubnets: this.bedrockDocumentProcessingProps.network\n          ? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection()\n          : undefined,\n      });\n\n      for (const statement of generatedLogPermissions.policyStatements) {\n        this._aggregationFunction.role?.addToPrincipalPolicy(statement);\n      }\n\n      if (this.bedrockDocumentProcessingProps.network) {\n        this._aggregationFunction.role?.addToPrincipalPolicy(LambdaIamUtils.generateLambdaVPCPermissions());\n      }\n    }\n\n    // Always create a new LambdaInvoke task to allow proper state chaining\n    const stepId = `AggregationStep-${this._aggregationStepCounter}`;\n    this._aggregationStepCounter++;\n\n    // Pass chunk results as data content - the Lambda will format them for Bedrock\n    return new LambdaInvoke(this, stepId, {\n      lambdaFunction: this._aggregationFunction,\n      payload: TaskInput.fromObject({\n        'documentId.$': '$.documentId',\n        'contentType': 'data',\n        'content': {\n          // Pass the chunk results as JSON string for the Lambda to process\n          'data.$': 'States.JsonToString($.chunkResults)',\n        },\n      }),\n      // Store in both aggregatedResult AND processingResult for consistency with non-chunked flow\n      // This allows enrichment/post-processing steps to use $.processingResult regardless of chunking\n      resultPath: '$.aggregatedResult',\n      resultSelector: {\n        'result.$': '$.Payload.result',\n      },\n    });\n  }\n\n  /**\n   * Creates the DynamoDB update step for storing aggregated results.\n   *\n   * Updates the document record with:\n   * - AggregatedResult: JSON string with classification, entities, and summary\n   * - WorkflowStatus: 'complete'\n   *\n   * @returns DynamoUpdateItem task for storing aggregated results\n   */\n  private createUpdateAggregatedResultStep(): DynamoUpdateItem {\n    return new DynamoUpdateItem(this, 'StoreAggregatedResult', {\n      table: this.documentProcessingTable,\n      key: {\n        DocumentId: DynamoAttributeValue.fromString(JsonPath.stringAt('$.documentId')),\n      },\n      updateExpression: 'SET AggregatedResult = :result, WorkflowStatus = :status',\n      expressionAttributeValues: {\n        ':result': DynamoAttributeValue.fromString(\n          JsonPath.jsonToString(JsonPath.objectAt('$.aggregatedResult')),\n        ),\n        ':status': DynamoAttributeValue.fromString('complete'),\n      },\n      resultPath: JsonPath.DISCARD,\n    });\n  }\n\n  /**\n   * Creates the cleanup Lambda step for removing temporary chunk files.\n   *\n   * The cleanup Lambda:\n   * - Deletes all chunk files from S3 chunks/ prefix\n   * - Uses batch delete for efficiency (up to 1000 objects per request)\n   * - Logs errors but doesn't fail the workflow\n   *\n   * @returns LambdaInvoke task for chunk cleanup\n   */\n  private createCleanupStep(): LambdaInvoke {\n    // Create Lambda function only once\n    if (!this._cleanupFunction) {\n      const { region, account } = Stack.of(this);\n\n      const role = new Role(this, 'CleanupLambdaRole', {\n        assumedBy: new ServicePrincipal('lambda.amazonaws.com'),\n        inlinePolicies: {\n          CleanupPolicy: new PolicyDocument({\n            statements: [\n              // S3 access for deleting chunks only - least privilege\n              ...this.ingressAdapter.generateAdapterIAMPolicies(['s3:DeleteObject'], true),\n            ],\n          }),\n        },\n      });\n\n      const generatedLogPermissions = LambdaIamUtils.createLogsPermissions({\n        account,\n        functionName: 'bedrock-idp-cleanup',\n        region,\n        scope: this,\n        enableObservability: this.bedrockDocumentProcessingProps.enableObservability,\n      });\n\n      this.encryptionKey.grantEncryptDecrypt(role);\n\n      this._cleanupFunction = new PythonFunction(this, 'CleanupFunction', {\n        functionName: generatedLogPermissions.uniqueFunctionName,\n        entry: path.join(__dirname, 'resources/cleanup'),\n        index: 'handler.py',\n        handler: 'handler',\n        runtime: DefaultRuntimes.PYTHON,\n        architecture: Architecture.X86_64,\n        role,\n        memorySize: 512,\n        timeout: Duration.minutes(5),\n        environment: {\n          ...PowertoolsConfig.generateDefaultLambdaConfig(\n            this.bedrockDocumentProcessingProps.enableObservability,\n            this.metricNamespace,\n            this.metricServiceName,\n          ),\n        },\n        environmentEncryption: this.encryptionKey,\n        vpc: this.bedrockDocumentProcessingProps.network\n          ? this.bedrockDocumentProcessingProps.network.vpc\n          : undefined,\n        vpcSubnets: this.bedrockDocumentProcessingProps.network\n          ? this.bedrockDocumentProcessingProps.network.applicationSubnetSelection()\n          : undefined,\n      });\n\n      for (const statement of generatedLogPermissions.policyStatements) {\n        this._cleanupFunction.role?.addToPrincipalPolicy(statement);\n      }\n\n      if (this.bedrockDocumentProcessingProps.network) {\n        this._cleanupFunction.role?.addToPrincipalPolicy(LambdaIamUtils.generateLambdaVPCPermissions());\n      }\n    }\n\n    return new LambdaInvoke(this, 'CleanupChunks', {\n      lambdaFunction: this._cleanupFunction,\n      payload: TaskInput.fromObject({\n        'documentId.$': '$.documentId',\n        'chunks.$': '$.chunkingResult.chunks',\n      }),\n      resultPath: JsonPath.DISCARD,\n    });\n  }\n\n  /**\n   * Creates the error handler for aggregation failures.\n   *\n   * When aggregation fails:\n   * - Updates DynamoDB with 'aggregation-failure' status\n   * - Moves document to failed/ prefix\n   *\n   * @returns Step Functions chain for handling aggregation errors\n   */\n  private createAggregationErrorHandler(): IChainable {\n    const updateFailureStatus = new DynamoUpdateItem(this, 'AggregationFailDDBUpdate', {\n      table: this.documentProcessingTable,\n      key: {\n        DocumentId: DynamoAttributeValue.fromString(JsonPath.stringAt('$.documentId')),\n      },\n      updateExpression: 'SET WorkflowStatus = :newStatus',\n      expressionAttributeValues: {\n        ':newStatus': DynamoAttributeValue.fromString('aggregation-failure'),\n      },\n      resultPath: JsonPath.DISCARD,\n    });\n\n    // Use 'Chunked' prefix to avoid ID collisions with standard workflow\n    const moveToFailed = this.ingressAdapter.createFailedChain(this, 'Chunked');\n\n    return updateFailureStatus.next(moveToFailed);\n  }\n}\n"]}
|