cdk-nuxt 2.0.0 → 2.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +45 -19
- package/index.d.ts +2 -1
- package/index.js +3 -3
- package/lib/cli/deploy-server.js +33 -5
- package/lib/cli/destroy-server.js +13 -0
- package/lib/functions/access-logs-analysis/group-by-date/.gitignore +2 -0
- package/lib/functions/access-logs-analysis/group-by-date/build/app/index.d.ts +2 -0
- package/lib/functions/access-logs-analysis/group-by-date/build/app/index.js +57 -0
- package/lib/functions/access-logs-analysis/group-by-date/build/app/index.js.map +1 -0
- package/lib/functions/access-logs-analysis/group-by-date/index.d.ts +2 -0
- package/lib/functions/access-logs-analysis/group-by-date/index.js +57 -0
- package/lib/functions/access-logs-analysis/group-by-date/index.ts +64 -0
- package/lib/functions/access-logs-analysis/group-by-date/package.json +20 -0
- package/lib/functions/access-logs-analysis/group-by-date/tsconfig.json +33 -0
- package/lib/functions/access-logs-analysis/group-by-date/yarn.lock +1203 -0
- package/lib/functions/access-logs-analysis/partitioning/.gitignore +2 -0
- package/lib/functions/access-logs-analysis/partitioning/build/app/create-partition.d.ts +1 -0
- package/lib/functions/access-logs-analysis/partitioning/build/app/create-partition.js +57 -0
- package/lib/functions/access-logs-analysis/partitioning/build/app/create-partition.js.map +1 -0
- package/lib/functions/access-logs-analysis/partitioning/build/app/transform-partition.d.ts +2 -0
- package/lib/functions/access-logs-analysis/partitioning/build/app/transform-partition.js +72 -0
- package/lib/functions/access-logs-analysis/partitioning/build/app/transform-partition.js.map +1 -0
- package/lib/functions/access-logs-analysis/partitioning/build/app/types.d.ts +7 -0
- package/lib/functions/access-logs-analysis/partitioning/build/app/types.js +3 -0
- package/lib/functions/access-logs-analysis/partitioning/build/app/types.js.map +1 -0
- package/lib/functions/access-logs-analysis/partitioning/build/app/util.d.ts +9 -0
- package/lib/functions/access-logs-analysis/partitioning/build/app/util.js +44 -0
- package/lib/functions/access-logs-analysis/partitioning/build/app/util.js.map +1 -0
- package/lib/functions/access-logs-analysis/partitioning/create-partition.d.ts +1 -0
- package/lib/functions/access-logs-analysis/partitioning/create-partition.js +57 -0
- package/lib/functions/access-logs-analysis/partitioning/create-partition.ts +58 -0
- package/lib/functions/access-logs-analysis/partitioning/package.json +20 -0
- package/lib/functions/access-logs-analysis/partitioning/transform-partition.d.ts +2 -0
- package/lib/functions/access-logs-analysis/partitioning/transform-partition.js +72 -0
- package/lib/functions/access-logs-analysis/partitioning/transform-partition.ts +83 -0
- package/lib/functions/access-logs-analysis/partitioning/tsconfig.json +33 -0
- package/lib/functions/access-logs-analysis/partitioning/types.d.ts +7 -0
- package/lib/functions/access-logs-analysis/partitioning/types.js +3 -0
- package/lib/functions/access-logs-analysis/partitioning/types.ts +8 -0
- package/lib/functions/access-logs-analysis/partitioning/util.d.ts +9 -0
- package/lib/functions/access-logs-analysis/partitioning/util.js +44 -0
- package/lib/functions/access-logs-analysis/partitioning/util.ts +52 -0
- package/lib/functions/access-logs-analysis/partitioning/yarn.lock +951 -0
- package/lib/functions/assets-cleanup/build/app/index.js +1 -1
- package/lib/functions/assets-cleanup/build/app/index.js.map +1 -1
- package/lib/functions/assets-cleanup/index.js +2 -2
- package/lib/functions/assets-cleanup/index.ts +2 -2
- package/lib/stack/NuxtAppStackProps.js +3 -0
- package/lib/stack/{nuxt-app-static-assets.d.ts → NuxtAppStaticAssets.d.ts} +9 -4
- package/lib/stack/NuxtAppStaticAssets.js +71 -0
- package/lib/stack/{nuxt-app-static-assets.ts → NuxtAppStaticAssets.ts} +31 -24
- package/lib/stack/access-logs-analysis/AccessLogsAnalysis.d.ts +66 -0
- package/lib/stack/access-logs-analysis/AccessLogsAnalysis.js +270 -0
- package/lib/stack/access-logs-analysis/AccessLogsAnalysis.ts +330 -0
- package/lib/stack/access-logs-analysis/AccessLogsAnalysisProps.d.ts +21 -0
- package/lib/stack/access-logs-analysis/AccessLogsAnalysisProps.js +3 -0
- package/lib/stack/access-logs-analysis/AccessLogsAnalysisProps.ts +26 -0
- package/lib/stack/access-logs-analysis/AccessLogsParquetTable.d.ts +9 -0
- package/lib/stack/access-logs-analysis/AccessLogsParquetTable.js +25 -0
- package/lib/stack/access-logs-analysis/AccessLogsParquetTable.ts +23 -0
- package/lib/stack/access-logs-analysis/AccessLogsTableConfig.d.ts +8 -0
- package/lib/stack/access-logs-analysis/AccessLogsTableConfig.js +167 -0
- package/lib/stack/access-logs-analysis/AccessLogsTableConfig.ts +164 -0
- package/lib/stack/access-logs-analysis/AccessLogsTableProps.d.ts +7 -0
- package/lib/stack/access-logs-analysis/AccessLogsTableProps.js +3 -0
- package/lib/stack/access-logs-analysis/AccessLogsTableProps.ts +8 -0
- package/lib/stack/access-logs-analysis/CloudFrontAccessLogsAnalysis.d.ts +36 -0
- package/lib/stack/access-logs-analysis/CloudFrontAccessLogsAnalysis.js +60 -0
- package/lib/stack/access-logs-analysis/CloudFrontAccessLogsAnalysis.ts +73 -0
- package/lib/stack/access-logs-analysis/CloudFrontAccessLogsByDateTable.d.ts +9 -0
- package/lib/stack/access-logs-analysis/CloudFrontAccessLogsByDateTable.js +37 -0
- package/lib/stack/access-logs-analysis/CloudFrontAccessLogsByDateTable.ts +44 -0
- package/lib/stack/server/{nuxt-server-app-stack.d.ts → NuxtServerAppStack.d.ts} +13 -75
- package/lib/stack/server/NuxtServerAppStack.js +483 -0
- package/lib/stack/server/{nuxt-server-app-stack.ts → NuxtServerAppStack.ts} +53 -91
- package/lib/stack/server/NuxtServerAppStackProps.d.ts +80 -0
- package/lib/stack/server/NuxtServerAppStackProps.js +3 -0
- package/lib/stack/server/NuxtServerAppStackProps.ts +94 -0
- package/lib/templates/stack-index-server.ts +108 -15
- package/package.json +3 -1
- package/lib/stack/nuxt-app-stack-props.js +0 -3
- package/lib/stack/nuxt-app-static-assets.js +0 -72
- package/lib/stack/server/nuxt-server-app-stack.js +0 -447
- /package/lib/stack/{nuxt-app-stack-props.d.ts → NuxtAppStackProps.d.ts} +0 -0
- /package/lib/stack/{nuxt-app-stack-props.ts → NuxtAppStackProps.ts} +0 -0
|
@@ -0,0 +1,270 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
|
3
|
+
exports.AccessLogsAnalysis = void 0;
|
|
4
|
+
const aws_s3_1 = require("aws-cdk-lib/aws-s3");
|
|
5
|
+
const constructs_1 = require("constructs");
|
|
6
|
+
const aws_athena_1 = require("aws-cdk-lib/aws-athena");
|
|
7
|
+
const aws_lambda_1 = require("aws-cdk-lib/aws-lambda");
|
|
8
|
+
const aws_events_1 = require("aws-cdk-lib/aws-events");
|
|
9
|
+
const aws_cdk_lib_1 = require("aws-cdk-lib");
|
|
10
|
+
const aws_glue_alpha_1 = require("@aws-cdk/aws-glue-alpha");
|
|
11
|
+
const aws_lambda_event_sources_1 = require("aws-cdk-lib/aws-lambda-event-sources");
|
|
12
|
+
const aws_logs_1 = require("aws-cdk-lib/aws-logs");
|
|
13
|
+
const aws_iam_1 = require("aws-cdk-lib/aws-iam");
|
|
14
|
+
const aws_events_targets_1 = require("aws-cdk-lib/aws-events-targets");
|
|
15
|
+
const path = require("path");
|
|
16
|
+
/**
|
|
17
|
+
* Provides the AWS resources to analyze access logs. This construct is derived from the official AWS sample
|
|
18
|
+
* CloudFormation stack:
|
|
19
|
+
* {@link https://github.com/aws-samples/amazon-cloudfront-access-logs-queries/blob/mainline/template.yaml}
|
|
20
|
+
*/
|
|
21
|
+
class AccessLogsAnalysis extends constructs_1.Construct {
|
|
22
|
+
constructor(scope, id, props) {
|
|
23
|
+
super(scope, id);
|
|
24
|
+
this.resourceIdPrefix = props.resourcePrefix;
|
|
25
|
+
this.bucket = props.bucket;
|
|
26
|
+
this.setupLifecycleRules(props);
|
|
27
|
+
this.workgroup = this.createWorkgroup();
|
|
28
|
+
this.database = this.createGlueDatabase();
|
|
29
|
+
this.accessLogsByDateTable = this.createAccessLogsByDateTable();
|
|
30
|
+
this.accessLogsParquetTable = this.createAccessLogsParquetTable();
|
|
31
|
+
this.groupByDateLayer = this.createGroupByDateLayer();
|
|
32
|
+
this.groupByDateLambda = this.createGroupByDateLambda();
|
|
33
|
+
this.partitioningLayer = this.createPartitioningLayer();
|
|
34
|
+
this.createPartitionLambda = this.createCreatePartitionLambda();
|
|
35
|
+
this.transformPartitionLambda = this.createTransformPartitionLambda();
|
|
36
|
+
this.createPartitionsScheduler = this.createCreatePartitionsScheduler();
|
|
37
|
+
this.transformPartitionsScheduler = this.createTransformPartitionsScheduler(props);
|
|
38
|
+
}
|
|
39
|
+
setupLifecycleRules(props) {
|
|
40
|
+
// cleanup raw and partitioned access logs after a configurable time range
|
|
41
|
+
var _a, _b, _c;
|
|
42
|
+
this.bucket.addLifecycleRule({
|
|
43
|
+
id: `${this.resourceIdPrefix}-cleanup-unprocessed`,
|
|
44
|
+
prefix: `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_UNPROCESSED}/*`,
|
|
45
|
+
expiration: (_a = props.expireRawLogsAfter) !== null && _a !== void 0 ? _a : aws_cdk_lib_1.Duration.days(7),
|
|
46
|
+
});
|
|
47
|
+
this.bucket.addLifecycleRule({
|
|
48
|
+
id: `${this.resourceIdPrefix}-cleanup-grouped`,
|
|
49
|
+
prefix: `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_GROUPED_BY_DATE}/*`,
|
|
50
|
+
expiration: (_b = props.expireIntermediateLogsAfter) !== null && _b !== void 0 ? _b : aws_cdk_lib_1.Duration.days(7),
|
|
51
|
+
});
|
|
52
|
+
this.bucket.addLifecycleRule({
|
|
53
|
+
id: `${this.resourceIdPrefix}-cleanup-transformed`,
|
|
54
|
+
prefix: `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_TRANSFORMED}/*`,
|
|
55
|
+
expiration: (_c = props.expireTransformedLogsAfter) !== null && _c !== void 0 ? _c : aws_cdk_lib_1.Duration.days(180),
|
|
56
|
+
});
|
|
57
|
+
/* CHECKME: delete query results after 1 week
|
|
58
|
+
this.bucket.addLifecycleRule({
|
|
59
|
+
id: `${this.resourceIdPrefix}-cleanup-query-results`,
|
|
60
|
+
prefix: `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_ATHENA_RESULTS}/*`,
|
|
61
|
+
expiration: Duration.days(7),
|
|
62
|
+
});
|
|
63
|
+
*/
|
|
64
|
+
}
|
|
65
|
+
createWorkgroup() {
|
|
66
|
+
const workgroupName = `${this.resourceIdPrefix}-workgroup`;
|
|
67
|
+
// due to a current bug, the tags are not automatically assigned to the workgroup
|
|
68
|
+
// note, that the keys must be converted to lower case
|
|
69
|
+
const tags = aws_cdk_lib_1.Stack.of(this)
|
|
70
|
+
.tags.renderTags()
|
|
71
|
+
.map((tag) => ({ key: tag.Key, value: tag.Value }));
|
|
72
|
+
return new aws_athena_1.CfnWorkGroup(this, workgroupName, {
|
|
73
|
+
name: workgroupName,
|
|
74
|
+
workGroupConfiguration: {
|
|
75
|
+
publishCloudWatchMetricsEnabled: false,
|
|
76
|
+
resultConfiguration: {
|
|
77
|
+
outputLocation: `s3://${this.bucket.bucketName}/${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_ATHENA_RESULTS}`,
|
|
78
|
+
},
|
|
79
|
+
enforceWorkGroupConfiguration: true
|
|
80
|
+
},
|
|
81
|
+
tags,
|
|
82
|
+
});
|
|
83
|
+
}
|
|
84
|
+
createGlueDatabase() {
|
|
85
|
+
const databaseName = `${this.resourceIdPrefix}-database`;
|
|
86
|
+
return new aws_glue_alpha_1.Database(this, databaseName, {
|
|
87
|
+
// Athena doesn't support dashes in database/table names
|
|
88
|
+
databaseName: databaseName.replace(/-/g, '_'),
|
|
89
|
+
});
|
|
90
|
+
}
|
|
91
|
+
createGroupByDateLayer() {
|
|
92
|
+
const layerVersionName = `${this.resourceIdPrefix}-group-by-date-dependencies`;
|
|
93
|
+
return new aws_lambda_1.LayerVersion(this, layerVersionName, {
|
|
94
|
+
layerVersionName,
|
|
95
|
+
compatibleArchitectures: [aws_lambda_1.Architecture.ARM_64, aws_lambda_1.Architecture.X86_64],
|
|
96
|
+
compatibleRuntimes: [aws_lambda_1.Runtime.NODEJS_14_X, aws_lambda_1.Runtime.NODEJS_16_X],
|
|
97
|
+
code: aws_lambda_1.Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/group-by-date/build/layer')),
|
|
98
|
+
removalPolicy: aws_cdk_lib_1.RemovalPolicy.DESTROY,
|
|
99
|
+
});
|
|
100
|
+
}
|
|
101
|
+
createPartitioningLayer() {
|
|
102
|
+
const layerVersionName = `${this.resourceIdPrefix}-partitioning-dependencies`;
|
|
103
|
+
return new aws_lambda_1.LayerVersion(this, layerVersionName, {
|
|
104
|
+
layerVersionName,
|
|
105
|
+
compatibleArchitectures: [aws_lambda_1.Architecture.ARM_64, aws_lambda_1.Architecture.X86_64],
|
|
106
|
+
compatibleRuntimes: [aws_lambda_1.Runtime.NODEJS_14_X, aws_lambda_1.Runtime.NODEJS_16_X],
|
|
107
|
+
code: aws_lambda_1.Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/partitioning/build/layer')),
|
|
108
|
+
removalPolicy: aws_cdk_lib_1.RemovalPolicy.DESTROY,
|
|
109
|
+
});
|
|
110
|
+
}
|
|
111
|
+
/**
|
|
112
|
+
* A Lambda function to be triggered whenever a new access log is created.
|
|
113
|
+
* It moves the raw access logs into a sub folder hierarchy by year, month, day and hour.
|
|
114
|
+
*/
|
|
115
|
+
createGroupByDateLambda() {
|
|
116
|
+
const functionName = `${this.resourceIdPrefix}-group-by-date`;
|
|
117
|
+
const lambda = new aws_lambda_1.Function(this, functionName, {
|
|
118
|
+
functionName,
|
|
119
|
+
architecture: aws_lambda_1.Architecture.ARM_64,
|
|
120
|
+
runtime: aws_lambda_1.Runtime.NODEJS_16_X,
|
|
121
|
+
code: aws_lambda_1.Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/group-by-date/build/app')),
|
|
122
|
+
memorySize: 512,
|
|
123
|
+
timeout: aws_cdk_lib_1.Duration.seconds(20),
|
|
124
|
+
handler: 'index.handler',
|
|
125
|
+
layers: [this.groupByDateLayer],
|
|
126
|
+
events: [
|
|
127
|
+
new aws_lambda_event_sources_1.S3EventSource(this.bucket, {
|
|
128
|
+
events: [aws_s3_1.EventType.OBJECT_CREATED],
|
|
129
|
+
filters: [this.getUnprocessedObjectsFilter()],
|
|
130
|
+
}),
|
|
131
|
+
],
|
|
132
|
+
logRetention: aws_logs_1.RetentionDays.TWO_WEEKS,
|
|
133
|
+
environment: {
|
|
134
|
+
AWS_NODEJS_CONNECTION_REUSE_ENABLED: '1',
|
|
135
|
+
NODE_OPTIONS: '--enable-source-maps',
|
|
136
|
+
TARGET_FOLDER: AccessLogsAnalysis.ACCESS_LOGS_FOLDER_GROUPED_BY_DATE,
|
|
137
|
+
RAW_ACCESS_LOG_FILE_PATTERN: this.getRawAccessLogFilePattern().source,
|
|
138
|
+
},
|
|
139
|
+
});
|
|
140
|
+
this.bucket.grantReadWrite(lambda);
|
|
141
|
+
this.bucket.grantDelete(lambda, `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_UNPROCESSED}/*`);
|
|
142
|
+
return lambda;
|
|
143
|
+
}
|
|
144
|
+
/**
|
|
145
|
+
* Creates a new partition for the upcoming hour in the access log database.
|
|
146
|
+
*/
|
|
147
|
+
createCreatePartitionLambda() {
|
|
148
|
+
const functionName = `${this.resourceIdPrefix}-create-part`;
|
|
149
|
+
const lambda = new aws_lambda_1.Function(this, functionName, {
|
|
150
|
+
functionName,
|
|
151
|
+
architecture: aws_lambda_1.Architecture.ARM_64,
|
|
152
|
+
runtime: aws_lambda_1.Runtime.NODEJS_16_X,
|
|
153
|
+
code: aws_lambda_1.Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/partitioning/build/app'), {
|
|
154
|
+
exclude: ['transform-partition*', '*.d.ts'],
|
|
155
|
+
}),
|
|
156
|
+
memorySize: 128,
|
|
157
|
+
timeout: aws_cdk_lib_1.Duration.seconds(20),
|
|
158
|
+
handler: 'create-partition.handler',
|
|
159
|
+
layers: [this.partitioningLayer],
|
|
160
|
+
logRetention: aws_logs_1.RetentionDays.TWO_WEEKS,
|
|
161
|
+
environment: {
|
|
162
|
+
AWS_NODEJS_CONNECTION_REUSE_ENABLED: '1',
|
|
163
|
+
NODE_OPTIONS: '--enable-source-maps',
|
|
164
|
+
WORKGROUP: this.workgroup.name,
|
|
165
|
+
DATABASE: this.database.databaseName,
|
|
166
|
+
TABLE: this.accessLogsByDateTable.tableName,
|
|
167
|
+
},
|
|
168
|
+
});
|
|
169
|
+
// grant access to S3 bucket and to execute Athena queries which create new partitions
|
|
170
|
+
this.bucket.grantReadWrite(lambda);
|
|
171
|
+
lambda.addToRolePolicy(new aws_iam_1.PolicyStatement({
|
|
172
|
+
effect: aws_iam_1.Effect.ALLOW,
|
|
173
|
+
actions: [
|
|
174
|
+
'athena:StartQueryExecution',
|
|
175
|
+
'athena:GetQueryExecution',
|
|
176
|
+
'glue:CreateDatabase',
|
|
177
|
+
'glue:CreatePartition',
|
|
178
|
+
'glue:GetDatabase',
|
|
179
|
+
'glue:GetTable',
|
|
180
|
+
'glue:BatchCreatePartition',
|
|
181
|
+
],
|
|
182
|
+
resources: ['*'],
|
|
183
|
+
}));
|
|
184
|
+
return lambda;
|
|
185
|
+
}
|
|
186
|
+
/**
|
|
187
|
+
* Transforms partitions from the Hive format to Parquet.
|
|
188
|
+
*/
|
|
189
|
+
createTransformPartitionLambda() {
|
|
190
|
+
const functionName = `${this.resourceIdPrefix}-transform-part`;
|
|
191
|
+
const lambda = new aws_lambda_1.Function(this, functionName, {
|
|
192
|
+
functionName,
|
|
193
|
+
architecture: aws_lambda_1.Architecture.ARM_64,
|
|
194
|
+
runtime: aws_lambda_1.Runtime.NODEJS_16_X,
|
|
195
|
+
code: aws_lambda_1.Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/partitioning/build/app'), {
|
|
196
|
+
exclude: ['create-partition*', '*.d.ts'],
|
|
197
|
+
}),
|
|
198
|
+
memorySize: 128,
|
|
199
|
+
timeout: aws_cdk_lib_1.Duration.seconds(20),
|
|
200
|
+
handler: 'transform-partition.handler',
|
|
201
|
+
layers: [this.partitioningLayer],
|
|
202
|
+
logRetention: aws_logs_1.RetentionDays.TWO_WEEKS,
|
|
203
|
+
environment: {
|
|
204
|
+
AWS_NODEJS_CONNECTION_REUSE_ENABLED: '1',
|
|
205
|
+
NODE_OPTIONS: '--enable-source-maps',
|
|
206
|
+
WORKGROUP: this.workgroup.name,
|
|
207
|
+
DATABASE: this.database.databaseName,
|
|
208
|
+
SOURCE_TABLE: this.accessLogsByDateTable.tableName,
|
|
209
|
+
TARGET_TABLE: this.accessLogsParquetTable.tableName,
|
|
210
|
+
},
|
|
211
|
+
});
|
|
212
|
+
// grant access to S3 bucket and to execute Athena queries which create new partitions
|
|
213
|
+
this.bucket.grantReadWrite(lambda);
|
|
214
|
+
lambda.addToRolePolicy(new aws_iam_1.PolicyStatement({
|
|
215
|
+
effect: aws_iam_1.Effect.ALLOW,
|
|
216
|
+
actions: [
|
|
217
|
+
'athena:StartQueryExecution',
|
|
218
|
+
'athena:GetQueryExecution',
|
|
219
|
+
'glue:CreateDatabase',
|
|
220
|
+
'glue:CreatePartition',
|
|
221
|
+
'glue:GetDatabase',
|
|
222
|
+
'glue:GetTable',
|
|
223
|
+
'glue:BatchCreatePartition',
|
|
224
|
+
'glue:GetPartition',
|
|
225
|
+
'glue:GetPartitions',
|
|
226
|
+
'glue:CreateTable',
|
|
227
|
+
'glue:DeleteTable',
|
|
228
|
+
'glue:DeletePartition',
|
|
229
|
+
],
|
|
230
|
+
resources: ['*'],
|
|
231
|
+
}));
|
|
232
|
+
return lambda;
|
|
233
|
+
}
|
|
234
|
+
createCreatePartitionsScheduler() {
|
|
235
|
+
const ruleName = `${this.resourceIdPrefix}-create-part-sched`;
|
|
236
|
+
return new aws_events_1.Rule(this, ruleName, {
|
|
237
|
+
ruleName,
|
|
238
|
+
schedule: aws_events_1.Schedule.cron({ minute: '55' }),
|
|
239
|
+
targets: [new aws_events_targets_1.LambdaFunction(this.createPartitionLambda, { retryAttempts: 10 })],
|
|
240
|
+
});
|
|
241
|
+
}
|
|
242
|
+
createTransformPartitionsScheduler(props) {
|
|
243
|
+
const ruleName = `${this.resourceIdPrefix}-transform-part-sched`;
|
|
244
|
+
return new aws_events_1.Rule(this, ruleName, {
|
|
245
|
+
ruleName,
|
|
246
|
+
schedule: aws_events_1.Schedule.cron({ minute: '1' }),
|
|
247
|
+
targets: [
|
|
248
|
+
new aws_events_targets_1.LambdaFunction(this.transformPartitionLambda, {
|
|
249
|
+
event: this.getTransformPartitionInvocationProps(props),
|
|
250
|
+
retryAttempts: 10,
|
|
251
|
+
}),
|
|
252
|
+
],
|
|
253
|
+
});
|
|
254
|
+
}
|
|
255
|
+
getTransformPartitionInvocationProps(props) {
|
|
256
|
+
return aws_events_1.RuleTargetInput.fromObject({
|
|
257
|
+
columnNames: [
|
|
258
|
+
...this.accessLogsParquetTable.columns,
|
|
259
|
+
...this.accessLogsParquetTable.partitionKeys,
|
|
260
|
+
].map(column => column.name),
|
|
261
|
+
columnTransformations: this.getColumnTransformationRules(props),
|
|
262
|
+
});
|
|
263
|
+
}
|
|
264
|
+
}
|
|
265
|
+
exports.AccessLogsAnalysis = AccessLogsAnalysis;
|
|
266
|
+
AccessLogsAnalysis.ACCESS_LOGS_FOLDER_UNPROCESSED = 'unprocessed';
|
|
267
|
+
AccessLogsAnalysis.ACCESS_LOGS_FOLDER_GROUPED_BY_DATE = 'by-date';
|
|
268
|
+
AccessLogsAnalysis.ACCESS_LOGS_FOLDER_TRANSFORMED = 'transformed';
|
|
269
|
+
AccessLogsAnalysis.ACCESS_LOGS_FOLDER_ATHENA_RESULTS = 'athena-query-results';
|
|
270
|
+
//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"AccessLogsAnalysis.js","sourceRoot":"","sources":["AccessLogsAnalysis.ts"],"names":[],"mappings":";;;AAAA,+CAA4E;AAC5E,2CAAqC;AACrC,uDAAoD;AAGpD,uDAA2F;AAC3F,uDAAuE;AACvE,6CAAmE;AACnE,4DAAyD;AACzD,mFAAmE;AACnE,mDAAmD;AACnD,iDAA4D;AAC5D,uEAA8D;AAC9D,6BAA6B;AAI7B;;;;GAIG;AACH,MAAsB,kBAAmB,SAAQ,sBAAS;IAqBtD,YAAsB,KAAgB,EAAE,EAAU,EAAE,KAA8B;QAC9E,KAAK,CAAC,KAAK,EAAE,EAAE,CAAC,CAAC;QACjB,IAAI,CAAC,gBAAgB,GAAG,KAAK,CAAC,cAAc,CAAC;QAC7C,IAAI,CAAC,MAAM,GAAG,KAAK,CAAC,MAAM,CAAC;QAC3B,IAAI,CAAC,mBAAmB,CAAC,KAAK,CAAC,CAAC;QAChC,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC,eAAe,EAAE,CAAC;QACxC,IAAI,CAAC,QAAQ,GAAG,IAAI,CAAC,kBAAkB,EAAE,CAAC;QAC1C,IAAI,CAAC,qBAAqB,GAAG,IAAI,CAAC,2BAA2B,EAAE,CAAC;QAChE,IAAI,CAAC,sBAAsB,GAAG,IAAI,CAAC,4BAA4B,EAAE,CAAC;QAClE,IAAI,CAAC,gBAAgB,GAAG,IAAI,CAAC,sBAAsB,EAAE,CAAC;QACtD,IAAI,CAAC,iBAAiB,GAAG,IAAI,CAAC,uBAAuB,EAAE,CAAC;QACxD,IAAI,CAAC,iBAAiB,GAAG,IAAI,CAAC,uBAAuB,EAAE,CAAC;QACxD,IAAI,CAAC,qBAAqB,GAAG,IAAI,CAAC,2BAA2B,EAAE,CAAC;QAChE,IAAI,CAAC,wBAAwB,GAAG,IAAI,CAAC,8BAA8B,EAAE,CAAC;QACtE,IAAI,CAAC,yBAAyB,GAAG,IAAI,CAAC,+BAA+B,EAAE,CAAC;QACxE,IAAI,CAAC,4BAA4B,GAAG,IAAI,CAAC,kCAAkC,CAAC,KAAK,CAAC,CAAC;IACvF,CAAC;IAEO,mBAAmB,CAAC,KAA8B;QACtD,0EAA0E;;QAE1E,IAAI,CAAC,MAAM,CAAC,gBAAgB,CAAC;YACzB,EAAE,EAAE,GAAG,IAAI,CAAC,gBAAgB,sBAAsB;YAClD,MAAM,EAAE,GAAG,kBAAkB,CAAC,8BAA8B,IAAI;YAChE,UAAU,EAAE,MAAA,KAAK,CAAC,kBAAkB,mCAAI,sBAAQ,CAAC,IAAI,CAAC,CAAC,CAAC;SAC3D,CAAC,CAAC;QAEH,IAAI,CAAC,MAAM,CAAC,gBAAgB,CAAC;YACzB,EAAE,EAAE,GAAG,IAAI,CAAC,gBAAgB,kBAAkB;YAC9C,MAAM,EAAE,GAAG,kBAAkB,CAAC,kCAAkC,IAAI;YACpE,UAAU,EAAE,MAAA,KAAK,CAAC,2BAA2B,mCAAI,sBAAQ,CAAC,IAAI,CAAC,CAAC,CAAC;SACpE,CAAC,CAAC;QAEH,IAAI,CAAC,MAAM,CAAC,gBAAgB,CAAC;YACzB,EAAE,EAAE,GAAG,IAAI,CAAC,gBAAgB,sBAAsB;YAClD,MAAM,EAAE,GAAG,kBAAkB,CAAC,8BAA8B,IAAI;YAChE,UAAU,EAAE,MAAA,KAAK,CAAC,0BAA0B,mCAAI,sBAAQ,CAAC,IAAI,CAAC,GAAG,CAAC;SACrE,CAAC,CAAC;QAEH;;;;;;UAME;IACN,CAAC;IAEO,eAAe;QACnB,MAAM,aAAa,GAAG,GAAG,IAAI,CAAC,gBAAgB,YAAY,CAAC;QAE3D,iFAAiF;QACjF,sDAAsD;QACtD,MAAM,IAAI,GAAa,mBAAK,CAAC,EAAE,CAAC,IAAI,CAAC;aAChC,IAAI,CAAC,UAAU,EAAE;aACjB,GAAG,CAAC,CAAC,GAAmC,EAAE,EAAE,CAAC,CAAC,EAAC,GAAG,EAAE,GAAG,CAAC,GAAG,EAAE,KAAK,EAAE,GAAG,CAAC,KAAK,EAAC,CAAC,CAAC,CAAC;QAEtF,OAAO,IAAI,yBAAY,CAAC,IAAI,EAAE,aAAa,EAAE;YACzC,IAAI,EAAE,aAAa;YACnB,sBAAsB,EAAE;gBACpB,+BAA+B,EAAE,KAAK;gBACtC,mBAAmB,EAAE;oBACjB,cAAc,EAAE,QAAQ,IAAI,CAAC,MAAM,CAAC,UAAU,IAAI,kBAAkB,CAAC,iCAAiC,EAAE;iBAC3G;gBACD,6BAA6B,EAAE,IAAI;aACtC;YACD,IAAI;SACP,CAAC,CAAC;IACP,CAAC;IAEO,kBAAkB;QACtB,MAAM,YAAY,GAAG,GAAG,IAAI,CAAC,gBAAgB,WAAW,CAAC;QACzD,OAAO,IAAI,yBAAQ,CAAC,IAAI,EAAE,YAAY,EAAE;YACpC,wDAAwD;YACxD,YAAY,EAAE,YAAY,CAAC,OAAO,CAAC,IAAI,EAAE,GAAG,CAAC;SAChD,CAAC,CAAC;IACP,CAAC;IAMO,sBAAsB;QAC1B,MAAM,gBAAgB,GAAG,GAAG,IAAI,CAAC,gBAAgB,6BAA6B,CAAC;QAC/E,OAAO,IAAI,yBAAY,CAAC,IAAI,EAAE,gBAAgB,EAAE;YAC5C,gBAAgB;YAChB,uBAAuB,EAAE,CAAC,yBAAY,CAAC,MAAM,EAAE,yBAAY,CAAC,MAAM,CAAC;YACnE,kBAAkB,EAAE,CAAC,oBAAO,CAAC,WAAW,EAAE,oBAAO,CAAC,WAAW,CAAC;YAC9D,IAAI,EAAE,iBAAI,CAAC,SAAS,CAAC,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,gEAAgE,CAAC,CAAC;YAC5G,aAAa,EAAE,2BAAa,CAAC,OAAO;SACvC,CAAC,CAAC;IACP,CAAC;IAEO,uBAAuB;QAC3B,MAAM,gBAAgB,GAAG,GAAG,IAAI,CAAC,gBAAgB,4BAA4B,CAAC;QAC9E,OAAO,IAAI,yBAAY,CAAC,IAAI,EAAE,gBAAgB,EAAE;YAC5C,gBAAgB;YAChB,uBAAuB,EAAE,CAAC,yBAAY,CAAC,MAAM,EAAE,yBAAY,CAAC,MAAM,CAAC;YACnE,kBAAkB,EAAE,CAAC,oBAAO,CAAC,WAAW,EAAE,oBAAO,CAAC,WAAW,CAAC;YAC9D,IAAI,EAAE,iBAAI,CAAC,SAAS,CAAC,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,+DAA+D,CAAC,CAAC;YAC3G,aAAa,EAAE,2BAAa,CAAC,OAAO;SACvC,CAAC,CAAC;IACP,CAAC;IAED;;;OAGG;IACK,uBAAuB;QAC3B,MAAM,YAAY,GAAG,GAAG,IAAI,CAAC,gBAAgB,gBAAgB,CAAC;QAE9D,MAAM,MAAM,GAAG,IAAI,qBAAQ,CAAC,IAAI,EAAE,YAAY,EAAE;YAC5C,YAAY;YACZ,YAAY,EAAE,yBAAY,CAAC,MAAM;YACjC,OAAO,EAAE,oBAAO,CAAC,WAAW;YAC5B,IAAI,EAAE,iBAAI,CAAC,SAAS,CAAC,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,8DAA8D,CAAC,CAAC;YAC1G,UAAU,EAAE,GAAG;YACf,OAAO,EAAE,sBAAQ,CAAC,OAAO,CAAC,EAAE,CAAC;YAC7B,OAAO,EAAE,eAAe;YACxB,MAAM,EAAE,CAAC,IAAI,CAAC,gBAAgB,CAAC;YAC/B,MAAM,EAAE;gBACJ,IAAI,wCAAa,CAAC,IAAI,CAAC,MAAM,EAAE;oBAC3B,MAAM,EAAE,CAAC,kBAAS,CAAC,cAAc,CAAC;oBAClC,OAAO,EAAE,CAAC,IAAI,CAAC,2BAA2B,EAAE,CAAC;iBAChD,CAAC;aACL;YACD,YAAY,EAAE,wBAAa,CAAC,SAAS;YACrC,WAAW,EAAE;gBACT,mCAAmC,EAAE,GAAG;gBACxC,YAAY,EAAE,sBAAsB;gBACpC,aAAa,EAAE,kBAAkB,CAAC,kCAAkC;gBACpE,2BAA2B,EAAE,IAAI,CAAC,0BAA0B,EAAE,CAAC,MAAM;aACxE;SACJ,CAAC,CAAC;QAEH,IAAI,CAAC,MAAM,CAAC,cAAc,CAAC,MAAM,CAAC,CAAC;QACnC,IAAI,CAAC,MAAM,CAAC,WAAW,CAAC,MAAM,EAAE,GAAG,kBAAkB,CAAC,8BAA8B,IAAI,CAAC,CAAC;QAE1F,OAAO,MAAM,CAAC;IAClB,CAAC;IAOD;;OAEG;IACK,2BAA2B;QAC/B,MAAM,YAAY,GAAG,GAAG,IAAI,CAAC,gBAAgB,cAAc,CAAC;QAE5D,MAAM,MAAM,GAAG,IAAI,qBAAQ,CAAC,IAAI,EAAE,YAAY,EAAE;YAC5C,YAAY;YACZ,YAAY,EAAE,yBAAY,CAAC,MAAM;YACjC,OAAO,EAAE,oBAAO,CAAC,WAAW;YAC5B,IAAI,EAAE,iBAAI,CAAC,SAAS,CAAC,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,6DAA6D,CAAC,EAAE;gBACtG,OAAO,EAAE,CAAC,sBAAsB,EAAE,QAAQ,CAAC;aAC9C,CAAC;YACF,UAAU,EAAE,GAAG;YACf,OAAO,EAAE,sBAAQ,CAAC,OAAO,CAAC,EAAE,CAAC;YAC7B,OAAO,EAAE,0BAA0B;YACnC,MAAM,EAAE,CAAC,IAAI,CAAC,iBAAiB,CAAC;YAChC,YAAY,EAAE,wBAAa,CAAC,SAAS;YACrC,WAAW,EAAE;gBACT,mCAAmC,EAAE,GAAG;gBACxC,YAAY,EAAE,sBAAsB;gBACpC,SAAS,EAAE,IAAI,CAAC,SAAS,CAAC,IAAI;gBAC9B,QAAQ,EAAE,IAAI,CAAC,QAAQ,CAAC,YAAY;gBACpC,KAAK,EAAE,IAAI,CAAC,qBAAqB,CAAC,SAAS;aAC9C;SACJ,CAAC,CAAC;QAEH,sFAAsF;QACtF,IAAI,CAAC,MAAM,CAAC,cAAc,CAAC,MAAM,CAAC,CAAC;QACnC,MAAM,CAAC,eAAe,CAClB,IAAI,yBAAe,CAAC;YAChB,MAAM,EAAE,gBAAM,CAAC,KAAK;YACpB,OAAO,EAAE;gBACL,4BAA4B;gBAC5B,0BAA0B;gBAC1B,qBAAqB;gBACrB,sBAAsB;gBACtB,kBAAkB;gBAClB,eAAe;gBACf,2BAA2B;aAC9B;YACD,SAAS,EAAE,CAAC,GAAG,CAAC;SACnB,CAAC,CACL,CAAC;QAEF,OAAO,MAAM,CAAC;IAClB,CAAC;IAED;;OAEG;IACK,8BAA8B;QAClC,MAAM,YAAY,GAAG,GAAG,IAAI,CAAC,gBAAgB,iBAAiB,CAAC;QAE/D,MAAM,MAAM,GAAG,IAAI,qBAAQ,CAAC,IAAI,EAAE,YAAY,EAAE;YAC5C,YAAY;YACZ,YAAY,EAAE,yBAAY,CAAC,MAAM;YACjC,OAAO,EAAE,oBAAO,CAAC,WAAW;YAC5B,IAAI,EAAE,iBAAI,CAAC,SAAS,CAAC,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,6DAA6D,CAAC,EAAE;gBACtG,OAAO,EAAE,CAAC,mBAAmB,EAAE,QAAQ,CAAC;aAC3C,CAAC;YACF,UAAU,EAAE,GAAG;YACf,OAAO,EAAE,sBAAQ,CAAC,OAAO,CAAC,EAAE,CAAC;YAC7B,OAAO,EAAE,6BAA6B;YACtC,MAAM,EAAE,CAAC,IAAI,CAAC,iBAAiB,CAAC;YAChC,YAAY,EAAE,wBAAa,CAAC,SAAS;YACrC,WAAW,EAAE;gBACT,mCAAmC,EAAE,GAAG;gBACxC,YAAY,EAAE,sBAAsB;gBACpC,SAAS,EAAE,IAAI,CAAC,SAAS,CAAC,IAAI;gBAC9B,QAAQ,EAAE,IAAI,CAAC,QAAQ,CAAC,YAAY;gBACpC,YAAY,EAAE,IAAI,CAAC,qBAAqB,CAAC,SAAS;gBAClD,YAAY,EAAE,IAAI,CAAC,sBAAsB,CAAC,SAAS;aACtD;SACJ,CAAC,CAAC;QAEH,sFAAsF;QACtF,IAAI,CAAC,MAAM,CAAC,cAAc,CAAC,MAAM,CAAC,CAAC;QACnC,MAAM,CAAC,eAAe,CAClB,IAAI,yBAAe,CAAC;YAChB,MAAM,EAAE,gBAAM,CAAC,KAAK;YACpB,OAAO,EAAE;gBACL,4BAA4B;gBAC5B,0BAA0B;gBAC1B,qBAAqB;gBACrB,sBAAsB;gBACtB,kBAAkB;gBAClB,eAAe;gBACf,2BAA2B;gBAC3B,mBAAmB;gBACnB,oBAAoB;gBACpB,kBAAkB;gBAClB,kBAAkB;gBAClB,sBAAsB;aACzB;YACD,SAAS,EAAE,CAAC,GAAG,CAAC;SACnB,CAAC,CACL,CAAC;QAEF,OAAO,MAAM,CAAC;IAClB,CAAC;IAEO,+BAA+B;QACnC,MAAM,QAAQ,GAAG,GAAG,IAAI,CAAC,gBAAgB,oBAAoB,CAAC;QAC9D,OAAO,IAAI,iBAAI,CAAC,IAAI,EAAE,QAAQ,EAAE;YAC5B,QAAQ;YACR,QAAQ,EAAE,qBAAQ,CAAC,IAAI,CAAC,EAAC,MAAM,EAAE,IAAI,EAAC,CAAC;YACvC,OAAO,EAAE,CAAC,IAAI,mCAAc,CAAC,IAAI,CAAC,qBAAqB,EAAE,EAAC,aAAa,EAAE,EAAE,EAAC,CAAC,CAAC;SACjF,CAAC,CAAC;IACP,CAAC;IAEO,kCAAkC,CAAC,KAA8B;QACrE,MAAM,QAAQ,GAAG,GAAG,IAAI,CAAC,gBAAgB,uBAAuB,CAAC;QACjE,OAAO,IAAI,iBAAI,CAAC,IAAI,EAAE,QAAQ,EAAE;YAC5B,QAAQ;YACR,QAAQ,EAAE,qBAAQ,CAAC,IAAI,CAAC,EAAC,MAAM,EAAE,GAAG,EAAC,CAAC;YACtC,OAAO,EAAE;gBACL,IAAI,mCAAc,CAAC,IAAI,CAAC,wBAAwB,EAAE;oBAC9C,KAAK,EAAE,IAAI,CAAC,oCAAoC,CAAC,KAAK,CAAC;oBACvD,aAAa,EAAE,EAAE;iBACpB,CAAC;aACL;SACJ,CAAC,CAAC;IACP,CAAC;IAEO,oCAAoC,CAAC,KAA8B;QACvE,OAAO,4BAAe,CAAC,UAAU,CAAC;YAC9B,WAAW,EAAE;gBACT,GAAG,IAAI,CAAC,sBAAsB,CAAC,OAAO;gBACtC,GAAI,IAAI,CAAC,sBAAsB,CAAC,aAA0B;aAC7D,CAAC,GAAG,CAAC,MAAM,CAAC,EAAE,CAAC,MAAM,CAAC,IAAI,CAAC;YAC5B,qBAAqB,EAAE,IAAI,CAAC,4BAA4B,CAAC,KAAK,CAAC;SAClE,CAAC,CAAC;IACP,CAAC;;AA5SL,gDAmTC;AAjT6B,iDAA8B,GAAG,aAAa,CAAC;AAC/C,qDAAkC,GAAG,SAAS,CAAC;AAC/C,iDAA8B,GAAG,aAAa,CAAC;AAC/C,oDAAiC,GAAG,sBAAsB,CAAC","sourcesContent":["import {Bucket, EventType, NotificationKeyFilter} from 'aws-cdk-lib/aws-s3';\nimport {Construct} from 'constructs';\nimport {CfnWorkGroup} from 'aws-cdk-lib/aws-athena';\nimport {CloudFrontAccessLogsByDateTable} from './CloudFrontAccessLogsByDateTable';\nimport {AccessLogsParquetTable} from './AccessLogsParquetTable';\nimport {Architecture, Code, Function, LayerVersion, Runtime} from 'aws-cdk-lib/aws-lambda';\nimport {Rule, RuleTargetInput, Schedule} from 'aws-cdk-lib/aws-events';\nimport {CfnTag, Duration, RemovalPolicy, Stack} from 'aws-cdk-lib';\nimport {Column, Database} from '@aws-cdk/aws-glue-alpha';\nimport {S3EventSource} from 'aws-cdk-lib/aws-lambda-event-sources';\nimport {RetentionDays} from 'aws-cdk-lib/aws-logs';\nimport {Effect, PolicyStatement} from 'aws-cdk-lib/aws-iam';\nimport {LambdaFunction} from 'aws-cdk-lib/aws-events-targets';\nimport * as path from 'path';\nimport {AccessLogsAnalysisProps} from \"./AccessLogsAnalysisProps\";\nimport {ColumnTransformationRules} from \"../../functions/access-logs-analysis/partitioning/types\";\n\n/**\n * Provides the AWS resources to analyze access logs. This construct is derived from the official AWS sample\n * CloudFormation stack:\n * {@link https://github.com/aws-samples/amazon-cloudfront-access-logs-queries/blob/mainline/template.yaml}\n */\nexport abstract class AccessLogsAnalysis extends Construct {\n\n    protected static readonly ACCESS_LOGS_FOLDER_UNPROCESSED = 'unprocessed';\n    protected static readonly ACCESS_LOGS_FOLDER_GROUPED_BY_DATE = 'by-date';\n    protected static readonly ACCESS_LOGS_FOLDER_TRANSFORMED = 'transformed';\n    protected static readonly ACCESS_LOGS_FOLDER_ATHENA_RESULTS = 'athena-query-results';\n\n    protected readonly resourceIdPrefix: string;\n    protected readonly bucket: Bucket;\n    protected readonly workgroup: CfnWorkGroup;\n    protected readonly database: Database;\n    protected readonly accessLogsByDateTable: CloudFrontAccessLogsByDateTable;\n    protected readonly accessLogsParquetTable: AccessLogsParquetTable;\n    protected readonly groupByDateLayer: LayerVersion;\n    protected readonly groupByDateLambda: Function;\n    protected readonly partitioningLayer: LayerVersion;\n    protected readonly createPartitionLambda: Function;\n    protected readonly transformPartitionLambda: Function;\n    protected readonly createPartitionsScheduler: Rule;\n    protected readonly transformPartitionsScheduler: Rule;\n\n    protected constructor(scope: Construct, id: string, props: AccessLogsAnalysisProps) {\n        super(scope, id);\n        this.resourceIdPrefix = props.resourcePrefix;\n        this.bucket = props.bucket;\n        this.setupLifecycleRules(props);\n        this.workgroup = this.createWorkgroup();\n        this.database = this.createGlueDatabase();\n        this.accessLogsByDateTable = this.createAccessLogsByDateTable();\n        this.accessLogsParquetTable = this.createAccessLogsParquetTable();\n        this.groupByDateLayer = this.createGroupByDateLayer();\n        this.groupByDateLambda = this.createGroupByDateLambda();\n        this.partitioningLayer = this.createPartitioningLayer();\n        this.createPartitionLambda = this.createCreatePartitionLambda();\n        this.transformPartitionLambda = this.createTransformPartitionLambda();\n        this.createPartitionsScheduler = this.createCreatePartitionsScheduler();\n        this.transformPartitionsScheduler = this.createTransformPartitionsScheduler(props);\n    }\n\n    private setupLifecycleRules(props: AccessLogsAnalysisProps): void {\n        // cleanup raw and partitioned access logs after a configurable time range\n\n        this.bucket.addLifecycleRule({\n            id: `${this.resourceIdPrefix}-cleanup-unprocessed`,\n            prefix: `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_UNPROCESSED}/*`,\n            expiration: props.expireRawLogsAfter ?? Duration.days(7),\n        });\n\n        this.bucket.addLifecycleRule({\n            id: `${this.resourceIdPrefix}-cleanup-grouped`,\n            prefix: `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_GROUPED_BY_DATE}/*`,\n            expiration: props.expireIntermediateLogsAfter ?? Duration.days(7),\n        });\n\n        this.bucket.addLifecycleRule({\n            id: `${this.resourceIdPrefix}-cleanup-transformed`,\n            prefix: `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_TRANSFORMED}/*`,\n            expiration: props.expireTransformedLogsAfter ?? Duration.days(180),\n        });\n\n        /* CHECKME: delete query results after 1 week\n        this.bucket.addLifecycleRule({\n          id: `${this.resourceIdPrefix}-cleanup-query-results`,\n          prefix: `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_ATHENA_RESULTS}/*`,\n          expiration: Duration.days(7),\n        });\n        */\n    }\n\n    private createWorkgroup(): CfnWorkGroup {\n        const workgroupName = `${this.resourceIdPrefix}-workgroup`;\n\n        // due to a current bug, the tags are not automatically assigned to the workgroup\n        // note, that the keys must be converted to lower case\n        const tags: CfnTag[] = Stack.of(this)\n            .tags.renderTags()\n            .map((tag: { Key: string; Value: string }) => ({key: tag.Key, value: tag.Value}));\n\n        return new CfnWorkGroup(this, workgroupName, {\n            name: workgroupName,\n            workGroupConfiguration: {\n                publishCloudWatchMetricsEnabled: false,\n                resultConfiguration: {\n                    outputLocation: `s3://${this.bucket.bucketName}/${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_ATHENA_RESULTS}`,\n                },\n                enforceWorkGroupConfiguration: true\n            },\n            tags,\n        });\n    }\n\n    private createGlueDatabase(): Database {\n        const databaseName = `${this.resourceIdPrefix}-database`;\n        return new Database(this, databaseName, {\n            // Athena doesn't support dashes in database/table names\n            databaseName: databaseName.replace(/-/g, '_'),\n        });\n    }\n\n    protected abstract createAccessLogsByDateTable(): CloudFrontAccessLogsByDateTable;\n\n    protected abstract createAccessLogsParquetTable(): CloudFrontAccessLogsByDateTable;\n\n    private createGroupByDateLayer(): LayerVersion {\n        const layerVersionName = `${this.resourceIdPrefix}-group-by-date-dependencies`;\n        return new LayerVersion(this, layerVersionName, {\n            layerVersionName,\n            compatibleArchitectures: [Architecture.ARM_64, Architecture.X86_64],\n            compatibleRuntimes: [Runtime.NODEJS_14_X, Runtime.NODEJS_16_X],\n            code: Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/group-by-date/build/layer')),\n            removalPolicy: RemovalPolicy.DESTROY,\n        });\n    }\n\n    private createPartitioningLayer(): LayerVersion {\n        const layerVersionName = `${this.resourceIdPrefix}-partitioning-dependencies`;\n        return new LayerVersion(this, layerVersionName, {\n            layerVersionName,\n            compatibleArchitectures: [Architecture.ARM_64, Architecture.X86_64],\n            compatibleRuntimes: [Runtime.NODEJS_14_X, Runtime.NODEJS_16_X],\n            code: Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/partitioning/build/layer')),\n            removalPolicy: RemovalPolicy.DESTROY,\n        });\n    }\n\n    /**\n     * A Lambda function to be triggered whenever a new access log is created.\n     * It moves the raw access logs into a sub folder hierarchy by year, month, day and hour.\n     */\n    private createGroupByDateLambda(): Function {\n        const functionName = `${this.resourceIdPrefix}-group-by-date`;\n\n        const lambda = new Function(this, functionName, {\n            functionName,\n            architecture: Architecture.ARM_64,\n            runtime: Runtime.NODEJS_16_X,\n            code: Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/group-by-date/build/app')),\n            memorySize: 512,\n            timeout: Duration.seconds(20),\n            handler: 'index.handler',\n            layers: [this.groupByDateLayer],\n            events: [\n                new S3EventSource(this.bucket, {\n                    events: [EventType.OBJECT_CREATED],\n                    filters: [this.getUnprocessedObjectsFilter()],\n                }),\n            ],\n            logRetention: RetentionDays.TWO_WEEKS,\n            environment: {\n                AWS_NODEJS_CONNECTION_REUSE_ENABLED: '1',\n                NODE_OPTIONS: '--enable-source-maps',\n                TARGET_FOLDER: AccessLogsAnalysis.ACCESS_LOGS_FOLDER_GROUPED_BY_DATE,\n                RAW_ACCESS_LOG_FILE_PATTERN: this.getRawAccessLogFilePattern().source,\n            },\n        });\n\n        this.bucket.grantReadWrite(lambda);\n        this.bucket.grantDelete(lambda, `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_UNPROCESSED}/*`);\n\n        return lambda;\n    }\n\n    protected abstract getUnprocessedObjectsFilter(): NotificationKeyFilter;\n\n    /** The pattern to identify unprocessed access logs depends on the producing source */\n    protected abstract getRawAccessLogFilePattern(): RegExp;\n\n    /**\n     * Creates a new partition for the upcoming hour in the access log database.\n     */\n    private createCreatePartitionLambda(): Function {\n        const functionName = `${this.resourceIdPrefix}-create-part`;\n\n        const lambda = new Function(this, functionName, {\n            functionName,\n            architecture: Architecture.ARM_64,\n            runtime: Runtime.NODEJS_16_X,\n            code: Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/partitioning/build/app'), {\n                exclude: ['transform-partition*', '*.d.ts'],\n            }),\n            memorySize: 128,\n            timeout: Duration.seconds(20),\n            handler: 'create-partition.handler',\n            layers: [this.partitioningLayer],\n            logRetention: RetentionDays.TWO_WEEKS,\n            environment: {\n                AWS_NODEJS_CONNECTION_REUSE_ENABLED: '1',\n                NODE_OPTIONS: '--enable-source-maps',\n                WORKGROUP: this.workgroup.name,\n                DATABASE: this.database.databaseName,\n                TABLE: this.accessLogsByDateTable.tableName,\n            },\n        });\n\n        // grant access to S3 bucket and to execute Athena queries which create new partitions\n        this.bucket.grantReadWrite(lambda);\n        lambda.addToRolePolicy(\n            new PolicyStatement({\n                effect: Effect.ALLOW,\n                actions: [\n                    'athena:StartQueryExecution',\n                    'athena:GetQueryExecution',\n                    'glue:CreateDatabase',\n                    'glue:CreatePartition',\n                    'glue:GetDatabase',\n                    'glue:GetTable',\n                    'glue:BatchCreatePartition',\n                ],\n                resources: ['*'],\n            })\n        );\n\n        return lambda;\n    }\n\n    /**\n     * Transforms partitions from the Hive format to Parquet.\n     */\n    private createTransformPartitionLambda(): Function {\n        const functionName = `${this.resourceIdPrefix}-transform-part`;\n\n        const lambda = new Function(this, functionName, {\n            functionName,\n            architecture: Architecture.ARM_64,\n            runtime: Runtime.NODEJS_16_X,\n            code: Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/partitioning/build/app'), {\n                exclude: ['create-partition*', '*.d.ts'],\n            }),\n            memorySize: 128,\n            timeout: Duration.seconds(20),\n            handler: 'transform-partition.handler',\n            layers: [this.partitioningLayer],\n            logRetention: RetentionDays.TWO_WEEKS,\n            environment: {\n                AWS_NODEJS_CONNECTION_REUSE_ENABLED: '1',\n                NODE_OPTIONS: '--enable-source-maps',\n                WORKGROUP: this.workgroup.name,\n                DATABASE: this.database.databaseName,\n                SOURCE_TABLE: this.accessLogsByDateTable.tableName,\n                TARGET_TABLE: this.accessLogsParquetTable.tableName,\n            },\n        });\n\n        // grant access to S3 bucket and to execute Athena queries which create new partitions\n        this.bucket.grantReadWrite(lambda);\n        lambda.addToRolePolicy(\n            new PolicyStatement({\n                effect: Effect.ALLOW,\n                actions: [\n                    'athena:StartQueryExecution',\n                    'athena:GetQueryExecution',\n                    'glue:CreateDatabase',\n                    'glue:CreatePartition',\n                    'glue:GetDatabase',\n                    'glue:GetTable',\n                    'glue:BatchCreatePartition',\n                    'glue:GetPartition',\n                    'glue:GetPartitions',\n                    'glue:CreateTable',\n                    'glue:DeleteTable',\n                    'glue:DeletePartition',\n                ],\n                resources: ['*'],\n            })\n        );\n\n        return lambda;\n    }\n\n    private createCreatePartitionsScheduler(): Rule {\n        const ruleName = `${this.resourceIdPrefix}-create-part-sched`;\n        return new Rule(this, ruleName, {\n            ruleName,\n            schedule: Schedule.cron({minute: '55'}),\n            targets: [new LambdaFunction(this.createPartitionLambda, {retryAttempts: 10})],\n        });\n    }\n\n    private createTransformPartitionsScheduler(props: AccessLogsAnalysisProps): Rule {\n        const ruleName = `${this.resourceIdPrefix}-transform-part-sched`;\n        return new Rule(this, ruleName, {\n            ruleName,\n            schedule: Schedule.cron({minute: '1'}),\n            targets: [\n                new LambdaFunction(this.transformPartitionLambda, {\n                    event: this.getTransformPartitionInvocationProps(props),\n                    retryAttempts: 10,\n                }),\n            ],\n        });\n    }\n\n    private getTransformPartitionInvocationProps(props: AccessLogsAnalysisProps): RuleTargetInput {\n        return RuleTargetInput.fromObject({\n            columnNames: [\n                ...this.accessLogsParquetTable.columns,\n                ...(this.accessLogsParquetTable.partitionKeys as Column[]),\n            ].map(column => column.name),\n            columnTransformations: this.getColumnTransformationRules(props),\n        });\n    }\n\n    /**\n     * Needs to return the log source specific column transformation rules\n     * (e.g. to anonymize IP addresses).\n     */\n    protected abstract getColumnTransformationRules(props: AccessLogsAnalysisProps): ColumnTransformationRules;\n}\n"]}
|
|
@@ -0,0 +1,330 @@
|
|
|
1
|
+
import {Bucket, EventType, NotificationKeyFilter} from 'aws-cdk-lib/aws-s3';
|
|
2
|
+
import {Construct} from 'constructs';
|
|
3
|
+
import {CfnWorkGroup} from 'aws-cdk-lib/aws-athena';
|
|
4
|
+
import {CloudFrontAccessLogsByDateTable} from './CloudFrontAccessLogsByDateTable';
|
|
5
|
+
import {AccessLogsParquetTable} from './AccessLogsParquetTable';
|
|
6
|
+
import {Architecture, Code, Function, LayerVersion, Runtime} from 'aws-cdk-lib/aws-lambda';
|
|
7
|
+
import {Rule, RuleTargetInput, Schedule} from 'aws-cdk-lib/aws-events';
|
|
8
|
+
import {CfnTag, Duration, RemovalPolicy, Stack} from 'aws-cdk-lib';
|
|
9
|
+
import {Column, Database} from '@aws-cdk/aws-glue-alpha';
|
|
10
|
+
import {S3EventSource} from 'aws-cdk-lib/aws-lambda-event-sources';
|
|
11
|
+
import {RetentionDays} from 'aws-cdk-lib/aws-logs';
|
|
12
|
+
import {Effect, PolicyStatement} from 'aws-cdk-lib/aws-iam';
|
|
13
|
+
import {LambdaFunction} from 'aws-cdk-lib/aws-events-targets';
|
|
14
|
+
import * as path from 'path';
|
|
15
|
+
import {AccessLogsAnalysisProps} from "./AccessLogsAnalysisProps";
|
|
16
|
+
import {ColumnTransformationRules} from "../../functions/access-logs-analysis/partitioning/types";
|
|
17
|
+
|
|
18
|
+
/**
|
|
19
|
+
* Provides the AWS resources to analyze access logs. This construct is derived from the official AWS sample
|
|
20
|
+
* CloudFormation stack:
|
|
21
|
+
* {@link https://github.com/aws-samples/amazon-cloudfront-access-logs-queries/blob/mainline/template.yaml}
|
|
22
|
+
*/
|
|
23
|
+
export abstract class AccessLogsAnalysis extends Construct {
|
|
24
|
+
|
|
25
|
+
protected static readonly ACCESS_LOGS_FOLDER_UNPROCESSED = 'unprocessed';
|
|
26
|
+
protected static readonly ACCESS_LOGS_FOLDER_GROUPED_BY_DATE = 'by-date';
|
|
27
|
+
protected static readonly ACCESS_LOGS_FOLDER_TRANSFORMED = 'transformed';
|
|
28
|
+
protected static readonly ACCESS_LOGS_FOLDER_ATHENA_RESULTS = 'athena-query-results';
|
|
29
|
+
|
|
30
|
+
protected readonly resourceIdPrefix: string;
|
|
31
|
+
protected readonly bucket: Bucket;
|
|
32
|
+
protected readonly workgroup: CfnWorkGroup;
|
|
33
|
+
protected readonly database: Database;
|
|
34
|
+
protected readonly accessLogsByDateTable: CloudFrontAccessLogsByDateTable;
|
|
35
|
+
protected readonly accessLogsParquetTable: AccessLogsParquetTable;
|
|
36
|
+
protected readonly groupByDateLayer: LayerVersion;
|
|
37
|
+
protected readonly groupByDateLambda: Function;
|
|
38
|
+
protected readonly partitioningLayer: LayerVersion;
|
|
39
|
+
protected readonly createPartitionLambda: Function;
|
|
40
|
+
protected readonly transformPartitionLambda: Function;
|
|
41
|
+
protected readonly createPartitionsScheduler: Rule;
|
|
42
|
+
protected readonly transformPartitionsScheduler: Rule;
|
|
43
|
+
|
|
44
|
+
protected constructor(scope: Construct, id: string, props: AccessLogsAnalysisProps) {
|
|
45
|
+
super(scope, id);
|
|
46
|
+
this.resourceIdPrefix = props.resourcePrefix;
|
|
47
|
+
this.bucket = props.bucket;
|
|
48
|
+
this.setupLifecycleRules(props);
|
|
49
|
+
this.workgroup = this.createWorkgroup();
|
|
50
|
+
this.database = this.createGlueDatabase();
|
|
51
|
+
this.accessLogsByDateTable = this.createAccessLogsByDateTable();
|
|
52
|
+
this.accessLogsParquetTable = this.createAccessLogsParquetTable();
|
|
53
|
+
this.groupByDateLayer = this.createGroupByDateLayer();
|
|
54
|
+
this.groupByDateLambda = this.createGroupByDateLambda();
|
|
55
|
+
this.partitioningLayer = this.createPartitioningLayer();
|
|
56
|
+
this.createPartitionLambda = this.createCreatePartitionLambda();
|
|
57
|
+
this.transformPartitionLambda = this.createTransformPartitionLambda();
|
|
58
|
+
this.createPartitionsScheduler = this.createCreatePartitionsScheduler();
|
|
59
|
+
this.transformPartitionsScheduler = this.createTransformPartitionsScheduler(props);
|
|
60
|
+
}
|
|
61
|
+
|
|
62
|
+
private setupLifecycleRules(props: AccessLogsAnalysisProps): void {
|
|
63
|
+
// cleanup raw and partitioned access logs after a configurable time range
|
|
64
|
+
|
|
65
|
+
this.bucket.addLifecycleRule({
|
|
66
|
+
id: `${this.resourceIdPrefix}-cleanup-unprocessed`,
|
|
67
|
+
prefix: `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_UNPROCESSED}/*`,
|
|
68
|
+
expiration: props.expireRawLogsAfter ?? Duration.days(7),
|
|
69
|
+
});
|
|
70
|
+
|
|
71
|
+
this.bucket.addLifecycleRule({
|
|
72
|
+
id: `${this.resourceIdPrefix}-cleanup-grouped`,
|
|
73
|
+
prefix: `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_GROUPED_BY_DATE}/*`,
|
|
74
|
+
expiration: props.expireIntermediateLogsAfter ?? Duration.days(7),
|
|
75
|
+
});
|
|
76
|
+
|
|
77
|
+
this.bucket.addLifecycleRule({
|
|
78
|
+
id: `${this.resourceIdPrefix}-cleanup-transformed`,
|
|
79
|
+
prefix: `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_TRANSFORMED}/*`,
|
|
80
|
+
expiration: props.expireTransformedLogsAfter ?? Duration.days(180),
|
|
81
|
+
});
|
|
82
|
+
|
|
83
|
+
/* CHECKME: delete query results after 1 week
|
|
84
|
+
this.bucket.addLifecycleRule({
|
|
85
|
+
id: `${this.resourceIdPrefix}-cleanup-query-results`,
|
|
86
|
+
prefix: `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_ATHENA_RESULTS}/*`,
|
|
87
|
+
expiration: Duration.days(7),
|
|
88
|
+
});
|
|
89
|
+
*/
|
|
90
|
+
}
|
|
91
|
+
|
|
92
|
+
private createWorkgroup(): CfnWorkGroup {
|
|
93
|
+
const workgroupName = `${this.resourceIdPrefix}-workgroup`;
|
|
94
|
+
|
|
95
|
+
// due to a current bug, the tags are not automatically assigned to the workgroup
|
|
96
|
+
// note, that the keys must be converted to lower case
|
|
97
|
+
const tags: CfnTag[] = Stack.of(this)
|
|
98
|
+
.tags.renderTags()
|
|
99
|
+
.map((tag: { Key: string; Value: string }) => ({key: tag.Key, value: tag.Value}));
|
|
100
|
+
|
|
101
|
+
return new CfnWorkGroup(this, workgroupName, {
|
|
102
|
+
name: workgroupName,
|
|
103
|
+
workGroupConfiguration: {
|
|
104
|
+
publishCloudWatchMetricsEnabled: false,
|
|
105
|
+
resultConfiguration: {
|
|
106
|
+
outputLocation: `s3://${this.bucket.bucketName}/${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_ATHENA_RESULTS}`,
|
|
107
|
+
},
|
|
108
|
+
enforceWorkGroupConfiguration: true
|
|
109
|
+
},
|
|
110
|
+
tags,
|
|
111
|
+
});
|
|
112
|
+
}
|
|
113
|
+
|
|
114
|
+
private createGlueDatabase(): Database {
|
|
115
|
+
const databaseName = `${this.resourceIdPrefix}-database`;
|
|
116
|
+
return new Database(this, databaseName, {
|
|
117
|
+
// Athena doesn't support dashes in database/table names
|
|
118
|
+
databaseName: databaseName.replace(/-/g, '_'),
|
|
119
|
+
});
|
|
120
|
+
}
|
|
121
|
+
|
|
122
|
+
protected abstract createAccessLogsByDateTable(): CloudFrontAccessLogsByDateTable;
|
|
123
|
+
|
|
124
|
+
protected abstract createAccessLogsParquetTable(): CloudFrontAccessLogsByDateTable;
|
|
125
|
+
|
|
126
|
+
private createGroupByDateLayer(): LayerVersion {
|
|
127
|
+
const layerVersionName = `${this.resourceIdPrefix}-group-by-date-dependencies`;
|
|
128
|
+
return new LayerVersion(this, layerVersionName, {
|
|
129
|
+
layerVersionName,
|
|
130
|
+
compatibleArchitectures: [Architecture.ARM_64, Architecture.X86_64],
|
|
131
|
+
compatibleRuntimes: [Runtime.NODEJS_14_X, Runtime.NODEJS_16_X],
|
|
132
|
+
code: Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/group-by-date/build/layer')),
|
|
133
|
+
removalPolicy: RemovalPolicy.DESTROY,
|
|
134
|
+
});
|
|
135
|
+
}
|
|
136
|
+
|
|
137
|
+
private createPartitioningLayer(): LayerVersion {
|
|
138
|
+
const layerVersionName = `${this.resourceIdPrefix}-partitioning-dependencies`;
|
|
139
|
+
return new LayerVersion(this, layerVersionName, {
|
|
140
|
+
layerVersionName,
|
|
141
|
+
compatibleArchitectures: [Architecture.ARM_64, Architecture.X86_64],
|
|
142
|
+
compatibleRuntimes: [Runtime.NODEJS_14_X, Runtime.NODEJS_16_X],
|
|
143
|
+
code: Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/partitioning/build/layer')),
|
|
144
|
+
removalPolicy: RemovalPolicy.DESTROY,
|
|
145
|
+
});
|
|
146
|
+
}
|
|
147
|
+
|
|
148
|
+
/**
|
|
149
|
+
* A Lambda function to be triggered whenever a new access log is created.
|
|
150
|
+
* It moves the raw access logs into a sub folder hierarchy by year, month, day and hour.
|
|
151
|
+
*/
|
|
152
|
+
private createGroupByDateLambda(): Function {
|
|
153
|
+
const functionName = `${this.resourceIdPrefix}-group-by-date`;
|
|
154
|
+
|
|
155
|
+
const lambda = new Function(this, functionName, {
|
|
156
|
+
functionName,
|
|
157
|
+
architecture: Architecture.ARM_64,
|
|
158
|
+
runtime: Runtime.NODEJS_16_X,
|
|
159
|
+
code: Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/group-by-date/build/app')),
|
|
160
|
+
memorySize: 512,
|
|
161
|
+
timeout: Duration.seconds(20),
|
|
162
|
+
handler: 'index.handler',
|
|
163
|
+
layers: [this.groupByDateLayer],
|
|
164
|
+
events: [
|
|
165
|
+
new S3EventSource(this.bucket, {
|
|
166
|
+
events: [EventType.OBJECT_CREATED],
|
|
167
|
+
filters: [this.getUnprocessedObjectsFilter()],
|
|
168
|
+
}),
|
|
169
|
+
],
|
|
170
|
+
logRetention: RetentionDays.TWO_WEEKS,
|
|
171
|
+
environment: {
|
|
172
|
+
AWS_NODEJS_CONNECTION_REUSE_ENABLED: '1',
|
|
173
|
+
NODE_OPTIONS: '--enable-source-maps',
|
|
174
|
+
TARGET_FOLDER: AccessLogsAnalysis.ACCESS_LOGS_FOLDER_GROUPED_BY_DATE,
|
|
175
|
+
RAW_ACCESS_LOG_FILE_PATTERN: this.getRawAccessLogFilePattern().source,
|
|
176
|
+
},
|
|
177
|
+
});
|
|
178
|
+
|
|
179
|
+
this.bucket.grantReadWrite(lambda);
|
|
180
|
+
this.bucket.grantDelete(lambda, `${AccessLogsAnalysis.ACCESS_LOGS_FOLDER_UNPROCESSED}/*`);
|
|
181
|
+
|
|
182
|
+
return lambda;
|
|
183
|
+
}
|
|
184
|
+
|
|
185
|
+
protected abstract getUnprocessedObjectsFilter(): NotificationKeyFilter;
|
|
186
|
+
|
|
187
|
+
/** The pattern to identify unprocessed access logs depends on the producing source */
|
|
188
|
+
protected abstract getRawAccessLogFilePattern(): RegExp;
|
|
189
|
+
|
|
190
|
+
/**
|
|
191
|
+
* Creates a new partition for the upcoming hour in the access log database.
|
|
192
|
+
*/
|
|
193
|
+
private createCreatePartitionLambda(): Function {
|
|
194
|
+
const functionName = `${this.resourceIdPrefix}-create-part`;
|
|
195
|
+
|
|
196
|
+
const lambda = new Function(this, functionName, {
|
|
197
|
+
functionName,
|
|
198
|
+
architecture: Architecture.ARM_64,
|
|
199
|
+
runtime: Runtime.NODEJS_16_X,
|
|
200
|
+
code: Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/partitioning/build/app'), {
|
|
201
|
+
exclude: ['transform-partition*', '*.d.ts'],
|
|
202
|
+
}),
|
|
203
|
+
memorySize: 128,
|
|
204
|
+
timeout: Duration.seconds(20),
|
|
205
|
+
handler: 'create-partition.handler',
|
|
206
|
+
layers: [this.partitioningLayer],
|
|
207
|
+
logRetention: RetentionDays.TWO_WEEKS,
|
|
208
|
+
environment: {
|
|
209
|
+
AWS_NODEJS_CONNECTION_REUSE_ENABLED: '1',
|
|
210
|
+
NODE_OPTIONS: '--enable-source-maps',
|
|
211
|
+
WORKGROUP: this.workgroup.name,
|
|
212
|
+
DATABASE: this.database.databaseName,
|
|
213
|
+
TABLE: this.accessLogsByDateTable.tableName,
|
|
214
|
+
},
|
|
215
|
+
});
|
|
216
|
+
|
|
217
|
+
// grant access to S3 bucket and to execute Athena queries which create new partitions
|
|
218
|
+
this.bucket.grantReadWrite(lambda);
|
|
219
|
+
lambda.addToRolePolicy(
|
|
220
|
+
new PolicyStatement({
|
|
221
|
+
effect: Effect.ALLOW,
|
|
222
|
+
actions: [
|
|
223
|
+
'athena:StartQueryExecution',
|
|
224
|
+
'athena:GetQueryExecution',
|
|
225
|
+
'glue:CreateDatabase',
|
|
226
|
+
'glue:CreatePartition',
|
|
227
|
+
'glue:GetDatabase',
|
|
228
|
+
'glue:GetTable',
|
|
229
|
+
'glue:BatchCreatePartition',
|
|
230
|
+
],
|
|
231
|
+
resources: ['*'],
|
|
232
|
+
})
|
|
233
|
+
);
|
|
234
|
+
|
|
235
|
+
return lambda;
|
|
236
|
+
}
|
|
237
|
+
|
|
238
|
+
/**
|
|
239
|
+
* Transforms partitions from the Hive format to Parquet.
|
|
240
|
+
*/
|
|
241
|
+
private createTransformPartitionLambda(): Function {
|
|
242
|
+
const functionName = `${this.resourceIdPrefix}-transform-part`;
|
|
243
|
+
|
|
244
|
+
const lambda = new Function(this, functionName, {
|
|
245
|
+
functionName,
|
|
246
|
+
architecture: Architecture.ARM_64,
|
|
247
|
+
runtime: Runtime.NODEJS_16_X,
|
|
248
|
+
code: Code.fromAsset(path.join(__dirname, '../../functions/access-logs-analysis/partitioning/build/app'), {
|
|
249
|
+
exclude: ['create-partition*', '*.d.ts'],
|
|
250
|
+
}),
|
|
251
|
+
memorySize: 128,
|
|
252
|
+
timeout: Duration.seconds(20),
|
|
253
|
+
handler: 'transform-partition.handler',
|
|
254
|
+
layers: [this.partitioningLayer],
|
|
255
|
+
logRetention: RetentionDays.TWO_WEEKS,
|
|
256
|
+
environment: {
|
|
257
|
+
AWS_NODEJS_CONNECTION_REUSE_ENABLED: '1',
|
|
258
|
+
NODE_OPTIONS: '--enable-source-maps',
|
|
259
|
+
WORKGROUP: this.workgroup.name,
|
|
260
|
+
DATABASE: this.database.databaseName,
|
|
261
|
+
SOURCE_TABLE: this.accessLogsByDateTable.tableName,
|
|
262
|
+
TARGET_TABLE: this.accessLogsParquetTable.tableName,
|
|
263
|
+
},
|
|
264
|
+
});
|
|
265
|
+
|
|
266
|
+
// grant access to S3 bucket and to execute Athena queries which create new partitions
|
|
267
|
+
this.bucket.grantReadWrite(lambda);
|
|
268
|
+
lambda.addToRolePolicy(
|
|
269
|
+
new PolicyStatement({
|
|
270
|
+
effect: Effect.ALLOW,
|
|
271
|
+
actions: [
|
|
272
|
+
'athena:StartQueryExecution',
|
|
273
|
+
'athena:GetQueryExecution',
|
|
274
|
+
'glue:CreateDatabase',
|
|
275
|
+
'glue:CreatePartition',
|
|
276
|
+
'glue:GetDatabase',
|
|
277
|
+
'glue:GetTable',
|
|
278
|
+
'glue:BatchCreatePartition',
|
|
279
|
+
'glue:GetPartition',
|
|
280
|
+
'glue:GetPartitions',
|
|
281
|
+
'glue:CreateTable',
|
|
282
|
+
'glue:DeleteTable',
|
|
283
|
+
'glue:DeletePartition',
|
|
284
|
+
],
|
|
285
|
+
resources: ['*'],
|
|
286
|
+
})
|
|
287
|
+
);
|
|
288
|
+
|
|
289
|
+
return lambda;
|
|
290
|
+
}
|
|
291
|
+
|
|
292
|
+
private createCreatePartitionsScheduler(): Rule {
|
|
293
|
+
const ruleName = `${this.resourceIdPrefix}-create-part-sched`;
|
|
294
|
+
return new Rule(this, ruleName, {
|
|
295
|
+
ruleName,
|
|
296
|
+
schedule: Schedule.cron({minute: '55'}),
|
|
297
|
+
targets: [new LambdaFunction(this.createPartitionLambda, {retryAttempts: 10})],
|
|
298
|
+
});
|
|
299
|
+
}
|
|
300
|
+
|
|
301
|
+
private createTransformPartitionsScheduler(props: AccessLogsAnalysisProps): Rule {
|
|
302
|
+
const ruleName = `${this.resourceIdPrefix}-transform-part-sched`;
|
|
303
|
+
return new Rule(this, ruleName, {
|
|
304
|
+
ruleName,
|
|
305
|
+
schedule: Schedule.cron({minute: '1'}),
|
|
306
|
+
targets: [
|
|
307
|
+
new LambdaFunction(this.transformPartitionLambda, {
|
|
308
|
+
event: this.getTransformPartitionInvocationProps(props),
|
|
309
|
+
retryAttempts: 10,
|
|
310
|
+
}),
|
|
311
|
+
],
|
|
312
|
+
});
|
|
313
|
+
}
|
|
314
|
+
|
|
315
|
+
private getTransformPartitionInvocationProps(props: AccessLogsAnalysisProps): RuleTargetInput {
|
|
316
|
+
return RuleTargetInput.fromObject({
|
|
317
|
+
columnNames: [
|
|
318
|
+
...this.accessLogsParquetTable.columns,
|
|
319
|
+
...(this.accessLogsParquetTable.partitionKeys as Column[]),
|
|
320
|
+
].map(column => column.name),
|
|
321
|
+
columnTransformations: this.getColumnTransformationRules(props),
|
|
322
|
+
});
|
|
323
|
+
}
|
|
324
|
+
|
|
325
|
+
/**
|
|
326
|
+
* Needs to return the log source specific column transformation rules
|
|
327
|
+
* (e.g. to anonymize IP addresses).
|
|
328
|
+
*/
|
|
329
|
+
protected abstract getColumnTransformationRules(props: AccessLogsAnalysisProps): ColumnTransformationRules;
|
|
330
|
+
}
|