@aws-mdaa/dataops-job-l3-construct 1.3.0 → 1.5.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.jsii +114 -389
- package/lib/dataops-job-l3-construct.d.ts +30 -240
- package/lib/dataops-job-l3-construct.js +25 -25
- package/node_modules/@aws-mdaa/s3-bucketpolicy-helper/.npmignore +34 -0
- package/node_modules/@aws-mdaa/s3-bucketpolicy-helper/jest.config.js +5 -0
- package/node_modules/@aws-mdaa/s3-bucketpolicy-helper/lib/index.js +1 -1
- package/node_modules/@aws-mdaa/s3-bucketpolicy-helper/lib/index.ts +241 -0
- package/node_modules/@aws-mdaa/s3-bucketpolicy-helper/package.json +16 -18
- package/node_modules/@aws-mdaa/s3-bucketpolicy-helper/test/bucketpolicy-helper.test.d.ts +5 -0
- package/node_modules/@aws-mdaa/s3-bucketpolicy-helper/test/bucketpolicy-helper.test.js +200 -0
- package/node_modules/@aws-mdaa/s3-bucketpolicy-helper/test/bucketpolicy-helper.test.ts +215 -0
- package/node_modules/@aws-mdaa/s3-bucketpolicy-helper/tsconfig.json +40 -0
- package/node_modules/@aws-mdaa/s3-bucketpolicy-helper/tsconfig.tsbuildinfo +1 -0
- package/node_modules/@aws-mdaa/s3-bucketpolicy-helper/typedoc.json +7 -0
- package/node_modules/@aws-mdaa/s3-inventory-helper/.npmignore +34 -0
- package/node_modules/@aws-mdaa/s3-inventory-helper/jest.config.js +5 -0
- package/node_modules/@aws-mdaa/s3-inventory-helper/lib/index.d.ts +2 -20
- package/node_modules/@aws-mdaa/s3-inventory-helper/lib/index.js +2 -11
- package/node_modules/@aws-mdaa/s3-inventory-helper/lib/index.ts +241 -0
- package/node_modules/@aws-mdaa/s3-inventory-helper/package.json +15 -17
- package/node_modules/@aws-mdaa/s3-inventory-helper/test/TODO +0 -0
- package/node_modules/@aws-mdaa/s3-inventory-helper/tsconfig.json +40 -0
- package/node_modules/@aws-mdaa/s3-inventory-helper/tsconfig.tsbuildinfo +1 -0
- package/node_modules/@aws-mdaa/s3-inventory-helper/typedoc.json +7 -0
- package/node_modules/lodash/README.md +2 -2
- package/node_modules/lodash/_baseUnset.js +47 -2
- package/node_modules/lodash/core.js +1 -1
- package/node_modules/lodash/core.min.js +1 -1
- package/node_modules/lodash/lodash.js +43 -4
- package/node_modules/lodash/lodash.min.js +57 -57
- package/node_modules/lodash/package.json +1 -1
- package/package.json +33 -47
- package/node_modules/lodash/flake.lock +0 -40
- package/node_modules/lodash/flake.nix +0 -20
- package/node_modules/lodash/release.md +0 -48
|
@@ -0,0 +1,34 @@
|
|
|
1
|
+
# Don't include original .ts files when doing `npm pack`
|
|
2
|
+
*.ts
|
|
3
|
+
*.tsbuildinfo
|
|
4
|
+
.eslintrc.js
|
|
5
|
+
tsconfig.json
|
|
6
|
+
typedoc.json
|
|
7
|
+
|
|
8
|
+
# dev-related files
|
|
9
|
+
coverage
|
|
10
|
+
test/
|
|
11
|
+
|
|
12
|
+
# pack output
|
|
13
|
+
*.tgz
|
|
14
|
+
|
|
15
|
+
dist
|
|
16
|
+
|
|
17
|
+
|
|
18
|
+
#Exclude coverage reports for bundled deps
|
|
19
|
+
node_modules/**/coverage/*
|
|
20
|
+
# Exclude typescript source and config
|
|
21
|
+
#*.ts
|
|
22
|
+
#tsconfig.json
|
|
23
|
+
|
|
24
|
+
# Include javascript files and typescript declarations
|
|
25
|
+
!*.js
|
|
26
|
+
!*.d.ts
|
|
27
|
+
|
|
28
|
+
# Exclude jsii outdir
|
|
29
|
+
jsii-dist
|
|
30
|
+
|
|
31
|
+
# Include .jsii and .jsii.gz
|
|
32
|
+
!.jsii
|
|
33
|
+
!.jsii.gz
|
|
34
|
+
jest.config.js
|
|
@@ -8,27 +8,9 @@ import { PolicyStatement } from 'aws-cdk-lib/aws-iam';
|
|
|
8
8
|
import { IBucket, Inventory } from 'aws-cdk-lib/aws-s3';
|
|
9
9
|
import { Construct } from 'constructs';
|
|
10
10
|
export interface BucketInventory {
|
|
11
|
-
/**
|
|
12
|
-
* Q-ENHANCED-PROPERTY
|
|
13
|
-
* Name of the S3 bucket for which inventory data has been generated. Identifies the source bucket in inventory data organization and enables bucket-specific inventory querying through Glue table partitions.
|
|
14
|
-
*
|
|
15
|
-
* Use cases: Source bucket identification; Inventory data organization; Multi-bucket inventory management
|
|
16
|
-
*
|
|
17
|
-
* AWS: AWS S3 bucket name for inventory source identification in Glue table partitions
|
|
18
|
-
*
|
|
19
|
-
* Validation: Must be valid S3 bucket name (3-63 characters, lowercase, no underscores)
|
|
20
|
-
**/
|
|
11
|
+
/** Name of the S3 bucket for which inventory data has been generated */
|
|
21
12
|
readonly bucketName: string;
|
|
22
|
-
/**
|
|
23
|
-
* Q-ENHANCED-PROPERTY
|
|
24
|
-
* Name of the S3 inventory configuration that generated the inventory data for the specified bucket. Enables multiple inventory configurations per bucket and organized inventory data management.
|
|
25
|
-
*
|
|
26
|
-
* Use cases: Inventory configuration identification; Multiple inventories per bucket; Inventory data organization
|
|
27
|
-
*
|
|
28
|
-
* AWS: AWS S3 inventory configuration name for inventory data identification in Glue table partitions
|
|
29
|
-
*
|
|
30
|
-
* Validation: Must be valid S3 inventory configuration name matching the inventory ID used in S3 inventory setup
|
|
31
|
-
**/
|
|
13
|
+
/** Name of the S3 inventory configuration that generated the inventory data for the specified bucket */
|
|
32
14
|
readonly inventoryName: string;
|
|
33
15
|
}
|
|
34
16
|
/** Helper class for creating S3 Inventories and associated Glue/Athena resources for querying these inventories. */
|
|
@@ -24,16 +24,7 @@ class InventoryHelper {
|
|
|
24
24
|
return {
|
|
25
25
|
destination: {
|
|
26
26
|
bucket: destinationBucket,
|
|
27
|
-
/**
|
|
28
|
-
* Q-ENHANCED-PROPERTY
|
|
29
|
-
* Required S3 prefix for inventory report destination organization enabling systematic inventory file organization and management. Provides the S3 key prefix for inventory report storage enabling organized inventory data management and efficient retrieval of inventory reports.
|
|
30
|
-
*
|
|
31
|
-
* Use cases: Inventory organization; Report storage; Data management; Systematic file organization
|
|
32
|
-
*
|
|
33
|
-
* AWS: S3 inventory configuration destination prefix for inventory report organization and storage
|
|
34
|
-
*
|
|
35
|
-
* Validation: Must be valid S3 prefix string; required for inventory report destination organization
|
|
36
|
-
*/
|
|
27
|
+
/** S3 prefix for inventory report destination organization enabling systematic inventory file */
|
|
37
28
|
prefix: s3_constructs_1.MdaaBucket.formatS3Prefix(destinationPrefix),
|
|
38
29
|
bucketOwner: bucketOwner,
|
|
39
30
|
},
|
|
@@ -219,4 +210,4 @@ class InventoryHelper {
|
|
|
219
210
|
}
|
|
220
211
|
}
|
|
221
212
|
exports.InventoryHelper = InventoryHelper;
|
|
222
|
-
//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"index.js","sourceRoot":"","sources":["index.ts"],"names":[],"mappings":";AAAA;;;GAGG;;;AAEH,2DAAqD;AAErD,mDAA+D;AAC/D,iDAA8D;AAC9D,+CAAqH;AA4BrH,oHAAoH;AACpH,MAAa,eAAe;IAC1B;;;;;;;OAOG;IACI,MAAM,CAAC,eAAe,CAC3B,iBAA0B,EAC1B,WAAmB,EACnB,aAAsB,EACtB,iBAA0B,EAC1B,kBAA2B;QAE3B,MAAM,WAAW,GAAG,kBAAkB,CAAC,CAAC,CAAC,GAAG,kBAAkB,EAAE,CAAC,CAAC,CAAC,kBAAkB,CAAC;QACtF,OAAO;YACL,WAAW,EAAE;gBACX,MAAM,EAAE,iBAAiB;gBACzB;;;;;;;;;mBASG;gBACH,MAAM,EAAE,0BAAU,CAAC,cAAc,CAAC,iBAAiB,CAAC;gBACpD,WAAW,EAAE,WAAW;aACzB;YACD,MAAM,EAAE,wBAAe,CAAC,OAAO;YAC/B,SAAS,EAAE,2BAAkB,CAAC,KAAK;YACnC,qBAAqB,EAAE,+BAAsB,CAAC,GAAG;YACjD,WAAW,EAAE,WAAW;YACxB,aAAa,EAAE,0BAAU,CAAC,cAAc,CAAC,aAAa,EAAE,KAAK,EAAE,IAAI,CAAC;YACpE,cAAc,EAAE;gBACd,MAAM;gBACN,kBAAkB;gBAClB,cAAc;gBACd,MAAM;gBACN,qBAAqB;gBACrB,mBAAmB;gBACnB,kBAAkB;gBAClB,2BAA2B;gBAC3B,gBAAgB;gBAChB,2BAA2B;gBAC3B,8BAA8B;aAC/B;SACF,CAAC;IACJ,CAAC;IAED;;;;;;;;;;OAUG;IACI,MAAM,CAAC,kBAAkB,CAC9B,KAAgB,EAChB,SAAiB,EACjB,eAAuB,EACvB,QAAkB,EAClB,kBAA0B,EAC1B,iBAAoC,EACpC,cAAuB;QAEvB,MAAM,QAAQ,GAAG,cAAc;YAC7B,CAAC,CAAC,QAAQ,kBAAkB,IAAI,0BAAU,CAAC,cAAc,CAAC,cAAc,CAAC,GAAG;YAC5E,CAAC,CAAC,QAAQ,kBAAkB,GAAG,CAAC;QAClC,MAAM,UAAU,GAAG;YACjB,IAAI,EAAE,GAAG,eAAe,MAAM,CAAC,OAAO,CAAC,KAAK,EAAE,GAAG,CAAC;YAClD,UAAU,EAAE;gBACV,QAAQ,EAAE,MAAM;gBAChB,oBAAoB,EAAE,MAAM;gBAC5B,oBAAoB,EAAE,MAAM;gBAC5B,qBAAqB,EAAE,sBAAsB;gBAC7C,sBAAsB,EAAE,kBAAkB;gBAC1C,wBAAwB,EAAE,GAAG;gBAC7B,6BAA6B,EAAE,OAAO;gBACtC,kCAAkC,EAAE,MAAM;gBAC1C,oCAAoC,EAAE,iBAAiB;qBACpD,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,GAAG,CAAC,CAAC,UAAU,IAAI,CAAC,CAAC,aAAa,EAAE,CAAC;qBAC9C,IAAI,CAAC,GAAG,CAAC;gBACZ,2BAA2B,EAAE,QAAQ,GAAG,mCAAmC;aAC5E;YACD,SAAS,EAAE,gBAAgB;YAC3B,aAAa,EAAE;gBACb;oBACE,IAAI,EAAE,kBAAkB;oBACxB,IAAI,EAAE,QAAQ;iBACf;gBACD;oBACE,IAAI,EAAE,IAAI;oBACV,IAAI,EAAE,QAAQ;iBACf;aACF;YACD,iBAAiB,EAAE;gBACjB,OAAO,EAAE;oBACP;wBACE,IAAI,EAAE,QAAQ;wBACd,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,KAAK;wBACX,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,YAAY;wBAClB,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,WAAW;wBACjB,IAAI,EAAE,SAAS;qBAChB;oBACD;wBACE,IAAI,EAAE,kBAAkB;wBACxB,IAAI,EAAE,SAAS;qBAChB;oBACD;wBACE,IAAI,EAAE,MAAM;wBACZ,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,oBAAoB;wBAC1B,IAAI,EAAE,WAAW;qBAClB;oBACD;wBACE,IAAI,EAAE,OAAO;wBACb,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,eAAe;wBACrB,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,uBAAuB;wBAC7B,IAAI,EAAE,SAAS;qBAChB;oBACD;wBACE,IAAI,EAAE,oBAAoB;wBAC1B,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,mBAAmB;wBACzB,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,0BAA0B;wBAChC,IAAI,EAAE,QAAQ;qBACf;oBACD,IAAI;oBACJ,IAAI;oBACJ,6CAA6C;oBAC7C,wBAAwB;oBACxB,KAAK;oBACL,IAAI;oBACJ,gCAAgC;oBAChC,qBAAqB;oBACrB,KAAK;oBACL,IAAI;oBACJ,6CAA6C;oBAC7C,qBAAqB;oBACrB,IAAI;iBACL;gBACD,QAAQ,EAAE,QAAQ;gBAClB,WAAW,EAAE,qDAAqD;gBAClE,YAAY,EAAE,4DAA4D;gBAC1E,UAAU,EAAE,KAAK;gBACjB,eAAe,EAAE,CAAC,CAAC;gBACnB,SAAS,EAAE;oBACT,oBAAoB,EAAE,6DAA6D;oBACnF,UAAU,EAAE;wBACV,sBAAsB,EAAE,GAAG;qBAC5B;iBACF;aACF;SACF,CAAC;QAEF,MAAM,UAAU,GAAkB;YAChC,SAAS,EAAE,SAAS;YACpB,YAAY,EAAE,QAAQ,CAAC,YAAY;YACnC,UAAU,EAAE,UAAU;SACvB,CAAC;QACF,OAAO,IAAI,mBAAQ,CAAC,KAAK,EAAE,aAAa,eAAe,EAAE,EAAE,UAAU,CAAC,CAAC;IACzE,CAAC;IAED;;;;;;;OAOG;IACI,MAAM,CAAC,oCAAoC,CAChD,SAAiB,EACjB,UAAkB,EAClB,eAAwB,EACxB,eAAwB;QAExB,MAAM,QAAQ,GAAG,eAAe;YAC9B,CAAC,CAAC,GAAG,SAAS,IAAI,0BAAU,CAAC,cAAc,CAAC,eAAe,CAAC,IAAI;YAChE,CAAC,CAAC,GAAG,SAAS,IAAI,CAAC;QACrB,MAAM,gBAAgB,GAAG,IAAI,yBAAe,CAAC;YAC3C,GAAG,EAAE,kBAAkB;YACvB,MAAM,EAAE,gBAAM,CAAC,KAAK;YACpB,SAAS,EAAE,CAAC,QAAQ,CAAC;YACrB,OAAO,EAAE,CAAC,cAAc,CAAC;SAC1B,CAAC,CAAC;QACH,gBAAgB,CAAC,YAAY,CAAC,cAAc,EAAE;YAC5C,mBAAmB,EAAE,UAAU;YAC/B,cAAc,EAAE,2BAA2B;SAC5C,CAAC,CAAC;QACH,IAAI,eAAe,EAAE;YACnB,gBAAgB,CAAC,YAAY,CAAC,SAAS,EAAE;gBACvC,eAAe,EAAE,eAAe;aACjC,CAAC,CAAC;SACJ;QACD,gBAAgB,CAAC,mBAAmB,CAAC,kBAAkB,CAAC,CAAC;QACzD,OAAO,gBAAgB,CAAC;IAC1B,CAAC;CACF;AArOD,0CAqOC","sourcesContent":["/*!\n * Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.\n * SPDX-License-Identifier: Apache-2.0\n */\n\nimport { MdaaBucket } from '@aws-mdaa/s3-constructs';\nimport { Database } from '@aws-cdk/aws-glue-alpha';\nimport { CfnTable, CfnTableProps } from 'aws-cdk-lib/aws-glue';\nimport { Effect, PolicyStatement } from 'aws-cdk-lib/aws-iam';\nimport { IBucket, Inventory, InventoryFormat, InventoryFrequency, InventoryObjectVersion } from 'aws-cdk-lib/aws-s3';\nimport { Construct } from 'constructs';\n\nexport interface BucketInventory {\n  /**\n   * Q-ENHANCED-PROPERTY\n   * Name of the S3 bucket for which inventory data has been generated. Identifies the source bucket in inventory data organization and enables bucket-specific inventory querying through Glue table partitions.\n   *\n   * Use cases: Source bucket identification; Inventory data organization; Multi-bucket inventory management\n   *\n   * AWS: AWS S3 bucket name for inventory source identification in Glue table partitions\n   *\n   * Validation: Must be valid S3 bucket name (3-63 characters, lowercase, no underscores)\n   **/\n  readonly bucketName: string;\n  /**\n   * Q-ENHANCED-PROPERTY\n   * Name of the S3 inventory configuration that generated the inventory data for the specified bucket. Enables multiple inventory configurations per bucket and organized inventory data management.\n   *\n   * Use cases: Inventory configuration identification; Multiple inventories per bucket; Inventory data organization\n   *\n   * AWS: AWS S3 inventory configuration name for inventory data identification in Glue table partitions\n   *\n   * Validation: Must be valid S3 inventory configuration name matching the inventory ID used in S3 inventory setup\n   **/\n  readonly inventoryName: string;\n}\n\n/** Helper class for creating S3 Inventories and associated Glue/Athena resources for querying these inventories. */\nexport class InventoryHelper {\n  /**\n   * Helper method for creating an S3 inventory.\n   * @param destinationBucket The bucket where S3 inventory data will be written\n   * @param inventoryId The S3 inventory ID\n   * @param objectsPrefix The object prefix from which inventory will be produced (on the bucket to which the inventory config is applied)\n   * @param destinationPrefix The object prefix under which inventory will be written on the destination bucket.\n   * @returns An S3 Inventory Config which can be applied to a bucket in order to produce periodic inventory data.\n   */\n  public static createInvConfig(\n    destinationBucket: IBucket,\n    inventoryId: string,\n    objectsPrefix?: string,\n    destinationPrefix?: string,\n    destinationAccount?: string,\n  ): Inventory {\n    const bucketOwner = destinationAccount ? `${destinationAccount}` : destinationAccount;\n    return {\n      destination: {\n        bucket: destinationBucket,\n        /**\n         * Q-ENHANCED-PROPERTY\n         * Required S3 prefix for inventory report destination organization enabling systematic inventory file organization and management. Provides the S3 key prefix for inventory report storage enabling organized inventory data management and efficient retrieval of inventory reports.\n         *\n         * Use cases: Inventory organization; Report storage; Data management; Systematic file organization\n         *\n         * AWS: S3 inventory configuration destination prefix for inventory report organization and storage\n         *\n         * Validation: Must be valid S3 prefix string; required for inventory report destination organization\n         */\n        prefix: MdaaBucket.formatS3Prefix(destinationPrefix),\n        bucketOwner: bucketOwner,\n      },\n      format: InventoryFormat.PARQUET,\n      frequency: InventoryFrequency.DAILY,\n      includeObjectVersions: InventoryObjectVersion.ALL,\n      inventoryId: inventoryId,\n      objectsPrefix: MdaaBucket.formatS3Prefix(objectsPrefix, false, true),\n      optionalFields: [\n        'Size',\n        'LastModifiedDate',\n        'StorageClass',\n        'ETag',\n        'IsMultipartUploaded',\n        'ReplicationStatus',\n        'EncryptionStatus',\n        'ObjectLockRetainUntilDate',\n        'ObjectLockMode',\n        'ObjectLockLegalHoldStatus',\n        'IntelligentTieringAccessTier',\n      ],\n    };\n  }\n\n  /**\n   * Helper method for creating a Glue table which can be used to query inventory data generated by an S3 Inventory config\n   * @param scope Stack in which the table will be created\n   * @param tableNamePrefix Will be used to prefix the table name.\n   * @param locationBucketName The bucket where the inventory data is stored.\n   * @param inventoryBucket The bucket for which inventory data has been generated\n   * @param database The Glue database in which the table will be created\n   * @param inventoryName The name of the S3 Inventory config\n   * @param locationPrefix The S3 Prefix on the location bucket where the inventory is stored.\n   * @returns A Glue table which can be used to query S3 inventory data in an S3 bucket.\n   */\n  public static createGlueInvTable(\n    scope: Construct,\n    catalogId: string,\n    tableNamePrefix: string,\n    database: Database,\n    locationBucketName: string,\n    bucketInventories: BucketInventory[],\n    locationPrefix?: string,\n  ): CfnTable {\n    const location = locationPrefix\n      ? `s3://${locationBucketName}/${MdaaBucket.formatS3Prefix(locationPrefix)}/`\n      : `s3://${locationBucketName}/`;\n    const tableInput = {\n      name: `${tableNamePrefix}_inv`.replace(/-/gi, '_'),\n      parameters: {\n        EXTERNAL: 'TRUE',\n        'projection.enabled': 'true',\n        'projection.dt.type': 'date',\n        'projection.dt.range': '2022-01-01-00-00,NOW',\n        'projection.dt.format': 'yyyy-MM-dd-HH-mm',\n        'projection.dt.interval': '1',\n        'projection.dt.interval.unit': 'HOURS',\n        'projection.bucket_inventory.type': 'enum',\n        'projection.bucket_inventory.values': bucketInventories\n          .map(x => `${x.bucketName}/${x.inventoryName}`)\n          .join(','),\n        'storage.location.template': location + '${bucket_inventory}/hive/dt=${dt}',\n      },\n      tableType: 'EXTERNAL_TABLE',\n      partitionKeys: [\n        {\n          name: 'bucket_inventory',\n          type: 'string',\n        },\n        {\n          name: 'dt',\n          type: 'string',\n        },\n      ],\n      storageDescriptor: {\n        columns: [\n          {\n            name: 'bucket',\n            type: 'string',\n          },\n          {\n            name: 'key',\n            type: 'string',\n          },\n          {\n            name: 'version_id',\n            type: 'string',\n          },\n          {\n            name: 'is_latest',\n            type: 'boolean',\n          },\n          {\n            name: 'is_delete_marker',\n            type: 'boolean',\n          },\n          {\n            name: 'size',\n            type: 'bigint',\n          },\n          {\n            name: 'last_modified_date',\n            type: 'timestamp',\n          },\n          {\n            name: 'e_tag',\n            type: 'string',\n          },\n          {\n            name: 'storage_class',\n            type: 'string',\n          },\n          {\n            name: 'is_multipart_uploaded',\n            type: 'boolean',\n          },\n          {\n            name: 'replication_status',\n            type: 'string',\n          },\n          {\n            name: 'encryption_status',\n            type: 'string',\n          },\n          {\n            name: 'intelligent_tiering_tier',\n            type: 'string',\n          },\n          // ,\n          // {\n          //     name: \"object_lock_retain_until_date\",\n          //     type: \"timestamp\"\n          // },\n          // {\n          //     name: \"object_lock_mode\",\n          //     type: \"string\"\n          // },\n          // {\n          //     name: \"object_lock_legal_hold_status\",\n          //     type: \"string\"\n          // }\n        ],\n        location: location,\n        inputFormat: 'org.apache.hadoop.hive.ql.io.SymlinkTextInputFormat',\n        outputFormat: 'org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat',\n        compressed: false,\n        numberOfBuckets: -1,\n        serdeInfo: {\n          serializationLibrary: 'org.apache.hadoop.hive.ql.io.parquet.serde.ParquetHiveSerDe',\n          parameters: {\n            'serialization.format': '1',\n          },\n        },\n      },\n    };\n\n    const tableProps: CfnTableProps = {\n      catalogId: catalogId,\n      databaseName: database.databaseName,\n      tableInput: tableInput,\n    };\n    return new CfnTable(scope, `inv-table-${tableNamePrefix}`, tableProps);\n  }\n\n  /**\n   * Helper method to generate an S3 Bucket Policy Statement allowing S3 service to write inventories to a bucket.\n   * @param sourceBucketArn The bucket arn for which inventory data is being produced\n   * @param bucketArn  The bucket arn where inventory will be stored\n   * @param srcAccount The account which owns the source bucket from which inventory is being produced.\n   * @param inventoryPrefix The prefix on the destination bucket where inventory data will be stored.\n   * @returns A policy statement which permits the S3 service principal to write inventory for the source bucket/account to the destination bucket.\n   */\n  public static createInventoryBucketPolicyStatement(\n    bucketArn: string,\n    srcAccount: string,\n    sourceBucketArn?: string,\n    inventoryPrefix?: string,\n  ): PolicyStatement {\n    const resource = inventoryPrefix\n      ? `${bucketArn}/${MdaaBucket.formatS3Prefix(inventoryPrefix)}/*`\n      : `${bucketArn}/*`;\n    const allowS3Inventory = new PolicyStatement({\n      sid: 'AllowS3Inventory',\n      effect: Effect.ALLOW,\n      resources: [resource],\n      actions: ['s3:PutObject'],\n    });\n    allowS3Inventory.addCondition('StringEquals', {\n      'aws:SourceAccount': srcAccount,\n      's3:x-amz-acl': 'bucket-owner-full-control',\n    });\n    if (sourceBucketArn) {\n      allowS3Inventory.addCondition('ArnLike', {\n        'aws:SourceArn': sourceBucketArn,\n      });\n    }\n    allowS3Inventory.addServicePrincipal('s3.amazonaws.com');\n    return allowS3Inventory;\n  }\n}\n"]}
|
|
213
|
+
//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"index.js","sourceRoot":"","sources":["index.ts"],"names":[],"mappings":";AAAA;;;GAGG;;;AAEH,2DAAqD;AAErD,mDAA+D;AAC/D,iDAA8D;AAC9D,+CAAqH;AAUrH,oHAAoH;AACpH,MAAa,eAAe;IAC1B;;;;;;;OAOG;IACI,MAAM,CAAC,eAAe,CAC3B,iBAA0B,EAC1B,WAAmB,EACnB,aAAsB,EACtB,iBAA0B,EAC1B,kBAA2B;QAE3B,MAAM,WAAW,GAAG,kBAAkB,CAAC,CAAC,CAAC,GAAG,kBAAkB,EAAE,CAAC,CAAC,CAAC,kBAAkB,CAAC;QACtF,OAAO;YACL,WAAW,EAAE;gBACX,MAAM,EAAE,iBAAiB;gBACzB,iGAAiG;gBACjG,MAAM,EAAE,0BAAU,CAAC,cAAc,CAAC,iBAAiB,CAAC;gBACpD,WAAW,EAAE,WAAW;aACzB;YACD,MAAM,EAAE,wBAAe,CAAC,OAAO;YAC/B,SAAS,EAAE,2BAAkB,CAAC,KAAK;YACnC,qBAAqB,EAAE,+BAAsB,CAAC,GAAG;YACjD,WAAW,EAAE,WAAW;YACxB,aAAa,EAAE,0BAAU,CAAC,cAAc,CAAC,aAAa,EAAE,KAAK,EAAE,IAAI,CAAC;YACpE,cAAc,EAAE;gBACd,MAAM;gBACN,kBAAkB;gBAClB,cAAc;gBACd,MAAM;gBACN,qBAAqB;gBACrB,mBAAmB;gBACnB,kBAAkB;gBAClB,2BAA2B;gBAC3B,gBAAgB;gBAChB,2BAA2B;gBAC3B,8BAA8B;aAC/B;SACF,CAAC;IACJ,CAAC;IAED;;;;;;;;;;OAUG;IACI,MAAM,CAAC,kBAAkB,CAC9B,KAAgB,EAChB,SAAiB,EACjB,eAAuB,EACvB,QAAkB,EAClB,kBAA0B,EAC1B,iBAAoC,EACpC,cAAuB;QAEvB,MAAM,QAAQ,GAAG,cAAc;YAC7B,CAAC,CAAC,QAAQ,kBAAkB,IAAI,0BAAU,CAAC,cAAc,CAAC,cAAc,CAAC,GAAG;YAC5E,CAAC,CAAC,QAAQ,kBAAkB,GAAG,CAAC;QAClC,MAAM,UAAU,GAAG;YACjB,IAAI,EAAE,GAAG,eAAe,MAAM,CAAC,OAAO,CAAC,KAAK,EAAE,GAAG,CAAC;YAClD,UAAU,EAAE;gBACV,QAAQ,EAAE,MAAM;gBAChB,oBAAoB,EAAE,MAAM;gBAC5B,oBAAoB,EAAE,MAAM;gBAC5B,qBAAqB,EAAE,sBAAsB;gBAC7C,sBAAsB,EAAE,kBAAkB;gBAC1C,wBAAwB,EAAE,GAAG;gBAC7B,6BAA6B,EAAE,OAAO;gBACtC,kCAAkC,EAAE,MAAM;gBAC1C,oCAAoC,EAAE,iBAAiB;qBACpD,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,GAAG,CAAC,CAAC,UAAU,IAAI,CAAC,CAAC,aAAa,EAAE,CAAC;qBAC9C,IAAI,CAAC,GAAG,CAAC;gBACZ,2BAA2B,EAAE,QAAQ,GAAG,mCAAmC;aAC5E;YACD,SAAS,EAAE,gBAAgB;YAC3B,aAAa,EAAE;gBACb;oBACE,IAAI,EAAE,kBAAkB;oBACxB,IAAI,EAAE,QAAQ;iBACf;gBACD;oBACE,IAAI,EAAE,IAAI;oBACV,IAAI,EAAE,QAAQ;iBACf;aACF;YACD,iBAAiB,EAAE;gBACjB,OAAO,EAAE;oBACP;wBACE,IAAI,EAAE,QAAQ;wBACd,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,KAAK;wBACX,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,YAAY;wBAClB,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,WAAW;wBACjB,IAAI,EAAE,SAAS;qBAChB;oBACD;wBACE,IAAI,EAAE,kBAAkB;wBACxB,IAAI,EAAE,SAAS;qBAChB;oBACD;wBACE,IAAI,EAAE,MAAM;wBACZ,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,oBAAoB;wBAC1B,IAAI,EAAE,WAAW;qBAClB;oBACD;wBACE,IAAI,EAAE,OAAO;wBACb,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,eAAe;wBACrB,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,uBAAuB;wBAC7B,IAAI,EAAE,SAAS;qBAChB;oBACD;wBACE,IAAI,EAAE,oBAAoB;wBAC1B,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,mBAAmB;wBACzB,IAAI,EAAE,QAAQ;qBACf;oBACD;wBACE,IAAI,EAAE,0BAA0B;wBAChC,IAAI,EAAE,QAAQ;qBACf;oBACD,IAAI;oBACJ,IAAI;oBACJ,6CAA6C;oBAC7C,wBAAwB;oBACxB,KAAK;oBACL,IAAI;oBACJ,gCAAgC;oBAChC,qBAAqB;oBACrB,KAAK;oBACL,IAAI;oBACJ,6CAA6C;oBAC7C,qBAAqB;oBACrB,IAAI;iBACL;gBACD,QAAQ,EAAE,QAAQ;gBAClB,WAAW,EAAE,qDAAqD;gBAClE,YAAY,EAAE,4DAA4D;gBAC1E,UAAU,EAAE,KAAK;gBACjB,eAAe,EAAE,CAAC,CAAC;gBACnB,SAAS,EAAE;oBACT,oBAAoB,EAAE,6DAA6D;oBACnF,UAAU,EAAE;wBACV,sBAAsB,EAAE,GAAG;qBAC5B;iBACF;aACF;SACF,CAAC;QAEF,MAAM,UAAU,GAAkB;YAChC,SAAS,EAAE,SAAS;YACpB,YAAY,EAAE,QAAQ,CAAC,YAAY;YACnC,UAAU,EAAE,UAAU;SACvB,CAAC;QACF,OAAO,IAAI,mBAAQ,CAAC,KAAK,EAAE,aAAa,eAAe,EAAE,EAAE,UAAU,CAAC,CAAC;IACzE,CAAC;IAED;;;;;;;OAOG;IACI,MAAM,CAAC,oCAAoC,CAChD,SAAiB,EACjB,UAAkB,EAClB,eAAwB,EACxB,eAAwB;QAExB,MAAM,QAAQ,GAAG,eAAe;YAC9B,CAAC,CAAC,GAAG,SAAS,IAAI,0BAAU,CAAC,cAAc,CAAC,eAAe,CAAC,IAAI;YAChE,CAAC,CAAC,GAAG,SAAS,IAAI,CAAC;QACrB,MAAM,gBAAgB,GAAG,IAAI,yBAAe,CAAC;YAC3C,GAAG,EAAE,kBAAkB;YACvB,MAAM,EAAE,gBAAM,CAAC,KAAK;YACpB,SAAS,EAAE,CAAC,QAAQ,CAAC;YACrB,OAAO,EAAE,CAAC,cAAc,CAAC;SAC1B,CAAC,CAAC;QACH,gBAAgB,CAAC,YAAY,CAAC,cAAc,EAAE;YAC5C,mBAAmB,EAAE,UAAU;YAC/B,cAAc,EAAE,2BAA2B;SAC5C,CAAC,CAAC;QACH,IAAI,eAAe,EAAE,CAAC;YACpB,gBAAgB,CAAC,YAAY,CAAC,SAAS,EAAE;gBACvC,eAAe,EAAE,eAAe;aACjC,CAAC,CAAC;QACL,CAAC;QACD,gBAAgB,CAAC,mBAAmB,CAAC,kBAAkB,CAAC,CAAC;QACzD,OAAO,gBAAgB,CAAC;IAC1B,CAAC;CACF;AA5ND,0CA4NC","sourcesContent":["/*!\n * Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.\n * SPDX-License-Identifier: Apache-2.0\n */\n\nimport { MdaaBucket } from '@aws-mdaa/s3-constructs';\nimport { Database } from '@aws-cdk/aws-glue-alpha';\nimport { CfnTable, CfnTableProps } from 'aws-cdk-lib/aws-glue';\nimport { Effect, PolicyStatement } from 'aws-cdk-lib/aws-iam';\nimport { IBucket, Inventory, InventoryFormat, InventoryFrequency, InventoryObjectVersion } from 'aws-cdk-lib/aws-s3';\nimport { Construct } from 'constructs';\n\nexport interface BucketInventory {\n  /** Name of the S3 bucket for which inventory data has been generated */\n  readonly bucketName: string;\n  /** Name of the S3 inventory configuration that generated the inventory data for the specified bucket */\n  readonly inventoryName: string;\n}\n\n/** Helper class for creating S3 Inventories and associated Glue/Athena resources for querying these inventories. */\nexport class InventoryHelper {\n  /**\n   * Helper method for creating an S3 inventory.\n   * @param destinationBucket The bucket where S3 inventory data will be written\n   * @param inventoryId The S3 inventory ID\n   * @param objectsPrefix The object prefix from which inventory will be produced (on the bucket to which the inventory config is applied)\n   * @param destinationPrefix The object prefix under which inventory will be written on the destination bucket.\n   * @returns An S3 Inventory Config which can be applied to a bucket in order to produce periodic inventory data.\n   */\n  public static createInvConfig(\n    destinationBucket: IBucket,\n    inventoryId: string,\n    objectsPrefix?: string,\n    destinationPrefix?: string,\n    destinationAccount?: string,\n  ): Inventory {\n    const bucketOwner = destinationAccount ? `${destinationAccount}` : destinationAccount;\n    return {\n      destination: {\n        bucket: destinationBucket,\n        /** S3 prefix for inventory report destination organization enabling systematic inventory file */\n        prefix: MdaaBucket.formatS3Prefix(destinationPrefix),\n        bucketOwner: bucketOwner,\n      },\n      format: InventoryFormat.PARQUET,\n      frequency: InventoryFrequency.DAILY,\n      includeObjectVersions: InventoryObjectVersion.ALL,\n      inventoryId: inventoryId,\n      objectsPrefix: MdaaBucket.formatS3Prefix(objectsPrefix, false, true),\n      optionalFields: [\n        'Size',\n        'LastModifiedDate',\n        'StorageClass',\n        'ETag',\n        'IsMultipartUploaded',\n        'ReplicationStatus',\n        'EncryptionStatus',\n        'ObjectLockRetainUntilDate',\n        'ObjectLockMode',\n        'ObjectLockLegalHoldStatus',\n        'IntelligentTieringAccessTier',\n      ],\n    };\n  }\n\n  /**\n   * Helper method for creating a Glue table which can be used to query inventory data generated by an S3 Inventory config\n   * @param scope Stack in which the table will be created\n   * @param tableNamePrefix Will be used to prefix the table name.\n   * @param locationBucketName The bucket where the inventory data is stored.\n   * @param inventoryBucket The bucket for which inventory data has been generated\n   * @param database The Glue database in which the table will be created\n   * @param inventoryName The name of the S3 Inventory config\n   * @param locationPrefix The S3 Prefix on the location bucket where the inventory is stored.\n   * @returns A Glue table which can be used to query S3 inventory data in an S3 bucket.\n   */\n  public static createGlueInvTable(\n    scope: Construct,\n    catalogId: string,\n    tableNamePrefix: string,\n    database: Database,\n    locationBucketName: string,\n    bucketInventories: BucketInventory[],\n    locationPrefix?: string,\n  ): CfnTable {\n    const location = locationPrefix\n      ? `s3://${locationBucketName}/${MdaaBucket.formatS3Prefix(locationPrefix)}/`\n      : `s3://${locationBucketName}/`;\n    const tableInput = {\n      name: `${tableNamePrefix}_inv`.replace(/-/gi, '_'),\n      parameters: {\n        EXTERNAL: 'TRUE',\n        'projection.enabled': 'true',\n        'projection.dt.type': 'date',\n        'projection.dt.range': '2022-01-01-00-00,NOW',\n        'projection.dt.format': 'yyyy-MM-dd-HH-mm',\n        'projection.dt.interval': '1',\n        'projection.dt.interval.unit': 'HOURS',\n        'projection.bucket_inventory.type': 'enum',\n        'projection.bucket_inventory.values': bucketInventories\n          .map(x => `${x.bucketName}/${x.inventoryName}`)\n          .join(','),\n        'storage.location.template': location + '${bucket_inventory}/hive/dt=${dt}',\n      },\n      tableType: 'EXTERNAL_TABLE',\n      partitionKeys: [\n        {\n          name: 'bucket_inventory',\n          type: 'string',\n        },\n        {\n          name: 'dt',\n          type: 'string',\n        },\n      ],\n      storageDescriptor: {\n        columns: [\n          {\n            name: 'bucket',\n            type: 'string',\n          },\n          {\n            name: 'key',\n            type: 'string',\n          },\n          {\n            name: 'version_id',\n            type: 'string',\n          },\n          {\n            name: 'is_latest',\n            type: 'boolean',\n          },\n          {\n            name: 'is_delete_marker',\n            type: 'boolean',\n          },\n          {\n            name: 'size',\n            type: 'bigint',\n          },\n          {\n            name: 'last_modified_date',\n            type: 'timestamp',\n          },\n          {\n            name: 'e_tag',\n            type: 'string',\n          },\n          {\n            name: 'storage_class',\n            type: 'string',\n          },\n          {\n            name: 'is_multipart_uploaded',\n            type: 'boolean',\n          },\n          {\n            name: 'replication_status',\n            type: 'string',\n          },\n          {\n            name: 'encryption_status',\n            type: 'string',\n          },\n          {\n            name: 'intelligent_tiering_tier',\n            type: 'string',\n          },\n          // ,\n          // {\n          //     name: \"object_lock_retain_until_date\",\n          //     type: \"timestamp\"\n          // },\n          // {\n          //     name: \"object_lock_mode\",\n          //     type: \"string\"\n          // },\n          // {\n          //     name: \"object_lock_legal_hold_status\",\n          //     type: \"string\"\n          // }\n        ],\n        location: location,\n        inputFormat: 'org.apache.hadoop.hive.ql.io.SymlinkTextInputFormat',\n        outputFormat: 'org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat',\n        compressed: false,\n        numberOfBuckets: -1,\n        serdeInfo: {\n          serializationLibrary: 'org.apache.hadoop.hive.ql.io.parquet.serde.ParquetHiveSerDe',\n          parameters: {\n            'serialization.format': '1',\n          },\n        },\n      },\n    };\n\n    const tableProps: CfnTableProps = {\n      catalogId: catalogId,\n      databaseName: database.databaseName,\n      tableInput: tableInput,\n    };\n    return new CfnTable(scope, `inv-table-${tableNamePrefix}`, tableProps);\n  }\n\n  /**\n   * Helper method to generate an S3 Bucket Policy Statement allowing S3 service to write inventories to a bucket.\n   * @param sourceBucketArn The bucket arn for which inventory data is being produced\n   * @param bucketArn  The bucket arn where inventory will be stored\n   * @param srcAccount The account which owns the source bucket from which inventory is being produced.\n   * @param inventoryPrefix The prefix on the destination bucket where inventory data will be stored.\n   * @returns A policy statement which permits the S3 service principal to write inventory for the source bucket/account to the destination bucket.\n   */\n  public static createInventoryBucketPolicyStatement(\n    bucketArn: string,\n    srcAccount: string,\n    sourceBucketArn?: string,\n    inventoryPrefix?: string,\n  ): PolicyStatement {\n    const resource = inventoryPrefix\n      ? `${bucketArn}/${MdaaBucket.formatS3Prefix(inventoryPrefix)}/*`\n      : `${bucketArn}/*`;\n    const allowS3Inventory = new PolicyStatement({\n      sid: 'AllowS3Inventory',\n      effect: Effect.ALLOW,\n      resources: [resource],\n      actions: ['s3:PutObject'],\n    });\n    allowS3Inventory.addCondition('StringEquals', {\n      'aws:SourceAccount': srcAccount,\n      's3:x-amz-acl': 'bucket-owner-full-control',\n    });\n    if (sourceBucketArn) {\n      allowS3Inventory.addCondition('ArnLike', {\n        'aws:SourceArn': sourceBucketArn,\n      });\n    }\n    allowS3Inventory.addServicePrincipal('s3.amazonaws.com');\n    return allowS3Inventory;\n  }\n}\n"]}
|
|
@@ -0,0 +1,241 @@
|
|
|
1
|
+
/*!
|
|
2
|
+
* Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
|
|
3
|
+
* SPDX-License-Identifier: Apache-2.0
|
|
4
|
+
*/
|
|
5
|
+
|
|
6
|
+
import { MdaaBucket } from '@aws-mdaa/s3-constructs';
|
|
7
|
+
import { Database } from '@aws-cdk/aws-glue-alpha';
|
|
8
|
+
import { CfnTable, CfnTableProps } from 'aws-cdk-lib/aws-glue';
|
|
9
|
+
import { Effect, PolicyStatement } from 'aws-cdk-lib/aws-iam';
|
|
10
|
+
import { IBucket, Inventory, InventoryFormat, InventoryFrequency, InventoryObjectVersion } from 'aws-cdk-lib/aws-s3';
|
|
11
|
+
import { Construct } from 'constructs';
|
|
12
|
+
|
|
13
|
+
export interface BucketInventory {
|
|
14
|
+
/** Name of the S3 bucket for which inventory data has been generated */
|
|
15
|
+
readonly bucketName: string;
|
|
16
|
+
/** Name of the S3 inventory configuration that generated the inventory data for the specified bucket */
|
|
17
|
+
readonly inventoryName: string;
|
|
18
|
+
}
|
|
19
|
+
|
|
20
|
+
/** Helper class for creating S3 Inventories and associated Glue/Athena resources for querying these inventories. */
|
|
21
|
+
export class InventoryHelper {
|
|
22
|
+
/**
|
|
23
|
+
* Helper method for creating an S3 inventory.
|
|
24
|
+
* @param destinationBucket The bucket where S3 inventory data will be written
|
|
25
|
+
* @param inventoryId The S3 inventory ID
|
|
26
|
+
* @param objectsPrefix The object prefix from which inventory will be produced (on the bucket to which the inventory config is applied)
|
|
27
|
+
* @param destinationPrefix The object prefix under which inventory will be written on the destination bucket.
|
|
28
|
+
* @returns An S3 Inventory Config which can be applied to a bucket in order to produce periodic inventory data.
|
|
29
|
+
*/
|
|
30
|
+
public static createInvConfig(
|
|
31
|
+
destinationBucket: IBucket,
|
|
32
|
+
inventoryId: string,
|
|
33
|
+
objectsPrefix?: string,
|
|
34
|
+
destinationPrefix?: string,
|
|
35
|
+
destinationAccount?: string,
|
|
36
|
+
): Inventory {
|
|
37
|
+
const bucketOwner = destinationAccount ? `${destinationAccount}` : destinationAccount;
|
|
38
|
+
return {
|
|
39
|
+
destination: {
|
|
40
|
+
bucket: destinationBucket,
|
|
41
|
+
/** S3 prefix for inventory report destination organization enabling systematic inventory file */
|
|
42
|
+
prefix: MdaaBucket.formatS3Prefix(destinationPrefix),
|
|
43
|
+
bucketOwner: bucketOwner,
|
|
44
|
+
},
|
|
45
|
+
format: InventoryFormat.PARQUET,
|
|
46
|
+
frequency: InventoryFrequency.DAILY,
|
|
47
|
+
includeObjectVersions: InventoryObjectVersion.ALL,
|
|
48
|
+
inventoryId: inventoryId,
|
|
49
|
+
objectsPrefix: MdaaBucket.formatS3Prefix(objectsPrefix, false, true),
|
|
50
|
+
optionalFields: [
|
|
51
|
+
'Size',
|
|
52
|
+
'LastModifiedDate',
|
|
53
|
+
'StorageClass',
|
|
54
|
+
'ETag',
|
|
55
|
+
'IsMultipartUploaded',
|
|
56
|
+
'ReplicationStatus',
|
|
57
|
+
'EncryptionStatus',
|
|
58
|
+
'ObjectLockRetainUntilDate',
|
|
59
|
+
'ObjectLockMode',
|
|
60
|
+
'ObjectLockLegalHoldStatus',
|
|
61
|
+
'IntelligentTieringAccessTier',
|
|
62
|
+
],
|
|
63
|
+
};
|
|
64
|
+
}
|
|
65
|
+
|
|
66
|
+
/**
|
|
67
|
+
* Helper method for creating a Glue table which can be used to query inventory data generated by an S3 Inventory config
|
|
68
|
+
* @param scope Stack in which the table will be created
|
|
69
|
+
* @param tableNamePrefix Will be used to prefix the table name.
|
|
70
|
+
* @param locationBucketName The bucket where the inventory data is stored.
|
|
71
|
+
* @param inventoryBucket The bucket for which inventory data has been generated
|
|
72
|
+
* @param database The Glue database in which the table will be created
|
|
73
|
+
* @param inventoryName The name of the S3 Inventory config
|
|
74
|
+
* @param locationPrefix The S3 Prefix on the location bucket where the inventory is stored.
|
|
75
|
+
* @returns A Glue table which can be used to query S3 inventory data in an S3 bucket.
|
|
76
|
+
*/
|
|
77
|
+
public static createGlueInvTable(
|
|
78
|
+
scope: Construct,
|
|
79
|
+
catalogId: string,
|
|
80
|
+
tableNamePrefix: string,
|
|
81
|
+
database: Database,
|
|
82
|
+
locationBucketName: string,
|
|
83
|
+
bucketInventories: BucketInventory[],
|
|
84
|
+
locationPrefix?: string,
|
|
85
|
+
): CfnTable {
|
|
86
|
+
const location = locationPrefix
|
|
87
|
+
? `s3://${locationBucketName}/${MdaaBucket.formatS3Prefix(locationPrefix)}/`
|
|
88
|
+
: `s3://${locationBucketName}/`;
|
|
89
|
+
const tableInput = {
|
|
90
|
+
name: `${tableNamePrefix}_inv`.replace(/-/gi, '_'),
|
|
91
|
+
parameters: {
|
|
92
|
+
EXTERNAL: 'TRUE',
|
|
93
|
+
'projection.enabled': 'true',
|
|
94
|
+
'projection.dt.type': 'date',
|
|
95
|
+
'projection.dt.range': '2022-01-01-00-00,NOW',
|
|
96
|
+
'projection.dt.format': 'yyyy-MM-dd-HH-mm',
|
|
97
|
+
'projection.dt.interval': '1',
|
|
98
|
+
'projection.dt.interval.unit': 'HOURS',
|
|
99
|
+
'projection.bucket_inventory.type': 'enum',
|
|
100
|
+
'projection.bucket_inventory.values': bucketInventories
|
|
101
|
+
.map(x => `${x.bucketName}/${x.inventoryName}`)
|
|
102
|
+
.join(','),
|
|
103
|
+
'storage.location.template': location + '${bucket_inventory}/hive/dt=${dt}',
|
|
104
|
+
},
|
|
105
|
+
tableType: 'EXTERNAL_TABLE',
|
|
106
|
+
partitionKeys: [
|
|
107
|
+
{
|
|
108
|
+
name: 'bucket_inventory',
|
|
109
|
+
type: 'string',
|
|
110
|
+
},
|
|
111
|
+
{
|
|
112
|
+
name: 'dt',
|
|
113
|
+
type: 'string',
|
|
114
|
+
},
|
|
115
|
+
],
|
|
116
|
+
storageDescriptor: {
|
|
117
|
+
columns: [
|
|
118
|
+
{
|
|
119
|
+
name: 'bucket',
|
|
120
|
+
type: 'string',
|
|
121
|
+
},
|
|
122
|
+
{
|
|
123
|
+
name: 'key',
|
|
124
|
+
type: 'string',
|
|
125
|
+
},
|
|
126
|
+
{
|
|
127
|
+
name: 'version_id',
|
|
128
|
+
type: 'string',
|
|
129
|
+
},
|
|
130
|
+
{
|
|
131
|
+
name: 'is_latest',
|
|
132
|
+
type: 'boolean',
|
|
133
|
+
},
|
|
134
|
+
{
|
|
135
|
+
name: 'is_delete_marker',
|
|
136
|
+
type: 'boolean',
|
|
137
|
+
},
|
|
138
|
+
{
|
|
139
|
+
name: 'size',
|
|
140
|
+
type: 'bigint',
|
|
141
|
+
},
|
|
142
|
+
{
|
|
143
|
+
name: 'last_modified_date',
|
|
144
|
+
type: 'timestamp',
|
|
145
|
+
},
|
|
146
|
+
{
|
|
147
|
+
name: 'e_tag',
|
|
148
|
+
type: 'string',
|
|
149
|
+
},
|
|
150
|
+
{
|
|
151
|
+
name: 'storage_class',
|
|
152
|
+
type: 'string',
|
|
153
|
+
},
|
|
154
|
+
{
|
|
155
|
+
name: 'is_multipart_uploaded',
|
|
156
|
+
type: 'boolean',
|
|
157
|
+
},
|
|
158
|
+
{
|
|
159
|
+
name: 'replication_status',
|
|
160
|
+
type: 'string',
|
|
161
|
+
},
|
|
162
|
+
{
|
|
163
|
+
name: 'encryption_status',
|
|
164
|
+
type: 'string',
|
|
165
|
+
},
|
|
166
|
+
{
|
|
167
|
+
name: 'intelligent_tiering_tier',
|
|
168
|
+
type: 'string',
|
|
169
|
+
},
|
|
170
|
+
// ,
|
|
171
|
+
// {
|
|
172
|
+
// name: "object_lock_retain_until_date",
|
|
173
|
+
// type: "timestamp"
|
|
174
|
+
// },
|
|
175
|
+
// {
|
|
176
|
+
// name: "object_lock_mode",
|
|
177
|
+
// type: "string"
|
|
178
|
+
// },
|
|
179
|
+
// {
|
|
180
|
+
// name: "object_lock_legal_hold_status",
|
|
181
|
+
// type: "string"
|
|
182
|
+
// }
|
|
183
|
+
],
|
|
184
|
+
location: location,
|
|
185
|
+
inputFormat: 'org.apache.hadoop.hive.ql.io.SymlinkTextInputFormat',
|
|
186
|
+
outputFormat: 'org.apache.hadoop.hive.ql.io.HiveIgnoreKeyTextOutputFormat',
|
|
187
|
+
compressed: false,
|
|
188
|
+
numberOfBuckets: -1,
|
|
189
|
+
serdeInfo: {
|
|
190
|
+
serializationLibrary: 'org.apache.hadoop.hive.ql.io.parquet.serde.ParquetHiveSerDe',
|
|
191
|
+
parameters: {
|
|
192
|
+
'serialization.format': '1',
|
|
193
|
+
},
|
|
194
|
+
},
|
|
195
|
+
},
|
|
196
|
+
};
|
|
197
|
+
|
|
198
|
+
const tableProps: CfnTableProps = {
|
|
199
|
+
catalogId: catalogId,
|
|
200
|
+
databaseName: database.databaseName,
|
|
201
|
+
tableInput: tableInput,
|
|
202
|
+
};
|
|
203
|
+
return new CfnTable(scope, `inv-table-${tableNamePrefix}`, tableProps);
|
|
204
|
+
}
|
|
205
|
+
|
|
206
|
+
/**
|
|
207
|
+
* Helper method to generate an S3 Bucket Policy Statement allowing S3 service to write inventories to a bucket.
|
|
208
|
+
* @param sourceBucketArn The bucket arn for which inventory data is being produced
|
|
209
|
+
* @param bucketArn The bucket arn where inventory will be stored
|
|
210
|
+
* @param srcAccount The account which owns the source bucket from which inventory is being produced.
|
|
211
|
+
* @param inventoryPrefix The prefix on the destination bucket where inventory data will be stored.
|
|
212
|
+
* @returns A policy statement which permits the S3 service principal to write inventory for the source bucket/account to the destination bucket.
|
|
213
|
+
*/
|
|
214
|
+
public static createInventoryBucketPolicyStatement(
|
|
215
|
+
bucketArn: string,
|
|
216
|
+
srcAccount: string,
|
|
217
|
+
sourceBucketArn?: string,
|
|
218
|
+
inventoryPrefix?: string,
|
|
219
|
+
): PolicyStatement {
|
|
220
|
+
const resource = inventoryPrefix
|
|
221
|
+
? `${bucketArn}/${MdaaBucket.formatS3Prefix(inventoryPrefix)}/*`
|
|
222
|
+
: `${bucketArn}/*`;
|
|
223
|
+
const allowS3Inventory = new PolicyStatement({
|
|
224
|
+
sid: 'AllowS3Inventory',
|
|
225
|
+
effect: Effect.ALLOW,
|
|
226
|
+
resources: [resource],
|
|
227
|
+
actions: ['s3:PutObject'],
|
|
228
|
+
});
|
|
229
|
+
allowS3Inventory.addCondition('StringEquals', {
|
|
230
|
+
'aws:SourceAccount': srcAccount,
|
|
231
|
+
's3:x-amz-acl': 'bucket-owner-full-control',
|
|
232
|
+
});
|
|
233
|
+
if (sourceBucketArn) {
|
|
234
|
+
allowS3Inventory.addCondition('ArnLike', {
|
|
235
|
+
'aws:SourceArn': sourceBucketArn,
|
|
236
|
+
});
|
|
237
|
+
}
|
|
238
|
+
allowS3Inventory.addServicePrincipal('s3.amazonaws.com');
|
|
239
|
+
return allowS3Inventory;
|
|
240
|
+
}
|
|
241
|
+
}
|
|
@@ -5,35 +5,33 @@
|
|
|
5
5
|
"name": "Amazon Web Services",
|
|
6
6
|
"url": "https://aws.amazon.com/solutions"
|
|
7
7
|
},
|
|
8
|
-
"version": "1.
|
|
8
|
+
"version": "1.5.0",
|
|
9
9
|
"main": "lib/index.js",
|
|
10
10
|
"types": "lib/index.d.ts",
|
|
11
11
|
"license": "Apache-2.0",
|
|
12
12
|
"scripts": {
|
|
13
13
|
"build": "tsc",
|
|
14
14
|
"watch": "tsc -w",
|
|
15
|
-
"test": "jest --passWithNoTests --
|
|
16
|
-
"lint": "eslint --max-warnings 0 -c
|
|
17
|
-
"test
|
|
15
|
+
"test": "jest --passWithNoTests --testPathIgnorePatterns='.*\\.snapshot\\.test\\.ts'",
|
|
16
|
+
"lint": "eslint --max-warnings 0 -c ../../../eslint.config.mjs",
|
|
17
|
+
"test:coverage": "jest --passWithNoTests --coverage --testPathIgnorePatterns='.*\\.snapshot\\.test\\.ts'",
|
|
18
|
+
"test:snapshots": "jest --passWithNoTests --testPathPattern='.*\\.snapshot\\.test\\.ts'",
|
|
19
|
+
"test:snapshots:update": "jest --passWithNoTests --testPathPattern='.*\\.snapshot\\.test\\.ts' --updateSnapshot"
|
|
18
20
|
},
|
|
19
21
|
"devDependencies": {
|
|
20
|
-
"@types/jest": "29.5.
|
|
21
|
-
"@types/node": "
|
|
22
|
+
"@types/jest": "29.5.14",
|
|
23
|
+
"@types/node": "22.9.0",
|
|
22
24
|
"@types/prettier": "2.6.0",
|
|
23
|
-
"jest": "29.
|
|
24
|
-
"ts-jest": "29.
|
|
25
|
-
"ts-node": "10.9.
|
|
26
|
-
"typescript": "
|
|
27
|
-
"typescript-json-schema": "0.
|
|
28
|
-
},
|
|
29
|
-
"overrides": {
|
|
30
|
-
"aws-cdk-lib": "2.220.0",
|
|
31
|
-
"@types/babel__traverse": "7.18.2"
|
|
25
|
+
"jest": "29.7.0",
|
|
26
|
+
"ts-jest": "29.4.6",
|
|
27
|
+
"ts-node": "10.9.2",
|
|
28
|
+
"typescript": "5.9.3",
|
|
29
|
+
"typescript-json-schema": "0.67.1"
|
|
32
30
|
},
|
|
33
31
|
"dependencies": {
|
|
34
32
|
"@aws-cdk/aws-glue-alpha": "2.220.0-alpha.0",
|
|
35
|
-
"@aws-mdaa/naming": "1.
|
|
36
|
-
"@aws-mdaa/s3-constructs": "1.
|
|
33
|
+
"@aws-mdaa/naming": "1.5.0",
|
|
34
|
+
"@aws-mdaa/s3-constructs": "1.5.0",
|
|
37
35
|
"aws-cdk-lib": "2.220.0",
|
|
38
36
|
"cdk-nag": "2.37.55",
|
|
39
37
|
"constructs": "10.0.96"
|
|
File without changes
|
|
@@ -0,0 +1,40 @@
|
|
|
1
|
+
{
|
|
2
|
+
"compilerOptions": {
|
|
3
|
+
"declarationMap": false,
|
|
4
|
+
"inlineSourceMap": true,
|
|
5
|
+
"inlineSources": true,
|
|
6
|
+
"alwaysStrict": true,
|
|
7
|
+
"removeComments": false,
|
|
8
|
+
"declaration": true,
|
|
9
|
+
"experimentalDecorators": true,
|
|
10
|
+
"incremental": true,
|
|
11
|
+
"lib": [
|
|
12
|
+
"es2020"
|
|
13
|
+
],
|
|
14
|
+
"module": "CommonJS",
|
|
15
|
+
"newLine": "lf",
|
|
16
|
+
"noEmitOnError": true,
|
|
17
|
+
"noFallthroughCasesInSwitch": true,
|
|
18
|
+
"noImplicitAny": true,
|
|
19
|
+
"noImplicitReturns": true,
|
|
20
|
+
"noImplicitThis": true,
|
|
21
|
+
"noUnusedLocals": true,
|
|
22
|
+
"noUnusedParameters": true,
|
|
23
|
+
"resolveJsonModule": true,
|
|
24
|
+
"skipLibCheck": true,
|
|
25
|
+
"strict": true,
|
|
26
|
+
"strictNullChecks": true,
|
|
27
|
+
"strictPropertyInitialization": true,
|
|
28
|
+
"stripInternal": false,
|
|
29
|
+
"target": "ES2020",
|
|
30
|
+
"composite": true,
|
|
31
|
+
"tsBuildInfoFile": "tsconfig.tsbuildinfo"
|
|
32
|
+
},
|
|
33
|
+
"include": [
|
|
34
|
+
"**/*.ts"
|
|
35
|
+
],
|
|
36
|
+
"exclude": [
|
|
37
|
+
"node_modules"
|
|
38
|
+
],
|
|
39
|
+
"_generated_by_jsii_": "Generated by jsii - safe to delete, and ideally should be in .gitignore"
|
|
40
|
+
}
|