aws-cdk-neuronx-patterns 0.2.1 → 0.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.jsii +604 -99
- package/API.md +990 -210
- package/README.ja.md +18 -6
- package/README.md +16 -5
- package/lib/base/aws-batch/neuronx-batch-compute-environment.js +1 -1
- package/lib/base/aws-batch/neuronx-batch-ecs-job-definition.js +1 -1
- package/lib/base/aws-batch/neuronx-batch.js +1 -1
- package/lib/base/aws-ecs-patterns/application-load-balanced-neuronx-service.js +4 -4
- package/lib/base/neuronx/deep-learning-containers.js +3 -3
- package/lib/base/neuronx/model.js +2 -2
- package/lib/base/neuronx/neuron-optimized-machine-image.js +1 -1
- package/lib/base/neuronx/neuronx-instance-type.js +4 -4
- package/lib/base/neuronx-compiler/index.d.ts +3 -1
- package/lib/base/neuronx-compiler/index.js +4 -2
- package/lib/base/neuronx-compiler/{neuronx-compiler.d.ts → neuronx-compiler-base.d.ts} +74 -32
- package/lib/base/neuronx-compiler/neuronx-compiler-base.js +129 -0
- package/lib/base/neuronx-compiler/neuronx-cross-compiler.d.ts +30 -0
- package/lib/base/neuronx-compiler/neuronx-cross-compiler.js +83 -0
- package/lib/base/neuronx-compiler/neuronx-native-compiler.d.ts +18 -0
- package/lib/base/neuronx-compiler/neuronx-native-compiler.js +69 -0
- package/lib/base/server-engine/vllm-engine/vllm-engine-argments.js +1 -1
- package/lib/sagemaker-inference-toolkit-tnx/sagemaker-inference-toolkit-tnx-compiler.js +2 -2
- package/lib/sagemaker-inference-toolkit-tnx/sagemaker-inference-toolkit-tnx-sagemaker.d.ts +1 -1
- package/lib/sagemaker-inference-toolkit-tnx/sagemaker-inference-toolkit-tnx-sagemaker.js +2 -2
- package/lib/vllm-nxd-inference/vllm-nxd-inference-compiler.d.ts +8 -0
- package/lib/vllm-nxd-inference/vllm-nxd-inference-compiler.js +32 -4
- package/lib/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.js +6 -6
- package/package.json +5 -5
- package/scripts/compile/vllm-nxd-inference/Dockerfile +5 -0
- package/scripts/compile/vllm-nxd-inference/entrypoint.sh +39 -14
- package/lib/base/neuronx-compiler/neuronx-compiler.js +0 -166
package/README.ja.md
CHANGED
|
@@ -87,7 +87,10 @@ new cdk.CfnOutput(stack, "LoadBalancerDNS", {
|
|
|
87
87
|
## vLLM NxD Inference on ALB & ECS on EC2
|
|
88
88
|
|
|
89
89
|
> [!WARNING]
|
|
90
|
-
> このコンストラクトは EC2 上で Inferentia2
|
|
90
|
+
> このコンストラクトは EC2 上で Inferentia2 インスタンスを推論に使用します。AWS アカウントで Inferentia2 インスタンスのサービスクォータを増やす必要がある場合があります。[Service Quotas コンソール](https://console.aws.amazon.com/servicequotas/)から申請してください。
|
|
91
|
+
>
|
|
92
|
+
> [!NOTE]
|
|
93
|
+
> モデルのコンパイルは標準(非 Neuron)EC2 インスタンス上でクロスコンパイルにより実行されるため、コンパイルフェーズでは Inferentia/Trainium のクォータは不要です。
|
|
91
94
|
|
|
92
95
|
このパターンは、モデルのコンパイルに `VllmNxdInferenceCompiler` を、デプロイに `ApplicationLoadBalancedVllmNxDInferenceService` を組み合わせて使用します。HuggingFace で公開されているモデルを簡単にコンパイルし、Application Load Balancer を使った ECS にデプロイできます。
|
|
93
96
|
|
|
@@ -320,7 +323,16 @@ Secret は、コンパイル Batch Job と推論サーバーを実行する ECS
|
|
|
320
323
|
|
|
321
324
|
## Neuronx Compiler
|
|
322
325
|
|
|
323
|
-
>
|
|
326
|
+
> このコンストラクトは EC2 上で Inferentia2 インスタンスを使用します。AWS アカウントで Inferentia2 インスタンスのサービスクォータを増やす必要がある場合があります。
|
|
327
|
+
|
|
328
|
+
このコンストラクトは、Neuronx でサポートされているモデルをコンパイルし、指定された S3 バケットにアップロードします。コンストラクトは、モデルのパラメータ数に基づいて必要なインスタンスタイプを自動的に選択します。
|
|
329
|
+
|
|
330
|
+
コンパイラーには2つのバリアントがあります:
|
|
331
|
+
|
|
332
|
+
- **`NeuronxNativeCompiler`** — Neuron インスタンス(Inferentia2/Trainium)上でコンパイルします。Neuron デバイスクォータが必要です。
|
|
333
|
+
- **`NeuronxCrossCompiler`** — 標準 EC2 インスタンス(例:`c7i-flex.4xlarge`)上で Neuron ハードウェアなしにクロスコンパイルします。`VllmNxdInferenceCompiler` がデフォルトで使用します。
|
|
334
|
+
|
|
335
|
+
両方とも `INeuronxCompiler` インターフェースを実装し、互換性のあるアーティファクトを生成します。
|
|
324
336
|
> このコンストラクトは EC2 上で Inferentia2 インスタンスを使用します。AWS アカウントで Inferentia2 インスタンスのサービスクォータを増やす必要がある場合があります。
|
|
325
337
|
|
|
326
338
|
このコンストラクトは、Neuronx でサポートされているモデルをコンパイルし、指定された S3 バケットにアップロードします。コンストラクトは、モデルのパラメータ数に基づいて必要なインスタンスタイプを自動的に選択します。
|
|
@@ -330,13 +342,13 @@ Secret は、コンパイル Batch Job と推論サーバーを実行する ECS
|
|
|
330
342
|
```ts
|
|
331
343
|
import * as ec2 from "aws-cdk-lib/aws-ec2";
|
|
332
344
|
import * as s3 from "aws-cdk-lib/aws-s3";
|
|
333
|
-
import {
|
|
345
|
+
import { NeuronxNativeCompiler, Model } from "aws-cdk-neuronx-patterns";
|
|
334
346
|
|
|
335
347
|
declare const vpc: ec2.Vpc;
|
|
336
348
|
declare const bucket: s3.Bucket;
|
|
337
349
|
declare const image: INeuronxContainerImage;
|
|
338
350
|
|
|
339
|
-
const compiler = new
|
|
351
|
+
const compiler = new NeuronxNativeCompiler(this, "NeuronxCompiler", {
|
|
340
352
|
vpc,
|
|
341
353
|
bucket,
|
|
342
354
|
model: Model.fromHuggingFace("HuggingFaceTB/SmolLM-135M-Instruct"),
|
|
@@ -362,13 +374,13 @@ new cdk.CfnOutput(this, "CompiledArtifact", {
|
|
|
362
374
|
```ts
|
|
363
375
|
import * as ec2 from "aws-cdk-lib/aws-ec2";
|
|
364
376
|
import * as s3 from "aws-cdk-lib/aws-s3";
|
|
365
|
-
import {
|
|
377
|
+
import { NeuronxNativeCompiler, Model } from "aws-cdk-neuronx-patterns";
|
|
366
378
|
|
|
367
379
|
declare const vpc: ec2.Vpc;
|
|
368
380
|
declare const bucket: s3.Bucket;
|
|
369
381
|
declare const image: INeuronxContainerImage;
|
|
370
382
|
|
|
371
|
-
new
|
|
383
|
+
new NeuronxNativeCompiler(this, "NeuronxCompiler", {
|
|
372
384
|
vpc,
|
|
373
385
|
bucket,
|
|
374
386
|
model: Model.fromHuggingFace("HuggingFaceTB/SmolLM-135M-Instruct"),
|
package/README.md
CHANGED
|
@@ -87,7 +87,10 @@ new cdk.CfnOutput(stack, "LoadBalancerDNS", {
|
|
|
87
87
|
## vLLM NxD Inference on ALB & ECS on EC2
|
|
88
88
|
|
|
89
89
|
> [!WARNING]
|
|
90
|
-
> This construct uses an Inferentia2 instance on EC2. You may need to increase your service quota for Inferentia2 instances in your AWS account via the [Service Quotas console](https://console.aws.amazon.com/servicequotas/).
|
|
90
|
+
> This construct uses an Inferentia2 instance on EC2 for inference. You may need to increase your service quota for Inferentia2 instances in your AWS account via the [Service Quotas console](https://console.aws.amazon.com/servicequotas/).
|
|
91
|
+
|
|
92
|
+
> [!NOTE]
|
|
93
|
+
> Model compilation is performed on standard (non-Neuron) EC2 instances via cross-compilation, so no Inferentia/Trainium quota is needed for the compilation phase.
|
|
91
94
|
|
|
92
95
|
This pattern combines `VllmNxdInferenceCompiler` for model compilation and `ApplicationLoadBalancedVllmNxDInferenceService` for deployment. Models published on HuggingFace can be easily compiled and deployed to ECS with Application Load Balancer.
|
|
93
96
|
|
|
@@ -325,18 +328,25 @@ The secret will be securely passed as an environment variable to the compilation
|
|
|
325
328
|
|
|
326
329
|
This construct compiles models supported by Neuronx and uploads them to the specified S3 bucket. The construct automatically selects the required instance type based on the number of model parameters.
|
|
327
330
|
|
|
331
|
+
There are two compiler variants:
|
|
332
|
+
|
|
333
|
+
- **`NeuronxNativeCompiler`** — Compiles on Neuron instances (Inferentia2/Trainium). Requires Neuron device quota.
|
|
334
|
+
- **`NeuronxCrossCompiler`** — Compiles on standard EC2 instances (e.g., `c7i-flex.4xlarge`) without Neuron hardware. Used by `VllmNxdInferenceCompiler` by default.
|
|
335
|
+
|
|
336
|
+
Both implement the `INeuronxCompiler` interface and produce compatible artifacts.
|
|
337
|
+
|
|
328
338
|

|
|
329
339
|
|
|
330
340
|
```ts
|
|
331
341
|
import * as ec2 from "aws-cdk-lib/aws-ec2";
|
|
332
342
|
import * as s3 from "aws-cdk-lib/aws-s3";
|
|
333
|
-
import {
|
|
343
|
+
import { NeuronxNativeCompiler, Model } from "aws-cdk-neuronx-patterns";
|
|
334
344
|
|
|
335
345
|
declare const vpc: ec2.Vpc;
|
|
336
346
|
declare const bucket: s3.Bucket;
|
|
337
347
|
declare const image: INeuronxContainerImage;
|
|
338
348
|
|
|
339
|
-
const compiler = new
|
|
349
|
+
const compiler = new NeuronxNativeCompiler(this, "NeuronxCompiler", {
|
|
340
350
|
vpc,
|
|
341
351
|
bucket,
|
|
342
352
|
model: Model.fromHuggingFace("HuggingFaceTB/SmolLM-135M-Instruct"),
|
|
@@ -362,13 +372,13 @@ You can reduce costs by using Spot Instances for compilation:
|
|
|
362
372
|
```ts
|
|
363
373
|
import * as ec2 from "aws-cdk-lib/aws-ec2";
|
|
364
374
|
import * as s3 from "aws-cdk-lib/aws-s3";
|
|
365
|
-
import {
|
|
375
|
+
import { NeuronxNativeCompiler, Model } from "aws-cdk-neuronx-patterns";
|
|
366
376
|
|
|
367
377
|
declare const vpc: ec2.Vpc;
|
|
368
378
|
declare const bucket: s3.Bucket;
|
|
369
379
|
declare const image: INeuronxContainerImage;
|
|
370
380
|
|
|
371
|
-
new
|
|
381
|
+
new NeuronxNativeCompiler(this, "NeuronxCompiler", {
|
|
372
382
|
vpc,
|
|
373
383
|
bucket,
|
|
374
384
|
model: Model.fromHuggingFace("HuggingFaceTB/SmolLM-135M-Instruct"),
|
|
@@ -395,6 +405,7 @@ For detailed API documentation, see [API.md](./API.md).
|
|
|
395
405
|
For cost estimates, use the [AWS Pricing Calculator](https://calculator.aws).
|
|
396
406
|
|
|
397
407
|
**Cost optimization tips:**
|
|
408
|
+
- The `VllmNxdInferenceCompiler` uses cross-compilation on standard EC2 instances by default, avoiding expensive Neuron instances during compilation
|
|
398
409
|
- Use Spot Instances for compilation jobs (can save up to 90%)
|
|
399
410
|
- Delete resources when not in use (`cdk destroy`)
|
|
400
411
|
- Use appropriate instance sizes for your workload
|
|
@@ -44,5 +44,5 @@ class NeuronxBatchComputeEnvironment extends constructs_1.Construct {
|
|
|
44
44
|
}
|
|
45
45
|
exports.NeuronxBatchComputeEnvironment = NeuronxBatchComputeEnvironment;
|
|
46
46
|
_a = JSII_RTTI_SYMBOL_1;
|
|
47
|
-
NeuronxBatchComputeEnvironment[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxBatchComputeEnvironment", version: "0.
|
|
47
|
+
NeuronxBatchComputeEnvironment[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxBatchComputeEnvironment", version: "0.3.0" };
|
|
48
48
|
//# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoibmV1cm9ueC1iYXRjaC1jb21wdXRlLWVudmlyb25tZW50LmpzIiwic291cmNlUm9vdCI6IiIsInNvdXJjZXMiOlsiLi4vLi4vLi4vc3JjL2Jhc2UvYXdzLWJhdGNoL25ldXJvbngtYmF0Y2gtY29tcHV0ZS1lbnZpcm9ubWVudC50cyJdLCJuYW1lcyI6W10sIm1hcHBpbmdzIjoiOzs7OztBQUNBLCtDQUErQztBQUMvQyxpREFBcUQ7QUFFckQsMkNBQXVDO0FBQ3ZDLHdDQUF5RDtBQVF6RDs7R0FFRztBQUNILE1BQWEsOEJBQ1gsU0FBUSxzQkFBUztJQVVqQixJQUFJLHFCQUFxQjtRQUN2QixPQUFPLEVBQUUscUJBQXFCLEVBQUUsSUFBSSxDQUFDLHFCQUFxQixFQUFFLENBQUM7SUFDL0QsQ0FBQztJQUVELFlBQ0UsS0FBZ0IsRUFDaEIsRUFBVSxFQUNWLEtBQTBDO1FBRTFDLEtBQUssQ0FBQyxLQUFLLEVBQUUsRUFBRSxDQUFDLENBQUM7UUFFakIsTUFBTSxNQUFNLEdBQUcsS0FBSyxDQUFDLE1BQU0sSUFBSTtZQUM3QjtnQkFDRSxLQUFLLEVBQUUsSUFBSSxxQ0FBMkIsQ0FDcEMsSUFBSSxFQUNKLDZCQUE2QixDQUM5QjtnQkFDRCxTQUFTLEVBQUUsS0FBSyxDQUFDLG1CQUFtQixDQUFDLFVBQVU7YUFDaEQ7U0FDRixDQUFDO1FBQ0YsSUFBSSxDQUFDLFFBQVEsR0FBRyxJQUFJLEtBQUssQ0FBQywrQkFBK0IsQ0FDdkQsSUFBSSxFQUNKLFVBQVUsRUFDVjtZQUNFLEdBQUcsS0FBSztZQUNSLE1BQU07U0FDUCxDQUNGLENBQUM7UUFDRixJQUNFLEtBQUssQ0FBQyxjQUFjO1lBQ3BCLEtBQUssQ0FBQyxjQUFjLFlBQVksd0JBQWMsRUFDOUMsQ0FBQztZQUVDLElBQUksQ0FBQyxRQUFRLENBQUMsSUFBSSxDQUFDLFlBQ3BCLENBQUMsbUJBQW1CLENBQ25CLHlDQUF5QyxFQUN6QyxLQUFLLENBQUMsY0FBYyxDQUFDLG1CQUFtQixDQUN6QyxDQUFDO1FBQ0osQ0FBQztRQUVELElBQUksQ0FBQyxxQkFBcUIsR0FBRyxJQUFJLENBQUMsUUFBUSxDQUFDLHFCQUFxQixDQUFDO1FBQ2pFLElBQUksQ0FBQyxzQkFBc0IsR0FBRyxJQUFJLENBQUMsUUFBUSxDQUFDLHNCQUFzQixDQUFDO1FBQ25FLElBQUksQ0FBQyxPQUFPLEdBQUcsSUFBSSxDQUFDLFFBQVEsQ0FBQyxPQUFPLENBQUM7UUFDckMsSUFBSSxDQUFDLEdBQUcsR0FBRyxJQUFJLENBQUMsUUFBUSxDQUFDLEdBQUcsQ0FBQztRQUM3QixJQUFJLENBQUMsV0FBVyxHQUFHLElBQUksQ0FBQyxRQUFRLENBQUMsV0FBVyxDQUFDO1FBQzdDLElBQUksQ0FBQyxLQUFLLEdBQUcsSUFBSSxDQUFDLFFBQVEsQ0FBQyxLQUFLLENBQUM7UUFDakMsSUFBSSxDQUFDLFlBQVksR0FBRyxJQUFJLENBQUMsUUFBUSxDQUFDLFlBQWEsQ0FBQztJQUNsRCxDQUFDO0lBQ0Qsa0JBQWtCLENBQUMsTUFBcUI7UUFDdEMsSUFBSSxDQUFDLFFBQVEsQ0FBQyxrQkFBa0IsQ0FBQyxNQUFNLENBQUMsQ0FBQztJQUMzQyxDQUFDOztBQTdESCx3RUE4REMiLCJzb3VyY2VzQ29udGVudCI6WyJpbXBvcnQgeyBSZW1vdmFsUG9saWN5LCBSZXNvdXJjZUVudmlyb25tZW50LCBTdGFjayB9IGZyb20gXCJhd3MtY2RrLWxpYlwiO1xuaW1wb3J0ICogYXMgYmF0Y2ggZnJvbSBcImF3cy1jZGstbGliL2F3cy1iYXRjaFwiO1xuaW1wb3J0IHsgTGF1bmNoVGVtcGxhdGUgfSBmcm9tIFwiYXdzLWNkay1saWIvYXdzLWVjMlwiO1xuaW1wb3J0IHsgSVJvbGUgfSBmcm9tIFwiYXdzLWNkay1saWIvYXdzLWlhbVwiO1xuaW1wb3J0IHsgQ29uc3RydWN0IH0gZnJvbSBcImNvbnN0cnVjdHNcIjtcbmltcG9ydCB7IE5ldXJvbk9wdGltaXplZE1hY2hpbmVJbWFnZSB9IGZyb20gXCIuLi9uZXVyb254XCI7XG5cbi8qKlxuICogUHJvcHMgb2YgTmV1cm9ueEJhdGNoLlxuICovXG5leHBvcnQgaW50ZXJmYWNlIE5ldXJvbnhCYXRjaENvbXB1dGVFbnZpcm9ubWVudFByb3BzXG4gIGV4dGVuZHMgYmF0Y2guTWFuYWdlZEVjMkVjc0NvbXB1dGVFbnZpcm9ubWVudFByb3BzIHt9XG5cbi8qKlxuICogTmV1cm9ueCBiYXRjaCBjb25zdHJ1Y3QuXG4gKi9cbmV4cG9ydCBjbGFzcyBOZXVyb254QmF0Y2hDb21wdXRlRW52aXJvbm1lbnRcbiAgZXh0ZW5kcyBDb25zdHJ1Y3RcbiAgaW1wbGVtZW50cyBiYXRjaC5JQ29tcHV0ZUVudmlyb25tZW50XG57XG4gIHJlYWRvbmx5IGNvbXB1dGVFbnZpcm9ubWVudE5hbWU6IHN0cmluZztcbiAgcmVhZG9ubHkgY29tcHV0ZUVudmlyb25tZW50QXJuOiBzdHJpbmc7XG4gIHJlYWRvbmx5IHNlcnZpY2VSb2xlPzogSVJvbGUgfCB1bmRlZmluZWQ7XG4gIHJlYWRvbmx5IGVuYWJsZWQ6IGJvb2xlYW47XG4gIHJlYWRvbmx5IHN0YWNrOiBTdGFjaztcbiAgcmVhZG9ubHkgZW52OiBSZXNvdXJjZUVudmlyb25tZW50O1xuICByZWFkb25seSBpbnN0YW5jZVJvbGU6IElSb2xlO1xuICBnZXQgY29tcHV0ZUVudmlyb25tZW50UmVmKCk6IGJhdGNoLkNvbXB1dGVFbnZpcm9ubWVudFJlZmVyZW5jZSB7XG4gICAgcmV0dXJuIHsgY29tcHV0ZUVudmlyb25tZW50QXJuOiB0aGlzLmNvbXB1dGVFbnZpcm9ubWVudEFybiB9O1xuICB9XG4gIHByaXZhdGUgcmVhZG9ubHkgcmVzb3VyY2U6IGJhdGNoLk1hbmFnZWRFYzJFY3NDb21wdXRlRW52aXJvbm1lbnQ7XG4gIGNvbnN0cnVjdG9yKFxuICAgIHNjb3BlOiBDb25zdHJ1Y3QsXG4gICAgaWQ6IHN0cmluZyxcbiAgICBwcm9wczogTmV1cm9ueEJhdGNoQ29tcHV0ZUVudmlyb25tZW50UHJvcHMsXG4gICkge1xuICAgIHN1cGVyKHNjb3BlLCBpZCk7XG5cbiAgICBjb25zdCBpbWFnZXMgPSBwcm9wcy5pbWFnZXMgPz8gW1xuICAgICAge1xuICAgICAgICBpbWFnZTogbmV3IE5ldXJvbk9wdGltaXplZE1hY2hpbmVJbWFnZShcbiAgICAgICAgICB0aGlzLFxuICAgICAgICAgIFwiTmV1cm9uT3B0aW1pemVkTWFjaGluZUltYWdlXCIsXG4gICAgICAgICksXG4gICAgICAgIGltYWdlVHlwZTogYmF0Y2guRWNzTWFjaGluZUltYWdlVHlwZS5FQ1NfQUwyMDIzLFxuICAgICAgfSxcbiAgICBdO1xuICAgIHRoaXMucmVzb3VyY2UgPSBuZXcgYmF0Y2guTWFuYWdlZEVjMkVjc0NvbXB1dGVFbnZpcm9ubWVudChcbiAgICAgIHRoaXMsXG4gICAgICBcIlJlc291cmNlXCIsXG4gICAgICB7XG4gICAgICAgIC4uLnByb3BzLFxuICAgICAgICBpbWFnZXMsXG4gICAgICB9LFxuICAgICk7XG4gICAgaWYgKFxuICAgICAgcHJvcHMubGF1bmNoVGVtcGxhdGUgJiZcbiAgICAgIHByb3BzLmxhdW5jaFRlbXBsYXRlIGluc3RhbmNlb2YgTGF1bmNoVGVtcGxhdGVcbiAgICApIHtcbiAgICAgIChcbiAgICAgICAgdGhpcy5yZXNvdXJjZS5ub2RlLmRlZmF1bHRDaGlsZCBhcyBiYXRjaC5DZm5Db21wdXRlRW52aXJvbm1lbnRcbiAgICAgICkuYWRkUHJvcGVydHlPdmVycmlkZShcbiAgICAgICAgXCJDb21wdXRlUmVzb3VyY2VzLkxhdW5jaFRlbXBsYXRlLlZlcnNpb25cIixcbiAgICAgICAgcHJvcHMubGF1bmNoVGVtcGxhdGUubGF0ZXN0VmVyc2lvbk51bWJlcixcbiAgICAgICk7XG4gICAgfVxuXG4gICAgdGhpcy5jb21wdXRlRW52aXJvbm1lbnRBcm4gPSB0aGlzLnJlc291cmNlLmNvbXB1dGVFbnZpcm9ubWVudEFybjtcbiAgICB0aGlzLmNvbXB1dGVFbnZpcm9ubWVudE5hbWUgPSB0aGlzLnJlc291cmNlLmNvbXB1dGVFbnZpcm9ubWVudE5hbWU7XG4gICAgdGhpcy5lbmFibGVkID0gdGhpcy5yZXNvdXJjZS5lbmFibGVkO1xuICAgIHRoaXMuZW52ID0gdGhpcy5yZXNvdXJjZS5lbnY7XG4gICAgdGhpcy5zZXJ2aWNlUm9sZSA9IHRoaXMucmVzb3VyY2Uuc2VydmljZVJvbGU7XG4gICAgdGhpcy5zdGFjayA9IHRoaXMucmVzb3VyY2Uuc3RhY2s7XG4gICAgdGhpcy5pbnN0YW5jZVJvbGUgPSB0aGlzLnJlc291cmNlLmluc3RhbmNlUm9sZSE7XG4gIH1cbiAgYXBwbHlSZW1vdmFsUG9saWN5KHBvbGljeTogUmVtb3ZhbFBvbGljeSk6IHZvaWQge1xuICAgIHRoaXMucmVzb3VyY2UuYXBwbHlSZW1vdmFsUG9saWN5KHBvbGljeSk7XG4gIH1cbn1cbiJdfQ==
|
|
@@ -58,5 +58,5 @@ class NeuronxBatchEcsJobDefinition extends constructs_1.Construct {
|
|
|
58
58
|
}
|
|
59
59
|
exports.NeuronxBatchEcsJobDefinition = NeuronxBatchEcsJobDefinition;
|
|
60
60
|
_a = JSII_RTTI_SYMBOL_1;
|
|
61
|
-
NeuronxBatchEcsJobDefinition[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxBatchEcsJobDefinition", version: "0.
|
|
61
|
+
NeuronxBatchEcsJobDefinition[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxBatchEcsJobDefinition", version: "0.3.0" };
|
|
62
62
|
//# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoibmV1cm9ueC1iYXRjaC1lY3Mtam9iLWRlZmluaXRpb24uanMiLCJzb3VyY2VSb290IjoiIiwic291cmNlcyI6WyIuLi8uLi8uLi9zcmMvYmFzZS9hd3MtYmF0Y2gvbmV1cm9ueC1iYXRjaC1lY3Mtam9iLWRlZmluaXRpb24udHMiXSwibmFtZXMiOltdLCJtYXBwaW5ncyI6Ijs7Ozs7QUFNQSwrQ0FBK0M7QUFFL0MsMkNBQXVDO0FBV3ZDOztHQUVHO0FBQ0gsTUFBYSw0QkFDWCxTQUFRLHNCQUFTO0lBWWpCLElBQUksZ0JBQWdCO1FBQ2xCLE9BQU8sRUFBRSxnQkFBZ0IsRUFBRSxJQUFJLENBQUMsZ0JBQWdCLEVBQUUsQ0FBQztJQUNyRCxDQUFDO0lBRUQsWUFDRSxLQUFnQixFQUNoQixFQUFVLEVBQ1YsS0FBd0M7UUFFeEMsS0FBSyxDQUFDLEtBQUssRUFBRSxFQUFFLENBQUMsQ0FBQztRQUNqQixNQUFNLGVBQWUsR0FDbkIsS0FBSyxDQUFDLGVBQWU7WUFDckIsSUFBSSxLQUFLLENBQUMsZUFBZSxDQUFDLElBQUksRUFBRSxpQkFBaUIsQ0FBQyxDQUFDO1FBQ3JELGVBQWUsQ0FBQyxVQUFVLENBQ3hCLEdBQUcsS0FBSyxDQUFDLElBQUksQ0FBQztZQUNaLE1BQU0sRUFBRSxLQUFLLENBQUMsbUJBQW1CLENBQUMsZ0JBQWdCLENBQUMsS0FBSztTQUN6RCxDQUFDLENBQUMsR0FBRyxDQUFDLENBQUMsQ0FBQyxFQUFFLEtBQUssRUFBRSxFQUFFLENBQUMsQ0FBQztZQUNwQixRQUFRLEVBQUUsY0FBYyxLQUFLLEVBQUU7WUFDL0IsYUFBYSxFQUFFLGNBQWMsS0FBSyxFQUFFO1lBQ3BDLFdBQVcsRUFBRTtnQkFDWCxLQUFLLENBQUMsZ0JBQWdCLENBQUMsSUFBSTtnQkFDM0IsS0FBSyxDQUFDLGdCQUFnQixDQUFDLEtBQUs7YUFDN0I7U0FDRixDQUFDLENBQUMsQ0FDSixDQUFDO1FBQ0YsSUFBSSxDQUFDLFFBQVEsR0FBRyxJQUFJLEtBQUssQ0FBQyxnQkFBZ0IsQ0FBQyxJQUFJLEVBQUUsVUFBVSxFQUFFO1lBQzNELEdBQUcsS0FBSztZQUNSLFNBQVMsRUFBRSxJQUFJLEtBQUssQ0FBQyx5QkFBeUIsQ0FDNUMsSUFBSSxFQUNKLHFCQUFxQixFQUNyQjtnQkFDRSxHQUFHLEtBQUs7Z0JBQ1IsZUFBZTthQUNoQixDQUNGO1NBQ0YsQ0FBQyxDQUFDO1FBQ0gsSUFBSSxDQUFDLGdCQUFnQixHQUFHLElBQUksQ0FBQyxRQUFRLENBQUMsZ0JBQWdCLENBQUM7UUFDdkQsSUFBSSxDQUFDLGlCQUFpQixHQUFHLElBQUksQ0FBQyxRQUFRLENBQUMsaUJBQWlCLENBQUM7UUFDekQsSUFBSSxDQUFDLFVBQVUsR0FBRyxJQUFJLENBQUMsUUFBUSxDQUFDLFVBQVUsQ0FBQztRQUMzQyxJQUFJLENBQUMsYUFBYSxHQUFHLElBQUksQ0FBQyxRQUFRLENBQUMsYUFBYSxDQUFDO1FBQ2pELElBQUksQ0FBQyxlQUFlLEdBQUcsSUFBSSxDQUFDLFFBQVEsQ0FBQyxlQUFlLENBQUM7UUFDckQsSUFBSSxDQUFDLGtCQUFrQixHQUFHLElBQUksQ0FBQyxRQUFRLENBQUMsa0JBQWtCLENBQUM7UUFDM0QsSUFBSSxDQUFDLE9BQU8sR0FBRyxJQUFJLENBQUMsUUFBUSxDQUFDLE9BQU8sQ0FBQztRQUNyQyxJQUFJLENBQUMsS0FBSyxHQUFHLElBQUksQ0FBQyxRQUFRLENBQUMsS0FBSyxDQUFDO1FBQ2pDLElBQUksQ0FBQyxHQUFHLEdBQUcsSUFBSSxDQUFDLFFBQVEsQ0FBQyxHQUFHLENBQUM7SUFDL0IsQ0FBQztJQUNELGtCQUFrQixDQUFDLE1BQXFCO1FBQ3RDLElBQUksQ0FBQyxRQUFRLENBQUMsa0JBQWtCLENBQUMsTUFBTSxDQUFDLENBQUM7SUFDM0MsQ0FBQztJQUNELGdCQUFnQixDQUFDLFFBQTZCO1FBQzVDLElBQUksQ0FBQyxRQUFRLENBQUMsZ0JBQWdCLENBQUMsUUFBUSxDQUFDLENBQUM7SUFDM0MsQ0FBQztJQUNEOztPQUVHO0lBQ0gsY0FBYyxDQUFDLFFBQW9CLEVBQUUsS0FBc0I7UUFDekQsSUFBSSxDQUFDLFFBQVEsQ0FBQyxjQUFjLENBQUMsUUFBUSxFQUFFLEtBQUssQ0FBQyxDQUFDO0lBQ2hELENBQUM7O0FBdEVILG9FQXVFQyIsInNvdXJjZXNDb250ZW50IjpbImltcG9ydCB7XG4gIER1cmF0aW9uLFxuICBSZW1vdmFsUG9saWN5LFxuICBSZXNvdXJjZUVudmlyb25tZW50LFxuICBTdGFjayxcbn0gZnJvbSBcImF3cy1jZGstbGliXCI7XG5pbXBvcnQgKiBhcyBiYXRjaCBmcm9tIFwiYXdzLWNkay1saWIvYXdzLWJhdGNoXCI7XG5pbXBvcnQgeyBJR3JhbnRhYmxlIH0gZnJvbSBcImF3cy1jZGstbGliL2F3cy1pYW1cIjtcbmltcG9ydCB7IENvbnN0cnVjdCB9IGZyb20gXCJjb25zdHJ1Y3RzXCI7XG5pbXBvcnQgeyBJTmV1cm9ueEluc3RhbmNlVHlwZSB9IGZyb20gXCIuLi9uZXVyb254XCI7XG5cbi8qKlxuICogUHJvcHMgb2YgTmV1cm9ueEJhdGNoLlxuICovXG5leHBvcnQgaW50ZXJmYWNlIE5ldXJvbnhCYXRjaEVjc0pvYkRlZmluaXRpb25Qcm9wc1xuICBleHRlbmRzIGJhdGNoLkVjc0VjMkNvbnRhaW5lckRlZmluaXRpb25Qcm9wcywgYmF0Y2guSm9iRGVmaW5pdGlvblByb3BzIHtcbiAgcmVhZG9ubHkgbmV1cm9ueEluc3RhbmNlVHlwZTogSU5ldXJvbnhJbnN0YW5jZVR5cGU7XG59XG5cbi8qKlxuICogTmV1cm9ueCBiYXRjaCBjb25zdHJ1Y3QuXG4gKi9cbmV4cG9ydCBjbGFzcyBOZXVyb254QmF0Y2hFY3NKb2JEZWZpbml0aW9uXG4gIGV4dGVuZHMgQ29uc3RydWN0XG4gIGltcGxlbWVudHMgYmF0Y2guSUpvYkRlZmluaXRpb25cbntcbiAgcmVhZG9ubHkgam9iRGVmaW5pdGlvbkFybjogc3RyaW5nO1xuICByZWFkb25seSBqb2JEZWZpbml0aW9uTmFtZTogc3RyaW5nO1xuICByZWFkb25seSBwYXJhbWV0ZXJzPzogeyBba2V5OiBzdHJpbmddOiBhbnkgfTtcbiAgcmVhZG9ubHkgcmV0cnlBdHRlbXB0cz86IG51bWJlcjtcbiAgcmVhZG9ubHkgcmV0cnlTdHJhdGVnaWVzOiBiYXRjaC5SZXRyeVN0cmF0ZWd5W107XG4gIHJlYWRvbmx5IHNjaGVkdWxpbmdQcmlvcml0eT86IG51bWJlcjtcbiAgcmVhZG9ubHkgdGltZW91dD86IER1cmF0aW9uO1xuICByZWFkb25seSBzdGFjazogU3RhY2s7XG4gIHJlYWRvbmx5IGVudjogUmVzb3VyY2VFbnZpcm9ubWVudDtcbiAgZ2V0IGpvYkRlZmluaXRpb25SZWYoKTogYmF0Y2guSm9iRGVmaW5pdGlvblJlZmVyZW5jZSB7XG4gICAgcmV0dXJuIHsgam9iRGVmaW5pdGlvbkFybjogdGhpcy5qb2JEZWZpbml0aW9uQXJuIH07XG4gIH1cbiAgcHJpdmF0ZSByZWFkb25seSByZXNvdXJjZTogYmF0Y2guRWNzSm9iRGVmaW5pdGlvbjtcbiAgY29uc3RydWN0b3IoXG4gICAgc2NvcGU6IENvbnN0cnVjdCxcbiAgICBpZDogc3RyaW5nLFxuICAgIHByb3BzOiBOZXVyb254QmF0Y2hFY3NKb2JEZWZpbml0aW9uUHJvcHMsXG4gICkge1xuICAgIHN1cGVyKHNjb3BlLCBpZCk7XG4gICAgY29uc3QgbGludXhQYXJhbWV0ZXJzID1cbiAgICAgIHByb3BzLmxpbnV4UGFyYW1ldGVycyA/P1xuICAgICAgbmV3IGJhdGNoLkxpbnV4UGFyYW1ldGVycyh0aGlzLCBcIkxpbnV4UGFyYW1ldGVyc1wiKTtcbiAgICBsaW51eFBhcmFtZXRlcnMuYWRkRGV2aWNlcyhcbiAgICAgIC4uLkFycmF5LmZyb20oe1xuICAgICAgICBsZW5ndGg6IHByb3BzLm5ldXJvbnhJbnN0YW5jZVR5cGUuYWNjZWxlcmF0b3JDaGlwcy5jaGlwcyxcbiAgICAgIH0pLm1hcCgoXywgaW5kZXgpID0+ICh7XG4gICAgICAgIGhvc3RQYXRoOiBgL2Rldi9uZXVyb24ke2luZGV4fWAsXG4gICAgICAgIGNvbnRhaW5lclBhdGg6IGAvZGV2L25ldXJvbiR7aW5kZXh9YCxcbiAgICAgICAgcGVybWlzc2lvbnM6IFtcbiAgICAgICAgICBiYXRjaC5EZXZpY2VQZXJtaXNzaW9uLlJFQUQsXG4gICAgICAgICAgYmF0Y2guRGV2aWNlUGVybWlzc2lvbi5XUklURSxcbiAgICAgICAgXSxcbiAgICAgIH0pKSxcbiAgICApO1xuICAgIHRoaXMucmVzb3VyY2UgPSBuZXcgYmF0Y2guRWNzSm9iRGVmaW5pdGlvbih0aGlzLCBcIlJlc291cmNlXCIsIHtcbiAgICAgIC4uLnByb3BzLFxuICAgICAgY29udGFpbmVyOiBuZXcgYmF0Y2guRWNzRWMyQ29udGFpbmVyRGVmaW5pdGlvbihcbiAgICAgICAgdGhpcyxcbiAgICAgICAgXCJDb250YWluZXJEZWZpbml0aW9uXCIsXG4gICAgICAgIHtcbiAgICAgICAgICAuLi5wcm9wcyxcbiAgICAgICAgICBsaW51eFBhcmFtZXRlcnMsXG4gICAgICAgIH0sXG4gICAgICApLFxuICAgIH0pO1xuICAgIHRoaXMuam9iRGVmaW5pdGlvbkFybiA9IHRoaXMucmVzb3VyY2Uuam9iRGVmaW5pdGlvbkFybjtcbiAgICB0aGlzLmpvYkRlZmluaXRpb25OYW1lID0gdGhpcy5yZXNvdXJjZS5qb2JEZWZpbml0aW9uTmFtZTtcbiAgICB0aGlzLnBhcmFtZXRlcnMgPSB0aGlzLnJlc291cmNlLnBhcmFtZXRlcnM7XG4gICAgdGhpcy5yZXRyeUF0dGVtcHRzID0gdGhpcy5yZXNvdXJjZS5yZXRyeUF0dGVtcHRzO1xuICAgIHRoaXMucmV0cnlTdHJhdGVnaWVzID0gdGhpcy5yZXNvdXJjZS5yZXRyeVN0cmF0ZWdpZXM7XG4gICAgdGhpcy5zY2hlZHVsaW5nUHJpb3JpdHkgPSB0aGlzLnJlc291cmNlLnNjaGVkdWxpbmdQcmlvcml0eTtcbiAgICB0aGlzLnRpbWVvdXQgPSB0aGlzLnJlc291cmNlLnRpbWVvdXQ7XG4gICAgdGhpcy5zdGFjayA9IHRoaXMucmVzb3VyY2Uuc3RhY2s7XG4gICAgdGhpcy5lbnYgPSB0aGlzLnJlc291cmNlLmVudjtcbiAgfVxuICBhcHBseVJlbW92YWxQb2xpY3kocG9saWN5OiBSZW1vdmFsUG9saWN5KTogdm9pZCB7XG4gICAgdGhpcy5yZXNvdXJjZS5hcHBseVJlbW92YWxQb2xpY3kocG9saWN5KTtcbiAgfVxuICBhZGRSZXRyeVN0cmF0ZWd5KHN0cmF0ZWd5OiBiYXRjaC5SZXRyeVN0cmF0ZWd5KTogdm9pZCB7XG4gICAgdGhpcy5yZXNvdXJjZS5hZGRSZXRyeVN0cmF0ZWd5KHN0cmF0ZWd5KTtcbiAgfVxuICAvKipcbiAgICogR3JhbnRzIHRoZSBgYmF0Y2g6c3VibWl0Sm9iYCBwZXJtaXNzaW9uIHRvIHRoZSBpZGVudGl0eSBvbiBib3RoIHRoaXMgam9iIGRlZmluaXRpb24gYW5kIHRoZSBgcXVldWVgXG4gICAqL1xuICBncmFudFN1Ym1pdEpvYihpZGVudGl0eTogSUdyYW50YWJsZSwgcXVldWU6IGJhdGNoLklKb2JRdWV1ZSk6IHZvaWQge1xuICAgIHRoaXMucmVzb3VyY2UuZ3JhbnRTdWJtaXRKb2IoaWRlbnRpdHksIHF1ZXVlKTtcbiAgfVxufVxuIl19
|
|
@@ -58,5 +58,5 @@ class NeuronxBatch extends constructs_1.Construct {
|
|
|
58
58
|
}
|
|
59
59
|
exports.NeuronxBatch = NeuronxBatch;
|
|
60
60
|
_a = JSII_RTTI_SYMBOL_1;
|
|
61
|
-
NeuronxBatch[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxBatch", version: "0.
|
|
61
|
+
NeuronxBatch[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxBatch", version: "0.3.0" };
|
|
62
62
|
//# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoibmV1cm9ueC1iYXRjaC5qcyIsInNvdXJjZVJvb3QiOiIiLCJzb3VyY2VzIjpbIi4uLy4uLy4uL3NyYy9iYXNlL2F3cy1iYXRjaC9uZXVyb254LWJhdGNoLnRzIl0sIm5hbWVzIjpbXSwibWFwcGluZ3MiOiI7Ozs7O0FBQ0EsK0NBQStDO0FBQy9DLDJDQUEyQztBQUMzQywyQ0FBdUM7QUFDdkMsd0NBQStFO0FBb0MvRTs7R0FFRztBQUNILE1BQWEsWUFBYSxTQUFRLHNCQUFTO0lBR3pDLFlBQVksS0FBZ0IsRUFBRSxFQUFVLEVBQUUsS0FBd0I7UUFDaEUsS0FBSyxDQUFDLEtBQUssRUFBRSxFQUFFLENBQUMsQ0FBQztRQUNqQixNQUFNLGNBQWMsR0FBRyxJQUFJLEdBQUcsQ0FBQyxjQUFjLENBQUMsSUFBSSxFQUFFLGdCQUFnQixFQUFFO1lBQ3BFLFlBQVksRUFBRTtnQkFDWjtvQkFDRSxVQUFVLEVBQUUsV0FBVztvQkFDdkIsTUFBTSxFQUFFLEdBQUcsQ0FBQyxpQkFBaUIsQ0FBQyxHQUFHLENBQUMsS0FBSyxDQUFDLFVBQVUsQ0FBQyxXQUFXLEVBQUUsQ0FBQztpQkFDbEU7YUFDRjtTQUNGLENBQUMsQ0FBQztRQUNILElBQUksQ0FBQyxrQkFBa0IsR0FBRyxJQUFJLEtBQUssQ0FBQywrQkFBK0IsQ0FDakUsSUFBSSxFQUNKLG9CQUFvQixFQUNwQjtZQUNFLEdBQUcsRUFBRSxLQUFLLENBQUMsR0FBRztZQUNkLFVBQVUsRUFBRSxLQUFLLENBQUMsVUFBVTtZQUM1QixhQUFhLEVBQUUsQ0FBQyxLQUFLLENBQUMsbUJBQW1CLENBQUMsWUFBWSxDQUFDO1lBQ3ZELHlCQUF5QixFQUFFLEtBQUs7WUFDaEMsTUFBTSxFQUFFO2dCQUNOO29CQUNFLEtBQUssRUFBRSxJQUFJLHFDQUEyQixDQUFDLElBQUksRUFBRSxhQUFhLENBQUM7b0JBQzNELFNBQVMsRUFBRSxLQUFLLENBQUMsbUJBQW1CLENBQUMsVUFBVTtpQkFDaEQ7YUFDRjtZQUNELGNBQWM7WUFDZCxJQUFJLEVBQUUsS0FBSyxDQUFDLElBQUk7U0FDakIsQ0FDRixDQUFDO1FBRUEsSUFBSSxDQUFDLGtCQUFrQixDQUFDLElBQUksQ0FBQyxZQUM5QixDQUFDLG1CQUFtQixDQUNuQix5Q0FBeUMsRUFDekMsY0FBYyxDQUFDLG1CQUFtQixDQUNuQyxDQUFDO1FBQ0YsTUFBTSxlQUFlLEdBQ25CLEtBQUssQ0FBQyxlQUFlO1lBQ3JCLElBQUksS0FBSyxDQUFDLGVBQWUsQ0FBQyxJQUFJLEVBQUUsaUJBQWlCLENBQUMsQ0FBQztRQUNyRCxlQUFlLENBQUMsVUFBVSxDQUN4QixHQUFHLEtBQUssQ0FBQyxJQUFJLENBQUM7WUFDWixNQUFNLEVBQUUsS0FBSyxDQUFDLG1CQUFtQixDQUFDLGdCQUFnQixDQUFDLEtBQUs7U0FDekQsQ0FBQyxDQUFDLEdBQUcsQ0FBQyxDQUFDLENBQUMsRUFBRSxLQUFLLEVBQUUsRUFBRSxDQUFDLENBQUM7WUFDcEIsUUFBUSxFQUFFLGNBQWMsS0FBSyxFQUFFO1lBQy9CLGFBQWEsRUFBRSxjQUFjLEtBQUssRUFBRTtZQUNwQyxXQUFXLEVBQUU7Z0JBQ1gsS0FBSyxDQUFDLGdCQUFnQixDQUFDLElBQUk7Z0JBQzNCLEtBQUssQ0FBQyxnQkFBZ0IsQ0FBQyxLQUFLO2FBQzdCO1NBQ0YsQ0FBQyxDQUFDLENBQ0osQ0FBQztRQUNGLElBQUksQ0FBQyxhQUFhLEdBQUcsSUFBSSxLQUFLLENBQUMsZ0JBQWdCLENBQUMsSUFBSSxFQUFFLGVBQWUsRUFBRTtZQUNyRSxTQUFTLEVBQUUsSUFBSSxLQUFLLENBQUMseUJBQXlCLENBQzVDLElBQUksRUFDSixxQkFBcUIsRUFDckI7Z0JBQ0UsR0FBRyxLQUFLO2dCQUNSLGVBQWU7YUFDaEIsQ0FDRjtTQUNGLENBQUMsQ0FBQztJQUNMLENBQUM7O0FBOURILG9DQStEQyIsInNvdXJjZXNDb250ZW50IjpbImltcG9ydCB7IFNpemUgfSBmcm9tIFwiYXdzLWNkay1saWJcIjtcbmltcG9ydCAqIGFzIGJhdGNoIGZyb20gXCJhd3MtY2RrLWxpYi9hd3MtYmF0Y2hcIjtcbmltcG9ydCAqIGFzIGVjMiBmcm9tIFwiYXdzLWNkay1saWIvYXdzLWVjMlwiO1xuaW1wb3J0IHsgQ29uc3RydWN0IH0gZnJvbSBcImNvbnN0cnVjdHNcIjtcbmltcG9ydCB7IElOZXVyb254SW5zdGFuY2VUeXBlLCBOZXVyb25PcHRpbWl6ZWRNYWNoaW5lSW1hZ2UgfSBmcm9tIFwiLi4vbmV1cm9ueFwiO1xuXG4vKipcbiAqIFByb3BzIG9mIE5ldXJvbnhCYXRjaC5cbiAqL1xuZXhwb3J0IGludGVyZmFjZSBOZXVyb254QmF0Y2hQcm9wc1xuICBleHRlbmRzIGJhdGNoLkVjc0VjMkNvbnRhaW5lckRlZmluaXRpb25Qcm9wcyB7XG4gIC8qKlxuICAgKiBWUEMgaW4gd2hpY2ggdGhpcyB3aWxsIGxhdW5jaCB3b3JrZXIgaW5zdGFuY2UuXG4gICAqL1xuICByZWFkb25seSB2cGM6IGVjMi5JVnBjO1xuICAvKipcbiAgICogVGhlIGluc3RhbmNlIHR5cGUgb2Ygd29ya2VyIGluc3RhbmNlLlxuICAgKi9cbiAgcmVhZG9ubHkgbmV1cm9ueEluc3RhbmNlVHlwZTogSU5ldXJvbnhJbnN0YW5jZVR5cGU7XG4gIC8qKlxuICAgKiBUaGUgcm9vdCB2b2x1bWUgb2Ygd29ya2VyIGluc3RhbmNlLlxuICAgKiBAZGVmYXVsdCAtIE4gYmlsaW9uIHBhcmFtZXRlcnMgKiA1R2lCIEVCU1xuICAgKi9cbiAgcmVhZG9ubHkgdm9sdW1lU2l6ZTogU2l6ZTtcbiAgLyoqXG4gICAqIFdoZXRoZXIgb3Igbm90IHRvIHVzZSBzcG90IGluc3RhbmNlcy5cbiAgICogU3BvdCBpbnN0YW5jZXMgYXJlIGxlc3MgZXhwZW5zaXZlIEVDMiBpbnN0YW5jZXMgdGhhdCBjYW4gYmUgcmVjbGFpbWVkIGJ5IEVDMiBhdCBhbnkgdGltZTtcbiAgICogeW91ciBqb2Igd2lsbCBiZSBnaXZlbiB0d28gbWludXRlcyBvZiBub3RpY2UgYmVmb3JlIHJlY2xhbWF0aW9uLlxuICAgKlxuICAgKiBAZGVmYXVsdCBmYWxzZVxuICAgKi9cbiAgcmVhZG9ubHkgc3BvdD86IGJvb2xlYW47XG4gIC8qKlxuICAgKiBUaGUgVlBDIFN1Ym5ldHMgdGhpcyBDb21wdXRlIEVudmlyb25tZW50IHdpbGwgbGF1bmNoIGluc3RhbmNlcyBpbi5cbiAgICpcbiAgICogQGRlZmF1bHQgLSBuZXcgc3VibmV0cyB3aWxsIGJlIGNyZWF0ZWRcbiAgICovXG4gIHJlYWRvbmx5IHZwY1N1Ym5ldHM/OiBlYzIuU3VibmV0U2VsZWN0aW9uO1xufVxuXG4vKipcbiAqIE5ldXJvbnggYmF0Y2ggY29uc3RydWN0LlxuICovXG5leHBvcnQgY2xhc3MgTmV1cm9ueEJhdGNoIGV4dGVuZHMgQ29uc3RydWN0IHtcbiAgcmVhZG9ubHkgY29tcHV0ZUVudmlyb25tZW50OiBiYXRjaC5NYW5hZ2VkRWMyRWNzQ29tcHV0ZUVudmlyb25tZW50O1xuICByZWFkb25seSBqb2JEZWZpbml0aW9uOiBiYXRjaC5FY3NKb2JEZWZpbml0aW9uO1xuICBjb25zdHJ1Y3RvcihzY29wZTogQ29uc3RydWN0LCBpZDogc3RyaW5nLCBwcm9wczogTmV1cm9ueEJhdGNoUHJvcHMpIHtcbiAgICBzdXBlcihzY29wZSwgaWQpO1xuICAgIGNvbnN0IGxhdW5jaFRlbXBsYXRlID0gbmV3IGVjMi5MYXVuY2hUZW1wbGF0ZSh0aGlzLCBcIkxhdW5jaFRlbXBsYXRlXCIsIHtcbiAgICAgIGJsb2NrRGV2aWNlczogW1xuICAgICAgICB7XG4gICAgICAgICAgZGV2aWNlTmFtZTogXCIvZGV2L3h2ZGFcIixcbiAgICAgICAgICB2b2x1bWU6IGVjMi5CbG9ja0RldmljZVZvbHVtZS5lYnMocHJvcHMudm9sdW1lU2l6ZS50b0dpYmlieXRlcygpKSxcbiAgICAgICAgfSxcbiAgICAgIF0sXG4gICAgfSk7XG4gICAgdGhpcy5jb21wdXRlRW52aXJvbm1lbnQgPSBuZXcgYmF0Y2guTWFuYWdlZEVjMkVjc0NvbXB1dGVFbnZpcm9ubWVudChcbiAgICAgIHRoaXMsXG4gICAgICBcIkNvbXB1dGVFbnZpcm9ubWVudFwiLFxuICAgICAge1xuICAgICAgICB2cGM6IHByb3BzLnZwYyxcbiAgICAgICAgdnBjU3VibmV0czogcHJvcHMudnBjU3VibmV0cyxcbiAgICAgICAgaW5zdGFuY2VUeXBlczogW3Byb3BzLm5ldXJvbnhJbnN0YW5jZVR5cGUuaW5zdGFuY2VUeXBlXSxcbiAgICAgICAgdXNlT3B0aW1hbEluc3RhbmNlQ2xhc3NlczogZmFsc2UsXG4gICAgICAgIGltYWdlczogW1xuICAgICAgICAgIHtcbiAgICAgICAgICAgIGltYWdlOiBuZXcgTmV1cm9uT3B0aW1pemVkTWFjaGluZUltYWdlKHRoaXMsIFwiTWFjaGluSW1hZ2VcIiksXG4gICAgICAgICAgICBpbWFnZVR5cGU6IGJhdGNoLkVjc01hY2hpbmVJbWFnZVR5cGUuRUNTX0FMMjAyMyxcbiAgICAgICAgICB9LFxuICAgICAgICBdLFxuICAgICAgICBsYXVuY2hUZW1wbGF0ZSxcbiAgICAgICAgc3BvdDogcHJvcHMuc3BvdCxcbiAgICAgIH0sXG4gICAgKTtcbiAgICAoXG4gICAgICB0aGlzLmNvbXB1dGVFbnZpcm9ubWVudC5ub2RlLmRlZmF1bHRDaGlsZCBhcyBiYXRjaC5DZm5Db21wdXRlRW52aXJvbm1lbnRcbiAgICApLmFkZFByb3BlcnR5T3ZlcnJpZGUoXG4gICAgICBcIkNvbXB1dGVSZXNvdXJjZXMuTGF1bmNoVGVtcGxhdGUuVmVyc2lvblwiLFxuICAgICAgbGF1bmNoVGVtcGxhdGUubGF0ZXN0VmVyc2lvbk51bWJlcixcbiAgICApO1xuICAgIGNvbnN0IGxpbnV4UGFyYW1ldGVycyA9XG4gICAgICBwcm9wcy5saW51eFBhcmFtZXRlcnMgPz9cbiAgICAgIG5ldyBiYXRjaC5MaW51eFBhcmFtZXRlcnModGhpcywgXCJMaW51eFBhcmFtZXRlcnNcIik7XG4gICAgbGludXhQYXJhbWV0ZXJzLmFkZERldmljZXMoXG4gICAgICAuLi5BcnJheS5mcm9tKHtcbiAgICAgICAgbGVuZ3RoOiBwcm9wcy5uZXVyb254SW5zdGFuY2VUeXBlLmFjY2VsZXJhdG9yQ2hpcHMuY2hpcHMsXG4gICAgICB9KS5tYXAoKF8sIGluZGV4KSA9PiAoe1xuICAgICAgICBob3N0UGF0aDogYC9kZXYvbmV1cm9uJHtpbmRleH1gLFxuICAgICAgICBjb250YWluZXJQYXRoOiBgL2Rldi9uZXVyb24ke2luZGV4fWAsXG4gICAgICAgIHBlcm1pc3Npb25zOiBbXG4gICAgICAgICAgYmF0Y2guRGV2aWNlUGVybWlzc2lvbi5SRUFELFxuICAgICAgICAgIGJhdGNoLkRldmljZVBlcm1pc3Npb24uV1JJVEUsXG4gICAgICAgIF0sXG4gICAgICB9KSksXG4gICAgKTtcbiAgICB0aGlzLmpvYkRlZmluaXRpb24gPSBuZXcgYmF0Y2guRWNzSm9iRGVmaW5pdGlvbih0aGlzLCBcIkpvYkRlZmluaXRpb25cIiwge1xuICAgICAgY29udGFpbmVyOiBuZXcgYmF0Y2guRWNzRWMyQ29udGFpbmVyRGVmaW5pdGlvbihcbiAgICAgICAgdGhpcyxcbiAgICAgICAgXCJDb250YWluZXJEZWZpbml0aW9uXCIsXG4gICAgICAgIHtcbiAgICAgICAgICAuLi5wcm9wcyxcbiAgICAgICAgICBsaW51eFBhcmFtZXRlcnMsXG4gICAgICAgIH0sXG4gICAgICApLFxuICAgIH0pO1xuICB9XG59XG4iXX0=
|
|
@@ -11,7 +11,7 @@ const aws_ecs_patterns_1 = require("aws-cdk-lib/aws-ecs-patterns");
|
|
|
11
11
|
const neuronx_1 = require("../neuronx");
|
|
12
12
|
class NeuronxTaskDefinition extends ecs.Ec2TaskDefinition {
|
|
13
13
|
constructor(scope, id, props) {
|
|
14
|
-
const neuronxInstanceType = props.neuronxInstanceType ?? props.compiledModel.
|
|
14
|
+
const neuronxInstanceType = props.neuronxInstanceType ?? props.compiledModel.recommendedInstanceType;
|
|
15
15
|
const tensorParallelSize = props.tensorParallelSize ?? 1;
|
|
16
16
|
const tasksPerInstance = Math.floor(neuronxInstanceType.acceleratorChips.neuronxCores / tensorParallelSize);
|
|
17
17
|
const placementConstraints = tasksPerInstance >= 2
|
|
@@ -63,7 +63,7 @@ class NeuronxTaskDefinition extends ecs.Ec2TaskDefinition {
|
|
|
63
63
|
}
|
|
64
64
|
exports.NeuronxTaskDefinition = NeuronxTaskDefinition;
|
|
65
65
|
_a = JSII_RTTI_SYMBOL_1;
|
|
66
|
-
NeuronxTaskDefinition[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxTaskDefinition", version: "0.
|
|
66
|
+
NeuronxTaskDefinition[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxTaskDefinition", version: "0.3.0" };
|
|
67
67
|
class ApplicationLoadBalancedNeuronxService extends aws_ecs_patterns_1.ApplicationLoadBalancedEc2Service {
|
|
68
68
|
constructor(scope, id, props) {
|
|
69
69
|
const neuronxTaskDefinition = props.taskDefinition;
|
|
@@ -141,5 +141,5 @@ mount-s3 ${neuronxTaskDefinition.compiledModel.bucket.bucketName} /mnt/${neuronx
|
|
|
141
141
|
}
|
|
142
142
|
exports.ApplicationLoadBalancedNeuronxService = ApplicationLoadBalancedNeuronxService;
|
|
143
143
|
_b = JSII_RTTI_SYMBOL_1;
|
|
144
|
-
ApplicationLoadBalancedNeuronxService[_b] = { fqn: "aws-cdk-neuronx-patterns.ApplicationLoadBalancedNeuronxService", version: "0.
|
|
145
|
-
//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"application-load-balanced-neuronx-service.js","sourceRoot":"","sources":["../../../src/base/aws-ecs-patterns/application-load-balanced-neuronx-service.ts"],"names":[],"mappings":";;;;;AAAA,6CAAuC;AACvC,iEAIqC;AACrC,iDAAqD;AACrD,2CAA2C;AAC3C,mEAGsC;AAEtC,wCAIoB;AA6BpB,MAAa,qBACX,SAAQ,GAAG,CAAC,iBAAiB;IAQ7B,YAAY,KAAgB,EAAE,EAAU,EAAE,KAAiC;QACzE,MAAM,mBAAmB,GACvB,KAAK,CAAC,mBAAmB,IAAI,KAAK,CAAC,aAAa,CAAC,uBAAuB,CAAC;QAC3E,MAAM,kBAAkB,GAAG,KAAK,CAAC,kBAAkB,IAAI,CAAC,CAAC;QACzD,MAAM,gBAAgB,GAAG,IAAI,CAAC,KAAK,CACjC,mBAAmB,CAAC,gBAAgB,CAAC,YAAY,GAAG,kBAAkB,CACvE,CAAC;QACF,MAAM,oBAAoB,GACxB,gBAAgB,IAAI,CAAC;YACnB,CAAC,CAAC;gBACE,GAAG,CAAC,mBAAmB,CAAC,QAAQ,CAC9B,qBAAqB,gBAAgB,EAAE,CACxC;aACF;YACH,CAAC,CAAC,EAAE,CAAC;QACT,KAAK,CAAC,KAAK,EAAE,EAAE,EAAE;YACf,GAAG,KAAK;YACR,oBAAoB,EAAE;gBACpB,GAAG,CAAC,KAAK,CAAC,oBAAoB,IAAI,EAAE,CAAC;gBACrC,GAAG,oBAAoB;aACxB;SACF,CAAC,CAAC;QACH,IAAI,CAAC,eAAe,GAAG,IAAI,GAAG,CAAC,eAAe,CAAC,IAAI,EAAE,iBAAiB,CAAC,CAAC;QACxE,IAAI,CAAC,eAAe,CAAC,UAAU,CAC7B,GAAG,KAAK,CAAC,IAAI,CAAC;YACZ,MAAM,EAAE,mBAAmB,EAAE,gBAAgB,CAAC,KAAK,IAAI,CAAC;SACzD,CAAC,CAAC,GAAG,CAAa,CAAC,CAAC,EAAE,KAAK,EAAE,EAAE,CAAC,CAAC;YAChC,QAAQ,EAAE,cAAc,KAAK,EAAE;YAC/B,aAAa,EAAE,cAAc,KAAK,EAAE;YACpC,WAAW,EAAE,CAAC,GAAG,CAAC,gBAAgB,CAAC,IAAI,EAAE,GAAG,CAAC,gBAAgB,CAAC,KAAK,CAAC;SACrE,CAAC,CAAC,CACJ,CAAC;QACF,IAAI,IAAI,CAAC,aAAa,EAAE,CAAC;YACvB,KAAK,CAAC,aAAa,CAAC,MAAM,CAAC,SAAS,CAAC,IAAI,CAAC,aAAa,CAAC,CAAC;QAC3D,CAAC;QACD,KAAK,CAAC,aAAa,CAAC,MAAM,CAAC,SAAS,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QACpD,IAAI,CAAC,aAAa,GAAG,KAAK,CAAC,aAAa,CAAC;QACzC,IAAI,CAAC,mBAAmB,GAAG,mBAAmB,CAAC;QAC/C,IAAI,CAAC,kBAAkB,GAAG,kBAAkB,CAAC;QAC7C,IAAI,CAAC,gBAAgB,GAAG,gBAAgB,CAAC;IAC3C,CAAC;IAED,uBAAuB,CACrB,EAAU,EACV,KAAqC;QAErC,MAAM,SAAS,GAAG,KAAK,CAAC,YAAY,CAAC,EAAE,EAAE;YACvC,OAAO,EAAE,GAAG,CAAC,SAAS,CAAC,OAAO,CAAC;gBAC7B,YAAY,EAAE,EAAE;aACjB,CAAC;YACF,eAAe,EAAE,IAAI,CAAC,eAAe;YACrC,oBAAoB,EAAE,IAAI,CAAC,IAAI,CAC7B,CAAC,IAAI,CAAC,mBAAmB,CAAC,MAAM,CAAC,WAAW,EAAE,GAAG,GAAG,CAAC;gBACnD,IAAI,CAAC,gBAAgB,CACxB;YACD,GAAG,KAAK;SACT,CAAC,CAAC;QACH,SAAS,CAAC,cAAc,CAAC;YACvB,YAAY,EAAE,OAAO;YACrB,aAAa,EAAE,eAAe;YAC9B,QAAQ,EAAE,KAAK;SAChB,CAAC,CAAC;QACH,OAAO,SAAS,CAAC;IACnB,CAAC;;AAxEH,sDAyEC;;;AAGD,MAAa,qCAAsC,SAAQ,oDAAiC;IAC1F,YACE,KAAgB,EAChB,EAAU,EACV,KAAiD;QAEjD,MAAM,qBAAqB,GAAG,KAAK,CAAC,cAAc,CAAC;QACnD,IACE,CAAC,qBAAqB;YACtB,CAAC,CAAC,qBAAqB,YAAY,qBAAqB,CAAC,EACzD,CAAC;YACD,MAAM,IAAI,KAAK,CAAC,kDAAkD,CAAC,CAAC;QACtE,CAAC;QACD,KAAK,CAAC,KAAK,EAAE,EAAE,EAAE;YACf,sBAAsB,EACpB,KAAK,CAAC,sBAAsB,IAAI,sBAAQ,CAAC,OAAO,CAAC,EAAE,CAAC;YACtD,GAAG,KAAK;SACT,CAAC,CAAC;QAEH,MAAM,OAAO,GAAG,IAAI,CAAC,iBAAiB,CAAC,IAAI,EAAE,KAAK,CAAC,GAAG,CAAC,CAAC;QAExD,sCAAsC;QACtC,MAAM,QAAQ,GAAG,kBAAQ,CAAC,QAAQ,EAAE,CAAC;QACrC,QAAQ,CAAC,WAAW,CAAC;;;;;;;;;;;;;;;;;;;;;;;uBAuBF,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU;WACjE,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU,SAAS,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU,+CAA+C,CAAC,CAAC;QAE3K,qBAAqB,CAAC,SAAS,CAAC;YAC9B,IAAI,EAAE,OAAO;YACb,IAAI,EAAE;gBACJ,UAAU,EAAE,QAAQ,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU,EAAE;aAC5E;SACF,CAAC,CAAC;QAEH,MAAM,UAAU,GAAG,IAAI,CAAC,IAAI,CAC1B,qCAA2B,CAAC,IAAI,CAAC,WAAW,EAAE;YAC5C,qCAA2B,CAAC,IAAI,CAAC,WAAW,EAAE,CACjD,CAAC;QACF,MAAM,eAAe,GAAG,IAAI,CAAC,IAAI,CAC/B,CAAC,KAAK,CAAC,YAAY,IAAI,CAAC,CAAC,GAAG,qBAAqB,CAAC,gBAAgB,CACnE,CAAC;QACF,MAAM,gBAAgB,GAAG,IAAI,kCAAgB,CAAC,IAAI,EAAE,kBAAkB,EAAE;YACtE,GAAG,EAAE,OAAO,CAAC,GAAG;YAChB,YAAY,EAAE,qBAAqB,CAAC,mBAAmB,CAAC,YAAY;YACpE,YAAY,EAAE,IAAI,qCAA2B,CAC3C,IAAI,EACJ,6BAA6B,CAC9B;YACD,YAAY,EAAE;gBACZ;oBACE,UAAU,EAAE,WAAW;oBACvB,MAAM,EAAE,mCAAiB,CAAC,GAAG,CAAC,UAAU,EAAE;wBACxC,UAAU,EAAE,qCAAmB,CAAC,GAAG;wBACnC,SAAS,EAAE,IAAI;qBAChB,CAAC;iBACH;aACF;YACD,QAAQ;YACR,eAAe;YACf,WAAW,EACT,qBAAqB,CAAC,gBAAgB,KAAK,CAAC;gBAC1C,CAAC,CAAC,eAAe,GAAG,CAAC;gBACrB,CAAC,CAAC,SAAS;SAChB,CAAC,CAAC;QACH,gBAAgB,CAAC,WAAW,CAAC,SAAS,CACpC,IAAI,CAAC,YAAY,EACjB,cAAI,CAAC,QAAQ,CAAC,KAAK,EAAE,KAAK,CAAC,CAC5B,CAAC;QACF,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,SAAS,CAAC,gBAAgB,CAAC,CAAC;QACvE,MAAM,QAAQ,GAAG,IAAI,GAAG,CAAC,mBAAmB,CAAC,IAAI,EAAE,qBAAqB,EAAE;YACxE,gBAAgB;SACjB,CAAC,CAAC;QACH,OAAO,CAAC,sBAAsB,CAAC,QAAQ,CAAC,CAAC;IAC3C,CAAC;;AA/FH,sFAgGC","sourcesContent":["import { Duration } from \"aws-cdk-lib\";\nimport {\n  AutoScalingGroup,\n  BlockDeviceVolume,\n  EbsDeviceVolumeType,\n} from \"aws-cdk-lib/aws-autoscaling\";\nimport { Port, UserData } from \"aws-cdk-lib/aws-ec2\";\nimport * as ecs from \"aws-cdk-lib/aws-ecs\";\nimport {\n  ApplicationLoadBalancedEc2Service,\n  ApplicationLoadBalancedEc2ServiceProps,\n} from \"aws-cdk-lib/aws-ecs-patterns\";\nimport { Construct } from \"constructs\";\nimport {\n  INeuronxInstanceType,\n  NeuronOptimizedMachineImage,\n  PytorchTrainingNeuronxImage,\n} from \"../neuronx\";\nimport { NeuronxCompiledModel } from \"../neuronx-compiler\";\n\nexport interface NeuronxTaskDefinitionPropsBase\n  extends ecs.Ec2TaskDefinitionProps {\n  /**\n   * The instance type of compile worker instance.\n   */\n  readonly neuronxInstanceType?: INeuronxInstanceType;\n  /**\n   * The number of tensor parallel size.\n   * @default - 1\n   */\n  readonly tensorParallelSize?: number;\n}\n\nexport interface NeuronxTaskDefinitionProps extends NeuronxTaskDefinitionPropsBase {\n  /**\n   * The model to be compiled.\n   */\n  readonly compiledModel: NeuronxCompiledModel;\n}\n\nexport interface INeuronxTaskDefinition extends ecs.IEc2TaskDefinition {\n  readonly neuronxInstanceType: INeuronxInstanceType;\n  readonly tensorParallelSize: number;\n  readonly tasksPerInstance: number;\n  readonly compiledModel: NeuronxCompiledModel;\n}\nexport class NeuronxTaskDefinition\n  extends ecs.Ec2TaskDefinition\n  implements INeuronxTaskDefinition\n{\n  readonly neuronxInstanceType: INeuronxInstanceType;\n  readonly tensorParallelSize: number;\n  readonly tasksPerInstance: number;\n  readonly compiledModel: NeuronxCompiledModel;\n  protected readonly linuxParameters: ecs.LinuxParameters;\n  constructor(scope: Construct, id: string, props: NeuronxTaskDefinitionProps) {\n    const neuronxInstanceType =\n      props.neuronxInstanceType ?? props.compiledModel.compileTimeInstanceType;\n    const tensorParallelSize = props.tensorParallelSize ?? 1;\n    const tasksPerInstance = Math.floor(\n      neuronxInstanceType.acceleratorChips.neuronxCores / tensorParallelSize,\n    );\n    const placementConstraints =\n      tasksPerInstance >= 2\n        ? [\n            ecs.PlacementConstraint.memberOf(\n              `runningTasksCount<${tasksPerInstance}`,\n            ),\n          ]\n        : [];\n    super(scope, id, {\n      ...props,\n      placementConstraints: [\n        ...(props.placementConstraints ?? []),\n        ...placementConstraints,\n      ],\n    });\n    this.linuxParameters = new ecs.LinuxParameters(this, \"LinuxParameters\");\n    this.linuxParameters.addDevices(\n      ...Array.from({\n        length: neuronxInstanceType?.acceleratorChips.chips ?? 1,\n      }).map<ecs.Device>((_, index) => ({\n        hostPath: `/dev/neuron${index}`,\n        containerPath: `/dev/neuron${index}`,\n        permissions: [ecs.DevicePermission.READ, ecs.DevicePermission.WRITE],\n      })),\n    );\n    if (this.executionRole) {\n      props.compiledModel.bucket.grantRead(this.executionRole);\n    }\n    props.compiledModel.bucket.grantRead(this.taskRole);\n    this.compiledModel = props.compiledModel;\n    this.neuronxInstanceType = neuronxInstanceType;\n    this.tensorParallelSize = tensorParallelSize;\n    this.tasksPerInstance = tasksPerInstance;\n  }\n\n  addContainerWithDefault(\n    id: string,\n    props: ecs.ContainerDefinitionOptions,\n  ): ecs.ContainerDefinition {\n    const container = super.addContainer(id, {\n      logging: ecs.LogDriver.awsLogs({\n        streamPrefix: id,\n      }),\n      linuxParameters: this.linuxParameters,\n      memoryReservationMiB: Math.ceil(\n        (this.neuronxInstanceType.memory.toMebibytes() * 0.8) /\n          this.tasksPerInstance,\n      ),\n      ...props,\n    });\n    container.addMountPoints({\n      sourceVolume: \"model\",\n      containerPath: \"/opt/ml/model\",\n      readOnly: false,\n    });\n    return container;\n  }\n}\n\nexport interface ApplicationLoadBalancedNeuronxServiceProps extends ApplicationLoadBalancedEc2ServiceProps {}\nexport class ApplicationLoadBalancedNeuronxService extends ApplicationLoadBalancedEc2Service {\n  constructor(\n    scope: Construct,\n    id: string,\n    props: ApplicationLoadBalancedNeuronxServiceProps,\n  ) {\n    const neuronxTaskDefinition = props.taskDefinition;\n    if (\n      !neuronxTaskDefinition ||\n      !(neuronxTaskDefinition instanceof NeuronxTaskDefinition)\n    ) {\n      throw new Error(\"taskDefinition must extend NeuronxTaskDefinition\");\n    }\n    super(scope, id, {\n      healthCheckGracePeriod:\n        props.healthCheckGracePeriod ?? Duration.minutes(15),\n      ...props,\n    });\n\n    const cluster = this.getDefaultCluster(this, props.vpc);\n\n    // install and mount mountpoint for s3\n    const userData = UserData.forLinux();\n    userData.addCommands(`\n#!/bin/bash -e\n\n# Install Mountpoint\nMP_RPM=$(mktemp --suffix=.rpm)\ncurl https://s3.amazonaws.com/mountpoint-s3-release/latest/x86_64/mount-s3.rpm > $MP_RPM\n\n# cloud-init installs conflict with SSM agent: https://github.com/amazonlinux/amazon-linux-2023/issues/397\nattempt=0\nmax_attempts=5\nuntil dnf install -y $MP_RPM; do\n    attempt=$((attempt + 1))\n    if [ $attempt -ge $max_attempts ]; then\n        echo \"Failed to install mount-s3 after $max_attempts attempts. Exiting.\"\n        exit 1\n    fi\n    echo \"dnf install mount-s3 failed (attempt $attempt/$max_attempts), retrying in 3 seconds...\"\n    sleep 3\ndone\n\nrm $MP_RPM\n\n# Setup the fstab file and create the mount\nmkdir --parents /mnt/${neuronxTaskDefinition.compiledModel.bucket.bucketName}\nmount-s3 ${neuronxTaskDefinition.compiledModel.bucket.bucketName} /mnt/${neuronxTaskDefinition.compiledModel.bucket.bucketName} --allow-other --file-mode=644 --dir-mode=755`);\n\n    neuronxTaskDefinition.addVolume({\n      name: \"model\",\n      host: {\n        sourcePath: `/mnt/${neuronxTaskDefinition.compiledModel.bucket.bucketName}`,\n      },\n    });\n\n    const volumeSize = Math.ceil(\n      PytorchTrainingNeuronxImage.size.toGibibytes() +\n        NeuronOptimizedMachineImage.size.toGibibytes(),\n    );\n    const desiredCapacity = Math.ceil(\n      (props.desiredCount ?? 1) / neuronxTaskDefinition.tasksPerInstance,\n    );\n    const autoScalingGroup = new AutoScalingGroup(this, \"AutoScalingGroup\", {\n      vpc: cluster.vpc,\n      instanceType: neuronxTaskDefinition.neuronxInstanceType.instanceType,\n      machineImage: new NeuronOptimizedMachineImage(\n        this,\n        \"NeuronOptimizedMachineImage\",\n      ),\n      blockDevices: [\n        {\n          deviceName: \"/dev/xvda\",\n          volume: BlockDeviceVolume.ebs(volumeSize, {\n            volumeType: EbsDeviceVolumeType.GP3,\n            encrypted: true,\n          }),\n        },\n      ],\n      userData,\n      desiredCapacity,\n      maxCapacity:\n        neuronxTaskDefinition.tasksPerInstance === 1\n          ? desiredCapacity + 1\n          : undefined,\n    });\n    autoScalingGroup.connections.allowFrom(\n      this.loadBalancer,\n      Port.tcpRange(32768, 60999),\n    );\n    neuronxTaskDefinition.compiledModel.bucket.grantRead(autoScalingGroup);\n    const provider = new ecs.AsgCapacityProvider(this, \"AsgCapacityProvider\", {\n      autoScalingGroup,\n    });\n    cluster.addAsgCapacityProvider(provider);\n  }\n}\n"]}
|
|
144
|
+
ApplicationLoadBalancedNeuronxService[_b] = { fqn: "aws-cdk-neuronx-patterns.ApplicationLoadBalancedNeuronxService", version: "0.3.0" };
|
|
145
|
+
//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"application-load-balanced-neuronx-service.js","sourceRoot":"","sources":["../../../src/base/aws-ecs-patterns/application-load-balanced-neuronx-service.ts"],"names":[],"mappings":";;;;;AAAA,6CAAuC;AACvC,iEAIqC;AACrC,iDAAqD;AACrD,2CAA2C;AAC3C,mEAGsC;AAEtC,wCAIoB;AA6BpB,MAAa,qBACX,SAAQ,GAAG,CAAC,iBAAiB;IAQ7B,YAAY,KAAgB,EAAE,EAAU,EAAE,KAAiC;QACzE,MAAM,mBAAmB,GACvB,KAAK,CAAC,mBAAmB,IAAI,KAAK,CAAC,aAAa,CAAC,uBAAuB,CAAC;QAC3E,MAAM,kBAAkB,GAAG,KAAK,CAAC,kBAAkB,IAAI,CAAC,CAAC;QACzD,MAAM,gBAAgB,GAAG,IAAI,CAAC,KAAK,CACjC,mBAAmB,CAAC,gBAAgB,CAAC,YAAY,GAAG,kBAAkB,CACvE,CAAC;QACF,MAAM,oBAAoB,GACxB,gBAAgB,IAAI,CAAC;YACnB,CAAC,CAAC;gBACE,GAAG,CAAC,mBAAmB,CAAC,QAAQ,CAC9B,qBAAqB,gBAAgB,EAAE,CACxC;aACF;YACH,CAAC,CAAC,EAAE,CAAC;QACT,KAAK,CAAC,KAAK,EAAE,EAAE,EAAE;YACf,GAAG,KAAK;YACR,oBAAoB,EAAE;gBACpB,GAAG,CAAC,KAAK,CAAC,oBAAoB,IAAI,EAAE,CAAC;gBACrC,GAAG,oBAAoB;aACxB;SACF,CAAC,CAAC;QACH,IAAI,CAAC,eAAe,GAAG,IAAI,GAAG,CAAC,eAAe,CAAC,IAAI,EAAE,iBAAiB,CAAC,CAAC;QACxE,IAAI,CAAC,eAAe,CAAC,UAAU,CAC7B,GAAG,KAAK,CAAC,IAAI,CAAC;YACZ,MAAM,EAAE,mBAAmB,EAAE,gBAAgB,CAAC,KAAK,IAAI,CAAC;SACzD,CAAC,CAAC,GAAG,CAAa,CAAC,CAAC,EAAE,KAAK,EAAE,EAAE,CAAC,CAAC;YAChC,QAAQ,EAAE,cAAc,KAAK,EAAE;YAC/B,aAAa,EAAE,cAAc,KAAK,EAAE;YACpC,WAAW,EAAE,CAAC,GAAG,CAAC,gBAAgB,CAAC,IAAI,EAAE,GAAG,CAAC,gBAAgB,CAAC,KAAK,CAAC;SACrE,CAAC,CAAC,CACJ,CAAC;QACF,IAAI,IAAI,CAAC,aAAa,EAAE,CAAC;YACvB,KAAK,CAAC,aAAa,CAAC,MAAM,CAAC,SAAS,CAAC,IAAI,CAAC,aAAa,CAAC,CAAC;QAC3D,CAAC;QACD,KAAK,CAAC,aAAa,CAAC,MAAM,CAAC,SAAS,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QACpD,IAAI,CAAC,aAAa,GAAG,KAAK,CAAC,aAAa,CAAC;QACzC,IAAI,CAAC,mBAAmB,GAAG,mBAAmB,CAAC;QAC/C,IAAI,CAAC,kBAAkB,GAAG,kBAAkB,CAAC;QAC7C,IAAI,CAAC,gBAAgB,GAAG,gBAAgB,CAAC;IAC3C,CAAC;IAED,uBAAuB,CACrB,EAAU,EACV,KAAqC;QAErC,MAAM,SAAS,GAAG,KAAK,CAAC,YAAY,CAAC,EAAE,EAAE;YACvC,OAAO,EAAE,GAAG,CAAC,SAAS,CAAC,OAAO,CAAC;gBAC7B,YAAY,EAAE,EAAE;aACjB,CAAC;YACF,eAAe,EAAE,IAAI,CAAC,eAAe;YACrC,oBAAoB,EAAE,IAAI,CAAC,IAAI,CAC7B,CAAC,IAAI,CAAC,mBAAmB,CAAC,MAAM,CAAC,WAAW,EAAE,GAAG,GAAG,CAAC;gBACnD,IAAI,CAAC,gBAAgB,CACxB;YACD,GAAG,KAAK;SACT,CAAC,CAAC;QACH,SAAS,CAAC,cAAc,CAAC;YACvB,YAAY,EAAE,OAAO;YACrB,aAAa,EAAE,eAAe;YAC9B,QAAQ,EAAE,KAAK;SAChB,CAAC,CAAC;QACH,OAAO,SAAS,CAAC;IACnB,CAAC;;AAxEH,sDAyEC;;;AAGD,MAAa,qCAAsC,SAAQ,oDAAiC;IAC1F,YACE,KAAgB,EAChB,EAAU,EACV,KAAiD;QAEjD,MAAM,qBAAqB,GAAG,KAAK,CAAC,cAAc,CAAC;QACnD,IACE,CAAC,qBAAqB;YACtB,CAAC,CAAC,qBAAqB,YAAY,qBAAqB,CAAC,EACzD,CAAC;YACD,MAAM,IAAI,KAAK,CAAC,kDAAkD,CAAC,CAAC;QACtE,CAAC;QACD,KAAK,CAAC,KAAK,EAAE,EAAE,EAAE;YACf,sBAAsB,EACpB,KAAK,CAAC,sBAAsB,IAAI,sBAAQ,CAAC,OAAO,CAAC,EAAE,CAAC;YACtD,GAAG,KAAK;SACT,CAAC,CAAC;QAEH,MAAM,OAAO,GAAG,IAAI,CAAC,iBAAiB,CAAC,IAAI,EAAE,KAAK,CAAC,GAAG,CAAC,CAAC;QAExD,sCAAsC;QACtC,MAAM,QAAQ,GAAG,kBAAQ,CAAC,QAAQ,EAAE,CAAC;QACrC,QAAQ,CAAC,WAAW,CAAC;;;;;;;;;;;;;;;;;;;;;;;uBAuBF,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU;WACjE,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU,SAAS,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU,+CAA+C,CAAC,CAAC;QAE3K,qBAAqB,CAAC,SAAS,CAAC;YAC9B,IAAI,EAAE,OAAO;YACb,IAAI,EAAE;gBACJ,UAAU,EAAE,QAAQ,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU,EAAE;aAC5E;SACF,CAAC,CAAC;QAEH,MAAM,UAAU,GAAG,IAAI,CAAC,IAAI,CAC1B,qCAA2B,CAAC,IAAI,CAAC,WAAW,EAAE;YAC5C,qCAA2B,CAAC,IAAI,CAAC,WAAW,EAAE,CACjD,CAAC;QACF,MAAM,eAAe,GAAG,IAAI,CAAC,IAAI,CAC/B,CAAC,KAAK,CAAC,YAAY,IAAI,CAAC,CAAC,GAAG,qBAAqB,CAAC,gBAAgB,CACnE,CAAC;QACF,MAAM,gBAAgB,GAAG,IAAI,kCAAgB,CAAC,IAAI,EAAE,kBAAkB,EAAE;YACtE,GAAG,EAAE,OAAO,CAAC,GAAG;YAChB,YAAY,EAAE,qBAAqB,CAAC,mBAAmB,CAAC,YAAY;YACpE,YAAY,EAAE,IAAI,qCAA2B,CAC3C,IAAI,EACJ,6BAA6B,CAC9B;YACD,YAAY,EAAE;gBACZ;oBACE,UAAU,EAAE,WAAW;oBACvB,MAAM,EAAE,mCAAiB,CAAC,GAAG,CAAC,UAAU,EAAE;wBACxC,UAAU,EAAE,qCAAmB,CAAC,GAAG;wBACnC,SAAS,EAAE,IAAI;qBAChB,CAAC;iBACH;aACF;YACD,QAAQ;YACR,eAAe;YACf,WAAW,EACT,qBAAqB,CAAC,gBAAgB,KAAK,CAAC;gBAC1C,CAAC,CAAC,eAAe,GAAG,CAAC;gBACrB,CAAC,CAAC,SAAS;SAChB,CAAC,CAAC;QACH,gBAAgB,CAAC,WAAW,CAAC,SAAS,CACpC,IAAI,CAAC,YAAY,EACjB,cAAI,CAAC,QAAQ,CAAC,KAAK,EAAE,KAAK,CAAC,CAC5B,CAAC;QACF,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,SAAS,CAAC,gBAAgB,CAAC,CAAC;QACvE,MAAM,QAAQ,GAAG,IAAI,GAAG,CAAC,mBAAmB,CAAC,IAAI,EAAE,qBAAqB,EAAE;YACxE,gBAAgB;SACjB,CAAC,CAAC;QACH,OAAO,CAAC,sBAAsB,CAAC,QAAQ,CAAC,CAAC;IAC3C,CAAC;;AA/FH,sFAgGC","sourcesContent":["import { Duration } from \"aws-cdk-lib\";\nimport {\n  AutoScalingGroup,\n  BlockDeviceVolume,\n  EbsDeviceVolumeType,\n} from \"aws-cdk-lib/aws-autoscaling\";\nimport { Port, UserData } from \"aws-cdk-lib/aws-ec2\";\nimport * as ecs from \"aws-cdk-lib/aws-ecs\";\nimport {\n  ApplicationLoadBalancedEc2Service,\n  ApplicationLoadBalancedEc2ServiceProps,\n} from \"aws-cdk-lib/aws-ecs-patterns\";\nimport { Construct } from \"constructs\";\nimport {\n  INeuronxInstanceType,\n  NeuronOptimizedMachineImage,\n  PytorchTrainingNeuronxImage,\n} from \"../neuronx\";\nimport { NeuronxCompiledModel } from \"../neuronx-compiler\";\n\nexport interface NeuronxTaskDefinitionPropsBase\n  extends ecs.Ec2TaskDefinitionProps {\n  /**\n   * The instance type of compile worker instance.\n   */\n  readonly neuronxInstanceType?: INeuronxInstanceType;\n  /**\n   * The number of tensor parallel size.\n   * @default - 1\n   */\n  readonly tensorParallelSize?: number;\n}\n\nexport interface NeuronxTaskDefinitionProps extends NeuronxTaskDefinitionPropsBase {\n  /**\n   * The model to be compiled.\n   */\n  readonly compiledModel: NeuronxCompiledModel;\n}\n\nexport interface INeuronxTaskDefinition extends ecs.IEc2TaskDefinition {\n  readonly neuronxInstanceType: INeuronxInstanceType;\n  readonly tensorParallelSize: number;\n  readonly tasksPerInstance: number;\n  readonly compiledModel: NeuronxCompiledModel;\n}\nexport class NeuronxTaskDefinition\n  extends ecs.Ec2TaskDefinition\n  implements INeuronxTaskDefinition\n{\n  readonly neuronxInstanceType: INeuronxInstanceType;\n  readonly tensorParallelSize: number;\n  readonly tasksPerInstance: number;\n  readonly compiledModel: NeuronxCompiledModel;\n  protected readonly linuxParameters: ecs.LinuxParameters;\n  constructor(scope: Construct, id: string, props: NeuronxTaskDefinitionProps) {\n    const neuronxInstanceType =\n      props.neuronxInstanceType ?? props.compiledModel.recommendedInstanceType;\n    const tensorParallelSize = props.tensorParallelSize ?? 1;\n    const tasksPerInstance = Math.floor(\n      neuronxInstanceType.acceleratorChips.neuronxCores / tensorParallelSize,\n    );\n    const placementConstraints =\n      tasksPerInstance >= 2\n        ? [\n            ecs.PlacementConstraint.memberOf(\n              `runningTasksCount<${tasksPerInstance}`,\n            ),\n          ]\n        : [];\n    super(scope, id, {\n      ...props,\n      placementConstraints: [\n        ...(props.placementConstraints ?? []),\n        ...placementConstraints,\n      ],\n    });\n    this.linuxParameters = new ecs.LinuxParameters(this, \"LinuxParameters\");\n    this.linuxParameters.addDevices(\n      ...Array.from({\n        length: neuronxInstanceType?.acceleratorChips.chips ?? 1,\n      }).map<ecs.Device>((_, index) => ({\n        hostPath: `/dev/neuron${index}`,\n        containerPath: `/dev/neuron${index}`,\n        permissions: [ecs.DevicePermission.READ, ecs.DevicePermission.WRITE],\n      })),\n    );\n    if (this.executionRole) {\n      props.compiledModel.bucket.grantRead(this.executionRole);\n    }\n    props.compiledModel.bucket.grantRead(this.taskRole);\n    this.compiledModel = props.compiledModel;\n    this.neuronxInstanceType = neuronxInstanceType;\n    this.tensorParallelSize = tensorParallelSize;\n    this.tasksPerInstance = tasksPerInstance;\n  }\n\n  addContainerWithDefault(\n    id: string,\n    props: ecs.ContainerDefinitionOptions,\n  ): ecs.ContainerDefinition {\n    const container = super.addContainer(id, {\n      logging: ecs.LogDriver.awsLogs({\n        streamPrefix: id,\n      }),\n      linuxParameters: this.linuxParameters,\n      memoryReservationMiB: Math.ceil(\n        (this.neuronxInstanceType.memory.toMebibytes() * 0.8) /\n          this.tasksPerInstance,\n      ),\n      ...props,\n    });\n    container.addMountPoints({\n      sourceVolume: \"model\",\n      containerPath: \"/opt/ml/model\",\n      readOnly: false,\n    });\n    return container;\n  }\n}\n\nexport interface ApplicationLoadBalancedNeuronxServiceProps extends ApplicationLoadBalancedEc2ServiceProps {}\nexport class ApplicationLoadBalancedNeuronxService extends ApplicationLoadBalancedEc2Service {\n  constructor(\n    scope: Construct,\n    id: string,\n    props: ApplicationLoadBalancedNeuronxServiceProps,\n  ) {\n    const neuronxTaskDefinition = props.taskDefinition;\n    if (\n      !neuronxTaskDefinition ||\n      !(neuronxTaskDefinition instanceof NeuronxTaskDefinition)\n    ) {\n      throw new Error(\"taskDefinition must extend NeuronxTaskDefinition\");\n    }\n    super(scope, id, {\n      healthCheckGracePeriod:\n        props.healthCheckGracePeriod ?? Duration.minutes(15),\n      ...props,\n    });\n\n    const cluster = this.getDefaultCluster(this, props.vpc);\n\n    // install and mount mountpoint for s3\n    const userData = UserData.forLinux();\n    userData.addCommands(`\n#!/bin/bash -e\n\n# Install Mountpoint\nMP_RPM=$(mktemp --suffix=.rpm)\ncurl https://s3.amazonaws.com/mountpoint-s3-release/latest/x86_64/mount-s3.rpm > $MP_RPM\n\n# cloud-init installs conflict with SSM agent: https://github.com/amazonlinux/amazon-linux-2023/issues/397\nattempt=0\nmax_attempts=5\nuntil dnf install -y $MP_RPM; do\n    attempt=$((attempt + 1))\n    if [ $attempt -ge $max_attempts ]; then\n        echo \"Failed to install mount-s3 after $max_attempts attempts. Exiting.\"\n        exit 1\n    fi\n    echo \"dnf install mount-s3 failed (attempt $attempt/$max_attempts), retrying in 3 seconds...\"\n    sleep 3\ndone\n\nrm $MP_RPM\n\n# Setup the fstab file and create the mount\nmkdir --parents /mnt/${neuronxTaskDefinition.compiledModel.bucket.bucketName}\nmount-s3 ${neuronxTaskDefinition.compiledModel.bucket.bucketName} /mnt/${neuronxTaskDefinition.compiledModel.bucket.bucketName} --allow-other --file-mode=644 --dir-mode=755`);\n\n    neuronxTaskDefinition.addVolume({\n      name: \"model\",\n      host: {\n        sourcePath: `/mnt/${neuronxTaskDefinition.compiledModel.bucket.bucketName}`,\n      },\n    });\n\n    const volumeSize = Math.ceil(\n      PytorchTrainingNeuronxImage.size.toGibibytes() +\n        NeuronOptimizedMachineImage.size.toGibibytes(),\n    );\n    const desiredCapacity = Math.ceil(\n      (props.desiredCount ?? 1) / neuronxTaskDefinition.tasksPerInstance,\n    );\n    const autoScalingGroup = new AutoScalingGroup(this, \"AutoScalingGroup\", {\n      vpc: cluster.vpc,\n      instanceType: neuronxTaskDefinition.neuronxInstanceType.instanceType,\n      machineImage: new NeuronOptimizedMachineImage(\n        this,\n        \"NeuronOptimizedMachineImage\",\n      ),\n      blockDevices: [\n        {\n          deviceName: \"/dev/xvda\",\n          volume: BlockDeviceVolume.ebs(volumeSize, {\n            volumeType: EbsDeviceVolumeType.GP3,\n            encrypted: true,\n          }),\n        },\n      ],\n      userData,\n      desiredCapacity,\n      maxCapacity:\n        neuronxTaskDefinition.tasksPerInstance === 1\n          ? desiredCapacity + 1\n          : undefined,\n    });\n    autoScalingGroup.connections.allowFrom(\n      this.loadBalancer,\n      Port.tcpRange(32768, 60999),\n    );\n    neuronxTaskDefinition.compiledModel.bucket.grantRead(autoScalingGroup);\n    const provider = new ecs.AsgCapacityProvider(this, \"AsgCapacityProvider\", {\n      autoScalingGroup,\n    });\n    cluster.addAsgCapacityProvider(provider);\n  }\n}\n"]}
|
|
@@ -63,7 +63,7 @@ class PytorchInferenceNeuronxImage extends PytorchNeuronxImage {
|
|
|
63
63
|
}
|
|
64
64
|
exports.PytorchInferenceNeuronxImage = PytorchInferenceNeuronxImage;
|
|
65
65
|
_b = PytorchInferenceNeuronxImage, _c = JSII_RTTI_SYMBOL_1;
|
|
66
|
-
PytorchInferenceNeuronxImage[_c] = { fqn: "aws-cdk-neuronx-patterns.PytorchInferenceNeuronxImage", version: "0.
|
|
66
|
+
PytorchInferenceNeuronxImage[_c] = { fqn: "aws-cdk-neuronx-patterns.PytorchInferenceNeuronxImage", version: "0.3.0" };
|
|
67
67
|
PytorchInferenceNeuronxImage.imageName = "public.ecr.aws/neuron/pytorch-inference-neuronx";
|
|
68
68
|
/** Neuron SDK 2.28.0 */
|
|
69
69
|
PytorchInferenceNeuronxImage.SDK_2_28_0 = _b.fromNeuronSdkVersion("2.28.0", "3.12", "2.9.0", "24.04");
|
|
@@ -87,7 +87,7 @@ class PytorchTrainingNeuronxImage extends PytorchNeuronxImage {
|
|
|
87
87
|
}
|
|
88
88
|
exports.PytorchTrainingNeuronxImage = PytorchTrainingNeuronxImage;
|
|
89
89
|
_d = JSII_RTTI_SYMBOL_1;
|
|
90
|
-
PytorchTrainingNeuronxImage[_d] = { fqn: "aws-cdk-neuronx-patterns.PytorchTrainingNeuronxImage", version: "0.
|
|
90
|
+
PytorchTrainingNeuronxImage[_d] = { fqn: "aws-cdk-neuronx-patterns.PytorchTrainingNeuronxImage", version: "0.3.0" };
|
|
91
91
|
PytorchTrainingNeuronxImage.imageName = "public.ecr.aws/neuron/pytorch-training-neuronx";
|
|
92
92
|
class VllmInferenceNeuronxImage extends NeuronxImage {
|
|
93
93
|
static fromNeuronSdkVersion(neuronSdkVersion, vllmVersion, pythonVersion, ubuntuVersion) {
|
|
@@ -101,7 +101,7 @@ class VllmInferenceNeuronxImage extends NeuronxImage {
|
|
|
101
101
|
}
|
|
102
102
|
exports.VllmInferenceNeuronxImage = VllmInferenceNeuronxImage;
|
|
103
103
|
_e = VllmInferenceNeuronxImage, _f = JSII_RTTI_SYMBOL_1;
|
|
104
|
-
VllmInferenceNeuronxImage[_f] = { fqn: "aws-cdk-neuronx-patterns.VllmInferenceNeuronxImage", version: "0.
|
|
104
|
+
VllmInferenceNeuronxImage[_f] = { fqn: "aws-cdk-neuronx-patterns.VllmInferenceNeuronxImage", version: "0.3.0" };
|
|
105
105
|
/** Neuron SDK 2.28.0 with vLLM 0.13.0 */
|
|
106
106
|
VllmInferenceNeuronxImage.SDK_2_28_0 = _e.fromNeuronSdkVersion("2.28.0", "0.13.0", "3.12", "24.04");
|
|
107
107
|
/** Neuron SDK 2.27.1 with vLLM 0.13.0 */
|
|
@@ -84,7 +84,7 @@ class Parameters {
|
|
|
84
84
|
}
|
|
85
85
|
exports.Parameters = Parameters;
|
|
86
86
|
_a = JSII_RTTI_SYMBOL_1;
|
|
87
|
-
Parameters[_a] = { fqn: "aws-cdk-neuronx-patterns.Parameters", version: "0.
|
|
87
|
+
Parameters[_a] = { fqn: "aws-cdk-neuronx-patterns.Parameters", version: "0.3.0" };
|
|
88
88
|
/**
|
|
89
89
|
* Compile target model.
|
|
90
90
|
*/
|
|
@@ -149,5 +149,5 @@ class Model {
|
|
|
149
149
|
}
|
|
150
150
|
exports.Model = Model;
|
|
151
151
|
_b = JSII_RTTI_SYMBOL_1;
|
|
152
|
-
Model[_b] = { fqn: "aws-cdk-neuronx-patterns.Model", version: "0.
|
|
152
|
+
Model[_b] = { fqn: "aws-cdk-neuronx-patterns.Model", version: "0.3.0" };
|
|
153
153
|
//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"model.js","sourceRoot":"","sources":["../../../src/base/neuronx/model.ts"],"names":[],"mappings":";;;;;AAAA,6CAA0C;AAG1C,IAAY,YAGX;AAHD,WAAY,YAAY;IACtB,gEAAiB,CAAA;IACjB,6DAAe,CAAA;AACjB,CAAC,EAHW,YAAY,4BAAZ,YAAY,QAGvB;AAED;;GAEG;AACH,IAAY,UAKX;AALD,WAAY,UAAU;IACpB;;OAEG;IACH,uBAAS,CAAA;AACX,CAAC,EALW,UAAU,0BAAV,UAAU,QAKrB;AAED;;GAEG;AACH,IAAY,QAaX;AAbD,WAAY,QAAQ;IAClB;;OAEG;IACH,6EAA2B,CAAA;IAC3B;;OAEG;IACH,uDAAgB,CAAA;IAChB;;OAEG;IACH,qFAA+B,CAAA;AACjC,CAAC,EAbW,QAAQ,wBAAR,QAAQ,QAanB;AAED;;GAEG;AACH,MAAa,UAAU;IACrB;;;;OAIG;IACH,MAAM,CAAC,OAAO,CAAC,UAAkB;QAC/B,OAAO,IAAI,UAAU,CAAC,UAAU,GAAG,OAAO,CAAC,CAAC;IAC9C,CAAC;IACD;;;;OAIG;IACH,MAAM,CAAC,OAAO,CAAC,UAAkB;QAC/B,OAAO,IAAI,UAAU,CAAC,UAAU,GAAG,UAAU,CAAC,CAAC;IACjD,CAAC;IACD;IACE;;OAEG;IACc,UAAkB;QAAlB,eAAU,GAAV,UAAU,CAAQ;IAClC,CAAC;IACJ;;;OAGG;IACH,SAAS;QACP,OAAO,IAAI,CAAC,UAAU,GAAG,OAAO,CAAC;IACnC,CAAC;IACD;;;OAGG;IACH,SAAS;QACP,OAAO,IAAI,CAAC,UAAU,GAAG,UAAU,CAAC;IACtC,CAAC;IACD,UAAU;QACR,OAAO,kBAAI,CAAC,SAAS,CAAC,IAAI,CAAC,SAAS,EAAE,GAAG,GAAG,CAAC,CAAC;IAChD,CAAC;;AAvCH,gCAwCC;;;AAiBD;;GAEG;AACH,MAAa,KAAK;IAChB;;;;;OAKG;IACH,MAAM,CAAC,eAAe,CAAC,OAAe,EAAE,OAAsB;QAC5D,MAAM,UAAU,GAAG,OAAO,EAAE,UAAU,IAAI,KAAK,CAAC,WAAW,CAAC,OAAO,CAAC,CAAC;QACrE,IAAI,CAAC,UAAU,EAAE,CAAC;YAChB,MAAM,IAAI,KAAK,CACb,yFAAyF,CAC1F,CAAC;QACJ,CAAC;QACD,OAAO,IAAI,KAAK,CAAC,OAAO,EAAE,OAAO,EAAE,SAAS,IAAI,OAAO,EAAE;YACvD,GAAG,OAAO;YACV,UAAU;SACX,CAAC,CAAC;IACL,CAAC;IACD;;;;;;OAMG;IACH,MAAM,CAAC,UAAU,CAAC,MAAe,EAAE,MAAc,EAAE,OAAsB;QACvE,IAAI,mBAAK,CAAC,YAAY,CAAC,MAAM,CAAC,IAAI,CAAC,OAAO,EAAE,SAAS,EAAE,CAAC;YACtD,MAAM,IAAI,KAAK,CAAC,iDAAiD,CAAC,CAAC;QACrE,CAAC;QACD,MAAM,SAAS,GAAG,OAAO,EAAE,SAAS,IAAI,MAAM,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;QACvE,MAAM,UAAU,GAAG,OAAO,EAAE,UAAU,IAAI,KAAK,CAAC,WAAW,CAAC,SAAS,CAAC,CAAC;QACvE,IAAI,CAAC,UAAU,EAAE,CAAC;YAChB,MAAM,IAAI,KAAK,CACb,yFAAyF,CAC1F,CAAC;QACJ,CAAC;QACD,OAAO,IAAI,KAAK,CACd,MAAM,CAAC,cAAc,CAAC,MAAM,CAAC,EAC7B,SAAS,EACT,EAAE,GAAG,OAAO,EAAE,UAAU,EAAE,EAC1B,MAAM,EACN,MAAM,CACP,CAAC;IACJ,CAAC;IACO,MAAM,CAAC,WAAW,CAAC,MAAc;QACvC,IAAI,CAAC;YACH,MAAM,OAAO,GAAG,MAAM,CAAC,KAAK,CAAC,YAAY,CAAC,CAAC;YAC3C,IAAI,OAAO,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;gBACjB,OAAO,UAAU,CAAC,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YAClD,CAAC;YACD,MAAM,OAAO,GAAG,MAAM,CAAC,KAAK,CAAC,YAAY,CAAC,CAAC;YAC3C,IAAI,OAAO,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;gBACjB,OAAO,UAAU,CAAC,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YAClD,CAAC;QACH,CAAC;QAAC,MAAM,CAAC;YACP,MAAM;QACR,CAAC;QACD,OAAO,SAAS,CAAC;IACnB,CAAC;IACD,YACW,OAAe,EACf,SAAiB,EACjB,OAAqB,EACrB,MAAgB,EAChB,MAAe;QAJf,YAAO,GAAP,OAAO,CAAQ;QACf,cAAS,GAAT,SAAS,CAAQ;QACjB,YAAO,GAAP,OAAO,CAAc;QACrB,WAAM,GAAN,MAAM,CAAU;QAChB,WAAM,GAAN,MAAM,CAAS;IACvB,CAAC;;AAlEN,sBAmEC","sourcesContent":["import { Size, Token } from \"aws-cdk-lib\";\nimport { IBucket } from \"aws-cdk-lib/aws-s3\";\n\nexport enum DataTypeBits {\n  BF16_OR_FP16 = 16,\n  FP8_OR_INT8 = 8,\n}\n\n/**\n * Quant data type.\n */\nexport enum QuantDtype {\n  /**\n   * int8 weight storage.\n   */\n  S8 = \"s8\",\n}\n\n/**\n * Optimization level.\n */\nexport enum OptLevel {\n  /**\n   * enables the core performance optimizations in the compiler, while also minimizing compile time.\n   */\n  MINIMIZING_COMPILE_TIME = 1,\n  /**\n   * provides the best balance between model performance and compile time.\n   */\n  BEST_BALANCE = 2,\n  /**\n   * may provide additional model execution performance but may incur longer compile times and higher host memory usage during model compilation.\n   */\n  MODEL_EXECUTION_PERFORMANCE = 3,\n}\n\n/**\n * Represents the amount of parameters.\n */\nexport class Parameters {\n  /**\n   * Create a Parameters representing an amount million.\n   * @param parameters number of parameters millionX\n   * @returns parameters\n   */\n  static million(parameters: number) {\n    return new Parameters(parameters * 1000000);\n  }\n  /**\n   * Create a Parameters representing an amount billion.\n   * @param parameters number of parameters billionX\n   * @returns parameters\n   */\n  static billion(parameters: number) {\n    return new Parameters(parameters * 1000000000);\n  }\n  private constructor(\n    /**\n     * number of paremters.\n     */\n    private readonly parameters: number,\n  ) {}\n  /**\n   * Return this number of parameters as million.\n   * @returns This number of parameters as million.\n   */\n  toMillion() {\n    return this.parameters / 1000000;\n  }\n  /**\n   * Return this number of parameters as billion.\n   * @returns This number of parameters as billion.\n   */\n  toBillion() {\n    return this.parameters / 1000000000;\n  }\n  weightSize() {\n    return Size.gibibytes(this.toBillion() * 2.5);\n  }\n}\n\nexport interface ModelConfig {\n  readonly layers: number;\n  readonly embeddingDimension: number;\n  readonly attentionHeads: number;\n}\n\n/**\n * Compile target model basic infromation\n */\nexport interface ModelOptions {\n  readonly parameters: Parameters;\n  readonly config?: ModelConfig;\n  readonly modelName?: string;\n}\n\n/**\n * Compile target model.\n */\nexport class Model {\n  /**\n   * model informations at HuggingFace\n   * @param modelId model id on the HuggingFace\n   * @param options model basic information\n   * @returns model instance\n   */\n  static fromHuggingFace(modelId: string, options?: ModelOptions) {\n    const parameters = options?.parameters ?? Model.maybeParams(modelId);\n    if (!parameters) {\n      throw new Error(\n        \"The number of parameters cannot be inferred from the model ID. Set optional parameters.\",\n      );\n    }\n    return new Model(modelId, options?.modelName ?? modelId, {\n      ...options,\n      parameters,\n    });\n  }\n  /**\n   * model informations at S3 Bucket\n   * @param bucket Model stored S3 Bucket\n   * @param prefix Model stored objects prefix\n   * @param options model basic information\n   * @returns model instance\n   */\n  static fromBucket(bucket: IBucket, prefix: string, options?: ModelOptions) {\n    if (Token.isUnresolved(prefix) && !options?.modelName) {\n      throw new Error(\"ModelName is required when prefix is unresolved\");\n    }\n    const modelName = options?.modelName ?? prefix.split(\"/\").slice(-1)[0];\n    const parameters = options?.parameters ?? Model.maybeParams(modelName);\n    if (!parameters) {\n      throw new Error(\n        \"The number of parameters cannot be inferred from the model ID. Set optional parameters.\",\n      );\n    }\n    return new Model(\n      bucket.s3UrlForObject(prefix),\n      modelName,\n      { ...options, parameters },\n      bucket,\n      prefix,\n    );\n  }\n  private static maybeParams(source: string) {\n    try {\n      const billion = source.match(/-(\\d+)[bB]/);\n      if (billion?.[1]) {\n        return Parameters.billion(parseInt(billion[1]));\n      }\n      const million = source.match(/-(\\d+)[mM]/);\n      if (million?.[1]) {\n        return Parameters.million(parseInt(million[1]));\n      }\n    } catch {\n      // NOP\n    }\n    return undefined;\n  }\n  private constructor(\n    readonly modelId: string,\n    readonly modelName: string,\n    readonly options: ModelOptions,\n    readonly bucket?: IBucket,\n    readonly prefix?: string,\n  ) {}\n}\n"]}
|
|
@@ -42,6 +42,6 @@ class NeuronOptimizedMachineImage extends constructs_1.Construct {
|
|
|
42
42
|
}
|
|
43
43
|
exports.NeuronOptimizedMachineImage = NeuronOptimizedMachineImage;
|
|
44
44
|
_a = JSII_RTTI_SYMBOL_1;
|
|
45
|
-
NeuronOptimizedMachineImage[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronOptimizedMachineImage", version: "0.
|
|
45
|
+
NeuronOptimizedMachineImage[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronOptimizedMachineImage", version: "0.3.0" };
|
|
46
46
|
NeuronOptimizedMachineImage.size = aws_cdk_lib_1.Size.gibibytes(30);
|
|
47
47
|
//# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoibmV1cm9uLW9wdGltaXplZC1tYWNoaW5lLWltYWdlLmpzIiwic291cmNlUm9vdCI6IiIsInNvdXJjZXMiOlsiLi4vLi4vLi4vc3JjL2Jhc2UvbmV1cm9ueC9uZXVyb24tb3B0aW1pemVkLW1hY2hpbmUtaW1hZ2UudHMiXSwibmFtZXMiOltdLCJtYXBwaW5ncyI6Ijs7Ozs7QUFBQSw2Q0FBbUQ7QUFDbkQsaURBSzZCO0FBQzdCLHVEQUEwRTtBQUMxRSwyQ0FBMkM7QUFDM0MsbUVBQXdEO0FBQ3hELDJDQUF1QztBQUN2Qyw2QkFBNkI7QUFFN0IsTUFBYSwyQkFDWCxTQUFRLHNCQUFTO0lBS2pCLElBQUksT0FBTztRQUNULE9BQU8sSUFBSSxDQUFDLFFBQVEsQ0FBQyxZQUFZLENBQUMsVUFBVSxDQUFDLENBQUM7SUFDaEQsQ0FBQztJQUVELFlBQVksS0FBZ0IsRUFBRSxFQUFVO1FBQ3RDLEtBQUssQ0FBQyxLQUFLLEVBQUUsRUFBRSxDQUFDLENBQUM7UUFFakIsTUFBTSxRQUFRLEdBQUcsSUFBSSwyQkFBUSxDQUFDLElBQUksRUFBRSxvQkFBb0IsRUFBRTtZQUN4RCxjQUFjLEVBQUUsSUFBSSw4QkFBaUIsQ0FBQyxJQUFJLEVBQUUsb0JBQW9CLEVBQUU7Z0JBQ2hFLElBQUksRUFBRSxpQkFBSSxDQUFDLFNBQVMsQ0FBQyxJQUFJLENBQUMsSUFBSSxDQUFDLFNBQVMsRUFBRSxxQkFBcUIsQ0FBQyxDQUFDO2dCQUNqRSxPQUFPLEVBQUUsZUFBZTtnQkFDeEIsT0FBTyxFQUFFLG9CQUFPLENBQUMsYUFBYTtnQkFDOUIsSUFBSSxFQUFFLHNDQUFzQzthQUM3QyxDQUFDO1NBQ0gsQ0FBQyxDQUFDO1FBQ0gsSUFBSSxDQUFDLFFBQVEsR0FBRyxJQUFJLDRCQUFjLENBQUMsSUFBSSxFQUFFLFlBQVksRUFBRTtZQUNyRCxZQUFZLEVBQUUsUUFBUSxDQUFDLFlBQVk7WUFDbkMsWUFBWSxFQUFFLG9CQUFvQjtZQUNsQyxVQUFVLEVBQUU7Z0JBQ1YsS0FBSyxFQUFFLEdBQUcsQ0FBQyxlQUFlLENBQUMsdUJBQXVCLENBQ2hELElBQUksRUFDSixPQUFPLEVBQ1AscUVBQXFFLENBQ3RFLENBQUMsV0FBVzthQUNkO1NBQ0YsQ0FBQyxDQUFDO0lBQ0wsQ0FBQztJQUNELFFBQVEsQ0FBQyxNQUFpQjtRQUN4QixPQUFPO1lBQ0wsT0FBTyxFQUFFLElBQUksQ0FBQyxPQUFPO1lBQ3JCLE1BQU0sRUFBRSw2QkFBbUIsQ0FBQyxLQUFLO1lBQ2pDLFFBQVEsRUFBRSxrQkFBUSxDQUFDLFFBQVEsRUFBRTtTQUM5QixDQUFDO0lBQ0osQ0FBQzs7QUF2Q0gsa0VBd0NDOzs7QUFwQ2lCLGdDQUFJLEdBQUcsa0JBQUksQ0FBQyxTQUFTLENBQUMsRUFBRSxDQUFDLENBQUMiLCJzb3VyY2VzQ29udGVudCI6WyJpbXBvcnQgeyBDdXN0b21SZXNvdXJjZSwgU2l6ZSB9IGZyb20gXCJhd3MtY2RrLWxpYlwiO1xuaW1wb3J0IHtcbiAgSU1hY2hpbmVJbWFnZSxcbiAgTWFjaGluZUltYWdlQ29uZmlnLFxuICBPcGVyYXRpbmdTeXN0ZW1UeXBlLFxuICBVc2VyRGF0YSxcbn0gZnJvbSBcImF3cy1jZGstbGliL2F3cy1lYzJcIjtcbmltcG9ydCB7IENvZGUsIFJ1bnRpbWUsIFNpbmdsZXRvbkZ1bmN0aW9uIH0gZnJvbSBcImF3cy1jZGstbGliL2F3cy1sYW1iZGFcIjtcbmltcG9ydCAqIGFzIHNzbSBmcm9tIFwiYXdzLWNkay1saWIvYXdzLXNzbVwiO1xuaW1wb3J0IHsgUHJvdmlkZXIgfSBmcm9tIFwiYXdzLWNkay1saWIvY3VzdG9tLXJlc291cmNlc1wiO1xuaW1wb3J0IHsgQ29uc3RydWN0IH0gZnJvbSBcImNvbnN0cnVjdHNcIjtcbmltcG9ydCAqIGFzIHBhdGggZnJvbSBcInBhdGhcIjtcblxuZXhwb3J0IGNsYXNzIE5ldXJvbk9wdGltaXplZE1hY2hpbmVJbWFnZVxuICBleHRlbmRzIENvbnN0cnVjdFxuICBpbXBsZW1lbnRzIElNYWNoaW5lSW1hZ2VcbntcbiAgc3RhdGljIHJlYWRvbmx5IHNpemUgPSBTaXplLmdpYmlieXRlcygzMCk7XG4gIHByaXZhdGUgcmVhZG9ubHkgcmVzb3VyY2U6IEN1c3RvbVJlc291cmNlO1xuICBnZXQgaW1hZ2VJZCgpIHtcbiAgICByZXR1cm4gdGhpcy5yZXNvdXJjZS5nZXRBdHRTdHJpbmcoXCJpbWFnZV9pZFwiKTtcbiAgfVxuXG4gIGNvbnN0cnVjdG9yKHNjb3BlOiBDb25zdHJ1Y3QsIGlkOiBzdHJpbmcpIHtcbiAgICBzdXBlcihzY29wZSwgaWQpO1xuXG4gICAgY29uc3QgcHJvdmlkZXIgPSBuZXcgUHJvdmlkZXIodGhpcywgXCJOZXVyb254QW1pUHJvdmlkZXJcIiwge1xuICAgICAgb25FdmVudEhhbmRsZXI6IG5ldyBTaW5nbGV0b25GdW5jdGlvbih0aGlzLCBcIk5ldXJvbnhBbWlGdW5jdGlvblwiLCB7XG4gICAgICAgIGNvZGU6IENvZGUuZnJvbUFzc2V0KHBhdGguam9pbihfX2Rpcm5hbWUsIFwicHJpdmF0ZS9uZXVyb254LWFtaVwiKSksXG4gICAgICAgIGhhbmRsZXI6IFwiaW5kZXgub25FdmVudFwiLFxuICAgICAgICBydW50aW1lOiBSdW50aW1lLk5PREVKU19MQVRFU1QsXG4gICAgICAgIHV1aWQ6IFwiMDhjOTg1MGEtNmYxMy00ZWQ0LTllMmQtNzg4OGQ3YjVhMjU4XCIsXG4gICAgICB9KSxcbiAgICB9KTtcbiAgICB0aGlzLnJlc291cmNlID0gbmV3IEN1c3RvbVJlc291cmNlKHRoaXMsIFwiTmV1cm9ueEFtaVwiLCB7XG4gICAgICBzZXJ2aWNlVG9rZW46IHByb3ZpZGVyLnNlcnZpY2VUb2tlbixcbiAgICAgIHJlc291cmNlVHlwZTogXCJDdXN0b206Ok5ldXJvbnhBbWlcIixcbiAgICAgIHByb3BlcnRpZXM6IHtcbiAgICAgICAgaW1hZ2U6IHNzbS5TdHJpbmdQYXJhbWV0ZXIuZnJvbVN0cmluZ1BhcmFtZXRlck5hbWUoXG4gICAgICAgICAgdGhpcyxcbiAgICAgICAgICBcIkltYWdlXCIsXG4gICAgICAgICAgXCIvYXdzL3NlcnZpY2UvZWNzL29wdGltaXplZC1hbWkvYW1hem9uLWxpbnV4LTIwMjMvbmV1cm9uL3JlY29tbWVuZGVkXCIsXG4gICAgICAgICkuc3RyaW5nVmFsdWUsXG4gICAgICB9LFxuICAgIH0pO1xuICB9XG4gIGdldEltYWdlKF9zY29wZTogQ29uc3RydWN0KTogTWFjaGluZUltYWdlQ29uZmlnIHtcbiAgICByZXR1cm4ge1xuICAgICAgaW1hZ2VJZDogdGhpcy5pbWFnZUlkLFxuICAgICAgb3NUeXBlOiBPcGVyYXRpbmdTeXN0ZW1UeXBlLkxJTlVYLFxuICAgICAgdXNlckRhdGE6IFVzZXJEYXRhLmZvckxpbnV4KCksXG4gICAgfTtcbiAgfVxufVxuIl19
|
|
@@ -14,7 +14,7 @@ class Inferentia2Chips {
|
|
|
14
14
|
}
|
|
15
15
|
exports.Inferentia2Chips = Inferentia2Chips;
|
|
16
16
|
_a = JSII_RTTI_SYMBOL_1;
|
|
17
|
-
Inferentia2Chips[_a] = { fqn: "aws-cdk-neuronx-patterns.Inferentia2Chips", version: "0.
|
|
17
|
+
Inferentia2Chips[_a] = { fqn: "aws-cdk-neuronx-patterns.Inferentia2Chips", version: "0.3.0" };
|
|
18
18
|
class Trainium1Chips {
|
|
19
19
|
constructor(chips) {
|
|
20
20
|
this.chips = chips;
|
|
@@ -24,7 +24,7 @@ class Trainium1Chips {
|
|
|
24
24
|
}
|
|
25
25
|
exports.Trainium1Chips = Trainium1Chips;
|
|
26
26
|
_b = JSII_RTTI_SYMBOL_1;
|
|
27
|
-
Trainium1Chips[_b] = { fqn: "aws-cdk-neuronx-patterns.Trainium1Chips", version: "0.
|
|
27
|
+
Trainium1Chips[_b] = { fqn: "aws-cdk-neuronx-patterns.Trainium1Chips", version: "0.3.0" };
|
|
28
28
|
class Trainium2Chips {
|
|
29
29
|
constructor(chips) {
|
|
30
30
|
this.chips = chips;
|
|
@@ -37,7 +37,7 @@ class Trainium2Chips {
|
|
|
37
37
|
}
|
|
38
38
|
exports.Trainium2Chips = Trainium2Chips;
|
|
39
39
|
_c = JSII_RTTI_SYMBOL_1;
|
|
40
|
-
Trainium2Chips[_c] = { fqn: "aws-cdk-neuronx-patterns.Trainium2Chips", version: "0.
|
|
40
|
+
Trainium2Chips[_c] = { fqn: "aws-cdk-neuronx-patterns.Trainium2Chips", version: "0.3.0" };
|
|
41
41
|
class NeuronxInstanceTypeBase {
|
|
42
42
|
constructor(props) {
|
|
43
43
|
this.instanceType = props.instanceType;
|
|
@@ -96,7 +96,7 @@ class NeuronxInstanceType {
|
|
|
96
96
|
}
|
|
97
97
|
exports.NeuronxInstanceType = NeuronxInstanceType;
|
|
98
98
|
_d = JSII_RTTI_SYMBOL_1;
|
|
99
|
-
NeuronxInstanceType[_d] = { fqn: "aws-cdk-neuronx-patterns.NeuronxInstanceType", version: "0.
|
|
99
|
+
NeuronxInstanceType[_d] = { fqn: "aws-cdk-neuronx-patterns.NeuronxInstanceType", version: "0.3.0" };
|
|
100
100
|
/**
|
|
101
101
|
* inf2.xlarge
|
|
102
102
|
*/
|
|
@@ -14,5 +14,7 @@ var __exportStar = (this && this.__exportStar) || function(m, exports) {
|
|
|
14
14
|
for (var p in m) if (p !== "default" && !Object.prototype.hasOwnProperty.call(exports, p)) __createBinding(exports, m, p);
|
|
15
15
|
};
|
|
16
16
|
Object.defineProperty(exports, "__esModule", { value: true });
|
|
17
|
-
__exportStar(require("./neuronx-compiler"), exports);
|
|
18
|
-
|
|
17
|
+
__exportStar(require("./neuronx-compiler-base"), exports);
|
|
18
|
+
__exportStar(require("./neuronx-native-compiler"), exports);
|
|
19
|
+
__exportStar(require("./neuronx-cross-compiler"), exports);
|
|
20
|
+
//# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoiaW5kZXguanMiLCJzb3VyY2VSb290IjoiIiwic291cmNlcyI6WyIuLi8uLi8uLi9zcmMvYmFzZS9uZXVyb254LWNvbXBpbGVyL2luZGV4LnRzIl0sIm5hbWVzIjpbXSwibWFwcGluZ3MiOiI7Ozs7Ozs7Ozs7Ozs7Ozs7QUFBQSwwREFBd0M7QUFDeEMsNERBQTBDO0FBQzFDLDJEQUF5QyIsInNvdXJjZXNDb250ZW50IjpbImV4cG9ydCAqIGZyb20gXCIuL25ldXJvbngtY29tcGlsZXItYmFzZVwiO1xuZXhwb3J0ICogZnJvbSBcIi4vbmV1cm9ueC1uYXRpdmUtY29tcGlsZXJcIjtcbmV4cG9ydCAqIGZyb20gXCIuL25ldXJvbngtY3Jvc3MtY29tcGlsZXJcIjtcbiJdfQ==
|
|
@@ -1,7 +1,8 @@
|
|
|
1
1
|
import { Size } from "aws-cdk-lib";
|
|
2
2
|
import * as batch from "aws-cdk-lib/aws-batch";
|
|
3
|
-
import
|
|
3
|
+
import { IVpc, SubnetSelection } from "aws-cdk-lib/aws-ec2";
|
|
4
4
|
import { ContainerImage } from "aws-cdk-lib/aws-ecs";
|
|
5
|
+
import { IRole } from "aws-cdk-lib/aws-iam";
|
|
5
6
|
import { IBucket } from "aws-cdk-lib/aws-s3";
|
|
6
7
|
import { Construct } from "constructs";
|
|
7
8
|
import { INeuronxInstanceType, Model } from "../neuronx";
|
|
@@ -19,13 +20,48 @@ export interface INeuronxContainerImage {
|
|
|
19
20
|
readonly neuronSdkVersion: string;
|
|
20
21
|
}
|
|
21
22
|
/**
|
|
22
|
-
*
|
|
23
|
+
* The model compiled by Neuronx compiler.
|
|
23
24
|
*/
|
|
24
|
-
export interface
|
|
25
|
+
export interface NeuronxCompiledModel {
|
|
26
|
+
/**
|
|
27
|
+
* The recommended Neuron instance type for running inference with this compiled model.
|
|
28
|
+
*/
|
|
29
|
+
readonly recommendedInstanceType: INeuronxInstanceType;
|
|
30
|
+
/**
|
|
31
|
+
* The bucket to upload compiled artifacts.
|
|
32
|
+
*/
|
|
33
|
+
readonly bucket: IBucket;
|
|
34
|
+
/**
|
|
35
|
+
* S3 URL that compiled artifact uploaded.
|
|
36
|
+
*/
|
|
37
|
+
readonly s3Uri: string;
|
|
38
|
+
/**
|
|
39
|
+
* S3 prefix that compiled artifact uploaded.
|
|
40
|
+
*/
|
|
41
|
+
readonly s3Prefix: string;
|
|
42
|
+
/**
|
|
43
|
+
* The model name.
|
|
44
|
+
*/
|
|
45
|
+
readonly modelName: string;
|
|
46
|
+
/**
|
|
47
|
+
* The weight size of the model.
|
|
48
|
+
*/
|
|
49
|
+
readonly weightSize: Size;
|
|
50
|
+
}
|
|
51
|
+
/**
|
|
52
|
+
* Interface for Neuronx compilers.
|
|
53
|
+
*/
|
|
54
|
+
export interface INeuronxCompiler {
|
|
55
|
+
compile(): NeuronxCompiledModel;
|
|
56
|
+
}
|
|
57
|
+
/**
|
|
58
|
+
* Common props for NeuronxCompilerBase.
|
|
59
|
+
*/
|
|
60
|
+
export interface NeuronxCompilerBaseProps {
|
|
25
61
|
/**
|
|
26
62
|
* VPC in which this will launch compile worker instance.
|
|
27
63
|
*/
|
|
28
|
-
readonly vpc:
|
|
64
|
+
readonly vpc: IVpc;
|
|
29
65
|
/**
|
|
30
66
|
* The bucket to upload compiled artifacts.
|
|
31
67
|
*/
|
|
@@ -53,10 +89,13 @@ export interface NeuronxCompilerProps {
|
|
|
53
89
|
* An image of the container where the compile job is executed.
|
|
54
90
|
*/
|
|
55
91
|
readonly image: INeuronxContainerImage;
|
|
92
|
+
/**
|
|
93
|
+
* The command to run in the container.
|
|
94
|
+
*/
|
|
56
95
|
readonly command?: string[];
|
|
57
96
|
/**
|
|
58
97
|
* The root volume of worker instance.
|
|
59
|
-
* @default - N
|
|
98
|
+
* @default - N billion parameters * 5GiB EBS
|
|
60
99
|
*/
|
|
61
100
|
readonly volumeSize?: Size;
|
|
62
101
|
/**
|
|
@@ -70,7 +109,7 @@ export interface NeuronxCompilerProps {
|
|
|
70
109
|
*
|
|
71
110
|
* @default - new subnets will be created
|
|
72
111
|
*/
|
|
73
|
-
readonly vpcSubnets?:
|
|
112
|
+
readonly vpcSubnets?: SubnetSelection;
|
|
74
113
|
/**
|
|
75
114
|
* The environment variables to pass to the container.
|
|
76
115
|
* This is only applicable when using container runtime.
|
|
@@ -81,40 +120,43 @@ export interface NeuronxCompilerProps {
|
|
|
81
120
|
[key: string]: string;
|
|
82
121
|
};
|
|
83
122
|
}
|
|
84
|
-
|
|
85
|
-
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
*/
|
|
89
|
-
readonly bucket: IBucket;
|
|
90
|
-
/**
|
|
91
|
-
* S3 URL that compiled artifact uploaded.
|
|
92
|
-
*/
|
|
93
|
-
readonly s3Uri: string;
|
|
123
|
+
/**
|
|
124
|
+
* Result of creating a compute environment.
|
|
125
|
+
*/
|
|
126
|
+
export interface ComputeEnvironmentResult {
|
|
94
127
|
/**
|
|
95
|
-
*
|
|
128
|
+
* The compute environment.
|
|
96
129
|
*/
|
|
97
|
-
readonly
|
|
130
|
+
readonly computeEnvironment: batch.IComputeEnvironment;
|
|
98
131
|
/**
|
|
99
|
-
* The
|
|
132
|
+
* The instance role associated with the compute environment.
|
|
100
133
|
*/
|
|
101
|
-
readonly
|
|
102
|
-
readonly weightSize: Size;
|
|
134
|
+
readonly instanceRole: IRole;
|
|
103
135
|
}
|
|
104
136
|
/**
|
|
105
|
-
* Neuronx
|
|
106
|
-
*
|
|
137
|
+
* Abstract base class for Neuronx compilers.
|
|
138
|
+
* Provides the common orchestration logic (Lambda, CustomResource, WaitCondition)
|
|
139
|
+
* while subclasses define how to create the Batch compute environment and job definition.
|
|
107
140
|
*/
|
|
108
|
-
export declare class
|
|
141
|
+
export declare abstract class NeuronxCompilerBase extends Construct implements INeuronxCompiler {
|
|
109
142
|
private compiledModel?;
|
|
110
143
|
private readonly entrypoint;
|
|
111
|
-
|
|
112
|
-
|
|
113
|
-
|
|
114
|
-
|
|
115
|
-
|
|
116
|
-
|
|
117
|
-
|
|
118
|
-
|
|
144
|
+
protected readonly artifactS3Prefix: string;
|
|
145
|
+
protected readonly weightSize: Size;
|
|
146
|
+
protected readonly neuronxInstanceType: INeuronxInstanceType;
|
|
147
|
+
protected readonly model: Model;
|
|
148
|
+
protected readonly bucket: IBucket;
|
|
149
|
+
constructor(scope: Construct, id: string, props: NeuronxCompilerBaseProps);
|
|
150
|
+
/**
|
|
151
|
+
* Create the Batch compute environment.
|
|
152
|
+
* Subclasses must implement this to provide the appropriate compute environment.
|
|
153
|
+
*/
|
|
154
|
+
protected abstract createComputeEnvironment(props: NeuronxCompilerBaseProps): ComputeEnvironmentResult;
|
|
155
|
+
/**
|
|
156
|
+
* Create the Batch job definition.
|
|
157
|
+
* Subclasses must implement this to provide the appropriate job definition.
|
|
158
|
+
*/
|
|
159
|
+
protected abstract createJobDefinition(props: NeuronxCompilerBaseProps): batch.IJobDefinition;
|
|
160
|
+
private createJobQueue;
|
|
119
161
|
compile(): NeuronxCompiledModel;
|
|
120
162
|
}
|