aws-cdk-neuronx-patterns 0.2.1 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (31) hide show
  1. package/.jsii +604 -99
  2. package/API.md +990 -210
  3. package/README.ja.md +18 -6
  4. package/README.md +16 -5
  5. package/lib/base/aws-batch/neuronx-batch-compute-environment.js +1 -1
  6. package/lib/base/aws-batch/neuronx-batch-ecs-job-definition.js +1 -1
  7. package/lib/base/aws-batch/neuronx-batch.js +1 -1
  8. package/lib/base/aws-ecs-patterns/application-load-balanced-neuronx-service.js +4 -4
  9. package/lib/base/neuronx/deep-learning-containers.js +3 -3
  10. package/lib/base/neuronx/model.js +2 -2
  11. package/lib/base/neuronx/neuron-optimized-machine-image.js +1 -1
  12. package/lib/base/neuronx/neuronx-instance-type.js +4 -4
  13. package/lib/base/neuronx-compiler/index.d.ts +3 -1
  14. package/lib/base/neuronx-compiler/index.js +4 -2
  15. package/lib/base/neuronx-compiler/{neuronx-compiler.d.ts → neuronx-compiler-base.d.ts} +74 -32
  16. package/lib/base/neuronx-compiler/neuronx-compiler-base.js +129 -0
  17. package/lib/base/neuronx-compiler/neuronx-cross-compiler.d.ts +30 -0
  18. package/lib/base/neuronx-compiler/neuronx-cross-compiler.js +83 -0
  19. package/lib/base/neuronx-compiler/neuronx-native-compiler.d.ts +18 -0
  20. package/lib/base/neuronx-compiler/neuronx-native-compiler.js +69 -0
  21. package/lib/base/server-engine/vllm-engine/vllm-engine-argments.js +1 -1
  22. package/lib/sagemaker-inference-toolkit-tnx/sagemaker-inference-toolkit-tnx-compiler.js +2 -2
  23. package/lib/sagemaker-inference-toolkit-tnx/sagemaker-inference-toolkit-tnx-sagemaker.d.ts +1 -1
  24. package/lib/sagemaker-inference-toolkit-tnx/sagemaker-inference-toolkit-tnx-sagemaker.js +2 -2
  25. package/lib/vllm-nxd-inference/vllm-nxd-inference-compiler.d.ts +8 -0
  26. package/lib/vllm-nxd-inference/vllm-nxd-inference-compiler.js +32 -4
  27. package/lib/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.js +6 -6
  28. package/package.json +5 -5
  29. package/scripts/compile/vllm-nxd-inference/Dockerfile +5 -0
  30. package/scripts/compile/vllm-nxd-inference/entrypoint.sh +39 -14
  31. package/lib/base/neuronx-compiler/neuronx-compiler.js +0 -166
package/README.ja.md CHANGED
@@ -87,7 +87,10 @@ new cdk.CfnOutput(stack, "LoadBalancerDNS", {
87
87
  ## vLLM NxD Inference on ALB & ECS on EC2
88
88
 
89
89
  > [!WARNING]
90
- > このコンストラクトは EC2 上で Inferentia2 インスタンスを使用します。AWS アカウントで Inferentia2 インスタンスのサービスクォータを増やす必要がある場合があります。[Service Quotas コンソール](https://console.aws.amazon.com/servicequotas/)から申請してください。
90
+ > このコンストラクトは EC2 上で Inferentia2 インスタンスを推論に使用します。AWS アカウントで Inferentia2 インスタンスのサービスクォータを増やす必要がある場合があります。[Service Quotas コンソール](https://console.aws.amazon.com/servicequotas/)から申請してください。
91
+ >
92
+ > [!NOTE]
93
+ > モデルのコンパイルは標準(非 Neuron)EC2 インスタンス上でクロスコンパイルにより実行されるため、コンパイルフェーズでは Inferentia/Trainium のクォータは不要です。
91
94
 
92
95
  このパターンは、モデルのコンパイルに `VllmNxdInferenceCompiler` を、デプロイに `ApplicationLoadBalancedVllmNxDInferenceService` を組み合わせて使用します。HuggingFace で公開されているモデルを簡単にコンパイルし、Application Load Balancer を使った ECS にデプロイできます。
93
96
 
@@ -320,7 +323,16 @@ Secret は、コンパイル Batch Job と推論サーバーを実行する ECS
320
323
 
321
324
  ## Neuronx Compiler
322
325
 
323
- > [!WARNING]
326
+ > このコンストラクトは EC2 上で Inferentia2 インスタンスを使用します。AWS アカウントで Inferentia2 インスタンスのサービスクォータを増やす必要がある場合があります。
327
+
328
+ このコンストラクトは、Neuronx でサポートされているモデルをコンパイルし、指定された S3 バケットにアップロードします。コンストラクトは、モデルのパラメータ数に基づいて必要なインスタンスタイプを自動的に選択します。
329
+
330
+ コンパイラーには2つのバリアントがあります:
331
+
332
+ - **`NeuronxNativeCompiler`** — Neuron インスタンス(Inferentia2/Trainium)上でコンパイルします。Neuron デバイスクォータが必要です。
333
+ - **`NeuronxCrossCompiler`** — 標準 EC2 インスタンス(例:`c7i-flex.4xlarge`)上で Neuron ハードウェアなしにクロスコンパイルします。`VllmNxdInferenceCompiler` がデフォルトで使用します。
334
+
335
+ 両方とも `INeuronxCompiler` インターフェースを実装し、互換性のあるアーティファクトを生成します。
324
336
  > このコンストラクトは EC2 上で Inferentia2 インスタンスを使用します。AWS アカウントで Inferentia2 インスタンスのサービスクォータを増やす必要がある場合があります。
325
337
 
326
338
  このコンストラクトは、Neuronx でサポートされているモデルをコンパイルし、指定された S3 バケットにアップロードします。コンストラクトは、モデルのパラメータ数に基づいて必要なインスタンスタイプを自動的に選択します。
@@ -330,13 +342,13 @@ Secret は、コンパイル Batch Job と推論サーバーを実行する ECS
330
342
  ```ts
331
343
  import * as ec2 from "aws-cdk-lib/aws-ec2";
332
344
  import * as s3 from "aws-cdk-lib/aws-s3";
333
- import { NeuronxCompiler, Model } from "aws-cdk-neuronx-patterns";
345
+ import { NeuronxNativeCompiler, Model } from "aws-cdk-neuronx-patterns";
334
346
 
335
347
  declare const vpc: ec2.Vpc;
336
348
  declare const bucket: s3.Bucket;
337
349
  declare const image: INeuronxContainerImage;
338
350
 
339
- const compiler = new NeuronxCompiler(this, "NeuronxCompiler", {
351
+ const compiler = new NeuronxNativeCompiler(this, "NeuronxCompiler", {
340
352
  vpc,
341
353
  bucket,
342
354
  model: Model.fromHuggingFace("HuggingFaceTB/SmolLM-135M-Instruct"),
@@ -362,13 +374,13 @@ new cdk.CfnOutput(this, "CompiledArtifact", {
362
374
  ```ts
363
375
  import * as ec2 from "aws-cdk-lib/aws-ec2";
364
376
  import * as s3 from "aws-cdk-lib/aws-s3";
365
- import { NeuronxCompiler, Model } from "aws-cdk-neuronx-patterns";
377
+ import { NeuronxNativeCompiler, Model } from "aws-cdk-neuronx-patterns";
366
378
 
367
379
  declare const vpc: ec2.Vpc;
368
380
  declare const bucket: s3.Bucket;
369
381
  declare const image: INeuronxContainerImage;
370
382
 
371
- new NeuronxCompiler(this, "NeuronxCompiler", {
383
+ new NeuronxNativeCompiler(this, "NeuronxCompiler", {
372
384
  vpc,
373
385
  bucket,
374
386
  model: Model.fromHuggingFace("HuggingFaceTB/SmolLM-135M-Instruct"),
package/README.md CHANGED
@@ -87,7 +87,10 @@ new cdk.CfnOutput(stack, "LoadBalancerDNS", {
87
87
  ## vLLM NxD Inference on ALB & ECS on EC2
88
88
 
89
89
  > [!WARNING]
90
- > This construct uses an Inferentia2 instance on EC2. You may need to increase your service quota for Inferentia2 instances in your AWS account via the [Service Quotas console](https://console.aws.amazon.com/servicequotas/).
90
+ > This construct uses an Inferentia2 instance on EC2 for inference. You may need to increase your service quota for Inferentia2 instances in your AWS account via the [Service Quotas console](https://console.aws.amazon.com/servicequotas/).
91
+
92
+ > [!NOTE]
93
+ > Model compilation is performed on standard (non-Neuron) EC2 instances via cross-compilation, so no Inferentia/Trainium quota is needed for the compilation phase.
91
94
 
92
95
  This pattern combines `VllmNxdInferenceCompiler` for model compilation and `ApplicationLoadBalancedVllmNxDInferenceService` for deployment. Models published on HuggingFace can be easily compiled and deployed to ECS with Application Load Balancer.
93
96
 
@@ -325,18 +328,25 @@ The secret will be securely passed as an environment variable to the compilation
325
328
 
326
329
  This construct compiles models supported by Neuronx and uploads them to the specified S3 bucket. The construct automatically selects the required instance type based on the number of model parameters.
327
330
 
331
+ There are two compiler variants:
332
+
333
+ - **`NeuronxNativeCompiler`** — Compiles on Neuron instances (Inferentia2/Trainium). Requires Neuron device quota.
334
+ - **`NeuronxCrossCompiler`** — Compiles on standard EC2 instances (e.g., `c7i-flex.4xlarge`) without Neuron hardware. Used by `VllmNxdInferenceCompiler` by default.
335
+
336
+ Both implement the `INeuronxCompiler` interface and produce compatible artifacts.
337
+
328
338
  ![NeuronxCompiler architecture](./docs/neuronx-compile-architecture.png)
329
339
 
330
340
  ```ts
331
341
  import * as ec2 from "aws-cdk-lib/aws-ec2";
332
342
  import * as s3 from "aws-cdk-lib/aws-s3";
333
- import { NeuronxCompiler, Model } from "aws-cdk-neuronx-patterns";
343
+ import { NeuronxNativeCompiler, Model } from "aws-cdk-neuronx-patterns";
334
344
 
335
345
  declare const vpc: ec2.Vpc;
336
346
  declare const bucket: s3.Bucket;
337
347
  declare const image: INeuronxContainerImage;
338
348
 
339
- const compiler = new NeuronxCompiler(this, "NeuronxCompiler", {
349
+ const compiler = new NeuronxNativeCompiler(this, "NeuronxCompiler", {
340
350
  vpc,
341
351
  bucket,
342
352
  model: Model.fromHuggingFace("HuggingFaceTB/SmolLM-135M-Instruct"),
@@ -362,13 +372,13 @@ You can reduce costs by using Spot Instances for compilation:
362
372
  ```ts
363
373
  import * as ec2 from "aws-cdk-lib/aws-ec2";
364
374
  import * as s3 from "aws-cdk-lib/aws-s3";
365
- import { NeuronxCompiler, Model } from "aws-cdk-neuronx-patterns";
375
+ import { NeuronxNativeCompiler, Model } from "aws-cdk-neuronx-patterns";
366
376
 
367
377
  declare const vpc: ec2.Vpc;
368
378
  declare const bucket: s3.Bucket;
369
379
  declare const image: INeuronxContainerImage;
370
380
 
371
- new NeuronxCompiler(this, "NeuronxCompiler", {
381
+ new NeuronxNativeCompiler(this, "NeuronxCompiler", {
372
382
  vpc,
373
383
  bucket,
374
384
  model: Model.fromHuggingFace("HuggingFaceTB/SmolLM-135M-Instruct"),
@@ -395,6 +405,7 @@ For detailed API documentation, see [API.md](./API.md).
395
405
  For cost estimates, use the [AWS Pricing Calculator](https://calculator.aws).
396
406
 
397
407
  **Cost optimization tips:**
408
+ - The `VllmNxdInferenceCompiler` uses cross-compilation on standard EC2 instances by default, avoiding expensive Neuron instances during compilation
398
409
  - Use Spot Instances for compilation jobs (can save up to 90%)
399
410
  - Delete resources when not in use (`cdk destroy`)
400
411
  - Use appropriate instance sizes for your workload
@@ -44,5 +44,5 @@ class NeuronxBatchComputeEnvironment extends constructs_1.Construct {
44
44
  }
45
45
  exports.NeuronxBatchComputeEnvironment = NeuronxBatchComputeEnvironment;
46
46
  _a = JSII_RTTI_SYMBOL_1;
47
- NeuronxBatchComputeEnvironment[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxBatchComputeEnvironment", version: "0.2.1" };
47
+ NeuronxBatchComputeEnvironment[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxBatchComputeEnvironment", version: "0.3.0" };
48
48
  //# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoibmV1cm9ueC1iYXRjaC1jb21wdXRlLWVudmlyb25tZW50LmpzIiwic291cmNlUm9vdCI6IiIsInNvdXJjZXMiOlsiLi4vLi4vLi4vc3JjL2Jhc2UvYXdzLWJhdGNoL25ldXJvbngtYmF0Y2gtY29tcHV0ZS1lbnZpcm9ubWVudC50cyJdLCJuYW1lcyI6W10sIm1hcHBpbmdzIjoiOzs7OztBQUNBLCtDQUErQztBQUMvQyxpREFBcUQ7QUFFckQsMkNBQXVDO0FBQ3ZDLHdDQUF5RDtBQVF6RDs7R0FFRztBQUNILE1BQWEsOEJBQ1gsU0FBUSxzQkFBUztJQVVqQixJQUFJLHFCQUFxQjtRQUN2QixPQUFPLEVBQUUscUJBQXFCLEVBQUUsSUFBSSxDQUFDLHFCQUFxQixFQUFFLENBQUM7SUFDL0QsQ0FBQztJQUVELFlBQ0UsS0FBZ0IsRUFDaEIsRUFBVSxFQUNWLEtBQTBDO1FBRTFDLEtBQUssQ0FBQyxLQUFLLEVBQUUsRUFBRSxDQUFDLENBQUM7UUFFakIsTUFBTSxNQUFNLEdBQUcsS0FBSyxDQUFDLE1BQU0sSUFBSTtZQUM3QjtnQkFDRSxLQUFLLEVBQUUsSUFBSSxxQ0FBMkIsQ0FDcEMsSUFBSSxFQUNKLDZCQUE2QixDQUM5QjtnQkFDRCxTQUFTLEVBQUUsS0FBSyxDQUFDLG1CQUFtQixDQUFDLFVBQVU7YUFDaEQ7U0FDRixDQUFDO1FBQ0YsSUFBSSxDQUFDLFFBQVEsR0FBRyxJQUFJLEtBQUssQ0FBQywrQkFBK0IsQ0FDdkQsSUFBSSxFQUNKLFVBQVUsRUFDVjtZQUNFLEdBQUcsS0FBSztZQUNSLE1BQU07U0FDUCxDQUNGLENBQUM7UUFDRixJQUNFLEtBQUssQ0FBQyxjQUFjO1lBQ3BCLEtBQUssQ0FBQyxjQUFjLFlBQVksd0JBQWMsRUFDOUMsQ0FBQztZQUVDLElBQUksQ0FBQyxRQUFRLENBQUMsSUFBSSxDQUFDLFlBQ3BCLENBQUMsbUJBQW1CLENBQ25CLHlDQUF5QyxFQUN6QyxLQUFLLENBQUMsY0FBYyxDQUFDLG1CQUFtQixDQUN6QyxDQUFDO1FBQ0osQ0FBQztRQUVELElBQUksQ0FBQyxxQkFBcUIsR0FBRyxJQUFJLENBQUMsUUFBUSxDQUFDLHFCQUFxQixDQUFDO1FBQ2pFLElBQUksQ0FBQyxzQkFBc0IsR0FBRyxJQUFJLENBQUMsUUFBUSxDQUFDLHNCQUFzQixDQUFDO1FBQ25FLElBQUksQ0FBQyxPQUFPLEdBQUcsSUFBSSxDQUFDLFFBQVEsQ0FBQyxPQUFPLENBQUM7UUFDckMsSUFBSSxDQUFDLEdBQUcsR0FBRyxJQUFJLENBQUMsUUFBUSxDQUFDLEdBQUcsQ0FBQztRQUM3QixJQUFJLENBQUMsV0FBVyxHQUFHLElBQUksQ0FBQyxRQUFRLENBQUMsV0FBVyxDQUFDO1FBQzdDLElBQUksQ0FBQyxLQUFLLEdBQUcsSUFBSSxDQUFDLFFBQVEsQ0FBQyxLQUFLLENBQUM7UUFDakMsSUFBSSxDQUFDLFlBQVksR0FBRyxJQUFJLENBQUMsUUFBUSxDQUFDLFlBQWEsQ0FBQztJQUNsRCxDQUFDO0lBQ0Qsa0JBQWtCLENBQUMsTUFBcUI7UUFDdEMsSUFBSSxDQUFDLFFBQVEsQ0FBQyxrQkFBa0IsQ0FBQyxNQUFNLENBQUMsQ0FBQztJQUMzQyxDQUFDOztBQTdESCx3RUE4REMiLCJzb3VyY2VzQ29udGVudCI6WyJpbXBvcnQgeyBSZW1vdmFsUG9saWN5LCBSZXNvdXJjZUVudmlyb25tZW50LCBTdGFjayB9IGZyb20gXCJhd3MtY2RrLWxpYlwiO1xuaW1wb3J0ICogYXMgYmF0Y2ggZnJvbSBcImF3cy1jZGstbGliL2F3cy1iYXRjaFwiO1xuaW1wb3J0IHsgTGF1bmNoVGVtcGxhdGUgfSBmcm9tIFwiYXdzLWNkay1saWIvYXdzLWVjMlwiO1xuaW1wb3J0IHsgSVJvbGUgfSBmcm9tIFwiYXdzLWNkay1saWIvYXdzLWlhbVwiO1xuaW1wb3J0IHsgQ29uc3RydWN0IH0gZnJvbSBcImNvbnN0cnVjdHNcIjtcbmltcG9ydCB7IE5ldXJvbk9wdGltaXplZE1hY2hpbmVJbWFnZSB9IGZyb20gXCIuLi9uZXVyb254XCI7XG5cbi8qKlxuICogUHJvcHMgb2YgTmV1cm9ueEJhdGNoLlxuICovXG5leHBvcnQgaW50ZXJmYWNlIE5ldXJvbnhCYXRjaENvbXB1dGVFbnZpcm9ubWVudFByb3BzXG4gIGV4dGVuZHMgYmF0Y2guTWFuYWdlZEVjMkVjc0NvbXB1dGVFbnZpcm9ubWVudFByb3BzIHt9XG5cbi8qKlxuICogTmV1cm9ueCBiYXRjaCBjb25zdHJ1Y3QuXG4gKi9cbmV4cG9ydCBjbGFzcyBOZXVyb254QmF0Y2hDb21wdXRlRW52aXJvbm1lbnRcbiAgZXh0ZW5kcyBDb25zdHJ1Y3RcbiAgaW1wbGVtZW50cyBiYXRjaC5JQ29tcHV0ZUVudmlyb25tZW50XG57XG4gIHJlYWRvbmx5IGNvbXB1dGVFbnZpcm9ubWVudE5hbWU6IHN0cmluZztcbiAgcmVhZG9ubHkgY29tcHV0ZUVudmlyb25tZW50QXJuOiBzdHJpbmc7XG4gIHJlYWRvbmx5IHNlcnZpY2VSb2xlPzogSVJvbGUgfCB1bmRlZmluZWQ7XG4gIHJlYWRvbmx5IGVuYWJsZWQ6IGJvb2xlYW47XG4gIHJlYWRvbmx5IHN0YWNrOiBTdGFjaztcbiAgcmVhZG9ubHkgZW52OiBSZXNvdXJjZUVudmlyb25tZW50O1xuICByZWFkb25seSBpbnN0YW5jZVJvbGU6IElSb2xlO1xuICBnZXQgY29tcHV0ZUVudmlyb25tZW50UmVmKCk6IGJhdGNoLkNvbXB1dGVFbnZpcm9ubWVudFJlZmVyZW5jZSB7XG4gICAgcmV0dXJuIHsgY29tcHV0ZUVudmlyb25tZW50QXJuOiB0aGlzLmNvbXB1dGVFbnZpcm9ubWVudEFybiB9O1xuICB9XG4gIHByaXZhdGUgcmVhZG9ubHkgcmVzb3VyY2U6IGJhdGNoLk1hbmFnZWRFYzJFY3NDb21wdXRlRW52aXJvbm1lbnQ7XG4gIGNvbnN0cnVjdG9yKFxuICAgIHNjb3BlOiBDb25zdHJ1Y3QsXG4gICAgaWQ6IHN0cmluZyxcbiAgICBwcm9wczogTmV1cm9ueEJhdGNoQ29tcHV0ZUVudmlyb25tZW50UHJvcHMsXG4gICkge1xuICAgIHN1cGVyKHNjb3BlLCBpZCk7XG5cbiAgICBjb25zdCBpbWFnZXMgPSBwcm9wcy5pbWFnZXMgPz8gW1xuICAgICAge1xuICAgICAgICBpbWFnZTogbmV3IE5ldXJvbk9wdGltaXplZE1hY2hpbmVJbWFnZShcbiAgICAgICAgICB0aGlzLFxuICAgICAgICAgIFwiTmV1cm9uT3B0aW1pemVkTWFjaGluZUltYWdlXCIsXG4gICAgICAgICksXG4gICAgICAgIGltYWdlVHlwZTogYmF0Y2guRWNzTWFjaGluZUltYWdlVHlwZS5FQ1NfQUwyMDIzLFxuICAgICAgfSxcbiAgICBdO1xuICAgIHRoaXMucmVzb3VyY2UgPSBuZXcgYmF0Y2guTWFuYWdlZEVjMkVjc0NvbXB1dGVFbnZpcm9ubWVudChcbiAgICAgIHRoaXMsXG4gICAgICBcIlJlc291cmNlXCIsXG4gICAgICB7XG4gICAgICAgIC4uLnByb3BzLFxuICAgICAgICBpbWFnZXMsXG4gICAgICB9LFxuICAgICk7XG4gICAgaWYgKFxuICAgICAgcHJvcHMubGF1bmNoVGVtcGxhdGUgJiZcbiAgICAgIHByb3BzLmxhdW5jaFRlbXBsYXRlIGluc3RhbmNlb2YgTGF1bmNoVGVtcGxhdGVcbiAgICApIHtcbiAgICAgIChcbiAgICAgICAgdGhpcy5yZXNvdXJjZS5ub2RlLmRlZmF1bHRDaGlsZCBhcyBiYXRjaC5DZm5Db21wdXRlRW52aXJvbm1lbnRcbiAgICAgICkuYWRkUHJvcGVydHlPdmVycmlkZShcbiAgICAgICAgXCJDb21wdXRlUmVzb3VyY2VzLkxhdW5jaFRlbXBsYXRlLlZlcnNpb25cIixcbiAgICAgICAgcHJvcHMubGF1bmNoVGVtcGxhdGUubGF0ZXN0VmVyc2lvbk51bWJlcixcbiAgICAgICk7XG4gICAgfVxuXG4gICAgdGhpcy5jb21wdXRlRW52aXJvbm1lbnRBcm4gPSB0aGlzLnJlc291cmNlLmNvbXB1dGVFbnZpcm9ubWVudEFybjtcbiAgICB0aGlzLmNvbXB1dGVFbnZpcm9ubWVudE5hbWUgPSB0aGlzLnJlc291cmNlLmNvbXB1dGVFbnZpcm9ubWVudE5hbWU7XG4gICAgdGhpcy5lbmFibGVkID0gdGhpcy5yZXNvdXJjZS5lbmFibGVkO1xuICAgIHRoaXMuZW52ID0gdGhpcy5yZXNvdXJjZS5lbnY7XG4gICAgdGhpcy5zZXJ2aWNlUm9sZSA9IHRoaXMucmVzb3VyY2Uuc2VydmljZVJvbGU7XG4gICAgdGhpcy5zdGFjayA9IHRoaXMucmVzb3VyY2Uuc3RhY2s7XG4gICAgdGhpcy5pbnN0YW5jZVJvbGUgPSB0aGlzLnJlc291cmNlLmluc3RhbmNlUm9sZSE7XG4gIH1cbiAgYXBwbHlSZW1vdmFsUG9saWN5KHBvbGljeTogUmVtb3ZhbFBvbGljeSk6IHZvaWQge1xuICAgIHRoaXMucmVzb3VyY2UuYXBwbHlSZW1vdmFsUG9saWN5KHBvbGljeSk7XG4gIH1cbn1cbiJdfQ==
@@ -58,5 +58,5 @@ class NeuronxBatchEcsJobDefinition extends constructs_1.Construct {
58
58
  }
59
59
  exports.NeuronxBatchEcsJobDefinition = NeuronxBatchEcsJobDefinition;
60
60
  _a = JSII_RTTI_SYMBOL_1;
61
- NeuronxBatchEcsJobDefinition[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxBatchEcsJobDefinition", version: "0.2.1" };
61
+ NeuronxBatchEcsJobDefinition[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxBatchEcsJobDefinition", version: "0.3.0" };
62
62
  //# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoibmV1cm9ueC1iYXRjaC1lY3Mtam9iLWRlZmluaXRpb24uanMiLCJzb3VyY2VSb290IjoiIiwic291cmNlcyI6WyIuLi8uLi8uLi9zcmMvYmFzZS9hd3MtYmF0Y2gvbmV1cm9ueC1iYXRjaC1lY3Mtam9iLWRlZmluaXRpb24udHMiXSwibmFtZXMiOltdLCJtYXBwaW5ncyI6Ijs7Ozs7QUFNQSwrQ0FBK0M7QUFFL0MsMkNBQXVDO0FBV3ZDOztHQUVHO0FBQ0gsTUFBYSw0QkFDWCxTQUFRLHNCQUFTO0lBWWpCLElBQUksZ0JBQWdCO1FBQ2xCLE9BQU8sRUFBRSxnQkFBZ0IsRUFBRSxJQUFJLENBQUMsZ0JBQWdCLEVBQUUsQ0FBQztJQUNyRCxDQUFDO0lBRUQsWUFDRSxLQUFnQixFQUNoQixFQUFVLEVBQ1YsS0FBd0M7UUFFeEMsS0FBSyxDQUFDLEtBQUssRUFBRSxFQUFFLENBQUMsQ0FBQztRQUNqQixNQUFNLGVBQWUsR0FDbkIsS0FBSyxDQUFDLGVBQWU7WUFDckIsSUFBSSxLQUFLLENBQUMsZUFBZSxDQUFDLElBQUksRUFBRSxpQkFBaUIsQ0FBQyxDQUFDO1FBQ3JELGVBQWUsQ0FBQyxVQUFVLENBQ3hCLEdBQUcsS0FBSyxDQUFDLElBQUksQ0FBQztZQUNaLE1BQU0sRUFBRSxLQUFLLENBQUMsbUJBQW1CLENBQUMsZ0JBQWdCLENBQUMsS0FBSztTQUN6RCxDQUFDLENBQUMsR0FBRyxDQUFDLENBQUMsQ0FBQyxFQUFFLEtBQUssRUFBRSxFQUFFLENBQUMsQ0FBQztZQUNwQixRQUFRLEVBQUUsY0FBYyxLQUFLLEVBQUU7WUFDL0IsYUFBYSxFQUFFLGNBQWMsS0FBSyxFQUFFO1lBQ3BDLFdBQVcsRUFBRTtnQkFDWCxLQUFLLENBQUMsZ0JBQWdCLENBQUMsSUFBSTtnQkFDM0IsS0FBSyxDQUFDLGdCQUFnQixDQUFDLEtBQUs7YUFDN0I7U0FDRixDQUFDLENBQUMsQ0FDSixDQUFDO1FBQ0YsSUFBSSxDQUFDLFFBQVEsR0FBRyxJQUFJLEtBQUssQ0FBQyxnQkFBZ0IsQ0FBQyxJQUFJLEVBQUUsVUFBVSxFQUFFO1lBQzNELEdBQUcsS0FBSztZQUNSLFNBQVMsRUFBRSxJQUFJLEtBQUssQ0FBQyx5QkFBeUIsQ0FDNUMsSUFBSSxFQUNKLHFCQUFxQixFQUNyQjtnQkFDRSxHQUFHLEtBQUs7Z0JBQ1IsZUFBZTthQUNoQixDQUNGO1NBQ0YsQ0FBQyxDQUFDO1FBQ0gsSUFBSSxDQUFDLGdCQUFnQixHQUFHLElBQUksQ0FBQyxRQUFRLENBQUMsZ0JBQWdCLENBQUM7UUFDdkQsSUFBSSxDQUFDLGlCQUFpQixHQUFHLElBQUksQ0FBQyxRQUFRLENBQUMsaUJBQWlCLENBQUM7UUFDekQsSUFBSSxDQUFDLFVBQVUsR0FBRyxJQUFJLENBQUMsUUFBUSxDQUFDLFVBQVUsQ0FBQztRQUMzQyxJQUFJLENBQUMsYUFBYSxHQUFHLElBQUksQ0FBQyxRQUFRLENBQUMsYUFBYSxDQUFDO1FBQ2pELElBQUksQ0FBQyxlQUFlLEdBQUcsSUFBSSxDQUFDLFFBQVEsQ0FBQyxlQUFlLENBQUM7UUFDckQsSUFBSSxDQUFDLGtCQUFrQixHQUFHLElBQUksQ0FBQyxRQUFRLENBQUMsa0JBQWtCLENBQUM7UUFDM0QsSUFBSSxDQUFDLE9BQU8sR0FBRyxJQUFJLENBQUMsUUFBUSxDQUFDLE9BQU8sQ0FBQztRQUNyQyxJQUFJLENBQUMsS0FBSyxHQUFHLElBQUksQ0FBQyxRQUFRLENBQUMsS0FBSyxDQUFDO1FBQ2pDLElBQUksQ0FBQyxHQUFHLEdBQUcsSUFBSSxDQUFDLFFBQVEsQ0FBQyxHQUFHLENBQUM7SUFDL0IsQ0FBQztJQUNELGtCQUFrQixDQUFDLE1BQXFCO1FBQ3RDLElBQUksQ0FBQyxRQUFRLENBQUMsa0JBQWtCLENBQUMsTUFBTSxDQUFDLENBQUM7SUFDM0MsQ0FBQztJQUNELGdCQUFnQixDQUFDLFFBQTZCO1FBQzVDLElBQUksQ0FBQyxRQUFRLENBQUMsZ0JBQWdCLENBQUMsUUFBUSxDQUFDLENBQUM7SUFDM0MsQ0FBQztJQUNEOztPQUVHO0lBQ0gsY0FBYyxDQUFDLFFBQW9CLEVBQUUsS0FBc0I7UUFDekQsSUFBSSxDQUFDLFFBQVEsQ0FBQyxjQUFjLENBQUMsUUFBUSxFQUFFLEtBQUssQ0FBQyxDQUFDO0lBQ2hELENBQUM7O0FBdEVILG9FQXVFQyIsInNvdXJjZXNDb250ZW50IjpbImltcG9ydCB7XG4gIER1cmF0aW9uLFxuICBSZW1vdmFsUG9saWN5LFxuICBSZXNvdXJjZUVudmlyb25tZW50LFxuICBTdGFjayxcbn0gZnJvbSBcImF3cy1jZGstbGliXCI7XG5pbXBvcnQgKiBhcyBiYXRjaCBmcm9tIFwiYXdzLWNkay1saWIvYXdzLWJhdGNoXCI7XG5pbXBvcnQgeyBJR3JhbnRhYmxlIH0gZnJvbSBcImF3cy1jZGstbGliL2F3cy1pYW1cIjtcbmltcG9ydCB7IENvbnN0cnVjdCB9IGZyb20gXCJjb25zdHJ1Y3RzXCI7XG5pbXBvcnQgeyBJTmV1cm9ueEluc3RhbmNlVHlwZSB9IGZyb20gXCIuLi9uZXVyb254XCI7XG5cbi8qKlxuICogUHJvcHMgb2YgTmV1cm9ueEJhdGNoLlxuICovXG5leHBvcnQgaW50ZXJmYWNlIE5ldXJvbnhCYXRjaEVjc0pvYkRlZmluaXRpb25Qcm9wc1xuICBleHRlbmRzIGJhdGNoLkVjc0VjMkNvbnRhaW5lckRlZmluaXRpb25Qcm9wcywgYmF0Y2guSm9iRGVmaW5pdGlvblByb3BzIHtcbiAgcmVhZG9ubHkgbmV1cm9ueEluc3RhbmNlVHlwZTogSU5ldXJvbnhJbnN0YW5jZVR5cGU7XG59XG5cbi8qKlxuICogTmV1cm9ueCBiYXRjaCBjb25zdHJ1Y3QuXG4gKi9cbmV4cG9ydCBjbGFzcyBOZXVyb254QmF0Y2hFY3NKb2JEZWZpbml0aW9uXG4gIGV4dGVuZHMgQ29uc3RydWN0XG4gIGltcGxlbWVudHMgYmF0Y2guSUpvYkRlZmluaXRpb25cbntcbiAgcmVhZG9ubHkgam9iRGVmaW5pdGlvbkFybjogc3RyaW5nO1xuICByZWFkb25seSBqb2JEZWZpbml0aW9uTmFtZTogc3RyaW5nO1xuICByZWFkb25seSBwYXJhbWV0ZXJzPzogeyBba2V5OiBzdHJpbmddOiBhbnkgfTtcbiAgcmVhZG9ubHkgcmV0cnlBdHRlbXB0cz86IG51bWJlcjtcbiAgcmVhZG9ubHkgcmV0cnlTdHJhdGVnaWVzOiBiYXRjaC5SZXRyeVN0cmF0ZWd5W107XG4gIHJlYWRvbmx5IHNjaGVkdWxpbmdQcmlvcml0eT86IG51bWJlcjtcbiAgcmVhZG9ubHkgdGltZW91dD86IER1cmF0aW9uO1xuICByZWFkb25seSBzdGFjazogU3RhY2s7XG4gIHJlYWRvbmx5IGVudjogUmVzb3VyY2VFbnZpcm9ubWVudDtcbiAgZ2V0IGpvYkRlZmluaXRpb25SZWYoKTogYmF0Y2guSm9iRGVmaW5pdGlvblJlZmVyZW5jZSB7XG4gICAgcmV0dXJuIHsgam9iRGVmaW5pdGlvbkFybjogdGhpcy5qb2JEZWZpbml0aW9uQXJuIH07XG4gIH1cbiAgcHJpdmF0ZSByZWFkb25seSByZXNvdXJjZTogYmF0Y2guRWNzSm9iRGVmaW5pdGlvbjtcbiAgY29uc3RydWN0b3IoXG4gICAgc2NvcGU6IENvbnN0cnVjdCxcbiAgICBpZDogc3RyaW5nLFxuICAgIHByb3BzOiBOZXVyb254QmF0Y2hFY3NKb2JEZWZpbml0aW9uUHJvcHMsXG4gICkge1xuICAgIHN1cGVyKHNjb3BlLCBpZCk7XG4gICAgY29uc3QgbGludXhQYXJhbWV0ZXJzID1cbiAgICAgIHByb3BzLmxpbnV4UGFyYW1ldGVycyA/P1xuICAgICAgbmV3IGJhdGNoLkxpbnV4UGFyYW1ldGVycyh0aGlzLCBcIkxpbnV4UGFyYW1ldGVyc1wiKTtcbiAgICBsaW51eFBhcmFtZXRlcnMuYWRkRGV2aWNlcyhcbiAgICAgIC4uLkFycmF5LmZyb20oe1xuICAgICAgICBsZW5ndGg6IHByb3BzLm5ldXJvbnhJbnN0YW5jZVR5cGUuYWNjZWxlcmF0b3JDaGlwcy5jaGlwcyxcbiAgICAgIH0pLm1hcCgoXywgaW5kZXgpID0+ICh7XG4gICAgICAgIGhvc3RQYXRoOiBgL2Rldi9uZXVyb24ke2luZGV4fWAsXG4gICAgICAgIGNvbnRhaW5lclBhdGg6IGAvZGV2L25ldXJvbiR7aW5kZXh9YCxcbiAgICAgICAgcGVybWlzc2lvbnM6IFtcbiAgICAgICAgICBiYXRjaC5EZXZpY2VQZXJtaXNzaW9uLlJFQUQsXG4gICAgICAgICAgYmF0Y2guRGV2aWNlUGVybWlzc2lvbi5XUklURSxcbiAgICAgICAgXSxcbiAgICAgIH0pKSxcbiAgICApO1xuICAgIHRoaXMucmVzb3VyY2UgPSBuZXcgYmF0Y2guRWNzSm9iRGVmaW5pdGlvbih0aGlzLCBcIlJlc291cmNlXCIsIHtcbiAgICAgIC4uLnByb3BzLFxuICAgICAgY29udGFpbmVyOiBuZXcgYmF0Y2guRWNzRWMyQ29udGFpbmVyRGVmaW5pdGlvbihcbiAgICAgICAgdGhpcyxcbiAgICAgICAgXCJDb250YWluZXJEZWZpbml0aW9uXCIsXG4gICAgICAgIHtcbiAgICAgICAgICAuLi5wcm9wcyxcbiAgICAgICAgICBsaW51eFBhcmFtZXRlcnMsXG4gICAgICAgIH0sXG4gICAgICApLFxuICAgIH0pO1xuICAgIHRoaXMuam9iRGVmaW5pdGlvbkFybiA9IHRoaXMucmVzb3VyY2Uuam9iRGVmaW5pdGlvbkFybjtcbiAgICB0aGlzLmpvYkRlZmluaXRpb25OYW1lID0gdGhpcy5yZXNvdXJjZS5qb2JEZWZpbml0aW9uTmFtZTtcbiAgICB0aGlzLnBhcmFtZXRlcnMgPSB0aGlzLnJlc291cmNlLnBhcmFtZXRlcnM7XG4gICAgdGhpcy5yZXRyeUF0dGVtcHRzID0gdGhpcy5yZXNvdXJjZS5yZXRyeUF0dGVtcHRzO1xuICAgIHRoaXMucmV0cnlTdHJhdGVnaWVzID0gdGhpcy5yZXNvdXJjZS5yZXRyeVN0cmF0ZWdpZXM7XG4gICAgdGhpcy5zY2hlZHVsaW5nUHJpb3JpdHkgPSB0aGlzLnJlc291cmNlLnNjaGVkdWxpbmdQcmlvcml0eTtcbiAgICB0aGlzLnRpbWVvdXQgPSB0aGlzLnJlc291cmNlLnRpbWVvdXQ7XG4gICAgdGhpcy5zdGFjayA9IHRoaXMucmVzb3VyY2Uuc3RhY2s7XG4gICAgdGhpcy5lbnYgPSB0aGlzLnJlc291cmNlLmVudjtcbiAgfVxuICBhcHBseVJlbW92YWxQb2xpY3kocG9saWN5OiBSZW1vdmFsUG9saWN5KTogdm9pZCB7XG4gICAgdGhpcy5yZXNvdXJjZS5hcHBseVJlbW92YWxQb2xpY3kocG9saWN5KTtcbiAgfVxuICBhZGRSZXRyeVN0cmF0ZWd5KHN0cmF0ZWd5OiBiYXRjaC5SZXRyeVN0cmF0ZWd5KTogdm9pZCB7XG4gICAgdGhpcy5yZXNvdXJjZS5hZGRSZXRyeVN0cmF0ZWd5KHN0cmF0ZWd5KTtcbiAgfVxuICAvKipcbiAgICogR3JhbnRzIHRoZSBgYmF0Y2g6c3VibWl0Sm9iYCBwZXJtaXNzaW9uIHRvIHRoZSBpZGVudGl0eSBvbiBib3RoIHRoaXMgam9iIGRlZmluaXRpb24gYW5kIHRoZSBgcXVldWVgXG4gICAqL1xuICBncmFudFN1Ym1pdEpvYihpZGVudGl0eTogSUdyYW50YWJsZSwgcXVldWU6IGJhdGNoLklKb2JRdWV1ZSk6IHZvaWQge1xuICAgIHRoaXMucmVzb3VyY2UuZ3JhbnRTdWJtaXRKb2IoaWRlbnRpdHksIHF1ZXVlKTtcbiAgfVxufVxuIl19
@@ -58,5 +58,5 @@ class NeuronxBatch extends constructs_1.Construct {
58
58
  }
59
59
  exports.NeuronxBatch = NeuronxBatch;
60
60
  _a = JSII_RTTI_SYMBOL_1;
61
- NeuronxBatch[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxBatch", version: "0.2.1" };
61
+ NeuronxBatch[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxBatch", version: "0.3.0" };
62
62
  //# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoibmV1cm9ueC1iYXRjaC5qcyIsInNvdXJjZVJvb3QiOiIiLCJzb3VyY2VzIjpbIi4uLy4uLy4uL3NyYy9iYXNlL2F3cy1iYXRjaC9uZXVyb254LWJhdGNoLnRzIl0sIm5hbWVzIjpbXSwibWFwcGluZ3MiOiI7Ozs7O0FBQ0EsK0NBQStDO0FBQy9DLDJDQUEyQztBQUMzQywyQ0FBdUM7QUFDdkMsd0NBQStFO0FBb0MvRTs7R0FFRztBQUNILE1BQWEsWUFBYSxTQUFRLHNCQUFTO0lBR3pDLFlBQVksS0FBZ0IsRUFBRSxFQUFVLEVBQUUsS0FBd0I7UUFDaEUsS0FBSyxDQUFDLEtBQUssRUFBRSxFQUFFLENBQUMsQ0FBQztRQUNqQixNQUFNLGNBQWMsR0FBRyxJQUFJLEdBQUcsQ0FBQyxjQUFjLENBQUMsSUFBSSxFQUFFLGdCQUFnQixFQUFFO1lBQ3BFLFlBQVksRUFBRTtnQkFDWjtvQkFDRSxVQUFVLEVBQUUsV0FBVztvQkFDdkIsTUFBTSxFQUFFLEdBQUcsQ0FBQyxpQkFBaUIsQ0FBQyxHQUFHLENBQUMsS0FBSyxDQUFDLFVBQVUsQ0FBQyxXQUFXLEVBQUUsQ0FBQztpQkFDbEU7YUFDRjtTQUNGLENBQUMsQ0FBQztRQUNILElBQUksQ0FBQyxrQkFBa0IsR0FBRyxJQUFJLEtBQUssQ0FBQywrQkFBK0IsQ0FDakUsSUFBSSxFQUNKLG9CQUFvQixFQUNwQjtZQUNFLEdBQUcsRUFBRSxLQUFLLENBQUMsR0FBRztZQUNkLFVBQVUsRUFBRSxLQUFLLENBQUMsVUFBVTtZQUM1QixhQUFhLEVBQUUsQ0FBQyxLQUFLLENBQUMsbUJBQW1CLENBQUMsWUFBWSxDQUFDO1lBQ3ZELHlCQUF5QixFQUFFLEtBQUs7WUFDaEMsTUFBTSxFQUFFO2dCQUNOO29CQUNFLEtBQUssRUFBRSxJQUFJLHFDQUEyQixDQUFDLElBQUksRUFBRSxhQUFhLENBQUM7b0JBQzNELFNBQVMsRUFBRSxLQUFLLENBQUMsbUJBQW1CLENBQUMsVUFBVTtpQkFDaEQ7YUFDRjtZQUNELGNBQWM7WUFDZCxJQUFJLEVBQUUsS0FBSyxDQUFDLElBQUk7U0FDakIsQ0FDRixDQUFDO1FBRUEsSUFBSSxDQUFDLGtCQUFrQixDQUFDLElBQUksQ0FBQyxZQUM5QixDQUFDLG1CQUFtQixDQUNuQix5Q0FBeUMsRUFDekMsY0FBYyxDQUFDLG1CQUFtQixDQUNuQyxDQUFDO1FBQ0YsTUFBTSxlQUFlLEdBQ25CLEtBQUssQ0FBQyxlQUFlO1lBQ3JCLElBQUksS0FBSyxDQUFDLGVBQWUsQ0FBQyxJQUFJLEVBQUUsaUJBQWlCLENBQUMsQ0FBQztRQUNyRCxlQUFlLENBQUMsVUFBVSxDQUN4QixHQUFHLEtBQUssQ0FBQyxJQUFJLENBQUM7WUFDWixNQUFNLEVBQUUsS0FBSyxDQUFDLG1CQUFtQixDQUFDLGdCQUFnQixDQUFDLEtBQUs7U0FDekQsQ0FBQyxDQUFDLEdBQUcsQ0FBQyxDQUFDLENBQUMsRUFBRSxLQUFLLEVBQUUsRUFBRSxDQUFDLENBQUM7WUFDcEIsUUFBUSxFQUFFLGNBQWMsS0FBSyxFQUFFO1lBQy9CLGFBQWEsRUFBRSxjQUFjLEtBQUssRUFBRTtZQUNwQyxXQUFXLEVBQUU7Z0JBQ1gsS0FBSyxDQUFDLGdCQUFnQixDQUFDLElBQUk7Z0JBQzNCLEtBQUssQ0FBQyxnQkFBZ0IsQ0FBQyxLQUFLO2FBQzdCO1NBQ0YsQ0FBQyxDQUFDLENBQ0osQ0FBQztRQUNGLElBQUksQ0FBQyxhQUFhLEdBQUcsSUFBSSxLQUFLLENBQUMsZ0JBQWdCLENBQUMsSUFBSSxFQUFFLGVBQWUsRUFBRTtZQUNyRSxTQUFTLEVBQUUsSUFBSSxLQUFLLENBQUMseUJBQXlCLENBQzVDLElBQUksRUFDSixxQkFBcUIsRUFDckI7Z0JBQ0UsR0FBRyxLQUFLO2dCQUNSLGVBQWU7YUFDaEIsQ0FDRjtTQUNGLENBQUMsQ0FBQztJQUNMLENBQUM7O0FBOURILG9DQStEQyIsInNvdXJjZXNDb250ZW50IjpbImltcG9ydCB7IFNpemUgfSBmcm9tIFwiYXdzLWNkay1saWJcIjtcbmltcG9ydCAqIGFzIGJhdGNoIGZyb20gXCJhd3MtY2RrLWxpYi9hd3MtYmF0Y2hcIjtcbmltcG9ydCAqIGFzIGVjMiBmcm9tIFwiYXdzLWNkay1saWIvYXdzLWVjMlwiO1xuaW1wb3J0IHsgQ29uc3RydWN0IH0gZnJvbSBcImNvbnN0cnVjdHNcIjtcbmltcG9ydCB7IElOZXVyb254SW5zdGFuY2VUeXBlLCBOZXVyb25PcHRpbWl6ZWRNYWNoaW5lSW1hZ2UgfSBmcm9tIFwiLi4vbmV1cm9ueFwiO1xuXG4vKipcbiAqIFByb3BzIG9mIE5ldXJvbnhCYXRjaC5cbiAqL1xuZXhwb3J0IGludGVyZmFjZSBOZXVyb254QmF0Y2hQcm9wc1xuICBleHRlbmRzIGJhdGNoLkVjc0VjMkNvbnRhaW5lckRlZmluaXRpb25Qcm9wcyB7XG4gIC8qKlxuICAgKiBWUEMgaW4gd2hpY2ggdGhpcyB3aWxsIGxhdW5jaCB3b3JrZXIgaW5zdGFuY2UuXG4gICAqL1xuICByZWFkb25seSB2cGM6IGVjMi5JVnBjO1xuICAvKipcbiAgICogVGhlIGluc3RhbmNlIHR5cGUgb2Ygd29ya2VyIGluc3RhbmNlLlxuICAgKi9cbiAgcmVhZG9ubHkgbmV1cm9ueEluc3RhbmNlVHlwZTogSU5ldXJvbnhJbnN0YW5jZVR5cGU7XG4gIC8qKlxuICAgKiBUaGUgcm9vdCB2b2x1bWUgb2Ygd29ya2VyIGluc3RhbmNlLlxuICAgKiBAZGVmYXVsdCAtIE4gYmlsaW9uIHBhcmFtZXRlcnMgKiA1R2lCIEVCU1xuICAgKi9cbiAgcmVhZG9ubHkgdm9sdW1lU2l6ZTogU2l6ZTtcbiAgLyoqXG4gICAqIFdoZXRoZXIgb3Igbm90IHRvIHVzZSBzcG90IGluc3RhbmNlcy5cbiAgICogU3BvdCBpbnN0YW5jZXMgYXJlIGxlc3MgZXhwZW5zaXZlIEVDMiBpbnN0YW5jZXMgdGhhdCBjYW4gYmUgcmVjbGFpbWVkIGJ5IEVDMiBhdCBhbnkgdGltZTtcbiAgICogeW91ciBqb2Igd2lsbCBiZSBnaXZlbiB0d28gbWludXRlcyBvZiBub3RpY2UgYmVmb3JlIHJlY2xhbWF0aW9uLlxuICAgKlxuICAgKiBAZGVmYXVsdCBmYWxzZVxuICAgKi9cbiAgcmVhZG9ubHkgc3BvdD86IGJvb2xlYW47XG4gIC8qKlxuICAgKiBUaGUgVlBDIFN1Ym5ldHMgdGhpcyBDb21wdXRlIEVudmlyb25tZW50IHdpbGwgbGF1bmNoIGluc3RhbmNlcyBpbi5cbiAgICpcbiAgICogQGRlZmF1bHQgLSBuZXcgc3VibmV0cyB3aWxsIGJlIGNyZWF0ZWRcbiAgICovXG4gIHJlYWRvbmx5IHZwY1N1Ym5ldHM/OiBlYzIuU3VibmV0U2VsZWN0aW9uO1xufVxuXG4vKipcbiAqIE5ldXJvbnggYmF0Y2ggY29uc3RydWN0LlxuICovXG5leHBvcnQgY2xhc3MgTmV1cm9ueEJhdGNoIGV4dGVuZHMgQ29uc3RydWN0IHtcbiAgcmVhZG9ubHkgY29tcHV0ZUVudmlyb25tZW50OiBiYXRjaC5NYW5hZ2VkRWMyRWNzQ29tcHV0ZUVudmlyb25tZW50O1xuICByZWFkb25seSBqb2JEZWZpbml0aW9uOiBiYXRjaC5FY3NKb2JEZWZpbml0aW9uO1xuICBjb25zdHJ1Y3RvcihzY29wZTogQ29uc3RydWN0LCBpZDogc3RyaW5nLCBwcm9wczogTmV1cm9ueEJhdGNoUHJvcHMpIHtcbiAgICBzdXBlcihzY29wZSwgaWQpO1xuICAgIGNvbnN0IGxhdW5jaFRlbXBsYXRlID0gbmV3IGVjMi5MYXVuY2hUZW1wbGF0ZSh0aGlzLCBcIkxhdW5jaFRlbXBsYXRlXCIsIHtcbiAgICAgIGJsb2NrRGV2aWNlczogW1xuICAgICAgICB7XG4gICAgICAgICAgZGV2aWNlTmFtZTogXCIvZGV2L3h2ZGFcIixcbiAgICAgICAgICB2b2x1bWU6IGVjMi5CbG9ja0RldmljZVZvbHVtZS5lYnMocHJvcHMudm9sdW1lU2l6ZS50b0dpYmlieXRlcygpKSxcbiAgICAgICAgfSxcbiAgICAgIF0sXG4gICAgfSk7XG4gICAgdGhpcy5jb21wdXRlRW52aXJvbm1lbnQgPSBuZXcgYmF0Y2guTWFuYWdlZEVjMkVjc0NvbXB1dGVFbnZpcm9ubWVudChcbiAgICAgIHRoaXMsXG4gICAgICBcIkNvbXB1dGVFbnZpcm9ubWVudFwiLFxuICAgICAge1xuICAgICAgICB2cGM6IHByb3BzLnZwYyxcbiAgICAgICAgdnBjU3VibmV0czogcHJvcHMudnBjU3VibmV0cyxcbiAgICAgICAgaW5zdGFuY2VUeXBlczogW3Byb3BzLm5ldXJvbnhJbnN0YW5jZVR5cGUuaW5zdGFuY2VUeXBlXSxcbiAgICAgICAgdXNlT3B0aW1hbEluc3RhbmNlQ2xhc3NlczogZmFsc2UsXG4gICAgICAgIGltYWdlczogW1xuICAgICAgICAgIHtcbiAgICAgICAgICAgIGltYWdlOiBuZXcgTmV1cm9uT3B0aW1pemVkTWFjaGluZUltYWdlKHRoaXMsIFwiTWFjaGluSW1hZ2VcIiksXG4gICAgICAgICAgICBpbWFnZVR5cGU6IGJhdGNoLkVjc01hY2hpbmVJbWFnZVR5cGUuRUNTX0FMMjAyMyxcbiAgICAgICAgICB9LFxuICAgICAgICBdLFxuICAgICAgICBsYXVuY2hUZW1wbGF0ZSxcbiAgICAgICAgc3BvdDogcHJvcHMuc3BvdCxcbiAgICAgIH0sXG4gICAgKTtcbiAgICAoXG4gICAgICB0aGlzLmNvbXB1dGVFbnZpcm9ubWVudC5ub2RlLmRlZmF1bHRDaGlsZCBhcyBiYXRjaC5DZm5Db21wdXRlRW52aXJvbm1lbnRcbiAgICApLmFkZFByb3BlcnR5T3ZlcnJpZGUoXG4gICAgICBcIkNvbXB1dGVSZXNvdXJjZXMuTGF1bmNoVGVtcGxhdGUuVmVyc2lvblwiLFxuICAgICAgbGF1bmNoVGVtcGxhdGUubGF0ZXN0VmVyc2lvbk51bWJlcixcbiAgICApO1xuICAgIGNvbnN0IGxpbnV4UGFyYW1ldGVycyA9XG4gICAgICBwcm9wcy5saW51eFBhcmFtZXRlcnMgPz9cbiAgICAgIG5ldyBiYXRjaC5MaW51eFBhcmFtZXRlcnModGhpcywgXCJMaW51eFBhcmFtZXRlcnNcIik7XG4gICAgbGludXhQYXJhbWV0ZXJzLmFkZERldmljZXMoXG4gICAgICAuLi5BcnJheS5mcm9tKHtcbiAgICAgICAgbGVuZ3RoOiBwcm9wcy5uZXVyb254SW5zdGFuY2VUeXBlLmFjY2VsZXJhdG9yQ2hpcHMuY2hpcHMsXG4gICAgICB9KS5tYXAoKF8sIGluZGV4KSA9PiAoe1xuICAgICAgICBob3N0UGF0aDogYC9kZXYvbmV1cm9uJHtpbmRleH1gLFxuICAgICAgICBjb250YWluZXJQYXRoOiBgL2Rldi9uZXVyb24ke2luZGV4fWAsXG4gICAgICAgIHBlcm1pc3Npb25zOiBbXG4gICAgICAgICAgYmF0Y2guRGV2aWNlUGVybWlzc2lvbi5SRUFELFxuICAgICAgICAgIGJhdGNoLkRldmljZVBlcm1pc3Npb24uV1JJVEUsXG4gICAgICAgIF0sXG4gICAgICB9KSksXG4gICAgKTtcbiAgICB0aGlzLmpvYkRlZmluaXRpb24gPSBuZXcgYmF0Y2guRWNzSm9iRGVmaW5pdGlvbih0aGlzLCBcIkpvYkRlZmluaXRpb25cIiwge1xuICAgICAgY29udGFpbmVyOiBuZXcgYmF0Y2guRWNzRWMyQ29udGFpbmVyRGVmaW5pdGlvbihcbiAgICAgICAgdGhpcyxcbiAgICAgICAgXCJDb250YWluZXJEZWZpbml0aW9uXCIsXG4gICAgICAgIHtcbiAgICAgICAgICAuLi5wcm9wcyxcbiAgICAgICAgICBsaW51eFBhcmFtZXRlcnMsXG4gICAgICAgIH0sXG4gICAgICApLFxuICAgIH0pO1xuICB9XG59XG4iXX0=
@@ -11,7 +11,7 @@ const aws_ecs_patterns_1 = require("aws-cdk-lib/aws-ecs-patterns");
11
11
  const neuronx_1 = require("../neuronx");
12
12
  class NeuronxTaskDefinition extends ecs.Ec2TaskDefinition {
13
13
  constructor(scope, id, props) {
14
- const neuronxInstanceType = props.neuronxInstanceType ?? props.compiledModel.compileTimeInstanceType;
14
+ const neuronxInstanceType = props.neuronxInstanceType ?? props.compiledModel.recommendedInstanceType;
15
15
  const tensorParallelSize = props.tensorParallelSize ?? 1;
16
16
  const tasksPerInstance = Math.floor(neuronxInstanceType.acceleratorChips.neuronxCores / tensorParallelSize);
17
17
  const placementConstraints = tasksPerInstance >= 2
@@ -63,7 +63,7 @@ class NeuronxTaskDefinition extends ecs.Ec2TaskDefinition {
63
63
  }
64
64
  exports.NeuronxTaskDefinition = NeuronxTaskDefinition;
65
65
  _a = JSII_RTTI_SYMBOL_1;
66
- NeuronxTaskDefinition[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxTaskDefinition", version: "0.2.1" };
66
+ NeuronxTaskDefinition[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronxTaskDefinition", version: "0.3.0" };
67
67
  class ApplicationLoadBalancedNeuronxService extends aws_ecs_patterns_1.ApplicationLoadBalancedEc2Service {
68
68
  constructor(scope, id, props) {
69
69
  const neuronxTaskDefinition = props.taskDefinition;
@@ -141,5 +141,5 @@ mount-s3 ${neuronxTaskDefinition.compiledModel.bucket.bucketName} /mnt/${neuronx
141
141
  }
142
142
  exports.ApplicationLoadBalancedNeuronxService = ApplicationLoadBalancedNeuronxService;
143
143
  _b = JSII_RTTI_SYMBOL_1;
144
- ApplicationLoadBalancedNeuronxService[_b] = { fqn: "aws-cdk-neuronx-patterns.ApplicationLoadBalancedNeuronxService", version: "0.2.1" };
145
- //# sourceMappingURL=data:application/json;base64,{"version":3,"file":"application-load-balanced-neuronx-service.js","sourceRoot":"","sources":["../../../src/base/aws-ecs-patterns/application-load-balanced-neuronx-service.ts"],"names":[],"mappings":";;;;;AAAA,6CAAuC;AACvC,iEAIqC;AACrC,iDAAqD;AACrD,2CAA2C;AAC3C,mEAGsC;AAEtC,wCAIoB;AA6BpB,MAAa,qBACX,SAAQ,GAAG,CAAC,iBAAiB;IAQ7B,YAAY,KAAgB,EAAE,EAAU,EAAE,KAAiC;QACzE,MAAM,mBAAmB,GACvB,KAAK,CAAC,mBAAmB,IAAI,KAAK,CAAC,aAAa,CAAC,uBAAuB,CAAC;QAC3E,MAAM,kBAAkB,GAAG,KAAK,CAAC,kBAAkB,IAAI,CAAC,CAAC;QACzD,MAAM,gBAAgB,GAAG,IAAI,CAAC,KAAK,CACjC,mBAAmB,CAAC,gBAAgB,CAAC,YAAY,GAAG,kBAAkB,CACvE,CAAC;QACF,MAAM,oBAAoB,GACxB,gBAAgB,IAAI,CAAC;YACnB,CAAC,CAAC;gBACE,GAAG,CAAC,mBAAmB,CAAC,QAAQ,CAC9B,qBAAqB,gBAAgB,EAAE,CACxC;aACF;YACH,CAAC,CAAC,EAAE,CAAC;QACT,KAAK,CAAC,KAAK,EAAE,EAAE,EAAE;YACf,GAAG,KAAK;YACR,oBAAoB,EAAE;gBACpB,GAAG,CAAC,KAAK,CAAC,oBAAoB,IAAI,EAAE,CAAC;gBACrC,GAAG,oBAAoB;aACxB;SACF,CAAC,CAAC;QACH,IAAI,CAAC,eAAe,GAAG,IAAI,GAAG,CAAC,eAAe,CAAC,IAAI,EAAE,iBAAiB,CAAC,CAAC;QACxE,IAAI,CAAC,eAAe,CAAC,UAAU,CAC7B,GAAG,KAAK,CAAC,IAAI,CAAC;YACZ,MAAM,EAAE,mBAAmB,EAAE,gBAAgB,CAAC,KAAK,IAAI,CAAC;SACzD,CAAC,CAAC,GAAG,CAAa,CAAC,CAAC,EAAE,KAAK,EAAE,EAAE,CAAC,CAAC;YAChC,QAAQ,EAAE,cAAc,KAAK,EAAE;YAC/B,aAAa,EAAE,cAAc,KAAK,EAAE;YACpC,WAAW,EAAE,CAAC,GAAG,CAAC,gBAAgB,CAAC,IAAI,EAAE,GAAG,CAAC,gBAAgB,CAAC,KAAK,CAAC;SACrE,CAAC,CAAC,CACJ,CAAC;QACF,IAAI,IAAI,CAAC,aAAa,EAAE,CAAC;YACvB,KAAK,CAAC,aAAa,CAAC,MAAM,CAAC,SAAS,CAAC,IAAI,CAAC,aAAa,CAAC,CAAC;QAC3D,CAAC;QACD,KAAK,CAAC,aAAa,CAAC,MAAM,CAAC,SAAS,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QACpD,IAAI,CAAC,aAAa,GAAG,KAAK,CAAC,aAAa,CAAC;QACzC,IAAI,CAAC,mBAAmB,GAAG,mBAAmB,CAAC;QAC/C,IAAI,CAAC,kBAAkB,GAAG,kBAAkB,CAAC;QAC7C,IAAI,CAAC,gBAAgB,GAAG,gBAAgB,CAAC;IAC3C,CAAC;IAED,uBAAuB,CACrB,EAAU,EACV,KAAqC;QAErC,MAAM,SAAS,GAAG,KAAK,CAAC,YAAY,CAAC,EAAE,EAAE;YACvC,OAAO,EAAE,GAAG,CAAC,SAAS,CAAC,OAAO,CAAC;gBAC7B,YAAY,EAAE,EAAE;aACjB,CAAC;YACF,eAAe,EAAE,IAAI,CAAC,eAAe;YACrC,oBAAoB,EAAE,IAAI,CAAC,IAAI,CAC7B,CAAC,IAAI,CAAC,mBAAmB,CAAC,MAAM,CAAC,WAAW,EAAE,GAAG,GAAG,CAAC;gBACnD,IAAI,CAAC,gBAAgB,CACxB;YACD,GAAG,KAAK;SACT,CAAC,CAAC;QACH,SAAS,CAAC,cAAc,CAAC;YACvB,YAAY,EAAE,OAAO;YACrB,aAAa,EAAE,eAAe;YAC9B,QAAQ,EAAE,KAAK;SAChB,CAAC,CAAC;QACH,OAAO,SAAS,CAAC;IACnB,CAAC;;AAxEH,sDAyEC;;;AAGD,MAAa,qCAAsC,SAAQ,oDAAiC;IAC1F,YACE,KAAgB,EAChB,EAAU,EACV,KAAiD;QAEjD,MAAM,qBAAqB,GAAG,KAAK,CAAC,cAAc,CAAC;QACnD,IACE,CAAC,qBAAqB;YACtB,CAAC,CAAC,qBAAqB,YAAY,qBAAqB,CAAC,EACzD,CAAC;YACD,MAAM,IAAI,KAAK,CAAC,kDAAkD,CAAC,CAAC;QACtE,CAAC;QACD,KAAK,CAAC,KAAK,EAAE,EAAE,EAAE;YACf,sBAAsB,EACpB,KAAK,CAAC,sBAAsB,IAAI,sBAAQ,CAAC,OAAO,CAAC,EAAE,CAAC;YACtD,GAAG,KAAK;SACT,CAAC,CAAC;QAEH,MAAM,OAAO,GAAG,IAAI,CAAC,iBAAiB,CAAC,IAAI,EAAE,KAAK,CAAC,GAAG,CAAC,CAAC;QAExD,sCAAsC;QACtC,MAAM,QAAQ,GAAG,kBAAQ,CAAC,QAAQ,EAAE,CAAC;QACrC,QAAQ,CAAC,WAAW,CAAC;;;;;;;;;;;;;;;;;;;;;;;uBAuBF,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU;WACjE,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU,SAAS,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU,+CAA+C,CAAC,CAAC;QAE3K,qBAAqB,CAAC,SAAS,CAAC;YAC9B,IAAI,EAAE,OAAO;YACb,IAAI,EAAE;gBACJ,UAAU,EAAE,QAAQ,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU,EAAE;aAC5E;SACF,CAAC,CAAC;QAEH,MAAM,UAAU,GAAG,IAAI,CAAC,IAAI,CAC1B,qCAA2B,CAAC,IAAI,CAAC,WAAW,EAAE;YAC5C,qCAA2B,CAAC,IAAI,CAAC,WAAW,EAAE,CACjD,CAAC;QACF,MAAM,eAAe,GAAG,IAAI,CAAC,IAAI,CAC/B,CAAC,KAAK,CAAC,YAAY,IAAI,CAAC,CAAC,GAAG,qBAAqB,CAAC,gBAAgB,CACnE,CAAC;QACF,MAAM,gBAAgB,GAAG,IAAI,kCAAgB,CAAC,IAAI,EAAE,kBAAkB,EAAE;YACtE,GAAG,EAAE,OAAO,CAAC,GAAG;YAChB,YAAY,EAAE,qBAAqB,CAAC,mBAAmB,CAAC,YAAY;YACpE,YAAY,EAAE,IAAI,qCAA2B,CAC3C,IAAI,EACJ,6BAA6B,CAC9B;YACD,YAAY,EAAE;gBACZ;oBACE,UAAU,EAAE,WAAW;oBACvB,MAAM,EAAE,mCAAiB,CAAC,GAAG,CAAC,UAAU,EAAE;wBACxC,UAAU,EAAE,qCAAmB,CAAC,GAAG;wBACnC,SAAS,EAAE,IAAI;qBAChB,CAAC;iBACH;aACF;YACD,QAAQ;YACR,eAAe;YACf,WAAW,EACT,qBAAqB,CAAC,gBAAgB,KAAK,CAAC;gBAC1C,CAAC,CAAC,eAAe,GAAG,CAAC;gBACrB,CAAC,CAAC,SAAS;SAChB,CAAC,CAAC;QACH,gBAAgB,CAAC,WAAW,CAAC,SAAS,CACpC,IAAI,CAAC,YAAY,EACjB,cAAI,CAAC,QAAQ,CAAC,KAAK,EAAE,KAAK,CAAC,CAC5B,CAAC;QACF,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,SAAS,CAAC,gBAAgB,CAAC,CAAC;QACvE,MAAM,QAAQ,GAAG,IAAI,GAAG,CAAC,mBAAmB,CAAC,IAAI,EAAE,qBAAqB,EAAE;YACxE,gBAAgB;SACjB,CAAC,CAAC;QACH,OAAO,CAAC,sBAAsB,CAAC,QAAQ,CAAC,CAAC;IAC3C,CAAC;;AA/FH,sFAgGC","sourcesContent":["import { Duration } from \"aws-cdk-lib\";\nimport {\n  AutoScalingGroup,\n  BlockDeviceVolume,\n  EbsDeviceVolumeType,\n} from \"aws-cdk-lib/aws-autoscaling\";\nimport { Port, UserData } from \"aws-cdk-lib/aws-ec2\";\nimport * as ecs from \"aws-cdk-lib/aws-ecs\";\nimport {\n  ApplicationLoadBalancedEc2Service,\n  ApplicationLoadBalancedEc2ServiceProps,\n} from \"aws-cdk-lib/aws-ecs-patterns\";\nimport { Construct } from \"constructs\";\nimport {\n  INeuronxInstanceType,\n  NeuronOptimizedMachineImage,\n  PytorchTrainingNeuronxImage,\n} from \"../neuronx\";\nimport { NeuronxCompiledModel } from \"../neuronx-compiler\";\n\nexport interface NeuronxTaskDefinitionPropsBase\n  extends ecs.Ec2TaskDefinitionProps {\n  /**\n   * The instance type of compile worker instance.\n   */\n  readonly neuronxInstanceType?: INeuronxInstanceType;\n  /**\n   * The number of tensor parallel size.\n   * @default - 1\n   */\n  readonly tensorParallelSize?: number;\n}\n\nexport interface NeuronxTaskDefinitionProps extends NeuronxTaskDefinitionPropsBase {\n  /**\n   * The model to be compiled.\n   */\n  readonly compiledModel: NeuronxCompiledModel;\n}\n\nexport interface INeuronxTaskDefinition extends ecs.IEc2TaskDefinition {\n  readonly neuronxInstanceType: INeuronxInstanceType;\n  readonly tensorParallelSize: number;\n  readonly tasksPerInstance: number;\n  readonly compiledModel: NeuronxCompiledModel;\n}\nexport class NeuronxTaskDefinition\n  extends ecs.Ec2TaskDefinition\n  implements INeuronxTaskDefinition\n{\n  readonly neuronxInstanceType: INeuronxInstanceType;\n  readonly tensorParallelSize: number;\n  readonly tasksPerInstance: number;\n  readonly compiledModel: NeuronxCompiledModel;\n  protected readonly linuxParameters: ecs.LinuxParameters;\n  constructor(scope: Construct, id: string, props: NeuronxTaskDefinitionProps) {\n    const neuronxInstanceType =\n      props.neuronxInstanceType ?? props.compiledModel.compileTimeInstanceType;\n    const tensorParallelSize = props.tensorParallelSize ?? 1;\n    const tasksPerInstance = Math.floor(\n      neuronxInstanceType.acceleratorChips.neuronxCores / tensorParallelSize,\n    );\n    const placementConstraints =\n      tasksPerInstance >= 2\n        ? [\n            ecs.PlacementConstraint.memberOf(\n              `runningTasksCount<${tasksPerInstance}`,\n            ),\n          ]\n        : [];\n    super(scope, id, {\n      ...props,\n      placementConstraints: [\n        ...(props.placementConstraints ?? []),\n        ...placementConstraints,\n      ],\n    });\n    this.linuxParameters = new ecs.LinuxParameters(this, \"LinuxParameters\");\n    this.linuxParameters.addDevices(\n      ...Array.from({\n        length: neuronxInstanceType?.acceleratorChips.chips ?? 1,\n      }).map<ecs.Device>((_, index) => ({\n        hostPath: `/dev/neuron${index}`,\n        containerPath: `/dev/neuron${index}`,\n        permissions: [ecs.DevicePermission.READ, ecs.DevicePermission.WRITE],\n      })),\n    );\n    if (this.executionRole) {\n      props.compiledModel.bucket.grantRead(this.executionRole);\n    }\n    props.compiledModel.bucket.grantRead(this.taskRole);\n    this.compiledModel = props.compiledModel;\n    this.neuronxInstanceType = neuronxInstanceType;\n    this.tensorParallelSize = tensorParallelSize;\n    this.tasksPerInstance = tasksPerInstance;\n  }\n\n  addContainerWithDefault(\n    id: string,\n    props: ecs.ContainerDefinitionOptions,\n  ): ecs.ContainerDefinition {\n    const container = super.addContainer(id, {\n      logging: ecs.LogDriver.awsLogs({\n        streamPrefix: id,\n      }),\n      linuxParameters: this.linuxParameters,\n      memoryReservationMiB: Math.ceil(\n        (this.neuronxInstanceType.memory.toMebibytes() * 0.8) /\n          this.tasksPerInstance,\n      ),\n      ...props,\n    });\n    container.addMountPoints({\n      sourceVolume: \"model\",\n      containerPath: \"/opt/ml/model\",\n      readOnly: false,\n    });\n    return container;\n  }\n}\n\nexport interface ApplicationLoadBalancedNeuronxServiceProps extends ApplicationLoadBalancedEc2ServiceProps {}\nexport class ApplicationLoadBalancedNeuronxService extends ApplicationLoadBalancedEc2Service {\n  constructor(\n    scope: Construct,\n    id: string,\n    props: ApplicationLoadBalancedNeuronxServiceProps,\n  ) {\n    const neuronxTaskDefinition = props.taskDefinition;\n    if (\n      !neuronxTaskDefinition ||\n      !(neuronxTaskDefinition instanceof NeuronxTaskDefinition)\n    ) {\n      throw new Error(\"taskDefinition must extend NeuronxTaskDefinition\");\n    }\n    super(scope, id, {\n      healthCheckGracePeriod:\n        props.healthCheckGracePeriod ?? Duration.minutes(15),\n      ...props,\n    });\n\n    const cluster = this.getDefaultCluster(this, props.vpc);\n\n    // install and mount mountpoint for s3\n    const userData = UserData.forLinux();\n    userData.addCommands(`\n#!/bin/bash -e\n\n# Install Mountpoint\nMP_RPM=$(mktemp --suffix=.rpm)\ncurl https://s3.amazonaws.com/mountpoint-s3-release/latest/x86_64/mount-s3.rpm > $MP_RPM\n\n# cloud-init installs conflict with SSM agent: https://github.com/amazonlinux/amazon-linux-2023/issues/397\nattempt=0\nmax_attempts=5\nuntil dnf install -y $MP_RPM; do\n    attempt=$((attempt + 1))\n    if [ $attempt -ge $max_attempts ]; then\n        echo \"Failed to install mount-s3 after $max_attempts attempts. Exiting.\"\n        exit 1\n    fi\n    echo \"dnf install mount-s3 failed (attempt $attempt/$max_attempts), retrying in 3 seconds...\"\n    sleep 3\ndone\n\nrm $MP_RPM\n\n# Setup the fstab file and create the mount\nmkdir --parents /mnt/${neuronxTaskDefinition.compiledModel.bucket.bucketName}\nmount-s3 ${neuronxTaskDefinition.compiledModel.bucket.bucketName} /mnt/${neuronxTaskDefinition.compiledModel.bucket.bucketName} --allow-other --file-mode=644 --dir-mode=755`);\n\n    neuronxTaskDefinition.addVolume({\n      name: \"model\",\n      host: {\n        sourcePath: `/mnt/${neuronxTaskDefinition.compiledModel.bucket.bucketName}`,\n      },\n    });\n\n    const volumeSize = Math.ceil(\n      PytorchTrainingNeuronxImage.size.toGibibytes() +\n        NeuronOptimizedMachineImage.size.toGibibytes(),\n    );\n    const desiredCapacity = Math.ceil(\n      (props.desiredCount ?? 1) / neuronxTaskDefinition.tasksPerInstance,\n    );\n    const autoScalingGroup = new AutoScalingGroup(this, \"AutoScalingGroup\", {\n      vpc: cluster.vpc,\n      instanceType: neuronxTaskDefinition.neuronxInstanceType.instanceType,\n      machineImage: new NeuronOptimizedMachineImage(\n        this,\n        \"NeuronOptimizedMachineImage\",\n      ),\n      blockDevices: [\n        {\n          deviceName: \"/dev/xvda\",\n          volume: BlockDeviceVolume.ebs(volumeSize, {\n            volumeType: EbsDeviceVolumeType.GP3,\n            encrypted: true,\n          }),\n        },\n      ],\n      userData,\n      desiredCapacity,\n      maxCapacity:\n        neuronxTaskDefinition.tasksPerInstance === 1\n          ? desiredCapacity + 1\n          : undefined,\n    });\n    autoScalingGroup.connections.allowFrom(\n      this.loadBalancer,\n      Port.tcpRange(32768, 60999),\n    );\n    neuronxTaskDefinition.compiledModel.bucket.grantRead(autoScalingGroup);\n    const provider = new ecs.AsgCapacityProvider(this, \"AsgCapacityProvider\", {\n      autoScalingGroup,\n    });\n    cluster.addAsgCapacityProvider(provider);\n  }\n}\n"]}
144
+ ApplicationLoadBalancedNeuronxService[_b] = { fqn: "aws-cdk-neuronx-patterns.ApplicationLoadBalancedNeuronxService", version: "0.3.0" };
145
+ //# sourceMappingURL=data:application/json;base64,{"version":3,"file":"application-load-balanced-neuronx-service.js","sourceRoot":"","sources":["../../../src/base/aws-ecs-patterns/application-load-balanced-neuronx-service.ts"],"names":[],"mappings":";;;;;AAAA,6CAAuC;AACvC,iEAIqC;AACrC,iDAAqD;AACrD,2CAA2C;AAC3C,mEAGsC;AAEtC,wCAIoB;AA6BpB,MAAa,qBACX,SAAQ,GAAG,CAAC,iBAAiB;IAQ7B,YAAY,KAAgB,EAAE,EAAU,EAAE,KAAiC;QACzE,MAAM,mBAAmB,GACvB,KAAK,CAAC,mBAAmB,IAAI,KAAK,CAAC,aAAa,CAAC,uBAAuB,CAAC;QAC3E,MAAM,kBAAkB,GAAG,KAAK,CAAC,kBAAkB,IAAI,CAAC,CAAC;QACzD,MAAM,gBAAgB,GAAG,IAAI,CAAC,KAAK,CACjC,mBAAmB,CAAC,gBAAgB,CAAC,YAAY,GAAG,kBAAkB,CACvE,CAAC;QACF,MAAM,oBAAoB,GACxB,gBAAgB,IAAI,CAAC;YACnB,CAAC,CAAC;gBACE,GAAG,CAAC,mBAAmB,CAAC,QAAQ,CAC9B,qBAAqB,gBAAgB,EAAE,CACxC;aACF;YACH,CAAC,CAAC,EAAE,CAAC;QACT,KAAK,CAAC,KAAK,EAAE,EAAE,EAAE;YACf,GAAG,KAAK;YACR,oBAAoB,EAAE;gBACpB,GAAG,CAAC,KAAK,CAAC,oBAAoB,IAAI,EAAE,CAAC;gBACrC,GAAG,oBAAoB;aACxB;SACF,CAAC,CAAC;QACH,IAAI,CAAC,eAAe,GAAG,IAAI,GAAG,CAAC,eAAe,CAAC,IAAI,EAAE,iBAAiB,CAAC,CAAC;QACxE,IAAI,CAAC,eAAe,CAAC,UAAU,CAC7B,GAAG,KAAK,CAAC,IAAI,CAAC;YACZ,MAAM,EAAE,mBAAmB,EAAE,gBAAgB,CAAC,KAAK,IAAI,CAAC;SACzD,CAAC,CAAC,GAAG,CAAa,CAAC,CAAC,EAAE,KAAK,EAAE,EAAE,CAAC,CAAC;YAChC,QAAQ,EAAE,cAAc,KAAK,EAAE;YAC/B,aAAa,EAAE,cAAc,KAAK,EAAE;YACpC,WAAW,EAAE,CAAC,GAAG,CAAC,gBAAgB,CAAC,IAAI,EAAE,GAAG,CAAC,gBAAgB,CAAC,KAAK,CAAC;SACrE,CAAC,CAAC,CACJ,CAAC;QACF,IAAI,IAAI,CAAC,aAAa,EAAE,CAAC;YACvB,KAAK,CAAC,aAAa,CAAC,MAAM,CAAC,SAAS,CAAC,IAAI,CAAC,aAAa,CAAC,CAAC;QAC3D,CAAC;QACD,KAAK,CAAC,aAAa,CAAC,MAAM,CAAC,SAAS,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;QACpD,IAAI,CAAC,aAAa,GAAG,KAAK,CAAC,aAAa,CAAC;QACzC,IAAI,CAAC,mBAAmB,GAAG,mBAAmB,CAAC;QAC/C,IAAI,CAAC,kBAAkB,GAAG,kBAAkB,CAAC;QAC7C,IAAI,CAAC,gBAAgB,GAAG,gBAAgB,CAAC;IAC3C,CAAC;IAED,uBAAuB,CACrB,EAAU,EACV,KAAqC;QAErC,MAAM,SAAS,GAAG,KAAK,CAAC,YAAY,CAAC,EAAE,EAAE;YACvC,OAAO,EAAE,GAAG,CAAC,SAAS,CAAC,OAAO,CAAC;gBAC7B,YAAY,EAAE,EAAE;aACjB,CAAC;YACF,eAAe,EAAE,IAAI,CAAC,eAAe;YACrC,oBAAoB,EAAE,IAAI,CAAC,IAAI,CAC7B,CAAC,IAAI,CAAC,mBAAmB,CAAC,MAAM,CAAC,WAAW,EAAE,GAAG,GAAG,CAAC;gBACnD,IAAI,CAAC,gBAAgB,CACxB;YACD,GAAG,KAAK;SACT,CAAC,CAAC;QACH,SAAS,CAAC,cAAc,CAAC;YACvB,YAAY,EAAE,OAAO;YACrB,aAAa,EAAE,eAAe;YAC9B,QAAQ,EAAE,KAAK;SAChB,CAAC,CAAC;QACH,OAAO,SAAS,CAAC;IACnB,CAAC;;AAxEH,sDAyEC;;;AAGD,MAAa,qCAAsC,SAAQ,oDAAiC;IAC1F,YACE,KAAgB,EAChB,EAAU,EACV,KAAiD;QAEjD,MAAM,qBAAqB,GAAG,KAAK,CAAC,cAAc,CAAC;QACnD,IACE,CAAC,qBAAqB;YACtB,CAAC,CAAC,qBAAqB,YAAY,qBAAqB,CAAC,EACzD,CAAC;YACD,MAAM,IAAI,KAAK,CAAC,kDAAkD,CAAC,CAAC;QACtE,CAAC;QACD,KAAK,CAAC,KAAK,EAAE,EAAE,EAAE;YACf,sBAAsB,EACpB,KAAK,CAAC,sBAAsB,IAAI,sBAAQ,CAAC,OAAO,CAAC,EAAE,CAAC;YACtD,GAAG,KAAK;SACT,CAAC,CAAC;QAEH,MAAM,OAAO,GAAG,IAAI,CAAC,iBAAiB,CAAC,IAAI,EAAE,KAAK,CAAC,GAAG,CAAC,CAAC;QAExD,sCAAsC;QACtC,MAAM,QAAQ,GAAG,kBAAQ,CAAC,QAAQ,EAAE,CAAC;QACrC,QAAQ,CAAC,WAAW,CAAC;;;;;;;;;;;;;;;;;;;;;;;uBAuBF,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU;WACjE,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU,SAAS,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU,+CAA+C,CAAC,CAAC;QAE3K,qBAAqB,CAAC,SAAS,CAAC;YAC9B,IAAI,EAAE,OAAO;YACb,IAAI,EAAE;gBACJ,UAAU,EAAE,QAAQ,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,UAAU,EAAE;aAC5E;SACF,CAAC,CAAC;QAEH,MAAM,UAAU,GAAG,IAAI,CAAC,IAAI,CAC1B,qCAA2B,CAAC,IAAI,CAAC,WAAW,EAAE;YAC5C,qCAA2B,CAAC,IAAI,CAAC,WAAW,EAAE,CACjD,CAAC;QACF,MAAM,eAAe,GAAG,IAAI,CAAC,IAAI,CAC/B,CAAC,KAAK,CAAC,YAAY,IAAI,CAAC,CAAC,GAAG,qBAAqB,CAAC,gBAAgB,CACnE,CAAC;QACF,MAAM,gBAAgB,GAAG,IAAI,kCAAgB,CAAC,IAAI,EAAE,kBAAkB,EAAE;YACtE,GAAG,EAAE,OAAO,CAAC,GAAG;YAChB,YAAY,EAAE,qBAAqB,CAAC,mBAAmB,CAAC,YAAY;YACpE,YAAY,EAAE,IAAI,qCAA2B,CAC3C,IAAI,EACJ,6BAA6B,CAC9B;YACD,YAAY,EAAE;gBACZ;oBACE,UAAU,EAAE,WAAW;oBACvB,MAAM,EAAE,mCAAiB,CAAC,GAAG,CAAC,UAAU,EAAE;wBACxC,UAAU,EAAE,qCAAmB,CAAC,GAAG;wBACnC,SAAS,EAAE,IAAI;qBAChB,CAAC;iBACH;aACF;YACD,QAAQ;YACR,eAAe;YACf,WAAW,EACT,qBAAqB,CAAC,gBAAgB,KAAK,CAAC;gBAC1C,CAAC,CAAC,eAAe,GAAG,CAAC;gBACrB,CAAC,CAAC,SAAS;SAChB,CAAC,CAAC;QACH,gBAAgB,CAAC,WAAW,CAAC,SAAS,CACpC,IAAI,CAAC,YAAY,EACjB,cAAI,CAAC,QAAQ,CAAC,KAAK,EAAE,KAAK,CAAC,CAC5B,CAAC;QACF,qBAAqB,CAAC,aAAa,CAAC,MAAM,CAAC,SAAS,CAAC,gBAAgB,CAAC,CAAC;QACvE,MAAM,QAAQ,GAAG,IAAI,GAAG,CAAC,mBAAmB,CAAC,IAAI,EAAE,qBAAqB,EAAE;YACxE,gBAAgB;SACjB,CAAC,CAAC;QACH,OAAO,CAAC,sBAAsB,CAAC,QAAQ,CAAC,CAAC;IAC3C,CAAC;;AA/FH,sFAgGC","sourcesContent":["import { Duration } from \"aws-cdk-lib\";\nimport {\n  AutoScalingGroup,\n  BlockDeviceVolume,\n  EbsDeviceVolumeType,\n} from \"aws-cdk-lib/aws-autoscaling\";\nimport { Port, UserData } from \"aws-cdk-lib/aws-ec2\";\nimport * as ecs from \"aws-cdk-lib/aws-ecs\";\nimport {\n  ApplicationLoadBalancedEc2Service,\n  ApplicationLoadBalancedEc2ServiceProps,\n} from \"aws-cdk-lib/aws-ecs-patterns\";\nimport { Construct } from \"constructs\";\nimport {\n  INeuronxInstanceType,\n  NeuronOptimizedMachineImage,\n  PytorchTrainingNeuronxImage,\n} from \"../neuronx\";\nimport { NeuronxCompiledModel } from \"../neuronx-compiler\";\n\nexport interface NeuronxTaskDefinitionPropsBase\n  extends ecs.Ec2TaskDefinitionProps {\n  /**\n   * The instance type of compile worker instance.\n   */\n  readonly neuronxInstanceType?: INeuronxInstanceType;\n  /**\n   * The number of tensor parallel size.\n   * @default - 1\n   */\n  readonly tensorParallelSize?: number;\n}\n\nexport interface NeuronxTaskDefinitionProps extends NeuronxTaskDefinitionPropsBase {\n  /**\n   * The model to be compiled.\n   */\n  readonly compiledModel: NeuronxCompiledModel;\n}\n\nexport interface INeuronxTaskDefinition extends ecs.IEc2TaskDefinition {\n  readonly neuronxInstanceType: INeuronxInstanceType;\n  readonly tensorParallelSize: number;\n  readonly tasksPerInstance: number;\n  readonly compiledModel: NeuronxCompiledModel;\n}\nexport class NeuronxTaskDefinition\n  extends ecs.Ec2TaskDefinition\n  implements INeuronxTaskDefinition\n{\n  readonly neuronxInstanceType: INeuronxInstanceType;\n  readonly tensorParallelSize: number;\n  readonly tasksPerInstance: number;\n  readonly compiledModel: NeuronxCompiledModel;\n  protected readonly linuxParameters: ecs.LinuxParameters;\n  constructor(scope: Construct, id: string, props: NeuronxTaskDefinitionProps) {\n    const neuronxInstanceType =\n      props.neuronxInstanceType ?? props.compiledModel.recommendedInstanceType;\n    const tensorParallelSize = props.tensorParallelSize ?? 1;\n    const tasksPerInstance = Math.floor(\n      neuronxInstanceType.acceleratorChips.neuronxCores / tensorParallelSize,\n    );\n    const placementConstraints =\n      tasksPerInstance >= 2\n        ? [\n            ecs.PlacementConstraint.memberOf(\n              `runningTasksCount<${tasksPerInstance}`,\n            ),\n          ]\n        : [];\n    super(scope, id, {\n      ...props,\n      placementConstraints: [\n        ...(props.placementConstraints ?? []),\n        ...placementConstraints,\n      ],\n    });\n    this.linuxParameters = new ecs.LinuxParameters(this, \"LinuxParameters\");\n    this.linuxParameters.addDevices(\n      ...Array.from({\n        length: neuronxInstanceType?.acceleratorChips.chips ?? 1,\n      }).map<ecs.Device>((_, index) => ({\n        hostPath: `/dev/neuron${index}`,\n        containerPath: `/dev/neuron${index}`,\n        permissions: [ecs.DevicePermission.READ, ecs.DevicePermission.WRITE],\n      })),\n    );\n    if (this.executionRole) {\n      props.compiledModel.bucket.grantRead(this.executionRole);\n    }\n    props.compiledModel.bucket.grantRead(this.taskRole);\n    this.compiledModel = props.compiledModel;\n    this.neuronxInstanceType = neuronxInstanceType;\n    this.tensorParallelSize = tensorParallelSize;\n    this.tasksPerInstance = tasksPerInstance;\n  }\n\n  addContainerWithDefault(\n    id: string,\n    props: ecs.ContainerDefinitionOptions,\n  ): ecs.ContainerDefinition {\n    const container = super.addContainer(id, {\n      logging: ecs.LogDriver.awsLogs({\n        streamPrefix: id,\n      }),\n      linuxParameters: this.linuxParameters,\n      memoryReservationMiB: Math.ceil(\n        (this.neuronxInstanceType.memory.toMebibytes() * 0.8) /\n          this.tasksPerInstance,\n      ),\n      ...props,\n    });\n    container.addMountPoints({\n      sourceVolume: \"model\",\n      containerPath: \"/opt/ml/model\",\n      readOnly: false,\n    });\n    return container;\n  }\n}\n\nexport interface ApplicationLoadBalancedNeuronxServiceProps extends ApplicationLoadBalancedEc2ServiceProps {}\nexport class ApplicationLoadBalancedNeuronxService extends ApplicationLoadBalancedEc2Service {\n  constructor(\n    scope: Construct,\n    id: string,\n    props: ApplicationLoadBalancedNeuronxServiceProps,\n  ) {\n    const neuronxTaskDefinition = props.taskDefinition;\n    if (\n      !neuronxTaskDefinition ||\n      !(neuronxTaskDefinition instanceof NeuronxTaskDefinition)\n    ) {\n      throw new Error(\"taskDefinition must extend NeuronxTaskDefinition\");\n    }\n    super(scope, id, {\n      healthCheckGracePeriod:\n        props.healthCheckGracePeriod ?? Duration.minutes(15),\n      ...props,\n    });\n\n    const cluster = this.getDefaultCluster(this, props.vpc);\n\n    // install and mount mountpoint for s3\n    const userData = UserData.forLinux();\n    userData.addCommands(`\n#!/bin/bash -e\n\n# Install Mountpoint\nMP_RPM=$(mktemp --suffix=.rpm)\ncurl https://s3.amazonaws.com/mountpoint-s3-release/latest/x86_64/mount-s3.rpm > $MP_RPM\n\n# cloud-init installs conflict with SSM agent: https://github.com/amazonlinux/amazon-linux-2023/issues/397\nattempt=0\nmax_attempts=5\nuntil dnf install -y $MP_RPM; do\n    attempt=$((attempt + 1))\n    if [ $attempt -ge $max_attempts ]; then\n        echo \"Failed to install mount-s3 after $max_attempts attempts. Exiting.\"\n        exit 1\n    fi\n    echo \"dnf install mount-s3 failed (attempt $attempt/$max_attempts), retrying in 3 seconds...\"\n    sleep 3\ndone\n\nrm $MP_RPM\n\n# Setup the fstab file and create the mount\nmkdir --parents /mnt/${neuronxTaskDefinition.compiledModel.bucket.bucketName}\nmount-s3 ${neuronxTaskDefinition.compiledModel.bucket.bucketName} /mnt/${neuronxTaskDefinition.compiledModel.bucket.bucketName} --allow-other --file-mode=644 --dir-mode=755`);\n\n    neuronxTaskDefinition.addVolume({\n      name: \"model\",\n      host: {\n        sourcePath: `/mnt/${neuronxTaskDefinition.compiledModel.bucket.bucketName}`,\n      },\n    });\n\n    const volumeSize = Math.ceil(\n      PytorchTrainingNeuronxImage.size.toGibibytes() +\n        NeuronOptimizedMachineImage.size.toGibibytes(),\n    );\n    const desiredCapacity = Math.ceil(\n      (props.desiredCount ?? 1) / neuronxTaskDefinition.tasksPerInstance,\n    );\n    const autoScalingGroup = new AutoScalingGroup(this, \"AutoScalingGroup\", {\n      vpc: cluster.vpc,\n      instanceType: neuronxTaskDefinition.neuronxInstanceType.instanceType,\n      machineImage: new NeuronOptimizedMachineImage(\n        this,\n        \"NeuronOptimizedMachineImage\",\n      ),\n      blockDevices: [\n        {\n          deviceName: \"/dev/xvda\",\n          volume: BlockDeviceVolume.ebs(volumeSize, {\n            volumeType: EbsDeviceVolumeType.GP3,\n            encrypted: true,\n          }),\n        },\n      ],\n      userData,\n      desiredCapacity,\n      maxCapacity:\n        neuronxTaskDefinition.tasksPerInstance === 1\n          ? desiredCapacity + 1\n          : undefined,\n    });\n    autoScalingGroup.connections.allowFrom(\n      this.loadBalancer,\n      Port.tcpRange(32768, 60999),\n    );\n    neuronxTaskDefinition.compiledModel.bucket.grantRead(autoScalingGroup);\n    const provider = new ecs.AsgCapacityProvider(this, \"AsgCapacityProvider\", {\n      autoScalingGroup,\n    });\n    cluster.addAsgCapacityProvider(provider);\n  }\n}\n"]}
@@ -63,7 +63,7 @@ class PytorchInferenceNeuronxImage extends PytorchNeuronxImage {
63
63
  }
64
64
  exports.PytorchInferenceNeuronxImage = PytorchInferenceNeuronxImage;
65
65
  _b = PytorchInferenceNeuronxImage, _c = JSII_RTTI_SYMBOL_1;
66
- PytorchInferenceNeuronxImage[_c] = { fqn: "aws-cdk-neuronx-patterns.PytorchInferenceNeuronxImage", version: "0.2.1" };
66
+ PytorchInferenceNeuronxImage[_c] = { fqn: "aws-cdk-neuronx-patterns.PytorchInferenceNeuronxImage", version: "0.3.0" };
67
67
  PytorchInferenceNeuronxImage.imageName = "public.ecr.aws/neuron/pytorch-inference-neuronx";
68
68
  /** Neuron SDK 2.28.0 */
69
69
  PytorchInferenceNeuronxImage.SDK_2_28_0 = _b.fromNeuronSdkVersion("2.28.0", "3.12", "2.9.0", "24.04");
@@ -87,7 +87,7 @@ class PytorchTrainingNeuronxImage extends PytorchNeuronxImage {
87
87
  }
88
88
  exports.PytorchTrainingNeuronxImage = PytorchTrainingNeuronxImage;
89
89
  _d = JSII_RTTI_SYMBOL_1;
90
- PytorchTrainingNeuronxImage[_d] = { fqn: "aws-cdk-neuronx-patterns.PytorchTrainingNeuronxImage", version: "0.2.1" };
90
+ PytorchTrainingNeuronxImage[_d] = { fqn: "aws-cdk-neuronx-patterns.PytorchTrainingNeuronxImage", version: "0.3.0" };
91
91
  PytorchTrainingNeuronxImage.imageName = "public.ecr.aws/neuron/pytorch-training-neuronx";
92
92
  class VllmInferenceNeuronxImage extends NeuronxImage {
93
93
  static fromNeuronSdkVersion(neuronSdkVersion, vllmVersion, pythonVersion, ubuntuVersion) {
@@ -101,7 +101,7 @@ class VllmInferenceNeuronxImage extends NeuronxImage {
101
101
  }
102
102
  exports.VllmInferenceNeuronxImage = VllmInferenceNeuronxImage;
103
103
  _e = VllmInferenceNeuronxImage, _f = JSII_RTTI_SYMBOL_1;
104
- VllmInferenceNeuronxImage[_f] = { fqn: "aws-cdk-neuronx-patterns.VllmInferenceNeuronxImage", version: "0.2.1" };
104
+ VllmInferenceNeuronxImage[_f] = { fqn: "aws-cdk-neuronx-patterns.VllmInferenceNeuronxImage", version: "0.3.0" };
105
105
  /** Neuron SDK 2.28.0 with vLLM 0.13.0 */
106
106
  VllmInferenceNeuronxImage.SDK_2_28_0 = _e.fromNeuronSdkVersion("2.28.0", "0.13.0", "3.12", "24.04");
107
107
  /** Neuron SDK 2.27.1 with vLLM 0.13.0 */
@@ -84,7 +84,7 @@ class Parameters {
84
84
  }
85
85
  exports.Parameters = Parameters;
86
86
  _a = JSII_RTTI_SYMBOL_1;
87
- Parameters[_a] = { fqn: "aws-cdk-neuronx-patterns.Parameters", version: "0.2.1" };
87
+ Parameters[_a] = { fqn: "aws-cdk-neuronx-patterns.Parameters", version: "0.3.0" };
88
88
  /**
89
89
  * Compile target model.
90
90
  */
@@ -149,5 +149,5 @@ class Model {
149
149
  }
150
150
  exports.Model = Model;
151
151
  _b = JSII_RTTI_SYMBOL_1;
152
- Model[_b] = { fqn: "aws-cdk-neuronx-patterns.Model", version: "0.2.1" };
152
+ Model[_b] = { fqn: "aws-cdk-neuronx-patterns.Model", version: "0.3.0" };
153
153
  //# sourceMappingURL=data:application/json;base64,{"version":3,"file":"model.js","sourceRoot":"","sources":["../../../src/base/neuronx/model.ts"],"names":[],"mappings":";;;;;AAAA,6CAA0C;AAG1C,IAAY,YAGX;AAHD,WAAY,YAAY;IACtB,gEAAiB,CAAA;IACjB,6DAAe,CAAA;AACjB,CAAC,EAHW,YAAY,4BAAZ,YAAY,QAGvB;AAED;;GAEG;AACH,IAAY,UAKX;AALD,WAAY,UAAU;IACpB;;OAEG;IACH,uBAAS,CAAA;AACX,CAAC,EALW,UAAU,0BAAV,UAAU,QAKrB;AAED;;GAEG;AACH,IAAY,QAaX;AAbD,WAAY,QAAQ;IAClB;;OAEG;IACH,6EAA2B,CAAA;IAC3B;;OAEG;IACH,uDAAgB,CAAA;IAChB;;OAEG;IACH,qFAA+B,CAAA;AACjC,CAAC,EAbW,QAAQ,wBAAR,QAAQ,QAanB;AAED;;GAEG;AACH,MAAa,UAAU;IACrB;;;;OAIG;IACH,MAAM,CAAC,OAAO,CAAC,UAAkB;QAC/B,OAAO,IAAI,UAAU,CAAC,UAAU,GAAG,OAAO,CAAC,CAAC;IAC9C,CAAC;IACD;;;;OAIG;IACH,MAAM,CAAC,OAAO,CAAC,UAAkB;QAC/B,OAAO,IAAI,UAAU,CAAC,UAAU,GAAG,UAAU,CAAC,CAAC;IACjD,CAAC;IACD;IACE;;OAEG;IACc,UAAkB;QAAlB,eAAU,GAAV,UAAU,CAAQ;IAClC,CAAC;IACJ;;;OAGG;IACH,SAAS;QACP,OAAO,IAAI,CAAC,UAAU,GAAG,OAAO,CAAC;IACnC,CAAC;IACD;;;OAGG;IACH,SAAS;QACP,OAAO,IAAI,CAAC,UAAU,GAAG,UAAU,CAAC;IACtC,CAAC;IACD,UAAU;QACR,OAAO,kBAAI,CAAC,SAAS,CAAC,IAAI,CAAC,SAAS,EAAE,GAAG,GAAG,CAAC,CAAC;IAChD,CAAC;;AAvCH,gCAwCC;;;AAiBD;;GAEG;AACH,MAAa,KAAK;IAChB;;;;;OAKG;IACH,MAAM,CAAC,eAAe,CAAC,OAAe,EAAE,OAAsB;QAC5D,MAAM,UAAU,GAAG,OAAO,EAAE,UAAU,IAAI,KAAK,CAAC,WAAW,CAAC,OAAO,CAAC,CAAC;QACrE,IAAI,CAAC,UAAU,EAAE,CAAC;YAChB,MAAM,IAAI,KAAK,CACb,yFAAyF,CAC1F,CAAC;QACJ,CAAC;QACD,OAAO,IAAI,KAAK,CAAC,OAAO,EAAE,OAAO,EAAE,SAAS,IAAI,OAAO,EAAE;YACvD,GAAG,OAAO;YACV,UAAU;SACX,CAAC,CAAC;IACL,CAAC;IACD;;;;;;OAMG;IACH,MAAM,CAAC,UAAU,CAAC,MAAe,EAAE,MAAc,EAAE,OAAsB;QACvE,IAAI,mBAAK,CAAC,YAAY,CAAC,MAAM,CAAC,IAAI,CAAC,OAAO,EAAE,SAAS,EAAE,CAAC;YACtD,MAAM,IAAI,KAAK,CAAC,iDAAiD,CAAC,CAAC;QACrE,CAAC;QACD,MAAM,SAAS,GAAG,OAAO,EAAE,SAAS,IAAI,MAAM,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;QACvE,MAAM,UAAU,GAAG,OAAO,EAAE,UAAU,IAAI,KAAK,CAAC,WAAW,CAAC,SAAS,CAAC,CAAC;QACvE,IAAI,CAAC,UAAU,EAAE,CAAC;YAChB,MAAM,IAAI,KAAK,CACb,yFAAyF,CAC1F,CAAC;QACJ,CAAC;QACD,OAAO,IAAI,KAAK,CACd,MAAM,CAAC,cAAc,CAAC,MAAM,CAAC,EAC7B,SAAS,EACT,EAAE,GAAG,OAAO,EAAE,UAAU,EAAE,EAC1B,MAAM,EACN,MAAM,CACP,CAAC;IACJ,CAAC;IACO,MAAM,CAAC,WAAW,CAAC,MAAc;QACvC,IAAI,CAAC;YACH,MAAM,OAAO,GAAG,MAAM,CAAC,KAAK,CAAC,YAAY,CAAC,CAAC;YAC3C,IAAI,OAAO,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;gBACjB,OAAO,UAAU,CAAC,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YAClD,CAAC;YACD,MAAM,OAAO,GAAG,MAAM,CAAC,KAAK,CAAC,YAAY,CAAC,CAAC;YAC3C,IAAI,OAAO,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;gBACjB,OAAO,UAAU,CAAC,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;YAClD,CAAC;QACH,CAAC;QAAC,MAAM,CAAC;YACP,MAAM;QACR,CAAC;QACD,OAAO,SAAS,CAAC;IACnB,CAAC;IACD,YACW,OAAe,EACf,SAAiB,EACjB,OAAqB,EACrB,MAAgB,EAChB,MAAe;QAJf,YAAO,GAAP,OAAO,CAAQ;QACf,cAAS,GAAT,SAAS,CAAQ;QACjB,YAAO,GAAP,OAAO,CAAc;QACrB,WAAM,GAAN,MAAM,CAAU;QAChB,WAAM,GAAN,MAAM,CAAS;IACvB,CAAC;;AAlEN,sBAmEC","sourcesContent":["import { Size, Token } from \"aws-cdk-lib\";\nimport { IBucket } from \"aws-cdk-lib/aws-s3\";\n\nexport enum DataTypeBits {\n  BF16_OR_FP16 = 16,\n  FP8_OR_INT8 = 8,\n}\n\n/**\n * Quant data type.\n */\nexport enum QuantDtype {\n  /**\n   * int8 weight storage.\n   */\n  S8 = \"s8\",\n}\n\n/**\n * Optimization level.\n */\nexport enum OptLevel {\n  /**\n   * enables the core performance optimizations in the compiler, while also minimizing compile time.\n   */\n  MINIMIZING_COMPILE_TIME = 1,\n  /**\n   * provides the best balance between model performance and compile time.\n   */\n  BEST_BALANCE = 2,\n  /**\n   * may provide additional model execution performance but may incur longer compile times and higher host memory usage during model compilation.\n   */\n  MODEL_EXECUTION_PERFORMANCE = 3,\n}\n\n/**\n * Represents the amount of parameters.\n */\nexport class Parameters {\n  /**\n   * Create a Parameters representing an amount million.\n   * @param parameters number of parameters millionX\n   * @returns parameters\n   */\n  static million(parameters: number) {\n    return new Parameters(parameters * 1000000);\n  }\n  /**\n   * Create a Parameters representing an amount billion.\n   * @param parameters number of parameters billionX\n   * @returns parameters\n   */\n  static billion(parameters: number) {\n    return new Parameters(parameters * 1000000000);\n  }\n  private constructor(\n    /**\n     * number of paremters.\n     */\n    private readonly parameters: number,\n  ) {}\n  /**\n   * Return this number of parameters as million.\n   * @returns This number of parameters as million.\n   */\n  toMillion() {\n    return this.parameters / 1000000;\n  }\n  /**\n   * Return this number of parameters as billion.\n   * @returns This number of parameters as billion.\n   */\n  toBillion() {\n    return this.parameters / 1000000000;\n  }\n  weightSize() {\n    return Size.gibibytes(this.toBillion() * 2.5);\n  }\n}\n\nexport interface ModelConfig {\n  readonly layers: number;\n  readonly embeddingDimension: number;\n  readonly attentionHeads: number;\n}\n\n/**\n * Compile target model basic infromation\n */\nexport interface ModelOptions {\n  readonly parameters: Parameters;\n  readonly config?: ModelConfig;\n  readonly modelName?: string;\n}\n\n/**\n * Compile target model.\n */\nexport class Model {\n  /**\n   * model informations at HuggingFace\n   * @param modelId model id on the HuggingFace\n   * @param options model basic information\n   * @returns model instance\n   */\n  static fromHuggingFace(modelId: string, options?: ModelOptions) {\n    const parameters = options?.parameters ?? Model.maybeParams(modelId);\n    if (!parameters) {\n      throw new Error(\n        \"The number of parameters cannot be inferred from the model ID. Set optional parameters.\",\n      );\n    }\n    return new Model(modelId, options?.modelName ?? modelId, {\n      ...options,\n      parameters,\n    });\n  }\n  /**\n   * model informations at S3 Bucket\n   * @param bucket Model stored S3 Bucket\n   * @param prefix Model stored objects prefix\n   * @param options model basic information\n   * @returns model instance\n   */\n  static fromBucket(bucket: IBucket, prefix: string, options?: ModelOptions) {\n    if (Token.isUnresolved(prefix) && !options?.modelName) {\n      throw new Error(\"ModelName is required when prefix is unresolved\");\n    }\n    const modelName = options?.modelName ?? prefix.split(\"/\").slice(-1)[0];\n    const parameters = options?.parameters ?? Model.maybeParams(modelName);\n    if (!parameters) {\n      throw new Error(\n        \"The number of parameters cannot be inferred from the model ID. Set optional parameters.\",\n      );\n    }\n    return new Model(\n      bucket.s3UrlForObject(prefix),\n      modelName,\n      { ...options, parameters },\n      bucket,\n      prefix,\n    );\n  }\n  private static maybeParams(source: string) {\n    try {\n      const billion = source.match(/-(\\d+)[bB]/);\n      if (billion?.[1]) {\n        return Parameters.billion(parseInt(billion[1]));\n      }\n      const million = source.match(/-(\\d+)[mM]/);\n      if (million?.[1]) {\n        return Parameters.million(parseInt(million[1]));\n      }\n    } catch {\n      // NOP\n    }\n    return undefined;\n  }\n  private constructor(\n    readonly modelId: string,\n    readonly modelName: string,\n    readonly options: ModelOptions,\n    readonly bucket?: IBucket,\n    readonly prefix?: string,\n  ) {}\n}\n"]}
@@ -42,6 +42,6 @@ class NeuronOptimizedMachineImage extends constructs_1.Construct {
42
42
  }
43
43
  exports.NeuronOptimizedMachineImage = NeuronOptimizedMachineImage;
44
44
  _a = JSII_RTTI_SYMBOL_1;
45
- NeuronOptimizedMachineImage[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronOptimizedMachineImage", version: "0.2.1" };
45
+ NeuronOptimizedMachineImage[_a] = { fqn: "aws-cdk-neuronx-patterns.NeuronOptimizedMachineImage", version: "0.3.0" };
46
46
  NeuronOptimizedMachineImage.size = aws_cdk_lib_1.Size.gibibytes(30);
47
47
  //# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoibmV1cm9uLW9wdGltaXplZC1tYWNoaW5lLWltYWdlLmpzIiwic291cmNlUm9vdCI6IiIsInNvdXJjZXMiOlsiLi4vLi4vLi4vc3JjL2Jhc2UvbmV1cm9ueC9uZXVyb24tb3B0aW1pemVkLW1hY2hpbmUtaW1hZ2UudHMiXSwibmFtZXMiOltdLCJtYXBwaW5ncyI6Ijs7Ozs7QUFBQSw2Q0FBbUQ7QUFDbkQsaURBSzZCO0FBQzdCLHVEQUEwRTtBQUMxRSwyQ0FBMkM7QUFDM0MsbUVBQXdEO0FBQ3hELDJDQUF1QztBQUN2Qyw2QkFBNkI7QUFFN0IsTUFBYSwyQkFDWCxTQUFRLHNCQUFTO0lBS2pCLElBQUksT0FBTztRQUNULE9BQU8sSUFBSSxDQUFDLFFBQVEsQ0FBQyxZQUFZLENBQUMsVUFBVSxDQUFDLENBQUM7SUFDaEQsQ0FBQztJQUVELFlBQVksS0FBZ0IsRUFBRSxFQUFVO1FBQ3RDLEtBQUssQ0FBQyxLQUFLLEVBQUUsRUFBRSxDQUFDLENBQUM7UUFFakIsTUFBTSxRQUFRLEdBQUcsSUFBSSwyQkFBUSxDQUFDLElBQUksRUFBRSxvQkFBb0IsRUFBRTtZQUN4RCxjQUFjLEVBQUUsSUFBSSw4QkFBaUIsQ0FBQyxJQUFJLEVBQUUsb0JBQW9CLEVBQUU7Z0JBQ2hFLElBQUksRUFBRSxpQkFBSSxDQUFDLFNBQVMsQ0FBQyxJQUFJLENBQUMsSUFBSSxDQUFDLFNBQVMsRUFBRSxxQkFBcUIsQ0FBQyxDQUFDO2dCQUNqRSxPQUFPLEVBQUUsZUFBZTtnQkFDeEIsT0FBTyxFQUFFLG9CQUFPLENBQUMsYUFBYTtnQkFDOUIsSUFBSSxFQUFFLHNDQUFzQzthQUM3QyxDQUFDO1NBQ0gsQ0FBQyxDQUFDO1FBQ0gsSUFBSSxDQUFDLFFBQVEsR0FBRyxJQUFJLDRCQUFjLENBQUMsSUFBSSxFQUFFLFlBQVksRUFBRTtZQUNyRCxZQUFZLEVBQUUsUUFBUSxDQUFDLFlBQVk7WUFDbkMsWUFBWSxFQUFFLG9CQUFvQjtZQUNsQyxVQUFVLEVBQUU7Z0JBQ1YsS0FBSyxFQUFFLEdBQUcsQ0FBQyxlQUFlLENBQUMsdUJBQXVCLENBQ2hELElBQUksRUFDSixPQUFPLEVBQ1AscUVBQXFFLENBQ3RFLENBQUMsV0FBVzthQUNkO1NBQ0YsQ0FBQyxDQUFDO0lBQ0wsQ0FBQztJQUNELFFBQVEsQ0FBQyxNQUFpQjtRQUN4QixPQUFPO1lBQ0wsT0FBTyxFQUFFLElBQUksQ0FBQyxPQUFPO1lBQ3JCLE1BQU0sRUFBRSw2QkFBbUIsQ0FBQyxLQUFLO1lBQ2pDLFFBQVEsRUFBRSxrQkFBUSxDQUFDLFFBQVEsRUFBRTtTQUM5QixDQUFDO0lBQ0osQ0FBQzs7QUF2Q0gsa0VBd0NDOzs7QUFwQ2lCLGdDQUFJLEdBQUcsa0JBQUksQ0FBQyxTQUFTLENBQUMsRUFBRSxDQUFDLENBQUMiLCJzb3VyY2VzQ29udGVudCI6WyJpbXBvcnQgeyBDdXN0b21SZXNvdXJjZSwgU2l6ZSB9IGZyb20gXCJhd3MtY2RrLWxpYlwiO1xuaW1wb3J0IHtcbiAgSU1hY2hpbmVJbWFnZSxcbiAgTWFjaGluZUltYWdlQ29uZmlnLFxuICBPcGVyYXRpbmdTeXN0ZW1UeXBlLFxuICBVc2VyRGF0YSxcbn0gZnJvbSBcImF3cy1jZGstbGliL2F3cy1lYzJcIjtcbmltcG9ydCB7IENvZGUsIFJ1bnRpbWUsIFNpbmdsZXRvbkZ1bmN0aW9uIH0gZnJvbSBcImF3cy1jZGstbGliL2F3cy1sYW1iZGFcIjtcbmltcG9ydCAqIGFzIHNzbSBmcm9tIFwiYXdzLWNkay1saWIvYXdzLXNzbVwiO1xuaW1wb3J0IHsgUHJvdmlkZXIgfSBmcm9tIFwiYXdzLWNkay1saWIvY3VzdG9tLXJlc291cmNlc1wiO1xuaW1wb3J0IHsgQ29uc3RydWN0IH0gZnJvbSBcImNvbnN0cnVjdHNcIjtcbmltcG9ydCAqIGFzIHBhdGggZnJvbSBcInBhdGhcIjtcblxuZXhwb3J0IGNsYXNzIE5ldXJvbk9wdGltaXplZE1hY2hpbmVJbWFnZVxuICBleHRlbmRzIENvbnN0cnVjdFxuICBpbXBsZW1lbnRzIElNYWNoaW5lSW1hZ2VcbntcbiAgc3RhdGljIHJlYWRvbmx5IHNpemUgPSBTaXplLmdpYmlieXRlcygzMCk7XG4gIHByaXZhdGUgcmVhZG9ubHkgcmVzb3VyY2U6IEN1c3RvbVJlc291cmNlO1xuICBnZXQgaW1hZ2VJZCgpIHtcbiAgICByZXR1cm4gdGhpcy5yZXNvdXJjZS5nZXRBdHRTdHJpbmcoXCJpbWFnZV9pZFwiKTtcbiAgfVxuXG4gIGNvbnN0cnVjdG9yKHNjb3BlOiBDb25zdHJ1Y3QsIGlkOiBzdHJpbmcpIHtcbiAgICBzdXBlcihzY29wZSwgaWQpO1xuXG4gICAgY29uc3QgcHJvdmlkZXIgPSBuZXcgUHJvdmlkZXIodGhpcywgXCJOZXVyb254QW1pUHJvdmlkZXJcIiwge1xuICAgICAgb25FdmVudEhhbmRsZXI6IG5ldyBTaW5nbGV0b25GdW5jdGlvbih0aGlzLCBcIk5ldXJvbnhBbWlGdW5jdGlvblwiLCB7XG4gICAgICAgIGNvZGU6IENvZGUuZnJvbUFzc2V0KHBhdGguam9pbihfX2Rpcm5hbWUsIFwicHJpdmF0ZS9uZXVyb254LWFtaVwiKSksXG4gICAgICAgIGhhbmRsZXI6IFwiaW5kZXgub25FdmVudFwiLFxuICAgICAgICBydW50aW1lOiBSdW50aW1lLk5PREVKU19MQVRFU1QsXG4gICAgICAgIHV1aWQ6IFwiMDhjOTg1MGEtNmYxMy00ZWQ0LTllMmQtNzg4OGQ3YjVhMjU4XCIsXG4gICAgICB9KSxcbiAgICB9KTtcbiAgICB0aGlzLnJlc291cmNlID0gbmV3IEN1c3RvbVJlc291cmNlKHRoaXMsIFwiTmV1cm9ueEFtaVwiLCB7XG4gICAgICBzZXJ2aWNlVG9rZW46IHByb3ZpZGVyLnNlcnZpY2VUb2tlbixcbiAgICAgIHJlc291cmNlVHlwZTogXCJDdXN0b206Ok5ldXJvbnhBbWlcIixcbiAgICAgIHByb3BlcnRpZXM6IHtcbiAgICAgICAgaW1hZ2U6IHNzbS5TdHJpbmdQYXJhbWV0ZXIuZnJvbVN0cmluZ1BhcmFtZXRlck5hbWUoXG4gICAgICAgICAgdGhpcyxcbiAgICAgICAgICBcIkltYWdlXCIsXG4gICAgICAgICAgXCIvYXdzL3NlcnZpY2UvZWNzL29wdGltaXplZC1hbWkvYW1hem9uLWxpbnV4LTIwMjMvbmV1cm9uL3JlY29tbWVuZGVkXCIsXG4gICAgICAgICkuc3RyaW5nVmFsdWUsXG4gICAgICB9LFxuICAgIH0pO1xuICB9XG4gIGdldEltYWdlKF9zY29wZTogQ29uc3RydWN0KTogTWFjaGluZUltYWdlQ29uZmlnIHtcbiAgICByZXR1cm4ge1xuICAgICAgaW1hZ2VJZDogdGhpcy5pbWFnZUlkLFxuICAgICAgb3NUeXBlOiBPcGVyYXRpbmdTeXN0ZW1UeXBlLkxJTlVYLFxuICAgICAgdXNlckRhdGE6IFVzZXJEYXRhLmZvckxpbnV4KCksXG4gICAgfTtcbiAgfVxufVxuIl19
@@ -14,7 +14,7 @@ class Inferentia2Chips {
14
14
  }
15
15
  exports.Inferentia2Chips = Inferentia2Chips;
16
16
  _a = JSII_RTTI_SYMBOL_1;
17
- Inferentia2Chips[_a] = { fqn: "aws-cdk-neuronx-patterns.Inferentia2Chips", version: "0.2.1" };
17
+ Inferentia2Chips[_a] = { fqn: "aws-cdk-neuronx-patterns.Inferentia2Chips", version: "0.3.0" };
18
18
  class Trainium1Chips {
19
19
  constructor(chips) {
20
20
  this.chips = chips;
@@ -24,7 +24,7 @@ class Trainium1Chips {
24
24
  }
25
25
  exports.Trainium1Chips = Trainium1Chips;
26
26
  _b = JSII_RTTI_SYMBOL_1;
27
- Trainium1Chips[_b] = { fqn: "aws-cdk-neuronx-patterns.Trainium1Chips", version: "0.2.1" };
27
+ Trainium1Chips[_b] = { fqn: "aws-cdk-neuronx-patterns.Trainium1Chips", version: "0.3.0" };
28
28
  class Trainium2Chips {
29
29
  constructor(chips) {
30
30
  this.chips = chips;
@@ -37,7 +37,7 @@ class Trainium2Chips {
37
37
  }
38
38
  exports.Trainium2Chips = Trainium2Chips;
39
39
  _c = JSII_RTTI_SYMBOL_1;
40
- Trainium2Chips[_c] = { fqn: "aws-cdk-neuronx-patterns.Trainium2Chips", version: "0.2.1" };
40
+ Trainium2Chips[_c] = { fqn: "aws-cdk-neuronx-patterns.Trainium2Chips", version: "0.3.0" };
41
41
  class NeuronxInstanceTypeBase {
42
42
  constructor(props) {
43
43
  this.instanceType = props.instanceType;
@@ -96,7 +96,7 @@ class NeuronxInstanceType {
96
96
  }
97
97
  exports.NeuronxInstanceType = NeuronxInstanceType;
98
98
  _d = JSII_RTTI_SYMBOL_1;
99
- NeuronxInstanceType[_d] = { fqn: "aws-cdk-neuronx-patterns.NeuronxInstanceType", version: "0.2.1" };
99
+ NeuronxInstanceType[_d] = { fqn: "aws-cdk-neuronx-patterns.NeuronxInstanceType", version: "0.3.0" };
100
100
  /**
101
101
  * inf2.xlarge
102
102
  */
@@ -1 +1,3 @@
1
- export * from "./neuronx-compiler";
1
+ export * from "./neuronx-compiler-base";
2
+ export * from "./neuronx-native-compiler";
3
+ export * from "./neuronx-cross-compiler";
@@ -14,5 +14,7 @@ var __exportStar = (this && this.__exportStar) || function(m, exports) {
14
14
  for (var p in m) if (p !== "default" && !Object.prototype.hasOwnProperty.call(exports, p)) __createBinding(exports, m, p);
15
15
  };
16
16
  Object.defineProperty(exports, "__esModule", { value: true });
17
- __exportStar(require("./neuronx-compiler"), exports);
18
- //# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoiaW5kZXguanMiLCJzb3VyY2VSb290IjoiIiwic291cmNlcyI6WyIuLi8uLi8uLi9zcmMvYmFzZS9uZXVyb254LWNvbXBpbGVyL2luZGV4LnRzIl0sIm5hbWVzIjpbXSwibWFwcGluZ3MiOiI7Ozs7Ozs7Ozs7Ozs7Ozs7QUFBQSxxREFBbUMiLCJzb3VyY2VzQ29udGVudCI6WyJleHBvcnQgKiBmcm9tIFwiLi9uZXVyb254LWNvbXBpbGVyXCI7XG4iXX0=
17
+ __exportStar(require("./neuronx-compiler-base"), exports);
18
+ __exportStar(require("./neuronx-native-compiler"), exports);
19
+ __exportStar(require("./neuronx-cross-compiler"), exports);
20
+ //# sourceMappingURL=data:application/json;base64,eyJ2ZXJzaW9uIjozLCJmaWxlIjoiaW5kZXguanMiLCJzb3VyY2VSb290IjoiIiwic291cmNlcyI6WyIuLi8uLi8uLi9zcmMvYmFzZS9uZXVyb254LWNvbXBpbGVyL2luZGV4LnRzIl0sIm5hbWVzIjpbXSwibWFwcGluZ3MiOiI7Ozs7Ozs7Ozs7Ozs7Ozs7QUFBQSwwREFBd0M7QUFDeEMsNERBQTBDO0FBQzFDLDJEQUF5QyIsInNvdXJjZXNDb250ZW50IjpbImV4cG9ydCAqIGZyb20gXCIuL25ldXJvbngtY29tcGlsZXItYmFzZVwiO1xuZXhwb3J0ICogZnJvbSBcIi4vbmV1cm9ueC1uYXRpdmUtY29tcGlsZXJcIjtcbmV4cG9ydCAqIGZyb20gXCIuL25ldXJvbngtY3Jvc3MtY29tcGlsZXJcIjtcbiJdfQ==
@@ -1,7 +1,8 @@
1
1
  import { Size } from "aws-cdk-lib";
2
2
  import * as batch from "aws-cdk-lib/aws-batch";
3
- import * as ec2 from "aws-cdk-lib/aws-ec2";
3
+ import { IVpc, SubnetSelection } from "aws-cdk-lib/aws-ec2";
4
4
  import { ContainerImage } from "aws-cdk-lib/aws-ecs";
5
+ import { IRole } from "aws-cdk-lib/aws-iam";
5
6
  import { IBucket } from "aws-cdk-lib/aws-s3";
6
7
  import { Construct } from "constructs";
7
8
  import { INeuronxInstanceType, Model } from "../neuronx";
@@ -19,13 +20,48 @@ export interface INeuronxContainerImage {
19
20
  readonly neuronSdkVersion: string;
20
21
  }
21
22
  /**
22
- * Props of NeuronxCompiler.
23
+ * The model compiled by Neuronx compiler.
23
24
  */
24
- export interface NeuronxCompilerProps {
25
+ export interface NeuronxCompiledModel {
26
+ /**
27
+ * The recommended Neuron instance type for running inference with this compiled model.
28
+ */
29
+ readonly recommendedInstanceType: INeuronxInstanceType;
30
+ /**
31
+ * The bucket to upload compiled artifacts.
32
+ */
33
+ readonly bucket: IBucket;
34
+ /**
35
+ * S3 URL that compiled artifact uploaded.
36
+ */
37
+ readonly s3Uri: string;
38
+ /**
39
+ * S3 prefix that compiled artifact uploaded.
40
+ */
41
+ readonly s3Prefix: string;
42
+ /**
43
+ * The model name.
44
+ */
45
+ readonly modelName: string;
46
+ /**
47
+ * The weight size of the model.
48
+ */
49
+ readonly weightSize: Size;
50
+ }
51
+ /**
52
+ * Interface for Neuronx compilers.
53
+ */
54
+ export interface INeuronxCompiler {
55
+ compile(): NeuronxCompiledModel;
56
+ }
57
+ /**
58
+ * Common props for NeuronxCompilerBase.
59
+ */
60
+ export interface NeuronxCompilerBaseProps {
25
61
  /**
26
62
  * VPC in which this will launch compile worker instance.
27
63
  */
28
- readonly vpc: ec2.IVpc;
64
+ readonly vpc: IVpc;
29
65
  /**
30
66
  * The bucket to upload compiled artifacts.
31
67
  */
@@ -53,10 +89,13 @@ export interface NeuronxCompilerProps {
53
89
  * An image of the container where the compile job is executed.
54
90
  */
55
91
  readonly image: INeuronxContainerImage;
92
+ /**
93
+ * The command to run in the container.
94
+ */
56
95
  readonly command?: string[];
57
96
  /**
58
97
  * The root volume of worker instance.
59
- * @default - N bilion parameters * 5GiB EBS
98
+ * @default - N billion parameters * 5GiB EBS
60
99
  */
61
100
  readonly volumeSize?: Size;
62
101
  /**
@@ -70,7 +109,7 @@ export interface NeuronxCompilerProps {
70
109
  *
71
110
  * @default - new subnets will be created
72
111
  */
73
- readonly vpcSubnets?: ec2.SubnetSelection;
112
+ readonly vpcSubnets?: SubnetSelection;
74
113
  /**
75
114
  * The environment variables to pass to the container.
76
115
  * This is only applicable when using container runtime.
@@ -81,40 +120,43 @@ export interface NeuronxCompilerProps {
81
120
  [key: string]: string;
82
121
  };
83
122
  }
84
- export interface NeuronxCompiledModel {
85
- readonly compileTimeInstanceType: INeuronxInstanceType;
86
- /**
87
- * The bucket to upload compiled artifacts.
88
- */
89
- readonly bucket: IBucket;
90
- /**
91
- * S3 URL that compiled artifact uploaded.
92
- */
93
- readonly s3Uri: string;
123
+ /**
124
+ * Result of creating a compute environment.
125
+ */
126
+ export interface ComputeEnvironmentResult {
94
127
  /**
95
- * S3 prefix that compiled artifact uploaded.
128
+ * The compute environment.
96
129
  */
97
- readonly s3Prefix: string;
130
+ readonly computeEnvironment: batch.IComputeEnvironment;
98
131
  /**
99
- * The model name.
132
+ * The instance role associated with the compute environment.
100
133
  */
101
- readonly modelName: string;
102
- readonly weightSize: Size;
134
+ readonly instanceRole: IRole;
103
135
  }
104
136
  /**
105
- * Neuronx compiler construct.
106
- * Compile the model to work with Inferentia2 and Trainium1 and upload it to an S3 bucket.
137
+ * Abstract base class for Neuronx compilers.
138
+ * Provides the common orchestration logic (Lambda, CustomResource, WaitCondition)
139
+ * while subclasses define how to create the Batch compute environment and job definition.
107
140
  */
108
- export declare class NeuronxCompiler extends Construct {
141
+ export declare abstract class NeuronxCompilerBase extends Construct implements INeuronxCompiler {
109
142
  private compiledModel?;
110
143
  private readonly entrypoint;
111
- private readonly jobDefinition;
112
- private readonly jobQueue;
113
- private readonly artifactS3Prefix;
114
- private readonly weightSize;
115
- private readonly neuronxInstanceType;
116
- private readonly model;
117
- private readonly bucket;
118
- constructor(scope: Construct, id: string, props: NeuronxCompilerProps);
144
+ protected readonly artifactS3Prefix: string;
145
+ protected readonly weightSize: Size;
146
+ protected readonly neuronxInstanceType: INeuronxInstanceType;
147
+ protected readonly model: Model;
148
+ protected readonly bucket: IBucket;
149
+ constructor(scope: Construct, id: string, props: NeuronxCompilerBaseProps);
150
+ /**
151
+ * Create the Batch compute environment.
152
+ * Subclasses must implement this to provide the appropriate compute environment.
153
+ */
154
+ protected abstract createComputeEnvironment(props: NeuronxCompilerBaseProps): ComputeEnvironmentResult;
155
+ /**
156
+ * Create the Batch job definition.
157
+ * Subclasses must implement this to provide the appropriate job definition.
158
+ */
159
+ protected abstract createJobDefinition(props: NeuronxCompilerBaseProps): batch.IJobDefinition;
160
+ private createJobQueue;
119
161
  compile(): NeuronxCompiledModel;
120
162
  }