aws-cdk-neuronx-patterns 0.1.1 → 0.2.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.jsii +384 -82
- package/AGENT.md +11 -0
- package/API.md +237 -1
- package/lib/base/aws-batch/neuronx-batch-compute-environment.js +1 -1
- package/lib/base/aws-batch/neuronx-batch-ecs-job-definition.js +1 -1
- package/lib/base/aws-batch/neuronx-batch.js +1 -1
- package/lib/base/aws-ecs-patterns/application-load-balanced-neuronx-service.js +2 -2
- package/lib/base/neuronx/calculator.test.js +61 -1
- package/lib/base/neuronx/deep-learning-containers.d.ts +21 -3
- package/lib/base/neuronx/deep-learning-containers.js +25 -7
- package/lib/base/neuronx/deep-learning-containers.test.js +80 -3
- package/lib/base/neuronx/model.js +2 -2
- package/lib/base/neuronx/neuron-optimized-machine-image.js +1 -1
- package/lib/base/neuronx/neuronx-instance-type.d.ts +18 -0
- package/lib/base/neuronx/neuronx-instance-type.js +60 -7
- package/lib/base/neuronx/neuronx-instance-type.test.js +80 -1
- package/lib/base/neuronx-compiler/neuronx-compiler.js +1 -1
- package/lib/base/server-engine/vllm-engine/vllm-engine-argments.js +1 -1
- package/lib/vllm-nxd-inference/vllm-nxd-inference-compiler.js +5 -3
- package/lib/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.js +4 -4
- package/package.json +6 -6
package/.jsii
CHANGED
|
@@ -8,7 +8,7 @@
|
|
|
8
8
|
},
|
|
9
9
|
"dependencies": {
|
|
10
10
|
"@aws-cdk/aws-sagemaker-alpha": "2.240.0-alpha.0",
|
|
11
|
-
"@cdklabs/deploy-time-build": "^0.0
|
|
11
|
+
"@cdklabs/deploy-time-build": "^0.1.0",
|
|
12
12
|
"aws-cdk-lib": "^2.240.0",
|
|
13
13
|
"constructs": "^10.5.1"
|
|
14
14
|
},
|
|
@@ -8555,7 +8555,7 @@
|
|
|
8555
8555
|
"stability": "stable"
|
|
8556
8556
|
},
|
|
8557
8557
|
"homepage": "https://github.com/WinterYukky/aws-cdk-neuronx-patterns.git",
|
|
8558
|
-
"jsiiVersion": "5.9.
|
|
8558
|
+
"jsiiVersion": "5.9.31 (build 550e607)",
|
|
8559
8559
|
"keywords": [
|
|
8560
8560
|
"cdk",
|
|
8561
8561
|
"neuronx"
|
|
@@ -9340,7 +9340,7 @@
|
|
|
9340
9340
|
"kind": "interface",
|
|
9341
9341
|
"locationInModule": {
|
|
9342
9342
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
9343
|
-
"line":
|
|
9343
|
+
"line": 42
|
|
9344
9344
|
},
|
|
9345
9345
|
"name": "INeuronxInstanceType",
|
|
9346
9346
|
"properties": [
|
|
@@ -9352,7 +9352,7 @@
|
|
|
9352
9352
|
"immutable": true,
|
|
9353
9353
|
"locationInModule": {
|
|
9354
9354
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
9355
|
-
"line":
|
|
9355
|
+
"line": 47
|
|
9356
9356
|
},
|
|
9357
9357
|
"name": "acceleratorChips",
|
|
9358
9358
|
"type": {
|
|
@@ -9367,7 +9367,7 @@
|
|
|
9367
9367
|
"immutable": true,
|
|
9368
9368
|
"locationInModule": {
|
|
9369
9369
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
9370
|
-
"line":
|
|
9370
|
+
"line": 44
|
|
9371
9371
|
},
|
|
9372
9372
|
"name": "instanceType",
|
|
9373
9373
|
"type": {
|
|
@@ -9382,7 +9382,7 @@
|
|
|
9382
9382
|
"immutable": true,
|
|
9383
9383
|
"locationInModule": {
|
|
9384
9384
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
9385
|
-
"line":
|
|
9385
|
+
"line": 46
|
|
9386
9386
|
},
|
|
9387
9387
|
"name": "memory",
|
|
9388
9388
|
"type": {
|
|
@@ -9397,7 +9397,7 @@
|
|
|
9397
9397
|
"immutable": true,
|
|
9398
9398
|
"locationInModule": {
|
|
9399
9399
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
9400
|
-
"line":
|
|
9400
|
+
"line": 43
|
|
9401
9401
|
},
|
|
9402
9402
|
"name": "supportedTensorParallelism",
|
|
9403
9403
|
"type": {
|
|
@@ -9417,7 +9417,7 @@
|
|
|
9417
9417
|
"immutable": true,
|
|
9418
9418
|
"locationInModule": {
|
|
9419
9419
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
9420
|
-
"line":
|
|
9420
|
+
"line": 45
|
|
9421
9421
|
},
|
|
9422
9422
|
"name": "vCpu",
|
|
9423
9423
|
"type": {
|
|
@@ -9518,7 +9518,7 @@
|
|
|
9518
9518
|
"kind": "interface",
|
|
9519
9519
|
"locationInModule": {
|
|
9520
9520
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
9521
|
-
"line":
|
|
9521
|
+
"line": 233
|
|
9522
9522
|
},
|
|
9523
9523
|
"name": "IVllmInferenceNeuronxImage",
|
|
9524
9524
|
"properties": [
|
|
@@ -9530,7 +9530,7 @@
|
|
|
9530
9530
|
"immutable": true,
|
|
9531
9531
|
"locationInModule": {
|
|
9532
9532
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
9533
|
-
"line":
|
|
9533
|
+
"line": 234
|
|
9534
9534
|
},
|
|
9535
9535
|
"name": "vllmVersion",
|
|
9536
9536
|
"type": {
|
|
@@ -11391,7 +11391,7 @@
|
|
|
11391
11391
|
"kind": "class",
|
|
11392
11392
|
"locationInModule": {
|
|
11393
11393
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
11394
|
-
"line":
|
|
11394
|
+
"line": 137
|
|
11395
11395
|
},
|
|
11396
11396
|
"name": "NeuronxInstanceType",
|
|
11397
11397
|
"properties": [
|
|
@@ -11404,7 +11404,7 @@
|
|
|
11404
11404
|
"immutable": true,
|
|
11405
11405
|
"locationInModule": {
|
|
11406
11406
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
11407
|
-
"line":
|
|
11407
|
+
"line": 167
|
|
11408
11408
|
},
|
|
11409
11409
|
"name": "INF2_24XLARGE",
|
|
11410
11410
|
"static": true,
|
|
@@ -11421,7 +11421,7 @@
|
|
|
11421
11421
|
"immutable": true,
|
|
11422
11422
|
"locationInModule": {
|
|
11423
11423
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
11424
|
-
"line":
|
|
11424
|
+
"line": 180
|
|
11425
11425
|
},
|
|
11426
11426
|
"name": "INF2_48XLARGE",
|
|
11427
11427
|
"static": true,
|
|
@@ -11438,7 +11438,7 @@
|
|
|
11438
11438
|
"immutable": true,
|
|
11439
11439
|
"locationInModule": {
|
|
11440
11440
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
11441
|
-
"line":
|
|
11441
|
+
"line": 154
|
|
11442
11442
|
},
|
|
11443
11443
|
"name": "INF2_8XLARGE",
|
|
11444
11444
|
"static": true,
|
|
@@ -11455,7 +11455,7 @@
|
|
|
11455
11455
|
"immutable": true,
|
|
11456
11456
|
"locationInModule": {
|
|
11457
11457
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
11458
|
-
"line":
|
|
11458
|
+
"line": 141
|
|
11459
11459
|
},
|
|
11460
11460
|
"name": "INF2_XLARGE",
|
|
11461
11461
|
"static": true,
|
|
@@ -11472,7 +11472,7 @@
|
|
|
11472
11472
|
"immutable": true,
|
|
11473
11473
|
"locationInModule": {
|
|
11474
11474
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
11475
|
-
"line":
|
|
11475
|
+
"line": 193
|
|
11476
11476
|
},
|
|
11477
11477
|
"name": "TRN1_2XLARGE",
|
|
11478
11478
|
"static": true,
|
|
@@ -11489,13 +11489,64 @@
|
|
|
11489
11489
|
"immutable": true,
|
|
11490
11490
|
"locationInModule": {
|
|
11491
11491
|
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
11492
|
-
"line":
|
|
11492
|
+
"line": 206
|
|
11493
11493
|
},
|
|
11494
11494
|
"name": "TRN1_32XLARGE",
|
|
11495
11495
|
"static": true,
|
|
11496
11496
|
"type": {
|
|
11497
11497
|
"fqn": "aws-cdk-neuronx-patterns.INeuronxInstanceType"
|
|
11498
11498
|
}
|
|
11499
|
+
},
|
|
11500
|
+
{
|
|
11501
|
+
"const": true,
|
|
11502
|
+
"docs": {
|
|
11503
|
+
"stability": "stable",
|
|
11504
|
+
"summary": "trn2.3xlarge."
|
|
11505
|
+
},
|
|
11506
|
+
"immutable": true,
|
|
11507
|
+
"locationInModule": {
|
|
11508
|
+
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
11509
|
+
"line": 219
|
|
11510
|
+
},
|
|
11511
|
+
"name": "TRN2_3XLARGE",
|
|
11512
|
+
"static": true,
|
|
11513
|
+
"type": {
|
|
11514
|
+
"fqn": "aws-cdk-neuronx-patterns.INeuronxInstanceType"
|
|
11515
|
+
}
|
|
11516
|
+
},
|
|
11517
|
+
{
|
|
11518
|
+
"const": true,
|
|
11519
|
+
"docs": {
|
|
11520
|
+
"stability": "stable",
|
|
11521
|
+
"summary": "trn2.48xlarge."
|
|
11522
|
+
},
|
|
11523
|
+
"immutable": true,
|
|
11524
|
+
"locationInModule": {
|
|
11525
|
+
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
11526
|
+
"line": 232
|
|
11527
|
+
},
|
|
11528
|
+
"name": "TRN2_48XLARGE",
|
|
11529
|
+
"static": true,
|
|
11530
|
+
"type": {
|
|
11531
|
+
"fqn": "aws-cdk-neuronx-patterns.INeuronxInstanceType"
|
|
11532
|
+
}
|
|
11533
|
+
},
|
|
11534
|
+
{
|
|
11535
|
+
"const": true,
|
|
11536
|
+
"docs": {
|
|
11537
|
+
"stability": "stable",
|
|
11538
|
+
"summary": "trn2u.48xlarge."
|
|
11539
|
+
},
|
|
11540
|
+
"immutable": true,
|
|
11541
|
+
"locationInModule": {
|
|
11542
|
+
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
11543
|
+
"line": 245
|
|
11544
|
+
},
|
|
11545
|
+
"name": "TRN2U_48XLARGE",
|
|
11546
|
+
"static": true,
|
|
11547
|
+
"type": {
|
|
11548
|
+
"fqn": "aws-cdk-neuronx-patterns.INeuronxInstanceType"
|
|
11549
|
+
}
|
|
11499
11550
|
}
|
|
11500
11551
|
],
|
|
11501
11552
|
"symbolId": "src/base/neuronx/neuronx-instance-type:NeuronxInstanceType"
|
|
@@ -11983,7 +12034,7 @@
|
|
|
11983
12034
|
"kind": "class",
|
|
11984
12035
|
"locationInModule": {
|
|
11985
12036
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
11986
|
-
"line":
|
|
12037
|
+
"line": 159
|
|
11987
12038
|
},
|
|
11988
12039
|
"methods": [
|
|
11989
12040
|
{
|
|
@@ -11992,7 +12043,7 @@
|
|
|
11992
12043
|
},
|
|
11993
12044
|
"locationInModule": {
|
|
11994
12045
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
11995
|
-
"line":
|
|
12046
|
+
"line": 144
|
|
11996
12047
|
},
|
|
11997
12048
|
"name": "fromNeuronSdkVersion",
|
|
11998
12049
|
"parameters": [
|
|
@@ -12039,7 +12090,7 @@
|
|
|
12039
12090
|
"immutable": true,
|
|
12040
12091
|
"locationInModule": {
|
|
12041
12092
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12042
|
-
"line":
|
|
12093
|
+
"line": 160
|
|
12043
12094
|
},
|
|
12044
12095
|
"name": "imageName",
|
|
12045
12096
|
"static": true,
|
|
@@ -12056,7 +12107,7 @@
|
|
|
12056
12107
|
"immutable": true,
|
|
12057
12108
|
"locationInModule": {
|
|
12058
12109
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12059
|
-
"line":
|
|
12110
|
+
"line": 226
|
|
12060
12111
|
},
|
|
12061
12112
|
"name": "LATEST",
|
|
12062
12113
|
"static": true,
|
|
@@ -12073,7 +12124,7 @@
|
|
|
12073
12124
|
"immutable": true,
|
|
12074
12125
|
"locationInModule": {
|
|
12075
12126
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12076
|
-
"line":
|
|
12127
|
+
"line": 135
|
|
12077
12128
|
},
|
|
12078
12129
|
"name": "SDK_2_18_0",
|
|
12079
12130
|
"static": true,
|
|
@@ -12090,7 +12141,7 @@
|
|
|
12090
12141
|
"immutable": true,
|
|
12091
12142
|
"locationInModule": {
|
|
12092
12143
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12093
|
-
"line":
|
|
12144
|
+
"line": 128
|
|
12094
12145
|
},
|
|
12095
12146
|
"name": "SDK_2_18_1",
|
|
12096
12147
|
"static": true,
|
|
@@ -12107,7 +12158,7 @@
|
|
|
12107
12158
|
"immutable": true,
|
|
12108
12159
|
"locationInModule": {
|
|
12109
12160
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12110
|
-
"line":
|
|
12161
|
+
"line": 121
|
|
12111
12162
|
},
|
|
12112
12163
|
"name": "SDK_2_18_2",
|
|
12113
12164
|
"static": true,
|
|
@@ -12124,7 +12175,7 @@
|
|
|
12124
12175
|
"immutable": true,
|
|
12125
12176
|
"locationInModule": {
|
|
12126
12177
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12127
|
-
"line":
|
|
12178
|
+
"line": 114
|
|
12128
12179
|
},
|
|
12129
12180
|
"name": "SDK_2_19_0",
|
|
12130
12181
|
"static": true,
|
|
@@ -12141,7 +12192,7 @@
|
|
|
12141
12192
|
"immutable": true,
|
|
12142
12193
|
"locationInModule": {
|
|
12143
12194
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12144
|
-
"line":
|
|
12195
|
+
"line": 107
|
|
12145
12196
|
},
|
|
12146
12197
|
"name": "SDK_2_19_1",
|
|
12147
12198
|
"static": true,
|
|
@@ -12158,7 +12209,7 @@
|
|
|
12158
12209
|
"immutable": true,
|
|
12159
12210
|
"locationInModule": {
|
|
12160
12211
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12161
|
-
"line":
|
|
12212
|
+
"line": 100
|
|
12162
12213
|
},
|
|
12163
12214
|
"name": "SDK_2_20_0",
|
|
12164
12215
|
"static": true,
|
|
@@ -12175,7 +12226,7 @@
|
|
|
12175
12226
|
"immutable": true,
|
|
12176
12227
|
"locationInModule": {
|
|
12177
12228
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12178
|
-
"line":
|
|
12229
|
+
"line": 93
|
|
12179
12230
|
},
|
|
12180
12231
|
"name": "SDK_2_20_1",
|
|
12181
12232
|
"static": true,
|
|
@@ -12192,7 +12243,7 @@
|
|
|
12192
12243
|
"immutable": true,
|
|
12193
12244
|
"locationInModule": {
|
|
12194
12245
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12195
|
-
"line":
|
|
12246
|
+
"line": 86
|
|
12196
12247
|
},
|
|
12197
12248
|
"name": "SDK_2_20_2",
|
|
12198
12249
|
"static": true,
|
|
@@ -12209,7 +12260,7 @@
|
|
|
12209
12260
|
"immutable": true,
|
|
12210
12261
|
"locationInModule": {
|
|
12211
12262
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12212
|
-
"line":
|
|
12263
|
+
"line": 218
|
|
12213
12264
|
},
|
|
12214
12265
|
"name": "SDK_2_20_2_PYTORCH_1_13_1",
|
|
12215
12266
|
"static": true,
|
|
@@ -12226,7 +12277,7 @@
|
|
|
12226
12277
|
"immutable": true,
|
|
12227
12278
|
"locationInModule": {
|
|
12228
12279
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12229
|
-
"line":
|
|
12280
|
+
"line": 210
|
|
12230
12281
|
},
|
|
12231
12282
|
"name": "SDK_2_20_2_PYTORCH_2_1_2",
|
|
12232
12283
|
"static": true,
|
|
@@ -12243,7 +12294,7 @@
|
|
|
12243
12294
|
"immutable": true,
|
|
12244
12295
|
"locationInModule": {
|
|
12245
12296
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12246
|
-
"line":
|
|
12297
|
+
"line": 79
|
|
12247
12298
|
},
|
|
12248
12299
|
"name": "SDK_2_21_0",
|
|
12249
12300
|
"static": true,
|
|
@@ -12260,7 +12311,7 @@
|
|
|
12260
12311
|
"immutable": true,
|
|
12261
12312
|
"locationInModule": {
|
|
12262
12313
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12263
|
-
"line":
|
|
12314
|
+
"line": 72
|
|
12264
12315
|
},
|
|
12265
12316
|
"name": "SDK_2_21_1",
|
|
12266
12317
|
"static": true,
|
|
@@ -12277,7 +12328,7 @@
|
|
|
12277
12328
|
"immutable": true,
|
|
12278
12329
|
"locationInModule": {
|
|
12279
12330
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12280
|
-
"line":
|
|
12331
|
+
"line": 202
|
|
12281
12332
|
},
|
|
12282
12333
|
"name": "SDK_2_22_0",
|
|
12283
12334
|
"static": true,
|
|
@@ -12294,7 +12345,7 @@
|
|
|
12294
12345
|
"immutable": true,
|
|
12295
12346
|
"locationInModule": {
|
|
12296
12347
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12297
|
-
"line":
|
|
12348
|
+
"line": 194
|
|
12298
12349
|
},
|
|
12299
12350
|
"name": "SDK_2_23_0",
|
|
12300
12351
|
"static": true,
|
|
@@ -12311,7 +12362,7 @@
|
|
|
12311
12362
|
"immutable": true,
|
|
12312
12363
|
"locationInModule": {
|
|
12313
12364
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12314
|
-
"line":
|
|
12365
|
+
"line": 51
|
|
12315
12366
|
},
|
|
12316
12367
|
"name": "SDK_2_24_0",
|
|
12317
12368
|
"static": true,
|
|
@@ -12328,7 +12379,7 @@
|
|
|
12328
12379
|
"immutable": true,
|
|
12329
12380
|
"locationInModule": {
|
|
12330
12381
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12331
|
-
"line":
|
|
12382
|
+
"line": 186
|
|
12332
12383
|
},
|
|
12333
12384
|
"name": "SDK_2_25_0",
|
|
12334
12385
|
"static": true,
|
|
@@ -12345,7 +12396,7 @@
|
|
|
12345
12396
|
"immutable": true,
|
|
12346
12397
|
"locationInModule": {
|
|
12347
12398
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12348
|
-
"line":
|
|
12399
|
+
"line": 178
|
|
12349
12400
|
},
|
|
12350
12401
|
"name": "SDK_2_26_1",
|
|
12351
12402
|
"static": true,
|
|
@@ -12362,7 +12413,7 @@
|
|
|
12362
12413
|
"immutable": true,
|
|
12363
12414
|
"locationInModule": {
|
|
12364
12415
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12365
|
-
"line":
|
|
12416
|
+
"line": 170
|
|
12366
12417
|
},
|
|
12367
12418
|
"name": "SDK_2_27_1",
|
|
12368
12419
|
"static": true,
|
|
@@ -12379,7 +12430,7 @@
|
|
|
12379
12430
|
"immutable": true,
|
|
12380
12431
|
"locationInModule": {
|
|
12381
12432
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12382
|
-
"line":
|
|
12433
|
+
"line": 162
|
|
12383
12434
|
},
|
|
12384
12435
|
"name": "SDK_2_28_0",
|
|
12385
12436
|
"static": true,
|
|
@@ -12421,7 +12472,7 @@
|
|
|
12421
12472
|
"kind": "class",
|
|
12422
12473
|
"locationInModule": {
|
|
12423
12474
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12424
|
-
"line":
|
|
12475
|
+
"line": 229
|
|
12425
12476
|
},
|
|
12426
12477
|
"methods": [
|
|
12427
12478
|
{
|
|
@@ -12430,7 +12481,7 @@
|
|
|
12430
12481
|
},
|
|
12431
12482
|
"locationInModule": {
|
|
12432
12483
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12433
|
-
"line":
|
|
12484
|
+
"line": 144
|
|
12434
12485
|
},
|
|
12435
12486
|
"name": "fromNeuronSdkVersion",
|
|
12436
12487
|
"parameters": [
|
|
@@ -12477,7 +12528,7 @@
|
|
|
12477
12528
|
"immutable": true,
|
|
12478
12529
|
"locationInModule": {
|
|
12479
12530
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12480
|
-
"line":
|
|
12531
|
+
"line": 230
|
|
12481
12532
|
},
|
|
12482
12533
|
"name": "imageName",
|
|
12483
12534
|
"static": true,
|
|
@@ -12494,7 +12545,7 @@
|
|
|
12494
12545
|
"immutable": true,
|
|
12495
12546
|
"locationInModule": {
|
|
12496
12547
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12497
|
-
"line":
|
|
12548
|
+
"line": 142
|
|
12498
12549
|
},
|
|
12499
12550
|
"name": "LATEST",
|
|
12500
12551
|
"static": true,
|
|
@@ -12511,7 +12562,7 @@
|
|
|
12511
12562
|
"immutable": true,
|
|
12512
12563
|
"locationInModule": {
|
|
12513
12564
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12514
|
-
"line":
|
|
12565
|
+
"line": 135
|
|
12515
12566
|
},
|
|
12516
12567
|
"name": "SDK_2_18_0",
|
|
12517
12568
|
"static": true,
|
|
@@ -12528,7 +12579,7 @@
|
|
|
12528
12579
|
"immutable": true,
|
|
12529
12580
|
"locationInModule": {
|
|
12530
12581
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12531
|
-
"line":
|
|
12582
|
+
"line": 128
|
|
12532
12583
|
},
|
|
12533
12584
|
"name": "SDK_2_18_1",
|
|
12534
12585
|
"static": true,
|
|
@@ -12545,7 +12596,7 @@
|
|
|
12545
12596
|
"immutable": true,
|
|
12546
12597
|
"locationInModule": {
|
|
12547
12598
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12548
|
-
"line":
|
|
12599
|
+
"line": 121
|
|
12549
12600
|
},
|
|
12550
12601
|
"name": "SDK_2_18_2",
|
|
12551
12602
|
"static": true,
|
|
@@ -12562,7 +12613,7 @@
|
|
|
12562
12613
|
"immutable": true,
|
|
12563
12614
|
"locationInModule": {
|
|
12564
12615
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12565
|
-
"line":
|
|
12616
|
+
"line": 114
|
|
12566
12617
|
},
|
|
12567
12618
|
"name": "SDK_2_19_0",
|
|
12568
12619
|
"static": true,
|
|
@@ -12579,7 +12630,7 @@
|
|
|
12579
12630
|
"immutable": true,
|
|
12580
12631
|
"locationInModule": {
|
|
12581
12632
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12582
|
-
"line":
|
|
12633
|
+
"line": 107
|
|
12583
12634
|
},
|
|
12584
12635
|
"name": "SDK_2_19_1",
|
|
12585
12636
|
"static": true,
|
|
@@ -12596,7 +12647,7 @@
|
|
|
12596
12647
|
"immutable": true,
|
|
12597
12648
|
"locationInModule": {
|
|
12598
12649
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12599
|
-
"line":
|
|
12650
|
+
"line": 100
|
|
12600
12651
|
},
|
|
12601
12652
|
"name": "SDK_2_20_0",
|
|
12602
12653
|
"static": true,
|
|
@@ -12613,7 +12664,7 @@
|
|
|
12613
12664
|
"immutable": true,
|
|
12614
12665
|
"locationInModule": {
|
|
12615
12666
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12616
|
-
"line":
|
|
12667
|
+
"line": 93
|
|
12617
12668
|
},
|
|
12618
12669
|
"name": "SDK_2_20_1",
|
|
12619
12670
|
"static": true,
|
|
@@ -12630,7 +12681,7 @@
|
|
|
12630
12681
|
"immutable": true,
|
|
12631
12682
|
"locationInModule": {
|
|
12632
12683
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12633
|
-
"line":
|
|
12684
|
+
"line": 86
|
|
12634
12685
|
},
|
|
12635
12686
|
"name": "SDK_2_20_2",
|
|
12636
12687
|
"static": true,
|
|
@@ -12647,7 +12698,7 @@
|
|
|
12647
12698
|
"immutable": true,
|
|
12648
12699
|
"locationInModule": {
|
|
12649
12700
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12650
|
-
"line":
|
|
12701
|
+
"line": 79
|
|
12651
12702
|
},
|
|
12652
12703
|
"name": "SDK_2_21_0",
|
|
12653
12704
|
"static": true,
|
|
@@ -12664,7 +12715,7 @@
|
|
|
12664
12715
|
"immutable": true,
|
|
12665
12716
|
"locationInModule": {
|
|
12666
12717
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12667
|
-
"line":
|
|
12718
|
+
"line": 72
|
|
12668
12719
|
},
|
|
12669
12720
|
"name": "SDK_2_21_1",
|
|
12670
12721
|
"static": true,
|
|
@@ -12681,7 +12732,7 @@
|
|
|
12681
12732
|
"immutable": true,
|
|
12682
12733
|
"locationInModule": {
|
|
12683
12734
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12684
|
-
"line":
|
|
12735
|
+
"line": 65
|
|
12685
12736
|
},
|
|
12686
12737
|
"name": "SDK_2_22_0",
|
|
12687
12738
|
"static": true,
|
|
@@ -12698,7 +12749,7 @@
|
|
|
12698
12749
|
"immutable": true,
|
|
12699
12750
|
"locationInModule": {
|
|
12700
12751
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12701
|
-
"line":
|
|
12752
|
+
"line": 58
|
|
12702
12753
|
},
|
|
12703
12754
|
"name": "SDK_2_23_0",
|
|
12704
12755
|
"static": true,
|
|
@@ -12715,7 +12766,7 @@
|
|
|
12715
12766
|
"immutable": true,
|
|
12716
12767
|
"locationInModule": {
|
|
12717
12768
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12718
|
-
"line":
|
|
12769
|
+
"line": 51
|
|
12719
12770
|
},
|
|
12720
12771
|
"name": "SDK_2_24_0",
|
|
12721
12772
|
"static": true,
|
|
@@ -12723,6 +12774,74 @@
|
|
|
12723
12774
|
"fqn": "aws-cdk-neuronx-patterns.INeuronxImage"
|
|
12724
12775
|
}
|
|
12725
12776
|
},
|
|
12777
|
+
{
|
|
12778
|
+
"const": true,
|
|
12779
|
+
"docs": {
|
|
12780
|
+
"stability": "stable",
|
|
12781
|
+
"summary": "Neuron SDK 2.25.0."
|
|
12782
|
+
},
|
|
12783
|
+
"immutable": true,
|
|
12784
|
+
"locationInModule": {
|
|
12785
|
+
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12786
|
+
"line": 44
|
|
12787
|
+
},
|
|
12788
|
+
"name": "SDK_2_25_0",
|
|
12789
|
+
"static": true,
|
|
12790
|
+
"type": {
|
|
12791
|
+
"fqn": "aws-cdk-neuronx-patterns.INeuronxImage"
|
|
12792
|
+
}
|
|
12793
|
+
},
|
|
12794
|
+
{
|
|
12795
|
+
"const": true,
|
|
12796
|
+
"docs": {
|
|
12797
|
+
"stability": "stable",
|
|
12798
|
+
"summary": "Neuron SDK 2.26.1."
|
|
12799
|
+
},
|
|
12800
|
+
"immutable": true,
|
|
12801
|
+
"locationInModule": {
|
|
12802
|
+
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12803
|
+
"line": 37
|
|
12804
|
+
},
|
|
12805
|
+
"name": "SDK_2_26_1",
|
|
12806
|
+
"static": true,
|
|
12807
|
+
"type": {
|
|
12808
|
+
"fqn": "aws-cdk-neuronx-patterns.INeuronxImage"
|
|
12809
|
+
}
|
|
12810
|
+
},
|
|
12811
|
+
{
|
|
12812
|
+
"const": true,
|
|
12813
|
+
"docs": {
|
|
12814
|
+
"stability": "stable",
|
|
12815
|
+
"summary": "Neuron SDK 2.27.1."
|
|
12816
|
+
},
|
|
12817
|
+
"immutable": true,
|
|
12818
|
+
"locationInModule": {
|
|
12819
|
+
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12820
|
+
"line": 30
|
|
12821
|
+
},
|
|
12822
|
+
"name": "SDK_2_27_1",
|
|
12823
|
+
"static": true,
|
|
12824
|
+
"type": {
|
|
12825
|
+
"fqn": "aws-cdk-neuronx-patterns.INeuronxImage"
|
|
12826
|
+
}
|
|
12827
|
+
},
|
|
12828
|
+
{
|
|
12829
|
+
"const": true,
|
|
12830
|
+
"docs": {
|
|
12831
|
+
"stability": "stable",
|
|
12832
|
+
"summary": "Neuron SDK 2.28.0."
|
|
12833
|
+
},
|
|
12834
|
+
"immutable": true,
|
|
12835
|
+
"locationInModule": {
|
|
12836
|
+
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
12837
|
+
"line": 23
|
|
12838
|
+
},
|
|
12839
|
+
"name": "SDK_2_28_0",
|
|
12840
|
+
"static": true,
|
|
12841
|
+
"type": {
|
|
12842
|
+
"fqn": "aws-cdk-neuronx-patterns.INeuronxImage"
|
|
12843
|
+
}
|
|
12844
|
+
},
|
|
12726
12845
|
{
|
|
12727
12846
|
"const": true,
|
|
12728
12847
|
"docs": {
|
|
@@ -13217,6 +13336,87 @@
|
|
|
13217
13336
|
],
|
|
13218
13337
|
"symbolId": "src/base/neuronx/neuronx-instance-type:Trainium1Chips"
|
|
13219
13338
|
},
|
|
13339
|
+
"aws-cdk-neuronx-patterns.Trainium2Chips": {
|
|
13340
|
+
"assembly": "aws-cdk-neuronx-patterns",
|
|
13341
|
+
"docs": {
|
|
13342
|
+
"stability": "stable"
|
|
13343
|
+
},
|
|
13344
|
+
"fqn": "aws-cdk-neuronx-patterns.Trainium2Chips",
|
|
13345
|
+
"initializer": {
|
|
13346
|
+
"docs": {
|
|
13347
|
+
"stability": "stable"
|
|
13348
|
+
},
|
|
13349
|
+
"locationInModule": {
|
|
13350
|
+
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
13351
|
+
"line": 34
|
|
13352
|
+
},
|
|
13353
|
+
"parameters": [
|
|
13354
|
+
{
|
|
13355
|
+
"name": "chips",
|
|
13356
|
+
"type": {
|
|
13357
|
+
"primitive": "number"
|
|
13358
|
+
}
|
|
13359
|
+
}
|
|
13360
|
+
]
|
|
13361
|
+
},
|
|
13362
|
+
"interfaces": [
|
|
13363
|
+
"aws-cdk-neuronx-patterns.IAcceleratorChips"
|
|
13364
|
+
],
|
|
13365
|
+
"kind": "class",
|
|
13366
|
+
"locationInModule": {
|
|
13367
|
+
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
13368
|
+
"line": 31
|
|
13369
|
+
},
|
|
13370
|
+
"name": "Trainium2Chips",
|
|
13371
|
+
"properties": [
|
|
13372
|
+
{
|
|
13373
|
+
"docs": {
|
|
13374
|
+
"stability": "stable"
|
|
13375
|
+
},
|
|
13376
|
+
"immutable": true,
|
|
13377
|
+
"locationInModule": {
|
|
13378
|
+
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
13379
|
+
"line": 33
|
|
13380
|
+
},
|
|
13381
|
+
"name": "acceleratorMemory",
|
|
13382
|
+
"overrides": "aws-cdk-neuronx-patterns.IAcceleratorChips",
|
|
13383
|
+
"type": {
|
|
13384
|
+
"fqn": "aws-cdk-lib.Size"
|
|
13385
|
+
}
|
|
13386
|
+
},
|
|
13387
|
+
{
|
|
13388
|
+
"docs": {
|
|
13389
|
+
"stability": "stable"
|
|
13390
|
+
},
|
|
13391
|
+
"immutable": true,
|
|
13392
|
+
"locationInModule": {
|
|
13393
|
+
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
13394
|
+
"line": 34
|
|
13395
|
+
},
|
|
13396
|
+
"name": "chips",
|
|
13397
|
+
"overrides": "aws-cdk-neuronx-patterns.IAcceleratorChips",
|
|
13398
|
+
"type": {
|
|
13399
|
+
"primitive": "number"
|
|
13400
|
+
}
|
|
13401
|
+
},
|
|
13402
|
+
{
|
|
13403
|
+
"docs": {
|
|
13404
|
+
"stability": "stable"
|
|
13405
|
+
},
|
|
13406
|
+
"immutable": true,
|
|
13407
|
+
"locationInModule": {
|
|
13408
|
+
"filename": "src/base/neuronx/neuronx-instance-type.ts",
|
|
13409
|
+
"line": 32
|
|
13410
|
+
},
|
|
13411
|
+
"name": "neuronxCores",
|
|
13412
|
+
"overrides": "aws-cdk-neuronx-patterns.IAcceleratorChips",
|
|
13413
|
+
"type": {
|
|
13414
|
+
"primitive": "number"
|
|
13415
|
+
}
|
|
13416
|
+
}
|
|
13417
|
+
],
|
|
13418
|
+
"symbolId": "src/base/neuronx/neuronx-instance-type:Trainium2Chips"
|
|
13419
|
+
},
|
|
13220
13420
|
"aws-cdk-neuronx-patterns.UvicornLogLevel": {
|
|
13221
13421
|
"assembly": "aws-cdk-neuronx-patterns",
|
|
13222
13422
|
"docs": {
|
|
@@ -13673,7 +13873,7 @@
|
|
|
13673
13873
|
"kind": "class",
|
|
13674
13874
|
"locationInModule": {
|
|
13675
13875
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
13676
|
-
"line":
|
|
13876
|
+
"line": 236
|
|
13677
13877
|
},
|
|
13678
13878
|
"methods": [
|
|
13679
13879
|
{
|
|
@@ -13682,7 +13882,7 @@
|
|
|
13682
13882
|
},
|
|
13683
13883
|
"locationInModule": {
|
|
13684
13884
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
13685
|
-
"line":
|
|
13885
|
+
"line": 291
|
|
13686
13886
|
},
|
|
13687
13887
|
"name": "fromNeuronSdkVersion",
|
|
13688
13888
|
"parameters": [
|
|
@@ -13730,7 +13930,7 @@
|
|
|
13730
13930
|
"immutable": true,
|
|
13731
13931
|
"locationInModule": {
|
|
13732
13932
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
13733
|
-
"line":
|
|
13933
|
+
"line": 289
|
|
13734
13934
|
},
|
|
13735
13935
|
"name": "LATEST",
|
|
13736
13936
|
"static": true,
|
|
@@ -13738,6 +13938,40 @@
|
|
|
13738
13938
|
"fqn": "aws-cdk-neuronx-patterns.IVllmInferenceNeuronxImage"
|
|
13739
13939
|
}
|
|
13740
13940
|
},
|
|
13941
|
+
{
|
|
13942
|
+
"const": true,
|
|
13943
|
+
"docs": {
|
|
13944
|
+
"stability": "stable",
|
|
13945
|
+
"summary": "Neuron SDK 2.24.1 with vLLM 0.7.2."
|
|
13946
|
+
},
|
|
13947
|
+
"immutable": true,
|
|
13948
|
+
"locationInModule": {
|
|
13949
|
+
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
13950
|
+
"line": 282
|
|
13951
|
+
},
|
|
13952
|
+
"name": "SDK_2_24_1",
|
|
13953
|
+
"static": true,
|
|
13954
|
+
"type": {
|
|
13955
|
+
"fqn": "aws-cdk-neuronx-patterns.IVllmInferenceNeuronxImage"
|
|
13956
|
+
}
|
|
13957
|
+
},
|
|
13958
|
+
{
|
|
13959
|
+
"const": true,
|
|
13960
|
+
"docs": {
|
|
13961
|
+
"stability": "stable",
|
|
13962
|
+
"summary": "Neuron SDK 2.25.0 with vLLM 0.9.1."
|
|
13963
|
+
},
|
|
13964
|
+
"immutable": true,
|
|
13965
|
+
"locationInModule": {
|
|
13966
|
+
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
13967
|
+
"line": 275
|
|
13968
|
+
},
|
|
13969
|
+
"name": "SDK_2_25_0",
|
|
13970
|
+
"static": true,
|
|
13971
|
+
"type": {
|
|
13972
|
+
"fqn": "aws-cdk-neuronx-patterns.IVllmInferenceNeuronxImage"
|
|
13973
|
+
}
|
|
13974
|
+
},
|
|
13741
13975
|
{
|
|
13742
13976
|
"const": true,
|
|
13743
13977
|
"docs": {
|
|
@@ -13747,13 +13981,81 @@
|
|
|
13747
13981
|
"immutable": true,
|
|
13748
13982
|
"locationInModule": {
|
|
13749
13983
|
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
13750
|
-
"line":
|
|
13984
|
+
"line": 268
|
|
13751
13985
|
},
|
|
13752
13986
|
"name": "SDK_2_26_0",
|
|
13753
13987
|
"static": true,
|
|
13754
13988
|
"type": {
|
|
13755
13989
|
"fqn": "aws-cdk-neuronx-patterns.IVllmInferenceNeuronxImage"
|
|
13756
13990
|
}
|
|
13991
|
+
},
|
|
13992
|
+
{
|
|
13993
|
+
"const": true,
|
|
13994
|
+
"docs": {
|
|
13995
|
+
"stability": "stable",
|
|
13996
|
+
"summary": "Neuron SDK 2.26.1 with vLLM 0.9.1."
|
|
13997
|
+
},
|
|
13998
|
+
"immutable": true,
|
|
13999
|
+
"locationInModule": {
|
|
14000
|
+
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
14001
|
+
"line": 261
|
|
14002
|
+
},
|
|
14003
|
+
"name": "SDK_2_26_1",
|
|
14004
|
+
"static": true,
|
|
14005
|
+
"type": {
|
|
14006
|
+
"fqn": "aws-cdk-neuronx-patterns.IVllmInferenceNeuronxImage"
|
|
14007
|
+
}
|
|
14008
|
+
},
|
|
14009
|
+
{
|
|
14010
|
+
"const": true,
|
|
14011
|
+
"docs": {
|
|
14012
|
+
"stability": "stable",
|
|
14013
|
+
"summary": "Neuron SDK 2.27.1 with vLLM 0.11.0."
|
|
14014
|
+
},
|
|
14015
|
+
"immutable": true,
|
|
14016
|
+
"locationInModule": {
|
|
14017
|
+
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
14018
|
+
"line": 253
|
|
14019
|
+
},
|
|
14020
|
+
"name": "SDK_2_27_1_VLLM_0_11_0",
|
|
14021
|
+
"static": true,
|
|
14022
|
+
"type": {
|
|
14023
|
+
"fqn": "aws-cdk-neuronx-patterns.IVllmInferenceNeuronxImage"
|
|
14024
|
+
}
|
|
14025
|
+
},
|
|
14026
|
+
{
|
|
14027
|
+
"const": true,
|
|
14028
|
+
"docs": {
|
|
14029
|
+
"stability": "stable",
|
|
14030
|
+
"summary": "Neuron SDK 2.27.1 with vLLM 0.13.0."
|
|
14031
|
+
},
|
|
14032
|
+
"immutable": true,
|
|
14033
|
+
"locationInModule": {
|
|
14034
|
+
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
14035
|
+
"line": 245
|
|
14036
|
+
},
|
|
14037
|
+
"name": "SDK_2_27_1_VLLM_0_13_0",
|
|
14038
|
+
"static": true,
|
|
14039
|
+
"type": {
|
|
14040
|
+
"fqn": "aws-cdk-neuronx-patterns.IVllmInferenceNeuronxImage"
|
|
14041
|
+
}
|
|
14042
|
+
},
|
|
14043
|
+
{
|
|
14044
|
+
"const": true,
|
|
14045
|
+
"docs": {
|
|
14046
|
+
"stability": "stable",
|
|
14047
|
+
"summary": "Neuron SDK 2.28.0 with vLLM 0.13.0."
|
|
14048
|
+
},
|
|
14049
|
+
"immutable": true,
|
|
14050
|
+
"locationInModule": {
|
|
14051
|
+
"filename": "src/base/neuronx/deep-learning-containers.ts",
|
|
14052
|
+
"line": 238
|
|
14053
|
+
},
|
|
14054
|
+
"name": "SDK_2_28_0",
|
|
14055
|
+
"static": true,
|
|
14056
|
+
"type": {
|
|
14057
|
+
"fqn": "aws-cdk-neuronx-patterns.IVllmInferenceNeuronxImage"
|
|
14058
|
+
}
|
|
13757
14059
|
}
|
|
13758
14060
|
],
|
|
13759
14061
|
"symbolId": "src/base/neuronx/deep-learning-containers:VllmInferenceNeuronxImage"
|
|
@@ -15672,7 +15974,7 @@
|
|
|
15672
15974
|
},
|
|
15673
15975
|
"locationInModule": {
|
|
15674
15976
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15675
|
-
"line":
|
|
15977
|
+
"line": 43
|
|
15676
15978
|
},
|
|
15677
15979
|
"parameters": [
|
|
15678
15980
|
{
|
|
@@ -15699,7 +16001,7 @@
|
|
|
15699
16001
|
"kind": "class",
|
|
15700
16002
|
"locationInModule": {
|
|
15701
16003
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15702
|
-
"line":
|
|
16004
|
+
"line": 38
|
|
15703
16005
|
},
|
|
15704
16006
|
"name": "VllmNxdInferenceCompileImage",
|
|
15705
16007
|
"properties": [
|
|
@@ -15711,7 +16013,7 @@
|
|
|
15711
16013
|
"immutable": true,
|
|
15712
16014
|
"locationInModule": {
|
|
15713
16015
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15714
|
-
"line":
|
|
16016
|
+
"line": 42
|
|
15715
16017
|
},
|
|
15716
16018
|
"name": "image",
|
|
15717
16019
|
"overrides": "aws-cdk-neuronx-patterns.VllmNxdInferenceEcsImageBase",
|
|
@@ -15733,7 +16035,7 @@
|
|
|
15733
16035
|
"kind": "interface",
|
|
15734
16036
|
"locationInModule": {
|
|
15735
16037
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15736
|
-
"line":
|
|
16038
|
+
"line": 64
|
|
15737
16039
|
},
|
|
15738
16040
|
"name": "VllmNxdInferenceCompileProps",
|
|
15739
16041
|
"properties": [
|
|
@@ -15746,7 +16048,7 @@
|
|
|
15746
16048
|
"immutable": true,
|
|
15747
16049
|
"locationInModule": {
|
|
15748
16050
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15749
|
-
"line":
|
|
16051
|
+
"line": 72
|
|
15750
16052
|
},
|
|
15751
16053
|
"name": "bucket",
|
|
15752
16054
|
"type": {
|
|
@@ -15762,7 +16064,7 @@
|
|
|
15762
16064
|
"immutable": true,
|
|
15763
16065
|
"locationInModule": {
|
|
15764
16066
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15765
|
-
"line":
|
|
16067
|
+
"line": 80
|
|
15766
16068
|
},
|
|
15767
16069
|
"name": "model",
|
|
15768
16070
|
"type": {
|
|
@@ -15778,7 +16080,7 @@
|
|
|
15778
16080
|
"immutable": true,
|
|
15779
16081
|
"locationInModule": {
|
|
15780
16082
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15781
|
-
"line":
|
|
16083
|
+
"line": 68
|
|
15782
16084
|
},
|
|
15783
16085
|
"name": "vpc",
|
|
15784
16086
|
"type": {
|
|
@@ -15796,7 +16098,7 @@
|
|
|
15796
16098
|
"immutable": true,
|
|
15797
16099
|
"locationInModule": {
|
|
15798
16100
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15799
|
-
"line":
|
|
16101
|
+
"line": 104
|
|
15800
16102
|
},
|
|
15801
16103
|
"name": "environment",
|
|
15802
16104
|
"optional": true,
|
|
@@ -15819,7 +16121,7 @@
|
|
|
15819
16121
|
"immutable": true,
|
|
15820
16122
|
"locationInModule": {
|
|
15821
16123
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15822
|
-
"line":
|
|
16124
|
+
"line": 116
|
|
15823
16125
|
},
|
|
15824
16126
|
"name": "image",
|
|
15825
16127
|
"optional": true,
|
|
@@ -15836,7 +16138,7 @@
|
|
|
15836
16138
|
"immutable": true,
|
|
15837
16139
|
"locationInModule": {
|
|
15838
16140
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15839
|
-
"line":
|
|
16141
|
+
"line": 76
|
|
15840
16142
|
},
|
|
15841
16143
|
"name": "neuronxInstanceType",
|
|
15842
16144
|
"optional": true,
|
|
@@ -15855,7 +16157,7 @@
|
|
|
15855
16157
|
"immutable": true,
|
|
15856
16158
|
"locationInModule": {
|
|
15857
16159
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15858
|
-
"line":
|
|
16160
|
+
"line": 91
|
|
15859
16161
|
},
|
|
15860
16162
|
"name": "spot",
|
|
15861
16163
|
"optional": true,
|
|
@@ -15873,7 +16175,7 @@
|
|
|
15873
16175
|
"immutable": true,
|
|
15874
16176
|
"locationInModule": {
|
|
15875
16177
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15876
|
-
"line":
|
|
16178
|
+
"line": 111
|
|
15877
16179
|
},
|
|
15878
16180
|
"name": "vllmArgs",
|
|
15879
16181
|
"optional": true,
|
|
@@ -15891,7 +16193,7 @@
|
|
|
15891
16193
|
"immutable": true,
|
|
15892
16194
|
"locationInModule": {
|
|
15893
16195
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15894
|
-
"line":
|
|
16196
|
+
"line": 85
|
|
15895
16197
|
},
|
|
15896
16198
|
"name": "volumeSize",
|
|
15897
16199
|
"optional": true,
|
|
@@ -15909,7 +16211,7 @@
|
|
|
15909
16211
|
"immutable": true,
|
|
15910
16212
|
"locationInModule": {
|
|
15911
16213
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15912
|
-
"line":
|
|
16214
|
+
"line": 97
|
|
15913
16215
|
},
|
|
15914
16216
|
"name": "vpcSubnets",
|
|
15915
16217
|
"optional": true,
|
|
@@ -15934,7 +16236,7 @@
|
|
|
15934
16236
|
"kind": "interface",
|
|
15935
16237
|
"locationInModule": {
|
|
15936
16238
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15937
|
-
"line":
|
|
16239
|
+
"line": 122
|
|
15938
16240
|
},
|
|
15939
16241
|
"name": "VllmNxdInferenceCompiledModel",
|
|
15940
16242
|
"properties": [
|
|
@@ -15947,7 +16249,7 @@
|
|
|
15947
16249
|
"immutable": true,
|
|
15948
16250
|
"locationInModule": {
|
|
15949
16251
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15950
|
-
"line":
|
|
16252
|
+
"line": 126
|
|
15951
16253
|
},
|
|
15952
16254
|
"name": "vllmArgs",
|
|
15953
16255
|
"type": {
|
|
@@ -15972,7 +16274,7 @@
|
|
|
15972
16274
|
},
|
|
15973
16275
|
"locationInModule": {
|
|
15974
16276
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
15975
|
-
"line":
|
|
16277
|
+
"line": 136
|
|
15976
16278
|
},
|
|
15977
16279
|
"parameters": [
|
|
15978
16280
|
{
|
|
@@ -15998,7 +16300,7 @@
|
|
|
15998
16300
|
"kind": "class",
|
|
15999
16301
|
"locationInModule": {
|
|
16000
16302
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
16001
|
-
"line":
|
|
16303
|
+
"line": 133
|
|
16002
16304
|
},
|
|
16003
16305
|
"methods": [
|
|
16004
16306
|
{
|
|
@@ -16009,7 +16311,7 @@
|
|
|
16009
16311
|
},
|
|
16010
16312
|
"locationInModule": {
|
|
16011
16313
|
"filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
|
|
16012
|
-
"line":
|
|
16314
|
+
"line": 251
|
|
16013
16315
|
},
|
|
16014
16316
|
"name": "compile",
|
|
16015
16317
|
"returns": {
|
|
@@ -16919,6 +17221,6 @@
|
|
|
16919
17221
|
"symbolId": "src/base/server-engine/vllm-engine/vllm-engine-argments:VllmTask"
|
|
16920
17222
|
}
|
|
16921
17223
|
},
|
|
16922
|
-
"version": "0.
|
|
16923
|
-
"fingerprint": "
|
|
17224
|
+
"version": "0.2.1",
|
|
17225
|
+
"fingerprint": "rmWh4Yidj/K2VX7stt6PQSQkVTyMLNqwdBOhr/rmLZQ="
|
|
16924
17226
|
}
|