aws-cdk-neuronx-patterns 0.0.20 → 0.0.22

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/.jsii CHANGED
@@ -4038,7 +4038,7 @@
4038
4038
  },
4039
4039
  "locationInModule": {
4040
4040
  "filename": "src/base/aws-ecs-patterns/application-load-balanced-neuronx-service.ts",
4041
- "line": 119
4041
+ "line": 120
4042
4042
  },
4043
4043
  "parameters": [
4044
4044
  {
@@ -4064,7 +4064,7 @@
4064
4064
  "kind": "class",
4065
4065
  "locationInModule": {
4066
4066
  "filename": "src/base/aws-ecs-patterns/application-load-balanced-neuronx-service.ts",
4067
- "line": 118
4067
+ "line": 119
4068
4068
  },
4069
4069
  "name": "ApplicationLoadBalancedNeuronxService",
4070
4070
  "symbolId": "src/base/aws-ecs-patterns/application-load-balanced-neuronx-service:ApplicationLoadBalancedNeuronxService"
@@ -4082,7 +4082,7 @@
4082
4082
  "kind": "interface",
4083
4083
  "locationInModule": {
4084
4084
  "filename": "src/base/aws-ecs-patterns/application-load-balanced-neuronx-service.ts",
4085
- "line": 116
4085
+ "line": 117
4086
4086
  },
4087
4087
  "name": "ApplicationLoadBalancedNeuronxServiceProps",
4088
4088
  "symbolId": "src/base/aws-ecs-patterns/application-load-balanced-neuronx-service:ApplicationLoadBalancedNeuronxServiceProps"
@@ -4103,7 +4103,7 @@
4103
4103
  },
4104
4104
  "locationInModule": {
4105
4105
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
4106
- "line": 184
4106
+ "line": 200
4107
4107
  },
4108
4108
  "parameters": [
4109
4109
  {
@@ -4129,7 +4129,7 @@
4129
4129
  "kind": "class",
4130
4130
  "locationInModule": {
4131
4131
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
4132
- "line": 178
4132
+ "line": 194
4133
4133
  },
4134
4134
  "name": "ApplicationLoadBalancedVllmNxDInferenceService",
4135
4135
  "properties": [
@@ -4140,7 +4140,7 @@
4140
4140
  "immutable": true,
4141
4141
  "locationInModule": {
4142
4142
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
4143
- "line": 180
4143
+ "line": 196
4144
4144
  },
4145
4145
  "name": "listener",
4146
4146
  "type": {
@@ -4154,7 +4154,7 @@
4154
4154
  "immutable": true,
4155
4155
  "locationInModule": {
4156
4156
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
4157
- "line": 179
4157
+ "line": 195
4158
4158
  },
4159
4159
  "name": "loadBalancer",
4160
4160
  "type": {
@@ -4168,7 +4168,7 @@
4168
4168
  "immutable": true,
4169
4169
  "locationInModule": {
4170
4170
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
4171
- "line": 182
4171
+ "line": 198
4172
4172
  },
4173
4173
  "name": "service",
4174
4174
  "type": {
@@ -4182,7 +4182,7 @@
4182
4182
  "immutable": true,
4183
4183
  "locationInModule": {
4184
4184
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
4185
- "line": 181
4185
+ "line": 197
4186
4186
  },
4187
4187
  "name": "targetGroup",
4188
4188
  "type": {
@@ -4196,7 +4196,7 @@
4196
4196
  "immutable": true,
4197
4197
  "locationInModule": {
4198
4198
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
4199
- "line": 183
4199
+ "line": 199
4200
4200
  },
4201
4201
  "name": "taskDefinition",
4202
4202
  "type": {
@@ -4220,7 +4220,7 @@
4220
4220
  "kind": "interface",
4221
4221
  "locationInModule": {
4222
4222
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
4223
- "line": 153
4223
+ "line": 169
4224
4224
  },
4225
4225
  "name": "ApplicationLoadBalancedVllmNxDInferenceServiceProps",
4226
4226
  "symbolId": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns:ApplicationLoadBalancedVllmNxDInferenceServiceProps"
@@ -6501,7 +6501,7 @@
6501
6501
  },
6502
6502
  "locationInModule": {
6503
6503
  "filename": "src/base/neuronx-compiler/neuronx-compiler.ts",
6504
- "line": 283
6504
+ "line": 286
6505
6505
  },
6506
6506
  "name": "compile",
6507
6507
  "returns": {
@@ -6926,7 +6926,7 @@
6926
6926
  },
6927
6927
  "locationInModule": {
6928
6928
  "filename": "src/base/aws-ecs-patterns/application-load-balanced-neuronx-service.ts",
6929
- "line": 92
6929
+ "line": 93
6930
6930
  },
6931
6931
  "name": "addContainerWithDefault",
6932
6932
  "parameters": [
@@ -10492,7 +10492,7 @@
10492
10492
  },
10493
10493
  "locationInModule": {
10494
10494
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10495
- "line": 40
10495
+ "line": 43
10496
10496
  },
10497
10497
  "parameters": [
10498
10498
  {
@@ -10500,13 +10500,20 @@
10500
10500
  "type": {
10501
10501
  "fqn": "aws-cdk-neuronx-patterns.INeuronxImage"
10502
10502
  }
10503
+ },
10504
+ {
10505
+ "name": "options",
10506
+ "optional": true,
10507
+ "type": {
10508
+ "fqn": "aws-cdk-neuronx-patterns.VllmNxdInferenceImageOptions"
10509
+ }
10503
10510
  }
10504
10511
  ]
10505
10512
  },
10506
10513
  "kind": "class",
10507
10514
  "locationInModule": {
10508
10515
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10509
- "line": 35
10516
+ "line": 38
10510
10517
  },
10511
10518
  "name": "VllmNxdInferenceCompileImage",
10512
10519
  "properties": [
@@ -10518,7 +10525,7 @@
10518
10525
  "immutable": true,
10519
10526
  "locationInModule": {
10520
10527
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10521
- "line": 39
10528
+ "line": 42
10522
10529
  },
10523
10530
  "name": "image",
10524
10531
  "overrides": "aws-cdk-neuronx-patterns.VllmNxdInferenceImageBase",
@@ -10540,7 +10547,7 @@
10540
10547
  "kind": "interface",
10541
10548
  "locationInModule": {
10542
10549
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10543
- "line": 58
10550
+ "line": 65
10544
10551
  },
10545
10552
  "name": "VllmNxdInferenceCompileProps",
10546
10553
  "properties": [
@@ -10553,7 +10560,7 @@
10553
10560
  "immutable": true,
10554
10561
  "locationInModule": {
10555
10562
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10556
- "line": 66
10563
+ "line": 73
10557
10564
  },
10558
10565
  "name": "bucket",
10559
10566
  "type": {
@@ -10569,7 +10576,7 @@
10569
10576
  "immutable": true,
10570
10577
  "locationInModule": {
10571
10578
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10572
- "line": 74
10579
+ "line": 81
10573
10580
  },
10574
10581
  "name": "model",
10575
10582
  "type": {
@@ -10585,7 +10592,7 @@
10585
10592
  "immutable": true,
10586
10593
  "locationInModule": {
10587
10594
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10588
- "line": 62
10595
+ "line": 69
10589
10596
  },
10590
10597
  "name": "vpc",
10591
10598
  "type": {
@@ -10603,7 +10610,7 @@
10603
10610
  "immutable": true,
10604
10611
  "locationInModule": {
10605
10612
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10606
- "line": 98
10613
+ "line": 105
10607
10614
  },
10608
10615
  "name": "environment",
10609
10616
  "optional": true,
@@ -10626,7 +10633,7 @@
10626
10633
  "immutable": true,
10627
10634
  "locationInModule": {
10628
10635
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10629
- "line": 110
10636
+ "line": 117
10630
10637
  },
10631
10638
  "name": "image",
10632
10639
  "optional": true,
@@ -10643,7 +10650,7 @@
10643
10650
  "immutable": true,
10644
10651
  "locationInModule": {
10645
10652
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10646
- "line": 70
10653
+ "line": 77
10647
10654
  },
10648
10655
  "name": "neuronxInstanceType",
10649
10656
  "optional": true,
@@ -10662,7 +10669,7 @@
10662
10669
  "immutable": true,
10663
10670
  "locationInModule": {
10664
10671
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10665
- "line": 85
10672
+ "line": 92
10666
10673
  },
10667
10674
  "name": "spot",
10668
10675
  "optional": true,
@@ -10680,7 +10687,7 @@
10680
10687
  "immutable": true,
10681
10688
  "locationInModule": {
10682
10689
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10683
- "line": 105
10690
+ "line": 112
10684
10691
  },
10685
10692
  "name": "vllmArgs",
10686
10693
  "optional": true,
@@ -10698,7 +10705,7 @@
10698
10705
  "immutable": true,
10699
10706
  "locationInModule": {
10700
10707
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10701
- "line": 79
10708
+ "line": 86
10702
10709
  },
10703
10710
  "name": "volumeSize",
10704
10711
  "optional": true,
@@ -10716,7 +10723,7 @@
10716
10723
  "immutable": true,
10717
10724
  "locationInModule": {
10718
10725
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10719
- "line": 91
10726
+ "line": 98
10720
10727
  },
10721
10728
  "name": "vpcSubnets",
10722
10729
  "optional": true,
@@ -10741,7 +10748,7 @@
10741
10748
  "kind": "interface",
10742
10749
  "locationInModule": {
10743
10750
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10744
- "line": 116
10751
+ "line": 123
10745
10752
  },
10746
10753
  "name": "VllmNxdInferenceCompiledModel",
10747
10754
  "properties": [
@@ -10754,7 +10761,7 @@
10754
10761
  "immutable": true,
10755
10762
  "locationInModule": {
10756
10763
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10757
- "line": 120
10764
+ "line": 127
10758
10765
  },
10759
10766
  "name": "vllmArgs",
10760
10767
  "type": {
@@ -10779,7 +10786,7 @@
10779
10786
  },
10780
10787
  "locationInModule": {
10781
10788
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10782
- "line": 130
10789
+ "line": 137
10783
10790
  },
10784
10791
  "parameters": [
10785
10792
  {
@@ -10805,7 +10812,7 @@
10805
10812
  "kind": "class",
10806
10813
  "locationInModule": {
10807
10814
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10808
- "line": 127
10815
+ "line": 134
10809
10816
  },
10810
10817
  "methods": [
10811
10818
  {
@@ -10816,7 +10823,7 @@
10816
10823
  },
10817
10824
  "locationInModule": {
10818
10825
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-compiler.ts",
10819
- "line": 244
10826
+ "line": 251
10820
10827
  },
10821
10828
  "name": "compile",
10822
10829
  "returns": {
@@ -10844,7 +10851,7 @@
10844
10851
  },
10845
10852
  "locationInModule": {
10846
10853
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
10847
- "line": 53
10854
+ "line": 65
10848
10855
  },
10849
10856
  "parameters": [
10850
10857
  {
@@ -10852,13 +10859,20 @@
10852
10859
  "type": {
10853
10860
  "fqn": "aws-cdk-neuronx-patterns.INeuronxImage"
10854
10861
  }
10862
+ },
10863
+ {
10864
+ "name": "options",
10865
+ "optional": true,
10866
+ "type": {
10867
+ "fqn": "aws-cdk-neuronx-patterns.VllmNxdInferenceImageOptions"
10868
+ }
10855
10869
  }
10856
10870
  ]
10857
10871
  },
10858
10872
  "kind": "class",
10859
10873
  "locationInModule": {
10860
10874
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
10861
- "line": 51
10875
+ "line": 63
10862
10876
  },
10863
10877
  "name": "VllmNxdInferenceImage",
10864
10878
  "properties": [
@@ -10870,7 +10884,7 @@
10870
10884
  "immutable": true,
10871
10885
  "locationInModule": {
10872
10886
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
10873
- "line": 52
10887
+ "line": 64
10874
10888
  },
10875
10889
  "name": "image",
10876
10890
  "overrides": "aws-cdk-neuronx-patterns.VllmNxdInferenceImageBase",
@@ -10895,7 +10909,7 @@
10895
10909
  },
10896
10910
  "locationInModule": {
10897
10911
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
10898
- "line": 35
10912
+ "line": 49
10899
10913
  },
10900
10914
  "parameters": [
10901
10915
  {
@@ -10903,6 +10917,13 @@
10903
10917
  "type": {
10904
10918
  "fqn": "aws-cdk-neuronx-patterns.INeuronxImage"
10905
10919
  }
10920
+ },
10921
+ {
10922
+ "name": "options",
10923
+ "optional": true,
10924
+ "type": {
10925
+ "fqn": "aws-cdk-neuronx-patterns.VllmNxdInferenceImageOptions"
10926
+ }
10906
10927
  }
10907
10928
  ]
10908
10929
  },
@@ -10912,7 +10933,7 @@
10912
10933
  "kind": "class",
10913
10934
  "locationInModule": {
10914
10935
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
10915
- "line": 24
10936
+ "line": 28
10916
10937
  },
10917
10938
  "name": "VllmNxdInferenceImageBase",
10918
10939
  "properties": [
@@ -10925,7 +10946,7 @@
10925
10946
  "immutable": true,
10926
10947
  "locationInModule": {
10927
10948
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
10928
- "line": 30
10949
+ "line": 34
10929
10950
  },
10930
10951
  "name": "image",
10931
10952
  "overrides": "aws-cdk-neuronx-patterns.INeuronxContainerImage",
@@ -10941,7 +10962,7 @@
10941
10962
  "immutable": true,
10942
10963
  "locationInModule": {
10943
10964
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
10944
- "line": 34
10965
+ "line": 48
10945
10966
  },
10946
10967
  "name": "sdkVersion",
10947
10968
  "overrides": "aws-cdk-neuronx-patterns.INeuronxContainerImage",
@@ -10953,21 +10974,86 @@
10953
10974
  "docs": {
10954
10975
  "see": "https://github.com/aws-neuron/upstreaming-to-vllm",
10955
10976
  "stability": "stable",
10956
- "summary": "The Git branch name for aws-neuron/upstreaming-to-vllm."
10977
+ "summary": "The Git branch name of aws-neuron/upstreaming-to-vllm."
10957
10978
  },
10958
10979
  "immutable": true,
10959
10980
  "locationInModule": {
10960
10981
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
10961
- "line": 42
10982
+ "line": 39
10962
10983
  },
10963
10984
  "name": "vllmGitBranch",
10964
10985
  "type": {
10965
10986
  "primitive": "string"
10966
10987
  }
10988
+ },
10989
+ {
10990
+ "docs": {
10991
+ "see": "https://github.com/aws-neuron/upstreaming-to-vllm",
10992
+ "stability": "stable",
10993
+ "summary": "The Git commit hash of aws-neuron/upstreaming-to-vllm."
10994
+ },
10995
+ "immutable": true,
10996
+ "locationInModule": {
10997
+ "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
10998
+ "line": 44
10999
+ },
11000
+ "name": "vllmGitCommitHash",
11001
+ "type": {
11002
+ "primitive": "string"
11003
+ }
10967
11004
  }
10968
11005
  ],
10969
11006
  "symbolId": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns:VllmNxdInferenceImageBase"
10970
11007
  },
11008
+ "aws-cdk-neuronx-patterns.VllmNxdInferenceImageOptions": {
11009
+ "assembly": "aws-cdk-neuronx-patterns",
11010
+ "datatype": true,
11011
+ "docs": {
11012
+ "stability": "stable"
11013
+ },
11014
+ "fqn": "aws-cdk-neuronx-patterns.VllmNxdInferenceImageOptions",
11015
+ "kind": "interface",
11016
+ "locationInModule": {
11017
+ "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
11018
+ "line": 21
11019
+ },
11020
+ "name": "VllmNxdInferenceImageOptions",
11021
+ "properties": [
11022
+ {
11023
+ "abstract": true,
11024
+ "docs": {
11025
+ "stability": "stable"
11026
+ },
11027
+ "immutable": true,
11028
+ "locationInModule": {
11029
+ "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
11030
+ "line": 22
11031
+ },
11032
+ "name": "vllmGitBranch",
11033
+ "optional": true,
11034
+ "type": {
11035
+ "primitive": "string"
11036
+ }
11037
+ },
11038
+ {
11039
+ "abstract": true,
11040
+ "docs": {
11041
+ "stability": "stable"
11042
+ },
11043
+ "immutable": true,
11044
+ "locationInModule": {
11045
+ "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
11046
+ "line": 23
11047
+ },
11048
+ "name": "vllmGitCommitHash",
11049
+ "optional": true,
11050
+ "type": {
11051
+ "primitive": "string"
11052
+ }
11053
+ }
11054
+ ],
11055
+ "symbolId": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns:VllmNxdInferenceImageOptions"
11056
+ },
10971
11057
  "aws-cdk-neuronx-patterns.VllmNxdInferenceTaskDefinition": {
10972
11058
  "assembly": "aws-cdk-neuronx-patterns",
10973
11059
  "base": "aws-cdk-neuronx-patterns.NeuronxTaskDefinition",
@@ -10982,7 +11068,7 @@
10982
11068
  },
10983
11069
  "locationInModule": {
10984
11070
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
10985
- "line": 97
11071
+ "line": 113
10986
11072
  },
10987
11073
  "parameters": [
10988
11074
  {
@@ -11008,7 +11094,7 @@
11008
11094
  "kind": "class",
11009
11095
  "locationInModule": {
11010
11096
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
11011
- "line": 96
11097
+ "line": 112
11012
11098
  },
11013
11099
  "name": "VllmNxdInferenceTaskDefinition",
11014
11100
  "symbolId": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns:VllmNxdInferenceTaskDefinition"
@@ -11027,7 +11113,7 @@
11027
11113
  "kind": "interface",
11028
11114
  "locationInModule": {
11029
11115
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
11030
- "line": 71
11116
+ "line": 87
11031
11117
  },
11032
11118
  "name": "VllmNxdInferenceTaskDefinitionProps",
11033
11119
  "properties": [
@@ -11040,7 +11126,7 @@
11040
11126
  "immutable": true,
11041
11127
  "locationInModule": {
11042
11128
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
11043
- "line": 76
11129
+ "line": 92
11044
11130
  },
11045
11131
  "name": "compiledModel",
11046
11132
  "type": {
@@ -11058,7 +11144,7 @@
11058
11144
  "immutable": true,
11059
11145
  "locationInModule": {
11060
11146
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
11061
- "line": 88
11147
+ "line": 104
11062
11148
  },
11063
11149
  "name": "environment",
11064
11150
  "optional": true,
@@ -11081,7 +11167,7 @@
11081
11167
  "immutable": true,
11082
11168
  "locationInModule": {
11083
11169
  "filename": "src/vllm-nxd-inference/vllm-nxd-inference-ecs-patterns.ts",
11084
- "line": 81
11170
+ "line": 97
11085
11171
  },
11086
11172
  "name": "image",
11087
11173
  "optional": true,
@@ -11688,6 +11774,6 @@
11688
11774
  "symbolId": "src/base/server-engine/vllm-engine/vllm-engine-argments:VllmTask"
11689
11775
  }
11690
11776
  },
11691
- "version": "0.0.20",
11692
- "fingerprint": "rP1a2UZz0ejn2Fu3GTWzGI80QivXWfxxkp0ZcLOUbbU="
11777
+ "version": "0.0.22",
11778
+ "fingerprint": "IkS0IrcyTruVx/Q04gb1v4zfnLZrcRTr1ZQrhmALyuU="
11693
11779
  }