flyteplugins-vllm 2.0.0b43__py3-none-any.whl → 2.0.0b45__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- flyteplugins/vllm/_app_environment.py +5 -1
- flyteplugins/vllm/_constants.py +2 -0
- flyteplugins/vllm/_model_loader/shim.py +14 -2
- {flyteplugins_vllm-2.0.0b43.dist-info → flyteplugins_vllm-2.0.0b45.dist-info}/METADATA +2 -2
- flyteplugins_vllm-2.0.0b45.dist-info/RECORD +11 -0
- flyteplugins_vllm-2.0.0b43.dist-info/RECORD +0 -10
- {flyteplugins_vllm-2.0.0b43.dist-info → flyteplugins_vllm-2.0.0b45.dist-info}/WHEEL +0 -0
- {flyteplugins_vllm-2.0.0b43.dist-info → flyteplugins_vllm-2.0.0b45.dist-info}/entry_points.txt +0 -0
- {flyteplugins_vllm-2.0.0b43.dist-info → flyteplugins_vllm-2.0.0b45.dist-info}/top_level.txt +0 -0
|
@@ -11,13 +11,17 @@ from flyte.app import Parameter, RunOutput
|
|
|
11
11
|
from flyte.app._types import Port
|
|
12
12
|
from flyte.models import SerializationContext
|
|
13
13
|
|
|
14
|
+
from flyteplugins.vllm._constants import VLLM_MIN_VERSION_STR
|
|
15
|
+
|
|
14
16
|
DEFAULT_VLLM_IMAGE = (
|
|
15
|
-
flyte.Image.from_debian_base(name="vllm-app-image"
|
|
17
|
+
flyte.Image.from_debian_base(name="vllm-app-image")
|
|
16
18
|
# install flashinfer and vllm
|
|
17
19
|
.with_pip_packages("flashinfer-python", "flashinfer-cubin")
|
|
18
20
|
.with_pip_packages("flashinfer-jit-cache", index_url="https://flashinfer.ai/whl/cu129")
|
|
19
21
|
# install the vllm flyte plugin
|
|
20
22
|
.with_pip_packages("flyteplugins-vllm", pre=True)
|
|
23
|
+
# install vllm in a separate layer due to dependency conflict with flyte (protovalidate)
|
|
24
|
+
.with_pip_packages(f"vllm>={VLLM_MIN_VERSION_STR}")
|
|
21
25
|
)
|
|
22
26
|
|
|
23
27
|
|
|
@@ -2,14 +2,26 @@ import logging
|
|
|
2
2
|
from typing import Generator
|
|
3
3
|
|
|
4
4
|
import torch
|
|
5
|
-
import vllm
|
|
6
|
-
import vllm.entrypoints.cli.main
|
|
7
5
|
from flyte.app.extras._model_loader.config import (
|
|
8
6
|
LOCAL_MODEL_PATH,
|
|
9
7
|
REMOTE_MODEL_PATH,
|
|
10
8
|
STREAM_SAFETENSORS,
|
|
11
9
|
)
|
|
12
10
|
from flyte.app.extras._model_loader.loader import SafeTensorsStreamer, prefetch
|
|
11
|
+
|
|
12
|
+
from flyteplugins.vllm._constants import VLLM_MIN_VERSION, VLLM_MIN_VERSION_STR
|
|
13
|
+
|
|
14
|
+
try:
|
|
15
|
+
import vllm
|
|
16
|
+
except ImportError:
|
|
17
|
+
raise ImportError(f"vllm is not installed. Please install 'vllm>={VLLM_MIN_VERSION_STR}', to use the model loader.")
|
|
18
|
+
|
|
19
|
+
if tuple([int(part) for part in vllm.__version__.split(".") if part.isdigit()]) < VLLM_MIN_VERSION:
|
|
20
|
+
raise ImportError(
|
|
21
|
+
f"vllm version >={VLLM_MIN_VERSION_STR} required, but found {vllm.__version__}. Please upgrade vllm."
|
|
22
|
+
)
|
|
23
|
+
|
|
24
|
+
import vllm.entrypoints.cli.main
|
|
13
25
|
from vllm.config import ModelConfig, VllmConfig
|
|
14
26
|
from vllm.distributed import get_tensor_model_parallel_rank
|
|
15
27
|
from vllm.model_executor.model_loader import register_model_loader
|
|
@@ -1,11 +1,11 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: flyteplugins-vllm
|
|
3
|
-
Version: 2.0.0b43
|
|
3
|
+
Version: 2.0.0b45
|
|
4
4
|
Summary: vLLM plugin for flyte
|
|
5
5
|
Author-email: Niels Bantilan <cosmicbboy@users.noreply.github.com>
|
|
6
6
|
Requires-Python: >=3.10
|
|
7
7
|
Description-Content-Type: text/markdown
|
|
8
|
-
Requires-Dist:
|
|
8
|
+
Requires-Dist: flyte>=2.0.0b43
|
|
9
9
|
|
|
10
10
|
# Union vLLM Plugin
|
|
11
11
|
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
flyteplugins/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
2
|
+
flyteplugins/vllm/__init__.py,sha256=FhdW2e_f6PsGo4wyV07jradAFbg7WmB0Luz3zHIDd7A,100
|
|
3
|
+
flyteplugins/vllm/_app_environment.py,sha256=4cfbX9ZCXMDjAk2PSWZRkSqZLTrMZJteK_nBN1MDoe0,8263
|
|
4
|
+
flyteplugins/vllm/_constants.py,sha256=I8suY7mz05kyvaW0Zskv_Zw0y7Gf0E4wjWm88cdjttU,90
|
|
5
|
+
flyteplugins/vllm/_model_loader/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
6
|
+
flyteplugins/vllm/_model_loader/shim.py,sha256=ANgEgTTLOhrCd0xIePsjah__gWcPQawLS_oq7RWa0X4,5825
|
|
7
|
+
flyteplugins_vllm-2.0.0b45.dist-info/METADATA,sha256=YIKWiM7Go4RuqldcESslLFMvNqQib1aWQsDD3rglTfM,1580
|
|
8
|
+
flyteplugins_vllm-2.0.0b45.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
9
|
+
flyteplugins_vllm-2.0.0b45.dist-info/entry_points.txt,sha256=lC-uwvkaytwtzbkJWdS69np63yLAakaDpI4mV1Yp9l8,74
|
|
10
|
+
flyteplugins_vllm-2.0.0b45.dist-info/top_level.txt,sha256=cgd779rPu9EsvdtuYgUxNHHgElaQvPn74KhB5XSeMBE,13
|
|
11
|
+
flyteplugins_vllm-2.0.0b45.dist-info/RECORD,,
|
|
@@ -1,10 +0,0 @@
|
|
|
1
|
-
flyteplugins/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
2
|
-
flyteplugins/vllm/__init__.py,sha256=FhdW2e_f6PsGo4wyV07jradAFbg7WmB0Luz3zHIDd7A,100
|
|
3
|
-
flyteplugins/vllm/_app_environment.py,sha256=-luoJak9FC4K8vs5JB34kXRnu3ms_ou2whQi64uCNrk,8075
|
|
4
|
-
flyteplugins/vllm/_model_loader/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
5
|
-
flyteplugins/vllm/_model_loader/shim.py,sha256=tQAyA7bwuR98fs4eLFiqOmIUGrVrbf5pfbPGmljWeDo,5352
|
|
6
|
-
flyteplugins_vllm-2.0.0b43.dist-info/METADATA,sha256=fPWhq_-KsLCH62UKYo_7zVCdq6t_bvELpU5f4CtIAdg,1577
|
|
7
|
-
flyteplugins_vllm-2.0.0b43.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
8
|
-
flyteplugins_vllm-2.0.0b43.dist-info/entry_points.txt,sha256=lC-uwvkaytwtzbkJWdS69np63yLAakaDpI4mV1Yp9l8,74
|
|
9
|
-
flyteplugins_vllm-2.0.0b43.dist-info/top_level.txt,sha256=cgd779rPu9EsvdtuYgUxNHHgElaQvPn74KhB5XSeMBE,13
|
|
10
|
-
flyteplugins_vllm-2.0.0b43.dist-info/RECORD,,
|
|
File without changes
|
{flyteplugins_vllm-2.0.0b43.dist-info → flyteplugins_vllm-2.0.0b45.dist-info}/entry_points.txt
RENAMED
|
File without changes
|
|
File without changes
|