flyteplugins-vllm 2.0.0b43__py3-none-any.whl → 2.0.0b45__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -11,13 +11,17 @@ from flyte.app import Parameter, RunOutput
11
11
  from flyte.app._types import Port
12
12
  from flyte.models import SerializationContext
13
13
 
14
+ from flyteplugins.vllm._constants import VLLM_MIN_VERSION_STR
15
+
14
16
  DEFAULT_VLLM_IMAGE = (
15
- flyte.Image.from_debian_base(name="vllm-app-image", python_version=(3, 12))
17
+ flyte.Image.from_debian_base(name="vllm-app-image")
16
18
  # install flashinfer and vllm
17
19
  .with_pip_packages("flashinfer-python", "flashinfer-cubin")
18
20
  .with_pip_packages("flashinfer-jit-cache", index_url="https://flashinfer.ai/whl/cu129")
19
21
  # install the vllm flyte plugin
20
22
  .with_pip_packages("flyteplugins-vllm", pre=True)
23
+ # install vllm in a separate layer due to dependency conflict with flyte (protovalidate)
24
+ .with_pip_packages(f"vllm>={VLLM_MIN_VERSION_STR}")
21
25
  )
22
26
 
23
27
 
@@ -0,0 +1,2 @@
1
+ VLLM_MIN_VERSION = (0, 11, 0)
2
+ VLLM_MIN_VERSION_STR = ".".join(map(str, VLLM_MIN_VERSION))
@@ -2,14 +2,26 @@ import logging
2
2
  from typing import Generator
3
3
 
4
4
  import torch
5
- import vllm
6
- import vllm.entrypoints.cli.main
7
5
  from flyte.app.extras._model_loader.config import (
8
6
  LOCAL_MODEL_PATH,
9
7
  REMOTE_MODEL_PATH,
10
8
  STREAM_SAFETENSORS,
11
9
  )
12
10
  from flyte.app.extras._model_loader.loader import SafeTensorsStreamer, prefetch
11
+
12
+ from flyteplugins.vllm._constants import VLLM_MIN_VERSION, VLLM_MIN_VERSION_STR
13
+
14
+ try:
15
+ import vllm
16
+ except ImportError:
17
+ raise ImportError(f"vllm is not installed. Please install 'vllm>={VLLM_MIN_VERSION_STR}', to use the model loader.")
18
+
19
+ if tuple([int(part) for part in vllm.__version__.split(".") if part.isdigit()]) < VLLM_MIN_VERSION:
20
+ raise ImportError(
21
+ f"vllm version >={VLLM_MIN_VERSION_STR} required, but found {vllm.__version__}. Please upgrade vllm."
22
+ )
23
+
24
+ import vllm.entrypoints.cli.main
13
25
  from vllm.config import ModelConfig, VllmConfig
14
26
  from vllm.distributed import get_tensor_model_parallel_rank
15
27
  from vllm.model_executor.model_loader import register_model_loader
@@ -1,11 +1,11 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: flyteplugins-vllm
3
- Version: 2.0.0b43
3
+ Version: 2.0.0b45
4
4
  Summary: vLLM plugin for flyte
5
5
  Author-email: Niels Bantilan <cosmicbboy@users.noreply.github.com>
6
6
  Requires-Python: >=3.10
7
7
  Description-Content-Type: text/markdown
8
- Requires-Dist: vllm>=0.11.0
8
+ Requires-Dist: flyte>=2.0.0b43
9
9
 
10
10
  # Union vLLM Plugin
11
11
 
@@ -0,0 +1,11 @@
1
+ flyteplugins/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
2
+ flyteplugins/vllm/__init__.py,sha256=FhdW2e_f6PsGo4wyV07jradAFbg7WmB0Luz3zHIDd7A,100
3
+ flyteplugins/vllm/_app_environment.py,sha256=4cfbX9ZCXMDjAk2PSWZRkSqZLTrMZJteK_nBN1MDoe0,8263
4
+ flyteplugins/vllm/_constants.py,sha256=I8suY7mz05kyvaW0Zskv_Zw0y7Gf0E4wjWm88cdjttU,90
5
+ flyteplugins/vllm/_model_loader/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
6
+ flyteplugins/vllm/_model_loader/shim.py,sha256=ANgEgTTLOhrCd0xIePsjah__gWcPQawLS_oq7RWa0X4,5825
7
+ flyteplugins_vllm-2.0.0b45.dist-info/METADATA,sha256=YIKWiM7Go4RuqldcESslLFMvNqQib1aWQsDD3rglTfM,1580
8
+ flyteplugins_vllm-2.0.0b45.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
9
+ flyteplugins_vllm-2.0.0b45.dist-info/entry_points.txt,sha256=lC-uwvkaytwtzbkJWdS69np63yLAakaDpI4mV1Yp9l8,74
10
+ flyteplugins_vllm-2.0.0b45.dist-info/top_level.txt,sha256=cgd779rPu9EsvdtuYgUxNHHgElaQvPn74KhB5XSeMBE,13
11
+ flyteplugins_vllm-2.0.0b45.dist-info/RECORD,,
@@ -1,10 +0,0 @@
1
- flyteplugins/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
2
- flyteplugins/vllm/__init__.py,sha256=FhdW2e_f6PsGo4wyV07jradAFbg7WmB0Luz3zHIDd7A,100
3
- flyteplugins/vllm/_app_environment.py,sha256=-luoJak9FC4K8vs5JB34kXRnu3ms_ou2whQi64uCNrk,8075
4
- flyteplugins/vllm/_model_loader/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
5
- flyteplugins/vllm/_model_loader/shim.py,sha256=tQAyA7bwuR98fs4eLFiqOmIUGrVrbf5pfbPGmljWeDo,5352
6
- flyteplugins_vllm-2.0.0b43.dist-info/METADATA,sha256=fPWhq_-KsLCH62UKYo_7zVCdq6t_bvELpU5f4CtIAdg,1577
7
- flyteplugins_vllm-2.0.0b43.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
8
- flyteplugins_vllm-2.0.0b43.dist-info/entry_points.txt,sha256=lC-uwvkaytwtzbkJWdS69np63yLAakaDpI4mV1Yp9l8,74
9
- flyteplugins_vllm-2.0.0b43.dist-info/top_level.txt,sha256=cgd779rPu9EsvdtuYgUxNHHgElaQvPn74KhB5XSeMBE,13
10
- flyteplugins_vllm-2.0.0b43.dist-info/RECORD,,