PyPI - xinference - Versions diffs - 1.7.1__py3-none-any.whl → 1.8.0__py3-none-any.whl - Mend

xinference 1.7.1__py3-none-any.whl → 1.8.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of xinference might be problematic. Click here for more details.

Files changed (136)

xinference/_version.py +3 -3
xinference/client/restful/async_restful_client.py +8 -13
xinference/client/restful/restful_client.py +6 -2
xinference/core/chat_interface.py +6 -4
xinference/core/media_interface.py +5 -0
xinference/core/model.py +1 -5
xinference/core/supervisor.py +117 -68
xinference/core/worker.py +49 -37
xinference/deploy/test/test_cmdline.py +2 -6
xinference/model/audio/__init__.py +26 -23
xinference/model/audio/chattts.py +3 -2
xinference/model/audio/core.py +49 -98
xinference/model/audio/cosyvoice.py +3 -2
xinference/model/audio/custom.py +28 -73
xinference/model/audio/f5tts.py +3 -2
xinference/model/audio/f5tts_mlx.py +3 -2
xinference/model/audio/fish_speech.py +3 -2
xinference/model/audio/funasr.py +17 -4
xinference/model/audio/kokoro.py +3 -2
xinference/model/audio/megatts.py +3 -2
xinference/model/audio/melotts.py +3 -2
xinference/model/audio/model_spec.json +572 -171
xinference/model/audio/utils.py +0 -6
xinference/model/audio/whisper.py +3 -2
xinference/model/audio/whisper_mlx.py +3 -2
xinference/model/cache_manager.py +141 -0
xinference/model/core.py +6 -49
xinference/model/custom.py +174 -0
xinference/model/embedding/__init__.py +67 -56
xinference/model/embedding/cache_manager.py +35 -0
xinference/model/embedding/core.py +104 -84
xinference/model/embedding/custom.py +55 -78
xinference/model/embedding/embed_family.py +80 -31
xinference/model/embedding/flag/core.py +21 -5
xinference/model/embedding/llama_cpp/__init__.py +0 -0
xinference/model/embedding/llama_cpp/core.py +234 -0
xinference/model/embedding/model_spec.json +968 -103
xinference/model/embedding/sentence_transformers/core.py +30 -20
xinference/model/embedding/vllm/core.py +11 -5
xinference/model/flexible/__init__.py +8 -2
xinference/model/flexible/core.py +26 -119
xinference/model/flexible/custom.py +69 -0
xinference/model/flexible/launchers/image_process_launcher.py +1 -0
xinference/model/flexible/launchers/modelscope_launcher.py +5 -1
xinference/model/flexible/launchers/transformers_launcher.py +15 -3
xinference/model/flexible/launchers/yolo_launcher.py +5 -1
xinference/model/image/__init__.py +20 -20
xinference/model/image/cache_manager.py +62 -0
xinference/model/image/core.py +70 -182
xinference/model/image/custom.py +28 -72
xinference/model/image/model_spec.json +402 -119
xinference/model/image/ocr/got_ocr2.py +3 -2
xinference/model/image/stable_diffusion/core.py +22 -7
xinference/model/image/stable_diffusion/mlx.py +6 -6
xinference/model/image/utils.py +2 -2
xinference/model/llm/__init__.py +71 -94
xinference/model/llm/cache_manager.py +292 -0
xinference/model/llm/core.py +37 -111
xinference/model/llm/custom.py +88 -0
xinference/model/llm/llama_cpp/core.py +5 -7
xinference/model/llm/llm_family.json +16260 -8151
xinference/model/llm/llm_family.py +138 -839
xinference/model/llm/lmdeploy/core.py +5 -7
xinference/model/llm/memory.py +3 -4
xinference/model/llm/mlx/core.py +6 -8
xinference/model/llm/reasoning_parser.py +3 -1
xinference/model/llm/sglang/core.py +32 -14
xinference/model/llm/transformers/chatglm.py +3 -7
xinference/model/llm/transformers/core.py +49 -27
xinference/model/llm/transformers/deepseek_v2.py +2 -2
xinference/model/llm/transformers/gemma3.py +2 -2
xinference/model/llm/transformers/multimodal/cogagent.py +2 -2
xinference/model/llm/transformers/multimodal/deepseek_vl2.py +2 -2
xinference/model/llm/transformers/multimodal/gemma3.py +2 -2
xinference/model/llm/transformers/multimodal/glm4_1v.py +167 -0
xinference/model/llm/transformers/multimodal/glm4v.py +2 -2
xinference/model/llm/transformers/multimodal/intern_vl.py +2 -2
xinference/model/llm/transformers/multimodal/minicpmv26.py +3 -3
xinference/model/llm/transformers/multimodal/ovis2.py +2 -2
xinference/model/llm/transformers/multimodal/qwen-omni.py +2 -2
xinference/model/llm/transformers/multimodal/qwen2_audio.py +2 -2
xinference/model/llm/transformers/multimodal/qwen2_vl.py +2 -2
xinference/model/llm/transformers/opt.py +3 -7
xinference/model/llm/utils.py +34 -49
xinference/model/llm/vllm/core.py +77 -27
xinference/model/llm/vllm/xavier/engine.py +5 -3
xinference/model/llm/vllm/xavier/scheduler.py +10 -6
xinference/model/llm/vllm/xavier/transfer.py +1 -1
xinference/model/rerank/__init__.py +26 -25
xinference/model/rerank/core.py +47 -87
xinference/model/rerank/custom.py +25 -71
xinference/model/rerank/model_spec.json +158 -33
xinference/model/rerank/utils.py +2 -2
xinference/model/utils.py +115 -54
xinference/model/video/__init__.py +13 -17
xinference/model/video/core.py +44 -102
xinference/model/video/diffusers.py +4 -3
xinference/model/video/model_spec.json +90 -21
xinference/types.py +5 -3
xinference/web/ui/build/asset-manifest.json +3 -3
xinference/web/ui/build/index.html +1 -1
xinference/web/ui/build/static/js/main.7d24df53.js +3 -0
xinference/web/ui/build/static/js/main.7d24df53.js.map +1 -0
xinference/web/ui/node_modules/.cache/babel-loader/2704ff66a5f73ca78b341eb3edec60154369df9d87fbc8c6dd60121abc5e1b0a.json +1 -0
xinference/web/ui/node_modules/.cache/babel-loader/607dfef23d33e6b594518c0c6434567639f24f356b877c80c60575184ec50ed0.json +1 -0
xinference/web/ui/node_modules/.cache/babel-loader/9be3d56173aacc3efd0b497bcb13c4f6365de30069176ee9403b40e717542326.json +1 -0
xinference/web/ui/node_modules/.cache/babel-loader/9f9dd6c32c78a222d07da5987ae902effe16bcf20aac00774acdccc4de3c9ff2.json +1 -0
xinference/web/ui/node_modules/.cache/babel-loader/b2ab5ee972c60d15eb9abf5845705f8ab7e1d125d324d9a9b1bcae5d6fd7ffb2.json +1 -0
xinference/web/ui/src/locales/en.json +0 -1
xinference/web/ui/src/locales/ja.json +0 -1
xinference/web/ui/src/locales/ko.json +0 -1
xinference/web/ui/src/locales/zh.json +0 -1
{xinference-1.7.1.dist-info → xinference-1.8.0.dist-info}/METADATA +9 -11
{xinference-1.7.1.dist-info → xinference-1.8.0.dist-info}/RECORD +119 -119
xinference/model/audio/model_spec_modelscope.json +0 -231
xinference/model/embedding/model_spec_modelscope.json +0 -293
xinference/model/embedding/utils.py +0 -18
xinference/model/image/model_spec_modelscope.json +0 -375
xinference/model/llm/llama_cpp/memory.py +0 -457
xinference/model/llm/llm_family_csghub.json +0 -56
xinference/model/llm/llm_family_modelscope.json +0 -8700
xinference/model/llm/llm_family_openmind_hub.json +0 -1019
xinference/model/rerank/model_spec_modelscope.json +0 -85
xinference/model/video/model_spec_modelscope.json +0 -184
xinference/web/ui/build/static/js/main.9b12b7f9.js +0 -3
xinference/web/ui/build/static/js/main.9b12b7f9.js.map +0 -1
xinference/web/ui/node_modules/.cache/babel-loader/1460361af6975e63576708039f1cb732faf9c672d97c494d4055fc6331460be0.json +0 -1
xinference/web/ui/node_modules/.cache/babel-loader/4efd8dda58fda83ed9546bf2f587df67f8d98e639117bee2d9326a9a1d9bebb2.json +0 -1
xinference/web/ui/node_modules/.cache/babel-loader/55b9fb40b57fa926e8f05f31c2f96467e76e5ad62f033dca97c03f9e8c4eb4fe.json +0 -1
xinference/web/ui/node_modules/.cache/babel-loader/5b2dafe5aa9e1105e0244a2b6751807342fa86aa0144b4e84d947a1686102715.json +0 -1
xinference/web/ui/node_modules/.cache/babel-loader/611fa2c6c53b66039991d06dfb0473b5ab37fc63b4564e0f6e1718523768a045.json +0 -1
/xinference/web/ui/build/static/js/{main.9b12b7f9.js.LICENSE.txt → main.7d24df53.js.LICENSE.txt} +0 -0
{xinference-1.7.1.dist-info → xinference-1.8.0.dist-info}/WHEEL +0 -0
{xinference-1.7.1.dist-info → xinference-1.8.0.dist-info}/entry_points.txt +0 -0
{xinference-1.7.1.dist-info → xinference-1.8.0.dist-info}/licenses/LICENSE +0 -0
{xinference-1.7.1.dist-info → xinference-1.8.0.dist-info}/top_level.txt +0 -0

xinference/model/image/core.py CHANGED Viewed

@@ -14,30 +14,21 @@
 import collections.abc
 import logging
-import os
 import platform
 from collections import defaultdict
-from typing import Dict, List, Literal, Optional, Tuple, Union
+from typing import Dict, List, Literal, Optional, Union
-from ...constants import XINFERENCE_CACHE_DIR
 from ...types import PeftModelConfig
-from ..core import CacheableModelSpec, ModelDescription, VirtualEnvSettings
-from ..utils import (
-    IS_NEW_HUGGINGFACE_HUB,
-    retry_download,
-    symlink_local_file,
-    valid_model_revision,
-)
+from ..core import CacheableModelSpec, VirtualEnvSettings
+from ..utils import ModelInstanceInfoMixin
 from .ocr.got_ocr2 import GotOCR2Model
 from .stable_diffusion.core import DiffusionModel
 from .stable_diffusion.mlx import MLXDiffusionModel
 logger = logging.getLogger(__name__)
-MODEL_NAME_TO_REVISION: Dict[str, List[str]] = defaultdict(list)
 IMAGE_MODEL_DESCRIPTIONS: Dict[str, List[Dict]] = defaultdict(list)
-BUILTIN_IMAGE_MODELS: Dict[str, "ImageModelFamilyV1"] = {}
-MODELSCOPE_IMAGE_MODELS: Dict[str, "ImageModelFamilyV1"] = {}
+BUILTIN_IMAGE_MODELS: Dict[str, List["ImageModelFamilyV2"]] = {}
 def get_image_model_descriptions():
@@ -46,14 +37,15 @@ def get_image_model_descriptions():
     return copy.deepcopy(IMAGE_MODEL_DESCRIPTIONS)
-class ImageModelFamilyV1(CacheableModelSpec):
+class ImageModelFamilyV2(CacheableModelSpec, ModelInstanceInfoMixin):
+    version: Literal[2] = 2
     model_family: str
     model_name: str
     model_id: str
     model_revision: str
     model_hub: str = "huggingface"
     model_ability: Optional[List[str]]
-    controlnet: Optional[List["ImageModelFamilyV1"]]
+    controlnet: Optional[List["ImageModelFamilyV2"]]
     default_model_config: Optional[dict] = {}
     default_generate_config: Optional[dict] = {}
     gguf_model_id: Optional[str]
@@ -61,65 +53,48 @@ class ImageModelFamilyV1(CacheableModelSpec):
     gguf_model_file_name_template: Optional[str]
     virtualenv: Optional[VirtualEnvSettings]
+    class Config:
+        extra = "allow"
-class ImageModelDescription(ModelDescription):
-    def __init__(
-        self,
-        address: Optional[str],
-        devices: Optional[List[str]],
-        model_spec: ImageModelFamilyV1,
-        model_path: Optional[str] = None,
-    ):
-        super().__init__(address, devices, model_path=model_path)
-        self._model_spec = model_spec
-    @property
-    def spec(self):
-        return self._model_spec
-    def to_dict(self):
-        if self._model_spec.controlnet is not None:
-            controlnet = [cn.dict() for cn in self._model_spec.controlnet]
+    def to_description(self):
+        if self.controlnet is not None:
+            controlnet = [cn.dict() for cn in self.controlnet]
         else:
-            controlnet = self._model_spec.controlnet
+            controlnet = self.controlnet
         return {
             "model_type": "image",
-            "address": self.address,
-            "accelerators": self.devices,
-            "model_name": self._model_spec.model_name,
-            "model_family": self._model_spec.model_family,
-            "model_revision": self._model_spec.model_revision,
-            "model_ability": self._model_spec.model_ability,
+            "address": getattr(self, "address", None),
+            "accelerators": getattr(self, "accelerators", None),
+            "model_name": self.model_name,
+            "model_family": self.model_family,
+            "model_revision": self.model_revision,
+            "model_ability": self.model_ability,
             "controlnet": controlnet,
         }
     def to_version_info(self):
+        from .cache_manager import ImageCacheManager
         from .utils import get_model_version
-        if self._model_path is None:
-            is_cached = get_cache_status(self._model_spec)
-            file_location = get_cache_dir(self._model_spec)
-        else:
-            is_cached = True
-            file_location = self._model_path
+        cache_manager = ImageCacheManager(self)
-        if self._model_spec.controlnet is None:
+        if not self.controlnet:
             return [
                 {
-                    "model_version": get_model_version(self._model_spec, None),
-                    "model_file_location": file_location,
-                    "cache_status": is_cached,
+                    "model_version": get_model_version(self, None),
+                    "model_file_location": cache_manager.get_cache_dir(),
+                    "cache_status": cache_manager.get_cache_status(),
                     "controlnet": "zoe-depth",
                 }
             ]
         else:
             res = []
-            for cn in self._model_spec.controlnet:
+            for cn in self.controlnet:
                 res.append(
                     {
-                        "model_version": get_model_version(self._model_spec, cn),
-                        "model_file_location": file_location,
-                        "cache_status": is_cached,
+                        "model_version": get_model_version(self, cn),
+                        "model_file_location": cache_manager.get_cache_dir(),
+                        "cache_status": cache_manager.get_cache_status(),
                         "controlnet": cn.model_name,
                     }
                 )
@@ -127,12 +102,10 @@ class ImageModelDescription(ModelDescription):
 def generate_image_description(
-    image_model: ImageModelFamilyV1,
+    image_model: ImageModelFamilyV2,
 ) -> Dict[str, List[Dict]]:
     res = defaultdict(list)
-    res[image_model.model_name].extend(
-        ImageModelDescription(None, None, image_model).to_version_info()
-    )
+    res[image_model.model_name].extend(image_model.to_version_info())
     return res
@@ -141,27 +114,35 @@ def match_diffusion(
     download_hub: Optional[
         Literal["huggingface", "modelscope", "openmind_hub", "csghub"]
     ] = None,
-) -> ImageModelFamilyV1:
+) -> ImageModelFamilyV2:
     from ..utils import download_from_modelscope
-    from . import BUILTIN_IMAGE_MODELS, MODELSCOPE_IMAGE_MODELS
+    from . import BUILTIN_IMAGE_MODELS
     from .custom import get_user_defined_images
     for model_spec in get_user_defined_images():
         if model_spec.model_name == model_name:
             return model_spec
-    if download_hub == "modelscope" and model_name in MODELSCOPE_IMAGE_MODELS:
-        logger.debug(f"Image model {model_name} found in ModelScope.")
-        return MODELSCOPE_IMAGE_MODELS[model_name]
-    elif download_hub == "huggingface" and model_name in BUILTIN_IMAGE_MODELS:
-        logger.debug(f"Image model {model_name} found in Huggingface.")
-        return BUILTIN_IMAGE_MODELS[model_name]
-    elif download_from_modelscope() and model_name in MODELSCOPE_IMAGE_MODELS:
-        logger.debug(f"Image model {model_name} found in ModelScope.")
-        return MODELSCOPE_IMAGE_MODELS[model_name]
-    elif model_name in BUILTIN_IMAGE_MODELS:
-        logger.debug(f"Image model {model_name} found in Huggingface.")
-        return BUILTIN_IMAGE_MODELS[model_name]
+    if model_name in BUILTIN_IMAGE_MODELS:
+        if download_hub == "modelscope" or download_from_modelscope():
+            return (
+                [
+                    x
+                    for x in BUILTIN_IMAGE_MODELS[model_name]
+                    if x.model_hub == "modelscope"
+                ]
+                + [
+                    x
+                    for x in BUILTIN_IMAGE_MODELS[model_name]
+                    if x.model_hub == "huggingface"
+                ]
+            )[0]
+        else:
+            return [
+                x
+                for x in BUILTIN_IMAGE_MODELS[model_name]
+                if x.model_hub == "huggingface"
+            ][0]
     else:
         raise ValueError(
             f"Image model {model_name} not found, available"
@@ -169,117 +150,27 @@ def match_diffusion(
         )
-def cache(model_spec: ImageModelFamilyV1):
-    from ..utils import cache
-    return cache(model_spec, ImageModelDescription)
-def get_cache_dir(model_spec: ImageModelFamilyV1):
-    return os.path.realpath(os.path.join(XINFERENCE_CACHE_DIR, model_spec.model_name))
-def get_cache_status(
-    model_spec: ImageModelFamilyV1,
-) -> bool:
-    cache_dir = get_cache_dir(model_spec)
-    meta_path = os.path.join(cache_dir, "__valid_download")
-    model_name = model_spec.model_name
-    if model_name in BUILTIN_IMAGE_MODELS and model_name in MODELSCOPE_IMAGE_MODELS:
-        hf_spec = BUILTIN_IMAGE_MODELS[model_name]
-        ms_spec = MODELSCOPE_IMAGE_MODELS[model_name]
-        return any(
-            [
-                valid_model_revision(meta_path, hf_spec.model_revision),
-                valid_model_revision(meta_path, ms_spec.model_revision),
-            ]
-        )
-    else:  # Usually for UT
-        return valid_model_revision(meta_path, model_spec.model_revision)
-def cache_gguf(spec: ImageModelFamilyV1, quantization: Optional[str] = None):
-    if not quantization:
-        return
-    cache_dir = os.path.realpath(os.path.join(XINFERENCE_CACHE_DIR, spec.model_name))
-    if not os.path.exists(cache_dir):
-        os.makedirs(cache_dir, exist_ok=True)
-    if not spec.gguf_model_file_name_template:
-        raise NotImplementedError(
-            f"{spec.model_name} does not support GGUF quantization"
-        )
-    if quantization not in (spec.gguf_quantizations or []):
-        raise ValueError(
-            f"Cannot support quantization {quantization}, "
-            f"available quantizations: {spec.gguf_quantizations}"
-        )
-    filename = spec.gguf_model_file_name_template.format(quantization=quantization)  # type: ignore
-    full_path = os.path.join(cache_dir, filename)
-    if spec.model_hub == "huggingface":
-        import huggingface_hub
-        use_symlinks = {}
-        if not IS_NEW_HUGGINGFACE_HUB:
-            use_symlinks = {"local_dir_use_symlinks": True, "local_dir": cache_dir}
-        download_file_path = retry_download(
-            huggingface_hub.hf_hub_download,
-            spec.model_name,
-            None,
-            spec.gguf_model_id,
-            filename=filename,
-            **use_symlinks,
-        )
-        if IS_NEW_HUGGINGFACE_HUB:
-            symlink_local_file(download_file_path, cache_dir, filename)
-    elif spec.model_hub == "modelscope":
-        from modelscope.hub.file_download import model_file_download
-        download_file_path = retry_download(
-            model_file_download,
-            spec.model_name,
-            None,
-            spec.gguf_model_id,
-            filename,
-            revision=spec.model_revision,
-        )
-        symlink_local_file(download_file_path, cache_dir, filename)
-    else:
-        raise NotImplementedError
-    return full_path
 def create_ocr_model_instance(
-    subpool_addr: str,
-    devices: List[str],
     model_uid: str,
-    model_spec: ImageModelFamilyV1,
+    model_spec: ImageModelFamilyV2,
     model_path: Optional[str] = None,
     **kwargs,
-) -> Tuple[GotOCR2Model, ImageModelDescription]:
+) -> GotOCR2Model:
+    from .cache_manager import ImageCacheManager
     if not model_path:
-        model_path = cache(model_spec)
+        cache_manager = ImageCacheManager(model_spec)
+        model_path = cache_manager.cache()
     model = GotOCR2Model(
         model_uid,
         model_path,
         model_spec=model_spec,
         **kwargs,
     )
-    model_description = ImageModelDescription(
-        subpool_addr, devices, model_spec, model_path=model_path
-    )
-    return model, model_description
+    return model
 def create_image_model_instance(
-    subpool_addr: str,
-    devices: List[str],
     model_uid: str,
     model_name: str,
     peft_model_config: Optional[PeftModelConfig] = None,
@@ -290,14 +181,12 @@ def create_image_model_instance(
     gguf_quantization: Optional[str] = None,
     gguf_model_path: Optional[str] = None,
     **kwargs,
-) -> Tuple[
-    Union[DiffusionModel, MLXDiffusionModel, GotOCR2Model], ImageModelDescription
-]:
+) -> Union[DiffusionModel, MLXDiffusionModel, GotOCR2Model]:
+    from .cache_manager import ImageCacheManager
     model_spec = match_diffusion(model_name, download_hub)
     if model_spec.model_ability and "ocr" in model_spec.model_ability:
         return create_ocr_model_instance(
-            subpool_addr=subpool_addr,
-            devices=devices,
             model_uid=model_uid,
             model_name=model_name,
             model_spec=model_spec,
@@ -327,7 +216,8 @@ def create_image_model_instance(
         for name in controlnet:
             for cn_model_spec in model_spec.controlnet:
                 if cn_model_spec.model_name == name:
-                    controlnet_model_path = cache(cn_model_spec)
+                    cn_cache_manager = ImageCacheManager(cn_model_spec)
+                    controlnet_model_path = cn_cache_manager.cache()
                     controlnet_model_paths.append(controlnet_model_path)
                     break
             else:
@@ -340,10 +230,11 @@ def create_image_model_instance(
             kwargs["controlnet"] = [
                 (n, path) for n, path in zip(controlnet, controlnet_model_paths)
             ]
+    cache_manager = ImageCacheManager(model_spec)
     if not model_path:
-        model_path = cache(model_spec)
+        model_path = cache_manager.cache()
     if not gguf_model_path and gguf_quantization:
-        gguf_model_path = cache_gguf(model_spec, gguf_quantization)
+        gguf_model_path = cache_manager.cache_gguf(gguf_quantization)
     if peft_model_config is not None:
         lora_model = peft_model_config.peft_model
         lora_load_kwargs = peft_model_config.image_lora_load_kwargs
@@ -356,7 +247,7 @@ def create_image_model_instance(
     if (
         platform.system() == "Darwin"
         and "arm" in platform.machine().lower()
-        and model_name in MLXDiffusionModel.supported_models
+        and MLXDiffusionModel.support_model(model_name)
     ):
         # Mac with M series silicon chips
         model_cls = MLXDiffusionModel
@@ -373,7 +264,4 @@ def create_image_model_instance(
         gguf_model_path=gguf_model_path,
         **kwargs,
     )
-    model_description = ImageModelDescription(
-        subpool_addr, devices, model_spec, model_path=model_path
-    )
-    return model, model_description
+    return model

xinference/model/image/custom.py CHANGED Viewed

@@ -11,98 +11,54 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 import logging
-import os
-from threading import Lock
 from typing import List, Optional
-from ...constants import XINFERENCE_CACHE_DIR, XINFERENCE_MODEL_DIR
-from .core import ImageModelFamilyV1
+from ..._compat import Literal
+from ..custom import ModelRegistry
+from .core import ImageModelFamilyV2
 logger = logging.getLogger(__name__)
-UD_IMAGE_LOCK = Lock()
-class CustomImageModelFamilyV1(ImageModelFamilyV1):
+class CustomImageModelFamilyV2(ImageModelFamilyV2):
+    version: Literal[2] = 2
     model_id: Optional[str]  # type: ignore
     model_revision: Optional[str]  # type: ignore
     model_uri: Optional[str]
-    controlnet: Optional[List["CustomImageModelFamilyV1"]]
+    controlnet: Optional[List["CustomImageModelFamilyV2"]]
+UD_IMAGES: List[CustomImageModelFamilyV2] = []
-UD_IMAGES: List[CustomImageModelFamilyV1] = []
+class ImageModelRegistry(ModelRegistry):
+    model_type = "image"
-def get_user_defined_images() -> List[ImageModelFamilyV1]:
-    with UD_IMAGE_LOCK:
-        return UD_IMAGES.copy()
+    def __init__(self):
+        from .core import BUILTIN_IMAGE_MODELS
+        super().__init__()
+        self.models = UD_IMAGES
+        self.builtin_models = list(BUILTIN_IMAGE_MODELS.keys())
-def register_image(model_spec: CustomImageModelFamilyV1, persist: bool):
-    from ..utils import is_valid_model_name, is_valid_model_uri
-    from . import BUILTIN_IMAGE_MODELS, MODELSCOPE_IMAGE_MODELS
-    if not is_valid_model_name(model_spec.model_name):
-        raise ValueError(f"Invalid model name {model_spec.model_name}.")
+def get_user_defined_images() -> List[ImageModelFamilyV2]:
+    from ..custom import RegistryManager
-    model_uri = model_spec.model_uri
-    if model_uri and not is_valid_model_uri(model_uri):
-        raise ValueError(f"Invalid model URI {model_uri}")
+    registry = RegistryManager.get_registry("image")
+    return registry.get_custom_models()
-    with UD_IMAGE_LOCK:
-        for model_name in (
-            list(BUILTIN_IMAGE_MODELS.keys())
-            + list(MODELSCOPE_IMAGE_MODELS.keys())
-            + [spec.model_name for spec in UD_IMAGES]
-        ):
-            if model_spec.model_name == model_name:
-                raise ValueError(
-                    f"Model name conflicts with existing model {model_spec.model_name}"
-                )
-        UD_IMAGES.append(model_spec)
-    if persist:
-        persist_path = os.path.join(
-            XINFERENCE_MODEL_DIR, "image", f"{model_spec.model_name}.json"
-        )
-        os.makedirs(os.path.dirname(persist_path), exist_ok=True)
-        with open(persist_path, "w") as f:
-            f.write(model_spec.json())
+def register_image(model_spec: CustomImageModelFamilyV2, persist: bool):
+    from ..custom import RegistryManager
+    registry = RegistryManager.get_registry("image")
+    registry.register(model_spec, persist)
 def unregister_image(model_name: str, raise_error: bool = True):
-    with UD_IMAGE_LOCK:
-        model_spec = None
-        for i, f in enumerate(UD_IMAGES):
-            if f.model_name == model_name:
-                model_spec = f
-                break
-        if model_spec:
-            UD_IMAGES.remove(model_spec)
-            persist_path = os.path.join(
-                XINFERENCE_MODEL_DIR, "image", f"{model_spec.model_id}.json"
-            )
-            if os.path.exists(persist_path):
-                os.remove(persist_path)
-            cache_dir = os.path.join(XINFERENCE_CACHE_DIR, model_spec.model_name)
-            if os.path.exists(cache_dir):
-                logger.warning(
-                    f"Remove the cache of user-defined model {model_spec.model_name}. "
-                    f"Cache directory: {cache_dir}"
-                )
-                if os.path.islink(cache_dir):
-                    os.remove(cache_dir)
-                else:
-                    logger.warning(
-                        f"Cache directory is not a soft link, please remove it manually."
-                    )
-        else:
-            if raise_error:
-                raise ValueError(f"Model {model_name} not found.")
-            else:
-                logger.warning(f"Custom image model {model_name} not found.")
+    from ..custom import RegistryManager
+    registry = RegistryManager.get_registry("image")
+    registry.unregister(model_name, raise_error)

xinference 1.7.1__py3-none-any.whl → 1.8.0__py3-none-any.whl

Potentially problematic release.

xinference 1.7.1__py3-none-any.whl → 1.8.0__py3-none-any.whl