optimum-rbln 0.1.13__py3-none-any.whl → 0.2.0__py3-none-any.whl

This diff shows the changes between publicly released versions of the package as published to a supported registry. It is provided for informational purposes only.
Files changed (103)
  1. optimum/rbln/__init__.py +41 -38
  2. optimum/rbln/__version__.py +16 -1
  3. optimum/rbln/diffusers/__init__.py +26 -2
  4. optimum/rbln/{modeling_diffusers.py → diffusers/modeling_diffusers.py} +97 -126
  5. optimum/rbln/diffusers/models/__init__.py +36 -3
  6. optimum/rbln/{transformers/generation → diffusers/models/autoencoders}/__init__.py +1 -2
  7. optimum/rbln/diffusers/models/{autoencoder_kl.py → autoencoders/autoencoder_kl.py} +73 -61
  8. optimum/rbln/diffusers/models/autoencoders/vae.py +83 -0
  9. optimum/rbln/diffusers/models/controlnet.py +54 -14
  10. optimum/rbln/diffusers/models/transformers/__init__.py +24 -0
  11. optimum/rbln/diffusers/models/transformers/transformer_sd3.py +203 -0
  12. optimum/rbln/diffusers/models/unets/__init__.py +24 -0
  13. optimum/rbln/diffusers/models/{unet_2d_condition.py → unets/unet_2d_condition.py} +82 -22
  14. optimum/rbln/diffusers/pipelines/__init__.py +23 -2
  15. optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py +13 -33
  16. optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py +17 -2
  17. optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +18 -2
  18. optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +18 -2
  19. optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +18 -2
  20. optimum/rbln/diffusers/pipelines/stable_diffusion/__init__.py +1 -0
  21. optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py +2 -2
  22. optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py +1 -13
  23. optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_inpaint.py +31 -0
  24. optimum/rbln/diffusers/pipelines/stable_diffusion_3/__init__.py +26 -0
  25. optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py +31 -0
  26. optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py +31 -0
  27. optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py +31 -0
  28. optimum/rbln/diffusers/pipelines/stable_diffusion_xl/__init__.py +24 -0
  29. optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py +15 -8
  30. optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py +15 -8
  31. optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py +31 -0
  32. optimum/rbln/modeling.py +238 -0
  33. optimum/rbln/modeling_base.py +186 -760
  34. optimum/rbln/modeling_config.py +31 -7
  35. optimum/rbln/ops/__init__.py +26 -0
  36. optimum/rbln/ops/attn.py +221 -0
  37. optimum/rbln/ops/flash_attn.py +70 -0
  38. optimum/rbln/ops/kv_cache_update.py +69 -0
  39. optimum/rbln/transformers/__init__.py +20 -2
  40. optimum/rbln/{modeling_alias.py → transformers/modeling_alias.py} +5 -1
  41. optimum/rbln/transformers/modeling_generic.py +385 -0
  42. optimum/rbln/transformers/models/auto/__init__.py +23 -0
  43. optimum/rbln/transformers/models/auto/auto_factory.py +117 -23
  44. optimum/rbln/transformers/models/auto/modeling_auto.py +36 -12
  45. optimum/rbln/transformers/models/bart/__init__.py +0 -1
  46. optimum/rbln/transformers/models/bart/bart_architecture.py +107 -464
  47. optimum/rbln/transformers/models/bart/modeling_bart.py +10 -9
  48. optimum/rbln/transformers/models/bert/modeling_bert.py +3 -6
  49. optimum/rbln/transformers/models/clip/modeling_clip.py +8 -25
  50. optimum/rbln/transformers/models/decoderonly/__init__.py +0 -10
  51. optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py +775 -514
  52. optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +128 -260
  53. optimum/rbln/transformers/models/dpt/modeling_dpt.py +1 -1
  54. optimum/rbln/transformers/models/exaone/exaone_architecture.py +60 -45
  55. optimum/rbln/transformers/models/exaone/modeling_exaone.py +4 -2
  56. optimum/rbln/transformers/models/gemma/gemma_architecture.py +33 -104
  57. optimum/rbln/transformers/models/gpt2/gpt2_architecture.py +50 -238
  58. optimum/rbln/transformers/models/gpt2/modeling_gpt2.py +3 -2
  59. optimum/rbln/transformers/models/llama/llama_architecture.py +0 -1
  60. optimum/rbln/transformers/models/llava_next/modeling_llava_next.py +3 -75
  61. optimum/rbln/transformers/models/midm/midm_architecture.py +84 -238
  62. optimum/rbln/transformers/models/midm/modeling_midm.py +5 -6
  63. optimum/rbln/transformers/models/mistral/mistral_architecture.py +0 -1
  64. optimum/rbln/transformers/models/phi/phi_architecture.py +60 -261
  65. optimum/rbln/transformers/models/qwen2/qwen2_architecture.py +0 -1
  66. optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py +58 -103
  67. optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py +498 -0
  68. optimum/rbln/transformers/models/t5/__init__.py +0 -1
  69. optimum/rbln/transformers/models/t5/modeling_t5.py +106 -5
  70. optimum/rbln/transformers/models/t5/t5_architecture.py +106 -448
  71. optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py +1 -1
  72. optimum/rbln/transformers/models/whisper/generation_whisper.py +42 -0
  73. optimum/rbln/transformers/models/whisper/modeling_whisper.py +78 -55
  74. optimum/rbln/transformers/models/whisper/whisper_architecture.py +219 -312
  75. optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py +3 -35
  76. optimum/rbln/transformers/utils/rbln_quantization.py +120 -4
  77. optimum/rbln/utils/decorator_utils.py +51 -11
  78. optimum/rbln/utils/hub.py +131 -0
  79. optimum/rbln/utils/import_utils.py +22 -1
  80. optimum/rbln/utils/logging.py +37 -0
  81. optimum/rbln/utils/model_utils.py +52 -0
  82. optimum/rbln/utils/runtime_utils.py +10 -4
  83. optimum/rbln/utils/save_utils.py +17 -0
  84. optimum/rbln/utils/submodule.py +137 -0
  85. optimum_rbln-0.2.0.dist-info/METADATA +117 -0
  86. optimum_rbln-0.2.0.dist-info/RECORD +114 -0
  87. {optimum_rbln-0.1.13.dist-info → optimum_rbln-0.2.0.dist-info}/WHEEL +1 -1
  88. optimum_rbln-0.2.0.dist-info/licenses/LICENSE +288 -0
  89. optimum/rbln/transformers/cache_utils.py +0 -107
  90. optimum/rbln/transformers/generation/streamers.py +0 -139
  91. optimum/rbln/transformers/generation/utils.py +0 -397
  92. optimum/rbln/transformers/models/exaone/hf_hub_cached/configuration_exaone.py +0 -181
  93. optimum/rbln/transformers/models/exaone/hf_hub_cached/modeling_exaone.py +0 -1725
  94. optimum/rbln/transformers/models/midm/hf_hub_cached/configuration_midm.py +0 -22
  95. optimum/rbln/transformers/models/midm/hf_hub_cached/midm_bitext_tokenization.py +0 -304
  96. optimum/rbln/transformers/models/midm/hf_hub_cached/modeling_midm.py +0 -1469
  97. optimum/rbln/transformers/models/midm/hf_hub_cached/rotary_position_embedding.py +0 -98
  98. optimum/rbln/utils/context.py +0 -58
  99. optimum/rbln/utils/timer_utils.py +0 -43
  100. optimum_rbln-0.1.13.dist-info/METADATA +0 -120
  101. optimum_rbln-0.1.13.dist-info/RECORD +0 -107
  102. optimum_rbln-0.1.13.dist-info/entry_points.txt +0 -4
  103. optimum_rbln-0.1.13.dist-info/licenses/LICENSE +0 -201
@@ -22,7 +22,6 @@
22
22
  # from Rebellions Inc.
23
23
 
24
24
  import importlib
25
- import inspect
26
25
  import logging
27
26
  import os
28
27
  import shutil
@@ -33,143 +32,31 @@ from typing import TYPE_CHECKING, Any, Dict, List, Optional, Union
33
32
 
34
33
  import rebel
35
34
  import torch
36
- import transformers
37
- from huggingface_hub import HfApi, HfFolder, hf_hub_download
38
- from optimum.exporters import TasksManager
39
- from optimum.modeling_base import OptimizedModel
40
35
  from transformers import (
41
36
  AutoConfig,
42
37
  AutoModel,
43
- AutoModelForAudioClassification,
44
- AutoModelForImageClassification,
45
- AutoModelForMaskedLM,
46
- AutoModelForQuestionAnswering,
47
- AutoModelForSequenceClassification,
48
38
  GenerationConfig,
49
39
  PretrainedConfig,
50
40
  )
51
41
 
52
- from .modeling_config import DEFAULT_COMPILED_MODEL_NAME, RBLNCompileConfig, RBLNConfig, use_rbln_config
42
+ from .modeling_config import RBLNCompileConfig, RBLNConfig, use_rbln_config
43
+ from .utils.hub import PushToHubMixin, pull_compiled_model_from_hub, validate_files
53
44
  from .utils.runtime_utils import UnavailableRuntime
54
45
  from .utils.save_utils import maybe_load_preprocessors
46
+ from .utils.submodule import SubModulesMixin
55
47
 
56
48
 
57
49
  if TYPE_CHECKING:
58
- from transformers import (
59
- AutoFeatureExtractor,
60
- AutoProcessor,
61
- AutoTokenizer,
62
- PreTrainedModel,
63
- )
50
+ from transformers import PreTrainedModel
64
51
 
65
52
  logger = logging.getLogger(__name__)
66
53
 
67
54
 
68
- class SubModulesMixin:
69
- """
70
- _rbln_submodules = [
71
- {"name": "vision_tower"},
72
- {"name": "language_model"},
73
- ]
74
- """
75
-
76
- _rbln_submodules: List[Dict[str, Any]] = []
77
-
78
- def __init__(
79
- self,
80
- *,
81
- rbln_submodules: List["RBLNBaseModel"] = [],
82
- **kwargs,
83
- ) -> None:
84
- for submodule_meta, submodule in zip(self._rbln_submodules, rbln_submodules):
85
- setattr(self, submodule_meta["name"], submodule)
86
-
87
- @classmethod
88
- def _export_submodules_from_model(
89
- cls,
90
- model: "PreTrainedModel",
91
- model_save_dir: str,
92
- rbln_kwargs: Dict[str, Any],
93
- **kwargs,
94
- ) -> List["RBLNBaseModel"]:
95
- rbln_submodules = []
96
- for submodule in cls._rbln_submodules:
97
- submodule_name = submodule["name"]
98
- torch_submodule: "PreTrainedModel" = getattr(model, submodule["name"])
99
- cls_name = torch_submodule.__class__.__name__
100
- submodule_cls: "RBLNModel" = getattr(importlib.import_module("optimum.rbln"), f"RBLN{cls_name}")
101
-
102
- if submodule_name in rbln_kwargs:
103
- kwargs["rbln_config"] = rbln_kwargs[submodule_name]
104
-
105
- rbln_submodule = submodule_cls.from_model(
106
- model=torch_submodule,
107
- subfolder=submodule_name,
108
- model_save_dir=model_save_dir,
109
- **kwargs,
110
- )
111
-
112
- rbln_submodules.append(rbln_submodule)
113
-
114
- return rbln_submodules
115
-
116
- @classmethod
117
- def _load_submodules_from_compiled_models(
118
- cls,
119
- model_save_dir: str,
120
- rbln_kwargs: Dict[str, Any],
121
- **kwargs,
122
- ):
123
- rbln_submodules = []
124
- for submodule in cls._rbln_submodules:
125
- submodule_name = submodule["name"]
126
-
127
- if submodule_name in rbln_kwargs:
128
- kwargs["rbln_config"] = rbln_kwargs[submodule_name]
129
-
130
- # Get cls name for call the constructor of the rbln class
131
- submodule_rbln_config = RBLNConfig.load(Path(model_save_dir) / submodule_name)
132
- submodule_cls_name = submodule_rbln_config.meta["cls"]
133
- submodule_cls: "RBLNBaseModel" = getattr(importlib.import_module("optimum.rbln"), submodule_cls_name)
134
-
135
- config = OptimizedModel._load_config(Path(model_save_dir) / submodule_name)
136
- rbln_submodule = submodule_cls._from_pretrained(
137
- model_id=model_save_dir,
138
- config=config,
139
- subfolder=submodule_name,
140
- **kwargs,
141
- )
142
- rbln_submodules.append(rbln_submodule)
143
- return rbln_submodules
144
-
145
- @classmethod
146
- def _load_submodules(
147
- cls,
148
- model_save_dir,
149
- rbln_kwargs,
150
- model=None,
151
- **kwargs,
152
- ):
153
- # Two ways :
154
- # 1. Compile from pytorch object
155
- # 2. Load from compiled file
156
- if model is not None:
157
- return cls._export_submodules_from_model(
158
- model=model,
159
- model_save_dir=model_save_dir,
160
- rbln_kwargs=rbln_kwargs,
161
- **kwargs,
162
- )
163
-
164
- else:
165
- return cls._load_submodules_from_compiled_models(
166
- model_save_dir=model_save_dir,
167
- rbln_kwargs=rbln_kwargs,
168
- **kwargs,
169
- )
55
+ class PreTrainedModel(ABC): # noqa: F811
56
+ pass
170
57
 
171
58
 
172
- class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
59
+ class RBLNBaseModel(SubModulesMixin, PushToHubMixin, PreTrainedModel):
173
60
  """
174
61
  An abstract base class for compiling, loading, and saving neural network models from the huggingface
175
62
  transformers and diffusers libraries to run on RBLN NPU devices.
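The SubModulesMixin deleted from this file is not gone: it reappears as optimum/rbln/utils/submodule.py (+137 in the file list above) and is now the first base of RBLNBaseModel. Its contract is the one described in the removed docstring: a composite model lists its submodules by name and the mixin compiles and re-attaches them. A minimal sketch of a subclass using that contract; the class name and layout are illustrative, only `_rbln_submodules` and the attribute names come from the removed docstring:

    # Hypothetical subclass: "vision_tower" / "language_model" are the example
    # entries from the removed SubModulesMixin docstring above.
    from optimum.rbln import RBLNModel

    class RBLNMyVisionLanguageModel(RBLNModel):
        # Each entry names a torch submodule that is compiled separately and
        # re-attached under the same attribute name on the RBLN wrapper.
        _rbln_submodules = [
            {"name": "vision_tower"},
            {"name": "language_model"},
        ]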
@@ -205,30 +92,29 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
205
92
  """
206
93
 
207
94
  model_type = "rbln_model"
208
- auto_model_class = AutoModel # feature extraction
95
+ auto_model_class = AutoModel
96
+ config_class = AutoConfig
209
97
  config_name = "config.json"
98
+ hf_library_name = "transformers"
99
+ _hf_class = None
210
100
 
211
101
  def __init__(
212
102
  self,
213
103
  models: List[rebel.Runtime],
214
104
  config: "PretrainedConfig",
215
105
  rbln_config: RBLNConfig,
216
- preprocessors: Optional[List],
217
106
  model_save_dir: Optional[Union[str, Path, TemporaryDirectory]] = None,
218
107
  subfolder: str = "",
219
108
  rbln_compiled_models: Optional[rebel.RBLNCompiledModel] = None,
220
109
  rbln_submodules: List["RBLNBaseModel"] = [],
221
110
  **kwargs,
222
111
  ):
223
- super().__init__(models, config)
224
- if not isinstance(self.config, PretrainedConfig): # if diffusers config
225
- self.config = PretrainedConfig(**self.config)
226
-
112
+ self.model = models
113
+ self.config = config
227
114
  self.rbln_config = rbln_config
228
- self.preprocessors = [] if preprocessors is None else preprocessors
229
115
  self.compiled_models = rbln_compiled_models
230
116
 
231
- # Registers the RBLNBaseModelForXXX classes into the transformers AutoModel classes to avoid warnings when creating
117
+ # Registers the RBLN classes into the transformers AutoModel classes to avoid warnings when creating
232
118
  # a pipeline https://github.com/huggingface/transformers/blob/3d3204c025b6b5de013e07dd364208e28b4d9589/src/transformers/pipelines/base.py#L940
233
119
  AutoConfig.register(self.model_type, AutoConfig)
234
120
  if hasattr(self.auto_model_class, "register"):
@@ -247,6 +133,7 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
247
133
 
248
134
  self.device = torch.device("cpu")
249
135
  self.training = False
136
+ self.dtype = torch.float32
250
137
 
251
138
  # FIXME :: model_save_dir is not used after initialized. (This can be used when save/load)
252
139
  # This attribute is needed to keep one reference on the temporary directory, since garbage collecting it
@@ -264,34 +151,6 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
264
151
  self.rbln_submodules = rbln_submodules
265
152
  self.__post_init__(**kwargs)
266
153
 
267
- def _save_pretrained(self, save_directory: Union[str, Path]):
268
- """
269
- Saves a model and its configuration file to a directory, so that it can be re-loaded using the
270
- [`~optimum.rbln.modeling_base.RBLNBaseModel.from_pretrained`] class method.
271
-
272
- Args:
273
- save_directory (`Union[str, Path]`):
274
- Directory where to save the model file.
275
- """
276
- real_save_dir = self.model_save_dir / self.subfolder
277
- save_directory_path = Path(save_directory)
278
- if os.path.exists(real_save_dir) and os.path.isdir(real_save_dir):
279
- if save_directory_path.absolute() == real_save_dir.absolute():
280
- raise FileExistsError(
281
- f"Cannot save model to '{save_directory}'. "
282
- f"This directory already exists and contains the model files."
283
- )
284
- shutil.copytree(real_save_dir, save_directory, dirs_exist_ok=True)
285
- self.config.save_pretrained(save_directory)
286
- if self.generation_config is not None:
287
- self.generation_config.save_pretrained(save_directory)
288
- else:
289
- raise FileNotFoundError(
290
- f"Unable to save the model. The model directory '{real_save_dir}' does not exist or is not accessible. "
291
- f"Cannot save to the specified destination '{save_directory}'. "
292
- f"Please ensure the model directory exists and you have the necessary permissions to access it."
293
- )
294
-
295
154
  @classmethod
296
155
  def _load_compiled_model_dir(
297
156
  cls,
@@ -302,50 +161,18 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
302
161
  cache_dir: Optional[str] = None,
303
162
  subfolder: str = "",
304
163
  local_files_only: bool = False,
305
- ):
306
- # Find compiled model
307
- # And prepare or download cache folder from HF Hub if needed.
164
+ ) -> str:
165
+ """Load the directory containing the compiled model files."""
308
166
  model_path = Path(model_id)
167
+
309
168
  if model_path.is_dir():
310
169
  model_path = model_path / subfolder
311
170
  rbln_files = list(model_path.glob("*.rbln"))
312
171
  rbln_config_filenames = list(model_path.glob("rbln_config.json"))
172
+ validate_files(rbln_files, rbln_config_filenames, f"directory {model_path}")
313
173
  else:
314
- if isinstance(use_auth_token, bool):
315
- token = HfFolder().get_token()
316
- else:
317
- token = use_auth_token
318
- repo_files = list(
319
- map(
320
- Path,
321
- HfApi().list_repo_files(model_id, revision=revision, token=token),
322
- )
323
- )
324
-
325
- pattern = "*.rbln" if subfolder == "" else f"{subfolder}/*.rbln"
326
- rbln_files = [p for p in repo_files if p.match(pattern)]
327
-
328
- pattern = "rbln_config.json" if subfolder == "" else f"{subfolder}/rbln_config.json"
329
- rbln_config_filenames = [p for p in repo_files if p.match(pattern)]
330
-
331
- if len(rbln_files) == 0:
332
- raise FileNotFoundError(f"Could not find any rbln model file in {model_path}")
333
-
334
- if len(rbln_config_filenames) == 0:
335
- raise FileNotFoundError(f"Could not find `rbln_config.json` file in {model_path}")
336
-
337
- if len(rbln_config_filenames) > 1:
338
- raise FileExistsError(
339
- f"Multiple rbln_config.json are not expected. but {len(rbln_config_filenames)} are found."
340
- )
341
-
342
- if model_path.is_dir():
343
- model_path = str(model_path)
344
- else:
345
- rbln_config_filename = rbln_config_filenames[0]
346
- rbln_config_cache_path = hf_hub_download(
347
- repo_id=model_id,
348
- filename=str(rbln_config_filename),
174
+ model_path = pull_compiled_model_from_hub(
175
+ model_id=model_id,
349
176
  subfolder=subfolder,
350
177
  use_auth_token=use_auth_token,
351
178
  revision=revision,
@@ -353,9 +180,8 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
353
180
  force_download=force_download,
354
181
  local_files_only=local_files_only,
355
182
  )
356
- model_path = Path(rbln_config_cache_path).parent
357
183
 
358
- return model_path
184
+ return str(model_path)
359
185
 
360
186
  @classmethod
361
187
  def _load_compiled_models(cls, model_path: str):
@@ -368,13 +194,14 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
368
194
  def _from_pretrained(
369
195
  cls,
370
196
  model_id: Union[str, Path],
371
- config: "PretrainedConfig",
197
+ config: "PretrainedConfig" = None,
372
198
  use_auth_token: Optional[Union[bool, str]] = None,
373
199
  revision: Optional[str] = None,
374
200
  force_download: bool = False,
375
201
  cache_dir: Optional[str] = None,
376
202
  subfolder: str = "",
377
203
  local_files_only: bool = False,
204
+ trust_remote_code: bool = False,
378
205
  model_save_dir: Optional[Union[str, Path, TemporaryDirectory]] = None,
379
206
  # passed from compile function
380
207
  rbln_config: Optional[RBLNConfig] = None,
@@ -401,6 +228,43 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
401
228
  rbln_config = RBLNConfig.load(model_path_subfolder)
402
229
  rbln_config.update_runtime_cfg(rbln_kwargs)
403
230
 
231
+ if rbln_config.meta["cls"] != cls.__name__:
232
+ raise NameError(
233
+ f"Cannot load the model. The model was originally compiled using "
234
+ f"{rbln_config.meta['cls']}, but you are trying to load it with {cls.__name__}."
235
+ "Please use the same model class that was used during compilation."
236
+ )
237
+
238
+ if config is None:
239
+ if cls.hf_library_name == "transformers":
240
+ config = AutoConfig.from_pretrained(
241
+ model_path_subfolder,
242
+ cache_dir=cache_dir,
243
+ force_download=force_download,
244
+ revision=revision,
245
+ token=use_auth_token,
246
+ trust_remote_code=trust_remote_code,
247
+ )
248
+ elif cls.hf_library_name == "diffusers":
249
+ # import here to prevent diffusers dependency
250
+ # TODO(jongho): Remove diffusers dependency if use transformers only.
251
+ from diffusers.configuration_utils import ConfigMixin
252
+
253
+ class DummyConfigMixin(ConfigMixin):
254
+ # Just to load config, We need to specify `config_name`
255
+ config_name = "config.json"
256
+
257
+ config = DummyConfigMixin.load_config(
258
+ model_id,
259
+ cache_dir=cache_dir,
260
+ force_download=force_download,
261
+ local_files_only=local_files_only,
262
+ revision=revision,
263
+ token=use_auth_token,
264
+ subfolder=subfolder,
265
+ )
266
+ config = PretrainedConfig(**config)
267
+
404
268
  rbln_compiled_models = cls._load_compiled_models(model_path_subfolder)
405
269
 
406
270
  if len(cls._rbln_submodules) > 0:
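Two behaviours are new in this hunk: `config` may now be omitted when loading (it is re-read with AutoConfig for transformers models, or through a throwaway ConfigMixin for diffusers models), and the loader refuses to open artifacts that were compiled by a different RBLN class. A hedged illustration of the guard; the directory name is made up, and RBLNLlamaForCausalLM / RBLNT5ForConditionalGeneration are used only as examples of two unrelated RBLN classes:

    # Illustrative: "llama-rbln" was compiled with RBLNLlamaForCausalLM, so its
    # rbln_config.json records meta["cls"] == "RBLNLlamaForCausalLM".
    from optimum.rbln import RBLNLlamaForCausalLM, RBLNT5ForConditionalGeneration

    RBLNLlamaForCausalLM.from_pretrained("llama-rbln")            # loads normally
    RBLNT5ForConditionalGeneration.from_pretrained("llama-rbln")  # raises NameError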
@@ -440,8 +304,6 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
440
304
  ):
441
305
  if isinstance(model_save_dir, str):
442
306
  model_save_dir = Path(model_save_dir)
443
- preprocessors = maybe_load_preprocessors(model_save_dir.name, subfolder=subfolder)
444
-
445
307
  # FIXME:: Should we convert it?
446
308
  compiled_model_names = [cfg.compiled_model_name for cfg in rbln_config.compile_cfgs]
447
309
  rbln_compiled_models = [rbln_compiled_models[cm_name] for cm_name in compiled_model_names]
@@ -449,7 +311,7 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
449
311
  # create runtimes only if `rbln_create_runtimes` is enabled
450
312
  try:
451
313
  models = (
452
- cls._create_runtimes(rbln_compiled_models, rbln_config.device_map)
314
+ cls._create_runtimes(rbln_compiled_models, rbln_config.device_map, rbln_config.activate_profiler)
453
315
  if rbln_config.create_runtimes
454
316
  else UnavailableRuntime()
455
317
  )
@@ -464,7 +326,6 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
464
326
  models,
465
327
  config,
466
328
  rbln_config,
467
- preprocessors,
468
329
  model_save_dir=model_save_dir,
469
330
  subfolder=subfolder,
470
331
  rbln_compiled_models=(None if rbln_config.optimize_host_memory else rbln_compiled_models),
@@ -472,17 +333,53 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
472
333
  **kwargs,
473
334
  )
474
335
 
475
- def __repr__(self):
476
- return repr(self.model) + repr(self.rbln_submodules)
336
+ @classmethod
337
+ @use_rbln_config
338
+ def _export(
339
+ cls,
340
+ model_id: Union[str, Path],
341
+ rbln_config: Optional[Dict[str, Any]] = None,
342
+ **kwargs,
343
+ ) -> "RBLNBaseModel":
344
+ subfolder = kwargs.get("subfolder", "")
345
+ model_save_dir = kwargs.pop("model_save_dir", None)
346
+
347
+ rbln_kwargs = rbln_config
348
+ model: "PreTrainedModel" = cls.get_pytorch_model(
349
+ model_id=model_id,
350
+ rbln_kwargs=rbln_kwargs,
351
+ **kwargs,
352
+ )
353
+ preprocessors = maybe_load_preprocessors(model_id, subfolder=subfolder)
354
+ return cls.from_model(
355
+ model,
356
+ rbln_config=rbln_config,
357
+ preprocessors=preprocessors,
358
+ model_save_dir=model_save_dir,
359
+ **kwargs,
360
+ )
477
361
 
478
362
  @classmethod
479
- def compile(cls, model, rbln_compile_config: Optional[RBLNCompileConfig] = None):
363
+ def from_pretrained(
364
+ cls,
365
+ model_id: Union[str, Path],
366
+ export: bool = False,
367
+ **kwargs,
368
+ ) -> "RBLNBaseModel":
369
+ if isinstance(model_id, Path):
370
+ model_id = model_id.as_posix()
371
+ from_pretrained_method = cls._export if export else cls._from_pretrained
372
+ return from_pretrained_method(model_id=model_id, **kwargs)
373
+
374
+ @classmethod
375
+ def compile(cls, model, rbln_compile_config: Optional[RBLNCompileConfig] = None, **kwargs):
480
376
  compiled_model = rebel.compile_from_torch(
481
377
  model,
482
378
  input_info=rbln_compile_config.input_info,
483
379
  fusion=rbln_compile_config.fusion,
484
380
  npu=rbln_compile_config.npu,
485
381
  tensor_parallel_size=rbln_compile_config.tensor_parallel_size,
382
+ **kwargs,
486
383
  )
487
384
  return compiled_model
488
385
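With OptimizedModel out of the inheritance chain, `from_pretrained` is now defined here: `export=True` routes to `_export` (fetch the PyTorch checkpoint, compile, then reload through `_from_pretrained`), while the default `export=False` loads an already compiled directory or Hub repository. A sketch of both paths, mirroring the usage example in the RBLNModel docstring; the checkpoint id and the `rbln_npu` value are placeholders:

    from optimum.rbln import RBLNLlamaForCausalLM

    # Compile from a Hugging Face checkpoint (export=True -> _export -> from_model).
    model = RBLNLlamaForCausalLM.from_pretrained(
        "meta-llama/Llama-2-7b-hf",   # illustrative checkpoint id
        export=True,
        rbln_npu="npu_name",          # rbln_* kwargs are collected by use_rbln_config
    )
    model.save_pretrained("llama-rbln")

    # Load the compiled artifacts later (export=False -> _from_pretrained).
    model = RBLNLlamaForCausalLM.from_pretrained("llama-rbln")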
 
@@ -500,6 +397,24 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
500
397
  rbln_config = cls._get_rbln_config(**others, rbln_kwargs=rbln_kwargs)
501
398
  return rbln_config
502
399
 
400
+ @classmethod
401
+ @property
402
+ def hf_class(cls):
403
+ """
404
+ Lazily loads and caches the corresponding Hugging Face model class.
405
+ Removes 'RBLN' prefix from the class name to get the original class name
406
+ (e.g., RBLNLlamaForCausalLM -> LlamaForCausalLM) and imports it from
407
+ the transformers/diffusers module.
408
+
409
+ Returns:
410
+ type: The original Hugging Face model class
411
+ """
412
+ if cls._hf_class is None:
413
+ hf_cls_name = cls.__name__[4:]
414
+ library = importlib.import_module(cls.hf_library_name)
415
+ cls._hf_class = getattr(library, hf_cls_name, None)
416
+ return cls._hf_class
417
+
503
418
  def can_generate(self):
504
419
  return False
505
420
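The new `hf_class` property gives every RBLN wrapper a lazy, cached handle on its original Hugging Face class by stripping the `RBLN` prefix and importing from `hf_library_name` (`transformers` or `diffusers`). A one-line illustration of the mapping named in the docstring; note that the classmethod-plus-property stacking it relies on is only honoured on Python versions up to 3.12:

    from optimum.rbln import RBLNLlamaForCausalLM

    # RBLNLlamaForCausalLM -> transformers.LlamaForCausalLM, cached in _hf_class.
    assert RBLNLlamaForCausalLM.hf_class.__name__ == "LlamaForCausalLM"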
 
@@ -509,37 +424,88 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
509
424
  def __call__(self, *args, **kwargs):
510
425
  return self.forward(*args, **kwargs)
511
426
 
427
+ def __repr__(self):
428
+ return repr(self.model) + repr(self.rbln_submodules)
429
+
512
430
  def __post_init__(self, **kwargs):
513
- self.dtype = torch.float32
431
+ pass
514
432
 
515
- @classmethod
516
- def _from_transformers(cls, *args, **kwargs) -> "RBLNBaseModel":
433
+ def save_pretrained(
434
+ self,
435
+ save_directory: Union[str, Path],
436
+ push_to_hub: bool = False,
437
+ **kwargs,
438
+ ):
517
439
  """
518
- Exports a vanilla Transformers model into a rbln-compiled Module.
519
- This will be deprecated after optimum 2.0
440
+ Saves a model and its configuration file to a directory, so that it can be re-loaded using the
441
+ [`~optimum.rbln.modeling_base.RBLNBaseModel.from_pretrained`] class method.
442
+
443
+ Args:
444
+ save_directory (`Union[str, Path]`):
445
+ Directory where to save the model file.
446
+ push_to_hub (`bool`, *optional*, defaults to `False`):
447
+ Whether or not to push your model to the Hugging Face model hub after saving it.
448
+
520
449
  """
521
- return cls._export(*args, **kwargs)
450
+ if os.path.isfile(save_directory):
451
+ logger.error(f"Provided path ({save_directory}) should be a directory, not a file")
452
+ return
522
453
 
523
- @classmethod
524
- def wrap_model_if_needed(cls, model: torch.nn.Module, rbln_config: RBLNConfig) -> torch.nn.Module:
525
- # Wrap the model if needed.
526
- return model
454
+ os.makedirs(save_directory, exist_ok=True)
455
+
456
+ real_save_dir = self.model_save_dir / self.subfolder
457
+ save_directory_path = Path(save_directory)
458
+ if os.path.exists(real_save_dir) and os.path.isdir(real_save_dir):
459
+ if save_directory_path.absolute() == real_save_dir.absolute():
460
+ raise FileExistsError(
461
+ f"Cannot save model to '{save_directory}'. "
462
+ f"This directory already exists and contains the model files."
463
+ )
464
+ shutil.copytree(real_save_dir, save_directory, dirs_exist_ok=True)
465
+ self.config.save_pretrained(save_directory)
466
+ if self.generation_config is not None:
467
+ self.generation_config.save_pretrained(save_directory)
468
+ else:
469
+ raise FileNotFoundError(
470
+ f"Unable to save the model. The model directory '{real_save_dir}' does not exist or is not accessible. "
471
+ f"Cannot save to the specified destination '{save_directory}'. "
472
+ f"Please ensure the model directory exists and you have the necessary permissions to access it."
473
+ )
474
+
475
+ if push_to_hub:
476
+ return super().push_to_hub(save_directory, **kwargs)
477
+
478
+ @staticmethod
479
+ def _raise_missing_compiled_file_error(missing_files: List[str]):
480
+ """Raises a KeyError with a message indicating missing compiled model files."""
481
+
482
+ if len(missing_files) == 1:
483
+ message = f"The rbln model folder is missing the required '{missing_files[0]}.rbln' file. "
484
+ else:
485
+ files_str = ", ".join([f"'{f}.rbln'" for f in missing_files])
486
+ message = (
487
+ "The rbln model folder is missing required files. "
488
+ f"Ensure that {files_str} files are present in the folder. "
489
+ )
490
+ message += (
491
+ "These files are necessary for loading the rbln model. "
492
+ "If these files are missing, please recompile the model using the latest optimum-rbln "
493
+ "and ensure the compilation completes successfully."
494
+ )
495
+ raise KeyError(message)
527
496
 
528
497
  @classmethod
529
498
  @abstractmethod
530
499
  def _get_rbln_config(cls, **rbln_config_kwargs) -> RBLNConfig:
531
500
  pass
532
501
 
533
- @abstractmethod
534
- def forward(self, *args: List[torch.Tensor], **kwargs: Dict[str, torch.Tensor]):
535
- pass
536
-
537
502
  @classmethod
538
503
  @abstractmethod
539
504
  def _create_runtimes(
540
505
  cls,
541
506
  compiled_models: List[rebel.RBLNCompiledModel],
542
507
  rbln_device_map: Dict[str, int],
508
+ activate_profiler: Optional[bool] = None,
543
509
  ) -> List[rebel.Runtime]:
544
510
  # compiled_models -> runtimes
545
511
  pass
@@ -562,546 +528,6 @@ class RBLNBaseModel(OptimizedModel, ABC, SubModulesMixin):
562
528
  ):
563
529
  pass
564
530
 
565
- @classmethod
566
- @use_rbln_config
567
- def _export(
568
- cls,
569
- model_id: Union[str, Path],
570
- config: "PretrainedConfig", # FIXME : optimum passes config, but we ignore it.
571
- rbln_config: Optional[Dict[str, Any]] = None,
572
- **kwargs,
573
- ) -> "RBLNModel":
574
- subfolder = kwargs.get("subfolder", "")
575
- model_save_dir = kwargs.pop("model_save_dir", None)
576
-
577
- rbln_kwargs = rbln_config
578
- model: "PreTrainedModel" = cls.get_pytorch_model(
579
- model_id=model_id,
580
- rbln_kwargs=rbln_kwargs,
581
- **kwargs,
582
- )
583
- preprocessors = maybe_load_preprocessors(model_id, subfolder=subfolder)
584
- return cls.from_model(
585
- model,
586
- rbln_config=rbln_config,
587
- preprocessors=preprocessors,
588
- model_save_dir=model_save_dir,
589
- **kwargs,
590
- )
591
-
592
-
593
- class RBLNModel(RBLNBaseModel):
594
- """
595
- A class that inherits from RBLNBaseModel for models consisting of a single `torch.nn.Module`.
596
-
597
- This class supports all the functionality of RBLNBaseModel, including loading and saving models using
598
- the `from_pretrained` and `save_pretrained` methods, compiling PyTorch models for execution on RBLN NPU
599
- devices.
600
-
601
- Example:
602
- ```python
603
- model = RBLNModel.from_pretrained("model_id", export=True, rbln_npu="npu_name")
604
- outputs = model(**inputs)
605
- ```
606
- """
607
-
608
- @classmethod
609
- def update_kwargs(cls, kwargs):
610
- """
611
- Update user-given kwargs to get proper pytorch model.
612
-
613
- For example, `torchscript`=True should be set because torch.jit
614
- does not support `transformers` output instances as module output;
615
- """
616
- kwargs.update(
617
- {
618
- "torchscript": True,
619
- "return_dict": False,
620
- }
621
- )
622
- return kwargs
623
-
624
- @classmethod
625
- def get_pytorch_model(
626
- cls,
627
- model_id: str,
628
- use_auth_token: Optional[Union[bool, str]] = None,
629
- revision: Optional[str] = None,
630
- force_download: bool = False,
631
- cache_dir: Optional[str] = None,
632
- subfolder: str = "",
633
- local_files_only: bool = False,
634
- trust_remote_code: bool = False,
635
- # Some rbln-kwargs should be applied before loading torch module (i.e. quantized llm)
636
- rbln_kwargs: Optional[Dict[str, Any]] = None,
637
- **kwargs,
638
- ) -> "PreTrainedModel":
639
- task = kwargs.pop("task", None)
640
- if task is None:
641
- task = TasksManager.infer_task_from_model(cls.auto_model_class)
642
-
643
- kwargs = cls.update_kwargs(kwargs)
644
-
645
- model = TasksManager.get_model_from_task(
646
- task=task,
647
- model_name_or_path=model_id,
648
- subfolder=subfolder,
649
- revision=revision,
650
- framework="pt",
651
- cache_dir=cache_dir,
652
- use_auth_token=use_auth_token,
653
- local_files_only=local_files_only,
654
- force_download=force_download,
655
- trust_remote_code=trust_remote_code,
656
- **kwargs,
657
- )
658
-
659
- return model
660
-
661
- @classmethod
662
- def save_torch_artifacts(
663
- cls,
664
- model: "PreTrainedModel",
665
- save_dir_path: Path,
666
- subfolder: str,
667
- rbln_config: RBLNConfig,
668
- ):
669
- """
670
- If you are unavoidably running on a CPU rather than an RBLN device,
671
- store the torch tensor, weight, etc. in this function.
672
- """
673
-
674
- @classmethod
675
- def get_compiled_model(cls, model: "PreTrainedModel", rbln_config: RBLNConfig):
676
- model = cls.wrap_model_if_needed(model, rbln_config)
677
- rbln_compile_config = rbln_config.compile_cfgs[0]
678
- compiled_model = cls.compile(model, rbln_compile_config=rbln_compile_config)
679
- return compiled_model
680
-
681
- @classmethod
682
- @use_rbln_config
683
- def from_model(
684
- cls,
685
- model: "PreTrainedModel",
686
- rbln_config: Dict[str, Any] = {},
687
- model_save_dir: Optional[Union[str, Path, TemporaryDirectory]] = None,
688
- subfolder: str = "",
689
- **kwargs,
690
- ):
691
- preprocessors = kwargs.pop("preprocessors", [])
692
- rbln_kwargs = rbln_config
693
-
694
- # Directory to save compile artifacts(.rbln) and original configs
695
- if model_save_dir is None:
696
- save_dir = TemporaryDirectory()
697
- save_dir_path = Path(save_dir.name)
698
- else:
699
- save_dir = model_save_dir
700
- if isinstance(save_dir, TemporaryDirectory):
701
- save_dir_path = Path(model_save_dir.name)
702
- else:
703
- save_dir_path = Path(model_save_dir)
704
- save_dir_path.mkdir(exist_ok=True)
705
-
706
- # (Optional) Save preprocessors (tokenizer, image preprocessors, etc)
707
- for preprocessor in preprocessors:
708
- preprocessor.save_pretrained(save_dir_path)
709
-
710
- # Save configs
711
- # FIXME :: optimum passes AutoConfig. But here we ignore it.
712
- config = model.config
713
- if hasattr(model, "can_generate") and model.can_generate():
714
- generation_config = model.generation_config
715
- generation_config.save_pretrained(save_dir_path / subfolder)
716
- if not isinstance(config, PretrainedConfig): # diffusers config
717
- config = PretrainedConfig(**config)
718
- config.save_pretrained(save_dir_path / subfolder)
719
-
720
- # Get compilation arguments (e.g. input_info)
721
- rbln_config: RBLNConfig = cls.get_rbln_config(
722
- preprocessors=preprocessors, model_config=config, rbln_kwargs=rbln_kwargs
723
- )
724
- # rbln_config.update_runtime_cfg(rbln_kwargs) # This is done in get_rbln_config
725
-
726
- compiled_model: Union[rebel.RBLNCompiledModel, Dict[str, rebel.RBLNCompiledModel]] = cls.get_compiled_model(
727
- model, rbln_config=rbln_config
728
- )
729
-
730
- # Save compiled models (.rbln)
731
- (save_dir_path / subfolder).mkdir(exist_ok=True)
732
- if not isinstance(compiled_model, dict):
733
- compiled_models = {DEFAULT_COMPILED_MODEL_NAME: compiled_model}
734
- else:
735
- compiled_models = compiled_model
736
- for compiled_model_name, cm in compiled_models.items():
737
- cm.save(save_dir_path / subfolder / f"{compiled_model_name}.rbln")
738
- rbln_config.save(save_dir_path / subfolder)
739
-
740
- # Save torch artifacts (e.g. embedding matrix if needed.)
741
- cls.save_torch_artifacts(model, save_dir_path=save_dir_path, subfolder=subfolder, rbln_config=rbln_config)
742
-
743
- # Load submodules
744
- if len(cls._rbln_submodules) > 0:
745
- rbln_submodules = cls._load_submodules(
746
- model=model,
747
- model_save_dir=save_dir,
748
- rbln_kwargs=rbln_kwargs,
749
- **kwargs,
750
- )
751
- else:
752
- rbln_submodules = []
753
-
754
- # Instantiate
755
- return cls._from_pretrained(
756
- model_id=save_dir_path,
757
- config=config,
758
- model_save_dir=save_dir,
759
- subfolder=subfolder,
760
- rbln_config=rbln_config,
761
- rbln_compiled_models=compiled_models,
762
- rbln_submodules=rbln_submodules,
763
- **kwargs,
764
- )
765
-
766
- @classmethod
767
- def _create_runtimes(
768
- cls,
769
- compiled_models: List[rebel.RBLNCompiledModel],
770
- rbln_device_map: Dict[str, int],
771
- ) -> List[rebel.Runtime]:
772
- device = rbln_device_map[DEFAULT_COMPILED_MODEL_NAME]
773
- return [compiled_model.create_runtime(tensor_type="pt", device=device) for compiled_model in compiled_models]
774
-
531
+ @abstractmethod
775
532
  def forward(self, *args: List[torch.Tensor], **kwargs: Dict[str, torch.Tensor]):
776
- output = self.model[0](*args, **kwargs)
777
- return output
778
-
779
-
780
- class RBLNModelForQuestionAnswering(RBLNModel):
781
- auto_model_class = AutoModelForQuestionAnswering
782
- rbln_model_input_names = ["input_ids", "attention_mask", "token_type_ids"]
783
-
784
- @classmethod
785
- def _get_rbln_config(
786
- cls,
787
- preprocessors: Optional[Union["AutoFeatureExtractor", "AutoProcessor", "AutoTokenizer"]],
788
- model_config: Optional["PretrainedConfig"] = None,
789
- rbln_kwargs: Dict[str, Any] = {},
790
- ) -> RBLNConfig:
791
- rbln_max_seq_len = rbln_kwargs.get("max_seq_len", None)
792
- rbln_batch_size = rbln_kwargs.get("batch_size", None)
793
- rbln_model_input_names = rbln_kwargs.get("model_input_names", None)
794
-
795
- if rbln_max_seq_len is None:
796
- for tokenizer in preprocessors:
797
- if hasattr(tokenizer, "model_max_length"):
798
- rbln_max_seq_len = tokenizer.model_max_length
799
- break
800
- if rbln_max_seq_len is None:
801
- raise ValueError("`rbln_max_seq_len` should be specified!")
802
-
803
- if rbln_batch_size is None:
804
- rbln_batch_size = 1
805
-
806
- if rbln_model_input_names is None:
807
- for tokenizer in preprocessors:
808
- if hasattr(tokenizer, "model_input_names"):
809
- rbln_model_input_names = tokenizer.model_input_names
810
- break
811
- if rbln_model_input_names is None and hasattr(cls, "rbln_model_input_names"):
812
- rbln_model_input_names = cls.rbln_model_input_names
813
- elif rbln_model_input_names is None and hasattr(cls, "rbln_model_input_names") is False:
814
- original_model_class = getattr(transformers, model_config.architectures[0])
815
- input_names_order = inspect.signature(original_model_class.forward).parameters.keys()
816
- raise ValueError(
817
- "Specify the model input names obtained by the tokenizer via `rbln_model_input_names`, "
818
- f"and be sure to make the order of the inputs same as QuestionAnswering forward() arguments like ({list(input_names_order)})"
819
- )
820
-
821
- input_info = [
822
- (model_input_name, [rbln_batch_size, rbln_max_seq_len], "int64")
823
- for model_input_name in rbln_model_input_names
824
- ]
825
-
826
- rbln_compile_config = RBLNCompileConfig(input_info=input_info)
827
- rbln_config = RBLNConfig(
828
- rbln_cls=cls.__name__,
829
- compile_cfgs=[rbln_compile_config],
830
- rbln_kwargs=rbln_kwargs,
831
- )
832
- rbln_config.model_cfg.update({"max_seq_len": rbln_max_seq_len})
833
- return rbln_config
834
-
835
-
836
- class RBLNModelForImageClassification(RBLNModel):
837
- """
838
- This is a generic model class that will be instantiated as one of the model classes of the library (with a image classification head) when created with the from_pretrained() class method
839
- """
840
-
841
- auto_model_class = AutoModelForImageClassification
842
-
843
- @classmethod
844
- def _get_rbln_config(
845
- cls,
846
- preprocessors: Optional[Union["AutoFeatureExtractor", "AutoProcessor", "AutoTokenizer"]],
847
- model_config: Optional["PretrainedConfig"] = None,
848
- rbln_kwargs: Dict[str, Any] = {},
849
- ) -> RBLNConfig:
850
- rbln_image_size = rbln_kwargs.get("image_size", None)
851
- rbln_batch_size = rbln_kwargs.get("batch_size", None)
852
-
853
- if rbln_image_size is None:
854
- for processor in preprocessors:
855
- if hasattr(processor, "size"):
856
- if all(required_key in processor.size.keys() for required_key in ["height", "width"]):
857
- rbln_image_size = (processor.size["height"], processor.size["width"])
858
- elif "shortest_edge" in processor.size.keys():
859
- rbln_image_size = (processor.size["shortest_edge"], processor.size["shortest_edge"])
860
- elif "longest_edge" in processor.size.keys():
861
- rbln_image_size = (processor.size["longest_edge"], processor.size["longest_edge"])
862
- break
863
-
864
- if rbln_image_size is None:
865
- rbln_image_size = model_config.image_size
866
-
867
- if rbln_image_size is None:
868
- raise ValueError("`rbln_image_size` should be specified!")
869
-
870
- if rbln_batch_size is None:
871
- rbln_batch_size = 1
872
-
873
- if isinstance(rbln_image_size, int):
874
- rbln_image_height, rbln_image_width = rbln_image_size, rbln_image_size
875
- elif isinstance(rbln_image_size, (list, tuple)):
876
- rbln_image_height, rbln_image_width = rbln_image_size[0], rbln_image_size[1]
877
- elif isinstance(rbln_image_size, dict):
878
- rbln_image_height, rbln_image_width = rbln_image_size["height"], rbln_image_size["width"]
879
- else:
880
- raise ValueError(
881
- "`rbln_image_size` should be `int` (ex. 224), `tuple` (ex. 224, 224), `dict` (ex. {'height': 224, 'width': 224}) format"
882
- )
883
-
884
- input_info = [
885
- (
886
- "pixel_values",
887
- [rbln_batch_size, 3, rbln_image_height, rbln_image_width],
888
- "float32",
889
- )
890
- ]
891
-
892
- rbln_compile_config = RBLNCompileConfig(input_info=input_info)
893
- return RBLNConfig(rbln_cls=cls.__name__, compile_cfgs=[rbln_compile_config], rbln_kwargs=rbln_kwargs)
894
-
895
-
896
- class RBLNModelForAudioClassification(RBLNModel):
897
- """
898
- This is a generic model class that will be instantiated as one of the model classes of the library (with a audio classification head) when created with the from_pretrained() class method
899
- This model inherits from [`RBLNModel`]. Check the superclass documentation for the generic methods the library implements for all its models.
900
-
901
- A class to convert and run pre-trained transformers based AudioClassification models on RBLN devices.
902
- It implements the methods to convert a pre-trained transformers AudioClassification model into a RBLN transformer model by:
903
- - transferring the checkpoint weights of the original into an optimized RBLN graph,
904
- - compiling the resulting graph using the RBLN compiler.
905
-
906
- Currently, this model class only supports the 'AST' model from the transformers library. Future updates may include support for additional model types.
907
- """
908
-
909
- auto_model_class = AutoModelForAudioClassification
910
-
911
- @classmethod
912
- def _get_rbln_config(
913
- cls,
914
- preprocessors: "AutoFeatureExtractor",
915
- model_config: "PretrainedConfig",
916
- rbln_kwargs: Dict[str, Any] = {},
917
- ) -> RBLNConfig:
918
- rbln_batch_size = rbln_kwargs.get("batch_size", None)
919
- rbln_max_length = rbln_kwargs.get("max_length", None)
920
- rbln_num_mel_bins = rbln_kwargs.get("num_mel_bins", None)
921
-
922
- if rbln_batch_size is None:
923
- rbln_batch_size = 1
924
-
925
- if rbln_num_mel_bins is None:
926
- rbln_num_mel_bins = getattr(model_config, "num_mel_bins", None)
927
- if rbln_num_mel_bins is None:
928
- for feature_extractor in preprocessors:
929
- if hasattr(feature_extractor, "num_mel_bins"):
930
- rbln_num_mel_bins = feature_extractor.num_mel_bins
931
- break
932
-
933
- if rbln_num_mel_bins is None:
934
- raise ValueError("`rbln_num_mel_bins` should be specified!")
935
-
936
- if rbln_max_length is None:
937
- rbln_max_length = getattr(model_config, "max_length", None)
938
- for feature_extractor in preprocessors:
939
- if hasattr(feature_extractor, "max_length"):
940
- rbln_max_length = feature_extractor.max_length
941
- break
942
-
943
- if rbln_max_length is None:
944
- raise ValueError("`rbln_max_length` should be specified!")
945
-
946
- input_info = [
947
- (
948
- "input_values",
949
- [rbln_batch_size, rbln_max_length, rbln_num_mel_bins],
950
- "float32",
951
- ),
952
- ]
953
-
954
- rbln_compile_config = RBLNCompileConfig(input_info=input_info)
955
- rbln_config = RBLNConfig(
956
- rbln_cls=cls.__name__,
957
- compile_cfgs=[rbln_compile_config],
958
- rbln_kwargs=rbln_kwargs,
959
- )
960
- rbln_config.model_cfg.update(
961
- {
962
- "batch_size": rbln_batch_size,
963
- "max_length": rbln_max_length,
964
- "num_mel_bins": rbln_num_mel_bins,
965
- }
966
- )
967
- return rbln_config
968
-
969
-
970
- class RBLNModelForSequenceClassification(RBLNModel):
971
- """
972
- This is a generic model class that will be instantiated as one of the model classes of the library (with a sequence classification head) when created with the from_pretrained() class method
973
- This model inherits from [`RBLNModel`]. Check the superclass documentation for the generic methods the library implements for all its models.
974
-
975
- A class to convert and run pre-trained transformers based SequenceClassification models on RBLN devices.
976
- It implements the methods to convert a pre-trained transformers SequenceClassification model into a RBLN transformer model by:
977
- - transferring the checkpoint weights of the original into an optimized RBLN graph,
978
- - compiling the resulting graph using the RBLN compiler.
979
-
980
- Currently, this model class supports the 'XLMRoberta' and 'Roberta' model from the transformers library. Future updates may include support for additional model types.
981
- """
982
-
983
- auto_model_class = AutoModelForSequenceClassification
984
-
985
- @classmethod
986
- def _get_rbln_config(
987
- cls,
988
- preprocessors: Optional[Union["AutoFeatureExtractor", "AutoProcessor", "AutoTokenizer"]],
989
- model_config: Optional["PretrainedConfig"] = None,
990
- rbln_kwargs: Dict[str, Any] = {},
991
- ) -> RBLNConfig:
992
- rbln_max_seq_len = rbln_kwargs.get("max_seq_len", None)
993
- rbln_model_input_names = rbln_kwargs.get("model_input_names", None)
994
- rbln_batch_size = rbln_kwargs.get("batch_size", None)
995
-
996
- max_position_embeddings = getattr(model_config, "n_positions", None) or getattr(
997
- model_config, "max_position_embeddings", None
998
- )
999
-
1000
- if rbln_max_seq_len is None:
1001
- rbln_max_seq_len = max_position_embeddings
1002
- if rbln_max_seq_len is None:
1003
- for tokenizer in preprocessors:
1004
- if hasattr(tokenizer, "model_max_length"):
1005
- rbln_max_seq_len = tokenizer.model_max_length
1006
- break
1007
- if rbln_max_seq_len is None:
1008
- raise ValueError("`rbln_max_seq_len` should be specified!")
1009
-
1010
- if max_position_embeddings is not None and rbln_max_seq_len > max_position_embeddings:
1011
- raise ValueError("`rbln_enc_max_seq_len` should be less or equal than max_position_embeddings!")
1012
-
1013
- if rbln_model_input_names is None:
1014
- for tokenizer in preprocessors:
1015
- if hasattr(tokenizer, "model_input_names"):
1016
- rbln_model_input_names = tokenizer.model_input_names
1017
- break
1018
- if rbln_model_input_names is None and hasattr(cls, "rbln_model_input_names"):
1019
- rbln_model_input_names = cls.rbln_model_input_names
1020
- elif rbln_model_input_names is None and hasattr(cls, "rbln_model_input_names") is False:
1021
- original_model_class = getattr(transformers, model_config.architectures[0])
1022
- input_names_order = inspect.signature(original_model_class.forward).parameters.keys()
1023
- raise ValueError(
1024
- "Specify the model input names obtained by the tokenizer via `rbln_model_input_names`, "
1025
- f"and be sure to make the order of the inputs same as SequenceClassification forward() arguments like ({list(input_names_order)})"
1026
- )
1027
-
1028
- if rbln_batch_size is None:
1029
- rbln_batch_size = 1
1030
-
1031
- input_info = [
1032
- (model_input_name, [rbln_batch_size, rbln_max_seq_len], "int64")
1033
- for model_input_name in rbln_model_input_names
1034
- ]
1035
-
1036
- rbln_compile_config = RBLNCompileConfig(input_info=input_info)
1037
- rbln_config = RBLNConfig(
1038
- rbln_cls=cls.__name__,
1039
- compile_cfgs=[rbln_compile_config],
1040
- rbln_kwargs=rbln_kwargs,
1041
- )
1042
- rbln_config.model_cfg.update({"max_seq_len": rbln_max_seq_len})
1043
- return rbln_config
1044
-
1045
-
1046
- class RBLNModelForMaskedLM(RBLNModel):
1047
- auto_model_class = AutoModelForMaskedLM
1048
-
1049
- @classmethod
1050
- def _get_rbln_config(
1051
- cls,
1052
- preprocessors: Optional[Union["AutoFeatureExtractor", "AutoProcessor", "AutoTokenizer"]],
1053
- model_config: Optional["PretrainedConfig"] = None,
1054
- rbln_kwargs: Dict[str, Any] = {},
1055
- ) -> RBLNConfig:
1056
- rbln_max_seq_len = rbln_kwargs.get("max_seq_len", None)
1057
- rbln_model_input_names = rbln_kwargs.get("model_input_names", None)
1058
- rbln_batch_size = rbln_kwargs.get("batch_size", None)
1059
-
1060
- max_position_embeddings = getattr(model_config, "n_positions", None) or getattr(
1061
- model_config, "max_position_embeddings", None
1062
- )
1063
-
1064
- if rbln_max_seq_len is None:
1065
- rbln_max_seq_len = max_position_embeddings
1066
- if rbln_max_seq_len is None:
1067
- for tokenizer in preprocessors:
1068
- if hasattr(tokenizer, "model_max_length"):
1069
- rbln_max_seq_len = tokenizer.model_max_length
1070
- break
1071
- if rbln_max_seq_len is None:
1072
- raise ValueError("`rbln_max_seq_len` should be specified!")
1073
-
1074
- if max_position_embeddings is not None and rbln_max_seq_len > max_position_embeddings:
1075
- raise ValueError("`rbln_enc_max_seq_len` should be less or equal than max_position_embeddings!")
1076
-
1077
- if rbln_model_input_names is None:
1078
- for tokenizer in preprocessors:
1079
- if hasattr(tokenizer, "model_input_names"):
1080
- rbln_model_input_names = tokenizer.model_input_names
1081
- break
1082
- if rbln_model_input_names is None and hasattr(cls, "rbln_model_input_names"):
1083
- rbln_model_input_names = cls.rbln_model_input_names
1084
- elif rbln_model_input_names is None and hasattr(cls, "rbln_model_input_names") is False:
1085
- original_model_class = getattr(transformers, model_config.architectures[0])
1086
- input_names_order = inspect.signature(original_model_class.forward).parameters.keys()
1087
- raise ValueError(
1088
- "Specify the model input names obtained by the tokenizer via `rbln_model_input_names`, "
1089
- f"and be sure to make the order of the inputs same as MaskedLM forward() arguments like ({list(input_names_order)})"
1090
- )
1091
-
1092
- if rbln_batch_size is None:
1093
- rbln_batch_size = 1
1094
-
1095
- input_info = [
1096
- (model_input_name, [rbln_batch_size, rbln_max_seq_len], "int64")
1097
- for model_input_name in rbln_model_input_names
1098
- ]
1099
-
1100
- rbln_compile_config = RBLNCompileConfig(input_info=input_info)
1101
- rbln_config = RBLNConfig(
1102
- rbln_cls=cls.__name__,
1103
- compile_cfgs=[rbln_compile_config],
1104
- rbln_kwargs=rbln_kwargs,
1105
- )
1106
- rbln_config.model_cfg.update({"max_seq_len": rbln_max_seq_len})
1107
- return rbln_config
533
+ pass
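The 546 lines removed in the hunk above (the old `_export`, `RBLNModel`, and the generic question-answering, image/audio/sequence-classification and masked-LM heads) are relocations rather than deletions: the file list shows them re-landing in optimum/rbln/modeling.py (+238) and optimum/rbln/transformers/modeling_generic.py (+385). A hedged compatibility check, assuming the 0.2.0 package root still re-exports the same public names it did in 0.1.13:

    # Assumption: these names remain importable from the package root in 0.2.0;
    # only their defining modules have moved.
    from optimum.rbln import (
        RBLNModel,
        RBLNModelForQuestionAnswering,
        RBLNModelForSequenceClassification,
    )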