optimum-rbln 0.9.4a2__py3-none-any.whl → 0.10.0.post1__py3-none-any.whl
This diff covers publicly available package versions released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the two versions as they appear in their public registries.
- optimum/rbln/__init__.py +44 -0
- optimum/rbln/__version__.py +2 -2
- optimum/rbln/configuration_utils.py +230 -67
- optimum/rbln/diffusers/models/controlnet.py +2 -2
- optimum/rbln/diffusers/models/transformers/prior_transformer.py +2 -2
- optimum/rbln/diffusers/models/transformers/transformer_cosmos.py +2 -2
- optimum/rbln/diffusers/models/transformers/transformer_sd3.py +2 -2
- optimum/rbln/diffusers/pipelines/auto_pipeline.py +2 -3
- optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py +3 -12
- optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +2 -4
- optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +1 -3
- optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +1 -3
- optimum/rbln/diffusers/pipelines/cosmos/cosmos_guardrail.py +2 -2
- optimum/rbln/modeling_base.py +11 -10
- optimum/rbln/ops/__init__.py +1 -0
- optimum/rbln/ops/attn.py +10 -0
- optimum/rbln/ops/flash_attn.py +8 -0
- optimum/rbln/ops/moe.py +180 -0
- optimum/rbln/ops/sliding_window_attn.py +9 -0
- optimum/rbln/transformers/__init__.py +44 -0
- optimum/rbln/transformers/modeling_attention_utils.py +124 -222
- optimum/rbln/transformers/modeling_outputs.py +25 -0
- optimum/rbln/transformers/modeling_rope_utils.py +78 -42
- optimum/rbln/transformers/models/__init__.py +38 -0
- optimum/rbln/transformers/models/auto/auto_factory.py +3 -3
- optimum/rbln/transformers/models/bart/bart_architecture.py +24 -24
- optimum/rbln/transformers/models/blip_2/configuration_blip_2.py +7 -2
- optimum/rbln/transformers/models/blip_2/modeling_blip_2.py +1 -1
- optimum/rbln/transformers/models/colpali/colpali_architecture.py +14 -20
- optimum/rbln/transformers/models/colpali/configuration_colpali.py +12 -17
- optimum/rbln/transformers/models/colpali/modeling_colpali.py +66 -182
- optimum/rbln/transformers/models/colqwen2/configuration_colqwen2.py +40 -23
- optimum/rbln/transformers/models/colqwen2/modeling_colqwen2.py +107 -371
- optimum/rbln/transformers/models/decoderonly/__init__.py +2 -0
- optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py +144 -17
- optimum/rbln/transformers/models/decoderonly/configuration_lora.py +1 -1
- optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py +122 -48
- optimum/rbln/transformers/models/decoderonly/decoderonly_runtime_utils.py +5 -7
- optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +120 -128
- optimum/rbln/transformers/models/detr/__init__.py +23 -0
- optimum/rbln/transformers/models/detr/configuration_detr.py +38 -0
- optimum/rbln/transformers/models/detr/modeling_detr.py +53 -0
- optimum/rbln/transformers/models/exaone/exaone_architecture.py +0 -36
- optimum/rbln/transformers/models/gemma/gemma_architecture.py +1 -1
- optimum/rbln/transformers/models/gemma2/__init__.py +16 -0
- optimum/rbln/transformers/models/gemma2/configuration_gemma2.py +45 -0
- optimum/rbln/transformers/models/gemma2/gemma2_architecture.py +83 -0
- optimum/rbln/transformers/models/gemma2/modeling_gemma2.py +101 -0
- optimum/rbln/transformers/models/gemma3/configuration_gemma3.py +2 -7
- optimum/rbln/transformers/models/gemma3/gemma3_architecture.py +16 -18
- optimum/rbln/transformers/models/gemma3/modeling_gemma3.py +5 -177
- optimum/rbln/transformers/models/gpt2/gpt2_architecture.py +8 -34
- optimum/rbln/transformers/models/gpt_oss/__init__.py +16 -0
- optimum/rbln/transformers/models/gpt_oss/configuration_gpt_oss.py +42 -0
- optimum/rbln/transformers/models/gpt_oss/gpt_oss_architecture.py +122 -0
- optimum/rbln/transformers/models/gpt_oss/modeling_gpt_oss.py +168 -0
- optimum/rbln/transformers/models/grounding_dino/configuration_grounding_dino.py +8 -5
- optimum/rbln/transformers/models/grounding_dino/grounding_dino_architecture.py +6 -4
- optimum/rbln/transformers/models/llava/modeling_llava.py +0 -1
- optimum/rbln/transformers/models/midm/midm_architecture.py +29 -22
- optimum/rbln/transformers/models/mixtral/__init__.py +16 -0
- optimum/rbln/transformers/models/mixtral/configuration_mixtral.py +38 -0
- optimum/rbln/transformers/models/mixtral/mixtral_architecture.py +76 -0
- optimum/rbln/transformers/models/mixtral/modeling_mixtral.py +68 -0
- optimum/rbln/transformers/models/opt/opt_architecture.py +1 -44
- optimum/rbln/transformers/models/paligemma/__init__.py +16 -0
- optimum/rbln/transformers/models/paligemma/configuration_paligemma.py +129 -0
- optimum/rbln/transformers/models/paligemma/modeling_paligemma.py +564 -0
- optimum/rbln/transformers/models/pegasus/pegasus_architecture.py +24 -24
- optimum/rbln/transformers/models/phi/phi_architecture.py +13 -21
- optimum/rbln/transformers/models/pixtral/modeling_pixtral.py +9 -5
- optimum/rbln/transformers/models/qwen2_5_vl/__init__.py +6 -1
- optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py +13 -1
- optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py +271 -122
- optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py +43 -39
- optimum/rbln/transformers/models/qwen2_moe/__init__.py +16 -0
- optimum/rbln/transformers/models/qwen2_moe/configuration_qwen2_moe.py +38 -0
- optimum/rbln/transformers/models/qwen2_moe/modeling_qwen2_moe.py +68 -0
- optimum/rbln/transformers/models/qwen2_moe/qwen2_moe_architecture.py +94 -0
- optimum/rbln/transformers/models/qwen2_vl/__init__.py +6 -1
- optimum/rbln/transformers/models/qwen2_vl/configuration_qwen2_vl.py +13 -1
- optimum/rbln/transformers/models/qwen2_vl/modeling_qwen2_vl.py +263 -105
- optimum/rbln/transformers/models/qwen2_vl/qwen2_vl_architecture.py +26 -34
- optimum/rbln/transformers/models/qwen3/qwen3_architecture.py +7 -7
- optimum/rbln/transformers/models/qwen3_moe/__init__.py +16 -0
- optimum/rbln/transformers/models/qwen3_moe/configuration_qwen3_moe.py +38 -0
- optimum/rbln/transformers/models/qwen3_moe/modeling_qwen3_moe.py +68 -0
- optimum/rbln/transformers/models/qwen3_moe/qwen3_moe_architecture.py +100 -0
- optimum/rbln/transformers/models/resnet/configuration_resnet.py +10 -4
- optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py +14 -12
- optimum/rbln/transformers/models/siglip/modeling_siglip.py +4 -18
- optimum/rbln/transformers/models/swin/configuration_swin.py +1 -6
- optimum/rbln/transformers/models/t5/t5_architecture.py +15 -16
- optimum/rbln/transformers/models/time_series_transformer/time_series_transformers_architecture.py +0 -3
- optimum/rbln/transformers/models/whisper/generation_whisper.py +8 -8
- optimum/rbln/transformers/models/whisper/whisper_architecture.py +0 -3
- optimum/rbln/transformers/utils/rbln_quantization.py +20 -12
- optimum/rbln/utils/deprecation.py +78 -1
- optimum/rbln/utils/hub.py +93 -2
- optimum/rbln/utils/import_utils.py +16 -1
- optimum/rbln/utils/runtime_utils.py +12 -8
- optimum/rbln/utils/submodule.py +24 -0
- {optimum_rbln-0.9.4a2.dist-info → optimum_rbln-0.10.0.post1.dist-info}/METADATA +6 -6
- {optimum_rbln-0.9.4a2.dist-info → optimum_rbln-0.10.0.post1.dist-info}/RECORD +107 -81
- optimum/rbln/transformers/models/colqwen2/colqwen2_architecture.py +0 -233
- {optimum_rbln-0.9.4a2.dist-info → optimum_rbln-0.10.0.post1.dist-info}/WHEEL +0 -0
- {optimum_rbln-0.9.4a2.dist-info → optimum_rbln-0.10.0.post1.dist-info}/entry_points.txt +0 -0
- {optimum_rbln-0.9.4a2.dist-info → optimum_rbln-0.10.0.post1.dist-info}/licenses/LICENSE +0 -0
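The newly added model families (DETR, Gemma2, GPT-OSS, Mixtral, PaliGemma, Qwen2-MoE, Qwen3-MoE) each follow the existing per-model layout of a configuration, architecture, and modeling module. A minimal loading sketch for one of them, assuming the Gemma2 support is exported as `RBLNGemma2ForCausalLM` and follows the usual optimum-rbln `from_pretrained(..., export=True, rbln_*)` convention; the checkpoint id and compile options below are illustrative and not taken from this diff:

```python
from optimum.rbln import RBLNGemma2ForCausalLM  # assumed export name

# Compile a Hugging Face checkpoint for RBLN NPUs and save the compiled artifacts.
model = RBLNGemma2ForCausalLM.from_pretrained(
    "google/gemma-2-2b-it",   # illustrative checkpoint id
    export=True,              # compile from the original (non-RBLN) checkpoint
    rbln_batch_size=1,        # illustrative compile-time options
    rbln_max_seq_len=8192,
)
model.save_pretrained("gemma-2-2b-it-rbln")
```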
--- a/optimum/rbln/transformers/models/phi/phi_architecture.py
+++ b/optimum/rbln/transformers/models/phi/phi_architecture.py
@@ -20,7 +20,6 @@ from transformers import PhiForCausalLM
 from ..decoderonly.decoderonly_architecture import (
     DecoderOnlyAttention,
     DecoderOnlyLayer,
-    DecoderOnlyModel,
     DecoderOnlyWrapper,
     apply_rotary_pos_emb_partial,
 )
@@ -37,9 +36,6 @@ class PhiWrapper(DecoderOnlyWrapper):
     def get_rbln_layer_class(self):
         return PhiLayer
 
-    def get_rbln_model_class(self):
-        return PhiModel
-
     def get_model_layer(self, model: Union["PhiForCausalLM", "PhiModel"]):
         return model.model if self.is_causal_lm else model
 
@@ -48,13 +44,15 @@ class PhiWrapper(DecoderOnlyWrapper):
 
 
 class PhiAttention(DecoderOnlyAttention):
-    def __post_init__(self):
-        self.q_proj =
-        self.k_proj =
-        self.v_proj =
-        self.o_proj =
-        self.qk_layernorm =
-        self.rotary_ndims =
+    def __post_init__(self, self_attn):
+        self.q_proj = self_attn.q_proj
+        self.k_proj = self_attn.k_proj
+        self.v_proj = self_attn.v_proj
+        self.o_proj = self_attn.dense
+        self.qk_layernorm = self_attn.qk_layernorm
+        self.rotary_ndims = self_attn.rotary_ndims
+        self.q_layernorm = getattr(self_attn, "q_layernorm", None)
+        self.k_layernorm = getattr(self_attn, "k_layernorm", None)
 
     def projection(self, hidden_states, lora_int_id) -> Tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
         if lora_int_id is not None:
@@ -65,8 +63,8 @@ class PhiAttention(DecoderOnlyAttention):
         value_states = self.v_proj(hidden_states)
 
         if self.qk_layernorm:
-            query_states = self.
-            key_states = self.
+            query_states = self.q_layernorm(query_states)
+            key_states = self.k_layernorm(key_states)
 
         return query_states, key_states, value_states
 
@@ -75,8 +73,7 @@ class PhiAttention(DecoderOnlyAttention):
 
 
 class PhiLayer(DecoderOnlyLayer):
-
-        raise NotImplementedError
+    _POST_ATTN_LAYERNORM = None
 
     def forward(
         self,
@@ -103,13 +100,8 @@ class PhiLayer(DecoderOnlyLayer):
             block_tables=block_tables,
         )
 
-        feed_forward_hidden_states = self.
+        feed_forward_hidden_states = self.mlp(hidden_states)
 
         hidden_states = attn_output + feed_forward_hidden_states + residual
 
         return hidden_states
-
-
-class PhiModel(DecoderOnlyModel):
-    def get_last_layernorm(self):
-        return self._original_mod.final_layernorm
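Two patterns stand out in this hunk: `__post_init__` now receives the original Hugging Face attention module (`self_attn`) and re-binds its projections explicitly (Phi names its output projection `dense`), and the overridden method that raised `NotImplementedError` is replaced by a class attribute `_POST_ATTN_LAYERNORM = None`, which fits Phi's parallel residual where attention and MLP outputs are added to the same residual stream. A small sketch of how such a class attribute could be consumed by the base layer; the base-class side shown here is an assumption for illustration, not code from this diff:

```python
class DecoderOnlyLayerSketch:
    # Name of the post-attention layernorm attribute on the HF layer; None means "no such norm".
    _POST_ATTN_LAYERNORM = "post_attention_layernorm"  # assumed default

    def get_post_attention_layernorm(self, hf_layer):
        if self._POST_ATTN_LAYERNORM is None:
            return None
        return getattr(hf_layer, self._POST_ATTN_LAYERNORM)


class PhiLayerSketch(DecoderOnlyLayerSketch):
    # Phi uses a single input layernorm and a parallel residual
    # (hidden = attn_output + mlp_output + residual), so there is nothing to fetch here.
    _POST_ATTN_LAYERNORM = None
```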
--- a/optimum/rbln/transformers/models/pixtral/modeling_pixtral.py
+++ b/optimum/rbln/transformers/models/pixtral/modeling_pixtral.py
@@ -297,13 +297,17 @@ class RBLNPixtralVisionModel(RBLNModel):
         Forward pass for the RBLN-optimized Pixtral vision model.
 
         Args:
-            pixel_values
-
-
-
+            pixel_values: Input images as a tensor of shape (batch_size, num_channels, image_size, image_size).
+                Pixel values can be obtained using PixtralImageProcessor. See PixtralImageProcessor.__call__()
+                for details (PixtralProcessor uses PixtralImageProcessor for processing images).
+            image_sizes: The sizes of the images in the batch as a tensor of shape (batch_size, 2),
+                being (height, width) for each image. Optional.
+            output_hidden_states: Whether or not to return the hidden states of all layers. Optional.
+                See hidden_states under returned tensors for more detail.
+            return_dict: Whether or not to return a ModelOutput instead of a plain tuple. Optional.
 
         Returns:
-
+            The model outputs. If return_dict=False is passed, returns a tuple of tensors. Otherwise, returns a BaseModelOutput object.
         """
         output_hidden_states = (
             output_hidden_states if output_hidden_states is not None else self.rbln_config.output_hidden_states
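The expanded docstring pins down the forward signature of `RBLNPixtralVisionModel`. A usage sketch against that signature, assuming the class is exported from `optimum.rbln` and compiled via the usual `from_pretrained(..., export=True)` flow; the checkpoint id, tensor shapes, and dummy inputs are illustrative only:

```python
import torch
from optimum.rbln import RBLNPixtralVisionModel  # assumed top-level export

# Compile the vision tower from a HF checkpoint (id is illustrative).
vision_model = RBLNPixtralVisionModel.from_pretrained("mistral-community/pixtral-12b", export=True)

pixel_values = torch.randn(1, 3, 512, 512)   # (batch_size, num_channels, H, W); real values come from PixtralImageProcessor
image_sizes = torch.tensor([[512, 512]])     # optional (height, width) per image

outputs = vision_model(
    pixel_values=pixel_values,
    image_sizes=image_sizes,
    output_hidden_states=True,   # also return per-layer hidden states
    return_dict=True,            # BaseModelOutput instead of a plain tuple
)
```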
--- a/optimum/rbln/transformers/models/qwen2_5_vl/__init__.py
+++ b/optimum/rbln/transformers/models/qwen2_5_vl/__init__.py
@@ -15,5 +15,10 @@
 from .configuration_qwen2_5_vl import (
     RBLNQwen2_5_VisionTransformerPretrainedModelConfig,
     RBLNQwen2_5_VLForConditionalGenerationConfig,
+    RBLNQwen2_5_VLModelConfig,
+)
+from .modeling_qwen2_5_vl import (
+    RBLNQwen2_5_VisionTransformerPretrainedModel,
+    RBLNQwen2_5_VLForConditionalGeneration,
+    RBLNQwen2_5_VLModel,
 )
-from .modeling_qwen2_5_vl import RBLNQwen2_5_VisionTransformerPretrainedModel, RBLNQwen2_5_VLForConditionalGeneration
--- a/optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py
+++ b/optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py
@@ -15,7 +15,7 @@
 from typing import Any, List, Optional, Union
 
 from ....configuration_utils import RBLNModelConfig
-from ..decoderonly.configuration_decoderonly import RBLNDecoderOnlyModelForCausalLMConfig
+from ..decoderonly.configuration_decoderonly import RBLNDecoderOnlyModelConfig, RBLNDecoderOnlyModelForCausalLMConfig
 
 
 class RBLNQwen2_5_VLForConditionalGenerationConfig(RBLNDecoderOnlyModelForCausalLMConfig):
@@ -56,6 +56,18 @@ class RBLNQwen2_5_VLForConditionalGenerationConfig(RBLNDecoderOnlyModelForCausal
         self.visual = visual
 
 
+class RBLNQwen2_5_VLModelConfig(RBLNDecoderOnlyModelConfig):
+    """
+    Configuration class for RBLNQwen2_5_VLModel.
+    """
+
+    submodules = ["visual"]
+
+    def __init__(self, visual: Optional[RBLNModelConfig] = None, **kwargs: Any):
+        super().__init__(**kwargs)
+        self.visual = self.initialize_submodule_config(submodule_config=visual)
+
+
 class RBLNQwen2_5_VisionTransformerPretrainedModelConfig(RBLNModelConfig):
     """
     Configuration class for RBLNQwen2_5_VisionTransformerPretrainedModel.