optimum-rbln 0.8.1rc1__py3-none-any.whl → 0.8.2a0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
optimum/rbln/transformers/models/gemma/gemma_architecture.py
@@ -12,54 +12,16 @@
  # See the License for the specific language governing permissions and
  # limitations under the License.

- from typing import TYPE_CHECKING

  from ...models.decoderonly.decoderonly_architecture import (
-     DecoderOnlyAttention,
-     DecoderOnlyFlashAttention,
-     DecoderOnlyForCausalLM,
-     DecoderOnlyLayer,
      DecoderOnlyModel,
      DecoderOnlyWrapper,
  )


- if TYPE_CHECKING:
-     from transformers import GemmaForCausalLM
-
-
  class GemmaWrapper(DecoderOnlyWrapper):
-     def convert_to_rbln_causal_lm(self, causal_lm: "GemmaForCausalLM", max_seq_len: int):
-         new_layers = []
-         for layer in causal_lm.model.layers:
-             if self.attn_impl == "eager":
-                 new_self_attn = DecoderOnlyAttention(
-                     layer.self_attn,
-                     self.use_attention_mask,
-                     kvcache_block_size=self.kvcache_block_size,
-                     use_position_ids=self.use_position_ids,
-                 )
-             elif self.attn_impl == "flash_attn":
-                 new_self_attn = DecoderOnlyFlashAttention(
-                     layer.self_attn,
-                     kvcache_partition_len=self.kvcache_partition_len,
-                     use_attention_mask=self.use_attention_mask,
-                     kvcache_block_size=self.kvcache_block_size,
-                     use_position_ids=self.use_position_ids,
-                 )
-             else:
-                 raise NotImplementedError(f"Unknwon attn : {self.attn_impl}")
-             new_layer = DecoderOnlyLayer(layer, new_self_attn)
-             new_layers.append(new_layer)
-         new_model = GemmaModel(
-             causal_lm.model,
-             new_layers,
-             partition_len=self.kvcache_partition_len,
-             max_seq_len=max_seq_len,
-             sliding_window_layers=self.sliding_window_layers,
-         )
-         new_causal_lm = DecoderOnlyForCausalLM(causal_lm, new_model)
-         return new_causal_lm
+     def get_rbln_model_class(self):
+         return GemmaModel


  class GemmaModel(DecoderOnlyModel):
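
Note: the same refactor repeats across every decoder-only architecture file in this diff. Each model's hand-written convert_to_rbln_causal_lm override is deleted in favor of small hook methods (get_rbln_attn_class, get_rbln_layer_class, get_rbln_model_class, plus the accessor hooks visible in the GPT2/Midm/OPT/Phi hunks below), which implies the shared conversion loop now lives once in DecoderOnlyWrapper (decoderonly_architecture.py, whose hash and size change in the RECORD below). A minimal sketch of that template-method shape, using stand-in classes; only the hook names are confirmed by this diff:

    # Hedged sketch, not the optimum-rbln source: stand-ins for the RBLN
    # wrapper classes, showing the template-method shape the diff implies.
    class Attention:                      # stand-in for DecoderOnlyAttention
        def __init__(self, orig_attn):
            self.orig_attn = orig_attn

    class Layer:                          # stand-in for DecoderOnlyLayer
        def __init__(self, orig_layer, attn):
            self.orig_layer, self.attn = orig_layer, attn

    class Model:                          # stand-in for DecoderOnlyModel
        def __init__(self, backbone, layers):
            self.backbone, self.layers = backbone, layers

    class Wrapper:                        # stand-in for DecoderOnlyWrapper
        def get_rbln_attn_class(self):
            return Attention

        def get_rbln_layer_class(self):
            return Layer

        def get_rbln_model_class(self):
            return Model

        def get_model_layer(self, causal_lm):
            return causal_lm.model             # GPT2/Midm override: .transformer

        def get_decoder_layers(self, causal_lm):
            return causal_lm.model.layers      # OPT override: .model.decoder.layers

        def get_attn_layer(self, layer):
            return layer.self_attn             # GPT2 override: layer.attn

        def convert_to_rbln_causal_lm(self, causal_lm, max_seq_len):
            # The real loop also threads kv-cache and attention-mask settings;
            # they are elided here to show only the hook structure.
            new_layers = [
                self.get_rbln_layer_class()(
                    layer,
                    self.get_rbln_attn_class()(self.get_attn_layer(layer)),
                )
                for layer in self.get_decoder_layers(causal_lm)
            ]
            return self.get_rbln_model_class()(
                self.get_model_layer(causal_lm), new_layers
            )

Under this shape, GemmaWrapper only has to name its model class, as the hunk above shows.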
optimum/rbln/transformers/models/gemma3/gemma3_architecture.py
@@ -13,15 +13,13 @@
  # limitations under the License.

  import copy
- from typing import TYPE_CHECKING, Optional, Tuple, Union
+ from typing import Optional, Tuple, Union

  import torch
  from transformers.models.gemma3.modeling_gemma3 import Gemma3RMSNorm

  from ..decoderonly.decoderonly_architecture import (
      DecoderOnlyAttention,
-     DecoderOnlyFlashAttention,
-     DecoderOnlyForCausalLM,
      DecoderOnlyLayer,
      DecoderOnlyModel,
      DecoderOnlyWrapper,
@@ -30,10 +28,6 @@ from ..decoderonly.decoderonly_architecture import (
  )


- if TYPE_CHECKING:
-     from transformers import Gemma3ForCausalLM
-
-
  class Gemma3ForCausalLMWrapper(DecoderOnlyWrapper):
      def get_rotary_emb(self, max_seq_len):
          rotary_emb_global = RotaryEmbedding(config=self.config, max_seq_len_cached=max_seq_len)
@@ -45,49 +39,14 @@ class Gemma3ForCausalLMWrapper(DecoderOnlyWrapper):

          return (rotary_emb_global, rotary_emb_local)

-     def convert_to_rbln_causal_lm(self, causal_lm: "Gemma3ForCausalLM", max_seq_len: int):
-         new_layers = []
-         for layer_idx, layer in enumerate(causal_lm.model.layers):
-             if layer_idx in self.sliding_window_layers:
-                 new_self_attn = Gemma3Attention(
-                     layer.self_attn,
-                     use_attention_mask=None,  # FIXME: no use in SWA
-                     use_position_ids=self.use_position_ids,
-                     kvcache_block_size=self.config.sliding_window,
-                     is_sliding=True,
-                 )
-             else:
-                 if self.attn_impl == "eager":
-                     new_self_attn = Gemma3Attention(
-                         layer.self_attn,
-                         use_attention_mask=self.use_attention_mask,
-                         use_position_ids=self.use_position_ids,
-                         kvcache_block_size=self.kvcache_block_size,
-                         is_sliding=False,
-                     )
-                 elif self.attn_impl == "flash_attn":
-                     new_self_attn = Gemma3FlashAttention(
-                         layer.self_attn,
-                         kvcache_partition_len=self.kvcache_partition_len,
-                         use_attention_mask=self.use_attention_mask,
-                         kvcache_block_size=self.kvcache_block_size,
-                         use_position_ids=self.use_position_ids,
-                     )
-                 else:
-                     raise NotImplementedError(f"Unknwon attn : {self.attn_impl}")
-
-             new_layer = Gemma3DecoderLayer(layer, new_self_attn)
-             new_layers.append(new_layer)
-
-         new_model = Gemma3TextModel(
-             causal_lm.model,
-             new_layers,
-             partition_len=self.kvcache_partition_len,
-             max_seq_len=max_seq_len,
-             sliding_window_layers=self.sliding_window_layers,
-         )
-         new_causal_lm = DecoderOnlyForCausalLM(causal_lm, new_model)
-         return new_causal_lm
+     def get_rbln_attn_class(self):
+         return Gemma3Attention
+
+     def get_rbln_layer_class(self):
+         return Gemma3DecoderLayer
+
+     def get_rbln_model_class(self):
+         return Gemma3TextModel


  class Gemma3TextModel(DecoderOnlyModel):
@@ -199,16 +158,3 @@ class Gemma3Attention(DecoderOnlyAttention):

      def get_attn_scale(self):
          return self._original_mod.config.query_pre_attn_scalar**-0.5
-
-
- class Gemma3FlashAttention(DecoderOnlyFlashAttention):
-     def __post_init__(self):
-         self.q_proj = self._original_mod.q_proj
-         self.k_proj = self._original_mod.k_proj
-         self.v_proj = self._original_mod.v_proj
-         self.o_proj = self._original_mod.o_proj
-         self.q_norm = self._original_mod.q_norm
-         self.k_norm = self._original_mod.k_norm
-
-     def get_attn_scale(self):
-         return self._original_mod.config.query_pre_attn_scalar**-0.5
optimum/rbln/transformers/models/gpt2/gpt2_architecture.py
@@ -17,10 +17,10 @@ from typing import TYPE_CHECKING, Tuple

  import torch
  import torch.nn as nn
+ from transformers import PreTrainedModel

  from ..decoderonly.decoderonly_architecture import (
      DecoderOnlyAttention,
-     DecoderOnlyForCausalLM,
      DecoderOnlyLayer,
      DecoderOnlyModel,
      DecoderOnlyWrapper,
@@ -32,27 +32,23 @@ if TYPE_CHECKING:


  class GPT2Wrapper(DecoderOnlyWrapper):
-     def convert_to_rbln_causal_lm(self, causal_lm: "GPT2LMHeadModel", max_seq_len: int):
-         if self.attn_impl != "eager":
-             raise NotImplementedError(f"flash attention ({self.attn_impl}) is not implemented for {self.__class__}")
-         new_layers = []
-         for layer in causal_lm.transformer.h:
-             new_self_attn = GPT2Attention(
-                 layer.attn,
-                 self.use_attention_mask,
-                 kvcache_block_size=self.kvcache_block_size,
-                 use_position_ids=self.use_position_ids,
-             )
-             new_layer = GPT2Layer(layer, new_self_attn)
-             new_layers.append(new_layer)
-         new_model = GPT2Model(
-             causal_lm.transformer,
-             new_layers,
-             max_seq_len=max_seq_len,
-             sliding_window_layers=self.sliding_window_layers,
-         )
-         new_causal_lm = DecoderOnlyForCausalLM(causal_lm, new_model)
-         return new_causal_lm
+     def get_rbln_attn_class(self):
+         return GPT2Attention
+
+     def get_rbln_layer_class(self):
+         return GPT2Layer
+
+     def get_rbln_model_class(self):
+         return GPT2Model
+
+     def get_attn_layer(self, layer: nn.Module):
+         return layer.attn
+
+     def get_model_layer(self, causal_lm: "GPT2LMHeadModel"):
+         return causal_lm.transformer
+
+     def get_decoder_layers(self, causal_lm: PreTrainedModel):
+         return causal_lm.transformer.h


  class GPT2Model(DecoderOnlyModel):
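
GPT-2 keeps its backbone at causal_lm.transformer, its decoder blocks at transformer.h, and per-block attention at block.attn, so GPT2Wrapper overrides the accessor hooks as well as the class hooks. A quick sketch of how those hooks resolve against a stock transformers GPT2LMHeadModel (the attribute paths are standard transformers API; the hook names come from the hunk above):

    # Sketch: how GPT2Wrapper's accessor hooks resolve against a real
    # transformers GPT2LMHeadModel (module paths match the hunk above).
    from transformers import GPT2LMHeadModel

    lm = GPT2LMHeadModel.from_pretrained("gpt2")  # any GPT-2 checkpoint
    backbone = lm.transformer                     # get_model_layer(lm)
    blocks = lm.transformer.h                     # get_decoder_layers(lm)
    first_attn = blocks[0].attn                   # get_attn_layer(blocks[0])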
optimum/rbln/transformers/models/midm/midm_architecture.py
@@ -20,7 +20,6 @@ import torch.nn as nn

  from ..decoderonly.decoderonly_architecture import (
      DecoderOnlyAttention,
-     DecoderOnlyForCausalLM,
      DecoderOnlyLayer,
      DecoderOnlyModel,
      DecoderOnlyWrapper,
@@ -55,27 +54,20 @@ class MidmLMHeadModelWrapper(DecoderOnlyWrapper):
          self.config.partial_rotary_factor = self.config.rotary_percentage
          return super().get_rotary_emb(max_seq_len=max_seq_len)

-     def convert_to_rbln_causal_lm(self, causal_lm: "MidmLMHeadModel", max_seq_len: int):
-         if self.attn_impl != "eager":
-             raise NotImplementedError(f"flash attention ({self.attn_impl}) is not implemented for {self.__class__}")
-         new_layers = []
-         for layer in causal_lm.transformer.h:
-             new_self_attn = MidmAttention(
-                 layer.attn,
-                 self.use_attention_mask,
-                 kvcache_block_size=self.kvcache_block_size,
-                 use_position_ids=self.use_position_ids,
-             )
-             new_layer = MidmLayer(layer, new_self_attn)
-             new_layers.append(new_layer)
-         new_model = MidmModel(
-             causal_lm.transformer,
-             new_layers,
-             max_seq_len=max_seq_len,
-             sliding_window_layers=self.sliding_window_layers,
-         )
-         new_causal_lm = DecoderOnlyForCausalLM(causal_lm, new_model)
-         return new_causal_lm
+     def get_rbln_attn_class(self):
+         return MidmAttention
+
+     def get_rbln_layer_class(self):
+         return MidmLayer
+
+     def get_rbln_model_class(self):
+         return MidmModel
+
+     def get_model_layer(self, causal_lm: "MidmLMHeadModel"):
+         return causal_lm.transformer
+
+     def get_decoder_layers(self, causal_lm: "MidmLMHeadModel"):
+         return causal_lm.transformer.h


  class MidmModel(DecoderOnlyModel):
optimum/rbln/transformers/models/opt/opt_architecture.py
@@ -18,7 +18,6 @@ import torch.nn as nn

  from ...models.decoderonly.decoderonly_architecture import (
      DecoderOnlyAttention,
-     DecoderOnlyForCausalLM,
      DecoderOnlyLayer,
      DecoderOnlyModel,
      DecoderOnlyWrapper,
@@ -30,30 +29,22 @@ if TYPE_CHECKING:


  class OPTWrapper(DecoderOnlyWrapper):
-     def convert_to_rbln_causal_lm(self, causal_lm: "OPTForCausalLM", max_seq_len: int):
-         if self.attn_impl != "eager":
-             raise NotImplementedError(f"flash attention ({self.attn_impl}) is not implemented for {self.__class__}")
-
-         new_layers = []
-
-         for layer in causal_lm.model.decoder.layers:
-             new_self_attn = OPTAttention(
-                 layer.self_attn,
-                 self.use_attention_mask,
-                 kvcache_block_size=self.kvcache_block_size,
-                 use_position_ids=self.use_position_ids,
-             )
-             new_layer = OPTDecoderLayer(layer, new_self_attn)
-             new_layers.append(new_layer)
-         new_model = OPTModel(
-             causal_lm.model.decoder,
-             new_layers,
-             max_seq_len=max_seq_len,
-             use_learned_pos_emb=True,
-             sliding_window_layers=self.sliding_window_layers,
-         )
-         new_causal_lm = DecoderOnlyForCausalLM(causal_lm, new_model)
-         return new_causal_lm
+     _use_learned_pos_emb = True
+
+     def get_rbln_attn_class(self):
+         return OPTAttention
+
+     def get_rbln_layer_class(self):
+         return OPTDecoderLayer
+
+     def get_rbln_model_class(self):
+         return OPTModel
+
+     def get_model_layer(self, causal_lm: "OPTForCausalLM"):
+         return causal_lm.model.decoder
+
+     def get_decoder_layers(self, causal_lm: "OPTForCausalLM"):
+         return causal_lm.model.decoder.layers


  class OPTAttention(DecoderOnlyAttention):
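
For OPT, the old call site's use_learned_pos_emb=True keyword becomes a _use_learned_pos_emb class attribute, which the shared conversion code can presumably read uniformly instead of each wrapper passing it through explicitly. A tiny sketch of that pattern (stand-in class names; how the base class consumes the flag is an assumption):

    # Hedged sketch: a per-call-site keyword becomes a class attribute,
    # assuming the shared base-class loop reads it uniformly.
    class WrapperBase:                    # stand-in for DecoderOnlyWrapper
        _use_learned_pos_emb = False      # assumed default (rotary embeddings)

    class OPTWrapperSketch(WrapperBase):
        _use_learned_pos_emb = True       # OPT uses learned position embeddings

    assert OPTWrapperSketch._use_learned_pos_emb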
optimum/rbln/transformers/models/phi/phi_architecture.py
@@ -19,7 +19,6 @@ from transformers import PhiForCausalLM

  from ..decoderonly.decoderonly_architecture import (
      DecoderOnlyAttention,
-     DecoderOnlyForCausalLM,
      DecoderOnlyLayer,
      DecoderOnlyModel,
      DecoderOnlyWrapper,
@@ -32,25 +31,20 @@ if TYPE_CHECKING:


  class PhiWrapper(DecoderOnlyWrapper):
-     def convert_to_rbln_causal_lm(self, causal_lm: "PhiForCausalLM", max_seq_len: int):
-         new_layers = []
-         for layer in causal_lm.model.layers:
-             if self.attn_impl == "eager":
-                 new_self_attn = PhiAttention(
-                     layer.self_attn,
-                     self.use_attention_mask,
-                     kvcache_block_size=self.kvcache_block_size,
-                     use_position_ids=self.use_position_ids,
-                 )
-             elif self.attn_impl == "flash_attn":
-                 raise NotImplementedError(f"flash attn for {self.__class__} is not implemented yet.")
-             else:
-                 raise NotImplementedError(f"Unknwon attn : {self.attn_impl}")
-             new_layer = PhiLayer(layer, new_self_attn)
-             new_layers.append(new_layer)
-         new_model = PhiModel(causal_lm.model, new_layers, sliding_window_layers=self.sliding_window_layers)
-         new_causal_lm = DecoderOnlyForCausalLM(causal_lm, new_model)
-         return new_causal_lm
+     def get_rbln_attn_class(self):
+         return PhiAttention
+
+     def get_rbln_layer_class(self):
+         return PhiLayer
+
+     def get_rbln_model_class(self):
+         return PhiModel
+
+     def get_model_layer(self, causal_lm: "PhiForCausalLM"):
+         return causal_lm.model
+
+     def get_decoder_layers(self, causal_lm: "PhiForCausalLM"):
+         return causal_lm.model.layers


  class PhiAttention(DecoderOnlyAttention):
optimum_rbln-0.8.1rc1.dist-info/METADATA → optimum_rbln-0.8.2a0.dist-info/METADATA
@@ -1,6 +1,6 @@
  Metadata-Version: 2.4
  Name: optimum-rbln
- Version: 0.8.1rc1
+ Version: 0.8.2a0
  Summary: Optimum RBLN is the interface between the HuggingFace Transformers and Diffusers libraries and RBLN accelerators. It provides a set of tools enabling easy model loading and inference on single and multiple rbln device settings for different downstream tasks.
  Project-URL: Homepage, https://rebellions.ai
  Project-URL: Documentation, https://docs.rbln.ai
optimum_rbln-0.8.1rc1.dist-info/RECORD → optimum_rbln-0.8.2a0.dist-info/RECORD
@@ -1,5 +1,5 @@
  optimum/rbln/__init__.py,sha256=MZCYmY4Y_Zfk0TGo3xK52osHDLZHz4cSdduXZt6RfSI,15316
- optimum/rbln/__version__.py,sha256=_HBfPPqmrksIsmr93RnGS_EXQHyrC_e0NtnXkbI_leI,521
+ optimum/rbln/__version__.py,sha256=kKne35dFUj-l3bjR0tLZka8O-dDdB-rFDsjhN13A2r4,519
  optimum/rbln/configuration_utils.py,sha256=o5oer7fBdE-MHLGNXoP35FjmuQbMmjEIDv0QE_k3kpo,32336
  optimum/rbln/modeling.py,sha256=bsvK6GQtoH9vx72Ea59kvv61jguOk9XDTzVjsY1ugkk,14248
  optimum/rbln/modeling_base.py,sha256=QpNkU_Do__JKmnHjaPzv47OhQwgGfVohisip1jqXa7A,23871
@@ -8,16 +8,16 @@ optimum/rbln/diffusers/modeling_diffusers.py,sha256=RjZNcYMU5daUIj-PAxyAwVoo2a9h
  optimum/rbln/diffusers/configurations/__init__.py,sha256=vMRnPY4s-Uju43xP038D2EA18X_mhy2YfsZVpSU-VoA,1322
  optimum/rbln/diffusers/configurations/models/__init__.py,sha256=7q95gtgDzCeIBogGw8SLQoHT4Wch7vpLJVF2UQovuoo,567
  optimum/rbln/diffusers/configurations/models/configuration_autoencoder_kl.py,sha256=ySetuNq6koleFIZ542zZLTzEEyl_CTul9l12ufWlQ_Y,3218
- optimum/rbln/diffusers/configurations/models/configuration_autoencoder_kl_cosmos.py,sha256=0BPZ4Tcz72j0a1KPdfpvk5G511wWNvS4MDJKbHAPzhA,4145
+ optimum/rbln/diffusers/configurations/models/configuration_autoencoder_kl_cosmos.py,sha256=SJfgbUz1LlRVuKQ_sHwPS262oOHF2TliKqM2z13wjEw,4172
  optimum/rbln/diffusers/configurations/models/configuration_controlnet.py,sha256=VDO_YFS_QhcHhuRIXQL53JZXEO27yoKHtecq5hd2la8,2637
  optimum/rbln/diffusers/configurations/models/configuration_prior_transformer.py,sha256=vE8RsXc27Z4-9k0KEM_vP7AWd5UUYvDgfX1g6nUrPp4,2224
- optimum/rbln/diffusers/configurations/models/configuration_transformer_cosmos.py,sha256=WOsC3sufsbwEEtsx0q8KqXUQE2VAFFCKRC7f2H4fmhg,3100
+ optimum/rbln/diffusers/configurations/models/configuration_transformer_cosmos.py,sha256=tqzBWzkl5PX60v8REGHuUC1WdJuIQv_2BGUOne5UYL8,3127
  optimum/rbln/diffusers/configurations/models/configuration_transformer_sd3.py,sha256=TAwHUyVy_9HSEZdXIuFCtrBfNIuYIedklJaCut5wEys,2412
  optimum/rbln/diffusers/configurations/models/configuration_unet_2d_condition.py,sha256=mxcbrOqLMnPpP-jnjSeRWPj2zwPMsgeQSq6LzhG2btA,3630
  optimum/rbln/diffusers/configurations/models/configuration_vq_model.py,sha256=dslGcfCZL_hNeVyjV-4FnCT1POmXuiaLbr6NcQSKgHg,3259
  optimum/rbln/diffusers/configurations/pipelines/__init__.py,sha256=RfJXQiYvgGc3Rp7JYk5s0AQd0XB5JCAb37_riGWQAYg,1268
  optimum/rbln/diffusers/configurations/pipelines/configuration_controlnet.py,sha256=nTtr2vqyr3zNSJXI0kiTAhOnVNhA-cVyaSnKOwBBZIo,14215
- optimum/rbln/diffusers/configurations/pipelines/configuration_cosmos.py,sha256=8GK9pAGzhtmQN2DQjgQZJo9S7y6dDko-Ii-3CagFxo4,4588
+ optimum/rbln/diffusers/configurations/pipelines/configuration_cosmos.py,sha256=tncXVraSYfrezqL9cT4kg5nuoifzYVfP0qHbgg0QUjA,4615
  optimum/rbln/diffusers/configurations/pipelines/configuration_kandinsky2_2.py,sha256=1ve6o4OEpjPzTXWHXy_T5MAI0V-F08PMv2W6nBFfeKU,16386
  optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion.py,sha256=kR8dV_RsmoDxhK5bAfv3PbtS5LpN5g-O-snAX1sP6Fo,6591
  optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_3.py,sha256=f2VOwvCd-9kDnUpwhb0LaMWgfwdmBzUKMpmCdhUv2sc,7923
@@ -44,7 +44,7 @@ optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py,sha256=
  optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py,sha256=HX56itORMqXLjZcwv25C-_z3JyZn3v6BpfIjsrDO3mE,46640
  optimum/rbln/diffusers/pipelines/cosmos/__init__.py,sha256=h2j6S8IJPVHeNU8qmW9vyXMgHBw0d7kQcuMAA5YoHPU,795
  optimum/rbln/diffusers/pipelines/cosmos/configuration_cosmos_guardrail.py,sha256=kDVnUBBGdumpDj2DaOpo5MSsFvlFIGY6BU1LZaFVqao,3327
- optimum/rbln/diffusers/pipelines/cosmos/cosmos_guardrail.py,sha256=lzT6j0RifZfIktETC5gd8GAKPHwekeb3JH56aPChOtI,18088
+ optimum/rbln/diffusers/pipelines/cosmos/cosmos_guardrail.py,sha256=EAt2UICPRTaUz4SNsQYOa9aoW0USj2qamqdhlf2ajrA,18261
  optimum/rbln/diffusers/pipelines/cosmos/pipeline_cosmos_text2world.py,sha256=TfhgAWVHUHvxsagBGLAVYKBoSMvuH7rg_xP5ZZ0rVU0,3910
  optimum/rbln/diffusers/pipelines/cosmos/pipeline_cosmos_video2world.py,sha256=-dl8AMwSuorIOxRNfyu1XhkJfmNVbSo3_Wkb2gAmUpo,3917
  optimum/rbln/diffusers/pipelines/kandinsky2_2/__init__.py,sha256=I4YQq2HfA3xONbWsdJ870IEJPyLWeCDDG-UCJsu9YO8,1035
@@ -90,18 +90,18 @@ optimum/rbln/transformers/models/bert/__init__.py,sha256=86FuGRBLw315_Roa9D5OUx6
  optimum/rbln/transformers/models/bert/configuration_bert.py,sha256=nEZnX6LXpLKWaoPEd4pWSysw9h-PLb2ld0ibC3dcJ7w,1611
  optimum/rbln/transformers/models/bert/modeling_bert.py,sha256=zR0US2laTT0yUkL6yyvrR5STQNJcYqtG98ez4SUYQAY,2040
  optimum/rbln/transformers/models/blip_2/__init__.py,sha256=L01gPXcUCa8Vg-bcng20vZvBIN_jlqCzwUSFuq0QOag,855
- optimum/rbln/transformers/models/blip_2/configuration_blip_2.py,sha256=Xl24Ao6xLblSR6u1TK--OHDsdKBVG6sDZz_hcEeoScY,3183
+ optimum/rbln/transformers/models/blip_2/configuration_blip_2.py,sha256=ke75GqPU139dNOY1nm6QE661LepbD_0V9Bx1QbtHhKA,3210
  optimum/rbln/transformers/models/blip_2/modeling_blip_2.py,sha256=2sIVGrIn1B2nUZ8hw1sgW3VbJ2vxrlBRN37GgDiw0GU,16191
  optimum/rbln/transformers/models/clip/__init__.py,sha256=TLeXDqcFK6M6v9x7Xr64kBbqGu3hFHM7p754dQ8UVQc,938
  optimum/rbln/transformers/models/clip/configuration_clip.py,sha256=D7CIWpbMhXUrGv-CnhxRtSS3vAYb427-w7zSkfuJHEU,3455
  optimum/rbln/transformers/models/clip/modeling_clip.py,sha256=QbYrt7pUWNal-p93fxmuKrHa2CPlCaq8F16qOfMAst0,8090
  optimum/rbln/transformers/models/colpali/__init__.py,sha256=n3rueXT_oC0N8myoZiic0YkVK24CW5hZBPa-0L8so6Y,119
  optimum/rbln/transformers/models/colpali/colpali_architecture.py,sha256=bWG7TehWRZkTh2y6mGkpd85_onWAyiyKdaQC9TFsy3E,8065
- optimum/rbln/transformers/models/colpali/configuration_colpali.py,sha256=yPzLYON6qRJlBkzxFfIBzBWd2KjYWvdClO4iAqd_V7E,2609
+ optimum/rbln/transformers/models/colpali/configuration_colpali.py,sha256=ieY-tuyDPObFUIJ5sfpcfuCsJ_HTAizN7ZGqirqeFRU,2636
  optimum/rbln/transformers/models/colpali/modeling_colpali.py,sha256=jzvJCBrrCXSpjfmJ3O-VvPNFGWGaNbpOV09JwLPAZWs,15757
  optimum/rbln/transformers/models/decoderonly/__init__.py,sha256=vQYZDDdoddwA7yKc5zzrq2Zs9sax-0p8rNF_aYfF4bk,1006
  optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py,sha256=cakn8RGo8gS3nmXdEqOfC2xUBOMGInROgLEbCOoLFR0,13398
- optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py,sha256=YAn8J_lIq4IS-HM_gbi5Qov8_osxhWtBr5z_28QRbGM,49667
+ optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py,sha256=8ovJ5_q_asqVTuVnAuK1m6genW0OSJ30Cd7HS9JXJgc,46363
  optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py,sha256=NmWdodIcXXChI61-Ej7StTe52iQvalMYRUDuNtcQVEI,53342
  optimum/rbln/transformers/models/distilbert/__init__.py,sha256=zXL78SOEORTnUN_wrdoaDaYpntG8lcFHvPobM6jC0CI,841
  optimum/rbln/transformers/models/distilbert/configuration_distilbert.py,sha256=O3BW9JjyYk9PLyiofvOKEgTdMZ_jpIuPfot281pSsyg,984
@@ -111,19 +111,19 @@ optimum/rbln/transformers/models/dpt/configuration_dpt.py,sha256=3Bb_K0sKI6TKeoH
  optimum/rbln/transformers/models/dpt/modeling_dpt.py,sha256=uIwdHAhGgSyj_ljwJsRv6i5nUr9lTzB2Ss0iz0HplfY,978
  optimum/rbln/transformers/models/exaone/__init__.py,sha256=eUL0mq3yGVzCQfjLlOtVF2MecIN3DQWm07EmXubGSTs,921
  optimum/rbln/transformers/models/exaone/configuration_exaone.py,sha256=S4s4kJemPbmn-otYv-XNHE40DJaEYY6cmzaWV6MTGsY,1388
- optimum/rbln/transformers/models/exaone/exaone_architecture.py,sha256=-gCUDIJ1SJqNgIALJejJ75XPtAkd83oyomBke9xGRsc,3610
+ optimum/rbln/transformers/models/exaone/exaone_architecture.py,sha256=lY4FwH2EZn_OY6sBIHlwxbfaEOEJ1eueUQJGB6Js62M,2306
  optimum/rbln/transformers/models/exaone/modeling_exaone.py,sha256=sr_ICK-rw_fYmLY5r0IOc-vDtSZEcSwFIQp3Gn92zqE,3929
  optimum/rbln/transformers/models/gemma/__init__.py,sha256=VqPIlokw3kjn_ZoLXINCLXw3vaysQFo5oPGGy6bnt4Q,708
  optimum/rbln/transformers/models/gemma/configuration_gemma.py,sha256=3hAxl7LL9vFpCHrs-g3BwVDdVjnnJ-fzSO88wdfyGDQ,1361
- optimum/rbln/transformers/models/gemma/gemma_architecture.py,sha256=I9EyRIEtMw9u7HhSa8PqUco4uNe3gl6_lx0r1uDT8hA,2546
+ optimum/rbln/transformers/models/gemma/gemma_architecture.py,sha256=2Ivay8NTSHmQAqXFh9JvG6Ja5rMThcRAjYPzyipcRI8,956
  optimum/rbln/transformers/models/gemma/modeling_gemma.py,sha256=Ojvum34EhDHWfMB4D6S1BrwoTNwuBSZuBzwdnAgvq38,3095
  optimum/rbln/transformers/models/gemma3/__init__.py,sha256=6rugk3615SEt4lh7gduo_J9VyGiSReuEIvL0Uno0eaI,790
  optimum/rbln/transformers/models/gemma3/configuration_gemma3.py,sha256=eupMGTHJGJNNrAZ3GE6M6GQBAQzBb7KFJvalyDmbM-A,3063
- optimum/rbln/transformers/models/gemma3/gemma3_architecture.py,sha256=sgFQQbvEr15tb2Sxk_tgcgQFcjhKGbNSW6fm2u7-Vck,8609
+ optimum/rbln/transformers/models/gemma3/gemma3_architecture.py,sha256=fpLDAXCe5paWVsfc0tL59JkRQMRF-WNgIzOIb_QpSLU,6191
  optimum/rbln/transformers/models/gemma3/modeling_gemma3.py,sha256=-cpU0ot46VFUZ6PtfwN9VJ-E44n6mP1E3dKwB99MtBM,38389
  optimum/rbln/transformers/models/gpt2/__init__.py,sha256=socBMIBZSiLbrVN12rQ4nL9gFeT0axMgz6SWaCaD4Ac,704
  optimum/rbln/transformers/models/gpt2/configuration_gpt2.py,sha256=9sS6-EGapmow3rG9ViejK9qwrqy_X86VBxQ7u9x0Yqk,923
- optimum/rbln/transformers/models/gpt2/gpt2_architecture.py,sha256=pnGgixjgjW7HULbs5211cC2guw_4e4-MlS69vdCRMMg,3206
+ optimum/rbln/transformers/models/gpt2/gpt2_architecture.py,sha256=O7hBiaFJrpLSswGwW83cX9S9Q2wKRBDrpAqOgOS7zQg,2733
  optimum/rbln/transformers/models/gpt2/modeling_gpt2.py,sha256=qBDanUk_O-HtOIVCA4IE3FYyCsnL9xIDK00vft-0caw,1490
  optimum/rbln/transformers/models/idefics3/__init__.py,sha256=ulxE7HEfXsNJhd25J9Fvi6vggo9aZH9sLKJjWB6LlzQ,814
  optimum/rbln/transformers/models/idefics3/configuration_idefics3.py,sha256=wKroy3m65zS41G80QXssbndHoHU8wtHTteGU2Q6qbws,2390
@@ -137,7 +137,7 @@ optimum/rbln/transformers/models/llava_next/configuration_llava_next.py,sha256=b
  optimum/rbln/transformers/models/llava_next/modeling_llava_next.py,sha256=paYtCk58--FSZp8xjVrfZAxkJxO02X-jxaVPqL-l7ZU,27421
  optimum/rbln/transformers/models/midm/__init__.py,sha256=IC3FETwgYinbp3wDj7tp4zIHJhbqM-c6GfTRdYcMNj8,913
  optimum/rbln/transformers/models/midm/configuration_midm.py,sha256=DxhcSJlApxfi00XxYmSkKZ6bY9vfLXT0zh-oMKkZot0,1365
- optimum/rbln/transformers/models/midm/midm_architecture.py,sha256=XXY_uDGkXeVQnKpmSWrgljgxtSdTgLLFLfMqtZdRJdM,5642
+ optimum/rbln/transformers/models/midm/midm_architecture.py,sha256=RlkmNhaWE5h_awt9aTtR8VZfshNTah0IoUfD2Z9vfxI,5055
  optimum/rbln/transformers/models/midm/modeling_midm.py,sha256=zbziYZ3f_dX_MOLwORTfJn22psZ1g3FFeQffM_TIh7A,3876
  optimum/rbln/transformers/models/mistral/__init__.py,sha256=9FE64bCYfSIyrBkRcwlqF8QyacSJFWvwEufHFi1ZIrM,716
  optimum/rbln/transformers/models/mistral/configuration_mistral.py,sha256=pMYJSwqmtx0uD2uExHx4S-JXal9rqQ5A2ulT2IoglTg,1383
@@ -146,11 +146,11 @@ optimum/rbln/transformers/models/mistral/modeling_mistral.py,sha256=SGzmn9EJeM27
  optimum/rbln/transformers/models/opt/__init__.py,sha256=w0v8GzbzlR5_4yL851njGDSJgX89TrYxrHnpNfMHZEI,700
  optimum/rbln/transformers/models/opt/configuration_opt.py,sha256=HgNCxnuoyZZwPoDMU41nvXG5DU9UHHSG8gvUSsm-r34,920
  optimum/rbln/transformers/models/opt/modeling_opt.py,sha256=aDijHHFOWBAjCJ_YrI7dcmuVuY69S1QD0115MQO9YFU,3667
- optimum/rbln/transformers/models/opt/opt_architecture.py,sha256=xRN0nNoZB4ZxKOmliFkI0xFQ1jy0hs42dv-hMyGOZ_Q,2802
+ optimum/rbln/transformers/models/opt/opt_architecture.py,sha256=El2l0n7YUWTakzZvqWyu58KNEbCc6zoHQhkqSLSsVm0,2202
  optimum/rbln/transformers/models/phi/__init__.py,sha256=uqQb-sO1HXuaju2hfo7qJHk_IWhnptY-qFjNjK_uOc0,700
  optimum/rbln/transformers/models/phi/configuration_phi.py,sha256=58jv3bIo_BcPcS9wU6NVgh67mGpHafdoQzStLKmfuU4,1349
  optimum/rbln/transformers/models/phi/modeling_phi.py,sha256=sd8XYKJkpZM7pWqN0DE7B-dJuTpF9b2_ebZgJK1AuJ8,3061
- optimum/rbln/transformers/models/phi/phi_architecture.py,sha256=nv3jx0zWeExYDSr9xHzgG8pssxC5qe6QGy6HmZKXYas,4241
+ optimum/rbln/transformers/models/phi/phi_architecture.py,sha256=yShRckC62i2nky3MvM_qGrhTXOo3FswwtNxd5fogduM,3574
  optimum/rbln/transformers/models/qwen2/__init__.py,sha256=Tu4_AXy3ktTvxGwxED3kewiv62S75HgDWD6-TeC1DfA,708
  optimum/rbln/transformers/models/qwen2/configuration_qwen2.py,sha256=Jc7qTFQgB9tbhJ-aPDN_lfyz9u0omNL84HWYBQ5fvcs,1359
  optimum/rbln/transformers/models/qwen2/modeling_qwen2.py,sha256=OKd7SXQLLtzPVolr26P1TvCV7Gf0XG7k6BjzjuvrL4s,3885
@@ -205,7 +205,7 @@ optimum/rbln/utils/model_utils.py,sha256=4k5879Kh75m3x_vS4-qOGfqsOiAvc2kdNFFfvsF
  optimum/rbln/utils/runtime_utils.py,sha256=D9PS8hfH1NBf8yH8cAu-XfdC9fxKzPbt4LFBVpADbbs,7180
  optimum/rbln/utils/save_utils.py,sha256=hG5uOtYmecSXZuGTvCXsTM-SiyZpr5q3InUGCCq_jzQ,3619
  optimum/rbln/utils/submodule.py,sha256=w5mgPgncI740gVKMu3S-69DGNdUSI0bTZxegQGcZ98Y,5011
- optimum_rbln-0.8.1rc1.dist-info/METADATA,sha256=52EcXRgXYVTSOWiLL_fQhxzsbZFrESQLFpluOvePehw,5300
- optimum_rbln-0.8.1rc1.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
- optimum_rbln-0.8.1rc1.dist-info/licenses/LICENSE,sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE,11356
- optimum_rbln-0.8.1rc1.dist-info/RECORD,,
+ optimum_rbln-0.8.2a0.dist-info/METADATA,sha256=dHMIEdFF_IuTWww99Iypz6HQKVDDk___EVJ8cK77eG0,5299
+ optimum_rbln-0.8.2a0.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+ optimum_rbln-0.8.2a0.dist-info/licenses/LICENSE,sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE,11356
+ optimum_rbln-0.8.2a0.dist-info/RECORD,,