optimum-rbln 0.8.0__py3-none-any.whl → 0.8.0.post2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -17,5 +17,5 @@ __version__: str
17
17
  __version_tuple__: VERSION_TUPLE
18
18
  version_tuple: VERSION_TUPLE
19
19
 
20
- __version__ = version = '0.8.0'
21
- __version_tuple__ = version_tuple = (0, 8, 0)
20
+ __version__ = version = '0.8.0.post2'
21
+ __version_tuple__ = version_tuple = (0, 8, 0, 'post2')
@@ -474,7 +474,15 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
474
474
 
475
475
  if isinstance(submodule_config, dict):
476
476
  from_predecessor = self._runtime_options.copy()
477
+ from_predecessor.update(
478
+ {
479
+ "npu": self.npu,
480
+ "tensor_parallel_size": self.tensor_parallel_size,
481
+ "optimum_rbln_version": self.optimum_rbln_version,
482
+ }
483
+ )
477
484
  from_predecessor.update(kwargs)
485
+
478
486
  init_kwargs = from_predecessor
479
487
  init_kwargs.update(submodule_config)
480
488
  submodule_config = submodule_config_cls(**init_kwargs)
@@ -306,7 +306,7 @@ class RBLNRuntimeModel(RBLNPytorchRuntime):
306
306
 
307
307
  # Pad input and cache_position if the last chunk is smaller than `prefill_chunk_size`
308
308
  if query_length % self.prefill_chunk_size != 0:
309
- padding_size = self.prefill_chunk_size - query_length % self.prefill_chunk_size
309
+ padding_size = (self.prefill_chunk_size - query_length) % self.prefill_chunk_size
310
310
  # inputs_embeds
311
311
  if inputs.dim() == 3:
312
312
  inputs = torch.nn.functional.pad(inputs, (0, 0, 0, padding_size))
@@ -479,8 +479,9 @@ class RBLNGemma3RuntimeModel(RBLNRuntimeModel):
479
479
  )
480
480
 
481
481
  # Pad input and cache_position if the last chunk is smaller than `prefill_chunk_size`
482
+ padding_size = 0
482
483
  if query_length % self.prefill_chunk_size != 0:
483
- padding_size = self.prefill_chunk_size - query_length % self.prefill_chunk_size
484
+ padding_size = (self.prefill_chunk_size - query_length) % self.prefill_chunk_size
484
485
  # inputs_embeds
485
486
  if inputs.dim() == 3:
486
487
  inputs = torch.nn.functional.pad(inputs, (0, 0, 0, padding_size))
@@ -595,7 +595,7 @@ class RBLNQwen2_5_VLForConditionalGeneration(RBLNDecoderOnlyModelForCausalLM):
595
595
  )
596
596
  logits.append(output.logits)
597
597
  logits = torch.cat(logits, dim=0)
598
- # Decoder
598
+ # Decoder
599
599
  else:
600
600
  inputs_embeds, position_embed = self._preprocess_decoder(input_ids, cache_position)
601
601
  output = self.decoder(
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: optimum-rbln
3
- Version: 0.8.0
3
+ Version: 0.8.0.post2
4
4
  Summary: Optimum RBLN is the interface between the HuggingFace Transformers and Diffusers libraries and RBLN accelerators. It provides a set of tools enabling easy model loading and inference on single and multiple rbln device settings for different downstream tasks.
5
5
  Project-URL: Homepage, https://rebellions.ai
6
6
  Project-URL: Documentation, https://docs.rbln.ai
@@ -1,6 +1,6 @@
1
1
  optimum/rbln/__init__.py,sha256=oAnsJSMrPYwBGEttUt3CMXTIESVNe15ftTWRTShwhZI,14386
2
- optimum/rbln/__version__.py,sha256=fSm5pLlwHxfTD7vBTVEqChJUua9ilUsdQYNN_V3u3iE,511
3
- optimum/rbln/configuration_utils.py,sha256=gvAjRFEGw5rnSoH0IoyuLrE4fkxtk3DN1pikqrN_Rpk,31277
2
+ optimum/rbln/__version__.py,sha256=75bd_pNpUZxUHlc7qbG6-4x33AwcFJhMbPTXrvFx4-E,526
3
+ optimum/rbln/configuration_utils.py,sha256=HWOksqd8DHcytVoL9k00aWb6XQJ036DqVoWd2y-8ep8,31544
4
4
  optimum/rbln/modeling.py,sha256=BpydF-bLBF60NnRMbtZwn5odOUjU4Awu9azqGeSufTI,11462
5
5
  optimum/rbln/modeling_base.py,sha256=HQgscr5jpUEtuXU1ACJHSLIntX-kq6Ef0SQ_W2-rp5A,25341
6
6
  optimum/rbln/diffusers/__init__.py,sha256=XL6oKPHbPCV6IVCw3fu0-M9mD2KO_x6unx5kJdAtpVY,6180
@@ -87,7 +87,7 @@ optimum/rbln/transformers/models/clip/modeling_clip.py,sha256=UslcDN6otyQ_psou7F
87
87
  optimum/rbln/transformers/models/decoderonly/__init__.py,sha256=vQYZDDdoddwA7yKc5zzrq2Zs9sax-0p8rNF_aYfF4bk,1006
88
88
  optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py,sha256=WQlHUjcMuD_3BPLo1Ytzz-xAI-8J9BYfr7dEzmpLVks,6389
89
89
  optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py,sha256=m_wTGXSK8cBG3NjLDNLTxSWyErl7MB4PPU9fQ6zijEI,45991
90
- optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py,sha256=bYhw5co6aeueDNR2VHc9vwzhn9JL_fHTJS7E2bE6500,49471
90
+ optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py,sha256=NcmIbLTpj9X7lFFrVbnEm1UIh0cxgZhQdL9Iut6Z2qQ,49473
91
91
  optimum/rbln/transformers/models/dpt/__init__.py,sha256=Nzep9mlzKyL1kV726IBqY8DnLp1DkH9JzFeknWSRhok,714
92
92
  optimum/rbln/transformers/models/dpt/configuration_dpt.py,sha256=4fW6bzVhaAxym4wGV3F785rvUOoWPyw_gdEMqB08Leg,755
93
93
  optimum/rbln/transformers/models/dpt/modeling_dpt.py,sha256=oKLX7MQZvfk1QB8wOtcdi7AmZH2fOIVbypa9A3RA9MI,733
@@ -102,7 +102,7 @@ optimum/rbln/transformers/models/gemma/modeling_gemma.py,sha256=-U3w3cEOv3ps1S8a
102
102
  optimum/rbln/transformers/models/gemma3/__init__.py,sha256=6rugk3615SEt4lh7gduo_J9VyGiSReuEIvL0Uno0eaI,790
103
103
  optimum/rbln/transformers/models/gemma3/configuration_gemma3.py,sha256=RsowCftLZyluzuBwXsMMbHWOABslznMR7WY3rP2sAYw,3020
104
104
  optimum/rbln/transformers/models/gemma3/gemma3_architecture.py,sha256=Uer27wG06hgV1WNf92x1ZeUpl4Q0zskfCqzlLhtgtNU,17348
105
- optimum/rbln/transformers/models/gemma3/modeling_gemma3.py,sha256=OUGsML-H6FOKldld7KRW9l0nRoT4DojWBDl8ZHpfXVA,44982
105
+ optimum/rbln/transformers/models/gemma3/modeling_gemma3.py,sha256=t69RhSi0GWgBTdzhPY8wMT2EGrP0wcnks0fhkwVV3mk,45009
106
106
  optimum/rbln/transformers/models/gpt2/__init__.py,sha256=socBMIBZSiLbrVN12rQ4nL9gFeT0axMgz6SWaCaD4Ac,704
107
107
  optimum/rbln/transformers/models/gpt2/configuration_gpt2.py,sha256=vKvJD8P9Li4W9wdVoQcqMEr1MwEXojPBnF2NE85VXAo,772
108
108
  optimum/rbln/transformers/models/gpt2/gpt2_architecture.py,sha256=kf5jk7Djv9XXX3Q83oTosiMpt9g44TF_gCT-vMiWDJk,3097
@@ -139,7 +139,7 @@ optimum/rbln/transformers/models/qwen2/modeling_qwen2.py,sha256=9-aFDvjMzPNUyGOz
139
139
  optimum/rbln/transformers/models/qwen2/qwen2_architecture.py,sha256=XlNAMYAcDLohnSAhIFGKOPuCB5XLgzYs5ABWdeQSaZs,720
140
140
  optimum/rbln/transformers/models/qwen2_5_vl/__init__.py,sha256=rAW3DKQUzGL6EMwa5r1iLu94yhpiZpk6zfoD7TtYXrc,865
141
141
  optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py,sha256=dPcGNaLwJf61PIvVbyt-lvBflp_dvK0hubhNoA3len0,3123
142
- optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py,sha256=pb4OC5rRG-Y-a8WMBGqrV0owgjeGH83Lqx2fXztnlJg,25117
142
+ optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py,sha256=fD8_EdETHfu0oOqic5WtoETQ0RHD3jMUEBYl1aUQz94,25121
143
143
  optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py,sha256=OR-tTu8uzeFryenohoqRwgIVqw5zM7dcsZHwKL_jD0A,7232
144
144
  optimum/rbln/transformers/models/seq2seq/__init__.py,sha256=6WKstWiS1kW0oFDn_jyrKMW5QEJAWkmsSRAaadNedDM,715
145
145
  optimum/rbln/transformers/models/seq2seq/configuration_seq2seq2.py,sha256=vSNP1eILfL32cbiLOAD58Ocz6lk3hYFnhIRLDVqlSoI,2624
@@ -178,7 +178,7 @@ optimum/rbln/utils/model_utils.py,sha256=V2kFpUe2aqVzLwbpztD8JOVFQqRHncvIWwJbgnU
178
178
  optimum/rbln/utils/runtime_utils.py,sha256=LoKNK3AQNV_BSScstIZWjICkJf265MnUgy360BOocVI,5454
179
179
  optimum/rbln/utils/save_utils.py,sha256=hG5uOtYmecSXZuGTvCXsTM-SiyZpr5q3InUGCCq_jzQ,3619
180
180
  optimum/rbln/utils/submodule.py,sha256=ZfI7e3YzbjbbBW4Yjfucj8NygEsukfIkaJi3PtwHrhc,5105
181
- optimum_rbln-0.8.0.dist-info/METADATA,sha256=o162FwSFWUcaXw4SoFtdnPtAp14nkmE4wjRbY4O3HEU,5297
182
- optimum_rbln-0.8.0.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
183
- optimum_rbln-0.8.0.dist-info/licenses/LICENSE,sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE,11356
184
- optimum_rbln-0.8.0.dist-info/RECORD,,
181
+ optimum_rbln-0.8.0.post2.dist-info/METADATA,sha256=5id5JPtSaYR7FQG48Acy-NsGdB4GQqksqvgqTPu_1qU,5303
182
+ optimum_rbln-0.8.0.post2.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
183
+ optimum_rbln-0.8.0.post2.dist-info/licenses/LICENSE,sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE,11356
184
+ optimum_rbln-0.8.0.post2.dist-info/RECORD,,