optimum-rbln 0.8.0__py3-none-any.whl → 0.8.0.post2__py3-none-any.whl
This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
- optimum/rbln/__version__.py +2 -2
- optimum/rbln/configuration_utils.py +8 -0
- optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +1 -1
- optimum/rbln/transformers/models/gemma3/modeling_gemma3.py +2 -1
- optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py +1 -1
- {optimum_rbln-0.8.0.dist-info → optimum_rbln-0.8.0.post2.dist-info}/METADATA +1 -1
- {optimum_rbln-0.8.0.dist-info → optimum_rbln-0.8.0.post2.dist-info}/RECORD +9 -9
- {optimum_rbln-0.8.0.dist-info → optimum_rbln-0.8.0.post2.dist-info}/WHEEL +0 -0
- {optimum_rbln-0.8.0.dist-info → optimum_rbln-0.8.0.post2.dist-info}/licenses/LICENSE +0 -0
optimum/rbln/__version__.py
CHANGED
@@ -17,5 +17,5 @@ __version__: str
|
|
17
17
|
__version_tuple__: VERSION_TUPLE
|
18
18
|
version_tuple: VERSION_TUPLE
|
19
19
|
|
20
|
-
__version__ = version = '0.8.0'
|
21
|
-
__version_tuple__ = version_tuple = (0, 8, 0)
|
20
|
+
__version__ = version = '0.8.0.post2'
|
21
|
+
__version_tuple__ = version_tuple = (0, 8, 0, 'post2')
|
@@ -474,7 +474,15 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
|
|
474
474
|
|
475
475
|
if isinstance(submodule_config, dict):
|
476
476
|
from_predecessor = self._runtime_options.copy()
|
477
|
+
from_predecessor.update(
|
478
|
+
{
|
479
|
+
"npu": self.npu,
|
480
|
+
"tensor_parallel_size": self.tensor_parallel_size,
|
481
|
+
"optimum_rbln_version": self.optimum_rbln_version,
|
482
|
+
}
|
483
|
+
)
|
477
484
|
from_predecessor.update(kwargs)
|
485
|
+
|
478
486
|
init_kwargs = from_predecessor
|
479
487
|
init_kwargs.update(submodule_config)
|
480
488
|
submodule_config = submodule_config_cls(**init_kwargs)
|
@@ -306,7 +306,7 @@ class RBLNRuntimeModel(RBLNPytorchRuntime):
|
|
306
306
|
|
307
307
|
# Pad input and cache_position if the last chunk is smaller than `prefill_chunk_size`
|
308
308
|
if query_length % self.prefill_chunk_size != 0:
|
309
|
-
padding_size = self.prefill_chunk_size - query_length % self.prefill_chunk_size
|
309
|
+
padding_size = (self.prefill_chunk_size - query_length) % self.prefill_chunk_size
|
310
310
|
# inputs_embeds
|
311
311
|
if inputs.dim() == 3:
|
312
312
|
inputs = torch.nn.functional.pad(inputs, (0, 0, 0, padding_size))
|
@@ -479,8 +479,9 @@ class RBLNGemma3RuntimeModel(RBLNRuntimeModel):
|
|
479
479
|
)
|
480
480
|
|
481
481
|
# Pad input and cache_position if the last chunk is smaller than `prefill_chunk_size`
|
482
|
+
padding_size = 0
|
482
483
|
if query_length % self.prefill_chunk_size != 0:
|
483
|
-
padding_size = self.prefill_chunk_size - query_length % self.prefill_chunk_size
|
484
|
+
padding_size = (self.prefill_chunk_size - query_length) % self.prefill_chunk_size
|
484
485
|
# inputs_embeds
|
485
486
|
if inputs.dim() == 3:
|
486
487
|
inputs = torch.nn.functional.pad(inputs, (0, 0, 0, padding_size))
|
@@ -595,7 +595,7 @@ class RBLNQwen2_5_VLForConditionalGeneration(RBLNDecoderOnlyModelForCausalLM):
|
|
595
595
|
)
|
596
596
|
logits.append(output.logits)
|
597
597
|
logits = torch.cat(logits, dim=0)
|
598
|
-
|
598
|
+
# Decoder
|
599
599
|
else:
|
600
600
|
inputs_embeds, position_embed = self._preprocess_decoder(input_ids, cache_position)
|
601
601
|
output = self.decoder(
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: optimum-rbln
|
3
|
-
Version: 0.8.0
|
3
|
+
Version: 0.8.0.post2
|
4
4
|
Summary: Optimum RBLN is the interface between the HuggingFace Transformers and Diffusers libraries and RBLN accelerators. It provides a set of tools enabling easy model loading and inference on single and multiple rbln device settings for different downstream tasks.
|
5
5
|
Project-URL: Homepage, https://rebellions.ai
|
6
6
|
Project-URL: Documentation, https://docs.rbln.ai
|
@@ -1,6 +1,6 @@
|
|
1
1
|
optimum/rbln/__init__.py,sha256=oAnsJSMrPYwBGEttUt3CMXTIESVNe15ftTWRTShwhZI,14386
|
2
|
-
optimum/rbln/__version__.py,sha256=
|
3
|
-
optimum/rbln/configuration_utils.py,sha256=
|
2
|
+
optimum/rbln/__version__.py,sha256=75bd_pNpUZxUHlc7qbG6-4x33AwcFJhMbPTXrvFx4-E,526
|
3
|
+
optimum/rbln/configuration_utils.py,sha256=HWOksqd8DHcytVoL9k00aWb6XQJ036DqVoWd2y-8ep8,31544
|
4
4
|
optimum/rbln/modeling.py,sha256=BpydF-bLBF60NnRMbtZwn5odOUjU4Awu9azqGeSufTI,11462
|
5
5
|
optimum/rbln/modeling_base.py,sha256=HQgscr5jpUEtuXU1ACJHSLIntX-kq6Ef0SQ_W2-rp5A,25341
|
6
6
|
optimum/rbln/diffusers/__init__.py,sha256=XL6oKPHbPCV6IVCw3fu0-M9mD2KO_x6unx5kJdAtpVY,6180
|
@@ -87,7 +87,7 @@ optimum/rbln/transformers/models/clip/modeling_clip.py,sha256=UslcDN6otyQ_psou7F
|
|
87
87
|
optimum/rbln/transformers/models/decoderonly/__init__.py,sha256=vQYZDDdoddwA7yKc5zzrq2Zs9sax-0p8rNF_aYfF4bk,1006
|
88
88
|
optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py,sha256=WQlHUjcMuD_3BPLo1Ytzz-xAI-8J9BYfr7dEzmpLVks,6389
|
89
89
|
optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py,sha256=m_wTGXSK8cBG3NjLDNLTxSWyErl7MB4PPU9fQ6zijEI,45991
|
90
|
-
optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py,sha256=
|
90
|
+
optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py,sha256=NcmIbLTpj9X7lFFrVbnEm1UIh0cxgZhQdL9Iut6Z2qQ,49473
|
91
91
|
optimum/rbln/transformers/models/dpt/__init__.py,sha256=Nzep9mlzKyL1kV726IBqY8DnLp1DkH9JzFeknWSRhok,714
|
92
92
|
optimum/rbln/transformers/models/dpt/configuration_dpt.py,sha256=4fW6bzVhaAxym4wGV3F785rvUOoWPyw_gdEMqB08Leg,755
|
93
93
|
optimum/rbln/transformers/models/dpt/modeling_dpt.py,sha256=oKLX7MQZvfk1QB8wOtcdi7AmZH2fOIVbypa9A3RA9MI,733
|
@@ -102,7 +102,7 @@ optimum/rbln/transformers/models/gemma/modeling_gemma.py,sha256=-U3w3cEOv3ps1S8a
|
|
102
102
|
optimum/rbln/transformers/models/gemma3/__init__.py,sha256=6rugk3615SEt4lh7gduo_J9VyGiSReuEIvL0Uno0eaI,790
|
103
103
|
optimum/rbln/transformers/models/gemma3/configuration_gemma3.py,sha256=RsowCftLZyluzuBwXsMMbHWOABslznMR7WY3rP2sAYw,3020
|
104
104
|
optimum/rbln/transformers/models/gemma3/gemma3_architecture.py,sha256=Uer27wG06hgV1WNf92x1ZeUpl4Q0zskfCqzlLhtgtNU,17348
|
105
|
-
optimum/rbln/transformers/models/gemma3/modeling_gemma3.py,sha256=
|
105
|
+
optimum/rbln/transformers/models/gemma3/modeling_gemma3.py,sha256=t69RhSi0GWgBTdzhPY8wMT2EGrP0wcnks0fhkwVV3mk,45009
|
106
106
|
optimum/rbln/transformers/models/gpt2/__init__.py,sha256=socBMIBZSiLbrVN12rQ4nL9gFeT0axMgz6SWaCaD4Ac,704
|
107
107
|
optimum/rbln/transformers/models/gpt2/configuration_gpt2.py,sha256=vKvJD8P9Li4W9wdVoQcqMEr1MwEXojPBnF2NE85VXAo,772
|
108
108
|
optimum/rbln/transformers/models/gpt2/gpt2_architecture.py,sha256=kf5jk7Djv9XXX3Q83oTosiMpt9g44TF_gCT-vMiWDJk,3097
|
@@ -139,7 +139,7 @@ optimum/rbln/transformers/models/qwen2/modeling_qwen2.py,sha256=9-aFDvjMzPNUyGOz
|
|
139
139
|
optimum/rbln/transformers/models/qwen2/qwen2_architecture.py,sha256=XlNAMYAcDLohnSAhIFGKOPuCB5XLgzYs5ABWdeQSaZs,720
|
140
140
|
optimum/rbln/transformers/models/qwen2_5_vl/__init__.py,sha256=rAW3DKQUzGL6EMwa5r1iLu94yhpiZpk6zfoD7TtYXrc,865
|
141
141
|
optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py,sha256=dPcGNaLwJf61PIvVbyt-lvBflp_dvK0hubhNoA3len0,3123
|
142
|
-
optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py,sha256=
|
142
|
+
optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py,sha256=fD8_EdETHfu0oOqic5WtoETQ0RHD3jMUEBYl1aUQz94,25121
|
143
143
|
optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py,sha256=OR-tTu8uzeFryenohoqRwgIVqw5zM7dcsZHwKL_jD0A,7232
|
144
144
|
optimum/rbln/transformers/models/seq2seq/__init__.py,sha256=6WKstWiS1kW0oFDn_jyrKMW5QEJAWkmsSRAaadNedDM,715
|
145
145
|
optimum/rbln/transformers/models/seq2seq/configuration_seq2seq2.py,sha256=vSNP1eILfL32cbiLOAD58Ocz6lk3hYFnhIRLDVqlSoI,2624
|
@@ -178,7 +178,7 @@ optimum/rbln/utils/model_utils.py,sha256=V2kFpUe2aqVzLwbpztD8JOVFQqRHncvIWwJbgnU
|
|
178
178
|
optimum/rbln/utils/runtime_utils.py,sha256=LoKNK3AQNV_BSScstIZWjICkJf265MnUgy360BOocVI,5454
|
179
179
|
optimum/rbln/utils/save_utils.py,sha256=hG5uOtYmecSXZuGTvCXsTM-SiyZpr5q3InUGCCq_jzQ,3619
|
180
180
|
optimum/rbln/utils/submodule.py,sha256=ZfI7e3YzbjbbBW4Yjfucj8NygEsukfIkaJi3PtwHrhc,5105
|
181
|
-
optimum_rbln-0.8.0.dist-info/METADATA,sha256=
|
182
|
-
optimum_rbln-0.8.0.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
183
|
-
optimum_rbln-0.8.0.dist-info/licenses/LICENSE,sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE,11356
|
184
|
-
optimum_rbln-0.8.0.dist-info/RECORD,,
|
181
|
+
optimum_rbln-0.8.0.post2.dist-info/METADATA,sha256=5id5JPtSaYR7FQG48Acy-NsGdB4GQqksqvgqTPu_1qU,5303
|
182
|
+
optimum_rbln-0.8.0.post2.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
183
|
+
optimum_rbln-0.8.0.post2.dist-info/licenses/LICENSE,sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE,11356
|
184
|
+
optimum_rbln-0.8.0.post2.dist-info/RECORD,,
|
File without changes
|
File without changes
|