optimum-rbln 0.7.5rc3__py3-none-any.whl → 0.8.1a0__py3-none-any.whl
This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions as they appear in their respective public registries.
- optimum/rbln/__version__.py +2 -2
- optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +3 -1
- optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py +1 -1
- {optimum_rbln-0.7.5rc3.dist-info → optimum_rbln-0.8.1a0.dist-info}/METADATA +1 -1
- {optimum_rbln-0.7.5rc3.dist-info → optimum_rbln-0.8.1a0.dist-info}/RECORD +7 -7
- {optimum_rbln-0.7.5rc3.dist-info → optimum_rbln-0.8.1a0.dist-info}/WHEEL +0 -0
- {optimum_rbln-0.7.5rc3.dist-info → optimum_rbln-0.8.1a0.dist-info}/licenses/LICENSE +0 -0
optimum/rbln/__version__.py
CHANGED
@@ -17,5 +17,5 @@ __version__: str
|
|
17
17
|
__version_tuple__: VERSION_TUPLE
|
18
18
|
version_tuple: VERSION_TUPLE
|
19
19
|
|
20
|
-
__version__ = version = '0.7.5rc3'
|
21
|
-
__version_tuple__ = version_tuple = (0, 7, 5, 'rc3')
|
20
|
+
__version__ = version = '0.8.1a0'
|
21
|
+
__version_tuple__ = version_tuple = (0, 8, 1, 'a0')
|
@@ -709,7 +709,9 @@ class RBLNDecoderOnlyModelForCausalLM(RBLNModel):
|
|
709
709
|
compiled_models[f"decoder_batch_{batch_size}"].get_alloc_per_node_by_key().items()
|
710
710
|
):
|
711
711
|
alloc_memory_by_key[key] += sum(memory_per_node)
|
712
|
-
|
712
|
+
|
713
|
+
alloc_memory_by_key.pop("PortRecur", None) # Old compiler's kv-cache Key
|
714
|
+
alloc_memory_by_key.pop("DramTensor", None) # kv-cache
|
713
715
|
kernel_size = alloc_memory_by_key.pop("Kernel") # model weight
|
714
716
|
|
715
717
|
# Get the maximum number of blocks that can be allocated
|
@@ -595,7 +595,7 @@ class RBLNQwen2_5_VLForConditionalGeneration(RBLNDecoderOnlyModelForCausalLM):
|
|
595
595
|
)
|
596
596
|
logits.append(output.logits)
|
597
597
|
logits = torch.cat(logits, dim=0)
|
598
|
-
|
598
|
+
# Decoder
|
599
599
|
else:
|
600
600
|
inputs_embeds, position_embed = self._preprocess_decoder(input_ids, cache_position)
|
601
601
|
output = self.decoder(
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: optimum-rbln
|
3
|
-
Version: 0.7.5rc3
|
3
|
+
Version: 0.8.1a0
|
4
4
|
Summary: Optimum RBLN is the interface between the HuggingFace Transformers and Diffusers libraries and RBLN accelerators. It provides a set of tools enabling easy model loading and inference on single and multiple rbln device settings for different downstream tasks.
|
5
5
|
Project-URL: Homepage, https://rebellions.ai
|
6
6
|
Project-URL: Documentation, https://docs.rbln.ai
|
@@ -1,5 +1,5 @@
|
|
1
1
|
optimum/rbln/__init__.py,sha256=oAnsJSMrPYwBGEttUt3CMXTIESVNe15ftTWRTShwhZI,14386
|
2
|
-
optimum/rbln/__version__.py,sha256=
|
2
|
+
optimum/rbln/__version__.py,sha256=8KrQ-gTLuRdO8nDDly9pCF_MZDqgHg6xW9QXyIjIHug,519
|
3
3
|
optimum/rbln/configuration_utils.py,sha256=gvAjRFEGw5rnSoH0IoyuLrE4fkxtk3DN1pikqrN_Rpk,31277
|
4
4
|
optimum/rbln/modeling.py,sha256=BpydF-bLBF60NnRMbtZwn5odOUjU4Awu9azqGeSufTI,11462
|
5
5
|
optimum/rbln/modeling_base.py,sha256=HQgscr5jpUEtuXU1ACJHSLIntX-kq6Ef0SQ_W2-rp5A,25341
|
@@ -87,7 +87,7 @@ optimum/rbln/transformers/models/clip/modeling_clip.py,sha256=UslcDN6otyQ_psou7F
|
|
87
87
|
optimum/rbln/transformers/models/decoderonly/__init__.py,sha256=vQYZDDdoddwA7yKc5zzrq2Zs9sax-0p8rNF_aYfF4bk,1006
|
88
88
|
optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py,sha256=WQlHUjcMuD_3BPLo1Ytzz-xAI-8J9BYfr7dEzmpLVks,6389
|
89
89
|
optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py,sha256=m_wTGXSK8cBG3NjLDNLTxSWyErl7MB4PPU9fQ6zijEI,45991
|
90
|
-
optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py,sha256=
|
90
|
+
optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py,sha256=hta8L3LB4nOMstSOFrPrbr2fIqzU5FMLev7UPB7eSJk,49561
|
91
91
|
optimum/rbln/transformers/models/dpt/__init__.py,sha256=Nzep9mlzKyL1kV726IBqY8DnLp1DkH9JzFeknWSRhok,714
|
92
92
|
optimum/rbln/transformers/models/dpt/configuration_dpt.py,sha256=4fW6bzVhaAxym4wGV3F785rvUOoWPyw_gdEMqB08Leg,755
|
93
93
|
optimum/rbln/transformers/models/dpt/modeling_dpt.py,sha256=oKLX7MQZvfk1QB8wOtcdi7AmZH2fOIVbypa9A3RA9MI,733
|
@@ -139,7 +139,7 @@ optimum/rbln/transformers/models/qwen2/modeling_qwen2.py,sha256=9-aFDvjMzPNUyGOz
|
|
139
139
|
optimum/rbln/transformers/models/qwen2/qwen2_architecture.py,sha256=XlNAMYAcDLohnSAhIFGKOPuCB5XLgzYs5ABWdeQSaZs,720
|
140
140
|
optimum/rbln/transformers/models/qwen2_5_vl/__init__.py,sha256=rAW3DKQUzGL6EMwa5r1iLu94yhpiZpk6zfoD7TtYXrc,865
|
141
141
|
optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py,sha256=dPcGNaLwJf61PIvVbyt-lvBflp_dvK0hubhNoA3len0,3123
|
142
|
-
optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py,sha256=
|
142
|
+
optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py,sha256=pb4OC5rRG-Y-a8WMBGqrV0owgjeGH83Lqx2fXztnlJg,25117
|
143
143
|
optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py,sha256=OR-tTu8uzeFryenohoqRwgIVqw5zM7dcsZHwKL_jD0A,7232
|
144
144
|
optimum/rbln/transformers/models/seq2seq/__init__.py,sha256=6WKstWiS1kW0oFDn_jyrKMW5QEJAWkmsSRAaadNedDM,715
|
145
145
|
optimum/rbln/transformers/models/seq2seq/configuration_seq2seq2.py,sha256=vSNP1eILfL32cbiLOAD58Ocz6lk3hYFnhIRLDVqlSoI,2624
|
@@ -178,7 +178,7 @@ optimum/rbln/utils/model_utils.py,sha256=V2kFpUe2aqVzLwbpztD8JOVFQqRHncvIWwJbgnU
|
|
178
178
|
optimum/rbln/utils/runtime_utils.py,sha256=LoKNK3AQNV_BSScstIZWjICkJf265MnUgy360BOocVI,5454
|
179
179
|
optimum/rbln/utils/save_utils.py,sha256=hG5uOtYmecSXZuGTvCXsTM-SiyZpr5q3InUGCCq_jzQ,3619
|
180
180
|
optimum/rbln/utils/submodule.py,sha256=ZfI7e3YzbjbbBW4Yjfucj8NygEsukfIkaJi3PtwHrhc,5105
|
181
|
-
optimum_rbln-0.
|
182
|
-
optimum_rbln-0.
|
183
|
-
optimum_rbln-0.
|
184
|
-
optimum_rbln-0.
|
181
|
+
optimum_rbln-0.8.1a0.dist-info/METADATA,sha256=oggHE1bTirnlPGJnS1TWULpx6etS6lUuS3-dB6vJxXQ,5299
|
182
|
+
optimum_rbln-0.8.1a0.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
183
|
+
optimum_rbln-0.8.1a0.dist-info/licenses/LICENSE,sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE,11356
|
184
|
+
optimum_rbln-0.8.1a0.dist-info/RECORD,,
|
File without changes
|
File without changes
|