optimum-rbln 0.9.4a2__py3-none-any.whl → 0.10.0.post1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- optimum/rbln/__init__.py +44 -0
- optimum/rbln/__version__.py +2 -2
- optimum/rbln/configuration_utils.py +230 -67
- optimum/rbln/diffusers/models/controlnet.py +2 -2
- optimum/rbln/diffusers/models/transformers/prior_transformer.py +2 -2
- optimum/rbln/diffusers/models/transformers/transformer_cosmos.py +2 -2
- optimum/rbln/diffusers/models/transformers/transformer_sd3.py +2 -2
- optimum/rbln/diffusers/pipelines/auto_pipeline.py +2 -3
- optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py +3 -12
- optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +2 -4
- optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +1 -3
- optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +1 -3
- optimum/rbln/diffusers/pipelines/cosmos/cosmos_guardrail.py +2 -2
- optimum/rbln/modeling_base.py +11 -10
- optimum/rbln/ops/__init__.py +1 -0
- optimum/rbln/ops/attn.py +10 -0
- optimum/rbln/ops/flash_attn.py +8 -0
- optimum/rbln/ops/moe.py +180 -0
- optimum/rbln/ops/sliding_window_attn.py +9 -0
- optimum/rbln/transformers/__init__.py +44 -0
- optimum/rbln/transformers/modeling_attention_utils.py +124 -222
- optimum/rbln/transformers/modeling_outputs.py +25 -0
- optimum/rbln/transformers/modeling_rope_utils.py +78 -42
- optimum/rbln/transformers/models/__init__.py +38 -0
- optimum/rbln/transformers/models/auto/auto_factory.py +3 -3
- optimum/rbln/transformers/models/bart/bart_architecture.py +24 -24
- optimum/rbln/transformers/models/blip_2/configuration_blip_2.py +7 -2
- optimum/rbln/transformers/models/blip_2/modeling_blip_2.py +1 -1
- optimum/rbln/transformers/models/colpali/colpali_architecture.py +14 -20
- optimum/rbln/transformers/models/colpali/configuration_colpali.py +12 -17
- optimum/rbln/transformers/models/colpali/modeling_colpali.py +66 -182
- optimum/rbln/transformers/models/colqwen2/configuration_colqwen2.py +40 -23
- optimum/rbln/transformers/models/colqwen2/modeling_colqwen2.py +107 -371
- optimum/rbln/transformers/models/decoderonly/__init__.py +2 -0
- optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py +144 -17
- optimum/rbln/transformers/models/decoderonly/configuration_lora.py +1 -1
- optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py +122 -48
- optimum/rbln/transformers/models/decoderonly/decoderonly_runtime_utils.py +5 -7
- optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +120 -128
- optimum/rbln/transformers/models/detr/__init__.py +23 -0
- optimum/rbln/transformers/models/detr/configuration_detr.py +38 -0
- optimum/rbln/transformers/models/detr/modeling_detr.py +53 -0
- optimum/rbln/transformers/models/exaone/exaone_architecture.py +0 -36
- optimum/rbln/transformers/models/gemma/gemma_architecture.py +1 -1
- optimum/rbln/transformers/models/gemma2/__init__.py +16 -0
- optimum/rbln/transformers/models/gemma2/configuration_gemma2.py +45 -0
- optimum/rbln/transformers/models/gemma2/gemma2_architecture.py +83 -0
- optimum/rbln/transformers/models/gemma2/modeling_gemma2.py +101 -0
- optimum/rbln/transformers/models/gemma3/configuration_gemma3.py +2 -7
- optimum/rbln/transformers/models/gemma3/gemma3_architecture.py +16 -18
- optimum/rbln/transformers/models/gemma3/modeling_gemma3.py +5 -177
- optimum/rbln/transformers/models/gpt2/gpt2_architecture.py +8 -34
- optimum/rbln/transformers/models/gpt_oss/__init__.py +16 -0
- optimum/rbln/transformers/models/gpt_oss/configuration_gpt_oss.py +42 -0
- optimum/rbln/transformers/models/gpt_oss/gpt_oss_architecture.py +122 -0
- optimum/rbln/transformers/models/gpt_oss/modeling_gpt_oss.py +168 -0
- optimum/rbln/transformers/models/grounding_dino/configuration_grounding_dino.py +8 -5
- optimum/rbln/transformers/models/grounding_dino/grounding_dino_architecture.py +6 -4
- optimum/rbln/transformers/models/llava/modeling_llava.py +0 -1
- optimum/rbln/transformers/models/midm/midm_architecture.py +29 -22
- optimum/rbln/transformers/models/mixtral/__init__.py +16 -0
- optimum/rbln/transformers/models/mixtral/configuration_mixtral.py +38 -0
- optimum/rbln/transformers/models/mixtral/mixtral_architecture.py +76 -0
- optimum/rbln/transformers/models/mixtral/modeling_mixtral.py +68 -0
- optimum/rbln/transformers/models/opt/opt_architecture.py +1 -44
- optimum/rbln/transformers/models/paligemma/__init__.py +16 -0
- optimum/rbln/transformers/models/paligemma/configuration_paligemma.py +129 -0
- optimum/rbln/transformers/models/paligemma/modeling_paligemma.py +564 -0
- optimum/rbln/transformers/models/pegasus/pegasus_architecture.py +24 -24
- optimum/rbln/transformers/models/phi/phi_architecture.py +13 -21
- optimum/rbln/transformers/models/pixtral/modeling_pixtral.py +9 -5
- optimum/rbln/transformers/models/qwen2_5_vl/__init__.py +6 -1
- optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py +13 -1
- optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py +271 -122
- optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py +43 -39
- optimum/rbln/transformers/models/qwen2_moe/__init__.py +16 -0
- optimum/rbln/transformers/models/qwen2_moe/configuration_qwen2_moe.py +38 -0
- optimum/rbln/transformers/models/qwen2_moe/modeling_qwen2_moe.py +68 -0
- optimum/rbln/transformers/models/qwen2_moe/qwen2_moe_architecture.py +94 -0
- optimum/rbln/transformers/models/qwen2_vl/__init__.py +6 -1
- optimum/rbln/transformers/models/qwen2_vl/configuration_qwen2_vl.py +13 -1
- optimum/rbln/transformers/models/qwen2_vl/modeling_qwen2_vl.py +263 -105
- optimum/rbln/transformers/models/qwen2_vl/qwen2_vl_architecture.py +26 -34
- optimum/rbln/transformers/models/qwen3/qwen3_architecture.py +7 -7
- optimum/rbln/transformers/models/qwen3_moe/__init__.py +16 -0
- optimum/rbln/transformers/models/qwen3_moe/configuration_qwen3_moe.py +38 -0
- optimum/rbln/transformers/models/qwen3_moe/modeling_qwen3_moe.py +68 -0
- optimum/rbln/transformers/models/qwen3_moe/qwen3_moe_architecture.py +100 -0
- optimum/rbln/transformers/models/resnet/configuration_resnet.py +10 -4
- optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py +14 -12
- optimum/rbln/transformers/models/siglip/modeling_siglip.py +4 -18
- optimum/rbln/transformers/models/swin/configuration_swin.py +1 -6
- optimum/rbln/transformers/models/t5/t5_architecture.py +15 -16
- optimum/rbln/transformers/models/time_series_transformer/time_series_transformers_architecture.py +0 -3
- optimum/rbln/transformers/models/whisper/generation_whisper.py +8 -8
- optimum/rbln/transformers/models/whisper/whisper_architecture.py +0 -3
- optimum/rbln/transformers/utils/rbln_quantization.py +20 -12
- optimum/rbln/utils/deprecation.py +78 -1
- optimum/rbln/utils/hub.py +93 -2
- optimum/rbln/utils/import_utils.py +16 -1
- optimum/rbln/utils/runtime_utils.py +12 -8
- optimum/rbln/utils/submodule.py +24 -0
- {optimum_rbln-0.9.4a2.dist-info → optimum_rbln-0.10.0.post1.dist-info}/METADATA +6 -6
- {optimum_rbln-0.9.4a2.dist-info → optimum_rbln-0.10.0.post1.dist-info}/RECORD +107 -81
- optimum/rbln/transformers/models/colqwen2/colqwen2_architecture.py +0 -233
- {optimum_rbln-0.9.4a2.dist-info → optimum_rbln-0.10.0.post1.dist-info}/WHEEL +0 -0
- {optimum_rbln-0.9.4a2.dist-info → optimum_rbln-0.10.0.post1.dist-info}/entry_points.txt +0 -0
- {optimum_rbln-0.9.4a2.dist-info → optimum_rbln-0.10.0.post1.dist-info}/licenses/LICENSE +0 -0
|
@@ -1,9 +1,9 @@
|
|
|
1
|
-
optimum/rbln/__init__.py,sha256=
|
|
2
|
-
optimum/rbln/__version__.py,sha256=
|
|
1
|
+
optimum/rbln/__init__.py,sha256=ZValjdJsI0eMqOD33WfLDZhaO7UnHkP5EQAbSW-Uy54,21128
|
|
2
|
+
optimum/rbln/__version__.py,sha256=HXLwAU0-LV6usn1tU_KE6YdRJ-qAdgeGvm-VXk2nbe0,721
|
|
3
3
|
optimum/rbln/cli.py,sha256=944P_f9btDyFryHfHzxUKQvwXWYD1hrceDuK6SWNQcQ,22832
|
|
4
|
-
optimum/rbln/configuration_utils.py,sha256=
|
|
4
|
+
optimum/rbln/configuration_utils.py,sha256=pNNRWWcsmwy6VQzhtBF79ptanqccLD7F_br2WgIWWVg,44619
|
|
5
5
|
optimum/rbln/modeling.py,sha256=M9kEqbAqVZIeFxOF9dyfS8i7loJz3LV67zf1wzeVcxM,15218
|
|
6
|
-
optimum/rbln/modeling_base.py,sha256=
|
|
6
|
+
optimum/rbln/modeling_base.py,sha256=PmWBe-DiVYMGl77yJbZ3SitZqfVaz_Ot4JPVoQIM0Fo,27791
|
|
7
7
|
optimum/rbln/diffusers/__init__.py,sha256=dISoQ-mylK-n9DM0doqo3oeQFA2SWu9BZcbrcr4vO0I,7800
|
|
8
8
|
optimum/rbln/diffusers/modeling_diffusers.py,sha256=M4lpr5fdbL9fAGVPc_1IY9evxDA47rV68WyvK9jhnO0,20423
|
|
9
9
|
optimum/rbln/diffusers/configurations/__init__.py,sha256=8xhIEEa9HTbIg-9khGvxqr6kHPaMnnHZc-BNsEADO1o,1458
|
|
@@ -27,7 +27,7 @@ optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_3
|
|
|
27
27
|
optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_xl.py,sha256=qX6-HvOt8SBstEeigWWcor-z2bmyoqAucjRirNfma5o,7161
|
|
28
28
|
optimum/rbln/diffusers/configurations/pipelines/configuration_stable_video_diffusion.py,sha256=k5OZtqsmEd6Ruaw2AMU_M674LziR3bsOZFVEIE0RUO0,5156
|
|
29
29
|
optimum/rbln/diffusers/models/__init__.py,sha256=lTwyUgCSKCm6xksQFDOsyWAfqwbWYMum3BVlh31eADk,1804
|
|
30
|
-
optimum/rbln/diffusers/models/controlnet.py,sha256=
|
|
30
|
+
optimum/rbln/diffusers/models/controlnet.py,sha256=DXnVa6ExNPJl1FmjLRuXL31Z5iVOtc5f_It1Z1d4Dv0,11563
|
|
31
31
|
optimum/rbln/diffusers/models/autoencoders/__init__.py,sha256=sFfYxz0Iwg-xL2jrVkwMk7umiWcsbrtejzjpUZFI1VA,816
|
|
32
32
|
optimum/rbln/diffusers/models/autoencoders/autoencoder_kl.py,sha256=TDwSgO3L6L38JdH-FaxWc77aDkilr8WLL1YjjWMHz-M,9496
|
|
33
33
|
optimum/rbln/diffusers/models/autoencoders/autoencoder_kl_cosmos.py,sha256=WD3hUlZMJSEpeLx_hmrFQmR2Ye6TtCo3Olz4pxB5rsg,9538
|
|
@@ -35,23 +35,23 @@ optimum/rbln/diffusers/models/autoencoders/autoencoder_kl_temporal_decoder.py,sh
|
|
|
35
35
|
optimum/rbln/diffusers/models/autoencoders/vae.py,sha256=t6HHU2Cz2puwkOfk7fSVAxt5Wre7b6nZu-_Fo93Sexw,6086
|
|
36
36
|
optimum/rbln/diffusers/models/autoencoders/vq_model.py,sha256=bIvrtCjFFS5iYXEcQaQBB52VWS0OHAzJTfUOnD_V5aQ,7706
|
|
37
37
|
optimum/rbln/diffusers/models/transformers/__init__.py,sha256=3oTqAOok-dUR2KealC41CKt36dpKq3IT4kabmHkrCpg,767
|
|
38
|
-
optimum/rbln/diffusers/models/transformers/prior_transformer.py,sha256=
|
|
39
|
-
optimum/rbln/diffusers/models/transformers/transformer_cosmos.py,sha256=
|
|
40
|
-
optimum/rbln/diffusers/models/transformers/transformer_sd3.py,sha256=
|
|
38
|
+
optimum/rbln/diffusers/models/transformers/prior_transformer.py,sha256=YPCsfomj2ydGyOcAib6qVnBv0DuLFVpBr1NtkhGcmVE,6339
|
|
39
|
+
optimum/rbln/diffusers/models/transformers/transformer_cosmos.py,sha256=3KOidJT8dIE_vXCdUE_VXDpvDN0DJ3wXWU2kV8f73A8,14060
|
|
40
|
+
optimum/rbln/diffusers/models/transformers/transformer_sd3.py,sha256=7gWhdKCZ-WQFFhirnSVhzmTlf77zepdQqu1EQekqh_U,7846
|
|
41
41
|
optimum/rbln/diffusers/models/unets/__init__.py,sha256=k_c6RfSc_Yln9gINfKxl0coiHfAO_2-zpaLMrQCJr2w,736
|
|
42
42
|
optimum/rbln/diffusers/models/unets/unet_2d_condition.py,sha256=b1frE2BKKs7P6T22P99feQvMmP3NDe2sGLygHJg0RQs,17224
|
|
43
43
|
optimum/rbln/diffusers/models/unets/unet_spatio_temporal_condition.py,sha256=vSGk2wR6Xg8aDCaeVOb2E2SB_XCL9jUe1XDwuBPdKRA,7771
|
|
44
44
|
optimum/rbln/diffusers/pipelines/__init__.py,sha256=B8nRikvGrOSbaNFrp0is2GE4R9xVkhkvl8bxAUILsI4,3859
|
|
45
|
-
optimum/rbln/diffusers/pipelines/auto_pipeline.py,sha256=
|
|
45
|
+
optimum/rbln/diffusers/pipelines/auto_pipeline.py,sha256=4gMLw-esrj0L6KqG0bpJTRLEAp-zzvl3wFWsl_Bm0a8,12481
|
|
46
46
|
optimum/rbln/diffusers/pipelines/controlnet/__init__.py,sha256=n1Ef22TSeax-kENi_d8K6wGGHSNEo9QkUeygELHgcao,983
|
|
47
47
|
optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py,sha256=-6SFcfYr8FJD1y11_OOntWCNSqBpOgPkst0Ys6oIvXU,5295
|
|
48
|
-
optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py,sha256=
|
|
49
|
-
optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py,sha256=
|
|
50
|
-
optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py,sha256=
|
|
51
|
-
optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py,sha256=
|
|
48
|
+
optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py,sha256=YaDFJRRU2GoXnpdtcXmYyG6DiwSil4tGZKtuk5-CYc8,35758
|
|
49
|
+
optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py,sha256=1gHDWqnpAdVpg_-TuhqskJmM_tEcrKBG4G18WS0qEgg,34722
|
|
50
|
+
optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py,sha256=OgWZH3MaSPClKnliZ1tSX-ZN-EcdY55bsKmOJeLsttA,45831
|
|
51
|
+
optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py,sha256=Lmw9_pprEl_AqLvc7hsWLhBqqb4xktE7YrUvRgeX5P0,47171
|
|
52
52
|
optimum/rbln/diffusers/pipelines/cosmos/__init__.py,sha256=h2j6S8IJPVHeNU8qmW9vyXMgHBw0d7kQcuMAA5YoHPU,795
|
|
53
53
|
optimum/rbln/diffusers/pipelines/cosmos/configuration_cosmos_guardrail.py,sha256=BRHWXCxRO5l0YTFTBSkS4sd5Hx8YeuHB14Fr2copYFY,3747
|
|
54
|
-
optimum/rbln/diffusers/pipelines/cosmos/cosmos_guardrail.py,sha256=
|
|
54
|
+
optimum/rbln/diffusers/pipelines/cosmos/cosmos_guardrail.py,sha256=jy-H5Q8E7Ze8q_U6lItjaPTOWySYVpBNsTrg_GU5ALw,16668
|
|
55
55
|
optimum/rbln/diffusers/pipelines/cosmos/pipeline_cosmos_text2world.py,sha256=Nuewu5__SYQxcJcCR7rer1pqQ3YV52eSMb_0hAZeItk,5650
|
|
56
56
|
optimum/rbln/diffusers/pipelines/cosmos/pipeline_cosmos_video2world.py,sha256=KI7E5Iv401D2RZX3rjkec49ZYvGBnbkwDPQoHeRLIMU,5656
|
|
57
57
|
optimum/rbln/diffusers/pipelines/kandinsky2_2/__init__.py,sha256=I4YQq2HfA3xONbWsdJ870IEJPyLWeCDDG-UCJsu9YO8,1035
|
|
@@ -74,27 +74,28 @@ optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_x
|
|
|
74
74
|
optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py,sha256=XUchrMMrm70KKOheSUM6mmzoGWtTyCKd9vkAcd5kvEo,1407
|
|
75
75
|
optimum/rbln/diffusers/pipelines/stable_video_diffusion/__init__.py,sha256=8Mqu_saC_Wp67Zx5UKq90eeKv8tzv8bIm5z9lUdoa3o,677
|
|
76
76
|
optimum/rbln/diffusers/pipelines/stable_video_diffusion/pipeline_stable_video_diffusion.py,sha256=ApXTZZB_tzOBBCY97xHc6tg60-eY3zWXCtEWd3Ou3i4,1864
|
|
77
|
-
optimum/rbln/ops/__init__.py,sha256=
|
|
78
|
-
optimum/rbln/ops/attn.py,sha256=
|
|
79
|
-
optimum/rbln/ops/flash_attn.py,sha256=
|
|
77
|
+
optimum/rbln/ops/__init__.py,sha256=9d4zXHpf4EUYxUBt84_TFqpLcBVDHrBtuQ16vL35iPQ,757
|
|
78
|
+
optimum/rbln/ops/attn.py,sha256=fMSwLi0hSyI9StFGmdcyJKBcPVPzSYgo77e3asvT3og,13189
|
|
79
|
+
optimum/rbln/ops/flash_attn.py,sha256=IOQMF6NmYJjxxhvwo25Y2vDjMKivPSGjBX0W_9Xa1XM,8154
|
|
80
80
|
optimum/rbln/ops/kv_cache_update.py,sha256=aIvK2Sp7M3EfJzJgNvIvAJv4emoN6QOhmgaWj-VboLs,1440
|
|
81
81
|
optimum/rbln/ops/linear.py,sha256=5K3pcrrUHu_p8LrMIU-jX2TnafksveFjjZSCsYSp_yw,1328
|
|
82
|
-
optimum/rbln/ops/
|
|
83
|
-
optimum/rbln/
|
|
82
|
+
optimum/rbln/ops/moe.py,sha256=WJBFt88e3dEaLzs45PTD1vcnYhWTs6yHhNdKMROl9_E,5435
|
|
83
|
+
optimum/rbln/ops/sliding_window_attn.py,sha256=1geQsTLGzoOusTF9Uw-2QzWI8h8MsmD5qYEYG0gTvXw,3784
|
|
84
|
+
optimum/rbln/transformers/__init__.py,sha256=J2-drEitLkuqzZ23bF8FOoT5ke4bUhqeKTLmBZil5H8,14305
|
|
84
85
|
optimum/rbln/transformers/configuration_generic.py,sha256=5_KWSqcpsEoAHXhMzEpLV62m-0DlWqCY_zwgi9kzjIs,4161
|
|
85
|
-
optimum/rbln/transformers/modeling_attention_utils.py,sha256=
|
|
86
|
+
optimum/rbln/transformers/modeling_attention_utils.py,sha256=cM7rsWVFvkEXCw1oA8jlvfBJCErgBlfIyyxGKCmOybs,12693
|
|
86
87
|
optimum/rbln/transformers/modeling_generic.py,sha256=Z_1m5d_hsmQC2qnNkargjMIqlIm3FzBFTNUKqdYdaOc,11499
|
|
87
|
-
optimum/rbln/transformers/modeling_outputs.py,sha256=
|
|
88
|
-
optimum/rbln/transformers/modeling_rope_utils.py,sha256=
|
|
89
|
-
optimum/rbln/transformers/models/__init__.py,sha256=
|
|
88
|
+
optimum/rbln/transformers/modeling_outputs.py,sha256=7ANZ-i-pnY1iBHwD64Gizqdk5RyiAS1htO7EInTMNU0,2411
|
|
89
|
+
optimum/rbln/transformers/modeling_rope_utils.py,sha256=vKs2b1jI1PVxi7dlcLKZvm-T-9OdRPCRt_QZxZg7IyY,16383
|
|
90
|
+
optimum/rbln/transformers/models/__init__.py,sha256=EMLydC1CvBzRKYzMAoL5BCNRRixkjJgvjhMuTggJGWo,15427
|
|
90
91
|
optimum/rbln/transformers/models/audio_spectrogram_transformer/__init__.py,sha256=I2vL4lrzbT5p4eJcH-EKHzEfcPkj_XVsie7jb9q6yic,775
|
|
91
92
|
optimum/rbln/transformers/models/audio_spectrogram_transformer/configuration_audio_spectrogram_transformer.py,sha256=biFBo1twaWScF2CmNYoF_PW-RvJBUfVgBVpdfI_igBY,1741
|
|
92
93
|
optimum/rbln/transformers/models/audio_spectrogram_transformer/modeling_audio_spectrogram_transformer.py,sha256=Kzya5XlU15FkEQlWj1HYXBAGrJleEyF9wiTSiHXSIqo,4124
|
|
93
94
|
optimum/rbln/transformers/models/auto/__init__.py,sha256=tdYqXkg9xBGNr4fZjH7_O3qRVbHvpEVjrJ6wtNUMMJM,1150
|
|
94
|
-
optimum/rbln/transformers/models/auto/auto_factory.py,sha256=
|
|
95
|
+
optimum/rbln/transformers/models/auto/auto_factory.py,sha256=cgF7c9U9NJLZCsy0Dv50abGdK8PP7l-5he5w0WLjhiw,11859
|
|
95
96
|
optimum/rbln/transformers/models/auto/modeling_auto.py,sha256=Iu5vl60CHX1XNbn445woZhSUkNSf0qHPW0DzbcAnDYE,5797
|
|
96
97
|
optimum/rbln/transformers/models/bart/__init__.py,sha256=fVo-gZEmJ0yxkIxEX6ciuRAGgXNyuvaXE2s88bhbjAE,830
|
|
97
|
-
optimum/rbln/transformers/models/bart/bart_architecture.py,sha256=
|
|
98
|
+
optimum/rbln/transformers/models/bart/bart_architecture.py,sha256=XaUy0fV-HMwywS_ncO6B3q5IHFApWR6QqyMm9kzYO7I,6077
|
|
98
99
|
optimum/rbln/transformers/models/bart/configuration_bart.py,sha256=PrRA7OwPTegPamd_mmVnwNygRbNG7pZrsrXdKyfZ6Bo,1351
|
|
99
100
|
optimum/rbln/transformers/models/bart/modeling_bart.py,sha256=FCSZFmq0bhPHkne-1tmsxiQH3E427VfkWtLU9Nct3a0,3276
|
|
100
101
|
optimum/rbln/transformers/models/bert/__init__.py,sha256=86FuGRBLw315_Roa9D5OUx6Ku2PM0DqSPZ-YSqbF-io,806
|
|
@@ -102,30 +103,32 @@ optimum/rbln/transformers/models/bert/bert_architecture.py,sha256=cZgf-B-FV8qbeJ
|
|
|
102
103
|
optimum/rbln/transformers/models/bert/configuration_bert.py,sha256=nEZnX6LXpLKWaoPEd4pWSysw9h-PLb2ld0ibC3dcJ7w,1611
|
|
103
104
|
optimum/rbln/transformers/models/bert/modeling_bert.py,sha256=jVMouqvwqUEKSMcwefPmxopVjGAN-9LodN2THtaWzEg,6435
|
|
104
105
|
optimum/rbln/transformers/models/blip_2/__init__.py,sha256=L01gPXcUCa8Vg-bcng20vZvBIN_jlqCzwUSFuq0QOag,855
|
|
105
|
-
optimum/rbln/transformers/models/blip_2/configuration_blip_2.py,sha256=
|
|
106
|
-
optimum/rbln/transformers/models/blip_2/modeling_blip_2.py,sha256=
|
|
106
|
+
optimum/rbln/transformers/models/blip_2/configuration_blip_2.py,sha256=D2KcNd_o8jx47QUZX-EE8EFWliH53bzMtrBi9l9ORXY,4842
|
|
107
|
+
optimum/rbln/transformers/models/blip_2/modeling_blip_2.py,sha256=9mpiapxja1QWxPPTOqCY9vmnn-08fg06kAp0vANrAgk,21634
|
|
107
108
|
optimum/rbln/transformers/models/clip/__init__.py,sha256=TLeXDqcFK6M6v9x7Xr64kBbqGu3hFHM7p754dQ8UVQc,938
|
|
108
109
|
optimum/rbln/transformers/models/clip/configuration_clip.py,sha256=Ea8TCVmMayydfw9p4kTP3UdtvoaPWf4Z4claB61JuE4,4175
|
|
109
110
|
optimum/rbln/transformers/models/clip/modeling_clip.py,sha256=CeHl52UVr2UVKUeWTyT8OcRWXsZzrLnQpjzK_neu304,14835
|
|
110
111
|
optimum/rbln/transformers/models/colpali/__init__.py,sha256=n3rueXT_oC0N8myoZiic0YkVK24CW5hZBPa-0L8so6Y,119
|
|
111
|
-
optimum/rbln/transformers/models/colpali/colpali_architecture.py,sha256=
|
|
112
|
-
optimum/rbln/transformers/models/colpali/configuration_colpali.py,sha256=
|
|
113
|
-
optimum/rbln/transformers/models/colpali/modeling_colpali.py,sha256=
|
|
112
|
+
optimum/rbln/transformers/models/colpali/colpali_architecture.py,sha256=qeAdCmYHcDLNmFyIwYSIo1hI9K_8dyVgD76wDShdolo,7816
|
|
113
|
+
optimum/rbln/transformers/models/colpali/configuration_colpali.py,sha256=9qFi2N1T-3crCYzxG6JVmIr2eFh_SbT1wDIDF4B-Nck,2893
|
|
114
|
+
optimum/rbln/transformers/models/colpali/modeling_colpali.py,sha256=sKf0k5h5AGkOl9kVyYQ_Cj77_37otVA6A5Q3sPtZSRU,10479
|
|
114
115
|
optimum/rbln/transformers/models/colqwen2/__init__.py,sha256=gEKc5X4uGME4XKySDD1H6JlT89jaMvZ00HqbDVXNHU8,123
|
|
115
|
-
optimum/rbln/transformers/models/colqwen2/
|
|
116
|
-
optimum/rbln/transformers/models/colqwen2/
|
|
117
|
-
optimum/rbln/transformers/models/
|
|
118
|
-
optimum/rbln/transformers/models/decoderonly/
|
|
119
|
-
optimum/rbln/transformers/models/decoderonly/
|
|
120
|
-
optimum/rbln/transformers/models/decoderonly/
|
|
121
|
-
optimum/rbln/transformers/models/decoderonly/
|
|
122
|
-
optimum/rbln/transformers/models/decoderonly/decoderonly_runtime_utils.py,sha256=vY7S-4ms4eW3WIEGLfjDzX3dsQKcc6QHhOiUOXyWSWc,29268
|
|
116
|
+
optimum/rbln/transformers/models/colqwen2/configuration_colqwen2.py,sha256=nzz-mq11MXxoKaz8QgHTs8ywGkGS30BDTxoCOS5LGQA,3199
|
|
117
|
+
optimum/rbln/transformers/models/colqwen2/modeling_colqwen2.py,sha256=bZD6uvJ0lv8AjifG7lzsdR7q5F7NaQibQhsBlJm_sII,7946
|
|
118
|
+
optimum/rbln/transformers/models/decoderonly/__init__.py,sha256=uVUvtkIZ1ewX-9fHsPlmJSfAQTuT1WTFUT1rBLuXSHQ,1165
|
|
119
|
+
optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py,sha256=d9HqTmp_sRqT7bW2CH6QaQIBJUx8W5-bmkpAf02ki40,22331
|
|
120
|
+
optimum/rbln/transformers/models/decoderonly/configuration_lora.py,sha256=DAKpiqN1F53p3gImcUDsapUkRvOq3x3Igi9iAC4rNHo,17357
|
|
121
|
+
optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py,sha256=sCIe0LUTmWe1GaeXsbpf0g_rHnUL4ekvCMJ1R1J2GSk,51996
|
|
122
|
+
optimum/rbln/transformers/models/decoderonly/decoderonly_runtime_utils.py,sha256=FfPQuNMn7fQfEjWpFKvfkI4mUpRtcm20tUd17QrF4Cw,29216
|
|
123
123
|
optimum/rbln/transformers/models/decoderonly/generation_decoderonly.py,sha256=_Rp1vtGow4quWHnIKpHtZFGMxrLjIN-FCc6gz0XL1Sc,5539
|
|
124
124
|
optimum/rbln/transformers/models/decoderonly/lora_architecture.py,sha256=c4O5N56Y2uS-gxsXITt19qmqyV2rqSlPEHxkmOnWE2s,8306
|
|
125
|
-
optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py,sha256=
|
|
125
|
+
optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py,sha256=YP6D3YyLx_9e6yPKla_iDuXOoYrSW9x1OxLzByGhamg,39451
|
|
126
126
|
optimum/rbln/transformers/models/depth_anything/__init__.py,sha256=xvPSIriMJWyNeVYoVB1Z7YqB4kkHOIkaHq7loNps-dk,756
|
|
127
127
|
optimum/rbln/transformers/models/depth_anything/configuration_depth_anything.py,sha256=JujBVEUa_zZDXNPr1y-B_PhK5SgFFcY8Ib4EoGjjtmE,989
|
|
128
128
|
optimum/rbln/transformers/models/depth_anything/modeling_depth_anything.py,sha256=RxscJiKp7PDmbQTDUy2R_Ryxf_0YZ0TieRS5bg53dyQ,1698
|
|
129
|
+
optimum/rbln/transformers/models/detr/__init__.py,sha256=2e5tMUW64MQhMiWmUdU7CaFGxttM4zNtE5DLxrXi0vk,809
|
|
130
|
+
optimum/rbln/transformers/models/detr/configuration_detr.py,sha256=DyWTe6h6lb0Eb1ujDtQmCDCBpONp3bSnv7TFIUJmX2M,1489
|
|
131
|
+
optimum/rbln/transformers/models/detr/modeling_detr.py,sha256=euG1H4hGbdoyw00nAkbPGsv0OFYsuk3QJ5VB4QUhTJo,2075
|
|
129
132
|
optimum/rbln/transformers/models/distilbert/__init__.py,sha256=zXL78SOEORTnUN_wrdoaDaYpntG8lcFHvPobM6jC0CI,841
|
|
130
133
|
optimum/rbln/transformers/models/distilbert/configuration_distilbert.py,sha256=O3BW9JjyYk9PLyiofvOKEgTdMZ_jpIuPfot281pSsyg,984
|
|
131
134
|
optimum/rbln/transformers/models/distilbert/modeling_distilbert.py,sha256=wvMDMj0bTs9j-ZYi2hjGWNj65hEGai2pb6uWJZGEQ5A,2093
|
|
@@ -134,24 +137,32 @@ optimum/rbln/transformers/models/dpt/configuration_dpt.py,sha256=3Bb_K0sKI6TKeoH
|
|
|
134
137
|
optimum/rbln/transformers/models/dpt/modeling_dpt.py,sha256=2XnXwCTeJ7Vj28yK7kvqWxrViqikteX-7l-Ys7ubJpY,1649
|
|
135
138
|
optimum/rbln/transformers/models/exaone/__init__.py,sha256=eUL0mq3yGVzCQfjLlOtVF2MecIN3DQWm07EmXubGSTs,921
|
|
136
139
|
optimum/rbln/transformers/models/exaone/configuration_exaone.py,sha256=S4s4kJemPbmn-otYv-XNHE40DJaEYY6cmzaWV6MTGsY,1388
|
|
137
|
-
optimum/rbln/transformers/models/exaone/exaone_architecture.py,sha256=
|
|
140
|
+
optimum/rbln/transformers/models/exaone/exaone_architecture.py,sha256=jdl18rSIokNJDQDw2dZzPOYymfORSHXABqVUqhIMFUI,1322
|
|
138
141
|
optimum/rbln/transformers/models/exaone/modeling_exaone.py,sha256=yW0Hws35v_70OGn0nmDNMXAsnAzniyxUZ78VmjIbpJg,6060
|
|
139
142
|
optimum/rbln/transformers/models/gemma/__init__.py,sha256=HQISZaSrhwGtsvGuHqkiyMhoS1QAVhd0tXXCaCruq4U,746
|
|
140
143
|
optimum/rbln/transformers/models/gemma/configuration_gemma.py,sha256=H1nVp8HBJxxN__VFyDpBuhoqf_RZxgvfE2cVOSvxBIg,1569
|
|
141
|
-
optimum/rbln/transformers/models/gemma/gemma_architecture.py,sha256=
|
|
144
|
+
optimum/rbln/transformers/models/gemma/gemma_architecture.py,sha256=dDsmoiPippuQVOZefXN7cBXrDWb_1maRYpIUQ9iZe6k,929
|
|
142
145
|
optimum/rbln/transformers/models/gemma/modeling_gemma.py,sha256=AsuFnrwZcRCKtF39BpHHNea0S34N2lNWKV4qZimmY8I,4170
|
|
146
|
+
optimum/rbln/transformers/models/gemma2/__init__.py,sha256=AhpaC9zAb8yeNJyCspN1s-GnNr3ag5nAQa5Wta9OPLs,752
|
|
147
|
+
optimum/rbln/transformers/models/gemma2/configuration_gemma2.py,sha256=kJeo3dz4Ba-YqLEgIvxeRpEUa3-l0zG_x0IWdDXA5_M,1574
|
|
148
|
+
optimum/rbln/transformers/models/gemma2/gemma2_architecture.py,sha256=fjNr66rnN7JP3C2If09OXYwVbhLPKqZ7I7ng7YK3MF8,2896
|
|
149
|
+
optimum/rbln/transformers/models/gemma2/modeling_gemma2.py,sha256=cQUzthGnVQn3wWX2hrCc4idCEfEg4snbQ3i8LOuH1Tg,4209
|
|
143
150
|
optimum/rbln/transformers/models/gemma3/__init__.py,sha256=6rugk3615SEt4lh7gduo_J9VyGiSReuEIvL0Uno0eaI,790
|
|
144
|
-
optimum/rbln/transformers/models/gemma3/configuration_gemma3.py,sha256=
|
|
145
|
-
optimum/rbln/transformers/models/gemma3/gemma3_architecture.py,sha256=
|
|
151
|
+
optimum/rbln/transformers/models/gemma3/configuration_gemma3.py,sha256=mVuOZJYSERGTWa6h70C8WaWGm4_JhKmYIEUHAbZFGGU,4671
|
|
152
|
+
optimum/rbln/transformers/models/gemma3/gemma3_architecture.py,sha256=qdYHvn8KY93Is1W2PcOydnPRnzwD7OS4YhFCBrJukHg,6799
|
|
146
153
|
optimum/rbln/transformers/models/gemma3/gemma3_runtime_utils.py,sha256=1f8LVqtF3Tr6ITVC43QpiSXefFsVeZ7jStoR4SlNTfk,9640
|
|
147
|
-
optimum/rbln/transformers/models/gemma3/modeling_gemma3.py,sha256=
|
|
154
|
+
optimum/rbln/transformers/models/gemma3/modeling_gemma3.py,sha256=WHM0qhmgcKkcNzO0yMa5r09uv53iLa4TR7Iw-5ZEMl4,19410
|
|
148
155
|
optimum/rbln/transformers/models/gpt2/__init__.py,sha256=SsawHMStE3wYRtqkH5EvdTFkCdX0LLmp-QSKFhEBrHo,740
|
|
149
156
|
optimum/rbln/transformers/models/gpt2/configuration_gpt2.py,sha256=iGdHfzG7plekZcIz-Z5U8lRE4SB8gbJJNcFQJ9l8Myg,1533
|
|
150
|
-
optimum/rbln/transformers/models/gpt2/gpt2_architecture.py,sha256=
|
|
157
|
+
optimum/rbln/transformers/models/gpt2/gpt2_architecture.py,sha256=HidhcrVrZddMGdUMIspAER7NvSNyeDeihcSuP_9Lrn8,2264
|
|
151
158
|
optimum/rbln/transformers/models/gpt2/modeling_gpt2.py,sha256=DhF6hU3oCYGbZ7UijKCsRfTx-VCkTqqqNwqqMSrjqRE,2230
|
|
159
|
+
optimum/rbln/transformers/models/gpt_oss/__init__.py,sha256=pUUqYnDf9-Lc1GgKW5eRCxqQ7p9dUJMYzJSw1MDiq40,714
|
|
160
|
+
optimum/rbln/transformers/models/gpt_oss/configuration_gpt_oss.py,sha256=JUvhvT9phaeV8iKp32ldPFBoqILYmbB72x_el2aNqbI,1382
|
|
161
|
+
optimum/rbln/transformers/models/gpt_oss/gpt_oss_architecture.py,sha256=3bqFPSM8QJ1yGRnmcrqfQFV_joP0ewbCQ-0pO02wWos,4519
|
|
162
|
+
optimum/rbln/transformers/models/gpt_oss/modeling_gpt_oss.py,sha256=OJlORXgvf4q6ylp2rPlzRmn8me16JInK1SdMvXCEmew,6364
|
|
152
163
|
optimum/rbln/transformers/models/grounding_dino/__init__.py,sha256=DE7DipZGvrKC6b1T77k4I4X3G70ss8mlr-PrZCaohto,307
|
|
153
|
-
optimum/rbln/transformers/models/grounding_dino/configuration_grounding_dino.py,sha256=
|
|
154
|
-
optimum/rbln/transformers/models/grounding_dino/grounding_dino_architecture.py,sha256=
|
|
164
|
+
optimum/rbln/transformers/models/grounding_dino/configuration_grounding_dino.py,sha256=ktQD85690lD2R9HUYzYsORHZe9vUaKMqYK4f6RcRhuM,4182
|
|
165
|
+
optimum/rbln/transformers/models/grounding_dino/grounding_dino_architecture.py,sha256=dOvLHD7w4mLA325i1uJW65l3R2eaImYkLgrvnJkFTSM,26794
|
|
155
166
|
optimum/rbln/transformers/models/grounding_dino/modeling_grounding_dino.py,sha256=8LKysGbqrheFI2nWZpv4ErUfWmUuca3UE2lQo0RIYhc,48429
|
|
156
167
|
optimum/rbln/transformers/models/idefics3/__init__.py,sha256=ulxE7HEfXsNJhd25J9Fvi6vggo9aZH9sLKJjWB6LlzQ,814
|
|
157
168
|
optimum/rbln/transformers/models/idefics3/configuration_idefics3.py,sha256=7IENNxflZL8ZH3YRqtCXfYdKs-RdUeGiPzq-C03te_s,3679
|
|
@@ -162,52 +173,67 @@ optimum/rbln/transformers/models/llama/llama_architecture.py,sha256=S7MCPfyjG5eU
|
|
|
162
173
|
optimum/rbln/transformers/models/llama/modeling_llama.py,sha256=uRxEXYhHOuEwPjBo_Ps3eFU1uwScasla6P8HwsQgAu0,4214
|
|
163
174
|
optimum/rbln/transformers/models/llava/__init__.py,sha256=FaVLgBIqKGjT_nvwYO9k9BVqrzH_Ym3DfjGRCSUhG2s,734
|
|
164
175
|
optimum/rbln/transformers/models/llava/configuration_llava.py,sha256=c1rie8LCypxlsT7SNjZJE07_xCLAasV4EBs97o1757Q,2998
|
|
165
|
-
optimum/rbln/transformers/models/llava/modeling_llava.py,sha256=
|
|
176
|
+
optimum/rbln/transformers/models/llava/modeling_llava.py,sha256=9m8R6gappLYbkFvQKRFod1pmgKF1ejdlg6XI4TjHdI8,21069
|
|
166
177
|
optimum/rbln/transformers/models/llava_next/__init__.py,sha256=kDXKr7wMkp1XqE__DER2B8kQF_NYMxhzsQS5ytGg56I,752
|
|
167
178
|
optimum/rbln/transformers/models/llava_next/configuration_llava_next.py,sha256=Sz8L8p_23T7xw7pkUmW5pyK_wZclph1p_kQYbslc8m8,2708
|
|
168
179
|
optimum/rbln/transformers/models/llava_next/modeling_llava_next.py,sha256=aVpM0SYSSZ6jClMvpO5J83qrUg3GkDBAFkGC5ylSOvw,21303
|
|
169
180
|
optimum/rbln/transformers/models/midm/__init__.py,sha256=IC3FETwgYinbp3wDj7tp4zIHJhbqM-c6GfTRdYcMNj8,913
|
|
170
181
|
optimum/rbln/transformers/models/midm/configuration_midm.py,sha256=DxhcSJlApxfi00XxYmSkKZ6bY9vfLXT0zh-oMKkZot0,1365
|
|
171
|
-
optimum/rbln/transformers/models/midm/midm_architecture.py,sha256=
|
|
182
|
+
optimum/rbln/transformers/models/midm/midm_architecture.py,sha256=sWorUfJjUk3-19flA4_7FEOG_uhgXli4A9QCyIpTR4Y,5518
|
|
172
183
|
optimum/rbln/transformers/models/midm/modeling_midm.py,sha256=EXTBFaOWco2h3NL8jUACeDmPFJuAjFrtQcgO_BTMuCk,6004
|
|
173
184
|
optimum/rbln/transformers/models/mistral/__init__.py,sha256=bYPqrkmqXmhNDqRgKFaL9iH7piGLSHKzsVrGl_0qs1Q,758
|
|
174
185
|
optimum/rbln/transformers/models/mistral/configuration_mistral.py,sha256=mIfz8J8GZV9ojCMuNj9Zeky_PNu1Ir34DQ7FDZrGkP8,1595
|
|
175
186
|
optimum/rbln/transformers/models/mistral/mistral_architecture.py,sha256=gpQTcP83F4zYrCFXRFT_FAF66k5BSSfcYsaAr4eW9jI,722
|
|
176
187
|
optimum/rbln/transformers/models/mistral/modeling_mistral.py,sha256=TdOPjF1eUDWaGa_il05F95O5zacFJbxKff5Qc_IGEXY,3524
|
|
188
|
+
optimum/rbln/transformers/models/mixtral/__init__.py,sha256=P6EvuFq1MTMYbUX01j6ExnN2jDLnNv6XIsIsp2XXdc8,716
|
|
189
|
+
optimum/rbln/transformers/models/mixtral/configuration_mixtral.py,sha256=mg0q7xMWfs1HXOyq3wEr2xT23vOI6BY8d1mOcEzoVrE,1391
|
|
190
|
+
optimum/rbln/transformers/models/mixtral/mixtral_architecture.py,sha256=uPaHD2xu6ZQz5ic6Y4eCdLP89RPw9yGmmCbLgp3tDIs,3206
|
|
191
|
+
optimum/rbln/transformers/models/mixtral/modeling_mixtral.py,sha256=GeFNATHKRzcJLCudZ_1QM7Dvi9kdbfjkkVM9jRsryJ0,3145
|
|
177
192
|
optimum/rbln/transformers/models/opt/__init__.py,sha256=mkSmAUr_ezMtlMK77f48T0THTFddf0HThH1lp6y5Pfw,734
|
|
178
193
|
optimum/rbln/transformers/models/opt/configuration_opt.py,sha256=aP7cyEuBF4DrQxVERPdP3fXYkuqIUcGxEK2fc8ezh7I,1135
|
|
179
194
|
optimum/rbln/transformers/models/opt/modeling_opt.py,sha256=4KZlCnKwDIOMbltPxvO7FX-lIRmI2auC-NVTWqkIPmc,4002
|
|
180
|
-
optimum/rbln/transformers/models/opt/opt_architecture.py,sha256=
|
|
195
|
+
optimum/rbln/transformers/models/opt/opt_architecture.py,sha256=m2vdc9zveTvgXvvfNd9CRHsD4YTDKmc9wKXCu_ZHNRo,1128
|
|
196
|
+
optimum/rbln/transformers/models/paligemma/__init__.py,sha256=Q5hks3HpJ-V9RDHyf66EMKMku8UiZ69jx41g1YRqboI,796
|
|
197
|
+
optimum/rbln/transformers/models/paligemma/configuration_paligemma.py,sha256=z7sGydwLkTxK0MCE2NbaF6ATFNJGqFUo5aYQ7rpGDHE,5837
|
|
198
|
+
optimum/rbln/transformers/models/paligemma/modeling_paligemma.py,sha256=xiw3YWkniGn4XuingHT3aS_XM5aGL8cglVA7gzd03_k,23926
|
|
181
199
|
optimum/rbln/transformers/models/pegasus/__init__.py,sha256=hXKIvrY0OMe7o2qiOFdolim7yyMuVQrUma_C39YsTqM,848
|
|
182
200
|
optimum/rbln/transformers/models/pegasus/configuration_pegasus.py,sha256=FufYVCN_MrMH24RRCh6MJWlS2e380tG13Oua-dyginY,1478
|
|
183
201
|
optimum/rbln/transformers/models/pegasus/modeling_pegasus.py,sha256=L8xvVwecRqXiF7xoj-1WgSgLBSCSllw1YRdgZhg6kp0,2571
|
|
184
|
-
optimum/rbln/transformers/models/pegasus/pegasus_architecture.py,sha256=
|
|
202
|
+
optimum/rbln/transformers/models/pegasus/pegasus_architecture.py,sha256=GV647yxMP7awSks-nrtyvg2sMg9FKGU9N8RPDsYZMRk,6059
|
|
185
203
|
optimum/rbln/transformers/models/phi/__init__.py,sha256=M5Sh4AtIhJYegl-yAKPggAU3DtJtQOa8MrIQypZ6N7U,734
|
|
186
204
|
optimum/rbln/transformers/models/phi/configuration_phi.py,sha256=CXHIG3xlBdr628oDu_u4OGsu_QZLx5EUSqu3zfmfEnk,1553
|
|
187
205
|
optimum/rbln/transformers/models/phi/modeling_phi.py,sha256=r7B0NlqwIGjm-MmE-h5_xeRJPzs4O2OotgbjI-FYA2o,3403
|
|
188
|
-
optimum/rbln/transformers/models/phi/phi_architecture.py,sha256=
|
|
206
|
+
optimum/rbln/transformers/models/phi/phi_architecture.py,sha256=nGnTNHzzJCku7tsCMyNmyDTGAuHYIHbaarBRWLnJf_8,3666
|
|
189
207
|
optimum/rbln/transformers/models/pixtral/__init__.py,sha256=fhclVAWnIDsfMfC-TW6mYrJXxgyehlLaadK64LOShH4,716
|
|
190
208
|
optimum/rbln/transformers/models/pixtral/configuration_pixtral.py,sha256=b79zkJB1jzHx4S1wTe-Ju_Yel_PS5Q8bfmlQPzkchKU,1677
|
|
191
|
-
optimum/rbln/transformers/models/pixtral/modeling_pixtral.py,sha256=
|
|
209
|
+
optimum/rbln/transformers/models/pixtral/modeling_pixtral.py,sha256=sapLWEzF8JgxXBsk_jxZhhi-d-ZRy9LtJpT3DdUQnyQ,13272
|
|
192
210
|
optimum/rbln/transformers/models/pixtral/pixtral_architecture.py,sha256=55DNou1y3Ev_quCGOMsyBgF1AutJkHvKfqPamJdwP8M,2940
|
|
193
211
|
optimum/rbln/transformers/models/qwen2/__init__.py,sha256=h9dWJ3HX4xspMLt44g7r3UGU8QL03Ynmz_Mi3Vlu6UA,746
|
|
194
212
|
optimum/rbln/transformers/models/qwen2/configuration_qwen2.py,sha256=tTWcPOk_ycZvdSPlal9S5elTmWZAX2BbpZP5Ok2ySwI,1567
|
|
195
213
|
optimum/rbln/transformers/models/qwen2/modeling_qwen2.py,sha256=z0tegK-B7tC0ocTLUp_V4eNmwREa12wJ7qQpbnRLEFo,3477
|
|
196
214
|
optimum/rbln/transformers/models/qwen2/qwen2_architecture.py,sha256=XlNAMYAcDLohnSAhIFGKOPuCB5XLgzYs5ABWdeQSaZs,720
|
|
197
|
-
optimum/rbln/transformers/models/qwen2_5_vl/__init__.py,sha256=
|
|
198
|
-
optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py,sha256=
|
|
199
|
-
optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py,sha256=
|
|
200
|
-
optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py,sha256=
|
|
201
|
-
optimum/rbln/transformers/models/
|
|
202
|
-
optimum/rbln/transformers/models/
|
|
203
|
-
optimum/rbln/transformers/models/
|
|
204
|
-
optimum/rbln/transformers/models/
|
|
215
|
+
optimum/rbln/transformers/models/qwen2_5_vl/__init__.py,sha256=_YnG4LxYdKLW61tSM3__DNB1PfHov8TgR8cTCJ285F4,934
|
|
216
|
+
optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py,sha256=f0wj-VPEOH-N4xTk7yNZjaK4qj2n8PQAnqZL5sIHbIg,6544
|
|
217
|
+
optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py,sha256=fyDVCXlWbuVZtHvGkWdpHNJkH0REvNqVM-I3uKQ8Mas,32708
|
|
218
|
+
optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py,sha256=v4ejtIrbcCIHXBfkh7LD41z6Q_kzdtWpQSwYKkkxjks,8784
|
|
219
|
+
optimum/rbln/transformers/models/qwen2_moe/__init__.py,sha256=2a_ww3_9yBJnni9Sw_AudPsok0qPT37L4R-fdMWzHvI,722
|
|
220
|
+
optimum/rbln/transformers/models/qwen2_moe/configuration_qwen2_moe.py,sha256=SDkmCC7n8K14cPTW8Mkoc2z2Ac-hNnh4PFSYVrNC34o,1383
|
|
221
|
+
optimum/rbln/transformers/models/qwen2_moe/modeling_qwen2_moe.py,sha256=XmAkP1TjaO1QbZsCIHLjgXH_eCeLITSoY97eQ05zCoA,3114
|
|
222
|
+
optimum/rbln/transformers/models/qwen2_moe/qwen2_moe_architecture.py,sha256=Pux0PzBkTQuvQVgqDGsXp6RG0sFNQxTK_co8-Adyzl4,3985
|
|
223
|
+
optimum/rbln/transformers/models/qwen2_vl/__init__.py,sha256=KPL7ciTaA9n_6PFuOcvMwUnZLTLF_hDYGVGf3q8LNRI,912
|
|
224
|
+
optimum/rbln/transformers/models/qwen2_vl/configuration_qwen2_vl.py,sha256=PtWcWEm23EmUi7Q2_-deBv4EbrKJrq3AZZ52zlbAq4o,5101
|
|
225
|
+
optimum/rbln/transformers/models/qwen2_vl/modeling_qwen2_vl.py,sha256=5N6PWVgK-3ahtPfpmF-AwtpSVQJCbLaRYnokneezXdo,26838
|
|
226
|
+
optimum/rbln/transformers/models/qwen2_vl/qwen2_vl_architecture.py,sha256=B0EitNdFhT5CO6TK1uLyPMLUoa99b7vM6pGhi2Rmf-c,5879
|
|
205
227
|
optimum/rbln/transformers/models/qwen3/__init__.py,sha256=tI4KwvXpD35dUUaa8aLUXpWoU9gJGcmKXeywOlH14ZE,746
|
|
206
228
|
optimum/rbln/transformers/models/qwen3/configuration_qwen3.py,sha256=BFRPggnH4VlsXlOa19C6KAID-bPgQ8ooQ29dvogh5zk,2102
|
|
207
229
|
optimum/rbln/transformers/models/qwen3/modeling_qwen3.py,sha256=jOg1Oqefi88rpcn6P2GXL7JDnYl_AjfI63xMXwuWttQ,4888
|
|
208
|
-
optimum/rbln/transformers/models/qwen3/qwen3_architecture.py,sha256=
|
|
230
|
+
optimum/rbln/transformers/models/qwen3/qwen3_architecture.py,sha256=m_pZ1wnh6ib8PhabWbo_n8x-G5hVP9h9iUC1JgEabNA,1119
|
|
231
|
+
optimum/rbln/transformers/models/qwen3_moe/__init__.py,sha256=3Hh4LDyNM388a8VZ68IJJcBWrvJ7TL8Akdax1RE0RBM,722
|
|
232
|
+
optimum/rbln/transformers/models/qwen3_moe/configuration_qwen3_moe.py,sha256=0UJ-xtgFzjyQUj96O43LAdWDLy2M44Blb9jdQ-ROETY,1395
|
|
233
|
+
optimum/rbln/transformers/models/qwen3_moe/modeling_qwen3_moe.py,sha256=AV1EGDrvMFqM_xgj7tFe9ZoAJFsGdmg9eP0wg7m6L4A,3149
|
|
234
|
+
optimum/rbln/transformers/models/qwen3_moe/qwen3_moe_architecture.py,sha256=4KiG9uqWDF8ljSbeq1qQHIZzEs9z05dg1dztGHhpxis,3985
|
|
209
235
|
optimum/rbln/transformers/models/resnet/__init__.py,sha256=0QqtEQF1IMYgEmmfXMGarCDS8kJB5tzODfwTEzDVZRg,837
|
|
210
|
-
optimum/rbln/transformers/models/resnet/configuration_resnet.py,sha256=
|
|
236
|
+
optimum/rbln/transformers/models/resnet/configuration_resnet.py,sha256=hQcE87mI4tjJBhprKq7uKmUcyOTh_RXdW9DwNK2TnWU,1956
|
|
211
237
|
optimum/rbln/transformers/models/resnet/modeling_resnet.py,sha256=tAVa1r-yZMw56xEBtQUKMaUM0u1Zr5mg1uqXtr5u4gE,4419
|
|
212
238
|
optimum/rbln/transformers/models/roberta/__init__.py,sha256=SDoN6iKO6gZk2Wg-nfzEzxNe4jVsd9G4RsduFoMZkYo,974
|
|
213
239
|
optimum/rbln/transformers/models/roberta/configuration_roberta.py,sha256=6KhO-xBsDrYv5XFr6_JmOCFwpklpjB2fcA1V1nJVemo,1310
|
|
@@ -215,21 +241,21 @@ optimum/rbln/transformers/models/roberta/modeling_roberta.py,sha256=1ybyReE9EB--
|
|
|
215
241
|
optimum/rbln/transformers/models/seq2seq/__init__.py,sha256=HiSyWFcKeZ8okfo-s-_Mf_upyvAoZwraUIJyGNLNurY,714
|
|
216
242
|
optimum/rbln/transformers/models/seq2seq/configuration_seq2seq.py,sha256=SBIFHxsDce2_s3laDBLa21l7minrTh6ZWSyhq1vXLa0,3060
|
|
217
243
|
optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py,sha256=9sVR5IqEoN9H0nfG8dk89PDhuaPTRhinO2ZswWyQbn4,20128
|
|
218
|
-
optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py,sha256=
|
|
244
|
+
optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py,sha256=bKhh8hSQ4q9qo0yi7zFsEvIlxpdhEcAUGcuCo2DORBM,20193
|
|
219
245
|
optimum/rbln/transformers/models/siglip/__init__.py,sha256=X1Fc1GUnJ2EIxFx45nbeoW-T2t0OyP3W73C0HD8Vowo,712
|
|
220
246
|
optimum/rbln/transformers/models/siglip/configuration_siglip.py,sha256=Fy-ANF91bQno_QVd4ZpyRs-uNgC_XRyBRScBg2uKM6w,3029
|
|
221
|
-
optimum/rbln/transformers/models/siglip/modeling_siglip.py,sha256=
|
|
247
|
+
optimum/rbln/transformers/models/siglip/modeling_siglip.py,sha256=2Fyf8u-iWmJZmRGB9cFPIQhud_QKBd5oRRm5Zl2T6W4,7988
|
|
222
248
|
optimum/rbln/transformers/models/swin/__init__.py,sha256=gUsLDB8ceNxt53Cf69OT32JuZoRdmmIsRfjRdHTLDd0,698
|
|
223
|
-
optimum/rbln/transformers/models/swin/configuration_swin.py,sha256=
|
|
249
|
+
optimum/rbln/transformers/models/swin/configuration_swin.py,sha256=16PNp37KVemOGyuFaVXNWBi-JwEnRNpvfTKS7HmAot0,1490
|
|
224
250
|
optimum/rbln/transformers/models/swin/modeling_swin.py,sha256=SAsHPme9izpKUKrVbxN8HSbOID2jRo3DhEthoV2jIyI,14999
|
|
225
251
|
optimum/rbln/transformers/models/t5/__init__.py,sha256=R1Q8Z1vaIdx4rDjeCmm_ZMSgewWaqaI0l93AHwewtew,818
|
|
226
252
|
optimum/rbln/transformers/models/t5/configuration_t5.py,sha256=nqDbibqykeeWn1TlKk6LmCn-DawTVudMMuBn2c2jds8,1362
|
|
227
253
|
optimum/rbln/transformers/models/t5/modeling_t5.py,sha256=lP__icG548arC9N4FHKfV7PQTpaqT7RpaHO1Tuvq3Ds,5125
|
|
228
|
-
optimum/rbln/transformers/models/t5/t5_architecture.py,sha256=
|
|
254
|
+
optimum/rbln/transformers/models/t5/t5_architecture.py,sha256=_iXpRd7i2coO0pJbcMKJ7eGdwgbTHeZP0VJ8KAagI-Y,10061
|
|
229
255
|
optimum/rbln/transformers/models/time_series_transformer/__init__.py,sha256=xJaFWQawlwtv4H5tVFcY1pxLYzjHtMAlLq6nXysdkN8,1243
|
|
230
256
|
optimum/rbln/transformers/models/time_series_transformer/configuration_time_series_transformer.py,sha256=EUBXE_10W0wtuoAl2OVuQakBpsC7kSpRo3VokXI8Pdo,1619
|
|
231
257
|
optimum/rbln/transformers/models/time_series_transformer/modeling_time_series_transformer.py,sha256=4rrivdPuuyg2MnfLaey_inai_sYE83GLg0nqN4Y85dg,18783
|
|
232
|
-
optimum/rbln/transformers/models/time_series_transformer/time_series_transformers_architecture.py,sha256=
|
|
258
|
+
optimum/rbln/transformers/models/time_series_transformer/time_series_transformers_architecture.py,sha256=SG9K7Pk7YNHWOX2CruWe5IWmBHBU88zuUJ87iZg1WpE,13926
|
|
233
259
|
optimum/rbln/transformers/models/vit/__init__.py,sha256=CrrkHehfCe3U-_rUS00aMBY7Tncdeh43sNUgVI9Dt_g,807
|
|
234
260
|
optimum/rbln/transformers/models/vit/configuration_vit.py,sha256=x98CxKR1cpKAG7Eh43uuPeGeGn4gS3HcKLPoDL3SWJo,994
|
|
235
261
|
optimum/rbln/transformers/models/vit/modeling_vit.py,sha256=49P3b8Q7qhfYxVyJt3XzjE0UNSODqHZQTjFhw5rbVzM,1777
|
|
@@ -238,27 +264,27 @@ optimum/rbln/transformers/models/wav2vec2/configuration_wav2vec2.py,sha256=4uj4g
|
|
|
238
264
|
optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py,sha256=NbANJDBZUrN4pe4CdgVUoxDSg2lBKvHFOlkrNsgDMj0,4272
|
|
239
265
|
optimum/rbln/transformers/models/whisper/__init__.py,sha256=ErquiUlYycSYPsDcq9IwwmbZXoYLn1MVZ8VikWY5gQo,792
|
|
240
266
|
optimum/rbln/transformers/models/whisper/configuration_whisper.py,sha256=bSwDN7VLuk1aVXvfrQIgb9SLdFBDhO5q8ZFaPQPJal0,3077
|
|
241
|
-
optimum/rbln/transformers/models/whisper/generation_whisper.py,sha256=
|
|
267
|
+
optimum/rbln/transformers/models/whisper/generation_whisper.py,sha256=b61NhmWrH9QEcj1tsrP5Yx-6Bt0zwh9z5Vb_2Wo_w-M,7860
|
|
242
268
|
optimum/rbln/transformers/models/whisper/modeling_whisper.py,sha256=k3kiy5EtDAzoVRVhWVjRbcgk1K4-MFzgZLkWDxI1fZw,19325
|
|
243
|
-
optimum/rbln/transformers/models/whisper/whisper_architecture.py,sha256=
|
|
269
|
+
optimum/rbln/transformers/models/whisper/whisper_architecture.py,sha256=mmnZtj_cg6fn1FAP6UgsdcAX4ugsdrgI5bNxNd3UUc0,13869
|
|
244
270
|
optimum/rbln/transformers/models/xlm_roberta/__init__.py,sha256=O3o2KzJ8Li3QhB7GHdRQASc93SYO2jz00Rx4pxYRuDg,982
|
|
245
271
|
optimum/rbln/transformers/models/xlm_roberta/configuration_xlm_roberta.py,sha256=wHRpGTXL9khYqSkKL1IgA7__6_lt9QpOz9tHumjK7fo,1260
|
|
246
272
|
optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py,sha256=Pjqvfp0V0kFBW7U7VD3kthZkpWfzOKsRS_2-z6StTnI,3710
|
|
247
273
|
optimum/rbln/transformers/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
248
|
-
optimum/rbln/transformers/utils/rbln_quantization.py,sha256=
|
|
274
|
+
optimum/rbln/transformers/utils/rbln_quantization.py,sha256=Qdz3jwl4tsocA6chKbuiG45_veeuU-HM_9mHeu8w4LQ,22323
|
|
249
275
|
optimum/rbln/transformers/utils/rbln_runtime_wrapper.py,sha256=l_-zWpRrp6hp-tDANTrEbspIZH-AUSi_jNJICns_QgE,2672
|
|
250
276
|
optimum/rbln/utils/__init__.py,sha256=ieDBT2VFTt2E0M4v_POLBpuGW9LxSydpb_DuPd6PQqc,712
|
|
251
277
|
optimum/rbln/utils/decorator_utils.py,sha256=xu-TrsNi33SRC2a7DBsyoo6-pEQxWKZPZSmM9QlDe2Y,3745
|
|
252
|
-
optimum/rbln/utils/deprecation.py,sha256=
|
|
253
|
-
optimum/rbln/utils/hub.py,sha256=
|
|
254
|
-
optimum/rbln/utils/import_utils.py,sha256=
|
|
278
|
+
optimum/rbln/utils/deprecation.py,sha256=fkygmXIziNIOs7GqFSu2mn9TnaoficryCNvhqUWtRYI,16447
|
|
279
|
+
optimum/rbln/utils/hub.py,sha256=qPY2KysMj2FMb42RyDXuVm5DSw_4iNvMn-rHoWoBTdU,7278
|
|
280
|
+
optimum/rbln/utils/import_utils.py,sha256=ZAp6t5vwUVS9yiFxQYarTLO0v-WqPj75QG5QodzCa2E,6306
|
|
255
281
|
optimum/rbln/utils/logging.py,sha256=VKKBmlQSdg6iZCGmAXaWYiW67K84jyp1QJhLQSSjPPE,3453
|
|
256
282
|
optimum/rbln/utils/model_utils.py,sha256=4k5879Kh75m3x_vS4-qOGfqsOiAvc2kdNFFfvsFvz3k,1748
|
|
257
|
-
optimum/rbln/utils/runtime_utils.py,sha256=
|
|
283
|
+
optimum/rbln/utils/runtime_utils.py,sha256=fdT4QF0MVDOwLXLK82L03FxPpPrHSJ60VMWXGvwcuYI,9600
|
|
258
284
|
optimum/rbln/utils/save_utils.py,sha256=hG5uOtYmecSXZuGTvCXsTM-SiyZpr5q3InUGCCq_jzQ,3619
|
|
259
|
-
optimum/rbln/utils/submodule.py,sha256=
|
|
260
|
-
optimum_rbln-0.
|
|
261
|
-
optimum_rbln-0.
|
|
262
|
-
optimum_rbln-0.
|
|
263
|
-
optimum_rbln-0.
|
|
264
|
-
optimum_rbln-0.
|
|
285
|
+
optimum/rbln/utils/submodule.py,sha256=j-LxEbFpjixFWLRnSBJC-IC3bGSIl7L_hs3gwaqjK1Q,7503
|
|
286
|
+
optimum_rbln-0.10.0.post1.dist-info/METADATA,sha256=Q0QPcZjq4A8Xdw72e5aXu8S2X3Ev7eIL9wOGmVaypuo,5331
|
|
287
|
+
optimum_rbln-0.10.0.post1.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
|
|
288
|
+
optimum_rbln-0.10.0.post1.dist-info/entry_points.txt,sha256=-orKDGKfLypxlPlTz8-ZkmdKULNvax9yeCCCn-q89n4,59
|
|
289
|
+
optimum_rbln-0.10.0.post1.dist-info/licenses/LICENSE,sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE,11356
|
|
290
|
+
optimum_rbln-0.10.0.post1.dist-info/RECORD,,
|
|
@@ -1,233 +0,0 @@
|
|
|
1
|
-
# Copyright 2025 Rebellions Inc. All rights reserved.
|
|
2
|
-
|
|
3
|
-
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
|
-
# you may not use this file except in compliance with the License.
|
|
5
|
-
# You may obtain a copy of the License at:
|
|
6
|
-
|
|
7
|
-
# http://www.apache.org/licenses/LICENSE-2.0
|
|
8
|
-
|
|
9
|
-
# Unless required by applicable law or agreed to in writing, software
|
|
10
|
-
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
11
|
-
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
12
|
-
# See the License for the specific language governing permissions and
|
|
13
|
-
# limitations under the License.
|
|
14
|
-
|
|
15
|
-
from typing import List, Optional, Tuple, Union
|
|
16
|
-
|
|
17
|
-
import torch
|
|
18
|
-
import torch.nn as nn
|
|
19
|
-
from transformers import PreTrainedModel
|
|
20
|
-
|
|
21
|
-
from optimum.rbln.transformers.models.decoderonly.decoderonly_architecture import (
|
|
22
|
-
DecoderOnlyLayer,
|
|
23
|
-
DecoderOnlyModel,
|
|
24
|
-
DecoderOnlyWrapper,
|
|
25
|
-
)
|
|
26
|
-
|
|
27
|
-
from .configuration_colqwen2 import (
|
|
28
|
-
RBLNColQwen2ForRetrievalConfig,
|
|
29
|
-
)
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
def slice_and_unsqueeze_cos_sin(cos, sin, position_ids):
|
|
33
|
-
"""Slice cos[cache_position], sin[cache_position] vector for the query."""
|
|
34
|
-
cos = cos[position_ids[0]][None, None, None, :, :]
|
|
35
|
-
sin = sin[position_ids[0]][None, None, None, :, :]
|
|
36
|
-
|
|
37
|
-
return cos, sin
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
class ColQwen2LanguageModelWrapper(DecoderOnlyWrapper):
|
|
41
|
-
def __init__(
|
|
42
|
-
self, model: PreTrainedModel, rbln_config: "RBLNColQwen2ForRetrievalConfig", use_rotary_emb: bool = True
|
|
43
|
-
):
|
|
44
|
-
model.config = (
|
|
45
|
-
model.config.vlm_config.text_config if hasattr(model.config, "vlm_config") else model.config.text_config
|
|
46
|
-
)
|
|
47
|
-
super().__init__(model, rbln_config, use_rotary_emb)
|
|
48
|
-
|
|
49
|
-
def get_decoder_layers(self, model: PreTrainedModel):
|
|
50
|
-
return model.language_model.layers
|
|
51
|
-
|
|
52
|
-
def convert_to_rbln_class(self, model: PreTrainedModel, max_seq_len: int):
|
|
53
|
-
new_layers = []
|
|
54
|
-
for layer_idx, layer in enumerate(self.get_decoder_layers(model)):
|
|
55
|
-
is_sliding = layer_idx in self.rbln_config.sliding_window_layers
|
|
56
|
-
new_self_attn = self.get_rbln_attn_class()(
|
|
57
|
-
self.get_attn_layer(layer),
|
|
58
|
-
self.rbln_config,
|
|
59
|
-
is_sliding=is_sliding,
|
|
60
|
-
)
|
|
61
|
-
new_layer = self.get_rbln_layer_class()(layer, new_self_attn)
|
|
62
|
-
new_layers.append(new_layer)
|
|
63
|
-
|
|
64
|
-
new_model = self.get_rbln_model_class()(
|
|
65
|
-
model.language_model,
|
|
66
|
-
new_layers,
|
|
67
|
-
self.rbln_config,
|
|
68
|
-
use_learned_pos_emb=self.__class__._use_learned_pos_emb,
|
|
69
|
-
)
|
|
70
|
-
|
|
71
|
-
# text_projection layer from model
|
|
72
|
-
self.embedding_proj_layer = (
|
|
73
|
-
model.embedding_proj_layer if hasattr(model, "embedding_proj_layer") else model.custom_text_proj
|
|
74
|
-
)
|
|
75
|
-
return new_model
|
|
76
|
-
|
|
77
|
-
def get_rbln_model_class(self):
|
|
78
|
-
return RBLNColQwen2LanguageModel
|
|
79
|
-
|
|
80
|
-
def prepare_forward_args(self, *args):
|
|
81
|
-
args = list(args)
|
|
82
|
-
input_ids = None if self.rbln_config.use_inputs_embeds else args.pop(0)
|
|
83
|
-
inputs_embeds = args.pop(0) if self.rbln_config.use_inputs_embeds else None
|
|
84
|
-
cache_position = args.pop(0)
|
|
85
|
-
global_block_tables = args.pop(0)
|
|
86
|
-
local_block_tables = None
|
|
87
|
-
position_embeds = args.pop(0)
|
|
88
|
-
position_ids = None
|
|
89
|
-
attention_mask = args.pop(0) if self.rbln_config.use_attention_mask else None
|
|
90
|
-
past_key_values = args
|
|
91
|
-
|
|
92
|
-
if len(past_key_values) != 2 * self.num_hidden_layers:
|
|
93
|
-
raise ValueError(
|
|
94
|
-
f"Different past_key_values to model's config. {len(past_key_values)} != {2 * self.num_hidden_layers}"
|
|
95
|
-
)
|
|
96
|
-
|
|
97
|
-
_past_key_values = []
|
|
98
|
-
for i in range(self.config.num_hidden_layers):
|
|
99
|
-
key_states = past_key_values[i * 2]
|
|
100
|
-
value_states = past_key_values[i * 2 + 1]
|
|
101
|
-
past_key_value = [key_states, value_states]
|
|
102
|
-
_past_key_values.append(past_key_value)
|
|
103
|
-
past_key_values = _past_key_values
|
|
104
|
-
|
|
105
|
-
return (
|
|
106
|
-
input_ids,
|
|
107
|
-
inputs_embeds,
|
|
108
|
-
cache_position,
|
|
109
|
-
global_block_tables,
|
|
110
|
-
local_block_tables,
|
|
111
|
-
attention_mask,
|
|
112
|
-
position_ids,
|
|
113
|
-
past_key_values,
|
|
114
|
-
position_embeds,
|
|
115
|
-
)
|
|
116
|
-
|
|
117
|
-
def forward(self, *args):
|
|
118
|
-
(
|
|
119
|
-
input_ids,
|
|
120
|
-
inputs_embeds,
|
|
121
|
-
cache_position,
|
|
122
|
-
global_block_tables,
|
|
123
|
-
local_block_tables,
|
|
124
|
-
attention_mask,
|
|
125
|
-
position_ids,
|
|
126
|
-
past_key_values,
|
|
127
|
-
rotary_emb,
|
|
128
|
-
) = self.prepare_forward_args(*args)
|
|
129
|
-
|
|
130
|
-
last_hidden_states = self.model(
|
|
131
|
-
input_ids=input_ids,
|
|
132
|
-
inputs_embeds=inputs_embeds,
|
|
133
|
-
attention_mask=attention_mask,
|
|
134
|
-
cache_position=cache_position,
|
|
135
|
-
position_ids=position_ids,
|
|
136
|
-
past_key_values=past_key_values,
|
|
137
|
-
rotary_emb=rotary_emb,
|
|
138
|
-
global_block_tables=global_block_tables,
|
|
139
|
-
local_block_tables=local_block_tables,
|
|
140
|
-
)
|
|
141
|
-
|
|
142
|
-
proj = self.embedding_proj_layer(last_hidden_states[0])
|
|
143
|
-
all_hidden_states = last_hidden_states[1] if self.rbln_config.output_hidden_states else None
|
|
144
|
-
|
|
145
|
-
if self.rbln_config.output_hidden_states:
|
|
146
|
-
return proj, all_hidden_states
|
|
147
|
-
else:
|
|
148
|
-
return proj
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
class RBLNColQwen2LanguageModel(DecoderOnlyModel):
|
|
152
|
-
def __init__(
|
|
153
|
-
self,
|
|
154
|
-
model,
|
|
155
|
-
layers: List["DecoderOnlyLayer"],
|
|
156
|
-
rbln_config: "RBLNColQwen2ForRetrievalConfig",
|
|
157
|
-
use_learned_pos_emb=None,
|
|
158
|
-
):
|
|
159
|
-
super().__init__(model, layers, rbln_config, use_learned_pos_emb)
|
|
160
|
-
|
|
161
|
-
self.output_hidden_states = rbln_config.output_hidden_states
|
|
162
|
-
|
|
163
|
-
def forward(
|
|
164
|
-
self,
|
|
165
|
-
input_ids: torch.Tensor = None,
|
|
166
|
-
inputs_embeds: Optional[torch.Tensor] = None,
|
|
167
|
-
attention_mask: torch.Tensor = None,
|
|
168
|
-
cache_position: torch.Tensor = None,
|
|
169
|
-
position_ids: torch.Tensor = None,
|
|
170
|
-
query_position: torch.Tensor = None,
|
|
171
|
-
past_key_values: Tuple[Tuple[torch.Tensor]] = None,
|
|
172
|
-
rotary_emb: Optional[Union[nn.Module, torch.Tensor]] = None,
|
|
173
|
-
global_block_tables: Optional[torch.Tensor] = None,
|
|
174
|
-
local_block_tables: Optional[torch.Tensor] = None,
|
|
175
|
-
lora_int_id: Optional[torch.Tensor] = None,
|
|
176
|
-
):
|
|
177
|
-
# retrieve input_ids and inputs_embeds
|
|
178
|
-
if (input_ids is None) ^ (inputs_embeds is not None):
|
|
179
|
-
raise ValueError(
|
|
180
|
-
"You cannot specify both input_ids and inputs_embeds at the same time, and must specify either one"
|
|
181
|
-
)
|
|
182
|
-
|
|
183
|
-
# embed positions
|
|
184
|
-
if inputs_embeds is None:
|
|
185
|
-
inputs_embeds = self.get_embedding()(input_ids)
|
|
186
|
-
|
|
187
|
-
hidden_states = inputs_embeds * self.hidden_multiplier
|
|
188
|
-
|
|
189
|
-
# get cos,sin vector if needed
|
|
190
|
-
position_ids = position_ids if position_ids is not None else cache_position
|
|
191
|
-
if rotary_emb is not None:
|
|
192
|
-
if isinstance(rotary_emb, torch.Tensor):
|
|
193
|
-
cos = rotary_emb[0]
|
|
194
|
-
sin = rotary_emb[1]
|
|
195
|
-
else:
|
|
196
|
-
cos, sin = rotary_emb(hidden_states, self.max_seq_len) # dtype carrier, max_seq_len
|
|
197
|
-
cos, sin = slice_and_unsqueeze_cos_sin(cos, sin, position_ids)
|
|
198
|
-
|
|
199
|
-
# Get sequence positions for flash attention
|
|
200
|
-
if self.attn_impl == "flash_attn":
|
|
201
|
-
seq_positions = cache_position[:, 0]
|
|
202
|
-
seq_positions = self.convert_sequence_positions_for_flash_attn(
|
|
203
|
-
seq_positions=seq_positions, max_seq_len=self.max_seq_len
|
|
204
|
-
)
|
|
205
|
-
else:
|
|
206
|
-
seq_positions = cache_position[:, :1]
|
|
207
|
-
|
|
208
|
-
# Get local cache positions for sliding window layers
|
|
209
|
-
if len(self.sliding_window_layers) > 0:
|
|
210
|
-
sliding_cache_pos = self.get_local_cache_positions(position_ids, query_position)
|
|
211
|
-
|
|
212
|
-
all_hidden_states = () if self.output_hidden_states else None
|
|
213
|
-
for layer_idx, layer in enumerate(self.layers):
|
|
214
|
-
if self.output_hidden_states:
|
|
215
|
-
all_hidden_states += (hidden_states,)
|
|
216
|
-
|
|
217
|
-
is_sliding = True if layer_idx in self.sliding_window_layers else False
|
|
218
|
-
hidden_states = layer(
|
|
219
|
-
hidden_states=hidden_states,
|
|
220
|
-
attention_mask=attention_mask,
|
|
221
|
-
seq_positions=sliding_cache_pos if is_sliding else seq_positions,
|
|
222
|
-
past_key_values=past_key_values,
|
|
223
|
-
cos=cos,
|
|
224
|
-
sin=sin,
|
|
225
|
-
block_tables=local_block_tables if is_sliding else global_block_tables,
|
|
226
|
-
lora_int_id=lora_int_id,
|
|
227
|
-
)
|
|
228
|
-
|
|
229
|
-
hidden_states = self.get_last_layernorm()(hidden_states)
|
|
230
|
-
if self.output_hidden_states:
|
|
231
|
-
all_hidden_states += (hidden_states,)
|
|
232
|
-
|
|
233
|
-
return hidden_states, all_hidden_states
|
|
File without changes
|
|
File without changes
|
|
File without changes
|