optimum-rbln 0.8.2a0__tar.gz → 0.8.2a1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of optimum-rbln might be problematic. Click here for more details.
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/PKG-INFO +1 -1
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/__version__.py +2 -2
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py +10 -12
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/ISSUE_TEMPLATE/config.yml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/ISSUE_TEMPLATE/model_request.md +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/pull_request_template.md +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/scripts/auto_code_review.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/scripts/validate_docstrings.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/scripts/validate_pr_checklist.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/version.yaml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/auto_code_review.yml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/check_code_quality.yml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/deploy-on-tag.yaml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/deploy.yaml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/pr-title-check.yaml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/pr_checklist_validator.yml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/rbln_check_compiler.yaml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/rbln_dispatch_pytest.yaml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/rbln_optimum_inference_test.yaml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/rbln_optimum_pytest.yaml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/rbln_scheduled_test.yaml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/rbln_trigger_on_pr.yaml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/test-docstrings.yml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.gitignore +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/CODE_OF_CONDUCT.md +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/CONTRIBUTING.md +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/LICENSE +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/README.md +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/assets/rbln_logo.png +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/advanced/custom_class.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/audio-classification/run_ast_audio_classification.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/depth-estimation/run_dpt.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/image-classification/run_image_classification.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/image-classification/run_vit_image_classification.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/image-to-text/run_idefics3.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/image-to-text/run_llava_next_image_to_text.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/kandinsky2_2/run_kandinsky2_2.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/kandinsky2_2/run_kandinsky2_2_combined.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/kandinsky2_2/run_kandinsky2_2_img2img.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/kandinsky2_2/run_kandinsky2_2_img2img_combined.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/kandinsky2_2/run_kandinsky2_2_inpaint.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/kandinsky2_2/run_kandinsky2_2_inpaint_combined.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/kandinsky2_2/run_kandinsky2_2_prior_interpolate.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/question-answering/run_question_answering.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/speech-recognition/run_wav2vec2.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/speech-recognition/run_whisper.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/stable-diffusion/run_stable_diffusion.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/stable-diffusion/run_stable_diffusion_controlnet.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/stable-diffusion/run_stable_diffusion_img2img.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/stable-diffusion/run_stable_diffusion_img2img_controlnet.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/stable-diffusion/run_stable_diffusion_inpaint.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/stable-diffusion/run_stable_diffusion_lora.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/stable-diffusion/run_stable_diffusion_multicontrolnet.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/text-classification/run_bge_m3_text_classification.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/text-classification/run_bge_reranker_v2_m3_text_classification.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/text-classification/run_secureBERT.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/text-classification/run_t5_classification.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/text-classification/run_twitter_roberta_text_classification.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/text2text-generation/run_bart_text2text_generation.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/text2text-generation/run_llama_peft.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/text2text-generation/run_llama_text2text_generation.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/time-series-forecasting/run_time_series_forecasting.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/pyproject.toml +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/scripts/uv-lock.sh +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/scripts/uv-sync.sh +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/configuration_utils.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/models/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/models/configuration_autoencoder_kl.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/models/configuration_autoencoder_kl_cosmos.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/models/configuration_controlnet.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/models/configuration_prior_transformer.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/models/configuration_transformer_cosmos.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/models/configuration_transformer_sd3.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/models/configuration_unet_2d_condition.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/models/configuration_vq_model.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/pipelines/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_controlnet.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_cosmos.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_kandinsky2_2.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_3.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_xl.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/modeling_diffusers.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/autoencoders/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/autoencoders/autoencoder_kl.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/autoencoders/autoencoder_kl_cosmos.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/autoencoders/vae.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/autoencoders/vq_model.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/controlnet.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/transformers/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/transformers/prior_transformer.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/transformers/transformer_cosmos.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/transformers/transformer_sd3.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/unets/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/unets/unet_2d_condition.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/controlnet/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/cosmos/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/cosmos/configuration_cosmos_guardrail.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/cosmos/cosmos_guardrail.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/cosmos/pipeline_cosmos_text2world.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/cosmos/pipeline_cosmos_video2world.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_combined.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_img2img.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_inpaint.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_prior.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_inpaint.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/modeling.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/modeling_base.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/ops/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/ops/attn.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/ops/flash_attn.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/ops/kv_cache_update.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/ops/linear.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/ops/sliding_window_attn.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/configuration_generic.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/modeling_generic.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/modeling_rope_utils.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/audio_spectrogram_transformer/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/audio_spectrogram_transformer/configuration_audio_spectrogram_transformer.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/audio_spectrogram_transformer/modeling_audio_spectrogram_transformer.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/auto/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/auto/auto_factory.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/auto/modeling_auto.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/bart/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/bart/bart_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/bart/configuration_bart.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/bart/modeling_bart.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/bert/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/bert/configuration_bert.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/bert/modeling_bert.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/blip_2/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/blip_2/configuration_blip_2.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/blip_2/modeling_blip_2.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/clip/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/clip/configuration_clip.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/clip/modeling_clip.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/colpali/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/colpali/colpali_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/colpali/configuration_colpali.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/colpali/modeling_colpali.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/decoderonly/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/distilbert/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/distilbert/configuration_distilbert.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/distilbert/modeling_distilbert.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/dpt/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/dpt/configuration_dpt.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/dpt/modeling_dpt.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/exaone/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/exaone/configuration_exaone.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/exaone/exaone_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/exaone/modeling_exaone.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gemma/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gemma/configuration_gemma.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gemma/gemma_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gemma/modeling_gemma.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gemma3/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gemma3/configuration_gemma3.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gemma3/gemma3_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gemma3/modeling_gemma3.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gpt2/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gpt2/configuration_gpt2.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gpt2/gpt2_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gpt2/modeling_gpt2.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/idefics3/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/idefics3/configuration_idefics3.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/idefics3/modeling_idefics3.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/llama/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/llama/configuration_llama.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/llama/llama_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/llama/modeling_llama.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/llava_next/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/llava_next/configuration_llava_next.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/llava_next/modeling_llava_next.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/midm/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/midm/configuration_midm.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/midm/midm_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/midm/modeling_midm.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/mistral/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/mistral/configuration_mistral.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/mistral/mistral_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/mistral/modeling_mistral.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/opt/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/opt/configuration_opt.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/opt/modeling_opt.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/opt/opt_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/phi/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/phi/configuration_phi.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/phi/modeling_phi.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/phi/phi_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/qwen2/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/qwen2/configuration_qwen2.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/qwen2/modeling_qwen2.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/qwen2/qwen2_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/qwen2_5_vl/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/resnet/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/resnet/configuration_resnet.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/resnet/modeling_resnet.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/roberta/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/roberta/configuration_roberta.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/roberta/modeling_roberta.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/seq2seq/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/seq2seq/configuration_seq2seq.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/siglip/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/siglip/configuration_siglip.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/siglip/modeling_siglip.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/t5/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/t5/configuration_t5.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/t5/modeling_t5.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/t5/t5_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/time_series_transformer/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/time_series_transformer/configuration_time_series_transformer.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/time_series_transformer/modeling_time_series_transformer.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/time_series_transformer/time_series_transformers_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/vit/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/vit/configuration_vit.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/vit/modeling_vit.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/wav2vec2/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/wav2vec2/configuration_wav2vec2.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/whisper/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/whisper/configuration_whisper.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/whisper/generation_whisper.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/whisper/modeling_whisper.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/whisper/whisper_architecture.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/xlm_roberta/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/xlm_roberta/configuration_xlm_roberta.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/utils/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/utils/rbln_quantization.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/utils/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/utils/decorator_utils.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/utils/hub.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/utils/import_utils.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/utils/logging.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/utils/model_utils.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/utils/runtime_utils.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/utils/save_utils.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/utils/submodule.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/tests/__init__.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/tests/psnr.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/tests/requirements_sdxl.txt +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/tests/run_stable_diffusion_xl_base.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/tests/test_base.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/tests/test_config.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/tests/test_diffusers.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/tests/test_llm.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/tests/test_transformers.py +0 -0
- {optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/uv.lock +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: optimum-rbln
|
|
3
|
-
Version: 0.8.2a0
|
|
3
|
+
Version: 0.8.2a1
|
|
4
4
|
Summary: Optimum RBLN is the interface between the HuggingFace Transformers and Diffusers libraries and RBLN accelerators. It provides a set of tools enabling easy model loading and inference on single and multiple rbln device settings for different downstream tasks.
|
|
5
5
|
Project-URL: Homepage, https://rebellions.ai
|
|
6
6
|
Project-URL: Documentation, https://docs.rbln.ai
|
|
@@ -17,5 +17,5 @@ __version__: str
|
|
|
17
17
|
__version_tuple__: VERSION_TUPLE
|
|
18
18
|
version_tuple: VERSION_TUPLE
|
|
19
19
|
|
|
20
|
-
__version__ = version = '0.8.2a0'
|
|
21
|
-
__version_tuple__ = version_tuple = (0, 8, 2, 'a0')
|
|
20
|
+
__version__ = version = '0.8.2a1'
|
|
21
|
+
__version_tuple__ = version_tuple = (0, 8, 2, 'a1')
|
|
@@ -231,15 +231,16 @@ class DecoderOnlyWrapper(nn.Module):
|
|
|
231
231
|
def convert_to_rbln_causal_lm(self, causal_lm: PreTrainedModel, max_seq_len: int):
|
|
232
232
|
new_layers = []
|
|
233
233
|
for layer_idx, layer in enumerate(self.get_decoder_layers(causal_lm)):
|
|
234
|
+
is_sliding = layer_idx in self.sliding_window_layers
|
|
234
235
|
new_self_attn = self.get_rbln_attn_class()(
|
|
235
236
|
self.get_attn_layer(layer),
|
|
236
|
-
self.use_attention_mask,
|
|
237
|
+
self.use_attention_mask if not is_sliding else True,
|
|
237
238
|
self.use_position_ids,
|
|
238
239
|
kvcache_block_size=self.sliding_window
|
|
239
240
|
if layer_idx in self.sliding_window_layers
|
|
240
241
|
else self.kvcache_block_size,
|
|
241
|
-
is_sliding=layer_idx in self.sliding_window_layers,
|
|
242
|
-
attn_impl=self.attn_impl,
|
|
242
|
+
is_sliding=is_sliding,
|
|
243
|
+
attn_impl=self.attn_impl if not is_sliding else "eager",
|
|
243
244
|
kvcache_partition_len=self.kvcache_partition_len,
|
|
244
245
|
)
|
|
245
246
|
new_layer = self.get_rbln_layer_class()(layer, new_self_attn)
|
|
@@ -720,10 +721,6 @@ class DecoderOnlyAttention(nn.Module):
|
|
|
720
721
|
self.use_position_ids = use_position_ids
|
|
721
722
|
self.is_sliding = is_sliding
|
|
722
723
|
self.attn_impl = attn_impl
|
|
723
|
-
|
|
724
|
-
if self.is_sliding and self.attn_impl != "eager":
|
|
725
|
-
raise NotImplementedError("Sliding window attention is only supported with eager attention.")
|
|
726
|
-
|
|
727
724
|
self.kvcache_partition_len = kvcache_partition_len
|
|
728
725
|
|
|
729
726
|
setattr(self, self.get_attention_name(), self.create_attention_op())
|
|
@@ -873,7 +870,8 @@ class AttentionOp(nn.Module):
|
|
|
873
870
|
|
|
874
871
|
def get_attn_op_name(self):
|
|
875
872
|
phase = "decode" if self.phase == "decode" else "prefill"
|
|
876
|
-
|
|
873
|
+
|
|
874
|
+
if self.use_attention_mask and not self.use_position_ids:
|
|
877
875
|
attn_op_name = "paged_attn_"
|
|
878
876
|
else:
|
|
879
877
|
attn_op_name = "paged_causal_attn_"
|
|
@@ -1074,7 +1072,7 @@ class FlashAttentionOp(AttentionOp):
|
|
|
1074
1072
|
|
|
1075
1073
|
def get_attn_op_name(self):
|
|
1076
1074
|
phase = "decode" if self.phase == "decode" else "prefill"
|
|
1077
|
-
if self.use_attention_mask:
|
|
1075
|
+
if self.use_attention_mask and not self.use_position_ids:
|
|
1078
1076
|
attn_op_name = "paged_flash_attn_"
|
|
1079
1077
|
else:
|
|
1080
1078
|
attn_op_name = "paged_flash_causal_attn_"
|
|
@@ -1128,7 +1126,7 @@ class FlashAttentionOp(AttentionOp):
|
|
|
1128
1126
|
"partition": self.kvcache_partition_size,
|
|
1129
1127
|
}
|
|
1130
1128
|
|
|
1131
|
-
if self.use_attention_mask
|
|
1129
|
+
if self.use_attention_mask:
|
|
1132
1130
|
op_args["mask"] = attn_mask
|
|
1133
1131
|
|
|
1134
1132
|
if self.phase == "prefill" or self.phase == "image_prefill":
|
|
@@ -1151,8 +1149,8 @@ class FlashAttentionOp(AttentionOp):
|
|
|
1151
1149
|
class SlidingWindowAttentionOp(AttentionOp):
|
|
1152
1150
|
def get_attn_op_name(self):
|
|
1153
1151
|
phase = "decode" if self.phase == "decode" else "prefill"
|
|
1154
|
-
if self.use_attention_mask:
|
|
1155
|
-
raise NotImplementedError("Attention mask is
|
|
1152
|
+
if not self.use_attention_mask:
|
|
1153
|
+
raise NotImplementedError("Attention mask is needed for sliding window attention.")
|
|
1156
1154
|
|
|
1157
1155
|
attn_op_name = "paged_sliding_window_attn_" + phase
|
|
1158
1156
|
return attn_op_name
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/.github/workflows/rbln_optimum_inference_test.yaml
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/image-to-text/run_llava_next_image_to_text.py
RENAMED
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/kandinsky2_2/run_kandinsky2_2_combined.py
RENAMED
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/kandinsky2_2/run_kandinsky2_2_img2img.py
RENAMED
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/kandinsky2_2/run_kandinsky2_2_inpaint.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/question-answering/run_question_answering.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/stable-diffusion/run_stable_diffusion.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/stable-diffusion/run_stable_diffusion_lora.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/text-classification/run_secureBERT.py
RENAMED
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/text-classification/run_t5_classification.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/examples/text2text-generation/run_llama_peft.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/configurations/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/modeling_diffusers.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/autoencoders/vae.py
RENAMED
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/controlnet.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/models/unets/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/diffusers/pipelines/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/configuration_generic.py
RENAMED
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/modeling_generic.py
RENAMED
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/modeling_rope_utils.py
RENAMED
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/auto/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/bart/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/bert/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/clip/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/dpt/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gemma/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{optimum_rbln-0.8.2a0 → optimum_rbln-0.8.2a1}/src/optimum/rbln/transformers/models/gpt2/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|