optimum-rbln 0.8.1rc0__tar.gz → 0.8.2__tar.gz
This diff compares the contents of two publicly available package versions, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.
Potentially problematic release.
This version of optimum-rbln might be problematic. Click here for more details.
- optimum_rbln-0.8.2/.github/version.yaml +1 -0
- optimum_rbln-0.8.2/.github/workflows/rbln_optimum_pytest.yaml +138 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/workflows/rbln_scheduled_test.yaml +2 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/workflows/rbln_trigger_on_pr.yaml +0 -9
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/PKG-INFO +1 -1
- optimum_rbln-0.8.2/assets/rbln_logo.png +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/pyproject.toml +1 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/__init__.py +58 -9
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/__version__.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/configuration_utils.py +24 -5
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/models/__init__.py +1 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/models/configuration_autoencoder_kl.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/models/configuration_autoencoder_kl_cosmos.py +5 -3
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/models/configuration_controlnet.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/models/configuration_prior_transformer.py +2 -2
- optimum_rbln-0.8.1rc0/src/optimum/rbln/diffusers/configurations/models/configuration_cosmos_transformer.py → optimum_rbln-0.8.2/src/optimum/rbln/diffusers/configurations/models/configuration_transformer_cosmos.py +7 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/models/configuration_transformer_sd3.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/models/configuration_unet_2d_condition.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/models/configuration_vq_model.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_controlnet.py +3 -3
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_cosmos.py +10 -6
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_kandinsky2_2.py +4 -4
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_3.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_xl.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/modeling_diffusers.py +4 -5
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/__init__.py +3 -13
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/autoencoders/autoencoder_kl.py +1 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/autoencoders/autoencoder_kl_cosmos.py +1 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/autoencoders/vq_model.py +1 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/transformers/transformer_cosmos.py +1 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/__init__.py +1 -5
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/cosmos/configuration_cosmos_guardrail.py +12 -4
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/cosmos/cosmos_guardrail.py +4 -26
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/cosmos/pipeline_cosmos_text2world.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/cosmos/pipeline_cosmos_video2world.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_combined.py +1 -6
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/modeling.py +4 -5
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/modeling_base.py +18 -14
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/ops/kv_cache_update.py +5 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/ops/linear.py +7 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/__init__.py +60 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/configuration_generic.py +4 -4
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/modeling_attention_utils.py +252 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/modeling_generic.py +1 -4
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/__init__.py +45 -30
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/bart/bart_architecture.py +2 -7
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/blip_2/configuration_blip_2.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/blip_2/modeling_blip_2.py +1 -5
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/clip/configuration_clip.py +14 -3
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/clip/modeling_clip.py +123 -28
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/colpali/colpali_architecture.py +1 -4
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/colpali/configuration_colpali.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/colpali/modeling_colpali.py +2 -10
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/decoderonly/__init__.py +2 -2
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py +392 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py +323 -454
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +579 -362
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/exaone/exaone_architecture.py +17 -42
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/gemma/__init__.py +16 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/gemma/configuration_gemma.py +9 -1
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/gemma/gemma_architecture.py +27 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/gemma/modeling_gemma.py +22 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/gemma3/configuration_gemma3.py +21 -9
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/gemma3/gemma3_architecture.py +9 -63
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/gemma3/modeling_gemma3.py +200 -292
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/gpt2/__init__.py +16 -0
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/gpt2/configuration_gpt2.py +50 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/gpt2/gpt2_architecture.py +19 -24
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/gpt2/modeling_gpt2.py +18 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/idefics3/configuration_idefics3.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/idefics3/modeling_idefics3.py +3 -9
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/llama/__init__.py +16 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/llama/configuration_llama.py +9 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/llama/modeling_llama.py +22 -1
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/llava/__init__.py +16 -0
- optimum_rbln-0.8.1rc0/src/optimum/rbln/transformers/models/llava_next/configuration_llava_next.py → optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/llava/configuration_llava.py +5 -5
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/llava/modeling_llava.py +419 -0
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/llava_next/configuration_llava_next.py +71 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/llava_next/modeling_llava_next.py +6 -16
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/midm/midm_architecture.py +14 -22
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/mistral/__init__.py +16 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/mistral/configuration_mistral.py +9 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/mistral/mistral_architecture.py +1 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/mistral/modeling_mistral.py +26 -3
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/opt/__init__.py +16 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/opt/configuration_opt.py +8 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/opt/modeling_opt.py +41 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/opt/opt_architecture.py +16 -25
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/pegasus/__init__.py +17 -0
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/pegasus/configuration_pegasus.py +34 -0
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/pegasus/modeling_pegasus.py +69 -0
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/pegasus/pegasus_architecture.py +161 -0
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/phi/__init__.py +16 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/phi/configuration_phi.py +9 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/phi/modeling_phi.py +10 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/phi/phi_architecture.py +16 -22
- {optimum_rbln-0.8.1rc0/src/optimum/rbln/transformers/models/gpt2 → optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/pixtral}/__init__.py +2 -2
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/pixtral/configuration_pixtral.py +43 -0
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/pixtral/modeling_pixtral.py +315 -0
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/pixtral/pixtral_architecture.py +73 -0
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/qwen2/__init__.py +16 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/qwen2/configuration_qwen2.py +9 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/qwen2/modeling_qwen2.py +27 -1
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py +3 -3
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py +5 -15
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py +1 -4
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/qwen3/__init__.py +16 -0
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/qwen3/configuration_qwen3.py +71 -0
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/qwen3/modeling_qwen3.py +133 -0
- optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/qwen3/qwen3_architecture.py +31 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/seq2seq/configuration_seq2seq.py +2 -12
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py +3 -1
- {optimum_rbln-0.8.1rc0/src/optimum/rbln/transformers/models/gemma → optimum_rbln-0.8.2/src/optimum/rbln/transformers/models/siglip}/__init__.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/siglip/modeling_siglip.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/time_series_transformer/configuration_time_series_transformer.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/time_series_transformer/modeling_time_series_transformer.py +3 -5
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/whisper/configuration_whisper.py +3 -12
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/whisper/modeling_whisper.py +8 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/xlm_roberta/__init__.py +2 -8
- optimum_rbln-0.8.2/src/optimum/rbln/utils/depreacate_utils.py +16 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/utils/hub.py +8 -47
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/utils/runtime_utils.py +31 -5
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/tests/test_base.py +84 -78
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/tests/test_diffusers.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/tests/test_llm.py +254 -14
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/tests/test_transformers.py +2 -2
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/uv.lock +984 -962
- optimum_rbln-0.8.1rc0/.github/version.yaml +0 -1
- optimum_rbln-0.8.1rc0/.github/workflows/rbln_optimum_pytest.yaml +0 -104
- optimum_rbln-0.8.1rc0/assets/rbln_logo.png +0 -0
- optimum_rbln-0.8.1rc0/examples/cosmos/run_cosmos_text2world.py +0 -70
- optimum_rbln-0.8.1rc0/src/optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py +0 -223
- optimum_rbln-0.8.1rc0/src/optimum/rbln/transformers/models/gemma/gemma_architecture.py +0 -68
- optimum_rbln-0.8.1rc0/src/optimum/rbln/transformers/models/gpt2/configuration_gpt2.py +0 -22
- optimum_rbln-0.8.1rc0/src/optimum/rbln/transformers/models/llama/__init__.py +0 -16
- optimum_rbln-0.8.1rc0/src/optimum/rbln/transformers/models/mistral/__init__.py +0 -16
- optimum_rbln-0.8.1rc0/src/optimum/rbln/transformers/models/opt/__init__.py +0 -16
- optimum_rbln-0.8.1rc0/src/optimum/rbln/transformers/models/phi/__init__.py +0 -16
- optimum_rbln-0.8.1rc0/src/optimum/rbln/transformers/models/qwen2/__init__.py +0 -16
- optimum_rbln-0.8.1rc0/src/optimum/rbln/transformers/models/siglip/__init__.py +0 -20
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/ISSUE_TEMPLATE/config.yml +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/ISSUE_TEMPLATE/model_request.md +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/pull_request_template.md +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/scripts/auto_code_review.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/scripts/validate_docstrings.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/scripts/validate_pr_checklist.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/workflows/auto_code_review.yml +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/workflows/check_code_quality.yml +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/workflows/deploy-on-tag.yaml +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/workflows/deploy.yaml +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/workflows/pr-title-check.yaml +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/workflows/pr_checklist_validator.yml +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/workflows/rbln_check_compiler.yaml +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/workflows/rbln_dispatch_pytest.yaml +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/workflows/rbln_optimum_inference_test.yaml +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.github/workflows/test-docstrings.yml +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/.gitignore +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/CODE_OF_CONDUCT.md +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/CONTRIBUTING.md +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/LICENSE +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/README.md +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/advanced/custom_class.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/audio-classification/run_ast_audio_classification.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/depth-estimation/run_dpt.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/image-classification/run_image_classification.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/image-classification/run_vit_image_classification.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/image-to-text/run_idefics3.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/image-to-text/run_llava_next_image_to_text.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/kandinsky2_2/run_kandinsky2_2.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/kandinsky2_2/run_kandinsky2_2_combined.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/kandinsky2_2/run_kandinsky2_2_img2img.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/kandinsky2_2/run_kandinsky2_2_img2img_combined.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/kandinsky2_2/run_kandinsky2_2_inpaint.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/kandinsky2_2/run_kandinsky2_2_inpaint_combined.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/kandinsky2_2/run_kandinsky2_2_prior_interpolate.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/question-answering/run_question_answering.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/speech-recognition/run_wav2vec2.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/speech-recognition/run_whisper.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/stable-diffusion/run_stable_diffusion.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/stable-diffusion/run_stable_diffusion_controlnet.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/stable-diffusion/run_stable_diffusion_img2img.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/stable-diffusion/run_stable_diffusion_img2img_controlnet.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/stable-diffusion/run_stable_diffusion_inpaint.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/stable-diffusion/run_stable_diffusion_lora.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/stable-diffusion/run_stable_diffusion_multicontrolnet.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/text-classification/run_bge_m3_text_classification.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/text-classification/run_bge_reranker_v2_m3_text_classification.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/text-classification/run_secureBERT.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/text-classification/run_t5_classification.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/text-classification/run_twitter_roberta_text_classification.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/text2text-generation/run_bart_text2text_generation.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/text2text-generation/run_llama_peft.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/text2text-generation/run_llama_text2text_generation.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/examples/time-series-forecasting/run_time_series_forecasting.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/scripts/uv-lock.sh +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/scripts/uv-sync.sh +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/configurations/pipelines/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/autoencoders/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/autoencoders/vae.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/controlnet.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/transformers/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/transformers/prior_transformer.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/transformers/transformer_sd3.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/unets/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/models/unets/unet_2d_condition.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/controlnet/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/cosmos/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_img2img.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_inpaint.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_prior.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_inpaint.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/ops/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/ops/attn.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/ops/flash_attn.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/ops/sliding_window_attn.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/modeling_rope_utils.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/audio_spectrogram_transformer/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/audio_spectrogram_transformer/configuration_audio_spectrogram_transformer.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/audio_spectrogram_transformer/modeling_audio_spectrogram_transformer.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/auto/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/auto/auto_factory.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/auto/modeling_auto.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/bart/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/bart/configuration_bart.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/bart/modeling_bart.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/bert/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/bert/configuration_bert.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/bert/modeling_bert.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/blip_2/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/clip/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/colpali/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/distilbert/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/distilbert/configuration_distilbert.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/distilbert/modeling_distilbert.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/dpt/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/dpt/configuration_dpt.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/dpt/modeling_dpt.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/exaone/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/exaone/configuration_exaone.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/exaone/modeling_exaone.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/gemma3/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/idefics3/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/llama/llama_architecture.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/llava_next/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/midm/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/midm/configuration_midm.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/midm/modeling_midm.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/qwen2/qwen2_architecture.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/qwen2_5_vl/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/resnet/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/resnet/configuration_resnet.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/resnet/modeling_resnet.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/roberta/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/roberta/configuration_roberta.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/roberta/modeling_roberta.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/seq2seq/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/siglip/configuration_siglip.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/t5/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/t5/configuration_t5.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/t5/modeling_t5.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/t5/t5_architecture.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/time_series_transformer/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/time_series_transformer/time_series_transformers_architecture.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/vit/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/vit/configuration_vit.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/vit/modeling_vit.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/wav2vec2/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/wav2vec2/configuration_wav2vec2.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/whisper/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/whisper/generation_whisper.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/whisper/whisper_architecture.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/xlm_roberta/configuration_xlm_roberta.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/utils/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/transformers/utils/rbln_quantization.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/utils/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/utils/decorator_utils.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/utils/import_utils.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/utils/logging.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/utils/model_utils.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/utils/save_utils.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/src/optimum/rbln/utils/submodule.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/tests/__init__.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/tests/psnr.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/tests/requirements_sdxl.txt +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/tests/run_stable_diffusion_xl_base.py +0 -0
- {optimum_rbln-0.8.1rc0 → optimum_rbln-0.8.2}/tests/test_config.py +0 -0
|
@@ -0,0 +1 @@
|
|
|
1
|
+
rebel_compiler_version: 0.8.2.dev187+g9f5b6c9b
|
|
@@ -0,0 +1,138 @@
|
|
|
1
|
+
name: Optimum-rbln / PR / Pytest
|
|
2
|
+
|
|
3
|
+
on:
|
|
4
|
+
workflow_call:
|
|
5
|
+
inputs:
|
|
6
|
+
ref:
|
|
7
|
+
description: "ref to checkout"
|
|
8
|
+
required: false
|
|
9
|
+
type: string
|
|
10
|
+
pr_number:
|
|
11
|
+
description: "PR number to run"
|
|
12
|
+
required: false
|
|
13
|
+
type: string
|
|
14
|
+
rebel_compiler_version:
|
|
15
|
+
description: "rebel_compiler version to run"
|
|
16
|
+
required: true
|
|
17
|
+
type: string
|
|
18
|
+
test_level:
|
|
19
|
+
description: "Test level for OPTIMUM_RBLN_TEST_LEVEL (default, full, essential)"
|
|
20
|
+
required: false
|
|
21
|
+
type: string
|
|
22
|
+
default: "default"
|
|
23
|
+
enable_hf_hub_tests:
|
|
24
|
+
description: "Whether to enable HF Hub tests (requires HF credentials)"
|
|
25
|
+
required: false
|
|
26
|
+
type: boolean
|
|
27
|
+
default: false
|
|
28
|
+
fail_fast:
|
|
29
|
+
description: "Whether to fail fast when one matrix job fails"
|
|
30
|
+
required: false
|
|
31
|
+
type: boolean
|
|
32
|
+
default: true
|
|
33
|
+
|
|
34
|
+
env:
|
|
35
|
+
REBEL_PYPI_ENDPOINT: ${{ vars.REBEL_PYPI_INTERNAL_ENDPOINT }}
|
|
36
|
+
REBEL_PYPI_USERNAME: ${{ secrets.REBEL_PYPI_USERNAME }}
|
|
37
|
+
REBEL_PYPI_PASSWORD: ${{ secrets.REBEL_PYPI_PASSWORD }}
|
|
38
|
+
HF_HOME: ${{ secrets.HF_HOME }}
|
|
39
|
+
HF_USER_ID: ${{ inputs.enable_hf_hub_tests && secrets.HF_USER_ID || '' }}
|
|
40
|
+
HF_AUTH_TOKEN: ${{ inputs.enable_hf_hub_tests && secrets.HF_AUTH_TOKEN || '' }}
|
|
41
|
+
|
|
42
|
+
jobs:
|
|
43
|
+
pytest:
|
|
44
|
+
name: Pytest (${{ matrix.test_type }})
|
|
45
|
+
runs-on: vm-ci-0
|
|
46
|
+
strategy:
|
|
47
|
+
fail-fast: ${{ inputs.fail_fast }}
|
|
48
|
+
matrix:
|
|
49
|
+
test_type: [config, transformers, diffusers, llm]
|
|
50
|
+
steps:
|
|
51
|
+
- name: Checkout the optimum-rbln repository
|
|
52
|
+
uses: actions/checkout@v4
|
|
53
|
+
with:
|
|
54
|
+
ref: ${{ inputs.pr_number && format('refs/pull/{0}/merge', inputs.pr_number) || inputs.ref }}
|
|
55
|
+
submodules: recursive
|
|
56
|
+
fetch-depth: 0
|
|
57
|
+
|
|
58
|
+
- name: Get commit message if not provided
|
|
59
|
+
id: get_commit_message
|
|
60
|
+
if: ${{ inputs.commit_message == '' }}
|
|
61
|
+
run: |
|
|
62
|
+
COMMIT_MESSAGE=$(git log -1 --pretty=%B)
|
|
63
|
+
echo "message<<EOF" >> $GITHUB_OUTPUT
|
|
64
|
+
echo "$COMMIT_MESSAGE" >> $GITHUB_OUTPUT
|
|
65
|
+
echo "EOF" >> $GITHUB_OUTPUT
|
|
66
|
+
|
|
67
|
+
- name: Check if test should be skipped
|
|
68
|
+
id: should_skip
|
|
69
|
+
run: |
|
|
70
|
+
COMMIT_MESSAGE="${{ steps.get_commit_message.outputs.message }}"
|
|
71
|
+
SKIP=false
|
|
72
|
+
|
|
73
|
+
case "${{ matrix.test_type }}" in
|
|
74
|
+
"transformers")
|
|
75
|
+
if [[ "$COMMIT_MESSAGE" == *"[skip-transformers]"* ]]; then
|
|
76
|
+
SKIP=true
|
|
77
|
+
fi
|
|
78
|
+
;;
|
|
79
|
+
"diffusers")
|
|
80
|
+
if [[ "$COMMIT_MESSAGE" == *"[skip-diffusers]"* ]]; then
|
|
81
|
+
SKIP=true
|
|
82
|
+
fi
|
|
83
|
+
;;
|
|
84
|
+
"llm")
|
|
85
|
+
if [[ "$COMMIT_MESSAGE" == *"[skip-llms]"* ]]; then
|
|
86
|
+
SKIP=true
|
|
87
|
+
fi
|
|
88
|
+
;;
|
|
89
|
+
esac
|
|
90
|
+
|
|
91
|
+
echo "skip=$SKIP" >> $GITHUB_OUTPUT
|
|
92
|
+
|
|
93
|
+
- name: Setup uv
|
|
94
|
+
if: steps.should_skip.outputs.skip != 'true'
|
|
95
|
+
uses: astral-sh/setup-uv@v3
|
|
96
|
+
with:
|
|
97
|
+
enable-cache: true
|
|
98
|
+
cache-dependency-glob: "uv.lock"
|
|
99
|
+
|
|
100
|
+
- name: Setup Python
|
|
101
|
+
if: steps.should_skip.outputs.skip != 'true'
|
|
102
|
+
run: uv python install 3.9
|
|
103
|
+
|
|
104
|
+
- name: Install optimum-rbln with tests group dependencies
|
|
105
|
+
if: steps.should_skip.outputs.skip != 'true'
|
|
106
|
+
run: |
|
|
107
|
+
uv sync --frozen --group tests --reinstall-package optimum-rbln
|
|
108
|
+
|
|
109
|
+
- name: Install rebel-compiler
|
|
110
|
+
if: steps.should_skip.outputs.skip != 'true'
|
|
111
|
+
run: |
|
|
112
|
+
PYPI_URL=$(echo ${{ env.REBEL_PYPI_ENDPOINT }} | sed "s/\/\//\0${{ env.REBEL_PYPI_USERNAME}}:${{ env.REBEL_PYPI_PASSWORD}}@/")
|
|
113
|
+
uv pip install --extra-index-url $PYPI_URL rebel-compiler==${{ inputs.rebel_compiler_version }}
|
|
114
|
+
|
|
115
|
+
- name: Run pytest
|
|
116
|
+
if: steps.should_skip.outputs.skip != 'true'
|
|
117
|
+
env:
|
|
118
|
+
OPTIMUM_RBLN_TEST_LEVEL: ${{ inputs.test_level }}
|
|
119
|
+
run: |
|
|
120
|
+
case "${{ matrix.test_type }}" in
|
|
121
|
+
"config")
|
|
122
|
+
uv run --no-sync pytest tests/test_config.py -vv --durations 0
|
|
123
|
+
;;
|
|
124
|
+
"transformers")
|
|
125
|
+
uv run --no-sync pytest tests/test_transformers.py -vv --durations 0
|
|
126
|
+
;;
|
|
127
|
+
"diffusers")
|
|
128
|
+
uv run --no-sync pytest tests/test_diffusers.py -vv --durations 0
|
|
129
|
+
;;
|
|
130
|
+
"llm")
|
|
131
|
+
uv run --no-sync pytest tests/test_llm.py -vv --durations 0
|
|
132
|
+
;;
|
|
133
|
+
esac
|
|
134
|
+
|
|
135
|
+
- name: Skip message
|
|
136
|
+
if: steps.should_skip.outputs.skip == 'true'
|
|
137
|
+
run: |
|
|
138
|
+
echo "Found [skip-${{ matrix.test_type }}] in commit message, skipping CI"
|
|
@@ -92,13 +92,4 @@ jobs:
|
|
|
92
92
|
ref: ${{ github.event.pull_request.head.sha }}
|
|
93
93
|
rebel_compiler_version: ${{ needs.check-compiler.outputs.compiler_version }}
|
|
94
94
|
test_level: "default"
|
|
95
|
-
secrets: inherit
|
|
96
|
-
|
|
97
|
-
optimum-rbln-inference-test:
|
|
98
|
-
needs: [check-skip-ci, check-code-quality, test-docstrings, check-compiler, check-team-member]
|
|
99
|
-
if: ${{ needs.check-skip-ci.outputs.should_skip != 'true' && needs.check-team-member.outputs.is_team_member == 'true' }}
|
|
100
|
-
uses: ./.github/workflows/rbln_optimum_inference_test.yaml
|
|
101
|
-
with:
|
|
102
|
-
ref: ${{ github.event.pull_request.head.sha }}
|
|
103
|
-
rebel_compiler_version: ${{ needs.check-compiler.outputs.compiler_version }}
|
|
104
95
|
secrets: inherit
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: optimum-rbln
|
|
3
|
-
Version: 0.8.1rc0
|
|
3
|
+
Version: 0.8.2
|
|
4
4
|
Summary: Optimum RBLN is the interface between the HuggingFace Transformers and Diffusers libraries and RBLN accelerators. It provides a set of tools enabling easy model loading and inference on single and multiple rbln device settings for different downstream tasks.
|
|
5
5
|
Project-URL: Homepage, https://rebellions.ai
|
|
6
6
|
Project-URL: Documentation, https://docs.rbln.ai
|
|
Binary file
|
|
@@ -72,6 +72,8 @@ _import_structure = {
|
|
|
72
72
|
"RBLNCLIPVisionModelWithProjectionConfig",
|
|
73
73
|
"RBLNColPaliForRetrieval",
|
|
74
74
|
"RBLNColPaliForRetrievalConfig",
|
|
75
|
+
"RBLNDecoderOnlyModelConfig",
|
|
76
|
+
"RBLNDecoderOnlyModel",
|
|
75
77
|
"RBLNDecoderOnlyModelForCausalLM",
|
|
76
78
|
"RBLNDecoderOnlyModelForCausalLMConfig",
|
|
77
79
|
"RBLNDistilBertForQuestionAnswering",
|
|
@@ -80,12 +82,16 @@ _import_structure = {
|
|
|
80
82
|
"RBLNDPTForDepthEstimationConfig",
|
|
81
83
|
"RBLNExaoneForCausalLM",
|
|
82
84
|
"RBLNExaoneForCausalLMConfig",
|
|
85
|
+
"RBLNGemmaModel",
|
|
86
|
+
"RBLNGemmaModelConfig",
|
|
83
87
|
"RBLNGemmaForCausalLM",
|
|
84
88
|
"RBLNGemmaForCausalLMConfig",
|
|
85
89
|
"RBLNGemma3ForCausalLM",
|
|
86
90
|
"RBLNGemma3ForCausalLMConfig",
|
|
87
91
|
"RBLNGemma3ForConditionalGeneration",
|
|
88
92
|
"RBLNGemma3ForConditionalGenerationConfig",
|
|
93
|
+
"RBLNGPT2Model",
|
|
94
|
+
"RBLNGPT2ModelConfig",
|
|
89
95
|
"RBLNGPT2LMHeadModel",
|
|
90
96
|
"RBLNGPT2LMHeadModelConfig",
|
|
91
97
|
"RBLNIdefics3VisionTransformer",
|
|
@@ -94,22 +100,44 @@ _import_structure = {
|
|
|
94
100
|
"RBLNIdefics3VisionTransformerConfig",
|
|
95
101
|
"RBLNLlamaForCausalLM",
|
|
96
102
|
"RBLNLlamaForCausalLMConfig",
|
|
103
|
+
"RBLNLlamaModel",
|
|
104
|
+
"RBLNLlamaModelConfig",
|
|
97
105
|
"RBLNOPTForCausalLM",
|
|
98
106
|
"RBLNOPTForCausalLMConfig",
|
|
107
|
+
"RBLNLlavaForConditionalGeneration",
|
|
108
|
+
"RBLNLlavaForConditionalGenerationConfig",
|
|
99
109
|
"RBLNLlavaNextForConditionalGeneration",
|
|
100
110
|
"RBLNLlavaNextForConditionalGenerationConfig",
|
|
101
111
|
"RBLNMidmLMHeadModel",
|
|
102
112
|
"RBLNMidmLMHeadModelConfig",
|
|
113
|
+
"RBLNMistralModel",
|
|
114
|
+
"RBLNMistralModelConfig",
|
|
103
115
|
"RBLNMistralForCausalLM",
|
|
104
116
|
"RBLNMistralForCausalLMConfig",
|
|
117
|
+
"RBLNOPTModel",
|
|
118
|
+
"RBLNOPTModelConfig",
|
|
119
|
+
"RBLNPegasusForConditionalGeneration",
|
|
120
|
+
"RBLNPegasusForConditionalGenerationConfig",
|
|
121
|
+
"RBLNPegasusModel",
|
|
122
|
+
"RBLNPegasusModelConfig",
|
|
105
123
|
"RBLNPhiForCausalLM",
|
|
106
124
|
"RBLNPhiForCausalLMConfig",
|
|
125
|
+
"RBLNPixtralVisionModel",
|
|
126
|
+
"RBLNPixtralVisionModelConfig",
|
|
127
|
+
"RBLNPhiModel",
|
|
128
|
+
"RBLNPhiModelConfig",
|
|
107
129
|
"RBLNQwen2ForCausalLM",
|
|
108
130
|
"RBLNQwen2ForCausalLMConfig",
|
|
109
131
|
"RBLNQwen2_5_VisionTransformerPretrainedModel",
|
|
110
132
|
"RBLNQwen2_5_VisionTransformerPretrainedModelConfig",
|
|
111
133
|
"RBLNQwen2_5_VLForConditionalGeneration",
|
|
112
134
|
"RBLNQwen2_5_VLForConditionalGenerationConfig",
|
|
135
|
+
"RBLNQwen2Model",
|
|
136
|
+
"RBLNQwen2ModelConfig",
|
|
137
|
+
"RBLNQwen3ForCausalLM",
|
|
138
|
+
"RBLNQwen3ForCausalLMConfig",
|
|
139
|
+
"RBLNQwen3Model",
|
|
140
|
+
"RBLNQwen3ModelConfig",
|
|
113
141
|
"RBLNResNetForImageClassification",
|
|
114
142
|
"RBLNResNetForImageClassificationConfig",
|
|
115
143
|
"RBLNRobertaForMaskedLM",
|
|
@@ -203,11 +231,7 @@ _import_structure = {
|
|
|
203
231
|
}
|
|
204
232
|
|
|
205
233
|
if TYPE_CHECKING:
|
|
206
|
-
from .configuration_utils import (
|
|
207
|
-
RBLNAutoConfig,
|
|
208
|
-
RBLNCompileConfig,
|
|
209
|
-
RBLNModelConfig,
|
|
210
|
-
)
|
|
234
|
+
from .configuration_utils import RBLNAutoConfig, RBLNCompileConfig, RBLNModelConfig
|
|
211
235
|
from .diffusers import (
|
|
212
236
|
RBLNAutoencoderKL,
|
|
213
237
|
RBLNAutoencoderKLConfig,
|
|
@@ -273,10 +297,7 @@ if TYPE_CHECKING:
|
|
|
273
297
|
RBLNVQModel,
|
|
274
298
|
RBLNVQModelConfig,
|
|
275
299
|
)
|
|
276
|
-
from .modeling import (
|
|
277
|
-
RBLNBaseModel,
|
|
278
|
-
RBLNModel,
|
|
279
|
-
)
|
|
300
|
+
from .modeling import RBLNBaseModel, RBLNModel
|
|
280
301
|
from .transformers import (
|
|
281
302
|
RBLNASTForAudioClassification,
|
|
282
303
|
RBLNASTForAudioClassificationConfig,
|
|
@@ -319,6 +340,8 @@ if TYPE_CHECKING:
|
|
|
319
340
|
RBLNCLIPVisionModelWithProjectionConfig,
|
|
320
341
|
RBLNColPaliForRetrieval,
|
|
321
342
|
RBLNColPaliForRetrievalConfig,
|
|
343
|
+
RBLNDecoderOnlyModel,
|
|
344
|
+
RBLNDecoderOnlyModelConfig,
|
|
322
345
|
RBLNDecoderOnlyModelForCausalLM,
|
|
323
346
|
RBLNDecoderOnlyModelForCausalLMConfig,
|
|
324
347
|
RBLNDistilBertForQuestionAnswering,
|
|
@@ -333,30 +356,56 @@ if TYPE_CHECKING:
|
|
|
333
356
|
RBLNGemma3ForConditionalGenerationConfig,
|
|
334
357
|
RBLNGemmaForCausalLM,
|
|
335
358
|
RBLNGemmaForCausalLMConfig,
|
|
359
|
+
RBLNGemmaModel,
|
|
360
|
+
RBLNGemmaModelConfig,
|
|
336
361
|
RBLNGPT2LMHeadModel,
|
|
337
362
|
RBLNGPT2LMHeadModelConfig,
|
|
363
|
+
RBLNGPT2Model,
|
|
364
|
+
RBLNGPT2ModelConfig,
|
|
338
365
|
RBLNIdefics3ForConditionalGeneration,
|
|
339
366
|
RBLNIdefics3ForConditionalGenerationConfig,
|
|
340
367
|
RBLNIdefics3VisionTransformer,
|
|
341
368
|
RBLNIdefics3VisionTransformerConfig,
|
|
342
369
|
RBLNLlamaForCausalLM,
|
|
343
370
|
RBLNLlamaForCausalLMConfig,
|
|
371
|
+
RBLNLlamaModel,
|
|
372
|
+
RBLNLlamaModelConfig,
|
|
373
|
+
RBLNLlavaForConditionalGeneration,
|
|
374
|
+
RBLNLlavaForConditionalGenerationConfig,
|
|
344
375
|
RBLNLlavaNextForConditionalGeneration,
|
|
345
376
|
RBLNLlavaNextForConditionalGenerationConfig,
|
|
346
377
|
RBLNMidmLMHeadModel,
|
|
347
378
|
RBLNMidmLMHeadModelConfig,
|
|
348
379
|
RBLNMistralForCausalLM,
|
|
349
380
|
RBLNMistralForCausalLMConfig,
|
|
381
|
+
RBLNMistralModel,
|
|
382
|
+
RBLNMistralModelConfig,
|
|
350
383
|
RBLNOPTForCausalLM,
|
|
351
384
|
RBLNOPTForCausalLMConfig,
|
|
385
|
+
RBLNOPTModel,
|
|
386
|
+
RBLNOPTModelConfig,
|
|
387
|
+
RBLNPegasusForConditionalGeneration,
|
|
388
|
+
RBLNPegasusForConditionalGenerationConfig,
|
|
389
|
+
RBLNPegasusModel,
|
|
390
|
+
RBLNPegasusModelConfig,
|
|
352
391
|
RBLNPhiForCausalLM,
|
|
353
392
|
RBLNPhiForCausalLMConfig,
|
|
393
|
+
RBLNPhiModel,
|
|
394
|
+
RBLNPhiModelConfig,
|
|
395
|
+
RBLNPixtralVisionModel,
|
|
396
|
+
RBLNPixtralVisionModelConfig,
|
|
354
397
|
RBLNQwen2_5_VisionTransformerPretrainedModel,
|
|
355
398
|
RBLNQwen2_5_VisionTransformerPretrainedModelConfig,
|
|
356
399
|
RBLNQwen2_5_VLForConditionalGeneration,
|
|
357
400
|
RBLNQwen2_5_VLForConditionalGenerationConfig,
|
|
358
401
|
RBLNQwen2ForCausalLM,
|
|
359
402
|
RBLNQwen2ForCausalLMConfig,
|
|
403
|
+
RBLNQwen2Model,
|
|
404
|
+
RBLNQwen2ModelConfig,
|
|
405
|
+
RBLNQwen3ForCausalLM,
|
|
406
|
+
RBLNQwen3ForCausalLMConfig,
|
|
407
|
+
RBLNQwen3Model,
|
|
408
|
+
RBLNQwen3ModelConfig,
|
|
360
409
|
RBLNResNetForImageClassification,
|
|
361
410
|
RBLNResNetForImageClassificationConfig,
|
|
362
411
|
RBLNRobertaForMaskedLM,
|
|
@@ -17,5 +17,5 @@ __version__: str
|
|
|
17
17
|
__version_tuple__: VERSION_TUPLE
|
|
18
18
|
version_tuple: VERSION_TUPLE
|
|
19
19
|
|
|
20
|
-
__version__ = version = '0.8.1rc0'
|
|
21
|
-
__version_tuple__ = version_tuple = (0, 8,
|
|
20
|
+
__version__ = version = '0.8.2'
|
|
21
|
+
__version_tuple__ = version_tuple = (0, 8, 2)
|
|
@@ -23,6 +23,7 @@ import numpy as np
|
|
|
23
23
|
import torch
|
|
24
24
|
|
|
25
25
|
from .__version__ import __version__
|
|
26
|
+
from .utils.depreacate_utils import warn_deprecated_npu
|
|
26
27
|
from .utils.logging import get_logger
|
|
27
28
|
from .utils.runtime_utils import ContextRblnConfig
|
|
28
29
|
|
|
@@ -147,7 +148,7 @@ class RBLNCompileConfig:
|
|
|
147
148
|
return asdict(self)
|
|
148
149
|
|
|
149
150
|
|
|
150
|
-
RUNTIME_KEYWORDS = ["create_runtimes", "optimize_host_memory", "device", "device_map", "activate_profiler"]
|
|
151
|
+
RUNTIME_KEYWORDS = ["create_runtimes", "optimize_host_memory", "device", "device_map", "activate_profiler", "timeout"]
|
|
151
152
|
CONFIG_MAPPING: Dict[str, Type["RBLNModelConfig"]] = {}
|
|
152
153
|
|
|
153
154
|
|
|
@@ -481,6 +482,7 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
|
|
|
481
482
|
"device",
|
|
482
483
|
"device_map",
|
|
483
484
|
"activate_profiler",
|
|
485
|
+
"timeout",
|
|
484
486
|
]
|
|
485
487
|
submodules: List[str] = []
|
|
486
488
|
subclass_non_save_attributes = []
|
|
@@ -489,7 +491,7 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
|
|
|
489
491
|
self,
|
|
490
492
|
submodule_config_cls: Type["RBLNModelConfig"],
|
|
491
493
|
submodule_config: Optional[Union[Dict[str, Any], "RBLNModelConfig"]] = None,
|
|
492
|
-
**kwargs:
|
|
494
|
+
**kwargs: Any,
|
|
493
495
|
) -> "RBLNModelConfig":
|
|
494
496
|
# Initialize a submodule config from a dict or a RBLNModelConfig.
|
|
495
497
|
# kwargs is specified from the predecessor config.
|
|
@@ -561,9 +563,10 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
|
|
|
561
563
|
activate_profiler: Optional[bool] = None,
|
|
562
564
|
npu: Optional[str] = None,
|
|
563
565
|
tensor_parallel_size: Optional[int] = None,
|
|
566
|
+
timeout: Optional[int] = None,
|
|
564
567
|
optimum_rbln_version: Optional[str] = None,
|
|
565
568
|
_compile_cfgs: List[RBLNCompileConfig] = [],
|
|
566
|
-
**kwargs:
|
|
569
|
+
**kwargs: Any,
|
|
567
570
|
):
|
|
568
571
|
"""
|
|
569
572
|
Initialize a RBLN model configuration with runtime options and compile configurations.
|
|
@@ -577,6 +580,7 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
|
|
|
577
580
|
activate_profiler (Optional[bool]): Whether to activate the profiler for performance analysis.
|
|
578
581
|
npu (Optional[str]): The NPU device name to use for compilation.
|
|
579
582
|
tensor_parallel_size (Optional[int]): Size for tensor parallelism to distribute the model across devices.
|
|
583
|
+
timeout (Optional[int]): The timeout for the runtime in seconds. If it isn't provided, it will be set to 60 by default.
|
|
580
584
|
optimum_rbln_version (Optional[str]): The optimum-rbln version used for this configuration.
|
|
581
585
|
_compile_cfgs (List[RBLNCompileConfig]): List of compilation configurations for the model.
|
|
582
586
|
**kwargs: Additional keyword arguments.
|
|
@@ -599,6 +603,7 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
|
|
|
599
603
|
self._runtime_options["device"] = device
|
|
600
604
|
self._runtime_options["device_map"] = device_map
|
|
601
605
|
self._runtime_options["activate_profiler"] = activate_profiler
|
|
606
|
+
self._runtime_options["timeout"] = timeout
|
|
602
607
|
|
|
603
608
|
# Automatically pass npu, tensor_parallel_size to compile_cfgs
|
|
604
609
|
self.npu = npu
|
|
@@ -671,6 +676,9 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
|
|
|
671
676
|
compile_cfg.npu = self.npu
|
|
672
677
|
compile_cfg.tensor_parallel_size = self.tensor_parallel_size
|
|
673
678
|
|
|
679
|
+
target_npu = self.npu or next((cfg.npu for cfg in self._compile_cfgs if cfg.npu is not None), None)
|
|
680
|
+
warn_deprecated_npu(target_npu)
|
|
681
|
+
|
|
674
682
|
def freeze(self):
|
|
675
683
|
if self._frozen:
|
|
676
684
|
raise RuntimeError(f"`{self.__class__.__name__}` is already frozen.")
|
|
@@ -709,7 +717,7 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
|
|
|
709
717
|
json.dump(serializable_data, jsonf, indent=2)
|
|
710
718
|
|
|
711
719
|
@classmethod
|
|
712
|
-
def load(cls, path: str, **kwargs:
|
|
720
|
+
def load(cls, path: str, **kwargs: Any) -> "RBLNModelConfig":
|
|
713
721
|
"""
|
|
714
722
|
Load a RBLNModelConfig from a path.
|
|
715
723
|
|
|
@@ -742,7 +750,7 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
|
|
|
742
750
|
def initialize_from_kwargs(
|
|
743
751
|
cls: Type["RBLNModelConfig"],
|
|
744
752
|
rbln_config: Optional[Union[Dict[str, Any], "RBLNModelConfig"]] = None,
|
|
745
|
-
**kwargs:
|
|
753
|
+
**kwargs: Any,
|
|
746
754
|
) -> Tuple["RBLNModelConfig", Dict[str, Any]]:
|
|
747
755
|
# Initialize RBLNModelConfig from kwargs.
|
|
748
756
|
kwargs_keys = list(kwargs.keys())
|
|
@@ -838,3 +846,14 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
|
|
|
838
846
|
@activate_profiler.setter
|
|
839
847
|
def activate_profiler(self, activate_profiler: bool):
|
|
840
848
|
self._runtime_options["activate_profiler"] = activate_profiler
|
|
849
|
+
|
|
850
|
+
@property
|
|
851
|
+
def timeout(self):
|
|
852
|
+
context = ContextRblnConfig.get_current_context()["timeout"]
|
|
853
|
+
if context is not None:
|
|
854
|
+
return context
|
|
855
|
+
return self._runtime_options["timeout"]
|
|
856
|
+
|
|
857
|
+
@timeout.setter
|
|
858
|
+
def timeout(self, timeout: int):
|
|
859
|
+
self._runtime_options["timeout"] = timeout
|
|
@@ -1,8 +1,8 @@
|
|
|
1
1
|
from .configuration_autoencoder_kl import RBLNAutoencoderKLConfig
|
|
2
2
|
from .configuration_autoencoder_kl_cosmos import RBLNAutoencoderKLCosmosConfig
|
|
3
3
|
from .configuration_controlnet import RBLNControlNetModelConfig
|
|
4
|
-
from .configuration_cosmos_transformer import RBLNCosmosTransformer3DModelConfig
|
|
5
4
|
from .configuration_prior_transformer import RBLNPriorTransformerConfig
|
|
5
|
+
from .configuration_transformer_cosmos import RBLNCosmosTransformer3DModelConfig
|
|
6
6
|
from .configuration_transformer_sd3 import RBLNSD3Transformer2DModelConfig
|
|
7
7
|
from .configuration_unet_2d_condition import RBLNUNet2DConditionModelConfig
|
|
8
8
|
from .configuration_vq_model import RBLNVQModelConfig
|
|
@@ -12,7 +12,7 @@
|
|
|
12
12
|
# See the License for the specific language governing permissions and
|
|
13
13
|
# limitations under the License.
|
|
14
14
|
|
|
15
|
-
from typing import Any,
|
|
15
|
+
from typing import Any, Optional, Tuple
|
|
16
16
|
|
|
17
17
|
from ....configuration_utils import RBLNModelConfig
|
|
18
18
|
|
|
@@ -33,7 +33,7 @@ class RBLNAutoencoderKLConfig(RBLNModelConfig):
|
|
|
33
33
|
vae_scale_factor: Optional[float] = None, # TODO: rename to scaling_factor
|
|
34
34
|
in_channels: Optional[int] = None,
|
|
35
35
|
latent_channels: Optional[int] = None,
|
|
36
|
-
**kwargs:
|
|
36
|
+
**kwargs: Any,
|
|
37
37
|
):
|
|
38
38
|
"""
|
|
39
39
|
Args:
|
|
@@ -12,7 +12,7 @@
|
|
|
12
12
|
# See the License for the specific language governing permissions and
|
|
13
13
|
# limitations under the License.
|
|
14
14
|
|
|
15
|
-
from typing import Optional
|
|
15
|
+
from typing import Any, Optional
|
|
16
16
|
|
|
17
17
|
from ....configuration_utils import RBLNModelConfig
|
|
18
18
|
from ....utils.logging import get_logger
|
|
@@ -22,6 +22,8 @@ logger = get_logger(__name__)
|
|
|
22
22
|
|
|
23
23
|
|
|
24
24
|
class RBLNAutoencoderKLCosmosConfig(RBLNModelConfig):
|
|
25
|
+
"""Configuration class for RBLN Cosmos Variational Autoencoder (VAE) models."""
|
|
26
|
+
|
|
25
27
|
def __init__(
|
|
26
28
|
self,
|
|
27
29
|
batch_size: Optional[int] = None,
|
|
@@ -33,7 +35,7 @@ class RBLNAutoencoderKLCosmosConfig(RBLNModelConfig):
|
|
|
33
35
|
vae_scale_factor_temporal: Optional[int] = None,
|
|
34
36
|
vae_scale_factor_spatial: Optional[int] = None,
|
|
35
37
|
use_slicing: Optional[bool] = None,
|
|
36
|
-
**kwargs,
|
|
38
|
+
**kwargs: Any,
|
|
37
39
|
):
|
|
38
40
|
"""
|
|
39
41
|
Args:
|
|
@@ -48,7 +50,7 @@ class RBLNAutoencoderKLCosmosConfig(RBLNModelConfig):
|
|
|
48
50
|
Determines how much shorter the latent representations are compared to the original videos.
|
|
49
51
|
vae_scale_factor_spatial (Optional[int]): The scaling factor between pixel space and latent space.
|
|
50
52
|
Determines how much smaller the latent representations are compared to the original videos.
|
|
51
|
-
use_slicing (Optional[
|
|
53
|
+
use_slicing (Optional[bool]): Enable sliced VAE encoding and decoding.
|
|
52
54
|
If True, the VAE will split the input tensor in slices to compute encoding or decoding in several steps.
|
|
53
55
|
**kwargs: Additional arguments passed to the parent RBLNModelConfig.
|
|
54
56
|
|
|
@@ -12,7 +12,7 @@
|
|
|
12
12
|
# See the License for the specific language governing permissions and
|
|
13
13
|
# limitations under the License.
|
|
14
14
|
|
|
15
|
-
from typing import Any,
|
|
15
|
+
from typing import Any, Optional, Tuple
|
|
16
16
|
|
|
17
17
|
from ....configuration_utils import RBLNModelConfig
|
|
18
18
|
|
|
@@ -29,7 +29,7 @@ class RBLNControlNetModelConfig(RBLNModelConfig):
|
|
|
29
29
|
unet_sample_size: Optional[Tuple[int, int]] = None,
|
|
30
30
|
vae_sample_size: Optional[Tuple[int, int]] = None,
|
|
31
31
|
text_model_hidden_size: Optional[int] = None,
|
|
32
|
-
**kwargs:
|
|
32
|
+
**kwargs: Any,
|
|
33
33
|
):
|
|
34
34
|
"""
|
|
35
35
|
Args:
|
|
@@ -12,7 +12,7 @@
|
|
|
12
12
|
# See the License for the specific language governing permissions and
|
|
13
13
|
# limitations under the License.
|
|
14
14
|
|
|
15
|
-
from typing import Any,
|
|
15
|
+
from typing import Any, Optional
|
|
16
16
|
|
|
17
17
|
from ....configuration_utils import RBLNModelConfig
|
|
18
18
|
|
|
@@ -32,7 +32,7 @@ class RBLNPriorTransformerConfig(RBLNModelConfig):
|
|
|
32
32
|
batch_size: Optional[int] = None,
|
|
33
33
|
embedding_dim: Optional[int] = None,
|
|
34
34
|
num_embeddings: Optional[int] = None,
|
|
35
|
-
**kwargs:
|
|
35
|
+
**kwargs: Any,
|
|
36
36
|
):
|
|
37
37
|
"""
|
|
38
38
|
Args:
|
|
@@ -12,12 +12,14 @@
|
|
|
12
12
|
# See the License for the specific language governing permissions and
|
|
13
13
|
# limitations under the License.
|
|
14
14
|
|
|
15
|
-
from typing import Optional
|
|
15
|
+
from typing import Any, Optional
|
|
16
16
|
|
|
17
17
|
from ....configuration_utils import RBLNModelConfig
|
|
18
18
|
|
|
19
19
|
|
|
20
20
|
class RBLNCosmosTransformer3DModelConfig(RBLNModelConfig):
|
|
21
|
+
"""Configuration class for RBLN Cosmos Transformer models."""
|
|
22
|
+
|
|
21
23
|
def __init__(
|
|
22
24
|
self,
|
|
23
25
|
batch_size: Optional[int] = None,
|
|
@@ -31,7 +33,7 @@ class RBLNCosmosTransformer3DModelConfig(RBLNModelConfig):
|
|
|
31
33
|
num_latent_frames: Optional[int] = None,
|
|
32
34
|
latent_height: Optional[int] = None,
|
|
33
35
|
latent_width: Optional[int] = None,
|
|
34
|
-
**kwargs,
|
|
36
|
+
**kwargs: Any,
|
|
35
37
|
):
|
|
36
38
|
"""
|
|
37
39
|
Args:
|
|
@@ -50,6 +52,9 @@ class RBLNCosmosTransformer3DModelConfig(RBLNModelConfig):
|
|
|
50
52
|
Raises:
|
|
51
53
|
ValueError: If batch_size is not a positive integer.
|
|
52
54
|
"""
|
|
55
|
+
if kwargs.get("timeout") is None:
|
|
56
|
+
kwargs["timeout"] = 80
|
|
57
|
+
|
|
53
58
|
super().__init__(**kwargs)
|
|
54
59
|
self.batch_size = batch_size or 1
|
|
55
60
|
self.num_frames = num_frames or 121
|
|
@@ -12,7 +12,7 @@
|
|
|
12
12
|
# See the License for the specific language governing permissions and
|
|
13
13
|
# limitations under the License.
|
|
14
14
|
|
|
15
|
-
from typing import Any,
|
|
15
|
+
from typing import Any, Optional, Tuple, Union
|
|
16
16
|
|
|
17
17
|
from ....configuration_utils import RBLNModelConfig
|
|
18
18
|
|
|
@@ -27,7 +27,7 @@ class RBLNSD3Transformer2DModelConfig(RBLNModelConfig):
|
|
|
27
27
|
batch_size: Optional[int] = None,
|
|
28
28
|
sample_size: Optional[Union[int, Tuple[int, int]]] = None,
|
|
29
29
|
prompt_embed_length: Optional[int] = None,
|
|
30
|
-
**kwargs:
|
|
30
|
+
**kwargs: Any,
|
|
31
31
|
):
|
|
32
32
|
"""
|
|
33
33
|
Args:
|
|
@@ -12,7 +12,7 @@
|
|
|
12
12
|
# See the License for the specific language governing permissions and
|
|
13
13
|
# limitations under the License.
|
|
14
14
|
|
|
15
|
-
from typing import Any,
|
|
15
|
+
from typing import Any, Optional, Tuple
|
|
16
16
|
|
|
17
17
|
from ....configuration_utils import RBLNModelConfig
|
|
18
18
|
|
|
@@ -38,7 +38,7 @@ class RBLNUNet2DConditionModelConfig(RBLNModelConfig):
|
|
|
38
38
|
in_features: Optional[int] = None,
|
|
39
39
|
text_model_hidden_size: Optional[int] = None,
|
|
40
40
|
image_model_hidden_size: Optional[int] = None,
|
|
41
|
-
**kwargs:
|
|
41
|
+
**kwargs: Any,
|
|
42
42
|
):
|
|
43
43
|
"""
|
|
44
44
|
Args:
|
|
@@ -12,7 +12,7 @@
|
|
|
12
12
|
# See the License for the specific language governing permissions and
|
|
13
13
|
# limitations under the License.
|
|
14
14
|
|
|
15
|
-
from typing import Any,
|
|
15
|
+
from typing import Any, Optional, Tuple
|
|
16
16
|
|
|
17
17
|
from ....configuration_utils import RBLNModelConfig
|
|
18
18
|
|
|
@@ -33,7 +33,7 @@ class RBLNVQModelConfig(RBLNModelConfig):
|
|
|
33
33
|
vqmodel_scale_factor: Optional[float] = None, # TODO: rename to scaling_factor
|
|
34
34
|
in_channels: Optional[int] = None,
|
|
35
35
|
latent_channels: Optional[int] = None,
|
|
36
|
-
**kwargs:
|
|
36
|
+
**kwargs: Any,
|
|
37
37
|
):
|
|
38
38
|
"""
|
|
39
39
|
Args:
|