optimum-rbln 0.8.2a1__tar.gz → 0.8.2a2__tar.gz

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of optimum-rbln might be problematic. Click here for more details.

Files changed (286)
  1. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/PKG-INFO +1 -1
  2. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/__init__.py +8 -0
  3. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/__version__.py +2 -2
  4. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/configuration_utils.py +16 -1
  5. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/models/configuration_transformer_cosmos.py +3 -0
  6. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/modeling_diffusers.py +1 -0
  7. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/autoencoders/autoencoder_kl.py +1 -0
  8. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/autoencoders/autoencoder_kl_cosmos.py +1 -0
  9. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/autoencoders/vq_model.py +1 -0
  10. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/transformers/transformer_cosmos.py +1 -1
  11. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/cosmos/configuration_cosmos_guardrail.py +10 -2
  12. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/cosmos/cosmos_guardrail.py +4 -30
  13. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/modeling.py +1 -0
  14. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/__init__.py +8 -0
  15. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/__init__.py +2 -0
  16. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +7 -0
  17. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/gemma3/modeling_gemma3.py +3 -0
  18. optimum_rbln-0.8.2a2/src/optimum/rbln/transformers/models/qwen3/__init__.py +16 -0
  19. optimum_rbln-0.8.2a2/src/optimum/rbln/transformers/models/qwen3/configuration_qwen3.py +71 -0
  20. optimum_rbln-0.8.2a2/src/optimum/rbln/transformers/models/qwen3/modeling_qwen3.py +377 -0
  21. optimum_rbln-0.8.2a2/src/optimum/rbln/transformers/models/qwen3/qwen3_architecture.py +275 -0
  22. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py +2 -0
  23. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/time_series_transformer/modeling_time_series_transformer.py +2 -0
  24. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/whisper/modeling_whisper.py +2 -0
  25. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/utils/runtime_utils.py +28 -2
  26. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/tests/test_llm.py +8 -0
  27. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
  28. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/ISSUE_TEMPLATE/config.yml +0 -0
  29. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
  30. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/ISSUE_TEMPLATE/model_request.md +0 -0
  31. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/pull_request_template.md +0 -0
  32. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/scripts/auto_code_review.py +0 -0
  33. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/scripts/validate_docstrings.py +0 -0
  34. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/scripts/validate_pr_checklist.py +0 -0
  35. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/version.yaml +0 -0
  36. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/auto_code_review.yml +0 -0
  37. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/check_code_quality.yml +0 -0
  38. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/deploy-on-tag.yaml +0 -0
  39. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/deploy.yaml +0 -0
  40. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/pr-title-check.yaml +0 -0
  41. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/pr_checklist_validator.yml +0 -0
  42. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/rbln_check_compiler.yaml +0 -0
  43. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/rbln_dispatch_pytest.yaml +0 -0
  44. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/rbln_optimum_inference_test.yaml +0 -0
  45. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/rbln_optimum_pytest.yaml +0 -0
  46. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/rbln_scheduled_test.yaml +0 -0
  47. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/rbln_trigger_on_pr.yaml +0 -0
  48. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.github/workflows/test-docstrings.yml +0 -0
  49. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/.gitignore +0 -0
  50. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/CODE_OF_CONDUCT.md +0 -0
  51. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/CONTRIBUTING.md +0 -0
  52. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/LICENSE +0 -0
  53. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/README.md +0 -0
  54. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/assets/rbln_logo.png +0 -0
  55. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/advanced/custom_class.py +0 -0
  56. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/audio-classification/run_ast_audio_classification.py +0 -0
  57. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/depth-estimation/run_dpt.py +0 -0
  58. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/image-classification/run_image_classification.py +0 -0
  59. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/image-classification/run_vit_image_classification.py +0 -0
  60. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/image-to-text/run_idefics3.py +0 -0
  61. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/image-to-text/run_llava_next_image_to_text.py +0 -0
  62. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/kandinsky2_2/run_kandinsky2_2.py +0 -0
  63. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/kandinsky2_2/run_kandinsky2_2_combined.py +0 -0
  64. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/kandinsky2_2/run_kandinsky2_2_img2img.py +0 -0
  65. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/kandinsky2_2/run_kandinsky2_2_img2img_combined.py +0 -0
  66. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/kandinsky2_2/run_kandinsky2_2_inpaint.py +0 -0
  67. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/kandinsky2_2/run_kandinsky2_2_inpaint_combined.py +0 -0
  68. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/kandinsky2_2/run_kandinsky2_2_prior_interpolate.py +0 -0
  69. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/question-answering/run_question_answering.py +0 -0
  70. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/speech-recognition/run_wav2vec2.py +0 -0
  71. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/speech-recognition/run_whisper.py +0 -0
  72. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/stable-diffusion/run_stable_diffusion.py +0 -0
  73. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/stable-diffusion/run_stable_diffusion_controlnet.py +0 -0
  74. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/stable-diffusion/run_stable_diffusion_img2img.py +0 -0
  75. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/stable-diffusion/run_stable_diffusion_img2img_controlnet.py +0 -0
  76. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/stable-diffusion/run_stable_diffusion_inpaint.py +0 -0
  77. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/stable-diffusion/run_stable_diffusion_lora.py +0 -0
  78. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/stable-diffusion/run_stable_diffusion_multicontrolnet.py +0 -0
  79. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/text-classification/run_bge_m3_text_classification.py +0 -0
  80. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/text-classification/run_bge_reranker_v2_m3_text_classification.py +0 -0
  81. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/text-classification/run_secureBERT.py +0 -0
  82. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/text-classification/run_t5_classification.py +0 -0
  83. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/text-classification/run_twitter_roberta_text_classification.py +0 -0
  84. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/text2text-generation/run_bart_text2text_generation.py +0 -0
  85. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/text2text-generation/run_llama_peft.py +0 -0
  86. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/text2text-generation/run_llama_text2text_generation.py +0 -0
  87. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/examples/time-series-forecasting/run_time_series_forecasting.py +0 -0
  88. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/pyproject.toml +0 -0
  89. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/scripts/uv-lock.sh +0 -0
  90. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/scripts/uv-sync.sh +0 -0
  91. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/__init__.py +0 -0
  92. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/__init__.py +0 -0
  93. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/models/__init__.py +0 -0
  94. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/models/configuration_autoencoder_kl.py +0 -0
  95. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/models/configuration_autoencoder_kl_cosmos.py +0 -0
  96. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/models/configuration_controlnet.py +0 -0
  97. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/models/configuration_prior_transformer.py +0 -0
  98. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/models/configuration_transformer_sd3.py +0 -0
  99. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/models/configuration_unet_2d_condition.py +0 -0
  100. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/models/configuration_vq_model.py +0 -0
  101. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/pipelines/__init__.py +0 -0
  102. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_controlnet.py +0 -0
  103. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_cosmos.py +0 -0
  104. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_kandinsky2_2.py +0 -0
  105. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion.py +0 -0
  106. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_3.py +0 -0
  107. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_xl.py +0 -0
  108. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/__init__.py +0 -0
  109. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/autoencoders/__init__.py +0 -0
  110. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/autoencoders/vae.py +0 -0
  111. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/controlnet.py +0 -0
  112. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/transformers/__init__.py +0 -0
  113. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/transformers/prior_transformer.py +0 -0
  114. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/transformers/transformer_sd3.py +0 -0
  115. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/unets/__init__.py +0 -0
  116. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/models/unets/unet_2d_condition.py +0 -0
  117. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/__init__.py +0 -0
  118. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/controlnet/__init__.py +0 -0
  119. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py +0 -0
  120. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py +0 -0
  121. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +0 -0
  122. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +0 -0
  123. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +0 -0
  124. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/cosmos/__init__.py +0 -0
  125. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/cosmos/pipeline_cosmos_text2world.py +0 -0
  126. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/cosmos/pipeline_cosmos_video2world.py +0 -0
  127. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/__init__.py +0 -0
  128. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2.py +0 -0
  129. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_combined.py +0 -0
  130. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_img2img.py +0 -0
  131. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_inpaint.py +0 -0
  132. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_prior.py +0 -0
  133. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/__init__.py +0 -0
  134. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py +0 -0
  135. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py +0 -0
  136. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_inpaint.py +0 -0
  137. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/__init__.py +0 -0
  138. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py +0 -0
  139. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py +0 -0
  140. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py +0 -0
  141. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/__init__.py +0 -0
  142. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py +0 -0
  143. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py +0 -0
  144. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py +0 -0
  145. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/modeling_base.py +0 -0
  146. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/ops/__init__.py +0 -0
  147. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/ops/attn.py +0 -0
  148. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/ops/flash_attn.py +0 -0
  149. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/ops/kv_cache_update.py +0 -0
  150. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/ops/linear.py +0 -0
  151. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/ops/sliding_window_attn.py +0 -0
  152. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/configuration_generic.py +0 -0
  153. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/modeling_generic.py +0 -0
  154. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/modeling_rope_utils.py +0 -0
  155. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/audio_spectrogram_transformer/__init__.py +0 -0
  156. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/audio_spectrogram_transformer/configuration_audio_spectrogram_transformer.py +0 -0
  157. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/audio_spectrogram_transformer/modeling_audio_spectrogram_transformer.py +0 -0
  158. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/auto/__init__.py +0 -0
  159. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/auto/auto_factory.py +0 -0
  160. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/auto/modeling_auto.py +0 -0
  161. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/bart/__init__.py +0 -0
  162. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/bart/bart_architecture.py +0 -0
  163. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/bart/configuration_bart.py +0 -0
  164. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/bart/modeling_bart.py +0 -0
  165. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/bert/__init__.py +0 -0
  166. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/bert/configuration_bert.py +0 -0
  167. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/bert/modeling_bert.py +0 -0
  168. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/blip_2/__init__.py +0 -0
  169. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/blip_2/configuration_blip_2.py +0 -0
  170. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/blip_2/modeling_blip_2.py +0 -0
  171. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/clip/__init__.py +0 -0
  172. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/clip/configuration_clip.py +0 -0
  173. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/clip/modeling_clip.py +0 -0
  174. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/colpali/__init__.py +0 -0
  175. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/colpali/colpali_architecture.py +0 -0
  176. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/colpali/configuration_colpali.py +0 -0
  177. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/colpali/modeling_colpali.py +0 -0
  178. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/decoderonly/__init__.py +0 -0
  179. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py +0 -0
  180. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py +0 -0
  181. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/distilbert/__init__.py +0 -0
  182. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/distilbert/configuration_distilbert.py +0 -0
  183. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/distilbert/modeling_distilbert.py +0 -0
  184. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/dpt/__init__.py +0 -0
  185. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/dpt/configuration_dpt.py +0 -0
  186. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/dpt/modeling_dpt.py +0 -0
  187. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/exaone/__init__.py +0 -0
  188. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/exaone/configuration_exaone.py +0 -0
  189. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/exaone/exaone_architecture.py +0 -0
  190. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/exaone/modeling_exaone.py +0 -0
  191. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/gemma/__init__.py +0 -0
  192. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/gemma/configuration_gemma.py +0 -0
  193. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/gemma/gemma_architecture.py +0 -0
  194. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/gemma/modeling_gemma.py +0 -0
  195. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/gemma3/__init__.py +0 -0
  196. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/gemma3/configuration_gemma3.py +0 -0
  197. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/gemma3/gemma3_architecture.py +0 -0
  198. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/gpt2/__init__.py +0 -0
  199. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/gpt2/configuration_gpt2.py +0 -0
  200. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/gpt2/gpt2_architecture.py +0 -0
  201. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/gpt2/modeling_gpt2.py +0 -0
  202. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/idefics3/__init__.py +0 -0
  203. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/idefics3/configuration_idefics3.py +0 -0
  204. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/idefics3/modeling_idefics3.py +0 -0
  205. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/llama/__init__.py +0 -0
  206. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/llama/configuration_llama.py +0 -0
  207. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/llama/llama_architecture.py +0 -0
  208. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/llama/modeling_llama.py +0 -0
  209. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/llava_next/__init__.py +0 -0
  210. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/llava_next/configuration_llava_next.py +0 -0
  211. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/llava_next/modeling_llava_next.py +0 -0
  212. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/midm/__init__.py +0 -0
  213. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/midm/configuration_midm.py +0 -0
  214. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/midm/midm_architecture.py +0 -0
  215. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/midm/modeling_midm.py +0 -0
  216. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/mistral/__init__.py +0 -0
  217. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/mistral/configuration_mistral.py +0 -0
  218. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/mistral/mistral_architecture.py +0 -0
  219. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/mistral/modeling_mistral.py +0 -0
  220. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/opt/__init__.py +0 -0
  221. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/opt/configuration_opt.py +0 -0
  222. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/opt/modeling_opt.py +0 -0
  223. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/opt/opt_architecture.py +0 -0
  224. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/phi/__init__.py +0 -0
  225. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/phi/configuration_phi.py +0 -0
  226. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/phi/modeling_phi.py +0 -0
  227. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/phi/phi_architecture.py +0 -0
  228. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/qwen2/__init__.py +0 -0
  229. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/qwen2/configuration_qwen2.py +0 -0
  230. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/qwen2/modeling_qwen2.py +0 -0
  231. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/qwen2/qwen2_architecture.py +0 -0
  232. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/qwen2_5_vl/__init__.py +0 -0
  233. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py +0 -0
  234. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py +0 -0
  235. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py +0 -0
  236. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/resnet/__init__.py +0 -0
  237. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/resnet/configuration_resnet.py +0 -0
  238. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/resnet/modeling_resnet.py +0 -0
  239. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/roberta/__init__.py +0 -0
  240. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/roberta/configuration_roberta.py +0 -0
  241. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/roberta/modeling_roberta.py +0 -0
  242. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/seq2seq/__init__.py +0 -0
  243. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/seq2seq/configuration_seq2seq.py +0 -0
  244. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py +0 -0
  245. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/siglip/__init__.py +0 -0
  246. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/siglip/configuration_siglip.py +0 -0
  247. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/siglip/modeling_siglip.py +0 -0
  248. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/t5/__init__.py +0 -0
  249. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/t5/configuration_t5.py +0 -0
  250. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/t5/modeling_t5.py +0 -0
  251. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/t5/t5_architecture.py +0 -0
  252. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/time_series_transformer/__init__.py +0 -0
  253. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/time_series_transformer/configuration_time_series_transformer.py +0 -0
  254. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/time_series_transformer/time_series_transformers_architecture.py +0 -0
  255. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/vit/__init__.py +0 -0
  256. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/vit/configuration_vit.py +0 -0
  257. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/vit/modeling_vit.py +0 -0
  258. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/wav2vec2/__init__.py +0 -0
  259. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/wav2vec2/configuration_wav2vec2.py +0 -0
  260. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py +0 -0
  261. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/whisper/__init__.py +0 -0
  262. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/whisper/configuration_whisper.py +0 -0
  263. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/whisper/generation_whisper.py +0 -0
  264. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/whisper/whisper_architecture.py +0 -0
  265. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/xlm_roberta/__init__.py +0 -0
  266. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/xlm_roberta/configuration_xlm_roberta.py +0 -0
  267. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py +0 -0
  268. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/utils/__init__.py +0 -0
  269. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/transformers/utils/rbln_quantization.py +0 -0
  270. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/utils/__init__.py +0 -0
  271. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/utils/decorator_utils.py +0 -0
  272. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/utils/hub.py +0 -0
  273. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/utils/import_utils.py +0 -0
  274. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/utils/logging.py +0 -0
  275. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/utils/model_utils.py +0 -0
  276. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/utils/save_utils.py +0 -0
  277. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/src/optimum/rbln/utils/submodule.py +0 -0
  278. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/tests/__init__.py +0 -0
  279. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/tests/psnr.py +0 -0
  280. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/tests/requirements_sdxl.txt +0 -0
  281. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/tests/run_stable_diffusion_xl_base.py +0 -0
  282. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/tests/test_base.py +0 -0
  283. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/tests/test_config.py +0 -0
  284. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/tests/test_diffusers.py +0 -0
  285. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/tests/test_transformers.py +0 -0
  286. {optimum_rbln-0.8.2a1 → optimum_rbln-0.8.2a2}/uv.lock +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: optimum-rbln
3
- Version: 0.8.2a1
3
+ Version: 0.8.2a2
4
4
  Summary: Optimum RBLN is the interface between the HuggingFace Transformers and Diffusers libraries and RBLN accelerators. It provides a set of tools enabling easy model loading and inference on single and multiple rbln device settings for different downstream tasks.
5
5
  Project-URL: Homepage, https://rebellions.ai
6
6
  Project-URL: Documentation, https://docs.rbln.ai
@@ -110,6 +110,10 @@ _import_structure = {
110
110
  "RBLNQwen2_5_VisionTransformerPretrainedModelConfig",
111
111
  "RBLNQwen2_5_VLForConditionalGeneration",
112
112
  "RBLNQwen2_5_VLForConditionalGenerationConfig",
113
+ "RBLNQwen3ForCausalLM",
114
+ "RBLNQwen3ForCausalLMConfig",
115
+ "RBLNQwen3Model",
116
+ "RBLNQwen3ModelConfig",
113
117
  "RBLNResNetForImageClassification",
114
118
  "RBLNResNetForImageClassificationConfig",
115
119
  "RBLNRobertaForMaskedLM",
@@ -357,6 +361,10 @@ if TYPE_CHECKING:
357
361
  RBLNQwen2_5_VLForConditionalGenerationConfig,
358
362
  RBLNQwen2ForCausalLM,
359
363
  RBLNQwen2ForCausalLMConfig,
364
+ RBLNQwen3ForCausalLM,
365
+ RBLNQwen3ForCausalLMConfig,
366
+ RBLNQwen3Model,
367
+ RBLNQwen3ModelConfig,
360
368
  RBLNResNetForImageClassification,
361
369
  RBLNResNetForImageClassificationConfig,
362
370
  RBLNRobertaForMaskedLM,
@@ -17,5 +17,5 @@ __version__: str
17
17
  __version_tuple__: VERSION_TUPLE
18
18
  version_tuple: VERSION_TUPLE
19
19
 
20
- __version__ = version = '0.8.2a1'
21
- __version_tuple__ = version_tuple = (0, 8, 2, 'a1')
20
+ __version__ = version = '0.8.2a2'
21
+ __version_tuple__ = version_tuple = (0, 8, 2, 'a2')
@@ -147,7 +147,7 @@ class RBLNCompileConfig:
147
147
  return asdict(self)
148
148
 
149
149
 
150
- RUNTIME_KEYWORDS = ["create_runtimes", "optimize_host_memory", "device", "device_map", "activate_profiler"]
150
+ RUNTIME_KEYWORDS = ["create_runtimes", "optimize_host_memory", "device", "device_map", "activate_profiler", "timeout"]
151
151
  CONFIG_MAPPING: Dict[str, Type["RBLNModelConfig"]] = {}
152
152
 
153
153
 
@@ -481,6 +481,7 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
481
481
  "device",
482
482
  "device_map",
483
483
  "activate_profiler",
484
+ "timeout",
484
485
  ]
485
486
  submodules: List[str] = []
486
487
  subclass_non_save_attributes = []
@@ -561,6 +562,7 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
561
562
  activate_profiler: Optional[bool] = None,
562
563
  npu: Optional[str] = None,
563
564
  tensor_parallel_size: Optional[int] = None,
565
+ timeout: Optional[int] = None,
564
566
  optimum_rbln_version: Optional[str] = None,
565
567
  _compile_cfgs: List[RBLNCompileConfig] = [],
566
568
  **kwargs: Dict[str, Any],
@@ -577,6 +579,7 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
577
579
  activate_profiler (Optional[bool]): Whether to activate the profiler for performance analysis.
578
580
  npu (Optional[str]): The NPU device name to use for compilation.
579
581
  tensor_parallel_size (Optional[int]): Size for tensor parallelism to distribute the model across devices.
582
+ timeout (Optional[int]): The timeout for the runtime in seconds. If it isn't provided, it will be set to 60 by default.
580
583
  optimum_rbln_version (Optional[str]): The optimum-rbln version used for this configuration.
581
584
  _compile_cfgs (List[RBLNCompileConfig]): List of compilation configurations for the model.
582
585
  **kwargs: Additional keyword arguments.
@@ -599,6 +602,7 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
599
602
  self._runtime_options["device"] = device
600
603
  self._runtime_options["device_map"] = device_map
601
604
  self._runtime_options["activate_profiler"] = activate_profiler
605
+ self._runtime_options["timeout"] = timeout
602
606
 
603
607
  # Automatically pass npu, tensor_parallel_size to compile_cfgs
604
608
  self.npu = npu
@@ -838,3 +842,14 @@ class RBLNModelConfig(RBLNSerializableConfigProtocol):
838
842
  @activate_profiler.setter
839
843
  def activate_profiler(self, activate_profiler: bool):
840
844
  self._runtime_options["activate_profiler"] = activate_profiler
845
+
846
+ @property
847
+ def timeout(self):
848
+ context = ContextRblnConfig.get_current_context()["timeout"]
849
+ if context is not None:
850
+ return context
851
+ return self._runtime_options["timeout"]
852
+
853
+ @timeout.setter
854
+ def timeout(self, timeout: int):
855
+ self._runtime_options["timeout"] = timeout
@@ -52,6 +52,9 @@ class RBLNCosmosTransformer3DModelConfig(RBLNModelConfig):
52
52
  Raises:
53
53
  ValueError: If batch_size is not a positive integer.
54
54
  """
55
+ if kwargs.get("timeout") is None:
56
+ kwargs["timeout"] = 80
57
+
55
58
  super().__init__(**kwargs)
56
59
  self.batch_size = batch_size or 1
57
60
  self.num_frames = num_frames or 121
@@ -230,6 +230,7 @@ class RBLNDiffusionMixin:
230
230
  create_runtimes=rbln_config.create_runtimes,
231
231
  optimize_host_mem=rbln_config.optimize_host_memory,
232
232
  activate_profiler=rbln_config.activate_profiler,
233
+ timeout=rbln_config.timeout,
233
234
  ):
234
235
  model = super().from_pretrained(pretrained_model_name_or_path=model_id, **kwargs)
235
236
 
@@ -209,6 +209,7 @@ class RBLNAutoencoderKL(RBLNModel):
209
209
  tensor_type="pt",
210
210
  device=device_val,
211
211
  activate_profiler=rbln_config.activate_profiler,
212
+ timeout=rbln_config.timeout,
212
213
  )
213
214
  for compiled_model, device_val in zip(compiled_models, device_vals)
214
215
  ]
@@ -200,6 +200,7 @@ class RBLNAutoencoderKLCosmos(RBLNModel):
200
200
  tensor_type="pt",
201
201
  device=device_val,
202
202
  activate_profiler=rbln_config.activate_profiler,
203
+ timeout=rbln_config.timeout,
203
204
  )
204
205
  for compiled_model, device_val in zip(compiled_models, device_vals)
205
206
  ]
@@ -165,6 +165,7 @@ class RBLNVQModel(RBLNModel):
165
165
  tensor_type="pt",
166
166
  device=device_val,
167
167
  activate_profiler=rbln_config.activate_profiler,
168
+ timeout=rbln_config.timeout,
168
169
  )
169
170
  for compiled_model, device_val in zip(compiled_models, device_vals)
170
171
  ]
@@ -279,7 +279,7 @@ class RBLNCosmosTransformer3DModel(RBLNModel):
279
279
  tensor_type="pt",
280
280
  device=rbln_config.device_map[DEFAULT_COMPILED_MODEL_NAME],
281
281
  activate_profiler=rbln_config.activate_profiler,
282
- timeout=120,
282
+ timeout=rbln_config.timeout,
283
283
  )
284
284
  for compiled_model in compiled_models
285
285
  ]
@@ -15,7 +15,7 @@
15
15
  from typing import Any, Dict, Optional, Tuple
16
16
 
17
17
  from ....configuration_utils import RBLNAutoConfig, RBLNModelConfig
18
- from ....transformers import RBLNSiglipVisionModelConfig
18
+ from ....transformers import RBLNLlamaForCausalLMConfig, RBLNSiglipVisionModelConfig
19
19
 
20
20
 
21
21
  class RBLNVideoSafetyModelConfig(RBLNModelConfig):
@@ -75,7 +75,15 @@ class RBLNCosmosSafetyCheckerConfig(RBLNModelConfig):
75
75
  if height is not None and width is not None:
76
76
  image_size = (height, width)
77
77
 
78
- self.aegis = self.init_submodule_config(RBLNModelConfig, aegis)
78
+ tensor_parallel_size = kwargs.get("tensor_parallel_size")
79
+
80
+ self.aegis = self.init_submodule_config(
81
+ RBLNLlamaForCausalLMConfig,
82
+ aegis,
83
+ batch_size=batch_size,
84
+ tensor_parallel_size=tensor_parallel_size,
85
+ )
86
+
79
87
  self.siglip_encoder = self.init_submodule_config(
80
88
  RBLNSiglipVisionModelConfig,
81
89
  siglip_encoder,
@@ -127,25 +127,13 @@ class RBLNSigLIPEncoder(SigLIPEncoder):
127
127
 
128
128
  # We don't use RBLNSiglipModel, but we need to override get_image_features to return pooler_output
129
129
  self.model = RBLNSiglipVisionModel.from_pretrained(
130
- self.checkpoint_dir,
131
- rbln_device=rbln_config.siglip_encoder.device,
132
- rbln_create_runtimes=rbln_config.siglip_encoder.create_runtimes,
133
- rbln_activate_profiler=rbln_config.siglip_encoder.activate_profiler,
134
- rbln_optimize_host_memory=rbln_config.siglip_encoder.optimize_host_memory,
130
+ self.checkpoint_dir, rbln_config=rbln_config.siglip_encoder
135
131
  )
136
132
  else:
137
133
  super().__init__(model_name, checkpoint_id)
138
134
  model = self.model
139
135
  del self.model
140
- self.model = RBLNSiglipVisionModel.from_model(
141
- model,
142
- rbln_device=rbln_config.siglip_encoder.device,
143
- rbln_image_size=rbln_config.siglip_encoder.image_size,
144
- rbln_npu=rbln_config.siglip_encoder.npu,
145
- rbln_create_runtimes=rbln_config.siglip_encoder.create_runtimes,
146
- rbln_activate_profiler=rbln_config.siglip_encoder.activate_profiler,
147
- rbln_optimize_host_memory=rbln_config.siglip_encoder.optimize_host_memory,
148
- )
136
+ self.model = RBLNSiglipVisionModel.from_model(model, rbln_config=rbln_config.siglip_encoder)
149
137
  self.rbln_config = rbln_config
150
138
 
151
139
  # Override get_image_features to return pooler_output
@@ -336,28 +324,14 @@ class RBLNAegis(Aegis):
336
324
  torch.nn.Module.__init__(self)
337
325
  cache_dir = pathlib.Path(checkpoint_id) / "aegis"
338
326
  self.tokenizer = AutoTokenizer.from_pretrained(cache_dir)
339
- self.model = RBLNAutoModelForCausalLM.from_pretrained(
340
- cache_dir,
341
- rbln_device=rbln_config.aegis.device,
342
- rbln_create_runtimes=rbln_config.aegis.create_runtimes,
343
- rbln_activate_profiler=rbln_config.aegis.activate_profiler,
344
- rbln_optimize_host_memory=rbln_config.aegis.optimize_host_memory,
345
- )
327
+ self.model = RBLNAutoModelForCausalLM.from_pretrained(cache_dir, rbln_config=rbln_config.aegis)
346
328
 
347
329
  else:
348
330
  super().__init__(checkpoint_id, base_model_id, aegis_adapter)
349
331
  model = self.model.merge_and_unload() # peft merge
350
332
  del self.model
351
333
 
352
- self.model = RBLNAutoModelForCausalLM.from_model(
353
- model,
354
- rbln_tensor_parallel_size=4,
355
- rbln_device=rbln_config.aegis.device,
356
- rbln_create_runtimes=rbln_config.aegis.create_runtimes,
357
- rbln_npu=rbln_config.aegis.npu,
358
- rbln_activate_profiler=rbln_config.aegis.activate_profiler,
359
- rbln_optimize_host_memory=rbln_config.aegis.optimize_host_memory,
360
- )
334
+ self.model = RBLNAutoModelForCausalLM.from_model(model, rbln_config=rbln_config.aegis)
361
335
 
362
336
  self.rbln_config = rbln_config
363
337
  self.dtype = torch.bfloat16
@@ -238,6 +238,7 @@ class RBLNModel(RBLNBaseModel):
238
238
  tensor_type="pt",
239
239
  device=rbln_config.device_map[DEFAULT_COMPILED_MODEL_NAME],
240
240
  activate_profiler=rbln_config.activate_profiler,
241
+ timeout=rbln_config.timeout,
241
242
  )
242
243
  for compiled_model in compiled_models
243
244
  ]
@@ -98,6 +98,10 @@ _import_structure = {
98
98
  "RBLNQwen2_5_VLForConditionalGenerationConfig",
99
99
  "RBLNQwen2ForCausalLM",
100
100
  "RBLNQwen2ForCausalLMConfig",
101
+ "RBLNQwen3ForCausalLM",
102
+ "RBLNQwen3ForCausalLMConfig",
103
+ "RBLNQwen3Model",
104
+ "RBLNQwen3ModelConfig",
101
105
  "RBLNResNetForImageClassification",
102
106
  "RBLNResNetForImageClassificationConfig",
103
107
  "RBLNRobertaForMaskedLM",
@@ -204,6 +208,10 @@ if TYPE_CHECKING:
204
208
  RBLNQwen2_5_VLForConditionalGenerationConfig,
205
209
  RBLNQwen2ForCausalLM,
206
210
  RBLNQwen2ForCausalLMConfig,
211
+ RBLNQwen3ForCausalLM,
212
+ RBLNQwen3ForCausalLMConfig,
213
+ RBLNQwen3Model,
214
+ RBLNQwen3ModelConfig,
207
215
  RBLNResNetForImageClassification,
208
216
  RBLNResNetForImageClassificationConfig,
209
217
  RBLNRobertaForMaskedLM,
@@ -113,6 +113,7 @@ _import_structure = {
113
113
  "mistral": ["RBLNMistralForCausalLM", "RBLNMistralForCausalLMConfig"],
114
114
  "phi": ["RBLNPhiForCausalLM", "RBLNPhiForCausalLMConfig"],
115
115
  "qwen2": ["RBLNQwen2ForCausalLM", "RBLNQwen2ForCausalLMConfig"],
116
+ "qwen3": ["RBLNQwen3ForCausalLM", "RBLNQwen3ForCausalLMConfig", "RBLNQwen3Model", "RBLNQwen3ModelConfig"],
116
117
  "resnet": ["RBLNResNetForImageClassification", "RBLNResNetForImageClassificationConfig"],
117
118
  "roberta": [
118
119
  "RBLNRobertaForMaskedLM",
@@ -241,6 +242,7 @@ if TYPE_CHECKING:
241
242
  RBLNQwen2_5_VLForConditionalGeneration,
242
243
  RBLNQwen2_5_VLForConditionalGenerationConfig,
243
244
  )
245
+ from .qwen3 import RBLNQwen3ForCausalLM, RBLNQwen3ForCausalLMConfig, RBLNQwen3Model, RBLNQwen3ModelConfig
244
246
  from .resnet import RBLNResNetForImageClassification, RBLNResNetForImageClassificationConfig
245
247
  from .roberta import (
246
248
  RBLNRobertaForMaskedLM,
@@ -1085,6 +1085,7 @@ class RBLNDecoderOnlyModelForCausalLM(RBLNModel):
1085
1085
  tensor_type="pt",
1086
1086
  device=rbln_config.device_map["prefill"],
1087
1087
  activate_profiler=rbln_config.activate_profiler,
1088
+ timeout=rbln_config.timeout,
1088
1089
  ),
1089
1090
  *[
1090
1091
  rebel.Runtime(
@@ -1092,6 +1093,7 @@ class RBLNDecoderOnlyModelForCausalLM(RBLNModel):
1092
1093
  tensor_type="pt",
1093
1094
  device=rbln_config.device_map[f"decoder_batch_{batch_size}"],
1094
1095
  activate_profiler=rbln_config.activate_profiler,
1096
+ timeout=rbln_config.timeout,
1095
1097
  )
1096
1098
  for i, batch_size in enumerate(rbln_config.decoder_batch_sizes)
1097
1099
  ],
@@ -1190,6 +1192,11 @@ class RBLNDecoderOnlyModelForCausalLM(RBLNModel):
1190
1192
  if cache_position is None:
1191
1193
  logits = []
1192
1194
  inputs = inputs_embeds if inputs_embeds is not None else input_ids
1195
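+ # When forward() is called directly (not via generate()), fill in generate_idx and padded_cache_lengths if they are missing.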
1196
+ if generate_idx is None:
1197
+ generate_idx = attention_mask.sum(dim=-1, keepdim=True).int()
1198
+ if padded_cache_lengths is None:
1199
+ padded_cache_lengths = torch.zeros_like(generate_idx)
1193
1200
  batch_size = inputs.shape[0]
1194
1201
  for b_idx in range(batch_size):
1195
1202
  cache_position = torch.arange(0, generate_idx[b_idx].item(), dtype=torch.int32).unsqueeze(0)
@@ -884,12 +884,14 @@ class RBLNGemma3ForCausalLM(RBLNDecoderOnlyModelForCausalLM):
884
884
  tensor_type="pt",
885
885
  device=rbln_config.device_map["prefill"],
886
886
  activate_profiler=rbln_config.activate_profiler,
887
+ timeout=rbln_config.timeout,
887
888
  ),
888
889
  rebel.Runtime(
889
890
  compiled_models[1],
890
891
  tensor_type="pt",
891
892
  device=rbln_config.device_map["image_prefill"],
892
893
  activate_profiler=rbln_config.activate_profiler,
894
+ timeout=rbln_config.timeout,
893
895
  ),
894
896
  *[
895
897
  rebel.Runtime(
@@ -897,6 +899,7 @@ class RBLNGemma3ForCausalLM(RBLNDecoderOnlyModelForCausalLM):
897
899
  tensor_type="pt",
898
900
  device=rbln_config.device_map[f"decoder_batch_{batch_size}"],
899
901
  activate_profiler=rbln_config.activate_profiler,
902
+ timeout=rbln_config.timeout,
900
903
  )
901
904
  for i, batch_size in enumerate(rbln_config.decoder_batch_sizes)
902
905
  ],
@@ -0,0 +1,16 @@
1
+ # Copyright 2025 Rebellions Inc. All rights reserved.
2
+
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at:
6
+
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ from .configuration_qwen3 import RBLNQwen3ForCausalLMConfig, RBLNQwen3ModelConfig
16
+ from .modeling_qwen3 import RBLNQwen3ForCausalLM, RBLNQwen3Model
@@ -0,0 +1,71 @@
1
+ # Copyright 2025 Rebellions Inc. All rights reserved.
2
+
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at:
6
+
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ from ..decoderonly.configuration_decoderonly import RBLNDecoderOnlyModelForCausalLMConfig
16
+
17
+
18
+ class RBLNQwen3ForCausalLMConfig(RBLNDecoderOnlyModelForCausalLMConfig):
19
+ """
20
+ Configuration class for RBLN Qwen3 causal language models (used with RBLNQwen3ForCausalLM).
21
+
22
+ This class is a plain subclass of RBLNDecoderOnlyModelForCausalLMConfig; it adds no options of its own.
23
+
24
+ Example usage:
25
+ ```python
26
+ from optimum.rbln import RBLNQwen3ForCausalLM, RBLNQwen3ForCausalLMConfig
27
+
28
+ # Create a configuration object
29
+ config = RBLNQwen3ForCausalLMConfig(
30
+ batch_size=1,
31
+ max_seq_len=40960,
32
+ tensor_parallel_size=4,
33
+ kvcache_partition_len=16384
34
+ )
35
+
36
+ # Use the configuration with from_pretrained
37
+ model = RBLNQwen3ForCausalLM.from_pretrained(
38
+ "Qwen/Qwen3-4B",
39
+ export=True,
40
+ rbln_config=config
41
+ )
42
+ ```
43
+ """
44
+
45
+
46
+ class RBLNQwen3ModelConfig(RBLNDecoderOnlyModelForCausalLMConfig):
47
+ """
48
+ Configuration class for the RBLN Qwen3 model used with RBLNQwen3Model.
49
+
50
+ This class is a plain subclass of RBLNDecoderOnlyModelForCausalLMConfig; it adds no options of its own.
51
+
52
+ Example usage:
53
+ ```python
54
+ from optimum.rbln import RBLNQwen3Model, RBLNQwen3ModelConfig
55
+
56
+ # Create a configuration object
57
+ config = RBLNQwen3ModelConfig(
58
+ batch_size=1,
59
+ max_seq_len=40960,
60
+ tensor_parallel_size=4,
61
+ kvcache_partition_len=16384
62
+ )
63
+
64
+ # Use the configuration with from_pretrained
65
+ model = RBLNQwen3Model.from_pretrained(
66
+ "Qwen/Qwen3-Embedding-4B",
67
+ export=True,
68
+ rbln_config=config
69
+ )
70
+ ```
71
+ """