optimum-rbln 0.8.0__tar.gz → 0.8.1a0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (252)
  1. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/PKG-INFO +1 -1
  2. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/__version__.py +2 -2
  3. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +3 -1
  4. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/tests/test_llm.py +54 -0
  5. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
  6. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/ISSUE_TEMPLATE/config.yml +0 -0
  7. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
  8. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/ISSUE_TEMPLATE/model_request.md +0 -0
  9. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/pull_request_template.md +0 -0
  10. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/scripts/auto_code_review.py +0 -0
  11. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/scripts/validate_pr_checklist.py +0 -0
  12. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/version.yaml +0 -0
  13. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/workflows/auto_code_review.yml +0 -0
  14. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/workflows/check_code_quality.yml +0 -0
  15. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/workflows/deploy-on-tag.yaml +0 -0
  16. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/workflows/deploy.yaml +0 -0
  17. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/workflows/pr-title-check.yaml +0 -0
  18. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/workflows/pr_checklist_validator.yml +0 -0
  19. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/workflows/rbln_check_compiler.yaml +0 -0
  20. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/workflows/rbln_dispatch_pytest.yaml +0 -0
  21. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/workflows/rbln_optimum_inference_test.yaml +0 -0
  22. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/workflows/rbln_optimum_pytest.yaml +0 -0
  23. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/workflows/rbln_scheduled_test.yaml +0 -0
  24. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.github/workflows/rbln_trigger_on_pr.yaml +0 -0
  25. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/.gitignore +0 -0
  26. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/CODE_OF_CONDUCT.md +0 -0
  27. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/CONTRIBUTING.md +0 -0
  28. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/LICENSE +0 -0
  29. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/README.md +0 -0
  30. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/assets/rbln_logo.png +0 -0
  31. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/audio-classification/run_ast_audio_classification.py +0 -0
  32. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/depth-estimation/run_dpt.py +0 -0
  33. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/image-classification/run_image_classification.py +0 -0
  34. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/image-classification/run_vit_image_classification.py +0 -0
  35. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/image-to-text/run_idefics3.py +0 -0
  36. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/image-to-text/run_llava_next_image_to_text.py +0 -0
  37. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/kandinsky2_2/run_kandinsky2_2.py +0 -0
  38. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/kandinsky2_2/run_kandinsky2_2_combined.py +0 -0
  39. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/kandinsky2_2/run_kandinsky2_2_img2img.py +0 -0
  40. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/kandinsky2_2/run_kandinsky2_2_img2img_combined.py +0 -0
  41. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/kandinsky2_2/run_kandinsky2_2_inpaint.py +0 -0
  42. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/kandinsky2_2/run_kandinsky2_2_inpaint_combined.py +0 -0
  43. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/kandinsky2_2/run_kandinsky2_2_prior_interpolate.py +0 -0
  44. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/question-answering/run_question_answering.py +0 -0
  45. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/speech-recognition/run_wav2vec2.py +0 -0
  46. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/speech-recognition/run_whisper.py +0 -0
  47. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/stable-diffusion/run_stable_diffusion.py +0 -0
  48. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/stable-diffusion/run_stable_diffusion_controlnet.py +0 -0
  49. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/stable-diffusion/run_stable_diffusion_img2img.py +0 -0
  50. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/stable-diffusion/run_stable_diffusion_img2img_controlnet.py +0 -0
  51. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/stable-diffusion/run_stable_diffusion_inpaint.py +0 -0
  52. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/stable-diffusion/run_stable_diffusion_lora.py +0 -0
  53. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/stable-diffusion/run_stable_diffusion_multicontrolnet.py +0 -0
  54. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/text-classification/run_bge_m3_text_classification.py +0 -0
  55. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/text-classification/run_bge_reranker_v2_m3_text_classification.py +0 -0
  56. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/text-classification/run_secureBERT.py +0 -0
  57. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/text-classification/run_t5_classification.py +0 -0
  58. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/text-classification/run_twitter_roberta_text_classification.py +0 -0
  59. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/text2text-generation/run_bart_text2text_generation.py +0 -0
  60. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/text2text-generation/run_llama_peft.py +0 -0
  61. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/text2text-generation/run_llama_text2text_generation.py +0 -0
  62. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/examples/time-series-forecasting/run_time_series_forecasting.py +0 -0
  63. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/pyproject.toml +0 -0
  64. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/scripts/uv-lock.sh +0 -0
  65. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/scripts/uv-sync.sh +0 -0
  66. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/__init__.py +0 -0
  67. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/configuration_utils.py +0 -0
  68. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/__init__.py +0 -0
  69. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/__init__.py +0 -0
  70. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/models/__init__.py +0 -0
  71. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/models/configuration_autoencoder_kl.py +0 -0
  72. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/models/configuration_controlnet.py +0 -0
  73. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/models/configuration_prior_transformer.py +0 -0
  74. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/models/configuration_transformer_sd3.py +0 -0
  75. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/models/configuration_unet_2d_condition.py +0 -0
  76. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/models/configuration_vq_model.py +0 -0
  77. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/pipelines/__init__.py +0 -0
  78. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_controlnet.py +0 -0
  79. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_kandinsky2_2.py +0 -0
  80. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion.py +0 -0
  81. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_3.py +0 -0
  82. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_xl.py +0 -0
  83. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/modeling_diffusers.py +0 -0
  84. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/models/__init__.py +0 -0
  85. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/models/autoencoders/__init__.py +0 -0
  86. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/models/autoencoders/autoencoder_kl.py +0 -0
  87. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/models/autoencoders/vae.py +0 -0
  88. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/models/autoencoders/vq_model.py +0 -0
  89. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/models/controlnet.py +0 -0
  90. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/models/transformers/__init__.py +0 -0
  91. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/models/transformers/prior_transformer.py +0 -0
  92. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/models/transformers/transformer_sd3.py +0 -0
  93. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/models/unets/__init__.py +0 -0
  94. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/models/unets/unet_2d_condition.py +0 -0
  95. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/__init__.py +0 -0
  96. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/controlnet/__init__.py +0 -0
  97. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py +0 -0
  98. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py +0 -0
  99. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +0 -0
  100. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +0 -0
  101. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +0 -0
  102. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/__init__.py +0 -0
  103. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2.py +0 -0
  104. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_combined.py +0 -0
  105. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_img2img.py +0 -0
  106. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_inpaint.py +0 -0
  107. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_prior.py +0 -0
  108. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/__init__.py +0 -0
  109. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py +0 -0
  110. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py +0 -0
  111. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_inpaint.py +0 -0
  112. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/__init__.py +0 -0
  113. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py +0 -0
  114. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py +0 -0
  115. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py +0 -0
  116. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/__init__.py +0 -0
  117. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py +0 -0
  118. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py +0 -0
  119. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py +0 -0
  120. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/modeling.py +0 -0
  121. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/modeling_base.py +0 -0
  122. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/ops/__init__.py +0 -0
  123. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/ops/attn.py +0 -0
  124. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/ops/flash_attn.py +0 -0
  125. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/ops/kv_cache_update.py +0 -0
  126. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/ops/linear.py +0 -0
  127. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/ops/sliding_window_attn.py +0 -0
  128. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/__init__.py +0 -0
  129. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/configuration_alias.py +0 -0
  130. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/configuration_generic.py +0 -0
  131. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/modeling_alias.py +0 -0
  132. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/modeling_generic.py +0 -0
  133. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/modeling_rope_utils.py +0 -0
  134. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/__init__.py +0 -0
  135. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/auto/__init__.py +0 -0
  136. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/auto/auto_factory.py +0 -0
  137. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/auto/modeling_auto.py +0 -0
  138. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/bart/__init__.py +0 -0
  139. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/bart/bart_architecture.py +0 -0
  140. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/bart/configuration_bart.py +0 -0
  141. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/bart/modeling_bart.py +0 -0
  142. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/bert/__init__.py +0 -0
  143. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/bert/configuration_bert.py +0 -0
  144. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/bert/modeling_bert.py +0 -0
  145. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/blip_2/__init__.py +0 -0
  146. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/blip_2/configuration_blip_2.py +0 -0
  147. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/blip_2/modeling_blip_2.py +0 -0
  148. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/clip/__init__.py +0 -0
  149. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/clip/configuration_clip.py +0 -0
  150. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/clip/modeling_clip.py +0 -0
  151. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/decoderonly/__init__.py +0 -0
  152. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py +0 -0
  153. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py +0 -0
  154. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/dpt/__init__.py +0 -0
  155. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/dpt/configuration_dpt.py +0 -0
  156. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/dpt/modeling_dpt.py +0 -0
  157. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/exaone/__init__.py +0 -0
  158. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/exaone/configuration_exaone.py +0 -0
  159. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/exaone/exaone_architecture.py +0 -0
  160. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/exaone/modeling_exaone.py +0 -0
  161. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/gemma/__init__.py +0 -0
  162. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/gemma/configuration_gemma.py +0 -0
  163. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/gemma/gemma_architecture.py +0 -0
  164. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/gemma/modeling_gemma.py +0 -0
  165. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/gemma3/__init__.py +0 -0
  166. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/gemma3/configuration_gemma3.py +0 -0
  167. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/gemma3/gemma3_architecture.py +0 -0
  168. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/gemma3/modeling_gemma3.py +0 -0
  169. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/gpt2/__init__.py +0 -0
  170. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/gpt2/configuration_gpt2.py +0 -0
  171. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/gpt2/gpt2_architecture.py +0 -0
  172. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/gpt2/modeling_gpt2.py +0 -0
  173. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/idefics3/__init__.py +0 -0
  174. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/idefics3/configuration_idefics3.py +0 -0
  175. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/idefics3/modeling_idefics3.py +0 -0
  176. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/llama/__init__.py +0 -0
  177. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/llama/configuration_llama.py +0 -0
  178. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/llama/llama_architecture.py +0 -0
  179. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/llama/modeling_llama.py +0 -0
  180. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/llava_next/__init__.py +0 -0
  181. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/llava_next/configuration_llava_next.py +0 -0
  182. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/llava_next/modeling_llava_next.py +0 -0
  183. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/midm/__init__.py +0 -0
  184. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/midm/configuration_midm.py +0 -0
  185. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/midm/midm_architecture.py +0 -0
  186. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/midm/modeling_midm.py +0 -0
  187. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/mistral/__init__.py +0 -0
  188. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/mistral/configuration_mistral.py +0 -0
  189. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/mistral/mistral_architecture.py +0 -0
  190. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/mistral/modeling_mistral.py +0 -0
  191. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/opt/__init__.py +0 -0
  192. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/opt/configuration_opt.py +0 -0
  193. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/opt/modeling_opt.py +0 -0
  194. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/opt/opt_architecture.py +0 -0
  195. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/phi/__init__.py +0 -0
  196. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/phi/configuration_phi.py +0 -0
  197. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/phi/modeling_phi.py +0 -0
  198. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/phi/phi_architecture.py +0 -0
  199. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/qwen2/__init__.py +0 -0
  200. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/qwen2/configuration_qwen2.py +0 -0
  201. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/qwen2/modeling_qwen2.py +0 -0
  202. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/qwen2/qwen2_architecture.py +0 -0
  203. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/qwen2_5_vl/__init__.py +0 -0
  204. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py +0 -0
  205. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py +0 -0
  206. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py +0 -0
  207. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/seq2seq/__init__.py +0 -0
  208. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/seq2seq/configuration_seq2seq2.py +0 -0
  209. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py +0 -0
  210. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py +0 -0
  211. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/siglip/__init__.py +0 -0
  212. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/siglip/configuration_siglip.py +0 -0
  213. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/siglip/modeling_siglip.py +0 -0
  214. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/t5/__init__.py +0 -0
  215. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/t5/configuration_t5.py +0 -0
  216. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/t5/modeling_t5.py +0 -0
  217. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/t5/t5_architecture.py +0 -0
  218. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/time_series_transformers/__init__.py +0 -0
  219. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/time_series_transformers/configuration_time_series_transformer.py +0 -0
  220. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/time_series_transformers/modeling_time_series_transformers.py +0 -0
  221. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/time_series_transformers/time_series_transformers_architecture.py +0 -0
  222. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/wav2vec2/__init__.py +0 -0
  223. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/wav2vec2/configuration_wav2vec.py +0 -0
  224. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py +0 -0
  225. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/whisper/__init__.py +0 -0
  226. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/whisper/configuration_whisper.py +0 -0
  227. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/whisper/generation_whisper.py +0 -0
  228. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/whisper/modeling_whisper.py +0 -0
  229. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/whisper/whisper_architecture.py +0 -0
  230. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/xlm_roberta/__init__.py +0 -0
  231. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/xlm_roberta/configuration_xlm_roberta.py +0 -0
  232. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py +0 -0
  233. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/utils/__init__.py +0 -0
  234. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/transformers/utils/rbln_quantization.py +0 -0
  235. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/utils/__init__.py +0 -0
  236. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/utils/decorator_utils.py +0 -0
  237. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/utils/hub.py +0 -0
  238. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/utils/import_utils.py +0 -0
  239. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/utils/logging.py +0 -0
  240. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/utils/model_utils.py +0 -0
  241. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/utils/runtime_utils.py +0 -0
  242. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/utils/save_utils.py +0 -0
  243. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/src/optimum/rbln/utils/submodule.py +0 -0
  244. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/tests/__init__.py +0 -0
  245. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/tests/psnr.py +0 -0
  246. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/tests/requirements_sdxl.txt +0 -0
  247. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/tests/run_stable_diffusion_xl_base.py +0 -0
  248. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/tests/test_base.py +0 -0
  249. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/tests/test_config.py +0 -0
  250. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/tests/test_diffusers.py +0 -0
  251. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/tests/test_transformers.py +0 -0
  252. {optimum_rbln-0.8.0 → optimum_rbln-0.8.1a0}/uv.lock +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: optimum-rbln
3
- Version: 0.8.0
3
+ Version: 0.8.1a0
4
4
  Summary: Optimum RBLN is the interface between the HuggingFace Transformers and Diffusers libraries and RBLN accelerators. It provides a set of tools enabling easy model loading and inference on single and multiple rbln device settings for different downstream tasks.
5
5
  Project-URL: Homepage, https://rebellions.ai
6
6
  Project-URL: Documentation, https://docs.rbln.ai
@@ -17,5 +17,5 @@ __version__: str
17
17
  __version_tuple__: VERSION_TUPLE
18
18
  version_tuple: VERSION_TUPLE
19
19
 
20
- __version__ = version = '0.8.0'
21
- __version_tuple__ = version_tuple = (0, 8, 0)
20
+ __version__ = version = '0.8.1a0'
21
+ __version_tuple__ = version_tuple = (0, 8, 1, 'a0')
@@ -709,7 +709,9 @@ class RBLNDecoderOnlyModelForCausalLM(RBLNModel):
709
709
  compiled_models[f"decoder_batch_{batch_size}"].get_alloc_per_node_by_key().items()
710
710
  ):
711
711
  alloc_memory_by_key[key] += sum(memory_per_node)
712
- alloc_memory_by_key.pop("PortRecur") # kv-cache
712
+
713
+ alloc_memory_by_key.pop("PortRecur", None) # Old compiler's kv-cache Key
714
+ alloc_memory_by_key.pop("DramTensor", None) # kv-cache
713
715
  kernel_size = alloc_memory_by_key.pop("Kernel") # model weight
714
716
 
715
717
  # Get the maximum number of blocks that can be allocated
@@ -14,11 +14,13 @@ from optimum.rbln import (
14
14
  RBLNAutoModelForSeq2SeqLM,
15
15
  RBLNAutoModelForVision2Seq,
16
16
  RBLNBartForConditionalGeneration,
17
+ RBLNBlip2ForConditionalGeneration,
17
18
  RBLNExaoneForCausalLM,
18
19
  RBLNGPT2LMHeadModel,
19
20
  RBLNIdefics3ForConditionalGeneration,
20
21
  RBLNLlamaForCausalLM,
21
22
  RBLNLlavaNextForConditionalGeneration,
23
+ RBLNOPTForCausalLM,
22
24
  RBLNPhiForCausalLM,
23
25
  RBLNQwen2_5_VLForConditionalGeneration,
24
26
  RBLNQwen2ForCausalLM,
@@ -69,6 +71,13 @@ class TestQwen2Model(LLMTest.TestLLM):
69
71
  HF_CONFIG_KWARGS = {"max_position_embeddings": 1024}
70
72
 
71
73
 
74
+ class TestOptModel(LLMTest.TestLLM):
75
+ RBLN_CLASS = RBLNOPTForCausalLM
76
+ HF_MODEL_ID = "facebook/opt-2.7b"
77
+ EXPECTED_OUTPUT = "\nI'm a guy who likes to play video games.\nI'm a guy who likes to"
78
+ HF_CONFIG_KWARGS = {"max_position_embeddings": 2048}
79
+
80
+
72
81
  class TestLlamaForCausalLM(LLMTest.TestLLM):
73
82
  RBLN_CLASS = RBLNLlamaForCausalLM
74
83
  HF_MODEL_ID = "afmck/testing-llama-tiny"
@@ -291,6 +300,51 @@ class TestLlavaNextForConditionalGeneration(LLMTest.TestLLM):
291
300
  )
292
301
 
293
302
 
303
+ class TestBlip2ForConditionalGeneration(LLMTest.TestLLM):
304
+ RBLN_AUTO_CLASS = RBLNAutoModelForVision2Seq
305
+ RBLN_CLASS = RBLNBlip2ForConditionalGeneration
306
+ HF_MODEL_ID = "Salesforce/blip2-opt-2.7b" # No tiny model yet.
307
+ PROMPT = "Question: Describe this image? Answer:"
308
+ RBLN_CLASS_KWARGS = {"rbln_config": {"language_model": {"use_inputs_embeds": True}}}
309
+ EXPECTED_OUTPUT = "::::::::::::::::::::"
310
+
311
+ @classmethod
312
+ def get_tokenizer(cls):
313
+ if cls._tokenizer is None:
314
+ cls._tokenizer = AutoProcessor.from_pretrained(cls.HF_MODEL_ID)
315
+ return cls._tokenizer
316
+
317
+ # override
318
+ @classmethod
319
+ def setUpClass(cls):
320
+ config = AutoConfig.from_pretrained(cls.HF_MODEL_ID)
321
+
322
+ text_config = json.loads(config.text_config.to_json_string())
323
+ text_config["num_hidden_layers"] = 1
324
+ kwargs = {"text_config": text_config}
325
+ cls.HF_CONFIG_KWARGS.update(kwargs)
326
+ return super().setUpClass()
327
+
328
+ def get_inputs(self):
329
+ tokenizer = self.get_tokenizer()
330
+ img_path = f"{os.path.dirname(__file__)}/../assets/rbln_logo.png"
331
+ image = Image.open(img_path)
332
+ inputs = tokenizer(images=image, text=self.PROMPT, return_tensors="pt", padding=True)
333
+ inputs["max_new_tokens"] = 20
334
+ inputs["do_sample"] = False
335
+ return inputs
336
+
337
+ def _inner_test_save_load(self, tmpdir):
338
+ super()._inner_test_save_load(tmpdir)
339
+ # Test loading from nested config
340
+ _ = self.RBLN_CLASS.from_pretrained(
341
+ tmpdir,
342
+ export=False,
343
+ rbln_config={"language_model": {"create_runtimes": False}},
344
+ **self.HF_CONFIG_KWARGS,
345
+ )
346
+
347
+
294
348
  class TestIdefics3ForConditionalGeneration(LLMTest.TestLLM):
295
349
  RBLN_AUTO_CLASS = RBLNAutoModelForVision2Seq
296
350
  RBLN_CLASS = RBLNIdefics3ForConditionalGeneration
File without changes
File without changes
File without changes
File without changes