optimum-rbln 0.7.3a4__tar.gz → 0.7.3a5__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (181)
  1. optimum_rbln-0.7.3a5/.github/version.yaml +1 -0
  2. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/PKG-INFO +1 -1
  3. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/__version__.py +2 -2
  4. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +19 -21
  5. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/phi/phi_architecture.py +3 -3
  6. optimum_rbln-0.7.3a4/.github/version.yaml +0 -1
  7. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
  8. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/ISSUE_TEMPLATE/config.yml +0 -0
  9. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
  10. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/ISSUE_TEMPLATE/model_request.md +0 -0
  11. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/pull_request_template.md +0 -0
  12. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/scripts/auto_code_review.py +0 -0
  13. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/scripts/validate_pr_checklist.py +0 -0
  14. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/workflows/auto_code_review.yml +0 -0
  15. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/workflows/check_code_quality.yml +0 -0
  16. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/workflows/deploy-on-tag.yaml +0 -0
  17. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/workflows/deploy.yaml +0 -0
  18. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/workflows/pr-title-check.yaml +0 -0
  19. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/workflows/pr_checklist_validator.yml +0 -0
  20. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/workflows/rbln_check_compiler.yaml +0 -0
  21. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/workflows/rbln_dispatch_pytest.yaml +0 -0
  22. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/workflows/rbln_optimum_inference_test.yaml +0 -0
  23. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/workflows/rbln_optimum_pytest.yaml +0 -0
  24. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/workflows/rbln_scheduled_test.yaml +0 -0
  25. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.github/workflows/rbln_trigger_on_pr.yaml +0 -0
  26. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/.gitignore +0 -0
  27. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/CODE_OF_CONDUCT.md +0 -0
  28. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/CONTRIBUTING.md +0 -0
  29. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/LICENSE +0 -0
  30. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/README.md +0 -0
  31. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/assets/rbln_logo.png +0 -0
  32. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/audio-classification/run_ast_audio_classification.py +0 -0
  33. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/depth-estimation/run_dpt.py +0 -0
  34. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/image-classification/run_image_classification.py +0 -0
  35. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/image-classification/run_vit_image_classification.py +0 -0
  36. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/image-to-text/run_llava_next_image_to_text.py +0 -0
  37. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/kandinsky2_2/run_kandinsky2_2_inpaint.py +0 -0
  38. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/kandinsky2_2/run_kandinsky2_2_inpaint_combined.py +0 -0
  39. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/question-answering/run_question_answering.py +0 -0
  40. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/speech-recognition/run_wav2vec2.py +0 -0
  41. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/speech-recognition/run_whisper.py +0 -0
  42. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/stable-diffusion/run_stable_diffusion.py +0 -0
  43. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/stable-diffusion/run_stable_diffusion_controlnet.py +0 -0
  44. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/stable-diffusion/run_stable_diffusion_img2img.py +0 -0
  45. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/stable-diffusion/run_stable_diffusion_img2img_controlnet.py +0 -0
  46. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/stable-diffusion/run_stable_diffusion_inpaint.py +0 -0
  47. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/stable-diffusion/run_stable_diffusion_lora.py +0 -0
  48. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/stable-diffusion/run_stable_diffusion_multicontrolnet.py +0 -0
  49. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/text-classification/run_bge_m3_text_classification.py +0 -0
  50. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/text-classification/run_bge_reranker_v2_m3_text_classification.py +0 -0
  51. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/text-classification/run_secureBERT.py +0 -0
  52. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/text-classification/run_t5_classification.py +0 -0
  53. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/text-classification/run_twitter_roberta_text_classification.py +0 -0
  54. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/text2text-generation/run_bart_text2text_generation.py +0 -0
  55. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/text2text-generation/run_llama_peft.py +0 -0
  56. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/examples/text2text-generation/run_llama_text2text_generation.py +0 -0
  57. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/pyproject.toml +0 -0
  58. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/scripts/uv-lock.sh +0 -0
  59. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/scripts/uv-sync.sh +0 -0
  60. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/__init__.py +0 -0
  61. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/__init__.py +0 -0
  62. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/modeling_diffusers.py +0 -0
  63. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/models/__init__.py +0 -0
  64. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/models/autoencoders/__init__.py +0 -0
  65. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/models/autoencoders/autoencoder_kl.py +0 -0
  66. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/models/autoencoders/vae.py +0 -0
  67. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/models/autoencoders/vq_model.py +0 -0
  68. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/models/controlnet.py +0 -0
  69. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/models/transformers/__init__.py +0 -0
  70. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/models/transformers/prior_transformer.py +0 -0
  71. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/models/transformers/transformer_sd3.py +0 -0
  72. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/models/unets/__init__.py +0 -0
  73. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/models/unets/unet_2d_condition.py +0 -0
  74. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/__init__.py +0 -0
  75. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/controlnet/__init__.py +0 -0
  76. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py +0 -0
  77. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py +0 -0
  78. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +0 -0
  79. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +0 -0
  80. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +0 -0
  81. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/__init__.py +0 -0
  82. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_combined.py +0 -0
  83. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_inpaint.py +0 -0
  84. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_prior.py +0 -0
  85. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/__init__.py +0 -0
  86. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py +0 -0
  87. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py +0 -0
  88. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_inpaint.py +0 -0
  89. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/__init__.py +0 -0
  90. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py +0 -0
  91. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py +0 -0
  92. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py +0 -0
  93. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/__init__.py +0 -0
  94. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py +0 -0
  95. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py +0 -0
  96. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py +0 -0
  97. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/modeling.py +0 -0
  98. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/modeling_base.py +0 -0
  99. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/modeling_config.py +0 -0
  100. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/ops/__init__.py +0 -0
  101. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/ops/attn.py +0 -0
  102. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/ops/flash_attn.py +0 -0
  103. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/ops/kv_cache_update.py +0 -0
  104. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/__init__.py +0 -0
  105. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/modeling_alias.py +0 -0
  106. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/modeling_generic.py +0 -0
  107. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/modeling_rope_utils.py +0 -0
  108. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/__init__.py +0 -0
  109. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/auto/__init__.py +0 -0
  110. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/auto/auto_factory.py +0 -0
  111. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/auto/modeling_auto.py +0 -0
  112. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/bart/__init__.py +0 -0
  113. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/bart/bart_architecture.py +0 -0
  114. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/bart/modeling_bart.py +0 -0
  115. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/bert/__init__.py +0 -0
  116. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/bert/modeling_bert.py +0 -0
  117. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/clip/__init__.py +0 -0
  118. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/clip/modeling_clip.py +0 -0
  119. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/decoderonly/__init__.py +0 -0
  120. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py +0 -0
  121. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/dpt/__init__.py +0 -0
  122. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/dpt/modeling_dpt.py +0 -0
  123. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/exaone/__init__.py +0 -0
  124. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/exaone/exaone_architecture.py +0 -0
  125. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/exaone/modeling_exaone.py +0 -0
  126. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/gemma/__init__.py +0 -0
  127. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/gemma/gemma_architecture.py +0 -0
  128. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/gemma/modeling_gemma.py +0 -0
  129. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/gpt2/__init__.py +0 -0
  130. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/gpt2/gpt2_architecture.py +0 -0
  131. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/gpt2/modeling_gpt2.py +0 -0
  132. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/llama/__init__.py +0 -0
  133. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/llama/llama_architecture.py +0 -0
  134. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/llama/modeling_llama.py +0 -0
  135. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/llava_next/__init__.py +0 -0
  136. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/llava_next/modeling_llava_next.py +0 -0
  137. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/midm/__init__.py +0 -0
  138. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/midm/midm_architecture.py +0 -0
  139. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/midm/modeling_midm.py +0 -0
  140. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/mistral/__init__.py +0 -0
  141. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/mistral/mistral_architecture.py +0 -0
  142. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/mistral/modeling_mistral.py +0 -0
  143. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/phi/__init__.py +0 -0
  144. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/phi/modeling_phi.py +0 -0
  145. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/qwen2/__init__.py +0 -0
  146. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/qwen2/modeling_qwen2.py +0 -0
  147. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/qwen2/qwen2_architecture.py +0 -0
  148. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/seq2seq/__init__.py +0 -0
  149. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py +0 -0
  150. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py +0 -0
  151. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/t5/__init__.py +0 -0
  152. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/t5/modeling_t5.py +0 -0
  153. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/t5/t5_architecture.py +0 -0
  154. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/wav2vec2/__init__.py +0 -0
  155. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py +0 -0
  156. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/whisper/__init__.py +0 -0
  157. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/whisper/generation_whisper.py +0 -0
  158. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/whisper/modeling_whisper.py +0 -0
  159. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/whisper/whisper_architecture.py +0 -0
  160. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/xlm_roberta/__init__.py +0 -0
  161. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py +0 -0
  162. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/utils/__init__.py +0 -0
  163. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/transformers/utils/rbln_quantization.py +0 -0
  164. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/utils/__init__.py +0 -0
  165. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/utils/decorator_utils.py +0 -0
  166. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/utils/hub.py +0 -0
  167. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/utils/import_utils.py +0 -0
  168. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/utils/logging.py +0 -0
  169. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/utils/model_utils.py +0 -0
  170. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/utils/runtime_utils.py +0 -0
  171. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/utils/save_utils.py +0 -0
  172. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/src/optimum/rbln/utils/submodule.py +0 -0
  173. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/tests/__init__.py +0 -0
  174. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/tests/psnr.py +0 -0
  175. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/tests/requirements_sdxl.txt +0 -0
  176. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/tests/run_stable_diffusion_xl_base.py +0 -0
  177. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/tests/test_base.py +0 -0
  178. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/tests/test_diffusers.py +0 -0
  179. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/tests/test_llm.py +0 -0
  180. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/tests/test_transformers.py +0 -0
  181. {optimum_rbln-0.7.3a4 → optimum_rbln-0.7.3a5}/uv.lock +0 -0
@@ -0,0 +1 @@
1
+ rebel_compiler_version: 0.7.3.dev196+ge9a294be
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: optimum-rbln
3
- Version: 0.7.3a4
3
+ Version: 0.7.3a5
4
4
  Summary: Optimum RBLN is the interface between the Hugging Face Transformers and Diffusers libraries and RBLN accelerators. It provides a set of tools enabling easy model loading and inference on single and multiple rbln device settings for different downstream tasks.
5
5
  Project-URL: Homepage, https://rebellions.ai
6
6
  Project-URL: Documentation, https://docs.rbln.ai
@@ -17,5 +17,5 @@ __version__: str
17
17
  __version_tuple__: VERSION_TUPLE
18
18
  version_tuple: VERSION_TUPLE
19
19
 
20
- __version__ = version = '0.7.3a4'
21
- __version_tuple__ = version_tuple = (0, 7, 3, 'a4')
20
+ __version__ = version = '0.7.3a5'
21
+ __version_tuple__ = version_tuple = (0, 7, 3, 'a5')
@@ -685,27 +685,28 @@ class RBLNDecoderOnlyModelForCausalLM(RBLNModel):
685
685
  else:
686
686
  rbln_kvcache_block_size = rbln_kvcache_partition_len
687
687
 
688
- max_num_blocks, nbytes_per_block = cls.get_maximum_num_blocks(
689
- config=model_config,
690
- tensor_parallel_size=rbln_kwargs.get("tensor_parallel_size", 1),
691
- kvcache_block_size=rbln_kvcache_block_size,
692
- nbits_per_param=16 if rbln_quantization is None else 4, # TODO(jongho): FIX Ad-hoc
693
- n_model_params=rbln_kwargs["n_model_params"],
694
- )
695
- model_num_blocks = (rbln_max_seq_len // rbln_kvcache_block_size) * rbln_batch_size
696
- rbln_kvcache_num_blocks = min(model_num_blocks, max_num_blocks)
688
+ rbln_kvcache_num_blocks = (rbln_max_seq_len // rbln_kvcache_block_size) * rbln_batch_size
689
+ if rbln_attn_impl == "flash_attn":
690
+ max_num_blocks, _ = cls.get_maximum_num_blocks(
691
+ config=model_config,
692
+ tensor_parallel_size=rbln_kwargs.get("tensor_parallel_size", 1),
693
+ kvcache_block_size=rbln_kvcache_block_size,
694
+ nbits_per_param=16 if rbln_quantization is None else 4, # TODO(jongho): FIX Ad-hoc
695
+ n_model_params=rbln_kwargs["n_model_params"],
696
+ )
697
+ rbln_kvcache_num_blocks = min(rbln_kvcache_num_blocks, max_num_blocks)
697
698
 
698
- required_blocks = rbln_max_seq_len // rbln_kvcache_block_size + 1
699
- if rbln_kvcache_num_blocks < required_blocks:
700
- rbln_kvcache_num_blocks = required_blocks
699
+ required_blocks = rbln_max_seq_len // rbln_kvcache_block_size + 1
700
+ if rbln_kvcache_num_blocks < required_blocks:
701
+ rbln_kvcache_num_blocks = required_blocks
701
702
 
702
- logger.info(f"[KVCache] Compiling with num_blocks: {rbln_kvcache_num_blocks}")
703
+ logger.info(f"[KVCache] Compiling with num_blocks: {rbln_kvcache_num_blocks}")
703
704
 
704
- if rbln_kvcache_num_blocks < rbln_batch_size:
705
- raise RuntimeError(
706
- f"Batch size ({rbln_batch_size}) exceeds available KV cache blocks ({rbln_kvcache_num_blocks}). "
707
- "Ensure the number of blocks is at least equal to the batch size."
708
- )
705
+ if rbln_kvcache_num_blocks < rbln_batch_size:
706
+ raise RuntimeError(
707
+ f"Batch size ({rbln_batch_size}) exceeds available KV cache blocks ({rbln_kvcache_num_blocks}). "
708
+ "Ensure the number of blocks is at least equal to the batch size."
709
+ )
709
710
 
710
711
  num_attention_heads = getattr(model_config, "n_head", None) or getattr(model_config, "num_attention_heads")
711
712
  num_key_value_heads = getattr(model_config, "num_key_value_heads", None) or num_attention_heads
@@ -805,9 +806,6 @@ class RBLNDecoderOnlyModelForCausalLM(RBLNModel):
805
806
  "kvcache_block_size": rbln_kvcache_block_size,
806
807
  "attn_impl": rbln_attn_impl,
807
808
  "kvcache_num_blocks": rbln_kvcache_num_blocks,
808
- "model_num_blocks": model_num_blocks,
809
- "max_num_blocks": max_num_blocks,
810
- "nbytes_per_block": nbytes_per_block,
811
809
  }
812
810
  )
813
811
 
@@ -92,7 +92,7 @@ class PhiLayer(DecoderOnlyLayer):
92
92
 
93
93
  hidden_states = self.get_pre_attention_layernorm()(hidden_states)
94
94
 
95
- attn_outputs, present_key_values = self.self_attn(
95
+ attn_output = self.self_attn(
96
96
  hidden_states=hidden_states,
97
97
  attention_mask=attention_mask,
98
98
  seq_positions=seq_positions,
@@ -104,9 +104,9 @@ class PhiLayer(DecoderOnlyLayer):
104
104
 
105
105
  feed_forward_hidden_states = self._original_mod.mlp(hidden_states)
106
106
 
107
- hidden_states = attn_outputs + feed_forward_hidden_states + residual
107
+ hidden_states = attn_output + feed_forward_hidden_states + residual
108
108
 
109
- return hidden_states, present_key_values
109
+ return hidden_states
110
110
 
111
111
 
112
112
  class PhiModel(DecoderOnlyModel):
@@ -1 +0,0 @@
1
- rebel_compiler_version: 0.7.3.dev162+g81024cdb
File without changes
File without changes
File without changes