optimum-rbln 0.8.1a2__tar.gz → 0.8.1a3__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (266)
  1. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/PKG-INFO +1 -1
  2. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/__version__.py +2 -2
  3. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +2 -2
  4. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/gemma3/modeling_gemma3.py +4 -12
  5. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py +1 -11
  6. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py +0 -43
  7. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/tests/test_llm.py +2 -2
  8. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
  9. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/ISSUE_TEMPLATE/config.yml +0 -0
  10. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
  11. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/ISSUE_TEMPLATE/model_request.md +0 -0
  12. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/pull_request_template.md +0 -0
  13. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/scripts/auto_code_review.py +0 -0
  14. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/scripts/validate_pr_checklist.py +0 -0
  15. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/version.yaml +0 -0
  16. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/workflows/auto_code_review.yml +0 -0
  17. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/workflows/check_code_quality.yml +0 -0
  18. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/workflows/deploy-on-tag.yaml +0 -0
  19. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/workflows/deploy.yaml +0 -0
  20. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/workflows/pr-title-check.yaml +0 -0
  21. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/workflows/pr_checklist_validator.yml +0 -0
  22. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/workflows/rbln_check_compiler.yaml +0 -0
  23. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/workflows/rbln_dispatch_pytest.yaml +0 -0
  24. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/workflows/rbln_optimum_inference_test.yaml +0 -0
  25. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/workflows/rbln_optimum_pytest.yaml +0 -0
  26. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/workflows/rbln_scheduled_test.yaml +0 -0
  27. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.github/workflows/rbln_trigger_on_pr.yaml +0 -0
  28. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/.gitignore +0 -0
  29. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/CODE_OF_CONDUCT.md +0 -0
  30. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/CONTRIBUTING.md +0 -0
  31. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/LICENSE +0 -0
  32. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/README.md +0 -0
  33. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/assets/rbln_logo.png +0 -0
  34. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/advanced/custom_class.py +0 -0
  35. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/audio-classification/run_ast_audio_classification.py +0 -0
  36. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/depth-estimation/run_dpt.py +0 -0
  37. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/image-classification/run_image_classification.py +0 -0
  38. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/image-classification/run_vit_image_classification.py +0 -0
  39. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/image-to-text/run_idefics3.py +0 -0
  40. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/image-to-text/run_llava_next_image_to_text.py +0 -0
  41. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/kandinsky2_2/run_kandinsky2_2.py +0 -0
  42. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/kandinsky2_2/run_kandinsky2_2_combined.py +0 -0
  43. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/kandinsky2_2/run_kandinsky2_2_img2img.py +0 -0
  44. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/kandinsky2_2/run_kandinsky2_2_img2img_combined.py +0 -0
  45. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/kandinsky2_2/run_kandinsky2_2_inpaint.py +0 -0
  46. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/kandinsky2_2/run_kandinsky2_2_inpaint_combined.py +0 -0
  47. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/kandinsky2_2/run_kandinsky2_2_prior_interpolate.py +0 -0
  48. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/question-answering/run_question_answering.py +0 -0
  49. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/speech-recognition/run_wav2vec2.py +0 -0
  50. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/speech-recognition/run_whisper.py +0 -0
  51. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/stable-diffusion/run_stable_diffusion.py +0 -0
  52. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/stable-diffusion/run_stable_diffusion_controlnet.py +0 -0
  53. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/stable-diffusion/run_stable_diffusion_img2img.py +0 -0
  54. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/stable-diffusion/run_stable_diffusion_img2img_controlnet.py +0 -0
  55. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/stable-diffusion/run_stable_diffusion_inpaint.py +0 -0
  56. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/stable-diffusion/run_stable_diffusion_lora.py +0 -0
  57. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/stable-diffusion/run_stable_diffusion_multicontrolnet.py +0 -0
  58. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/text-classification/run_bge_m3_text_classification.py +0 -0
  59. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/text-classification/run_bge_reranker_v2_m3_text_classification.py +0 -0
  60. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/text-classification/run_secureBERT.py +0 -0
  61. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/text-classification/run_t5_classification.py +0 -0
  62. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/text-classification/run_twitter_roberta_text_classification.py +0 -0
  63. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/text2text-generation/run_bart_text2text_generation.py +0 -0
  64. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/text2text-generation/run_llama_peft.py +0 -0
  65. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/text2text-generation/run_llama_text2text_generation.py +0 -0
  66. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/examples/time-series-forecasting/run_time_series_forecasting.py +0 -0
  67. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/pyproject.toml +0 -0
  68. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/scripts/uv-lock.sh +0 -0
  69. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/scripts/uv-sync.sh +0 -0
  70. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/__init__.py +0 -0
  71. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/configuration_utils.py +0 -0
  72. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/__init__.py +0 -0
  73. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/__init__.py +0 -0
  74. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/models/__init__.py +0 -0
  75. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/models/configuration_autoencoder_kl.py +0 -0
  76. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/models/configuration_controlnet.py +0 -0
  77. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/models/configuration_prior_transformer.py +0 -0
  78. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/models/configuration_transformer_sd3.py +0 -0
  79. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/models/configuration_unet_2d_condition.py +0 -0
  80. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/models/configuration_vq_model.py +0 -0
  81. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/pipelines/__init__.py +0 -0
  82. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_controlnet.py +0 -0
  83. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_kandinsky2_2.py +0 -0
  84. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion.py +0 -0
  85. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_3.py +0 -0
  86. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_xl.py +0 -0
  87. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/modeling_diffusers.py +0 -0
  88. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/models/__init__.py +0 -0
  89. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/models/autoencoders/__init__.py +0 -0
  90. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/models/autoencoders/autoencoder_kl.py +0 -0
  91. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/models/autoencoders/vae.py +0 -0
  92. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/models/autoencoders/vq_model.py +0 -0
  93. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/models/controlnet.py +0 -0
  94. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/models/transformers/__init__.py +0 -0
  95. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/models/transformers/prior_transformer.py +0 -0
  96. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/models/transformers/transformer_sd3.py +0 -0
  97. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/models/unets/__init__.py +0 -0
  98. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/models/unets/unet_2d_condition.py +0 -0
  99. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/__init__.py +0 -0
  100. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/controlnet/__init__.py +0 -0
  101. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py +0 -0
  102. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py +0 -0
  103. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +0 -0
  104. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +0 -0
  105. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +0 -0
  106. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/__init__.py +0 -0
  107. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2.py +0 -0
  108. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_combined.py +0 -0
  109. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_img2img.py +0 -0
  110. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_inpaint.py +0 -0
  111. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_prior.py +0 -0
  112. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/__init__.py +0 -0
  113. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py +0 -0
  114. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py +0 -0
  115. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_inpaint.py +0 -0
  116. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/__init__.py +0 -0
  117. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py +0 -0
  118. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py +0 -0
  119. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py +0 -0
  120. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/__init__.py +0 -0
  121. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py +0 -0
  122. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py +0 -0
  123. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py +0 -0
  124. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/modeling.py +0 -0
  125. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/modeling_base.py +0 -0
  126. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/ops/__init__.py +0 -0
  127. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/ops/attn.py +0 -0
  128. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/ops/flash_attn.py +0 -0
  129. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/ops/kv_cache_update.py +0 -0
  130. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/ops/linear.py +0 -0
  131. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/ops/sliding_window_attn.py +0 -0
  132. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/__init__.py +0 -0
  133. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/configuration_generic.py +0 -0
  134. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/modeling_generic.py +0 -0
  135. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/modeling_rope_utils.py +0 -0
  136. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/__init__.py +0 -0
  137. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/audio_spectrogram_transformer/__init__.py +0 -0
  138. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/audio_spectrogram_transformer/configuration_audio_spectrogram_transformer.py +0 -0
  139. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/audio_spectrogram_transformer/modeling_audio_spectrogram_transformer.py +0 -0
  140. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/auto/__init__.py +0 -0
  141. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/auto/auto_factory.py +0 -0
  142. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/auto/modeling_auto.py +0 -0
  143. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/bart/__init__.py +0 -0
  144. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/bart/bart_architecture.py +0 -0
  145. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/bart/configuration_bart.py +0 -0
  146. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/bart/modeling_bart.py +0 -0
  147. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/bert/__init__.py +0 -0
  148. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/bert/configuration_bert.py +0 -0
  149. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/bert/modeling_bert.py +0 -0
  150. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/blip_2/__init__.py +0 -0
  151. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/blip_2/configuration_blip_2.py +0 -0
  152. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/blip_2/modeling_blip_2.py +0 -0
  153. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/clip/__init__.py +0 -0
  154. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/clip/configuration_clip.py +0 -0
  155. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/clip/modeling_clip.py +0 -0
  156. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/decoderonly/__init__.py +0 -0
  157. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py +0 -0
  158. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py +0 -0
  159. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/distilbert/__init__.py +0 -0
  160. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/distilbert/configuration_distilbert.py +0 -0
  161. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/distilbert/modeling_distilbert.py +0 -0
  162. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/dpt/__init__.py +0 -0
  163. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/dpt/configuration_dpt.py +0 -0
  164. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/dpt/modeling_dpt.py +0 -0
  165. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/exaone/__init__.py +0 -0
  166. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/exaone/configuration_exaone.py +0 -0
  167. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/exaone/exaone_architecture.py +0 -0
  168. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/exaone/modeling_exaone.py +0 -0
  169. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/gemma/__init__.py +0 -0
  170. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/gemma/configuration_gemma.py +0 -0
  171. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/gemma/gemma_architecture.py +0 -0
  172. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/gemma/modeling_gemma.py +0 -0
  173. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/gemma3/__init__.py +0 -0
  174. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/gemma3/configuration_gemma3.py +0 -0
  175. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/gemma3/gemma3_architecture.py +0 -0
  176. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/gpt2/__init__.py +0 -0
  177. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/gpt2/configuration_gpt2.py +0 -0
  178. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/gpt2/gpt2_architecture.py +0 -0
  179. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/gpt2/modeling_gpt2.py +0 -0
  180. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/idefics3/__init__.py +0 -0
  181. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/idefics3/configuration_idefics3.py +0 -0
  182. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/idefics3/modeling_idefics3.py +0 -0
  183. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/llama/__init__.py +0 -0
  184. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/llama/configuration_llama.py +0 -0
  185. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/llama/llama_architecture.py +0 -0
  186. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/llama/modeling_llama.py +0 -0
  187. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/llava_next/__init__.py +0 -0
  188. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/llava_next/configuration_llava_next.py +0 -0
  189. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/llava_next/modeling_llava_next.py +0 -0
  190. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/midm/__init__.py +0 -0
  191. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/midm/configuration_midm.py +0 -0
  192. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/midm/midm_architecture.py +0 -0
  193. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/midm/modeling_midm.py +0 -0
  194. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/mistral/__init__.py +0 -0
  195. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/mistral/configuration_mistral.py +0 -0
  196. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/mistral/mistral_architecture.py +0 -0
  197. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/mistral/modeling_mistral.py +0 -0
  198. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/opt/__init__.py +0 -0
  199. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/opt/configuration_opt.py +0 -0
  200. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/opt/modeling_opt.py +0 -0
  201. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/opt/opt_architecture.py +0 -0
  202. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/phi/__init__.py +0 -0
  203. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/phi/configuration_phi.py +0 -0
  204. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/phi/modeling_phi.py +0 -0
  205. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/phi/phi_architecture.py +0 -0
  206. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/qwen2/__init__.py +0 -0
  207. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/qwen2/configuration_qwen2.py +0 -0
  208. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/qwen2/modeling_qwen2.py +0 -0
  209. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/qwen2/qwen2_architecture.py +0 -0
  210. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/qwen2_5_vl/__init__.py +0 -0
  211. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py +0 -0
  212. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/resnet/__init__.py +0 -0
  213. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/resnet/configuration_resnet.py +0 -0
  214. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/resnet/modeling_resnet.py +0 -0
  215. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/roberta/__init__.py +0 -0
  216. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/roberta/configuration_roberta.py +0 -0
  217. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/roberta/modeling_roberta.py +0 -0
  218. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/seq2seq/__init__.py +0 -0
  219. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/seq2seq/configuration_seq2seq.py +0 -0
  220. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py +0 -0
  221. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py +0 -0
  222. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/siglip/__init__.py +0 -0
  223. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/siglip/configuration_siglip.py +0 -0
  224. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/siglip/modeling_siglip.py +0 -0
  225. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/t5/__init__.py +0 -0
  226. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/t5/configuration_t5.py +0 -0
  227. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/t5/modeling_t5.py +0 -0
  228. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/t5/t5_architecture.py +0 -0
  229. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/time_series_transformer/__init__.py +0 -0
  230. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/time_series_transformer/configuration_time_series_transformer.py +0 -0
  231. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/time_series_transformer/modeling_time_series_transformer.py +0 -0
  232. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/time_series_transformer/time_series_transformers_architecture.py +0 -0
  233. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/vit/__init__.py +0 -0
  234. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/vit/configuration_vit.py +0 -0
  235. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/vit/modeling_vit.py +0 -0
  236. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/wav2vec2/__init__.py +0 -0
  237. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/wav2vec2/configuration_wav2vec2.py +0 -0
  238. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py +0 -0
  239. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/whisper/__init__.py +0 -0
  240. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/whisper/configuration_whisper.py +0 -0
  241. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/whisper/generation_whisper.py +0 -0
  242. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/whisper/modeling_whisper.py +0 -0
  243. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/whisper/whisper_architecture.py +0 -0
  244. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/xlm_roberta/__init__.py +0 -0
  245. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/xlm_roberta/configuration_xlm_roberta.py +0 -0
  246. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py +0 -0
  247. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/utils/__init__.py +0 -0
  248. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/transformers/utils/rbln_quantization.py +0 -0
  249. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/utils/__init__.py +0 -0
  250. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/utils/decorator_utils.py +0 -0
  251. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/utils/hub.py +0 -0
  252. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/utils/import_utils.py +0 -0
  253. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/utils/logging.py +0 -0
  254. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/utils/model_utils.py +0 -0
  255. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/utils/runtime_utils.py +0 -0
  256. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/utils/save_utils.py +0 -0
  257. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/src/optimum/rbln/utils/submodule.py +0 -0
  258. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/tests/__init__.py +0 -0
  259. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/tests/psnr.py +0 -0
  260. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/tests/requirements_sdxl.txt +0 -0
  261. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/tests/run_stable_diffusion_xl_base.py +0 -0
  262. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/tests/test_base.py +0 -0
  263. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/tests/test_config.py +0 -0
  264. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/tests/test_diffusers.py +0 -0
  265. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/tests/test_transformers.py +0 -0
  266. {optimum_rbln-0.8.1a2 → optimum_rbln-0.8.1a3}/uv.lock +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: optimum-rbln
3
- Version: 0.8.1a2
3
+ Version: 0.8.1a3
4
4
  Summary: Optimum RBLN is the interface between the HuggingFace Transformers and Diffusers libraries and RBLN accelerators. It provides a set of tools enabling easy model loading and inference on single and multiple rbln device settings for different downstream tasks.
5
5
  Project-URL: Homepage, https://rebellions.ai
6
6
  Project-URL: Documentation, https://docs.rbln.ai
@@ -17,5 +17,5 @@ __version__: str
17
17
  __version_tuple__: VERSION_TUPLE
18
18
  version_tuple: VERSION_TUPLE
19
19
 
20
- __version__ = version = '0.8.1a2'
21
- __version_tuple__ = version_tuple = (0, 8, 1, 'a2')
20
+ __version__ = version = '0.8.1a3'
21
+ __version_tuple__ = version_tuple = (0, 8, 1, 'a3')
@@ -177,8 +177,8 @@ class RBLNRuntimeModel(RBLNPytorchRuntime):
177
177
  )
178
178
  elif block_tables is None and local_block_tables is None:
179
179
  return False
180
- else:
181
- return True
180
+
181
+ return True
182
182
 
183
183
  def forward(
184
184
  self,
@@ -559,7 +559,7 @@ class RBLNGemma3RuntimeModel(RBLNRuntimeModel):
559
559
  (
560
560
  inputs,
561
561
  cache_position,
562
- chunked_attention_mask,
562
+ padded_attention_mask,
563
563
  out_buffers,
564
564
  position_ids,
565
565
  position_embed,
@@ -571,7 +571,7 @@ class RBLNGemma3RuntimeModel(RBLNRuntimeModel):
571
571
  )
572
572
  if not is_external_block_tables:
573
573
  local_block_tables = torch.tensor([batch_idx], dtype=torch.int16)
574
- self.dec_attn_mask[batch_idx : batch_idx + 1] = chunked_attention_mask[:1]
574
+ self.dec_attn_mask[batch_idx : batch_idx + 1] = padded_attention_mask[:1]
575
575
 
576
576
  if self.rbln_config.use_attention_mask and self.rbln_config.use_position_ids:
577
577
  chunked_attention_mask = torch.zeros(1, self.rbln_config.max_seq_len, dtype=torch.float32)
@@ -587,18 +587,10 @@ class RBLNGemma3RuntimeModel(RBLNRuntimeModel):
587
587
  else None
588
588
  )
589
589
 
590
- # Not used in Gemma3 yet.
591
590
  if self.rbln_config.use_attention_mask:
592
591
  if self.rbln_config.use_position_ids:
593
- chunked_attention_mask[0, step : step + self.rbln_config.prefill_chunk_size] = self.dec_attn_mask[
594
- batch_idx, step : step + self.rbln_config.prefill_chunk_size
595
- ]
596
- else:
597
- # Update attention mask to ensure proper causal behavior
598
- if step >= self.rbln_config.prefill_chunk_size:
599
- chunked_attention_mask[:, :, :, step - self.rbln_config.prefill_chunk_size : step] = 1
600
- chunked_attention_mask[:, :, :, step : step + self.rbln_config.prefill_chunk_size] = (
601
- self.causal_mask
592
+ chunked_attention_mask[0, step : step + self.rbln_config.prefill_chunk_size] = (
593
+ padded_attention_mask[0, step : step + self.rbln_config.prefill_chunk_size]
602
594
  )
603
595
 
604
596
  # Define query position
@@ -28,7 +28,6 @@ from transformers.models.qwen2_5_vl.modeling_qwen2_5_vl import (
28
28
  Qwen2_5_VisionPatchEmbed,
29
29
  Qwen2_5_VisionRotaryEmbedding,
30
30
  Qwen2_5_VisionTransformerPretrainedModel,
31
- Qwen2_5_VLModel,
32
31
  Qwen2_5_VLRotaryEmbedding,
33
32
  )
34
33
 
@@ -391,14 +390,6 @@ class RBLNQwen2_5_VLForConditionalGeneration(RBLNDecoderOnlyModelForCausalLM):
391
390
  def can_generate(self):
392
391
  return True
393
392
 
394
- @classmethod
395
- def get_pytorch_model(cls, *args, **kwargs):
396
- model = super().get_pytorch_model(*args, **kwargs)
397
- model.model.lm_head = model.lm_head
398
- model.lm_head = None
399
- del model.lm_head
400
- return model
401
-
402
393
  @classmethod
403
394
  def update_kwargs(cls, kwargs):
404
395
  kwargs.update(
@@ -540,8 +531,7 @@ class RBLNQwen2_5_VLForConditionalGeneration(RBLNDecoderOnlyModelForCausalLM):
540
531
  vision_tokens = input_id[0][vision_start_indices + 1]
541
532
  image_nums = (vision_tokens == image_token_id).sum()
542
533
  video_nums = (vision_tokens == video_token_id).sum()
543
- position_ids, rope_deltas = Qwen2_5_VLModel.get_rope_index(
544
- self,
534
+ position_ids, rope_deltas = self.get_rope_index(
545
535
  input_id,
546
536
  image_grid_thw[image_idx : image_idx + image_nums] if image_grid_thw is not None else None,
547
537
  video_grid_thw[video_idx : video_idx + video_nums] if video_grid_thw is not None else None,
@@ -3,14 +3,8 @@ from typing import Tuple
3
3
 
4
4
  import torch
5
5
  import torch.nn as nn
6
- from transformers import PreTrainedModel
7
6
 
8
7
  from ..decoderonly.decoderonly_architecture import (
9
- DecoderOnlyAttention,
10
- DecoderOnlyFlashAttention,
11
- DecoderOnlyForCausalLM,
12
- DecoderOnlyLayer,
13
- DecoderOnlyModel,
14
8
  DecoderOnlyWrapper,
15
9
  apply_rotary_pos_emb,
16
10
  )
@@ -203,40 +197,3 @@ class Qwen2_5_VL_LanguageModelWrapper(DecoderOnlyWrapper):
203
197
  past_key_values,
204
198
  position_embeds,
205
199
  )
206
-
207
- def convert_to_rbln_causal_lm(self, causal_lm: PreTrainedModel, max_seq_len: int):
208
- new_layers = []
209
-
210
- for layer in causal_lm.model.language_model.layers:
211
- if self.attn_impl == "eager":
212
- new_self_attn = DecoderOnlyAttention(
213
- layer.self_attn,
214
- self.use_attention_mask,
215
- self.use_position_ids,
216
- kvcache_block_size=self.kvcache_block_size,
217
- )
218
- elif self.attn_impl == "flash_attn":
219
- new_self_attn = DecoderOnlyFlashAttention(
220
- layer.self_attn,
221
- kvcache_partition_len=self.kvcache_partition_len,
222
- kvcache_block_size=self.kvcache_block_size,
223
- use_attention_mask=self.use_attention_mask,
224
- use_position_ids=self.use_position_ids,
225
- )
226
- else:
227
- raise NotImplementedError(f"Unknwon attn : {self.attn_impl}")
228
-
229
- new_layer = DecoderOnlyLayer(layer, new_self_attn)
230
- new_layers.append(new_layer)
231
-
232
- new_model = DecoderOnlyModel(
233
- causal_lm.model.language_model,
234
- new_layers,
235
- partition_len=self.kvcache_partition_len,
236
- max_seq_len=max_seq_len,
237
- kvcache_block_size=self.kvcache_block_size,
238
- use_learned_pos_emb=self.use_learned_pos_emb,
239
- sliding_window_layers=self.sliding_window_layers,
240
- )
241
- new_causal_lm = DecoderOnlyForCausalLM(causal_lm.model, new_model)
242
- return new_causal_lm
@@ -67,7 +67,7 @@ class LLMTest:
67
67
  class TestQwen2Model(LLMTest.TestLLM):
68
68
  RBLN_CLASS = RBLNQwen2ForCausalLM
69
69
  HF_MODEL_ID = "Qwen/Qwen2-0.5B-Instruct"
70
- EXPECTED_OUTPUT = " I am a 30-year-old woman who has been living with lupus for over 1"
70
+ EXPECTED_OUTPUT = " I am a 20 year old girl from the United States. I have been studying English for"
71
71
  HF_CONFIG_KWARGS = {"max_position_embeddings": 1024}
72
72
 
73
73
 
@@ -108,7 +108,7 @@ class TestLlamaForCausalLM_Flash(LLMTest.TestLLM):
108
108
  class TestLlamaForCausalLM_Multibatch(TestLlamaForCausalLM):
109
109
  PROMPT = ["Who are you?", "What is the capital of France?", "What is the capital of Germany?"]
110
110
  EXPECTED_OUTPUT = [
111
- "reress makefable R���� noethetsshss rechoolso�",
111
+ "reress makefable R���� noethetss0oss invetetet",
112
112
  "resget makeget makeichget makeichualichual#choolchool accngngngng",
113
113
  "resget makeget makeichget makeichualichual#choolchool accngngngng",
114
114
  ]
File without changes
File without changes