optimum-rbln 0.2.1a4__tar.gz → 0.2.1a5__tar.gz

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (169)
  1. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/PKG-INFO +1 -1
  2. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/__version__.py +1 -1
  3. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/modeling_base.py +10 -9
  4. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py +3 -1
  5. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py +1 -1
  6. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
  7. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/ISSUE_TEMPLATE/config.yml +0 -0
  8. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
  9. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/ISSUE_TEMPLATE/model_request.md +0 -0
  10. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/pull_request_template.md +0 -0
  11. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/scripts/auto_code_review.py +0 -0
  12. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/scripts/validate_pr_checklist.py +0 -0
  13. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/workflows/auto_code_review.yml +0 -0
  14. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/workflows/check_code_quality.yml +0 -0
  15. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/workflows/deploy-on-tag.yaml +0 -0
  16. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/workflows/deploy.yaml +0 -0
  17. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/workflows/pr-title-check.yaml +0 -0
  18. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/workflows/pr_checklist_validator.yml +0 -0
  19. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/workflows/rbln_dispatch_pytest.yaml +0 -0
  20. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/workflows/rbln_optimum_inference_test.yaml +0 -0
  21. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/workflows/rbln_optimum_pytest.yaml +0 -0
  22. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.github/workflows/rbln_trigger_on_pr.yaml +0 -0
  23. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/.gitignore +0 -0
  24. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/CODE_OF_CONDUCT.md +0 -0
  25. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/CONTRIBUTING.md +0 -0
  26. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/LICENSE +0 -0
  27. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/README.md +0 -0
  28. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/assets/rbln_logo.png +0 -0
  29. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/audio-classification/run_ast_audio_classification.py +0 -0
  30. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/depth-estimation/run_dpt.py +0 -0
  31. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/image-classification/run_image_classification.py +0 -0
  32. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/image-classification/run_vit_image_classification.py +0 -0
  33. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/image-to-text/run_llava_next_image_to_text.py +0 -0
  34. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/question-answering/run_question_answering.py +0 -0
  35. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/speech-recognition/run_wav2vec2.py +0 -0
  36. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/speech-recognition/run_whisper.py +0 -0
  37. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/stable-diffusion/run_stable_diffusion.py +0 -0
  38. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/stable-diffusion/run_stable_diffusion_controlnet.py +0 -0
  39. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/stable-diffusion/run_stable_diffusion_img2img.py +0 -0
  40. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/stable-diffusion/run_stable_diffusion_img2img_controlnet.py +0 -0
  41. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/stable-diffusion/run_stable_diffusion_inpaint.py +0 -0
  42. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/stable-diffusion/run_stable_diffusion_lora.py +0 -0
  43. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/stable-diffusion/run_stable_diffusion_multicontrolnet.py +0 -0
  44. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/text-classification/run_bge_m3_text_classification.py +0 -0
  45. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/text-classification/run_bge_reranker_v2_m3_text_classification.py +0 -0
  46. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/text-classification/run_secureBERT.py +0 -0
  47. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/text-classification/run_t5_classification.py +0 -0
  48. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/text-classification/run_twitter_roberta_text_classification.py +0 -0
  49. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/text2text-generation/run_bart_text2text_generation.py +0 -0
  50. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/text2text-generation/run_llama_peft.py +0 -0
  51. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/examples/text2text-generation/run_llama_text2text_generation.py +0 -0
  52. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/pyproject.toml +0 -0
  53. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/scripts/uv-lock.sh +0 -0
  54. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/scripts/uv-sync.sh +0 -0
  55. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/__init__.py +0 -0
  56. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/__init__.py +0 -0
  57. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/modeling_diffusers.py +0 -0
  58. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/models/__init__.py +0 -0
  59. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/models/autoencoders/__init__.py +0 -0
  60. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/models/autoencoders/autoencoder_kl.py +0 -0
  61. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/models/autoencoders/vae.py +0 -0
  62. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/models/controlnet.py +0 -0
  63. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/models/transformers/__init__.py +0 -0
  64. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/models/transformers/transformer_sd3.py +0 -0
  65. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/models/unets/__init__.py +0 -0
  66. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/models/unets/unet_2d_condition.py +0 -0
  67. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/__init__.py +0 -0
  68. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/controlnet/__init__.py +0 -0
  69. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py +0 -0
  70. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py +0 -0
  71. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +0 -0
  72. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +0 -0
  73. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +0 -0
  74. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/__init__.py +0 -0
  75. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py +0 -0
  76. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py +0 -0
  77. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_inpaint.py +0 -0
  78. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/__init__.py +0 -0
  79. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py +0 -0
  80. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py +0 -0
  81. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py +0 -0
  82. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/__init__.py +0 -0
  83. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py +0 -0
  84. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py +0 -0
  85. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py +0 -0
  86. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/modeling.py +0 -0
  87. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/modeling_config.py +0 -0
  88. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/ops/__init__.py +0 -0
  89. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/ops/attn.py +0 -0
  90. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/ops/flash_attn.py +0 -0
  91. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/ops/kv_cache_update.py +0 -0
  92. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/__init__.py +0 -0
  93. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/modeling_alias.py +0 -0
  94. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/modeling_generic.py +0 -0
  95. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/modeling_rope_utils.py +0 -0
  96. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/__init__.py +0 -0
  97. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/auto/__init__.py +0 -0
  98. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/auto/auto_factory.py +0 -0
  99. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/auto/modeling_auto.py +0 -0
  100. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/bart/__init__.py +0 -0
  101. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/bart/bart_architecture.py +0 -0
  102. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/bart/modeling_bart.py +0 -0
  103. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/bert/__init__.py +0 -0
  104. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/bert/modeling_bert.py +0 -0
  105. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/clip/__init__.py +0 -0
  106. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/clip/modeling_clip.py +0 -0
  107. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/decoderonly/__init__.py +0 -0
  108. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +0 -0
  109. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/dpt/__init__.py +0 -0
  110. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/dpt/modeling_dpt.py +0 -0
  111. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/exaone/__init__.py +0 -0
  112. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/exaone/exaone_architecture.py +0 -0
  113. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/exaone/modeling_exaone.py +0 -0
  114. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/gemma/__init__.py +0 -0
  115. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/gemma/gemma_architecture.py +0 -0
  116. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/gemma/modeling_gemma.py +0 -0
  117. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/gpt2/__init__.py +0 -0
  118. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/gpt2/gpt2_architecture.py +0 -0
  119. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/gpt2/modeling_gpt2.py +0 -0
  120. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/llama/__init__.py +0 -0
  121. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/llama/llama_architecture.py +0 -0
  122. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/llama/modeling_llama.py +0 -0
  123. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/llava_next/__init__.py +0 -0
  124. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/llava_next/modeling_llava_next.py +0 -0
  125. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/midm/__init__.py +0 -0
  126. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/midm/midm_architecture.py +0 -0
  127. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/midm/modeling_midm.py +0 -0
  128. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/mistral/__init__.py +0 -0
  129. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/mistral/mistral_architecture.py +0 -0
  130. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/mistral/modeling_mistral.py +0 -0
  131. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/phi/__init__.py +0 -0
  132. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/phi/modeling_phi.py +0 -0
  133. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/phi/phi_architecture.py +0 -0
  134. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/qwen2/__init__.py +0 -0
  135. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/qwen2/modeling_qwen2.py +0 -0
  136. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/qwen2/qwen2_architecture.py +0 -0
  137. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/seq2seq/__init__.py +0 -0
  138. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py +0 -0
  139. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/t5/__init__.py +0 -0
  140. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/t5/modeling_t5.py +0 -0
  141. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/t5/t5_architecture.py +0 -0
  142. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/wav2vec2/__init__.py +0 -0
  143. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py +0 -0
  144. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/whisper/__init__.py +0 -0
  145. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/whisper/generation_whisper.py +0 -0
  146. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/whisper/modeling_whisper.py +0 -0
  147. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/whisper/whisper_architecture.py +0 -0
  148. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/xlm_roberta/__init__.py +0 -0
  149. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py +0 -0
  150. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/utils/__init__.py +0 -0
  151. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/transformers/utils/rbln_quantization.py +0 -0
  152. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/utils/__init__.py +0 -0
  153. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/utils/decorator_utils.py +0 -0
  154. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/utils/hub.py +0 -0
  155. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/utils/import_utils.py +0 -0
  156. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/utils/logging.py +0 -0
  157. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/utils/model_utils.py +0 -0
  158. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/utils/runtime_utils.py +0 -0
  159. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/utils/save_utils.py +0 -0
  160. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/src/optimum/rbln/utils/submodule.py +0 -0
  161. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/tests/__init__.py +0 -0
  162. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/tests/psnr.py +0 -0
  163. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/tests/requirements_sdxl.txt +0 -0
  164. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/tests/run_stable_diffusion_xl_base.py +0 -0
  165. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/tests/test_base.py +0 -0
  166. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/tests/test_diffusers.py +0 -0
  167. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/tests/test_llm.py +0 -0
  168. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/tests/test_transformers.py +0 -0
  169. {optimum_rbln-0.2.1a4 → optimum_rbln-0.2.1a5}/uv.lock +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: optimum-rbln
3
- Version: 0.2.1a4
3
+ Version: 0.2.1a5
4
4
  Summary: Optimum RBLN is the interface between the Hugging Face Transformers and Diffusers libraries and RBLN accelerators. It provides a set of tools enabling easy model loading and inference on single and multiple rbln device settings for different downstream tasks.
5
5
  Project-URL: Homepage, https://rebellions.ai
6
6
  Project-URL: Documentation, https://docs.rbln.ai
@@ -12,5 +12,5 @@ __version__: str
12
12
  __version_tuple__: VERSION_TUPLE
13
13
  version_tuple: VERSION_TUPLE
14
14
 
15
- __version__ = version = '0.2.1a4'
15
+ __version__ = version = '0.2.1a5'
16
16
  __version_tuple__ = version_tuple = (0, 2, 1)
@@ -442,8 +442,9 @@ class RBLNBaseModel(SubModulesMixin, PushToHubMixin, PreTrainedModel):
442
442
  logger.error(f"Provided path ({save_directory}) should be a directory, not a file")
443
443
  return
444
444
 
445
- real_save_dir = self.model_save_dir / self.subfolder
446
- save_directory_path = Path(save_directory)
445
+ # Normalize paths to handle relative paths and symlinks
446
+ real_save_dir = Path(self.model_save_dir).resolve() / self.subfolder
447
+ save_directory_path = Path(save_directory).resolve()
447
448
 
448
449
  if not os.path.exists(real_save_dir) or not os.path.isdir(real_save_dir):
449
450
  raise FileNotFoundError(
@@ -452,13 +453,13 @@ class RBLNBaseModel(SubModulesMixin, PushToHubMixin, PreTrainedModel):
452
453
  f"Please ensure the model directory exists and you have the necessary permissions to access it."
453
454
  )
454
455
 
455
- if save_directory_path.absolute() == real_save_dir.absolute():
456
+ if save_directory_path == real_save_dir:
456
457
  raise FileExistsError(
457
458
  f"Cannot save model to '{save_directory}'. This directory already exists and contains the model files."
458
459
  )
459
460
 
460
- # Create a temporary directory next to the target directory
461
- tmp_dir = save_directory + ".tmp"
461
+ # Create a temporary directory with normalized path
462
+ tmp_dir = str(save_directory_path) + ".tmp"
462
463
  try:
463
464
  # Remove temporary directory if it exists from a previous failed attempt
464
465
  if os.path.exists(tmp_dir):
@@ -473,9 +474,9 @@ class RBLNBaseModel(SubModulesMixin, PushToHubMixin, PreTrainedModel):
473
474
  self.generation_config.save_pretrained(tmp_dir)
474
475
 
475
476
  # If everything succeeded, atomically replace the target directory
476
- if os.path.exists(save_directory):
477
- shutil.rmtree(save_directory)
478
- os.rename(tmp_dir, save_directory)
477
+ if os.path.exists(save_directory_path):
478
+ shutil.rmtree(save_directory_path)
479
+ os.rename(tmp_dir, save_directory_path)
479
480
 
480
481
  except Exception as e:
481
482
  # Clean up the temporary directory if anything fails
@@ -484,7 +485,7 @@ class RBLNBaseModel(SubModulesMixin, PushToHubMixin, PreTrainedModel):
484
485
  raise e # Re-raise the exception after cleanup
485
486
 
486
487
  if push_to_hub:
487
- return super().push_to_hub(save_directory, **kwargs)
488
+ return super().push_to_hub(str(save_directory_path), **kwargs)
488
489
 
489
490
  @staticmethod
490
491
  def _raise_missing_compiled_file_error(missing_files: List[str]):
@@ -427,12 +427,14 @@ class DecoderOnlyModel(nn.Module):
427
427
  cos, sin = None, None
428
428
 
429
429
  # (batch, seq_len) -> (batch,)
430
- seq_positions = cache_position[:, 0]
431
430
  if self.attn_impl == "flash_attn":
431
+ seq_positions = cache_position[:, 0]
432
432
  max_seq_len = past_key_values[0][0].shape[-2]
433
433
  seq_positions = self.convert_sequence_positions_for_flash_attn(
434
434
  seq_positions=seq_positions, max_seq_len=max_seq_len
435
435
  )
436
+ else:
437
+ seq_positions = cache_position[:, :1]
436
438
 
437
439
  present_key_values = past_key_values
438
440
  for layer in self.layers:
@@ -459,7 +459,7 @@ class Seq2SeqSelfAttention(nn.Module):
459
459
  ), # Unsqueeze group axis since CustomKernel expects it for group query attention
460
460
  past_key_value[0].view(bsz, self.num_heads, 1, -1, self.head_dim),
461
461
  past_key_value[1].view(bsz, self.num_heads, 1, -1, self.head_dim),
462
- cache_position.squeeze(1),
462
+ cache_position,
463
463
  torch.tensor(1.0, dtype=torch.float32), # scale
464
464
  )
465
465
 
File without changes
File without changes
File without changes