optimum-rbln 0.7.5rc2__tar.gz → 0.8.0__tar.gz

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (252)
  1. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/workflows/rbln_optimum_pytest.yaml +1 -0
  2. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/PKG-INFO +1 -1
  3. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/__version__.py +2 -2
  4. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/gemma3/configuration_gemma3.py +6 -1
  5. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/gemma3/modeling_gemma3.py +0 -5
  6. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py +1 -2
  7. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/tests/test_llm.py +1 -54
  8. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
  9. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/ISSUE_TEMPLATE/config.yml +0 -0
  10. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
  11. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/ISSUE_TEMPLATE/model_request.md +0 -0
  12. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/pull_request_template.md +0 -0
  13. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/scripts/auto_code_review.py +0 -0
  14. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/scripts/validate_pr_checklist.py +0 -0
  15. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/version.yaml +0 -0
  16. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/workflows/auto_code_review.yml +0 -0
  17. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/workflows/check_code_quality.yml +0 -0
  18. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/workflows/deploy-on-tag.yaml +0 -0
  19. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/workflows/deploy.yaml +0 -0
  20. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/workflows/pr-title-check.yaml +0 -0
  21. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/workflows/pr_checklist_validator.yml +0 -0
  22. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/workflows/rbln_check_compiler.yaml +0 -0
  23. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/workflows/rbln_dispatch_pytest.yaml +0 -0
  24. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/workflows/rbln_optimum_inference_test.yaml +0 -0
  25. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/workflows/rbln_scheduled_test.yaml +0 -0
  26. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.github/workflows/rbln_trigger_on_pr.yaml +0 -0
  27. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/.gitignore +0 -0
  28. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/CODE_OF_CONDUCT.md +0 -0
  29. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/CONTRIBUTING.md +0 -0
  30. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/LICENSE +0 -0
  31. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/README.md +0 -0
  32. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/assets/rbln_logo.png +0 -0
  33. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/audio-classification/run_ast_audio_classification.py +0 -0
  34. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/depth-estimation/run_dpt.py +0 -0
  35. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/image-classification/run_image_classification.py +0 -0
  36. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/image-classification/run_vit_image_classification.py +0 -0
  37. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/image-to-text/run_idefics3.py +0 -0
  38. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/image-to-text/run_llava_next_image_to_text.py +0 -0
  39. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/kandinsky2_2/run_kandinsky2_2.py +0 -0
  40. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/kandinsky2_2/run_kandinsky2_2_combined.py +0 -0
  41. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/kandinsky2_2/run_kandinsky2_2_img2img.py +0 -0
  42. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/kandinsky2_2/run_kandinsky2_2_img2img_combined.py +0 -0
  43. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/kandinsky2_2/run_kandinsky2_2_inpaint.py +0 -0
  44. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/kandinsky2_2/run_kandinsky2_2_inpaint_combined.py +0 -0
  45. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/kandinsky2_2/run_kandinsky2_2_prior_interpolate.py +0 -0
  46. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/question-answering/run_question_answering.py +0 -0
  47. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/speech-recognition/run_wav2vec2.py +0 -0
  48. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/speech-recognition/run_whisper.py +0 -0
  49. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/stable-diffusion/run_stable_diffusion.py +0 -0
  50. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/stable-diffusion/run_stable_diffusion_controlnet.py +0 -0
  51. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/stable-diffusion/run_stable_diffusion_img2img.py +0 -0
  52. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/stable-diffusion/run_stable_diffusion_img2img_controlnet.py +0 -0
  53. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/stable-diffusion/run_stable_diffusion_inpaint.py +0 -0
  54. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/stable-diffusion/run_stable_diffusion_lora.py +0 -0
  55. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/stable-diffusion/run_stable_diffusion_multicontrolnet.py +0 -0
  56. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/text-classification/run_bge_m3_text_classification.py +0 -0
  57. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/text-classification/run_bge_reranker_v2_m3_text_classification.py +0 -0
  58. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/text-classification/run_secureBERT.py +0 -0
  59. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/text-classification/run_t5_classification.py +0 -0
  60. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/text-classification/run_twitter_roberta_text_classification.py +0 -0
  61. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/text2text-generation/run_bart_text2text_generation.py +0 -0
  62. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/text2text-generation/run_llama_peft.py +0 -0
  63. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/text2text-generation/run_llama_text2text_generation.py +0 -0
  64. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/examples/time-series-forecasting/run_time_series_forecasting.py +0 -0
  65. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/pyproject.toml +0 -0
  66. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/scripts/uv-lock.sh +0 -0
  67. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/scripts/uv-sync.sh +0 -0
  68. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/__init__.py +0 -0
  69. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/configuration_utils.py +0 -0
  70. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/__init__.py +0 -0
  71. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/__init__.py +0 -0
  72. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/models/__init__.py +0 -0
  73. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/models/configuration_autoencoder_kl.py +0 -0
  74. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/models/configuration_controlnet.py +0 -0
  75. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/models/configuration_prior_transformer.py +0 -0
  76. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/models/configuration_transformer_sd3.py +0 -0
  77. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/models/configuration_unet_2d_condition.py +0 -0
  78. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/models/configuration_vq_model.py +0 -0
  79. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/pipelines/__init__.py +0 -0
  80. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_controlnet.py +0 -0
  81. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_kandinsky2_2.py +0 -0
  82. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion.py +0 -0
  83. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_3.py +0 -0
  84. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/configurations/pipelines/configuration_stable_diffusion_xl.py +0 -0
  85. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/modeling_diffusers.py +0 -0
  86. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/models/__init__.py +0 -0
  87. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/models/autoencoders/__init__.py +0 -0
  88. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/models/autoencoders/autoencoder_kl.py +0 -0
  89. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/models/autoencoders/vae.py +0 -0
  90. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/models/autoencoders/vq_model.py +0 -0
  91. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/models/controlnet.py +0 -0
  92. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/models/transformers/__init__.py +0 -0
  93. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/models/transformers/prior_transformer.py +0 -0
  94. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/models/transformers/transformer_sd3.py +0 -0
  95. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/models/unets/__init__.py +0 -0
  96. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/models/unets/unet_2d_condition.py +0 -0
  97. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/__init__.py +0 -0
  98. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/controlnet/__init__.py +0 -0
  99. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py +0 -0
  100. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py +0 -0
  101. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +0 -0
  102. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +0 -0
  103. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +0 -0
  104. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/__init__.py +0 -0
  105. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2.py +0 -0
  106. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_combined.py +0 -0
  107. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_img2img.py +0 -0
  108. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_inpaint.py +0 -0
  109. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_prior.py +0 -0
  110. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/__init__.py +0 -0
  111. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py +0 -0
  112. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py +0 -0
  113. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_inpaint.py +0 -0
  114. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/__init__.py +0 -0
  115. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py +0 -0
  116. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py +0 -0
  117. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py +0 -0
  118. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/__init__.py +0 -0
  119. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py +0 -0
  120. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py +0 -0
  121. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py +0 -0
  122. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/modeling.py +0 -0
  123. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/modeling_base.py +0 -0
  124. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/ops/__init__.py +0 -0
  125. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/ops/attn.py +0 -0
  126. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/ops/flash_attn.py +0 -0
  127. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/ops/kv_cache_update.py +0 -0
  128. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/ops/linear.py +0 -0
  129. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/ops/sliding_window_attn.py +0 -0
  130. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/__init__.py +0 -0
  131. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/configuration_alias.py +0 -0
  132. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/configuration_generic.py +0 -0
  133. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/modeling_alias.py +0 -0
  134. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/modeling_generic.py +0 -0
  135. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/modeling_rope_utils.py +0 -0
  136. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/__init__.py +0 -0
  137. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/auto/__init__.py +0 -0
  138. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/auto/auto_factory.py +0 -0
  139. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/auto/modeling_auto.py +0 -0
  140. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/bart/__init__.py +0 -0
  141. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/bart/bart_architecture.py +0 -0
  142. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/bart/configuration_bart.py +0 -0
  143. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/bart/modeling_bart.py +0 -0
  144. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/bert/__init__.py +0 -0
  145. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/bert/configuration_bert.py +0 -0
  146. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/bert/modeling_bert.py +0 -0
  147. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/blip_2/__init__.py +0 -0
  148. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/blip_2/configuration_blip_2.py +0 -0
  149. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/blip_2/modeling_blip_2.py +0 -0
  150. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/clip/__init__.py +0 -0
  151. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/clip/configuration_clip.py +0 -0
  152. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/clip/modeling_clip.py +0 -0
  153. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/decoderonly/__init__.py +0 -0
  154. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/decoderonly/configuration_decoderonly.py +0 -0
  155. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py +0 -0
  156. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +0 -0
  157. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/dpt/__init__.py +0 -0
  158. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/dpt/configuration_dpt.py +0 -0
  159. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/dpt/modeling_dpt.py +0 -0
  160. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/exaone/__init__.py +0 -0
  161. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/exaone/configuration_exaone.py +0 -0
  162. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/exaone/exaone_architecture.py +0 -0
  163. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/exaone/modeling_exaone.py +0 -0
  164. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/gemma/__init__.py +0 -0
  165. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/gemma/configuration_gemma.py +0 -0
  166. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/gemma/gemma_architecture.py +0 -0
  167. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/gemma/modeling_gemma.py +0 -0
  168. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/gemma3/__init__.py +0 -0
  169. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/gemma3/gemma3_architecture.py +0 -0
  170. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/gpt2/__init__.py +0 -0
  171. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/gpt2/configuration_gpt2.py +0 -0
  172. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/gpt2/gpt2_architecture.py +0 -0
  173. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/gpt2/modeling_gpt2.py +0 -0
  174. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/idefics3/__init__.py +0 -0
  175. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/idefics3/configuration_idefics3.py +0 -0
  176. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/idefics3/modeling_idefics3.py +0 -0
  177. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/llama/__init__.py +0 -0
  178. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/llama/configuration_llama.py +0 -0
  179. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/llama/llama_architecture.py +0 -0
  180. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/llama/modeling_llama.py +0 -0
  181. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/llava_next/__init__.py +0 -0
  182. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/llava_next/configuration_llava_next.py +0 -0
  183. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/llava_next/modeling_llava_next.py +0 -0
  184. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/midm/__init__.py +0 -0
  185. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/midm/configuration_midm.py +0 -0
  186. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/midm/midm_architecture.py +0 -0
  187. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/midm/modeling_midm.py +0 -0
  188. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/mistral/__init__.py +0 -0
  189. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/mistral/configuration_mistral.py +0 -0
  190. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/mistral/mistral_architecture.py +0 -0
  191. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/mistral/modeling_mistral.py +0 -0
  192. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/opt/__init__.py +0 -0
  193. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/opt/configuration_opt.py +0 -0
  194. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/opt/modeling_opt.py +0 -0
  195. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/opt/opt_architecture.py +0 -0
  196. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/phi/__init__.py +0 -0
  197. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/phi/configuration_phi.py +0 -0
  198. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/phi/modeling_phi.py +0 -0
  199. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/phi/phi_architecture.py +0 -0
  200. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/qwen2/__init__.py +0 -0
  201. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/qwen2/configuration_qwen2.py +0 -0
  202. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/qwen2/modeling_qwen2.py +0 -0
  203. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/qwen2/qwen2_architecture.py +0 -0
  204. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/qwen2_5_vl/__init__.py +0 -0
  205. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/qwen2_5_vl/configuration_qwen2_5_vl.py +0 -0
  206. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/qwen2_5_vl/qwen2_5_vl_architecture.py +0 -0
  207. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/seq2seq/__init__.py +0 -0
  208. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/seq2seq/configuration_seq2seq2.py +0 -0
  209. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py +0 -0
  210. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/seq2seq/seq2seq_architecture.py +0 -0
  211. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/siglip/__init__.py +0 -0
  212. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/siglip/configuration_siglip.py +0 -0
  213. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/siglip/modeling_siglip.py +0 -0
  214. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/t5/__init__.py +0 -0
  215. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/t5/configuration_t5.py +0 -0
  216. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/t5/modeling_t5.py +0 -0
  217. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/t5/t5_architecture.py +0 -0
  218. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/time_series_transformers/__init__.py +0 -0
  219. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/time_series_transformers/configuration_time_series_transformer.py +0 -0
  220. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/time_series_transformers/modeling_time_series_transformers.py +0 -0
  221. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/time_series_transformers/time_series_transformers_architecture.py +0 -0
  222. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/wav2vec2/__init__.py +0 -0
  223. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/wav2vec2/configuration_wav2vec.py +0 -0
  224. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py +0 -0
  225. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/whisper/__init__.py +0 -0
  226. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/whisper/configuration_whisper.py +0 -0
  227. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/whisper/generation_whisper.py +0 -0
  228. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/whisper/modeling_whisper.py +0 -0
  229. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/whisper/whisper_architecture.py +0 -0
  230. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/xlm_roberta/__init__.py +0 -0
  231. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/xlm_roberta/configuration_xlm_roberta.py +0 -0
  232. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py +0 -0
  233. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/utils/__init__.py +0 -0
  234. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/transformers/utils/rbln_quantization.py +0 -0
  235. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/utils/__init__.py +0 -0
  236. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/utils/decorator_utils.py +0 -0
  237. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/utils/hub.py +0 -0
  238. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/utils/import_utils.py +0 -0
  239. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/utils/logging.py +0 -0
  240. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/utils/model_utils.py +0 -0
  241. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/utils/runtime_utils.py +0 -0
  242. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/utils/save_utils.py +0 -0
  243. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/src/optimum/rbln/utils/submodule.py +0 -0
  244. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/tests/__init__.py +0 -0
  245. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/tests/psnr.py +0 -0
  246. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/tests/requirements_sdxl.txt +0 -0
  247. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/tests/run_stable_diffusion_xl_base.py +0 -0
  248. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/tests/test_base.py +0 -0
  249. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/tests/test_config.py +0 -0
  250. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/tests/test_diffusers.py +0 -0
  251. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/tests/test_transformers.py +0 -0
  252. {optimum_rbln-0.7.5rc2 → optimum_rbln-0.8.0}/uv.lock +0 -0
@@ -25,6 +25,7 @@ env:
25
25
  REBEL_PYPI_ENDPOINT: ${{ vars.REBEL_PYPI_INTERNAL_ENDPOINT }}
26
26
  REBEL_PYPI_USERNAME: ${{ secrets.REBEL_PYPI_USERNAME }}
27
27
  REBEL_PYPI_PASSWORD: ${{ secrets.REBEL_PYPI_PASSWORD }}
28
+ HF_HOME: ${{ secrets.HF_HOME }}
28
29
 
29
30
  jobs:
30
31
  pytest:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: optimum-rbln
3
- Version: 0.7.5rc2
3
+ Version: 0.8.0
4
4
  Summary: Optimum RBLN is the interface between the HuggingFace Transformers and Diffusers libraries and RBLN accelerators. It provides a set of tools enabling easy model loading and inference on single and multiple rbln device settings for different downstream tasks.
5
5
  Project-URL: Homepage, https://rebellions.ai
6
6
  Project-URL: Documentation, https://docs.rbln.ai
@@ -17,5 +17,5 @@ __version__: str
17
17
  __version_tuple__: VERSION_TUPLE
18
18
  version_tuple: VERSION_TUPLE
19
19
 
20
- __version__ = version = '0.7.5rc2'
21
- __version_tuple__ = version_tuple = (0, 7, 5, 'rc2')
20
+ __version__ = version = '0.8.0'
21
+ __version_tuple__ = version_tuple = (0, 8, 0)
@@ -11,9 +11,10 @@
11
11
  # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
12
  # See the License for the specific language governing permissions and
13
13
  # limitations under the License.
14
-
15
14
  from typing import Optional
16
15
 
16
+ import rebel
17
+
17
18
  from ....configuration_utils import RBLNModelConfig
18
19
  from ..decoderonly.configuration_decoderonly import RBLNDecoderOnlyModelForCausalLMConfig
19
20
  from ..siglip.configuration_siglip import RBLNSiglipVisionModelConfig
@@ -39,6 +40,10 @@ class RBLNGemma3ForCausalLMConfig(RBLNDecoderOnlyModelForCausalLMConfig):
39
40
  **kwargs,
40
41
  )
41
42
 
43
+ npu = self.npu or rebel.get_npu_name()
44
+ if npu == "RBLN-CA02":
45
+ raise NotImplementedError("Gemma3 is currently not supported on RBLN-CA02")
46
+
42
47
 
43
48
  class RBLNGemma3ForConditionalGenerationConfig(RBLNModelConfig):
44
49
  submodules = ["vision_tower", "language_model"]
@@ -858,11 +858,6 @@ class RBLNGemma3ForCausalLM(RBLNDecoderOnlyModelForCausalLM):
858
858
  max_seq_len=rbln_config.max_seq_len,
859
859
  )
860
860
 
861
- if rbln_config.attn_impl == "eager":
862
- raise ValueError(
863
- "Eager attention is not supported for Gemma3. Please use flash attention by setting `rbln_attn_impl='flash_attn'`. Stay tuned for future updates!"
864
- )
865
-
866
861
  validate_attention_method(
867
862
  attn_impl=rbln_config.attn_impl,
868
863
  kvcache_partition_len=rbln_config.kvcache_partition_len,
@@ -595,9 +595,8 @@ class RBLNQwen2_5_VLForConditionalGeneration(RBLNDecoderOnlyModelForCausalLM):
595
595
  )
596
596
  logits.append(output.logits)
597
597
  logits = torch.cat(logits, dim=0)
598
- # Decoder
598
+ # Decoder
599
599
  else:
600
- print(input_ids[0], cache_position[0])
601
600
  inputs_embeds, position_embed = self._preprocess_decoder(input_ids, cache_position)
602
601
  output = self.decoder(
603
602
  inputs_embeds=inputs_embeds,
@@ -11,13 +11,10 @@ from transformers import AutoConfig, AutoProcessor, AutoTokenizer
11
11
  from optimum.rbln import (
12
12
  RBLNAutoModel,
13
13
  RBLNAutoModelForCausalLM,
14
- RBLNAutoModelForImageTextToText,
15
14
  RBLNAutoModelForSeq2SeqLM,
16
15
  RBLNAutoModelForVision2Seq,
17
16
  RBLNBartForConditionalGeneration,
18
17
  RBLNExaoneForCausalLM,
19
- RBLNGemma3ForCausalLM,
20
- RBLNGemma3ForConditionalGeneration,
21
18
  RBLNGPT2LMHeadModel,
22
19
  RBLNIdefics3ForConditionalGeneration,
23
20
  RBLNLlamaForCausalLM,
@@ -68,7 +65,7 @@ class LLMTest:
68
65
  class TestQwen2Model(LLMTest.TestLLM):
69
66
  RBLN_CLASS = RBLNQwen2ForCausalLM
70
67
  HF_MODEL_ID = "Qwen/Qwen2-0.5B-Instruct"
71
- EXPECTED_OUTPUT = " I am a 30-year-old woman who has been living with a chronic illness for the past"
68
+ EXPECTED_OUTPUT = " I am a 30-year-old woman who has been living with lupus for over 1"
72
69
  HF_CONFIG_KWARGS = {"max_position_embeddings": 1024}
73
70
 
74
71
 
@@ -395,55 +392,5 @@ class TestDisallowedLlama_4(DisallowedTestBase.DisallowedTest):
395
392
  RBLN_CLASS_KWARGS = {"rbln_config": {"attn_impl": "flash_attn", "kvcache_partition_len": 1024}}
396
393
 
397
394
 
398
- class TestGemma3ForConditionalGeneration(LLMTest.TestLLM):
399
- RBLN_AUTO_CLASS = RBLNAutoModelForImageTextToText
400
- RBLN_CLASS = RBLNGemma3ForConditionalGeneration
401
- HF_MODEL_ID = "google/gemma-3-4b-it" # No tiny model yet.
402
- PROMPT = "<bos><start_of_turn>user\n<start_of_image>Describe the image.<end_of_turn>\n<start_of_turn>model\n'"
403
- RBLN_CLASS_KWARGS = {"rbln_config": {"language_model": {"use_inputs_embeds": True, "kvcache_partition_len": 4096}}}
404
- EXPECTED_OUTPUT = "ִיсмотрятОднакоettingiPadaenуdenlyticsinท์नियमितinท์नियमित"
405
-
406
- @classmethod
407
- def get_tokenizer(cls):
408
- if cls._tokenizer is None:
409
- cls._tokenizer = AutoProcessor.from_pretrained(cls.HF_MODEL_ID)
410
- return cls._tokenizer
411
-
412
- # override
413
- @classmethod
414
- def setUpClass(cls):
415
- config = AutoConfig.from_pretrained(cls.HF_MODEL_ID)
416
- text_config = json.loads(config.text_config.to_json_string())
417
- text_config["num_hidden_layers"] = 2
418
- text_config["sliding_window_pattern"] = 2
419
- vision_config = json.loads(config.vision_config.to_json_string())
420
- vision_config["num_hidden_layers"] = 1
421
- kwargs = {"text_config": text_config, "vision_config": vision_config}
422
- cls.HF_CONFIG_KWARGS.update(kwargs)
423
- return super().setUpClass()
424
-
425
- def get_inputs(self):
426
- tokenizer = self.get_tokenizer()
427
- img_path = f"{os.path.dirname(__file__)}/../assets/rbln_logo.png"
428
- image = Image.open(img_path)
429
- image = image.convert("RGB")
430
- inputs = tokenizer(images=[image], text=[self.PROMPT], return_tensors="pt", padding=True)
431
- inputs["max_new_tokens"] = 20
432
- inputs["do_sample"] = False
433
- return inputs
434
-
435
-
436
- class TestGemma3ForCausalLM(LLMTest.TestLLM):
437
- RBLN_CLASS = RBLNGemma3ForCausalLM
438
- HF_MODEL_ID = "google/gemma-3-1b-it"
439
- EXPECTED_OUTPUT = "1st L L L L L L L L L L L L L L L L L L"
440
- HF_CONFIG_KWARGS = {
441
- "num_hidden_layers": 2,
442
- "sliding_window_pattern": 2,
443
- "max_position_embeddings": 1024,
444
- "trust_remote_code": True,
445
- }
446
-
447
-
448
395
  if __name__ == "__main__":
449
396
  unittest.main()
File without changes
File without changes
File without changes