optimum-rbln 0.1.13__py3-none-any.whl → 0.1.15__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (79) hide show
  1. optimum/rbln/__init__.py +22 -12
  2. optimum/rbln/__version__.py +16 -1
  3. optimum/rbln/diffusers/__init__.py +22 -2
  4. optimum/rbln/diffusers/models/__init__.py +34 -3
  5. optimum/rbln/{transformers/generation → diffusers/models/autoencoders}/__init__.py +1 -2
  6. optimum/rbln/diffusers/models/{autoencoder_kl.py → autoencoders/autoencoder_kl.py} +44 -58
  7. optimum/rbln/diffusers/models/autoencoders/vae.py +84 -0
  8. optimum/rbln/diffusers/models/controlnet.py +54 -14
  9. optimum/rbln/diffusers/models/transformers/__init__.py +24 -0
  10. optimum/rbln/diffusers/models/transformers/transformer_sd3.py +203 -0
  11. optimum/rbln/diffusers/models/unets/__init__.py +24 -0
  12. optimum/rbln/diffusers/models/{unet_2d_condition.py → unets/unet_2d_condition.py} +78 -16
  13. optimum/rbln/diffusers/pipelines/__init__.py +22 -2
  14. optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py +5 -26
  15. optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +1 -0
  16. optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +1 -0
  17. optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +1 -0
  18. optimum/rbln/diffusers/pipelines/stable_diffusion/__init__.py +1 -0
  19. optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py +1 -0
  20. optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py +0 -11
  21. optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_inpaint.py +32 -0
  22. optimum/rbln/diffusers/pipelines/stable_diffusion_3/__init__.py +26 -0
  23. optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py +32 -0
  24. optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py +32 -0
  25. optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py +32 -0
  26. optimum/rbln/diffusers/pipelines/stable_diffusion_xl/__init__.py +1 -0
  27. optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py +14 -6
  28. optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py +14 -6
  29. optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py +32 -0
  30. optimum/rbln/modeling.py +572 -0
  31. optimum/rbln/modeling_alias.py +1 -1
  32. optimum/rbln/modeling_base.py +164 -758
  33. optimum/rbln/modeling_diffusers.py +51 -122
  34. optimum/rbln/transformers/__init__.py +0 -2
  35. optimum/rbln/transformers/models/auto/auto_factory.py +117 -23
  36. optimum/rbln/transformers/models/auto/modeling_auto.py +37 -12
  37. optimum/rbln/transformers/models/bart/modeling_bart.py +3 -6
  38. optimum/rbln/transformers/models/bert/modeling_bert.py +3 -6
  39. optimum/rbln/transformers/models/clip/modeling_clip.py +8 -25
  40. optimum/rbln/transformers/models/decoderonly/__init__.py +0 -3
  41. optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py +672 -412
  42. optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py +38 -155
  43. optimum/rbln/transformers/models/dpt/modeling_dpt.py +1 -1
  44. optimum/rbln/transformers/models/exaone/exaone_architecture.py +61 -45
  45. optimum/rbln/transformers/models/exaone/modeling_exaone.py +4 -2
  46. optimum/rbln/transformers/models/gemma/gemma_architecture.py +33 -104
  47. optimum/rbln/transformers/models/gpt2/gpt2_architecture.py +50 -238
  48. optimum/rbln/transformers/models/gpt2/modeling_gpt2.py +3 -2
  49. optimum/rbln/transformers/models/llava_next/modeling_llava_next.py +2 -75
  50. optimum/rbln/transformers/models/midm/midm_architecture.py +88 -242
  51. optimum/rbln/transformers/models/midm/modeling_midm.py +6 -6
  52. optimum/rbln/transformers/models/phi/phi_architecture.py +61 -261
  53. optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py +1 -46
  54. optimum/rbln/transformers/models/t5/modeling_t5.py +102 -4
  55. optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py +1 -1
  56. optimum/rbln/transformers/models/whisper/modeling_whisper.py +1 -1
  57. optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py +3 -35
  58. optimum/rbln/transformers/utils/rbln_quantization.py +120 -3
  59. optimum/rbln/utils/decorator_utils.py +10 -6
  60. optimum/rbln/utils/hub.py +131 -0
  61. optimum/rbln/utils/import_utils.py +15 -1
  62. optimum/rbln/utils/model_utils.py +53 -0
  63. optimum/rbln/utils/runtime_utils.py +1 -1
  64. optimum/rbln/utils/submodule.py +114 -0
  65. optimum_rbln-0.1.15.dist-info/METADATA +106 -0
  66. {optimum_rbln-0.1.13.dist-info → optimum_rbln-0.1.15.dist-info}/RECORD +69 -66
  67. {optimum_rbln-0.1.13.dist-info → optimum_rbln-0.1.15.dist-info}/WHEEL +1 -1
  68. optimum/rbln/transformers/generation/streamers.py +0 -139
  69. optimum/rbln/transformers/generation/utils.py +0 -397
  70. optimum/rbln/transformers/models/exaone/hf_hub_cached/configuration_exaone.py +0 -181
  71. optimum/rbln/transformers/models/exaone/hf_hub_cached/modeling_exaone.py +0 -1725
  72. optimum/rbln/transformers/models/midm/hf_hub_cached/configuration_midm.py +0 -22
  73. optimum/rbln/transformers/models/midm/hf_hub_cached/midm_bitext_tokenization.py +0 -304
  74. optimum/rbln/transformers/models/midm/hf_hub_cached/modeling_midm.py +0 -1469
  75. optimum/rbln/transformers/models/midm/hf_hub_cached/rotary_position_embedding.py +0 -98
  76. optimum/rbln/utils/context.py +0 -58
  77. optimum_rbln-0.1.13.dist-info/METADATA +0 -120
  78. optimum_rbln-0.1.13.dist-info/entry_points.txt +0 -4
  79. {optimum_rbln-0.1.13.dist-info → optimum_rbln-0.1.15.dist-info}/licenses/LICENSE +0 -0
@@ -1,107 +1,110 @@
1
- optimum/rbln/__init__.py,sha256=QcWA83wvYEp0MGNvxP8_nMziofD0MZNGCt73KLheOhY,6459
2
- optimum/rbln/__version__.py,sha256=jGw4tQiBX4GF6k-kjNLN011jLkBRZrHCX6wC2au3JJ8,22
3
- optimum/rbln/diffusers/__init__.py,sha256=w4W7Wy-Mmh8CQZ5M9JnrrE5bN0UsfNehZI41QadE-hk,2605
4
- optimum/rbln/diffusers/models/__init__.py,sha256=aY6Llq_31dZjdB9HPBDvi7sXVtdQT9r11gokXG5ffxA,1139
5
- optimum/rbln/diffusers/models/autoencoder_kl.py,sha256=Nqczw1nn1azoiTlBCbmjfLx2uJ4leVfJpOWiHnvXriM,8373
6
- optimum/rbln/diffusers/models/controlnet.py,sha256=Nlp1l1X_F2sOa3nO1O4S2i7LQJRYUFaOUWIASyVJTtM,8607
7
- optimum/rbln/diffusers/models/unet_2d_condition.py,sha256=Bi0KzXR6pBqhHZotiD21p1t2xCztM_JLRa7rByxJ80Y,11250
8
- optimum/rbln/diffusers/pipelines/__init__.py,sha256=M-I5HSUN7YTiY1zfaKxDPjxFzBTYi5fRwru_dI1z2Fw,2289
1
+ optimum/rbln/__init__.py,sha256=rjaGo_lPR8m4RwnTYuLTOL15KNRKXbD2EGn7j_STXIg,6895
2
+ optimum/rbln/__version__.py,sha256=ZKlmJ822TJ49YEqc2wCAMbrp81vFvzcFa9OTia84voM,413
3
+ optimum/rbln/modeling.py,sha256=GpTLugUsFx5qTjyENwR7263naVZrMugtoVvWFEaQLzQ,23788
4
+ optimum/rbln/modeling_alias.py,sha256=Z9vGv6ca82_mhbYclxIZ6e8jt-gf07g--k3ljdQvtGo,2128
5
+ optimum/rbln/modeling_base.py,sha256=TPcJ8JhFvWepIrmPuMQp_IKLWlTmvy2Wb99rhoz_YDk,19755
6
+ optimum/rbln/modeling_config.py,sha256=va58Gpbn3rolqKu9y2u3vYVT6kynBGpox_jod6cs-j0,10612
7
+ optimum/rbln/modeling_diffusers.py,sha256=VabNyhVN5s8M_fCx18SkR9hAfJqfXBZwz1m4Sl9Yihg,14138
8
+ optimum/rbln/diffusers/__init__.py,sha256=jad5hGtgXfP6ZZzYI4uBnb1Qbt6TwfEIJjFOtdNzCgc,3187
9
+ optimum/rbln/diffusers/models/__init__.py,sha256=CKgWCqCEPrAc-l5SxKcwu7TadkSGvqkpNqpwrXZVv90,1749
10
+ optimum/rbln/diffusers/models/controlnet.py,sha256=rIYshEXkBqAGh7cOpfu2quffVHNJj9SQ-ATsgQkre5o,10889
11
+ optimum/rbln/diffusers/models/autoencoders/__init__.py,sha256=yc1ABZG3xxzWPDGf0ADEeuSz3Nrq4ZP-CwddQ-VvWCU,1039
12
+ optimum/rbln/diffusers/models/autoencoders/autoencoder_kl.py,sha256=EoI8EQYYS0SA4wurM3I2shs5Z6MA-YEXohoxDg40LrE,8554
13
+ optimum/rbln/diffusers/models/autoencoders/vae.py,sha256=Ys802twDAnNIMVRp-lL3Rhb8Gh-jot0IFCLBm68FrK8,2889
14
+ optimum/rbln/diffusers/models/transformers/__init__.py,sha256=2bVk_6nuqcREOIVyR-4w5ksmdWJqyIV7Wxc5x0dqYO8,1048
15
+ optimum/rbln/diffusers/models/transformers/transformer_sd3.py,sha256=C_50IkKUYnpCbRlsTsX07PVI5RLRgnouQyISvZhlVOg,7684
16
+ optimum/rbln/diffusers/models/unets/__init__.py,sha256=-0PyRbBVBFujd7nBh0Z4NOe3RVOlAWyvWLU8r62dqdo,1049
17
+ optimum/rbln/diffusers/models/unets/unet_2d_condition.py,sha256=p-obj4tVxBkQMS8W1On8oFrLK-TXCo3Zksw1bOBXRPw,14467
18
+ optimum/rbln/diffusers/pipelines/__init__.py,sha256=M6UtFsGnGKYnuHkuJnfyR5WzajAgUidVUNGaqLBS6bM,2862
9
19
  optimum/rbln/diffusers/pipelines/controlnet/__init__.py,sha256=k0govvSBxBUR5qpxUGxRMHuQCMX7hXHVZ4EqVRw1LWk,1377
10
- optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py,sha256=qm5EtOEtp2LMLlyT61CVj8jChCXPI49mwtLGbmqZVWg,5365
20
+ optimum/rbln/diffusers/pipelines/controlnet/multicontrolnet.py,sha256=OnOvqnNCK1WrnU7JH93GSmEdMRW8Z2__eorYaj-zHAw,4424
11
21
  optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet.py,sha256=xlfDdKxgIK1DvIQAbOipA00LAMni8f7z8urpeOAyEkE,34884
12
- optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py,sha256=_r1B2xasytCUcth4fUF4RNVdVt5zHlnw9hszWY9DkrI,33307
13
- optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py,sha256=KwfoTDpZCJ6Y8e_v5ZEc7HAEly9KzoW-N9IdcGTjwC0,44409
14
- optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py,sha256=Xa8spvzhmj9rToseCX5hP6Dv3w7z9xFpXQf1BEvIInQ,45715
15
- optimum/rbln/diffusers/pipelines/stable_diffusion/__init__.py,sha256=qf_uMWSwD-CyRMRC73y1QsTMyl_qCMreIdg0a8rhJuA,1142
16
- optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py,sha256=gt1h5zg4258NeKfvfmMlJVECOex8Lqw5jN9NkoF3Xuk,1317
17
- optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py,sha256=SpT38WG4uYRrWa57PRT8o2Dq8lnR5zewL6umprsAEP0,1958
18
- optimum/rbln/diffusers/pipelines/stable_diffusion_xl/__init__.py,sha256=8MDMHIVsDrM6lZAyvpjFtWOFwiY_IoSxzCQe-gJYTPI,159
19
- optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py,sha256=GyaOv18zZlPImCQLpkGnEGPokAsmkxlFLUWRoDhiB4s,1024
20
- optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py,sha256=jUEjw64Oh29_wI7OzoV7LdTfsetcQj-aeRBl-gN_nHM,1052
21
- optimum/rbln/modeling.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
22
- optimum/rbln/modeling_alias.py,sha256=lvyUxIrrXWgV2o0ymbeFkhz_ou8S9_CRRfQ_EfAvQZU,2133
23
- optimum/rbln/modeling_base.py,sha256=S6kbesSHzE0XtYqB5A72j07dfYUGVyQzf91X65GdZnw,44094
24
- optimum/rbln/modeling_config.py,sha256=va58Gpbn3rolqKu9y2u3vYVT6kynBGpox_jod6cs-j0,10612
25
- optimum/rbln/modeling_diffusers.py,sha256=3DiPbbgB9YzU9SrR58DZfdBfL7sSuLQJiPWrubXFA2A,17816
26
- optimum/rbln/transformers/__init__.py,sha256=Ga_NISWJftvExXepKjXCcNHQs5Ogw0Y60MLLIl9csbI,3859
22
+ optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py,sha256=C9DwjPiNSQanqNNWiOHJvw3yZtL8tR4YaQZwVkC02_o,33369
23
+ optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py,sha256=QvoS7g3dfZ3b1Fq1taIfRBf9kNpoR0jsv-H97hXNQ4A,44466
24
+ optimum/rbln/diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py,sha256=hHkNKnBsSGdHeFjf45zIpum0DE6JRcw_NEYFLYYmxSg,45779
25
+ optimum/rbln/diffusers/pipelines/stable_diffusion/__init__.py,sha256=7lX6f9XiqROsArw1X0lGsW06H0TrWKwvM9Ye16vis9Y,1224
26
+ optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py,sha256=33LQR11kryvQqfQ0Srl8O8QqRsfJnKYUZAQHHSruKTY,1362
27
+ optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py,sha256=WJ4pRfmE0DIAQANXoytoeVyKBa750j-f5oKOHLUmoyY,1390
28
+ optimum/rbln/diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_inpaint.py,sha256=DaXqP_2oik-L7LitAXtaiMqcOZixOui67BWSU_qoxu4,1397
29
+ optimum/rbln/diffusers/pipelines/stable_diffusion_3/__init__.py,sha256=I1IbI4uo2ZqA2uLbhqW67wW7-8DwqeE-qPGc3BTL7dQ,1233
30
+ optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py,sha256=Hb4cGwz422jWvFefTfrPMSt7__KEdlrq41OjiSpNtFo,1410
31
+ optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py,sha256=hQUAMqQn62-aezWlwscyJu6QlXjXByJ-NXnrvYVIpRk,1445
32
+ optimum/rbln/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py,sha256=8PorhGURHd01eob_4pkZhH6azjqk77FS2xZFnBED5Yg,1445
33
+ optimum/rbln/diffusers/pipelines/stable_diffusion_xl/__init__.py,sha256=giP9dJokdRT4-a5wdJqA1qW8os5Zz0huCack8nlcyxs,246
34
+ optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py,sha256=XeeZqH63No7NPIXKXgv8Vxq_I0-iql4jHJ0sIkbYSvw,1390
35
+ optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py,sha256=o1WTLCFjsDZAtGZ84cykU0F4Qw_iMP0g7jaPw1xobP0,1418
36
+ optimum/rbln/diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py,sha256=aozAYG2mba2G9ITspDVuos-eWy0MoxlwnVtxGgtN7zk,1425
37
+ optimum/rbln/transformers/__init__.py,sha256=H__SYW4dhcFb02euqtfFZx212QZxkmKu4kgd2sBtVAs,3756
27
38
  optimum/rbln/transformers/cache_utils.py,sha256=Ak6yJlzkXsu5jQ-kWIgO97GrsLpoCezpEgQoZnvjmec,3796
28
- optimum/rbln/transformers/generation/__init__.py,sha256=6MmqS9D21ir4dcH6_fq8kRsX1VK3QspSn6Qw83F4ORE,1081
29
- optimum/rbln/transformers/generation/streamers.py,sha256=X-dEmL1L_0Oy0QSFj2RNdamb_xbDWLXd-Ms8ckx6OZ4,5778
30
- optimum/rbln/transformers/generation/utils.py,sha256=XqPbYQCe6cEuWssG9iHpbbL-wgSQTcyKHabGwKj7lnE,19462
31
39
  optimum/rbln/transformers/modeling_rope_utils.py,sha256=ob8haNW5f0tPq26xd4sTg-rMrBT9M2VDP7wxt-PkvYY,13087
32
40
  optimum/rbln/transformers/models/__init__.py,sha256=gffOrFFYG3W8ypxpDiUotU-McvjhytffeuUzunjv4nQ,3971
33
41
  optimum/rbln/transformers/models/auto/__init__.py,sha256=zMqaMIdGwuZJq4gLjRC-69M2mGUKrd0aRpmb4Rpm6-g,435
34
- optimum/rbln/transformers/models/auto/auto_factory.py,sha256=Up052AXID12uqa5UgLRW89EkYXDpuXR70Bt-xNHEZto,3159
35
- optimum/rbln/transformers/models/auto/modeling_auto.py,sha256=zET3k5GiqREvPuc_d9Sauea7rITlP6Wl32xdlCFqdhY,3165
42
+ optimum/rbln/transformers/models/auto/auto_factory.py,sha256=JIFL404RVf6kAONhLeEz6z59tdahcUAyVSU8hdZZe0g,7421
43
+ optimum/rbln/transformers/models/auto/modeling_auto.py,sha256=DDx8ZUpWPtTr8ZNv7cO_dUgJtDLXjax7gdxwc-wkkgQ,4328
36
44
  optimum/rbln/transformers/models/bart/__init__.py,sha256=-mrB4kmPpEIVk713yEIRtC57AZ7kZ23g4bsOKcvBFNE,1138
37
45
  optimum/rbln/transformers/models/bart/bart_architecture.py,sha256=W6XeumvuKv1i7p4YzKM0NgpO3NCnc1qwGXknZZrPlP0,21298
38
- optimum/rbln/transformers/models/bart/modeling_bart.py,sha256=-ulamfBSlXDL67Q1Bzo4Q8sGuuzJBjut9XPRTeQhCbA,5261
46
+ optimum/rbln/transformers/models/bart/modeling_bart.py,sha256=xzZZf-yZdUkq4F271Wfd1l-Hnm4jjgf_yy6hjVohxbo,5144
39
47
  optimum/rbln/transformers/models/bert/__init__.py,sha256=divBpVNrRAdNAPgnQkGiEZI4oJHCJtLuwdYpMbD3dMM,1034
40
- optimum/rbln/transformers/models/bert/modeling_bert.py,sha256=F5FKVgiIBdDFq-Ql8AmE0WT_mjL0gFfr1AGE_frTexs,4228
48
+ optimum/rbln/transformers/models/bert/modeling_bert.py,sha256=akbsBTsGTs7wrxPw120ryZspwYkmHAUrM4A8Kr3COw4,4111
41
49
  optimum/rbln/transformers/models/clip/__init__.py,sha256=iXZfPPIztzMDOkY3fbEzx9dCkFKKtWYXCpLGfjEUeZE,1092
42
- optimum/rbln/transformers/models/clip/modeling_clip.py,sha256=vLT8u13wrW64CnQRF7r94Eb6-dAcYiemLOLjJxMuMDA,6679
43
- optimum/rbln/transformers/models/decoderonly/__init__.py,sha256=-t8W6DtDa9z6FhDtEYuVbA9Ke71EZpJstJAEVPyZLk0,1299
44
- optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py,sha256=iYYey7UGA7DhNkun8Zocfgp3yVr4iFOoZ6loAsqou1o,27560
45
- optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py,sha256=o2G5r5_P1eT3Kg10CO5VvEVEKIqb30JGZiQZpVugRwo,29814
50
+ optimum/rbln/transformers/models/clip/modeling_clip.py,sha256=DI_N-bQcA_Kj7NSkv9VPvV1zsN6IscctVczE_2_ZkVM,6089
51
+ optimum/rbln/transformers/models/decoderonly/__init__.py,sha256=ozc0c3XBI3-5VHhGvZ0zcv6TD-kIXpDCqsAvdW3JSaY,1222
52
+ optimum/rbln/transformers/models/decoderonly/decoderonly_architecture.py,sha256=ratAjwMF3eiHTaXwPNqHqWzmkGEC5fG37xP4mGJOMI8,36833
53
+ optimum/rbln/transformers/models/decoderonly/modeling_decoderonly.py,sha256=esQp936mlHuAjb1A75jepyB3QVXsUR7a5WgVUhV7wJw,26132
46
54
  optimum/rbln/transformers/models/dpt/__init__.py,sha256=R8OHDxOAYPjkk5t8osaPqRh85Pf1Cg1BtzqesqFRcTI,1045
47
- optimum/rbln/transformers/models/dpt/modeling_dpt.py,sha256=pKQ2vmR50GyEyKK0aV7p33PqTuksiorDhC0cH5qUYiw,3810
55
+ optimum/rbln/transformers/models/dpt/modeling_dpt.py,sha256=Re15veJwAz3NaUv2GfrHyGUblW0Jcd2KLv23GutFp64,3805
48
56
  optimum/rbln/transformers/models/exaone/__init__.py,sha256=CuWNwnZrbd_cLU7jDDPqC0kZIqx1ii_BYyQ98CKDag0,1253
49
- optimum/rbln/transformers/models/exaone/exaone_architecture.py,sha256=jBrEohavlSgQz_mBnfnG3KJk23oqzKZbqNQ0CImZdUI,3051
50
- optimum/rbln/transformers/models/exaone/hf_hub_cached/configuration_exaone.py,sha256=cKtUHugxwnbR6JOtD2a0912a2iepRpX9dEAWDeSu194,10537
51
- optimum/rbln/transformers/models/exaone/hf_hub_cached/modeling_exaone.py,sha256=CUd-z7f-BMIe8WPRVx-u5A60ljW2C6u8CzrAuw__d5M,80983
52
- optimum/rbln/transformers/models/exaone/modeling_exaone.py,sha256=x-yrv1SObC3GjgHvTRbbVzhA7Xj3QPE2RVkqoBixOI4,2155
57
+ optimum/rbln/transformers/models/exaone/exaone_architecture.py,sha256=sf0GF35u2AtyadR6WLxaau_0-JKusSomtfh0ILQMras,3528
58
+ optimum/rbln/transformers/models/exaone/modeling_exaone.py,sha256=-0VjxpBOQLM3PAmrWCJXkTKQEap577bS_izn-gx8Ew8,2141
53
59
  optimum/rbln/transformers/models/gemma/__init__.py,sha256=L1Qfr6dufWtoUZND_ofwxXPSxivEvPR8exy16a_nM2o,1042
54
- optimum/rbln/transformers/models/gemma/gemma_architecture.py,sha256=3OFXjt4E4uUXiXVS5Y0ts-Unj-Mvyu9EjZfTQJtUiLk,5002
60
+ optimum/rbln/transformers/models/gemma/gemma_architecture.py,sha256=4irFBUeL1rEnHl-r5be_doz4QaqDN3jYZMcN1aHMLYo,2317
55
61
  optimum/rbln/transformers/models/gemma/modeling_gemma.py,sha256=floBHXgogv3iAPyjhjKzbjFHeH67L3FYUKs_wtRm-gM,1924
56
62
  optimum/rbln/transformers/models/gpt2/__init__.py,sha256=jsOKYXUclG9G6cwUTUX4eeKqjCPfQUwev7TTFIMXS4Y,1040
57
- optimum/rbln/transformers/models/gpt2/gpt2_architecture.py,sha256=nXCITctShY2OTw7chGGSdIOECv8zAd-sxqbYuvSuoK8,10410
58
- optimum/rbln/transformers/models/gpt2/modeling_gpt2.py,sha256=uKVDrfQb1O6HSrAH1e1evthG0AMW1I78JpLQDeaDRzI,1878
63
+ optimum/rbln/transformers/models/gpt2/gpt2_architecture.py,sha256=w4dAVeubsNkGtcapknwyyQ5VevWPTWETg4M6Y_tZ9UI,3359
64
+ optimum/rbln/transformers/models/gpt2/modeling_gpt2.py,sha256=uz29eh8bLWxsm8pVHwvA-X8FThW2khSO-Rjysp3RoQk,1910
59
65
  optimum/rbln/transformers/models/llama/__init__.py,sha256=5mX-MuKzVBj6WQeVxyPhtvFTv0jeZXAFfg4RZ2nVUh0,1042
60
66
  optimum/rbln/transformers/models/llama/llama_architecture.py,sha256=j4mifSOaIk7wwV9fL9wQSt5kR3rpnvjtxd3VzhMNdgY,1123
61
67
  optimum/rbln/transformers/models/llama/modeling_llama.py,sha256=D9efkBVUr7TaOkAkiN_qrtQC0AyzLK7cb7UbZpo4XwI,1924
62
68
  optimum/rbln/transformers/models/llava_next/__init__.py,sha256=3vi2rmTeKBydGRFOtxELhxWixZggFMpGex6xqfMgi-I,1064
63
- optimum/rbln/transformers/models/llava_next/modeling_llava_next.py,sha256=Bdza5gOwBIxCzfdVHmGcMY9zQQ6qZ4yCOzGVrbfPVWA,28863
69
+ optimum/rbln/transformers/models/llava_next/modeling_llava_next.py,sha256=Rkpso3eQ1tHXpfLdRUayut4X3J9zsXjF2in4UVN1Yhs,25883
64
70
  optimum/rbln/transformers/models/midm/__init__.py,sha256=_6kYchy47frGMZ8uoUspZ9IwrmCBQJ-8kVfXM7xOMew,1249
65
- optimum/rbln/transformers/models/midm/hf_hub_cached/configuration_midm.py,sha256=P5JqTTcx56HOccxKbR14ZjA67BI0RNnJycG738JMaJ4,833
66
- optimum/rbln/transformers/models/midm/hf_hub_cached/midm_bitext_tokenization.py,sha256=5lhMXfqnIak1PJ9YL-vUxIdY_3DUr3IBXzTqf3ofpmI,12835
67
- optimum/rbln/transformers/models/midm/hf_hub_cached/modeling_midm.py,sha256=54__wd9EXwGxmaHDksTTcUD2aWl6WoszYsR8dlL1wfE,61031
68
- optimum/rbln/transformers/models/midm/hf_hub_cached/rotary_position_embedding.py,sha256=5ywaUVKTvqO8GRsHOSXOOGlbiEn-DbGkpJs59_dFb18,4059
69
- optimum/rbln/transformers/models/midm/midm_architecture.py,sha256=DCYf7TdvzGe-rn4Qr6feFqfZHJE4uqsExenq3SuQngw,11107
70
- optimum/rbln/transformers/models/midm/modeling_midm.py,sha256=HPWax1NWJ90OzqluuPDVTe5aru3DR41wQ76HZy8FnQY,2154
71
+ optimum/rbln/transformers/models/midm/midm_architecture.py,sha256=PwGwHaYCHmJ4DRvlieVK_IzsZgG79_n-Y8kQs5NwT0A,5790
72
+ optimum/rbln/transformers/models/midm/modeling_midm.py,sha256=NB1Ie2GN9Ilisd9CMIbENRiTtUV0pK3eTStbuz0yQBg,2129
71
73
  optimum/rbln/transformers/models/mistral/__init__.py,sha256=XtuOmzBITjj-H1yctXobJjHF908x1Wlxr_p4hi06v8I,1046
72
74
  optimum/rbln/transformers/models/mistral/mistral_architecture.py,sha256=LCvY4L0Wq1VruKhZ3JTSiuZJqQRJlTae5A2bKsUBGAg,1128
73
75
  optimum/rbln/transformers/models/mistral/modeling_mistral.py,sha256=i3X3HKGNee2ocEmpxdHMxuq7UAOgUs-QWlq2OizqA4g,1954
74
76
  optimum/rbln/transformers/models/phi/__init__.py,sha256=LrGFTUo1oQnsPSTlxJqAJVVNUdUwq4u_Bf60RUgjLz4,1038
75
77
  optimum/rbln/transformers/models/phi/modeling_phi.py,sha256=JfpuUB6cign-lqcUoprgq3gbQclZFT9HGV-NYVkSads,1910
76
- optimum/rbln/transformers/models/phi/phi_architecture.py,sha256=iCAIicuN-YFG02ZOT6-VN5ZMw_saNryXAFmh10DKGfs,12777
78
+ optimum/rbln/transformers/models/phi/phi_architecture.py,sha256=GTmqWF6cJn4rhFTkuYxuzEcVTE-fM4dfpV0Ve1Abi9Q,4440
77
79
  optimum/rbln/transformers/models/qwen2/__init__.py,sha256=1PLl1rlF14C6eSk3EZaDfyEHPaC4DZ2vwVlrklTkOYg,1042
78
80
  optimum/rbln/transformers/models/qwen2/modeling_qwen2.py,sha256=8ldxWKk85snFX_EViA7kgcgKAZ_QSbmQxhlO4yFvhOA,1924
79
81
  optimum/rbln/transformers/models/qwen2/qwen2_architecture.py,sha256=-X9OZ4HUCYDtwKnvidkWzCMPh_Xuu1wj-wRXIsQ9Pjg,1115
80
82
  optimum/rbln/transformers/models/seq2seq/__init__.py,sha256=Oa11lBWDNQWahqvDco3JIsZldYS-lO8qjpnaGKSfR00,1045
81
- optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py,sha256=ytDTNTTW221ShVRXClfQQBQV96NW-oYWwRjlbv9aXZU,18403
83
+ optimum/rbln/transformers/models/seq2seq/modeling_seq2seq.py,sha256=GSy_9bVdiZ4kavavsX-UJ62RIQn18_7k8i8PN6G2P9E,16131
82
84
  optimum/rbln/transformers/models/t5/__init__.py,sha256=H1ns7mquQDkImSI1KT4oTe4owK4s_n28YqVxmZ31TF0,1133
83
- optimum/rbln/transformers/models/t5/modeling_t5.py,sha256=FlYH-x-p9YmYOKKyTLN-AVDCFmFrmk3sjEJq4D2X1XI,3952
85
+ optimum/rbln/transformers/models/t5/modeling_t5.py,sha256=jBZDKwWXbuKEHUraU0N7P-XUPxznpCNdaRYs4buJY0Y,7776
84
86
  optimum/rbln/transformers/models/t5/t5_architecture.py,sha256=k3ROGNSGGuF1gFNV-LxoFFgfxo7ab5GSQA4GIi5MLsI,21074
85
87
  optimum/rbln/transformers/models/wav2vec2/__init__.py,sha256=mz4cXqG9b0tDpTAw3qYn3FaJuolX601VmKBE3gohLSw,1043
86
- optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py,sha256=lTtLGKuAxuVNguqSc2y0D0MsE6eHCraDS7-l2-0QJEY,4236
88
+ optimum/rbln/transformers/models/wav2vec2/modeling_wav2vec2.py,sha256=vRDKoujGRvMvyAlJVJhj_EHf0OtQWbZHickFLzGjmDI,4231
87
89
  optimum/rbln/transformers/models/whisper/__init__.py,sha256=PZ8qeAAFMas2MizwVYFxlpFWd5k1Pe1x-0IJfYAMhT8,1059
88
90
  optimum/rbln/transformers/models/whisper/generation_whisper.py,sha256=Kwwskbp48wJxEkFGQLlm0L252rO7tx_YLYmOA-_IPwI,3387
89
- optimum/rbln/transformers/models/whisper/modeling_whisper.py,sha256=pIwMH06JUWk9oYrwEhQeo-_Y_D2ari0sxmoiHFSCl60,15360
91
+ optimum/rbln/transformers/models/whisper/modeling_whisper.py,sha256=DX4tBJxULJY_UCm1Tw4EiGn1FjZioBjZZbFAB1Uipm4,15355
90
92
  optimum/rbln/transformers/models/whisper/whisper_architecture.py,sha256=OQzkGa2WSUn3OVQ1DYVOY49N46QvxO1hdEbQ7Ke-o_c,17203
91
93
  optimum/rbln/transformers/models/xlm_roberta/__init__.py,sha256=NTj4hCpd8L2_i5DZuV5wp-h8OlTLYVUqTrJxzY_Dg9g,1047
92
- optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py,sha256=8xLhJvuFSCmURyKWpB3O1GLLUn00ewwdAdbzJCV7B78,4929
94
+ optimum/rbln/transformers/models/xlm_roberta/modeling_xlm_roberta.py,sha256=H5SEtmCAuG6pL1ovl4eLPGZ3tx1IPOilsxKvnbFDN-E,3821
93
95
  optimum/rbln/transformers/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
94
- optimum/rbln/transformers/utils/rbln_quantization.py,sha256=X03egWZPycrcBAUgSmuW2bEPuDu7bMtMkmpgufr4FyU,3551
96
+ optimum/rbln/transformers/utils/rbln_quantization.py,sha256=-abKYe20hnwx1RtPE2Yz7C5slEKYmKohBSscoRoA2bo,7807
95
97
  optimum/rbln/utils/__init__.py,sha256=F6hJP00eV1_hT_IVwqqYwLWcLQAvZbmmrNMJTia3mjI,1106
96
- optimum/rbln/utils/context.py,sha256=NylAkP-AdPaZrlAeuukaU9rLEMrFITU1IBA-rsoXgDk,2212
97
- optimum/rbln/utils/decorator_utils.py,sha256=Fp3_hD0PeCzdq1wSzKlPRwS8EeUJcGUbbASNRYmstkM,2093
98
- optimum/rbln/utils/import_utils.py,sha256=mIA5o4byYHlLFhYUq3KCvmmzTCgLxSmMPF0MjwGhzVg,3955
98
+ optimum/rbln/utils/decorator_utils.py,sha256=KDxCPC6G1Au8nokvTGjo--JyZbaWjOLzfJl_oewJ5oQ,2311
99
+ optimum/rbln/utils/hub.py,sha256=o-nA2I_jnB0S2AX0-q9lSpSNcdP_TeqZbHv84Gxxvi4,4592
100
+ optimum/rbln/utils/import_utils.py,sha256=fk8VIS46sB5zNqinfpmJLINjcJhTRSf-xdvp-g98Aps,4287
99
101
  optimum/rbln/utils/logging.py,sha256=xIcLmUQoIJoBj3owkXN5_WQkQljcos6J6KSdX35IApw,2271
100
- optimum/rbln/utils/runtime_utils.py,sha256=RUYpDbp5PuWQ00pBqlL-URElZZKaNFA2qngTmpyGzec,3814
102
+ optimum/rbln/utils/model_utils.py,sha256=cnQbNtc2KUAJOcB6rHVwF8RpCNJFOTiCa91AQlUlgMM,1673
103
+ optimum/rbln/utils/runtime_utils.py,sha256=DXzRJKvLkiRYspefJsps5mHDpgQl_skA1BfIADsXPTg,3815
101
104
  optimum/rbln/utils/save_utils.py,sha256=eFIPtmiblCJ3MvtxEPxmAR3iuLEUrzpyzwtVotDauhw,3283
105
+ optimum/rbln/utils/submodule.py,sha256=UHizJSL3osA5Jiaarjbvl7AUWlXp4p8Pb_9JZKsaoCI,3472
102
106
  optimum/rbln/utils/timer_utils.py,sha256=o6EI-7-pcr3LhvCGJ1HIs1KH17yF2CaNpTsbHHbHmzc,1229
103
- optimum_rbln-0.1.13.dist-info/METADATA,sha256=otsCzUqeDLZOIwDPusqhubMaG4Mw3wU9kOjKZtrygZM,4653
104
- optimum_rbln-0.1.13.dist-info/WHEEL,sha256=thaaA2w1JzcGC48WYufAs8nrYZjJm8LqNfnXFOFyCC4,90
105
- optimum_rbln-0.1.13.dist-info/entry_points.txt,sha256=6OYgBcLyFCUgeqLgnvMyOJxPCWzgy7se4rLPKtNonMs,34
106
- optimum_rbln-0.1.13.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
107
- optimum_rbln-0.1.13.dist-info/RECORD,,
107
+ optimum_rbln-0.1.15.dist-info/METADATA,sha256=4Zxw1eSnrtAUDNrEEkOhMal7Ryh2CQ4niAKs-9I-dbc,4248
108
+ optimum_rbln-0.1.15.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
109
+ optimum_rbln-0.1.15.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
110
+ optimum_rbln-0.1.15.dist-info/RECORD,,
@@ -1,4 +1,4 @@
1
1
  Wheel-Version: 1.0
2
- Generator: pdm-backend (2.4.3)
2
+ Generator: hatchling 1.27.0
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
@@ -1,139 +0,0 @@
1
- # Copyright 2024 Rebellions Inc.
2
-
3
- # Licensed under the Apache License, Version 2.0 (the "License");
4
- # you may not use this file except in compliance with the License.
5
- # You may obtain a copy of the License at:
6
-
7
- # http://www.apache.org/licenses/LICENSE-2.0
8
-
9
- # Unless required by applicable law or agreed to in writing, software
10
- # distributed under the License is distributed on an "AS IS" BASIS,
11
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
- # See the License for the specific language governing permissions and
13
- # limitations under the License.
14
-
15
- # Portions of this software are licensed under the Apache License,
16
- # Version 2.0. See the NOTICE file distributed with this work for
17
- # additional information regarding copyright ownership.
18
-
19
- # All other portions of this software, including proprietary code,
20
- # are the intellectual property of Rebellions Inc. and may not be
21
- # copied, modified, or distributed without prior written permission
22
- # from Rebellions Inc.
23
-
24
- from typing import List, Optional
25
-
26
- import torch
27
- from transformers import AutoTokenizer, TextIteratorStreamer
28
-
29
-
30
- class BatchTextIteratorStreamer(TextIteratorStreamer):
31
- """
32
- Streamer that stores print-ready text in a queue, to be used by a downstream application as an iterator. This is
33
- useful for applications that benefit from accessing the generated text in a non-blocking way (e.g., in an interactive
34
- Gradio demo).
35
-
36
- This iterator extends TextIteratorStreamer to support batching of text generation. Each put operation appends
37
- generated text to a batch, and the end operation finalizes the batch by processing and storing the generated
38
- sequences.
39
-
40
- Parameters:
41
- batch_size (int):
42
- The size of each text generation batch.
43
- tokenizer (AutoTokenizer):
44
- The tokenizer used to decode the tokens.
45
- skip_prompt (bool, optional, default=False):
46
- Whether to skip the prompt to `.generate()` or not. Useful, for example, for chatbots.
47
- timeout (float, optional):
48
- The timeout for the text queue. If `None`, the queue will block indefinitely. Useful to handle exceptions
49
- in `.generate()` when it is called in a separate thread.
50
- **decode_kwargs (dict, optional):
51
- Additional keyword arguments to pass to the tokenizer's `decode` method.
52
-
53
- """
54
-
55
- def __init__(
56
- self,
57
- batch_size: int,
58
- tokenizer: "AutoTokenizer",
59
- skip_prompt: bool = False,
60
- timeout: Optional[float] = None,
61
- **decode_kwargs,
62
- ):
63
- super().__init__(tokenizer, skip_prompt, timeout, **decode_kwargs)
64
- self.batch_size: int = batch_size
65
- self.token_cache: List[List[int]] = [[] for _ in range(batch_size)]
66
- self.print_len = [0] * batch_size
67
- self.blocked = False
68
-
69
- def put(self, value):
70
- """
71
- Receives tokens, decodes them, and prints them to buffer as soon as they form entire words.
72
- """
73
-
74
- if len(value.shape) < 2:
75
- value = torch.reshape(value, (self.batch_size, value.shape[0] // self.batch_size))
76
-
77
- if self.skip_prompt and self.next_tokens_are_prompt:
78
- self.next_tokens_are_prompt = False
79
- return
80
-
81
- batch_printable_text = []
82
- for i in range(self.batch_size):
83
- # Add the new token to the cache and decodes the entire thing
84
- self.token_cache[i].extend(value[i].tolist())
85
- text = self.tokenizer.decode(self.token_cache[i], **self.decode_kwargs)
86
-
87
- # After the symbol for a new line, we flush the cache.
88
- if text.endswith("\n"):
89
- printable_text = text[self.print_len[i] :]
90
- self.token_cache[i] = []
91
- self.print_len[i] = 0
92
- # If the last token is a CJK character, we print the characters.
93
- elif len(text) > 0 and self._is_chinese_char(ord(text[-1])):
94
- printable_text = text[self.print_len[i] :]
95
- self.print_len[i] += len(printable_text)
96
- # Otherwise, prints until the last space char (simple heuristic to avoid printing incomplete words,
97
- # which may change with the subsequent token -- there are probably smarter ways to do this!)
98
- else:
99
- printable_text = text[self.print_len[i] : text.rfind(" ") + 1]
100
- self.print_len[i] += len(printable_text)
101
- batch_printable_text.append(printable_text)
102
-
103
- self.on_finalized_text(batch_printable_text)
104
-
105
- def end(self):
106
- """Flushes any remaining cache and prints a newline to stdout."""
107
- batch_printable_text = []
108
- for idx in range(self.batch_size):
109
- if len(self.token_cache[idx]) > 0:
110
- text = self.tokenizer.decode(self.token_cache[idx], **self.decode_kwargs)
111
- printable_text = text[self.print_len[idx] :]
112
- self.token_cache[idx] = []
113
- self.print_len[idx] = 0
114
- else:
115
- printable_text = ""
116
- batch_printable_text.append(printable_text)
117
-
118
- self.next_tokens_are_prompt = True
119
- self.on_finalized_text(batch_printable_text, stream_end=True)
120
- self.blocked = False
121
-
122
- def on_finalized_text(self, texts: List[str], stream_end: bool = False):
123
- self.text_queue.put(texts, timeout=self.timeout)
124
- if stream_end:
125
- self.text_queue.put(self.stop_signal, timeout=self.timeout)
126
-
127
- # thkim change for demo
128
- def __next__(self):
129
- value = self.text_queue.get(timeout=self.timeout)
130
- if value == self.stop_signal:
131
- raise StopIteration()
132
- else:
133
- return value
134
-
135
- def block(self):
136
- self.blocked = True
137
-
138
- def is_blocked(self):
139
- return self.blocked