keras-hub-nightly 0.21.0.dev202504060503__py3-none-any.whl → 0.21.0.dev202504070403__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- keras_hub/src/models/qwen/qwen_backbone.py +1 -1
- keras_hub/src/utils/transformers/convert_qwen.py +1 -0
- keras_hub/src/version_utils.py +1 -1
- {keras_hub_nightly-0.21.0.dev202504060503.dist-info → keras_hub_nightly-0.21.0.dev202504070403.dist-info}/METADATA +1 -1
- {keras_hub_nightly-0.21.0.dev202504060503.dist-info → keras_hub_nightly-0.21.0.dev202504070403.dist-info}/RECORD +7 -7
- {keras_hub_nightly-0.21.0.dev202504060503.dist-info → keras_hub_nightly-0.21.0.dev202504070403.dist-info}/WHEEL +0 -0
- {keras_hub_nightly-0.21.0.dev202504060503.dist-info → keras_hub_nightly-0.21.0.dev202504070403.dist-info}/top_level.txt +0 -0
@@ -168,7 +168,7 @@ class QwenBackbone(Backbone):
|
|
168
168
|
self.layer_norm_epsilon = layer_norm_epsilon
|
169
169
|
self.dropout = dropout
|
170
170
|
self.tie_word_embeddings = tie_word_embeddings
|
171
|
-
self.use_sliding_window_attention =
|
171
|
+
self.use_sliding_window_attention = use_sliding_window_attention
|
172
172
|
self.sliding_window_size = sliding_window_size
|
173
173
|
|
174
174
|
def get_config(self):
|
@@ -18,6 +18,7 @@ def convert_backbone_config(transformers_config):
|
|
18
18
|
"rope_max_wavelength": transformers_config["rope_theta"],
|
19
19
|
"use_sliding_window": transformers_config["use_sliding_window"],
|
20
20
|
"sliding_window_size": transformers_config["sliding_window"],
|
21
|
+
"tie_word_embeddings": transformers_config["tie_word_embeddings"],
|
21
22
|
}
|
22
23
|
|
23
24
|
|
keras_hub/src/version_utils.py
CHANGED
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: keras-hub-nightly
|
3
|
-
Version: 0.21.0.dev202504060503
|
3
|
+
Version: 0.21.0.dev202504070403
|
4
4
|
Summary: Industry-strength Natural Language Processing extensions for Keras.
|
5
5
|
Home-page: https://github.com/keras-team/keras-hub
|
6
6
|
Author: Keras team
|
@@ -8,7 +8,7 @@ keras_hub/api/tokenizers/__init__.py,sha256=ZMrudLg7bR9_ZoXJbiUEU3J6NHBqFRjKqLlf
|
|
8
8
|
keras_hub/api/utils/__init__.py,sha256=Gp1E6gG-RtKQS3PBEQEOz9PQvXkXaJ0ySGMqZ7myN7A,215
|
9
9
|
keras_hub/src/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
10
10
|
keras_hub/src/api_export.py,sha256=9pQZK27JObxWZ96QPLBp1OBsjWigh1iuV6RglPGMRk0,1499
|
11
|
-
keras_hub/src/version_utils.py,sha256=
|
11
|
+
keras_hub/src/version_utils.py,sha256=k5kCFHtcK4GfHigaw4Z4EdPeShVAlCnpHq4G6lzDMOY,222
|
12
12
|
keras_hub/src/layers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
13
13
|
keras_hub/src/layers/modeling/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
14
14
|
keras_hub/src/layers/modeling/alibi_bias.py,sha256=1XBTHI52L_iJDhN_w5ydu_iMhCuTgQAxEPwcLA6BPuk,4411
|
@@ -286,7 +286,7 @@ keras_hub/src/models/phi3/phi3_rotary_embedding.py,sha256=wqiRn8nETNcLc5Vsm_d_8s
|
|
286
286
|
keras_hub/src/models/phi3/phi3_tokenizer.py,sha256=bOPH14wTVVHJHq8mgzXLjsgvKMNhfO8eayevAPpjYVA,1992
|
287
287
|
keras_hub/src/models/qwen/__init__.py,sha256=hskG3tZUY_AYZPp0WVzbCtw37AIYENyp3DOnqHmdRBw,65
|
288
288
|
keras_hub/src/models/qwen/qwen_attention.py,sha256=FL_09-eCFugktDNzFPm6beZLD04pNg9TFKgfXdhWUwk,12953
|
289
|
-
keras_hub/src/models/qwen/qwen_backbone.py,sha256=
|
289
|
+
keras_hub/src/models/qwen/qwen_backbone.py,sha256=e9AR-7z7Wxn-Lbk3dk5MXUNJ1N8ykO9Tt-RVdLBlU3o,12845
|
290
290
|
keras_hub/src/models/qwen/qwen_causal_lm.py,sha256=TuGpp9EXkEMQLJ0XybRuOkUl_g-v0Bq-Vdfcw6JkjC0,12079
|
291
291
|
keras_hub/src/models/qwen/qwen_causal_lm_preprocessor.py,sha256=pozIzd5bDgMvaYw13HBM5eKV8VBdg91_HzctnTultLg,415
|
292
292
|
keras_hub/src/models/qwen/qwen_decoder.py,sha256=utmAvZlU7_nP-6pjGPDinK4JaMzsQSwOARG0ote-jAg,11771
|
@@ -461,11 +461,11 @@ keras_hub/src/utils/transformers/convert_gpt2.py,sha256=HCeHN_-GiQJRxLCM9OCJJ1wa
|
|
461
461
|
keras_hub/src/utils/transformers/convert_llama3.py,sha256=zlg0yFscjytyOFymDwqnbuXkmYvb88qqYzAROKcpaPU,5250
|
462
462
|
keras_hub/src/utils/transformers/convert_mistral.py,sha256=kVhN9h1ZFVhwkNW8p3wnS7eANJUXIsNy1RxWXy20Gqw,4760
|
463
463
|
keras_hub/src/utils/transformers/convert_pali_gemma.py,sha256=B1leeDw96Yvu81hYumf66hIid07k5NLqoeWAJgPnaLs,10649
|
464
|
-
keras_hub/src/utils/transformers/convert_qwen.py,sha256=
|
464
|
+
keras_hub/src/utils/transformers/convert_qwen.py,sha256=WUxMAEFVqRs7TRw7QU5TH3_ev4yf02R1xFVliMvTQqg,5886
|
465
465
|
keras_hub/src/utils/transformers/convert_vit.py,sha256=9SUZ9utNJhW_5cj3acMn9cRy47u2eIcDsrhmzj77o9k,5187
|
466
466
|
keras_hub/src/utils/transformers/preset_loader.py,sha256=0Hi7R8HnATcwFVLsJwMMIMWTCXHNfep4IPiRpQXqM-w,3933
|
467
467
|
keras_hub/src/utils/transformers/safetensor_utils.py,sha256=CYUHyA4y-B61r7NDnCsFb4t_UmSwZ1k9L-8gzEd6KRg,3339
|
468
|
-
keras_hub_nightly-0.21.0.
|
469
|
-
keras_hub_nightly-0.21.0.dev202504060503.dist-info/WHEEL,sha256=CmyFI0kx5cdEMTLiONQRbGQwjIoR1aIYB7eCAQ4KPJ0,91
|
470
|
-
keras_hub_nightly-0.21.0.dev202504060503.dist-info/top_level.txt,sha256=N4J6piIWBKa38A4uV-CnIopnOEf8mHAbkNXafXm_CuA,10
|
471
|
-
keras_hub_nightly-0.21.0.dev202504060503.dist-info/RECORD,,
|
468
|
+
keras_hub_nightly-0.21.0.dev202504070403.dist-info/METADATA,sha256=zt8-OymtnrsPExqiSPf2wxFbaWIZ-Jm06hq8dV1cHRE,7715
|
469
|
+
keras_hub_nightly-0.21.0.dev202504070403.dist-info/WHEEL,sha256=CmyFI0kx5cdEMTLiONQRbGQwjIoR1aIYB7eCAQ4KPJ0,91
|
470
|
+
keras_hub_nightly-0.21.0.dev202504070403.dist-info/top_level.txt,sha256=N4J6piIWBKa38A4uV-CnIopnOEf8mHAbkNXafXm_CuA,10
|
471
|
+
keras_hub_nightly-0.21.0.dev202504070403.dist-info/RECORD,,
|
File without changes
|