tf-models-nightly 2.19.0.dev20250101__py2.py3-none-any.whl → 2.19.0.dev20250103__py2.py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- official/nlp/modeling/layers/block_sparse_attention.py +11 -0
- official/nlp/modeling/layers/multi_query_attention.py +5 -0
- {tf_models_nightly-2.19.0.dev20250101.dist-info → tf_models_nightly-2.19.0.dev20250103.dist-info}/METADATA +1 -1
- {tf_models_nightly-2.19.0.dev20250101.dist-info → tf_models_nightly-2.19.0.dev20250103.dist-info}/RECORD +8 -8
- {tf_models_nightly-2.19.0.dev20250101.dist-info → tf_models_nightly-2.19.0.dev20250103.dist-info}/AUTHORS +0 -0
- {tf_models_nightly-2.19.0.dev20250101.dist-info → tf_models_nightly-2.19.0.dev20250103.dist-info}/LICENSE +0 -0
- {tf_models_nightly-2.19.0.dev20250101.dist-info → tf_models_nightly-2.19.0.dev20250103.dist-info}/WHEEL +0 -0
- {tf_models_nightly-2.19.0.dev20250101.dist-info → tf_models_nightly-2.19.0.dev20250103.dist-info}/top_level.txt +0 -0
@@ -84,6 +84,17 @@ class MultiHeadAttention(tf_keras.layers.MultiHeadAttention):
|
|
84
84
|
"sigmoid_attn_bias must be specified for sigmoid attn."
|
85
85
|
)
|
86
86
|
|
87
|
+
def get_config(self):
|
88
|
+
config = super().get_config()
|
89
|
+
config.update({
|
90
|
+
"src_block_size": self._src_block_size,
|
91
|
+
"tgt_block_size": self._tgt_block_size,
|
92
|
+
"use_sigmoid_attn": self._use_sigmoid_attn,
|
93
|
+
"sigmoid_attn_bias": self._sigmoid_attn_bias,
|
94
|
+
"num_kv_heads": self._num_kv_heads,
|
95
|
+
})
|
96
|
+
return config
|
97
|
+
|
87
98
|
def _build_from_signature(self, query, value, key=None):
|
88
99
|
# pytype: disable=attribute-error
|
89
100
|
super()._build_from_signature(query, value, key)
|
@@ -93,6 +93,11 @@ class MultiHeadAttention(tf_keras.layers.MultiHeadAttention):
|
|
93
93
|
self._num_heads % self._num_kv_heads == 0
|
94
94
|
), "num_kv_heads needs to divide num_heads exactly."
|
95
95
|
|
96
|
+
def get_config(self):
|
97
|
+
config = super().get_config()
|
98
|
+
config.update({"num_kv_heads": self._num_kv_heads})
|
99
|
+
return config
|
100
|
+
|
96
101
|
def _build_from_signature(
|
97
102
|
self,
|
98
103
|
query: Union[tf.Tensor, tf.TensorShape],
|
@@ -305,7 +305,7 @@ official/nlp/modeling/layers/bigbird_attention.py,sha256=dzutgRoQt2DFsYMpMILv_QF
|
|
305
305
|
official/nlp/modeling/layers/bigbird_attention_test.py,sha256=cBYwK5k1rnykZ0gif-n7VaByLIoElA-N0_svCRKASoU,2206
|
306
306
|
official/nlp/modeling/layers/block_diag_feedforward.py,sha256=FDEt-J_QjOxwar3eT5yjMs4hR41Ppke1zj7iswsZR4M,7243
|
307
307
|
official/nlp/modeling/layers/block_diag_feedforward_test.py,sha256=wcg8In6FIOCxcKqe5rucftjJ_kUWTi9Ei7eEmlVCYpE,4181
|
308
|
-
official/nlp/modeling/layers/block_sparse_attention.py,sha256=
|
308
|
+
official/nlp/modeling/layers/block_sparse_attention.py,sha256=3UDjvvv4oYM-0oLUu_jJNueKfwiFm4sAT-qymicG3kU,12583
|
309
309
|
official/nlp/modeling/layers/block_sparse_attention_test.py,sha256=9YiKtv4YCrKIyUbv27P2xcTXFohoaRxq2K6vsOUi4zU,16447
|
310
310
|
official/nlp/modeling/layers/cls_head.py,sha256=0X_gdjnAt6TZVrH_xkDcQCpwLuVz5Pb7d04wEVN_Kn8,16208
|
311
311
|
official/nlp/modeling/layers/cls_head_test.py,sha256=01oMmiuyp1lDEXBYa9r3krn6BtH-QuSedGOca9LViEc,8888
|
@@ -331,7 +331,7 @@ official/nlp/modeling/layers/moe.py,sha256=azoK1Cz5l-5yT-FOtb7VYSbePTxmoje-2XAcq
|
|
331
331
|
official/nlp/modeling/layers/moe_test.py,sha256=sr4hys2su_fcf9-6t0awqOkico92pQ3I2ApVF2rvvf0,9414
|
332
332
|
official/nlp/modeling/layers/multi_channel_attention.py,sha256=fInxZUAPrrgCoCkM62JylM_vf5Wp8D0uZAvd5yuooVU,7322
|
333
333
|
official/nlp/modeling/layers/multi_channel_attention_test.py,sha256=KcKuq22gOOq8HBzxRs3gGCwDRhmJPzYxfzfnqorQ1fw,1922
|
334
|
-
official/nlp/modeling/layers/multi_query_attention.py,sha256=
|
334
|
+
official/nlp/modeling/layers/multi_query_attention.py,sha256=efi58Dne1kDSH6TdfTHW9CJVVOJB10fSvvQhC-8JUHE,7111
|
335
335
|
official/nlp/modeling/layers/multi_query_attention_test.py,sha256=3VFF2hz85YExWPwdbhYWaSrIaSOkC1x7axdGfXr0W90,8512
|
336
336
|
official/nlp/modeling/layers/on_device_embedding.py,sha256=FgsHyRXf5TWVTyo4OeKImmrTnn4uOPJgS3AGKzKMWYY,4582
|
337
337
|
official/nlp/modeling/layers/on_device_embedding_test.py,sha256=M-LUba4QXV37s9Cx7aH8LL3bz_YotC6qITmWRI7Fhjk,8589
|
@@ -1222,9 +1222,9 @@ tensorflow_models/tensorflow_models_test.py,sha256=nc6A9K53OGqF25xN5St8EiWvdVbda
|
|
1222
1222
|
tensorflow_models/nlp/__init__.py,sha256=4tA5Pf4qaFwT-fIFOpX7x7FHJpnyJT-5UgOeFYTyMlc,807
|
1223
1223
|
tensorflow_models/uplift/__init__.py,sha256=mqfa55gweOdpKoaQyid4A_4u7xw__FcQeSIF0k_pYmI,999
|
1224
1224
|
tensorflow_models/vision/__init__.py,sha256=zBorY_v5xva1uI-qxhZO3Qh-Dii-Suq6wEYh6hKHDfc,833
|
1225
|
-
tf_models_nightly-2.19.0.
|
1226
|
-
tf_models_nightly-2.19.0.
|
1227
|
-
tf_models_nightly-2.19.0.
|
1228
|
-
tf_models_nightly-2.19.0.
|
1229
|
-
tf_models_nightly-2.19.0.
|
1230
|
-
tf_models_nightly-2.19.0.
|
1225
|
+
tf_models_nightly-2.19.0.dev20250103.dist-info/AUTHORS,sha256=1dG3fXVu9jlo7bul8xuix5F5vOnczMk7_yWn4y70uw0,337
|
1226
|
+
tf_models_nightly-2.19.0.dev20250103.dist-info/LICENSE,sha256=WxeBS_DejPZQabxtfMOM_xn8qoZNJDQjrT7z2wG1I4U,11512
|
1227
|
+
tf_models_nightly-2.19.0.dev20250103.dist-info/METADATA,sha256=OzGqZyxnQDnpq6JstzJEuJPHLq31ivjdzj-gLfYzi04,1432
|
1228
|
+
tf_models_nightly-2.19.0.dev20250103.dist-info/WHEEL,sha256=kGT74LWyRUZrL4VgLh6_g12IeVl_9u9ZVhadrgXZUEY,110
|
1229
|
+
tf_models_nightly-2.19.0.dev20250103.dist-info/top_level.txt,sha256=gum2FfO5R4cvjl2-QtP-S1aNmsvIZaFFT6VFzU0f4-g,33
|
1230
|
+
tf_models_nightly-2.19.0.dev20250103.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|