tf-models-nightly 2.19.0.dev20250102__py2.py3-none-any.whl → 2.19.0.dev20250103__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -84,6 +84,17 @@ class MultiHeadAttention(tf_keras.layers.MultiHeadAttention):
84
84
  "sigmoid_attn_bias must be specified for sigmoid attn."
85
85
  )
86
86
 
87
+ def get_config(self):
88
+ config = super().get_config()
89
+ config.update({
90
+ "src_block_size": self._src_block_size,
91
+ "tgt_block_size": self._tgt_block_size,
92
+ "use_sigmoid_attn": self._use_sigmoid_attn,
93
+ "sigmoid_attn_bias": self._sigmoid_attn_bias,
94
+ "num_kv_heads": self._num_kv_heads,
95
+ })
96
+ return config
97
+
87
98
  def _build_from_signature(self, query, value, key=None):
88
99
  # pytype: disable=attribute-error
89
100
  super()._build_from_signature(query, value, key)
@@ -93,6 +93,11 @@ class MultiHeadAttention(tf_keras.layers.MultiHeadAttention):
93
93
  self._num_heads % self._num_kv_heads == 0
94
94
  ), "num_kv_heads needs to divide num_heads exactly."
95
95
 
96
+ def get_config(self):
97
+ config = super().get_config()
98
+ config.update({"num_kv_heads": self._num_kv_heads})
99
+ return config
100
+
96
101
  def _build_from_signature(
97
102
  self,
98
103
  query: Union[tf.Tensor, tf.TensorShape],
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: tf-models-nightly
3
- Version: 2.19.0.dev20250102
3
+ Version: 2.19.0.dev20250103
4
4
  Summary: TensorFlow Official Models
5
5
  Home-page: https://github.com/tensorflow/models
6
6
  Author: Google Inc.
@@ -305,7 +305,7 @@ official/nlp/modeling/layers/bigbird_attention.py,sha256=dzutgRoQt2DFsYMpMILv_QF
305
305
  official/nlp/modeling/layers/bigbird_attention_test.py,sha256=cBYwK5k1rnykZ0gif-n7VaByLIoElA-N0_svCRKASoU,2206
306
306
  official/nlp/modeling/layers/block_diag_feedforward.py,sha256=FDEt-J_QjOxwar3eT5yjMs4hR41Ppke1zj7iswsZR4M,7243
307
307
  official/nlp/modeling/layers/block_diag_feedforward_test.py,sha256=wcg8In6FIOCxcKqe5rucftjJ_kUWTi9Ei7eEmlVCYpE,4181
308
- official/nlp/modeling/layers/block_sparse_attention.py,sha256=8Jyinyf5XuU6nuxblGRfNnAviBEZIltMSoNJzAVjAYo,12233
308
+ official/nlp/modeling/layers/block_sparse_attention.py,sha256=3UDjvvv4oYM-0oLUu_jJNueKfwiFm4sAT-qymicG3kU,12583
309
309
  official/nlp/modeling/layers/block_sparse_attention_test.py,sha256=9YiKtv4YCrKIyUbv27P2xcTXFohoaRxq2K6vsOUi4zU,16447
310
310
  official/nlp/modeling/layers/cls_head.py,sha256=0X_gdjnAt6TZVrH_xkDcQCpwLuVz5Pb7d04wEVN_Kn8,16208
311
311
  official/nlp/modeling/layers/cls_head_test.py,sha256=01oMmiuyp1lDEXBYa9r3krn6BtH-QuSedGOca9LViEc,8888
@@ -331,7 +331,7 @@ official/nlp/modeling/layers/moe.py,sha256=azoK1Cz5l-5yT-FOtb7VYSbePTxmoje-2XAcq
331
331
  official/nlp/modeling/layers/moe_test.py,sha256=sr4hys2su_fcf9-6t0awqOkico92pQ3I2ApVF2rvvf0,9414
332
332
  official/nlp/modeling/layers/multi_channel_attention.py,sha256=fInxZUAPrrgCoCkM62JylM_vf5Wp8D0uZAvd5yuooVU,7322
333
333
  official/nlp/modeling/layers/multi_channel_attention_test.py,sha256=KcKuq22gOOq8HBzxRs3gGCwDRhmJPzYxfzfnqorQ1fw,1922
334
- official/nlp/modeling/layers/multi_query_attention.py,sha256=fFPBa9IBVj_O5x5OfGuHUFnJmiouNL6F1KsBCeHUqwM,6978
334
+ official/nlp/modeling/layers/multi_query_attention.py,sha256=efi58Dne1kDSH6TdfTHW9CJVVOJB10fSvvQhC-8JUHE,7111
335
335
  official/nlp/modeling/layers/multi_query_attention_test.py,sha256=3VFF2hz85YExWPwdbhYWaSrIaSOkC1x7axdGfXr0W90,8512
336
336
  official/nlp/modeling/layers/on_device_embedding.py,sha256=FgsHyRXf5TWVTyo4OeKImmrTnn4uOPJgS3AGKzKMWYY,4582
337
337
  official/nlp/modeling/layers/on_device_embedding_test.py,sha256=M-LUba4QXV37s9Cx7aH8LL3bz_YotC6qITmWRI7Fhjk,8589
@@ -1222,9 +1222,9 @@ tensorflow_models/tensorflow_models_test.py,sha256=nc6A9K53OGqF25xN5St8EiWvdVbda
1222
1222
  tensorflow_models/nlp/__init__.py,sha256=4tA5Pf4qaFwT-fIFOpX7x7FHJpnyJT-5UgOeFYTyMlc,807
1223
1223
  tensorflow_models/uplift/__init__.py,sha256=mqfa55gweOdpKoaQyid4A_4u7xw__FcQeSIF0k_pYmI,999
1224
1224
  tensorflow_models/vision/__init__.py,sha256=zBorY_v5xva1uI-qxhZO3Qh-Dii-Suq6wEYh6hKHDfc,833
1225
- tf_models_nightly-2.19.0.dev20250102.dist-info/AUTHORS,sha256=1dG3fXVu9jlo7bul8xuix5F5vOnczMk7_yWn4y70uw0,337
1226
- tf_models_nightly-2.19.0.dev20250102.dist-info/LICENSE,sha256=WxeBS_DejPZQabxtfMOM_xn8qoZNJDQjrT7z2wG1I4U,11512
1227
- tf_models_nightly-2.19.0.dev20250102.dist-info/METADATA,sha256=wpz6mIqvedDtyUHDM4pKQfHos2FIhmOE93NmfQvIyiY,1432
1228
- tf_models_nightly-2.19.0.dev20250102.dist-info/WHEEL,sha256=kGT74LWyRUZrL4VgLh6_g12IeVl_9u9ZVhadrgXZUEY,110
1229
- tf_models_nightly-2.19.0.dev20250102.dist-info/top_level.txt,sha256=gum2FfO5R4cvjl2-QtP-S1aNmsvIZaFFT6VFzU0f4-g,33
1230
- tf_models_nightly-2.19.0.dev20250102.dist-info/RECORD,,
1225
+ tf_models_nightly-2.19.0.dev20250103.dist-info/AUTHORS,sha256=1dG3fXVu9jlo7bul8xuix5F5vOnczMk7_yWn4y70uw0,337
1226
+ tf_models_nightly-2.19.0.dev20250103.dist-info/LICENSE,sha256=WxeBS_DejPZQabxtfMOM_xn8qoZNJDQjrT7z2wG1I4U,11512
1227
+ tf_models_nightly-2.19.0.dev20250103.dist-info/METADATA,sha256=OzGqZyxnQDnpq6JstzJEuJPHLq31ivjdzj-gLfYzi04,1432
1228
+ tf_models_nightly-2.19.0.dev20250103.dist-info/WHEEL,sha256=kGT74LWyRUZrL4VgLh6_g12IeVl_9u9ZVhadrgXZUEY,110
1229
+ tf_models_nightly-2.19.0.dev20250103.dist-info/top_level.txt,sha256=gum2FfO5R4cvjl2-QtP-S1aNmsvIZaFFT6VFzU0f4-g,33
1230
+ tf_models_nightly-2.19.0.dev20250103.dist-info/RECORD,,