keras-nlp 0.6.3.dev0__tar.gz → 0.6.4.dev0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (313)
  1. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/PKG-INFO +60 -11
  2. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/README.md +59 -10
  3. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/__init__.py +1 -1
  4. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/__init__.py +1 -1
  5. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/backend/__init__.py +9 -7
  6. keras-nlp-0.6.4.dev0/keras_nlp/src/backend/config.py +64 -0
  7. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/backend/keras.py +0 -2
  8. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/conftest.py +11 -51
  9. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/__init__.py +1 -0
  10. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/cached_multi_head_attention_test.py +2 -2
  11. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_backbone_test.py +0 -31
  12. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_backbone_test.py +0 -28
  13. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_backbone_test.py +0 -27
  14. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_backbone_test.py +0 -27
  15. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/disentangled_self_attention.py +3 -2
  16. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_backbone_test.py +0 -26
  17. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_backbone_test.py +0 -26
  18. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_backbone.py +0 -72
  19. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_backbone_test.py +0 -43
  20. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_causal_lm.py +0 -36
  21. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_causal_lm_test.py +0 -10
  22. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_backbone_test.py +0 -26
  23. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_backbone.py +0 -72
  24. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_backbone_test.py +0 -43
  25. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_causal_lm.py +0 -36
  26. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_causal_lm_test.py +0 -10
  27. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_backbone_test.py +0 -26
  28. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_backbone_test.py +0 -27
  29. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/task.py +4 -1
  30. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_backbone_test.py +0 -41
  31. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_backbone_test.py +0 -26
  32. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlnet/xlnet_backbone_test.py +0 -28
  33. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tests/test_case.py +8 -6
  34. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/tensor_utils.py +1 -1
  35. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp.egg-info/PKG-INFO +60 -11
  36. keras-nlp-0.6.3.dev0/keras_nlp/src/backend/config.py +0 -105
  37. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/layers/__init__.py +0 -0
  38. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/metrics/__init__.py +0 -0
  39. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/models/__init__.py +0 -0
  40. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/samplers/__init__.py +0 -0
  41. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/api_export.py +0 -0
  42. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/backend/ops.py +0 -0
  43. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/backend/random.py +0 -0
  44. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/__init__.py +0 -0
  45. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/cached_multi_head_attention.py +0 -0
  46. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/f_net_encoder.py +0 -0
  47. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/f_net_encoder_test.py +0 -0
  48. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/masked_lm_head.py +0 -0
  49. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/masked_lm_head_test.py +0 -0
  50. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/position_embedding.py +0 -0
  51. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/position_embedding_test.py +0 -0
  52. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/reversible_embedding.py +0 -0
  53. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/reversible_embedding_test.py +0 -0
  54. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/rotary_embedding.py +0 -0
  55. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/rotary_embedding_test.py +0 -0
  56. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/sine_position_encoding.py +0 -0
  57. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/sine_position_encoding_test.py +0 -0
  58. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/token_and_position_embedding.py +0 -0
  59. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/token_and_position_embedding_test.py +0 -0
  60. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/transformer_decoder.py +0 -0
  61. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/transformer_decoder_test.py +0 -0
  62. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/transformer_encoder.py +0 -0
  63. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/transformer_encoder_test.py +0 -0
  64. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/transformer_layer_utils.py +0 -0
  65. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/transformer_layer_utils_test.py +0 -0
  66. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/__init__.py +0 -0
  67. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/masked_lm_mask_generator.py +0 -0
  68. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/masked_lm_mask_generator_test.py +0 -0
  69. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/multi_segment_packer.py +0 -0
  70. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/multi_segment_packer_test.py +0 -0
  71. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/preprocessing_layer.py +0 -0
  72. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/random_deletion.py +0 -0
  73. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/random_deletion_test.py +0 -0
  74. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/random_swap.py +0 -0
  75. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/random_swap_test.py +0 -0
  76. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/start_end_packer.py +0 -0
  77. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/start_end_packer_test.py +0 -0
  78. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/__init__.py +0 -0
  79. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/bleu.py +0 -0
  80. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/bleu_test.py +0 -0
  81. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/edit_distance.py +0 -0
  82. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/edit_distance_test.py +0 -0
  83. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/perplexity.py +0 -0
  84. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/perplexity_test.py +0 -0
  85. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/rouge_base.py +0 -0
  86. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/rouge_l.py +0 -0
  87. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/rouge_l_test.py +0 -0
  88. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/rouge_n.py +0 -0
  89. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/rouge_n_test.py +0 -0
  90. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/__init__.py +0 -0
  91. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/__init__.py +0 -0
  92. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_backbone.py +0 -0
  93. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_classifier.py +0 -0
  94. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_classifier_test.py +0 -0
  95. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_masked_lm.py +0 -0
  96. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_masked_lm_preprocessor.py +0 -0
  97. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_masked_lm_preprocessor_test.py +0 -0
  98. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_masked_lm_test.py +0 -0
  99. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_preprocessor.py +0 -0
  100. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_preprocessor_test.py +0 -0
  101. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_presets.py +0 -0
  102. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_presets_test.py +0 -0
  103. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_tokenizer.py +0 -0
  104. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_tokenizer_test.py +0 -0
  105. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/backbone.py +0 -0
  106. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/__init__.py +0 -0
  107. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_backbone.py +0 -0
  108. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_preprocessor.py +0 -0
  109. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_preprocessor_test.py +0 -0
  110. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_presets.py +0 -0
  111. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_presets_test.py +0 -0
  112. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_seq_2_seq_lm.py +0 -0
  113. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_seq_2_seq_lm_preprocessor.py +0 -0
  114. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_seq_2_seq_lm_preprocessor_test.py +0 -0
  115. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_seq_2_seq_lm_test.py +0 -0
  116. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_tokenizer.py +0 -0
  117. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_tokenizer_test.py +0 -0
  118. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/__init__.py +0 -0
  119. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_backbone.py +0 -0
  120. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_classifier.py +0 -0
  121. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_classifier_test.py +0 -0
  122. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_masked_lm.py +0 -0
  123. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_masked_lm_preprocessor.py +0 -0
  124. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_masked_lm_preprocessor_test.py +0 -0
  125. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_masked_lm_test.py +0 -0
  126. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_preprocessor.py +0 -0
  127. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_preprocessor_test.py +0 -0
  128. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_presets.py +0 -0
  129. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_presets_test.py +0 -0
  130. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_tokenizer.py +0 -0
  131. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_tokenizer_test.py +0 -0
  132. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/__init__.py +0 -0
  133. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_backbone.py +0 -0
  134. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_classifier.py +0 -0
  135. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_classifier_test.py +0 -0
  136. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_masked_lm.py +0 -0
  137. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_masked_lm_preprocessor.py +0 -0
  138. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_masked_lm_preprocessor_test.py +0 -0
  139. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_masked_lm_test.py +0 -0
  140. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_preprocessor.py +0 -0
  141. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_preprocessor_test.py +0 -0
  142. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_presets.py +0 -0
  143. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_presets_test.py +0 -0
  144. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_tokenizer.py +0 -0
  145. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_tokenizer_test.py +0 -0
  146. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/disentangled_attention_encoder.py +0 -0
  147. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/relative_embedding.py +0 -0
  148. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/__init__.py +0 -0
  149. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_backbone.py +0 -0
  150. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_classifier.py +0 -0
  151. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_classifier_test.py +0 -0
  152. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_masked_lm.py +0 -0
  153. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_masked_lm_preprocessor.py +0 -0
  154. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_masked_lm_preprocessor_test.py +0 -0
  155. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_masked_lm_test.py +0 -0
  156. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_preprocessor.py +0 -0
  157. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_preprocessor_test.py +0 -0
  158. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_presets.py +0 -0
  159. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_presets_test.py +0 -0
  160. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_tokenizer.py +0 -0
  161. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_tokenizer_test.py +0 -0
  162. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/__init__.py +0 -0
  163. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_backbone.py +0 -0
  164. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_classifier.py +0 -0
  165. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_classifier_test.py +0 -0
  166. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_masked_lm.py +0 -0
  167. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_masked_lm_preprocessor.py +0 -0
  168. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_masked_lm_preprocessor_test.py +0 -0
  169. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_masked_lm_test.py +0 -0
  170. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_preprocessor.py +0 -0
  171. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_preprocessor_test.py +0 -0
  172. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_presets.py +0 -0
  173. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_presets_test.py +0 -0
  174. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_tokenizer.py +0 -0
  175. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_tokenizer_test.py +0 -0
  176. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/generative_task.py +0 -0
  177. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/__init__.py +0 -0
  178. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_causal_lm_preprocessor.py +0 -0
  179. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_causal_lm_preprocessor_test.py +0 -0
  180. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_preprocessor.py +0 -0
  181. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_preprocessor_test.py +0 -0
  182. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_presets.py +0 -0
  183. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_presets_test.py +0 -0
  184. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_tokenizer.py +0 -0
  185. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_tokenizer_test.py +0 -0
  186. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/__init__.py +0 -0
  187. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_attention.py +0 -0
  188. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_backbone.py +0 -0
  189. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_causal_lm.py +0 -0
  190. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_causal_lm_preprocessor.py +0 -0
  191. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_causal_lm_preprocessor_test.py +0 -0
  192. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_causal_lm_test.py +0 -0
  193. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_decoder.py +0 -0
  194. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_preprocessor.py +0 -0
  195. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_preprocessor_test.py +0 -0
  196. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_tokenizer.py +0 -0
  197. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_tokenizer_test.py +0 -0
  198. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/__init__.py +0 -0
  199. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_causal_lm_preprocessor.py +0 -0
  200. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_causal_lm_preprocessor_test.py +0 -0
  201. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_preprocessor.py +0 -0
  202. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_preprocessor_test.py +0 -0
  203. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_presets.py +0 -0
  204. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_presets_test.py +0 -0
  205. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_tokenizer.py +0 -0
  206. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_tokenizer_test.py +0 -0
  207. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/preprocessor.py +0 -0
  208. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/__init__.py +0 -0
  209. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_backbone.py +0 -0
  210. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_classifier.py +0 -0
  211. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_classifier_test.py +0 -0
  212. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_masked_lm.py +0 -0
  213. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_masked_lm_preprocessor.py +0 -0
  214. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_masked_lm_preprocessor_test.py +0 -0
  215. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_masked_lm_test.py +0 -0
  216. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_preprocessor.py +0 -0
  217. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_preprocessor_test.py +0 -0
  218. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_presets.py +0 -0
  219. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_presets_test.py +0 -0
  220. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_tokenizer.py +0 -0
  221. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_tokenizer_test.py +0 -0
  222. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/__init__.py +0 -0
  223. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_backbone.py +0 -0
  224. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_layer_norm.py +0 -0
  225. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_multi_head_attention.py +0 -0
  226. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_tokenizer.py +0 -0
  227. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_tokenizer_test.py +0 -0
  228. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_transformer_layer.py +0 -0
  229. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/task_test.py +0 -0
  230. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/__init__.py +0 -0
  231. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_audio_feature_extractor.py +0 -0
  232. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_audio_feature_extractor_test.py +0 -0
  233. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_backbone.py +0 -0
  234. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_decoder.py +0 -0
  235. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_encoder.py +0 -0
  236. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_preprocessor.py +0 -0
  237. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_preprocessor_test.py +0 -0
  238. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_presets.py +0 -0
  239. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_presets_test.py +0 -0
  240. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_tokenizer.py +0 -0
  241. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_tokenizer_test.py +0 -0
  242. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/__init__.py +0 -0
  243. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_backbone.py +0 -0
  244. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_classifier.py +0 -0
  245. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_classifier_test.py +0 -0
  246. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_masked_lm.py +0 -0
  247. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_masked_lm_preprocessor.py +0 -0
  248. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_masked_lm_preprocessor_test.py +0 -0
  249. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_masked_lm_test.py +0 -0
  250. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_preprocessor.py +0 -0
  251. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_preprocessor_test.py +0 -0
  252. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_presets.py +0 -0
  253. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_presets_test.py +0 -0
  254. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_tokenizer.py +0 -0
  255. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_tokenizer_test.py +0 -0
  256. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlnet/__init__.py +0 -0
  257. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlnet/relative_attention.py +0 -0
  258. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlnet/xlnet_backbone.py +0 -0
  259. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlnet/xlnet_content_and_query_embedding.py +0 -0
  260. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlnet/xlnet_encoder.py +0 -0
  261. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/__init__.py +0 -0
  262. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/beam_sampler.py +0 -0
  263. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/beam_sampler_test.py +0 -0
  264. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/contrastive_sampler.py +0 -0
  265. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/contrastive_sampler_test.py +0 -0
  266. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/greedy_sampler.py +0 -0
  267. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/greedy_sampler_test.py +0 -0
  268. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/random_sampler.py +0 -0
  269. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/random_sampler_test.py +0 -0
  270. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/sampler.py +0 -0
  271. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/serialization.py +0 -0
  272. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/serialization_test.py +0 -0
  273. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/top_k_sampler.py +0 -0
  274. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/top_k_sampler_test.py +0 -0
  275. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/top_p_sampler.py +0 -0
  276. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/top_p_sampler_test.py +0 -0
  277. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tests/__init__.py +0 -0
  278. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tests/doc_tests/__init__.py +0 -0
  279. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tests/doc_tests/docstring_lib.py +0 -0
  280. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tests/doc_tests/docstring_test.py +0 -0
  281. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tests/doc_tests/fenced_docstring_lib.py +0 -0
  282. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/__init__.py +0 -0
  283. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/byte_pair_tokenizer.py +0 -0
  284. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/byte_pair_tokenizer_test.py +0 -0
  285. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/byte_tokenizer.py +0 -0
  286. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/byte_tokenizer_test.py +0 -0
  287. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/sentence_piece_tokenizer.py +0 -0
  288. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/sentence_piece_tokenizer_test.py +0 -0
  289. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/sentence_piece_tokenizer_trainer.py +0 -0
  290. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/sentence_piece_tokenizer_trainer_test.py +0 -0
  291. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/tokenizer.py +0 -0
  292. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/tokenizer_test.py +0 -0
  293. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/unicode_codepoint_tokenizer.py +0 -0
  294. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/unicode_codepoint_tokenizer_test.py +0 -0
  295. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/word_piece_tokenizer.py +0 -0
  296. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/word_piece_tokenizer_test.py +0 -0
  297. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/word_piece_tokenizer_trainer.py +0 -0
  298. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/word_piece_tokenizer_trainer_test.py +0 -0
  299. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/__init__.py +0 -0
  300. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/keras_utils.py +0 -0
  301. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/keras_utils_test.py +0 -0
  302. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/pipeline_model.py +0 -0
  303. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/pipeline_model_test.py +0 -0
  304. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/python_utils.py +0 -0
  305. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/python_utils_test.py +0 -0
  306. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/tensor_utils_test.py +0 -0
  307. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/tokenizers/__init__.py +0 -0
  308. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp.egg-info/SOURCES.txt +0 -0
  309. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp.egg-info/dependency_links.txt +0 -0
  310. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp.egg-info/requires.txt +0 -0
  311. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp.egg-info/top_level.txt +0 -0
  312. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/setup.cfg +0 -0
  313. {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/setup.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: keras-nlp
3
- Version: 0.6.3.dev0
3
+ Version: 0.6.4.dev0
4
4
  Summary: Industry-strength Natural Language Processing extensions for Keras.
5
5
  Home-page: https://github.com/keras-team/keras-nlp
6
6
  Author: Keras team
@@ -39,11 +39,10 @@ Requires-Dist: sentencepiece; extra == "extras"
39
39
  ![Tensorflow](https://img.shields.io/badge/tensorflow-v2.5.0+-success.svg)
40
40
  [![contributions welcome](https://img.shields.io/badge/contributions-welcome-brightgreen.svg?style=flat)](https://github.com/keras-team/keras-nlp/issues)
41
41
 
42
- KerasNLP is a natural language processing library that works natively
43
- with TensorFlow, JAX, or PyTorch. Built on [Keras Core](https://keras.io/keras_core/announcement/),
44
- these models, layers, metrics, callbacks, etc., can be trained and serialized
45
- in any framework and re-used in another without costly migrations. See "Using
46
- KerasNLP with Keras Core" below for more details on multi-framework KerasNLP.
42
+ KerasNLP is a natural language processing library that works natively
43
+ with TensorFlow, JAX, or PyTorch. Built on Keras 3, these models, layers,
44
+ metrics, and tokenizers can be trained and serialized in any framework and
45
+ re-used in another without costly migrations.
47
46
 
48
47
  KerasNLP supports users through their entire development cycle. Our workflows
49
48
  are built from modular components that have state-of-the-art preset weights and
@@ -82,17 +81,28 @@ We are a new and growing project and welcome [contributions](CONTRIBUTING.md).
82
81
 
83
82
  ## Installation
84
83
 
85
- To install the latest official release:
84
+ KerasNLP supports both Keras 2 and Keras 3. We recommend Keras 3 for all new
85
+ users, as it enables using KerasNLP models and layers with JAX, TensorFlow and
86
+ PyTorch.
87
+
88
+ ### Keras 2 Installation
89
+
90
+ To install the latest KerasNLP release with Keras 2, simply run:
86
91
 
87
92
  ```
88
- pip install keras-nlp --upgrade
93
+ pip install --upgrade keras-nlp
89
94
  ```
90
95
 
91
- To install the latest unreleased changes to the library, we recommend using
92
- pip to install directly from the master branch on github:
96
+ ### Keras 3 Installation
97
+
98
+ There are currently two ways to install Keras 3 with KerasNLP. To install the
99
+ stable versions of KerasNLP and Keras 3, you should install Keras 3 **after**
100
+ installing KerasNLP. This is a temporary step while TensorFlow is pinned to
101
+ Keras 2, and will no longer be necessary after TensorFlow 2.16.
93
102
 
94
103
  ```
95
- pip install git+https://github.com/keras-team/keras-nlp.git --upgrade
104
+ pip install --upgrade keras-nlp
105
+ pip install --upgrade "keras>=3"
96
106
  ```
97
107
  ## Using KerasNLP with Keras Core
98
108
 
@@ -123,12 +133,28 @@ Until Keras Core is officially released as Keras 3.0, KerasNLP will use
123
133
  `.keras/keras_nlp.json`. You will need to restart the Python runtime for changes
124
134
  to take effect.
125
135
 
136
+ To install the latest nightly changes for both KerasNLP and Keras, you can use
137
+ our nightly package.
138
+
139
+ ```
140
+ pip install --upgrade keras-nlp-nightly
141
+ ```
142
+
143
+ > [!IMPORTANT]
144
+ > Keras 3 will not function with TensorFlow 2.14 or earlier.
145
+
146
+ Read [Getting started with Keras](https://keras.io/getting_started/) for more information
147
+ on installing Keras 3 and compatibility with different frameworks.
148
+
126
149
  ## Quickstart
127
150
 
128
151
  Fine-tune BERT on a small sentiment analysis task using the
129
152
  [`keras_nlp.models`](https://keras.io/api/keras_nlp/models/) API:
130
153
 
131
154
  ```python
155
+ import os
156
+ os.environ["KERAS_BACKEND"] = "tensorflow" # Or "jax" or "torch"!
157
+
132
158
  import keras_nlp
133
159
  import tensorflow_datasets as tfds
134
160
 
@@ -151,6 +177,29 @@ classifier.predict(["What an amazing movie!", "A total waste of my time."])
151
177
 
152
178
  For more in depth guides and examples, visit https://keras.io/keras_nlp/.
153
179
 
180
+ ## Configuring your backend
181
+
182
+ If you have Keras 3 installed in your environment (see installation above),
183
+ you can use KerasNLP with any of JAX, TensorFlow and PyTorch. To do so, set the
184
+ `KERAS_BACKEND` environment variable. For example:
185
+
186
+ ```shell
187
+ export KERAS_BACKEND=jax
188
+ ```
189
+
190
+ Or in Colab, with:
191
+
192
+ ```python
193
+ import os
194
+ os.environ["KERAS_BACKEND"] = "jax"
195
+
196
+ import keras_nlp
197
+ ```
198
+
199
+ > [!IMPORTANT]
200
+ > Make sure to set the `KERAS_BACKEND` before importing any Keras libraries; it
201
+ > will be used to set up Keras when it is first imported.
202
+
154
203
  ## Compatibility
155
204
 
156
205
  We follow [Semantic Versioning](https://semver.org/), and plan to
@@ -4,11 +4,10 @@
4
4
  ![Tensorflow](https://img.shields.io/badge/tensorflow-v2.5.0+-success.svg)
5
5
  [![contributions welcome](https://img.shields.io/badge/contributions-welcome-brightgreen.svg?style=flat)](https://github.com/keras-team/keras-nlp/issues)
6
6
 
7
- KerasNLP is a natural language processing library that works natively
8
- with TensorFlow, JAX, or PyTorch. Built on [Keras Core](https://keras.io/keras_core/announcement/),
9
- these models, layers, metrics, callbacks, etc., can be trained and serialized
10
- in any framework and re-used in another without costly migrations. See "Using
11
- KerasNLP with Keras Core" below for more details on multi-framework KerasNLP.
7
+ KerasNLP is a natural language processing library that works natively
8
+ with TensorFlow, JAX, or PyTorch. Built on Keras 3, these models, layers,
9
+ metrics, and tokenizers can be trained and serialized in any framework and
10
+ re-used in another without costly migrations.
12
11
 
13
12
  KerasNLP supports users through their entire development cycle. Our workflows
14
13
  are built from modular components that have state-of-the-art preset weights and
@@ -47,17 +46,28 @@ We are a new and growing project and welcome [contributions](CONTRIBUTING.md).
47
46
 
48
47
  ## Installation
49
48
 
50
- To install the latest official release:
49
+ KerasNLP supports both Keras 2 and Keras 3. We recommend Keras 3 for all new
50
+ users, as it enables using KerasNLP models and layers with JAX, TensorFlow and
51
+ PyTorch.
52
+
53
+ ### Keras 2 Installation
54
+
55
+ To install the latest KerasNLP release with Keras 2, simply run:
51
56
 
52
57
  ```
53
- pip install keras-nlp --upgrade
58
+ pip install --upgrade keras-nlp
54
59
  ```
55
60
 
56
- To install the latest unreleased changes to the library, we recommend using
57
- pip to install directly from the master branch on github:
61
+ ### Keras 3 Installation
62
+
63
+ There are currently two ways to install Keras 3 with KerasNLP. To install the
64
+ stable versions of KerasNLP and Keras 3, you should install Keras 3 **after**
65
+ installing KerasNLP. This is a temporary step while TensorFlow is pinned to
66
+ Keras 2, and will no longer be necessary after TensorFlow 2.16.
58
67
 
59
68
  ```
60
- pip install git+https://github.com/keras-team/keras-nlp.git --upgrade
69
+ pip install --upgrade keras-nlp
70
+ pip install --upgrade "keras>=3"
61
71
  ```
62
72
  ## Using KerasNLP with Keras Core
63
73
 
@@ -88,12 +98,28 @@ Until Keras Core is officially released as Keras 3.0, KerasNLP will use
88
98
  `.keras/keras_nlp.json`. You will need to restart the Python runtime for changes
89
99
  to take effect.
90
100
 
101
+ To install the latest nightly changes for both KerasNLP and Keras, you can use
102
+ our nightly package.
103
+
104
+ ```
105
+ pip install --upgrade keras-nlp-nightly
106
+ ```
107
+
108
+ > [!IMPORTANT]
109
+ > Keras 3 will not function with TensorFlow 2.14 or earlier.
110
+
111
+ Read [Getting started with Keras](https://keras.io/getting_started/) for more information
112
+ on installing Keras 3 and compatibility with different frameworks.
113
+
91
114
  ## Quickstart
92
115
 
93
116
  Fine-tune BERT on a small sentiment analysis task using the
94
117
  [`keras_nlp.models`](https://keras.io/api/keras_nlp/models/) API:
95
118
 
96
119
  ```python
120
+ import os
121
+ os.environ["KERAS_BACKEND"] = "tensorflow" # Or "jax" or "torch"!
122
+
97
123
  import keras_nlp
98
124
  import tensorflow_datasets as tfds
99
125
 
@@ -116,6 +142,29 @@ classifier.predict(["What an amazing movie!", "A total waste of my time."])
116
142
 
117
143
  For more in depth guides and examples, visit https://keras.io/keras_nlp/.
118
144
 
145
+ ## Configuring your backend
146
+
147
+ If you have Keras 3 installed in your environment (see installation above),
148
+ you can use KerasNLP with any of JAX, TensorFlow and PyTorch. To do so, set the
149
+ `KERAS_BACKEND` environment variable. For example:
150
+
151
+ ```shell
152
+ export KERAS_BACKEND=jax
153
+ ```
154
+
155
+ Or in Colab, with:
156
+
157
+ ```python
158
+ import os
159
+ os.environ["KERAS_BACKEND"] = "jax"
160
+
161
+ import keras_nlp
162
+ ```
163
+
164
+ > [!IMPORTANT]
165
+ > Make sure to set the `KERAS_BACKEND` before importing any Keras libraries; it
166
+ > will be used to set up Keras when it is first imported.
167
+
119
168
  ## Compatibility
120
169
 
121
170
  We follow [Semantic Versioning](https://semver.org/), and plan to
@@ -12,4 +12,4 @@ from keras_nlp import samplers
12
12
  from keras_nlp import tokenizers
13
13
 
14
14
 
15
- __version__ = "0.6.3.dev0"
15
+ __version__ = "0.6.4.dev0"
@@ -28,5 +28,5 @@ from keras_nlp.src import tokenizers
28
28
  from keras_nlp.src import utils
29
29
 
30
30
  # This is the global source of truth for the version number.
31
- __version__ = "0.6.3.dev0"
31
+ __version__ = "0.6.4.dev0"
32
32
 
@@ -14,14 +14,16 @@
14
14
  """
15
15
  Keras backend module.
16
16
 
17
- This module adds a temporarily Keras API surface that is fully under KerasNLP
18
- control. This allows us to switch between `keras_core` and `tf.keras`, as well
19
- as add shims to support older version of `tf.keras`.
17
+ This module adds a temporary Keras API surface that is fully under KerasNLP
18
+ control. The goal is to allow us to write Keras 3-like code everywhere, while
19
+ still supporting Keras 2. We do this by using the `keras_core` package with
20
+ Keras 2 to backport Keras 3 numerics APIs (`keras.ops` and `keras.random`) into
21
+ Keras 2. The sub-modules exposed are as follows:
20
22
 
21
- - `config`: check which backend is being run.
22
- - `keras`: The full `keras` API (via `keras_core` or `tf.keras`).
23
- - `ops`: `keras_core.ops`, always tf backed if using `tf.keras`.
24
- - `random`: `keras_core.random`, always tf backed if using `tf.keras`.
23
+ - `config`: check which version of Keras is being run.
24
+ - `keras`: The full `keras` API with compat shims for older Keras versions.
25
+ - `ops`: `keras.ops` for Keras 3 or `keras_core.ops` for Keras 2.
26
+ - `random`: `keras.random` for Keras 3 or `keras_core.random` for Keras 2.
25
27
  """
26
28
 
27
29
  from keras_nlp.src.backend import config
@@ -0,0 +1,64 @@
1
+ # Copyright 2023 The KerasNLP Authors
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # https://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ import os
16
+
17
+
18
+ def detect_if_tensorflow_uses_keras_3():
19
+ # We follow the version of keras that tensorflow is configured to use.
20
+ try:
21
+ from tensorflow import keras
22
+
23
+ # Note that only recent versions of keras have a `version()` function.
24
+ if hasattr(keras, "version") and keras.version().startswith("3."):
25
+ return True
26
+ except:
27
+ raise ValueError(
28
+ "Unable to import `keras` with `tensorflow`. Please check your "
29
+ "Keras and Tensorflow version are compatible; Keras 3 requires "
30
+ "TensorFlow 2.15 or later. See keras.io/getting_started for more "
31
+ "information on installing Keras."
32
+ )
33
+
34
+ # No `keras.version()` means we are on an old version of keras.
35
+ return False
36
+
37
+
38
+ _USE_KERAS_3 = detect_if_tensorflow_uses_keras_3()
39
+
40
+ if not _USE_KERAS_3:
41
+ backend = os.environ.get("KERAS_BACKEND")
42
+ if backend and backend != "tensorflow":
43
+ raise RuntimeError(
44
+ "When running Keras 2, the `KERAS_BACKEND` environment variable "
45
+ f"must either be unset or `'tensorflow'`. Received: `{backend}`. "
46
+ "To set another backend, please install Keras 3. See "
47
+ "https://github.com/keras-team/keras-nlp#installation"
48
+ )
49
+
50
+
51
+ def keras_3():
52
+ """Check if Keras 3 is being used."""
53
+ return _USE_KERAS_3
54
+
55
+
56
+ def backend():
57
+ """Check the backend framework."""
58
+ if not keras_3():
59
+ return "tensorflow"
60
+
61
+ import keras
62
+
63
+ return keras.config.backend()
64
+
@@ -20,8 +20,6 @@ from keras_nlp.src.backend import config
20
20
 
21
21
  if config.keras_3():
22
22
  from keras import * # noqa: F403, F401
23
- elif config.multi_backend():
24
- from keras_core import * # noqa: F403, F401
25
23
  else:
26
24
  from tensorflow.keras import * # noqa: F403, F401
27
25
 
@@ -12,8 +12,6 @@
12
12
  # See the License for the specific language governing permissions and
13
13
  # limitations under the License.
14
14
 
15
- import os
16
-
17
15
  import pytest
18
16
  import tensorflow as tf
19
17
 
@@ -21,21 +19,6 @@ from keras_nlp.src.backend import config as backend_config
21
19
  from keras_nlp.src.backend import keras
22
20
 
23
21
 
24
- @pytest.fixture(scope="session")
25
- def tpu_strategy():
26
- tpu_name = os.getenv("KUBE_GOOGLE_CLOUD_TPU_ENDPOINTS")
27
- resolver = tf.distribute.cluster_resolver.TPUClusterResolver.connect(
28
- tpu=tpu_name,
29
- )
30
- return tf.distribute.TPUStrategy(resolver)
31
-
32
-
33
- @pytest.fixture(scope="class")
34
- def tpu_test_class(request, tpu_strategy):
35
- # set a class attribute on the invoking test context
36
- request.cls.tpu_strategy = tpu_strategy
37
-
38
-
39
22
  def pytest_addoption(parser):
40
23
  parser.addoption(
41
24
  "--run_large",
@@ -49,18 +32,6 @@ def pytest_addoption(parser):
49
32
  default=False,
50
33
  help="run extra_large tests",
51
34
  )
52
- parser.addoption(
53
- "--run_tpu",
54
- action="store_true",
55
- default=False,
56
- help="run tpu tests",
57
- )
58
- parser.addoption(
59
- "--mixed_precision",
60
- action="store_true",
61
- default=False,
62
- help="run with mixed precision",
63
- )
64
35
  parser.addoption(
65
36
  "--docstring_module",
66
37
  action="store",
@@ -70,18 +41,13 @@ def pytest_addoption(parser):
70
41
 
71
42
 
72
43
  def pytest_configure(config):
73
- if config.getoption("--mixed_precision"):
74
- keras.mixed_precision.set_global_policy("mixed_float16")
75
- config.addinivalue_line(
76
- "markers", "large: mark test as being slow or requiring a network"
77
- )
78
44
  config.addinivalue_line(
79
45
  "markers",
80
- "extra_large: mark test as being too large to run continuously",
46
+ "large: mark test as being slow or requiring a network",
81
47
  )
82
48
  config.addinivalue_line(
83
49
  "markers",
84
- "tpu: mark test as tpu test",
50
+ "extra_large: mark test as being too large to run continuously",
85
51
  )
86
52
  config.addinivalue_line(
87
53
  "markers",
@@ -93,7 +59,6 @@ def pytest_collection_modifyitems(config, items):
93
59
  run_extra_large_tests = config.getoption("--run_extra_large")
94
60
  # Run large tests for --run_extra_large or --run_large.
95
61
  run_large_tests = config.getoption("--run_large") or run_extra_large_tests
96
- run_tpu = config.getoption("--run_tpu")
97
62
 
98
63
  # Messages to annotate skipped tests with.
99
64
  skip_large = pytest.mark.skipif(
@@ -104,32 +69,27 @@ def pytest_collection_modifyitems(config, items):
104
69
  not run_extra_large_tests,
105
70
  reason="need --run_extra_large option to run",
106
71
  )
107
- skip_tpu = pytest.mark.skipif(
108
- not run_tpu,
109
- reason="need --run_tpu option to run",
110
- )
111
- skip_tf_only = pytest.mark.skipif(
72
+ tf_only = pytest.mark.skipif(
112
73
  not backend_config.backend() == "tensorflow",
113
74
  reason="tests only run on tf backend",
114
75
  )
76
+ keras_3_only = pytest.mark.skipif(
77
+ not backend_config.keras_3(),
78
+ reason="tests only run on with multi-backend keras",
79
+ )
115
80
  for item in items:
116
81
  if "large" in item.keywords:
117
82
  item.add_marker(skip_large)
118
83
  if "extra_large" in item.keywords:
119
84
  item.add_marker(skip_extra_large)
120
- if "tpu" in item.keywords:
121
- item.add_marker(skip_tpu)
122
85
  if "tf_only" in item.keywords:
123
- item.add_marker(skip_tf_only)
86
+ item.add_marker(tf_only)
87
+ if "keras_3_only" in item.keywords:
88
+ item.add_marker(keras_3_only)
124
89
 
125
90
 
126
91
  # Disable traceback filtering for quicker debugging of test failures.
127
92
  tf.debugging.disable_traceback_filtering()
128
- if backend_config.multi_backend():
93
+ if backend_config.keras_3():
129
94
  keras.config.disable_traceback_filtering()
130
95
 
131
- # One off setup for dtensor tests.
132
- if not backend_config.multi_backend():
133
- keras.backend.experimental.enable_tf_random_generator()
134
- keras.utils.set_random_seed(1337)
135
-
@@ -18,6 +18,7 @@ from keras_nlp.src.layers.modeling.cached_multi_head_attention import (
18
18
  from keras_nlp.src.layers.modeling.f_net_encoder import FNetEncoder
19
19
  from keras_nlp.src.layers.modeling.masked_lm_head import MaskedLMHead
20
20
  from keras_nlp.src.layers.modeling.position_embedding import PositionEmbedding
21
+ from keras_nlp.src.layers.modeling.reversible_embedding import ReversibleEmbedding
21
22
  from keras_nlp.src.layers.modeling.rotary_embedding import RotaryEmbedding
22
23
  from keras_nlp.src.layers.modeling.sine_position_encoding import (
23
24
  SinePositionEncoding,
@@ -36,9 +36,9 @@ class CachedMultiHeadAttentionTest(TestCase):
36
36
  expected_output_shape=(2, 4, 6),
37
37
  expected_num_trainable_weights=8,
38
38
  expected_num_non_trainable_variables=1,
39
- # tf.keras does not handle mixed precision correctly when not set
39
+ # Keras 2 does not handle mixed precision correctly when not set
40
40
  # globally.
41
- run_mixed_precision_check=config.multi_backend(),
41
+ run_mixed_precision_check=config.keras_3(),
42
42
  )
43
43
 
44
44
  def test_cache_call_is_correct(self):
@@ -102,34 +102,3 @@ class AlbertBackboneTest(TestCase):
102
102
  model_output["pooled_output"], restored_output["pooled_output"]
103
103
  )
104
104
 
105
-
106
- @pytest.mark.tpu
107
- @pytest.mark.usefixtures("tpu_test_class")
108
- class AlbertBackboneTPUTest(TestCase):
109
- def setUp(self):
110
- with self.tpu_strategy.scope():
111
- self.backbone = AlbertBackbone(
112
- vocabulary_size=10,
113
- num_layers=2,
114
- num_heads=2,
115
- num_groups=1,
116
- num_inner_repetitions=1,
117
- embedding_dim=16,
118
- hidden_dim=2,
119
- intermediate_dim=2,
120
- max_sequence_length=4,
121
- )
122
-
123
- self.input_batch = {
124
- "token_ids": np.ones((8, 128), dtype="int32"),
125
- "segment_ids": np.ones((8, 128), dtype="int32"),
126
- "padding_mask": np.ones((8, 128), dtype="int32"),
127
- }
128
- self.input_dataset = tf.data.Dataset.from_tensor_slices(
129
- self.input_batch
130
- ).batch(2)
131
-
132
- def test_predict(self):
133
- self.backbone.compile()
134
- self.backbone.predict(self.input_dataset)
135
-
@@ -92,31 +92,3 @@ class BartBackboneTest(TestCase):
92
92
  restored_output["decoder_sequence_output"],
93
93
  )
94
94
 
95
-
96
- @pytest.mark.tpu
97
- @pytest.mark.usefixtures("tpu_test_class")
98
- class BartBackboneTPUTest(TestCase):
99
- def setUp(self):
100
- with self.tpu_strategy.scope():
101
- self.backbone = BartBackbone(
102
- vocabulary_size=1000,
103
- num_layers=2,
104
- num_heads=2,
105
- hidden_dim=64,
106
- intermediate_dim=128,
107
- max_sequence_length=128,
108
- )
109
- self.input_batch = {
110
- "encoder_token_ids": np.ones((8, 128), dtype="int32"),
111
- "encoder_padding_mask": np.ones((8, 128), dtype="int32"),
112
- "decoder_token_ids": np.ones((8, 128), dtype="int32"),
113
- "decoder_padding_mask": np.ones((8, 128), dtype="int32"),
114
- }
115
- self.input_dataset = tf.data.Dataset.from_tensor_slices(
116
- self.input_batch
117
- ).batch(2)
118
-
119
- def test_predict(self):
120
- self.backbone.compile()
121
- self.backbone.predict(self.input_dataset)
122
-
@@ -86,30 +86,3 @@ class BertBackboneTest(TestCase):
86
86
  restored_output = restored_model(self.input_batch)
87
87
  self.assertAllClose(model_output, restored_output)
88
88
 
89
-
90
- @pytest.mark.tpu
91
- @pytest.mark.usefixtures("tpu_test_class")
92
- class BertBackboneTPUTest(TestCase):
93
- def setUp(self):
94
- with self.tpu_strategy.scope():
95
- self.backbone = BertBackbone(
96
- vocabulary_size=1000,
97
- num_layers=2,
98
- num_heads=2,
99
- hidden_dim=64,
100
- intermediate_dim=128,
101
- max_sequence_length=128,
102
- )
103
- self.input_batch = {
104
- "token_ids": np.ones((8, 128), dtype="int32"),
105
- "segment_ids": np.ones((8, 128), dtype="int32"),
106
- "padding_mask": np.ones((8, 128), dtype="int32"),
107
- }
108
- self.input_dataset = tf.data.Dataset.from_tensor_slices(
109
- self.input_batch
110
- ).batch(2)
111
-
112
- def test_predict(self):
113
- self.backbone.compile()
114
- self.backbone.predict(self.input_dataset)
115
-
@@ -91,30 +91,3 @@ class DebertaV3BackboneTest(TestCase):
91
91
  restored_output = restored_model(self.input_batch)
92
92
  self.assertAllClose(model_output, restored_output)
93
93
 
94
-
95
- @pytest.mark.tpu
96
- @pytest.mark.usefixtures("tpu_test_class")
97
- class DebertaV3BackboneTPUTest(TestCase):
98
- def setUp(self):
99
- with self.tpu_strategy.scope():
100
- self.backbone = DebertaV3Backbone(
101
- vocabulary_size=10,
102
- num_layers=2,
103
- num_heads=2,
104
- hidden_dim=2,
105
- intermediate_dim=4,
106
- max_sequence_length=5,
107
- bucket_size=2,
108
- )
109
- self.input_batch = {
110
- "token_ids": np.ones((2, 5), dtype="int32"),
111
- "padding_mask": np.ones((2, 5), dtype="int32"),
112
- }
113
- self.input_dataset = tf.data.Dataset.from_tensor_slices(
114
- self.input_batch
115
- ).batch(2)
116
-
117
- def test_predict(self):
118
- self.backbone.compile()
119
- self.backbone.predict(self.input_dataset)
120
-
@@ -232,12 +232,13 @@ class DisentangledSelfAttention(keras.layers.Layer):
232
232
  x1=rel_pos,
233
233
  x2=log_pos * sign,
234
234
  )
235
- bucket_pos = ops.cast(bucket_pos, dtype="int64")
235
+ bucket_pos = ops.cast(bucket_pos, dtype="int")
236
236
 
237
237
  return bucket_pos
238
238
 
239
239
  def _get_rel_pos(self, num_positions):
240
- ids = ops.arange(num_positions, dtype="int64")
240
+ ids = ops.arange(num_positions)
241
+ ids = ops.cast(ids, dtype="int")
241
242
  query_ids = ops.expand_dims(ids, axis=-1)
242
243
  key_ids = ops.expand_dims(ids, axis=0)
243
244
  key_ids = ops.repeat(key_ids, repeats=num_positions, axis=0)
@@ -84,29 +84,3 @@ class DistilBertTest(TestCase):
84
84
  restored_output = restored_model(self.input_batch)
85
85
  self.assertAllClose(model_output, restored_output)
86
86
 
87
-
88
- @pytest.mark.tpu
89
- @pytest.mark.usefixtures("tpu_test_class")
90
- class DistilBertTPUTest(TestCase):
91
- def setUp(self):
92
- with self.tpu_strategy.scope():
93
- self.backbone = DistilBertBackbone(
94
- vocabulary_size=1000,
95
- num_layers=2,
96
- num_heads=2,
97
- hidden_dim=64,
98
- intermediate_dim=128,
99
- max_sequence_length=128,
100
- )
101
- self.input_batch = {
102
- "token_ids": np.ones((8, 128), dtype="int32"),
103
- "padding_mask": np.ones((8, 128), dtype="int32"),
104
- }
105
- self.input_dataset = tf.data.Dataset.from_tensor_slices(
106
- self.input_batch
107
- ).batch(2)
108
-
109
- def test_predict(self):
110
- self.backbone.compile()
111
- self.backbone.predict(self.input_dataset)
112
-