keras-nlp 0.6.3.dev0__tar.gz → 0.6.4.dev0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/PKG-INFO +60 -11
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/README.md +59 -10
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/__init__.py +1 -1
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/__init__.py +1 -1
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/backend/__init__.py +9 -7
- keras-nlp-0.6.4.dev0/keras_nlp/src/backend/config.py +64 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/backend/keras.py +0 -2
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/conftest.py +11 -51
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/__init__.py +1 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/cached_multi_head_attention_test.py +2 -2
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_backbone_test.py +0 -31
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_backbone_test.py +0 -28
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_backbone_test.py +0 -27
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_backbone_test.py +0 -27
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/disentangled_self_attention.py +3 -2
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_backbone_test.py +0 -26
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_backbone_test.py +0 -26
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_backbone.py +0 -72
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_backbone_test.py +0 -43
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_causal_lm.py +0 -36
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_causal_lm_test.py +0 -10
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_backbone_test.py +0 -26
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_backbone.py +0 -72
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_backbone_test.py +0 -43
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_causal_lm.py +0 -36
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_causal_lm_test.py +0 -10
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_backbone_test.py +0 -26
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_backbone_test.py +0 -27
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/task.py +4 -1
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_backbone_test.py +0 -41
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_backbone_test.py +0 -26
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlnet/xlnet_backbone_test.py +0 -28
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tests/test_case.py +8 -6
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/tensor_utils.py +1 -1
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp.egg-info/PKG-INFO +60 -11
- keras-nlp-0.6.3.dev0/keras_nlp/src/backend/config.py +0 -105
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/layers/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/metrics/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/models/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/samplers/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/api_export.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/backend/ops.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/backend/random.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/cached_multi_head_attention.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/f_net_encoder.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/f_net_encoder_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/masked_lm_head.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/masked_lm_head_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/position_embedding.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/position_embedding_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/reversible_embedding.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/reversible_embedding_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/rotary_embedding.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/rotary_embedding_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/sine_position_encoding.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/sine_position_encoding_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/token_and_position_embedding.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/token_and_position_embedding_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/transformer_decoder.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/transformer_decoder_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/transformer_encoder.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/transformer_encoder_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/transformer_layer_utils.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/modeling/transformer_layer_utils_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/masked_lm_mask_generator.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/masked_lm_mask_generator_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/multi_segment_packer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/multi_segment_packer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/preprocessing_layer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/random_deletion.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/random_deletion_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/random_swap.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/random_swap_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/start_end_packer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/layers/preprocessing/start_end_packer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/bleu.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/bleu_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/edit_distance.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/edit_distance_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/perplexity.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/perplexity_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/rouge_base.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/rouge_l.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/rouge_l_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/rouge_n.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/metrics/rouge_n_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_classifier.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_classifier_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_masked_lm.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_masked_lm_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_masked_lm_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_masked_lm_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_presets.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_presets_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_presets.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_presets_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_seq_2_seq_lm.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_seq_2_seq_lm_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_seq_2_seq_lm_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_seq_2_seq_lm_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_classifier.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_classifier_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_masked_lm.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_masked_lm_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_masked_lm_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_masked_lm_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_presets.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_presets_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_classifier.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_classifier_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_masked_lm.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_masked_lm_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_masked_lm_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_masked_lm_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_presets.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_presets_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/deberta_v3_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/disentangled_attention_encoder.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/deberta_v3/relative_embedding.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_classifier.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_classifier_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_masked_lm.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_masked_lm_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_masked_lm_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_masked_lm_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_presets.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_presets_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/distil_bert/distil_bert_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_classifier.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_classifier_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_masked_lm.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_masked_lm_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_masked_lm_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_masked_lm_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_presets.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_presets_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/f_net/f_net_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/generative_task.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_causal_lm_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_causal_lm_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_presets.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_presets_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt2/gpt2_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_attention.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_causal_lm.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_causal_lm_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_causal_lm_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_causal_lm_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_decoder.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/gpt_neo_x/gpt_neo_x_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_causal_lm_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_causal_lm_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_presets.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_presets_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/opt/opt_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_classifier.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_classifier_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_masked_lm.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_masked_lm_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_masked_lm_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_masked_lm_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_presets.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_presets_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/roberta/roberta_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_layer_norm.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_multi_head_attention.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/t5/t5_transformer_layer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/task_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_audio_feature_extractor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_audio_feature_extractor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_decoder.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_encoder.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_presets.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_presets_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/whisper/whisper_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_classifier.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_classifier_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_masked_lm.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_masked_lm_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_masked_lm_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_masked_lm_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_preprocessor.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_preprocessor_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_presets.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_presets_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlm_roberta/xlm_roberta_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlnet/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlnet/relative_attention.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlnet/xlnet_backbone.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlnet/xlnet_content_and_query_embedding.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/xlnet/xlnet_encoder.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/beam_sampler.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/beam_sampler_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/contrastive_sampler.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/contrastive_sampler_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/greedy_sampler.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/greedy_sampler_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/random_sampler.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/random_sampler_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/sampler.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/serialization.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/serialization_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/top_k_sampler.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/top_k_sampler_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/top_p_sampler.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/samplers/top_p_sampler_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tests/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tests/doc_tests/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tests/doc_tests/docstring_lib.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tests/doc_tests/docstring_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tests/doc_tests/fenced_docstring_lib.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/byte_pair_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/byte_pair_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/byte_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/byte_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/sentence_piece_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/sentence_piece_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/sentence_piece_tokenizer_trainer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/sentence_piece_tokenizer_trainer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/unicode_codepoint_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/unicode_codepoint_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/word_piece_tokenizer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/word_piece_tokenizer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/word_piece_tokenizer_trainer.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/tokenizers/word_piece_tokenizer_trainer_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/keras_utils.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/keras_utils_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/pipeline_model.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/pipeline_model_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/python_utils.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/python_utils_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/utils/tensor_utils_test.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/tokenizers/__init__.py +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp.egg-info/SOURCES.txt +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp.egg-info/dependency_links.txt +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp.egg-info/requires.txt +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp.egg-info/top_level.txt +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/setup.cfg +0 -0
- {keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/setup.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: keras-nlp
|
|
3
|
-
Version: 0.6.3.dev0
|
|
3
|
+
Version: 0.6.4.dev0
|
|
4
4
|
Summary: Industry-strength Natural Language Processing extensions for Keras.
|
|
5
5
|
Home-page: https://github.com/keras-team/keras-nlp
|
|
6
6
|
Author: Keras team
|
|
@@ -39,11 +39,10 @@ Requires-Dist: sentencepiece; extra == "extras"
|
|
|
39
39
|

|
|
40
40
|
[](https://github.com/keras-team/keras-nlp/issues)
|
|
41
41
|
|
|
42
|
-
KerasNLP is a natural language processing library that works natively
|
|
43
|
-
with TensorFlow, JAX, or PyTorch. Built on
|
|
44
|
-
|
|
45
|
-
|
|
46
|
-
KerasNLP with Keras Core" below for more details on multi-framework KerasNLP.
|
|
42
|
+
KerasNLP is a natural language processing library that works natively
|
|
43
|
+
with TensorFlow, JAX, or PyTorch. Built on Keras 3, these models, layers,
|
|
44
|
+
metrics, and tokenizers can be trained and serialized in any framework and
|
|
45
|
+
re-used in another without costly migrations.
|
|
47
46
|
|
|
48
47
|
KerasNLP supports users through their entire development cycle. Our workflows
|
|
49
48
|
are built from modular components that have state-of-the-art preset weights and
|
|
@@ -82,17 +81,28 @@ We are a new and growing project and welcome [contributions](CONTRIBUTING.md).
|
|
|
82
81
|
|
|
83
82
|
## Installation
|
|
84
83
|
|
|
85
|
-
|
|
84
|
+
KerasNLP supports both Keras 2 and Keras 3. We recommend Keras 3 for all new
|
|
85
|
+
users, as it enables using KerasNLP models and layers with JAX, TensorFlow and
|
|
86
|
+
PyTorch.
|
|
87
|
+
|
|
88
|
+
### Keras 2 Installation
|
|
89
|
+
|
|
90
|
+
To install the latest KerasNLP release with Keras 2, simply run:
|
|
86
91
|
|
|
87
92
|
```
|
|
88
|
-
pip install keras-nlp
|
|
93
|
+
pip install --upgrade keras-nlp
|
|
89
94
|
```
|
|
90
95
|
|
|
91
|
-
|
|
92
|
-
|
|
96
|
+
### Keras 3 Installation
|
|
97
|
+
|
|
98
|
+
There are currently two ways to install Keras 3 with KerasNLP. To install the
|
|
99
|
+
stable versions of KerasNLP and Keras 3, you should install Keras 3 **after**
|
|
100
|
+
installing KerasNLP. This is a temporary step while TensorFlow is pinned to
|
|
101
|
+
Keras 2, and will no longer be necessary after TensorFlow 2.16.
|
|
93
102
|
|
|
94
103
|
```
|
|
95
|
-
pip install
|
|
104
|
+
pip install --upgrade keras-nlp
|
|
105
|
+
pip install --upgrade "keras>=3"
|
|
96
106
|
```
|
|
97
107
|
## Using KerasNLP with Keras Core
|
|
98
108
|
|
|
@@ -123,12 +133,28 @@ Until Keras Core is officially released as Keras 3.0, KerasNLP will use
|
|
|
123
133
|
`.keras/keras_nlp.json`. You will need to restart the Python runtime for changes
|
|
124
134
|
to take effect.
|
|
125
135
|
|
|
136
|
+
To install the latest nightly changes for both KerasNLP and Keras, you can use
|
|
137
|
+
our nightly package.
|
|
138
|
+
|
|
139
|
+
```
|
|
140
|
+
pip install --upgrade keras-nlp-nightly
|
|
141
|
+
```
|
|
142
|
+
|
|
143
|
+
> [!IMPORTANT]
|
|
144
|
+
> Keras 3 will not function with TensorFlow 2.14 or earlier.
|
|
145
|
+
|
|
146
|
+
Read [Getting started with Keras](https://keras.io/getting_started/) for more information
|
|
147
|
+
on installing Keras 3 and compatibility with different frameworks.
|
|
148
|
+
|
|
126
149
|
## Quickstart
|
|
127
150
|
|
|
128
151
|
Fine-tune BERT on a small sentiment analysis task using the
|
|
129
152
|
[`keras_nlp.models`](https://keras.io/api/keras_nlp/models/) API:
|
|
130
153
|
|
|
131
154
|
```python
|
|
155
|
+
import os
|
|
156
|
+
os.environ["KERAS_BACKEND"] = "tensorflow" # Or "jax" or "torch"!
|
|
157
|
+
|
|
132
158
|
import keras_nlp
|
|
133
159
|
import tensorflow_datasets as tfds
|
|
134
160
|
|
|
@@ -151,6 +177,29 @@ classifier.predict(["What an amazing movie!", "A total waste of my time."])
|
|
|
151
177
|
|
|
152
178
|
For more in depth guides and examples, visit https://keras.io/keras_nlp/.
|
|
153
179
|
|
|
180
|
+
## Configuring your backend
|
|
181
|
+
|
|
182
|
+
If you have Keras 3 installed in your environment (see installation above),
|
|
183
|
+
you can use KerasNLP with any of JAX, TensorFlow and PyTorch. To do so, set the
|
|
184
|
+
`KERAS_BACKEND` environment variable. For example:
|
|
185
|
+
|
|
186
|
+
```shell
|
|
187
|
+
export KERAS_BACKEND=jax
|
|
188
|
+
```
|
|
189
|
+
|
|
190
|
+
Or in Colab, with:
|
|
191
|
+
|
|
192
|
+
```python
|
|
193
|
+
import os
|
|
194
|
+
os.environ["KERAS_BACKEND"] = "jax"
|
|
195
|
+
|
|
196
|
+
import keras_nlp
|
|
197
|
+
```
|
|
198
|
+
|
|
199
|
+
> [!IMPORTANT]
|
|
200
|
+
> Make sure to set the `KERAS_BACKEND` before importing any Keras libraries; it
|
|
201
|
+
> will be used to set up Keras when it is first imported.
|
|
202
|
+
|
|
154
203
|
## Compatibility
|
|
155
204
|
|
|
156
205
|
We follow [Semantic Versioning](https://semver.org/), and plan to
|
|
@@ -4,11 +4,10 @@
|
|
|
4
4
|

|
|
5
5
|
[](https://github.com/keras-team/keras-nlp/issues)
|
|
6
6
|
|
|
7
|
-
KerasNLP is a natural language processing library that works natively
|
|
8
|
-
with TensorFlow, JAX, or PyTorch. Built on
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
KerasNLP with Keras Core" below for more details on multi-framework KerasNLP.
|
|
7
|
+
KerasNLP is a natural language processing library that works natively
|
|
8
|
+
with TensorFlow, JAX, or PyTorch. Built on Keras 3, these models, layers,
|
|
9
|
+
metrics, and tokenizers can be trained and serialized in any framework and
|
|
10
|
+
re-used in another without costly migrations.
|
|
12
11
|
|
|
13
12
|
KerasNLP supports users through their entire development cycle. Our workflows
|
|
14
13
|
are built from modular components that have state-of-the-art preset weights and
|
|
@@ -47,17 +46,28 @@ We are a new and growing project and welcome [contributions](CONTRIBUTING.md).
|
|
|
47
46
|
|
|
48
47
|
## Installation
|
|
49
48
|
|
|
50
|
-
|
|
49
|
+
KerasNLP supports both Keras 2 and Keras 3. We recommend Keras 3 for all new
|
|
50
|
+
users, as it enables using KerasNLP models and layers with JAX, TensorFlow and
|
|
51
|
+
PyTorch.
|
|
52
|
+
|
|
53
|
+
### Keras 2 Installation
|
|
54
|
+
|
|
55
|
+
To install the latest KerasNLP release with Keras 2, simply run:
|
|
51
56
|
|
|
52
57
|
```
|
|
53
|
-
pip install keras-nlp
|
|
58
|
+
pip install --upgrade keras-nlp
|
|
54
59
|
```
|
|
55
60
|
|
|
56
|
-
|
|
57
|
-
|
|
61
|
+
### Keras 3 Installation
|
|
62
|
+
|
|
63
|
+
There are currently two ways to install Keras 3 with KerasNLP. To install the
|
|
64
|
+
stable versions of KerasNLP and Keras 3, you should install Keras 3 **after**
|
|
65
|
+
installing KerasNLP. This is a temporary step while TensorFlow is pinned to
|
|
66
|
+
Keras 2, and will no longer be necessary after TensorFlow 2.16.
|
|
58
67
|
|
|
59
68
|
```
|
|
60
|
-
pip install
|
|
69
|
+
pip install --upgrade keras-nlp
|
|
70
|
+
pip install --upgrade "keras>=3"
|
|
61
71
|
```
|
|
62
72
|
## Using KerasNLP with Keras Core
|
|
63
73
|
|
|
@@ -88,12 +98,28 @@ Until Keras Core is officially released as Keras 3.0, KerasNLP will use
|
|
|
88
98
|
`.keras/keras_nlp.json`. You will need to restart the Python runtime for changes
|
|
89
99
|
to take effect.
|
|
90
100
|
|
|
101
|
+
To install the latest nightly changes for both KerasNLP and Keras, you can use
|
|
102
|
+
our nightly package.
|
|
103
|
+
|
|
104
|
+
```
|
|
105
|
+
pip install --upgrade keras-nlp-nightly
|
|
106
|
+
```
|
|
107
|
+
|
|
108
|
+
> [!IMPORTANT]
|
|
109
|
+
> Keras 3 will not function with TensorFlow 2.14 or earlier.
|
|
110
|
+
|
|
111
|
+
Read [Getting started with Keras](https://keras.io/getting_started/) for more information
|
|
112
|
+
on installing Keras 3 and compatibility with different frameworks.
|
|
113
|
+
|
|
91
114
|
## Quickstart
|
|
92
115
|
|
|
93
116
|
Fine-tune BERT on a small sentiment analysis task using the
|
|
94
117
|
[`keras_nlp.models`](https://keras.io/api/keras_nlp/models/) API:
|
|
95
118
|
|
|
96
119
|
```python
|
|
120
|
+
import os
|
|
121
|
+
os.environ["KERAS_BACKEND"] = "tensorflow" # Or "jax" or "torch"!
|
|
122
|
+
|
|
97
123
|
import keras_nlp
|
|
98
124
|
import tensorflow_datasets as tfds
|
|
99
125
|
|
|
@@ -116,6 +142,29 @@ classifier.predict(["What an amazing movie!", "A total waste of my time."])
|
|
|
116
142
|
|
|
117
143
|
For more in depth guides and examples, visit https://keras.io/keras_nlp/.
|
|
118
144
|
|
|
145
|
+
## Configuring your backend
|
|
146
|
+
|
|
147
|
+
If you have Keras 3 installed in your environment (see installation above),
|
|
148
|
+
you can use KerasNLP with any of JAX, TensorFlow and PyTorch. To do so, set the
|
|
149
|
+
`KERAS_BACKEND` environment variable. For example:
|
|
150
|
+
|
|
151
|
+
```shell
|
|
152
|
+
export KERAS_BACKEND=jax
|
|
153
|
+
```
|
|
154
|
+
|
|
155
|
+
Or in Colab, with:
|
|
156
|
+
|
|
157
|
+
```python
|
|
158
|
+
import os
|
|
159
|
+
os.environ["KERAS_BACKEND"] = "jax"
|
|
160
|
+
|
|
161
|
+
import keras_nlp
|
|
162
|
+
```
|
|
163
|
+
|
|
164
|
+
> [!IMPORTANT]
|
|
165
|
+
> Make sure to set the `KERAS_BACKEND` before importing any Keras libraries; it
|
|
166
|
+
> will be used to set up Keras when it is first imported.
|
|
167
|
+
|
|
119
168
|
## Compatibility
|
|
120
169
|
|
|
121
170
|
We follow [Semantic Versioning](https://semver.org/), and plan to
|
|
@@ -14,14 +14,16 @@
|
|
|
14
14
|
"""
|
|
15
15
|
Keras backend module.
|
|
16
16
|
|
|
17
|
-
This module adds a
|
|
18
|
-
control.
|
|
19
|
-
|
|
17
|
+
This module adds a temporary Keras API surface that is fully under KerasNLP
|
|
18
|
+
control. The goal is to allow us to write Keras 3-like code everywhere, while
|
|
19
|
+
still supporting Keras 2. We do this by using the `keras_core` package with
|
|
20
|
+
Keras 2 to backport Keras 3 numerics APIs (`keras.ops` and `keras.random`) into
|
|
21
|
+
Keras 2. The sub-modules exposed are as follows:
|
|
20
22
|
|
|
21
|
-
- `config`: check which
|
|
22
|
-
- `keras`: The full `keras` API
|
|
23
|
-
- `ops`: `
|
|
24
|
-
- `random`: `
|
|
23
|
+
- `config`: check which version of Keras is being run.
|
|
24
|
+
- `keras`: The full `keras` API with compat shims for older Keras versions.
|
|
25
|
+
- `ops`: `keras.ops` for Keras 3 or `keras_core.ops` for Keras 2.
|
|
26
|
+
- `random`: `keras.random` for Keras 3 or `keras_core.random` for Keras 2.
|
|
25
27
|
"""
|
|
26
28
|
|
|
27
29
|
from keras_nlp.src.backend import config
|
|
@@ -0,0 +1,64 @@
|
|
|
1
|
+
# Copyright 2023 The KerasNLP Authors
|
|
2
|
+
#
|
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
|
+
# you may not use this file except in compliance with the License.
|
|
5
|
+
# You may obtain a copy of the License at
|
|
6
|
+
#
|
|
7
|
+
# https://www.apache.org/licenses/LICENSE-2.0
|
|
8
|
+
#
|
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
12
|
+
# See the License for the specific language governing permissions and
|
|
13
|
+
# limitations under the License.
|
|
14
|
+
|
|
15
|
+
import os
|
|
16
|
+
|
|
17
|
+
|
|
18
|
+
def detect_if_tensorflow_uses_keras_3():
|
|
19
|
+
# We follow the version of keras that tensorflow is configured to use.
|
|
20
|
+
try:
|
|
21
|
+
from tensorflow import keras
|
|
22
|
+
|
|
23
|
+
# Note that only recent versions of keras have a `version()` function.
|
|
24
|
+
if hasattr(keras, "version") and keras.version().startswith("3."):
|
|
25
|
+
return True
|
|
26
|
+
except:
|
|
27
|
+
raise ValueError(
|
|
28
|
+
"Unable to import `keras` with `tensorflow`. Please check your "
|
|
29
|
+
"Keras and Tensorflow version are compatible; Keras 3 requires "
|
|
30
|
+
"TensorFlow 2.15 or later. See keras.io/getting_started for more "
|
|
31
|
+
"information on installing Keras."
|
|
32
|
+
)
|
|
33
|
+
|
|
34
|
+
# No `keras.version()` means we are on an old version of keras.
|
|
35
|
+
return False
|
|
36
|
+
|
|
37
|
+
|
|
38
|
+
_USE_KERAS_3 = detect_if_tensorflow_uses_keras_3()
|
|
39
|
+
|
|
40
|
+
if not _USE_KERAS_3:
|
|
41
|
+
backend = os.environ.get("KERAS_BACKEND")
|
|
42
|
+
if backend and backend != "tensorflow":
|
|
43
|
+
raise RuntimeError(
|
|
44
|
+
"When running Keras 2, the `KERAS_BACKEND` environment variable "
|
|
45
|
+
f"must either be unset or `'tensorflow'`. Received: `{backend}`. "
|
|
46
|
+
"To set another backend, please install Keras 3. See "
|
|
47
|
+
"https://github.com/keras-team/keras-nlp#installation"
|
|
48
|
+
)
|
|
49
|
+
|
|
50
|
+
|
|
51
|
+
def keras_3():
|
|
52
|
+
"""Check if Keras 3 is being used."""
|
|
53
|
+
return _USE_KERAS_3
|
|
54
|
+
|
|
55
|
+
|
|
56
|
+
def backend():
|
|
57
|
+
"""Check the backend framework."""
|
|
58
|
+
if not keras_3():
|
|
59
|
+
return "tensorflow"
|
|
60
|
+
|
|
61
|
+
import keras
|
|
62
|
+
|
|
63
|
+
return keras.config.backend()
|
|
64
|
+
|
|
@@ -12,8 +12,6 @@
|
|
|
12
12
|
# See the License for the specific language governing permissions and
|
|
13
13
|
# limitations under the License.
|
|
14
14
|
|
|
15
|
-
import os
|
|
16
|
-
|
|
17
15
|
import pytest
|
|
18
16
|
import tensorflow as tf
|
|
19
17
|
|
|
@@ -21,21 +19,6 @@ from keras_nlp.src.backend import config as backend_config
|
|
|
21
19
|
from keras_nlp.src.backend import keras
|
|
22
20
|
|
|
23
21
|
|
|
24
|
-
@pytest.fixture(scope="session")
|
|
25
|
-
def tpu_strategy():
|
|
26
|
-
tpu_name = os.getenv("KUBE_GOOGLE_CLOUD_TPU_ENDPOINTS")
|
|
27
|
-
resolver = tf.distribute.cluster_resolver.TPUClusterResolver.connect(
|
|
28
|
-
tpu=tpu_name,
|
|
29
|
-
)
|
|
30
|
-
return tf.distribute.TPUStrategy(resolver)
|
|
31
|
-
|
|
32
|
-
|
|
33
|
-
@pytest.fixture(scope="class")
|
|
34
|
-
def tpu_test_class(request, tpu_strategy):
|
|
35
|
-
# set a class attribute on the invoking test context
|
|
36
|
-
request.cls.tpu_strategy = tpu_strategy
|
|
37
|
-
|
|
38
|
-
|
|
39
22
|
def pytest_addoption(parser):
|
|
40
23
|
parser.addoption(
|
|
41
24
|
"--run_large",
|
|
@@ -49,18 +32,6 @@ def pytest_addoption(parser):
|
|
|
49
32
|
default=False,
|
|
50
33
|
help="run extra_large tests",
|
|
51
34
|
)
|
|
52
|
-
parser.addoption(
|
|
53
|
-
"--run_tpu",
|
|
54
|
-
action="store_true",
|
|
55
|
-
default=False,
|
|
56
|
-
help="run tpu tests",
|
|
57
|
-
)
|
|
58
|
-
parser.addoption(
|
|
59
|
-
"--mixed_precision",
|
|
60
|
-
action="store_true",
|
|
61
|
-
default=False,
|
|
62
|
-
help="run with mixed precision",
|
|
63
|
-
)
|
|
64
35
|
parser.addoption(
|
|
65
36
|
"--docstring_module",
|
|
66
37
|
action="store",
|
|
@@ -70,18 +41,13 @@ def pytest_addoption(parser):
|
|
|
70
41
|
|
|
71
42
|
|
|
72
43
|
def pytest_configure(config):
|
|
73
|
-
if config.getoption("--mixed_precision"):
|
|
74
|
-
keras.mixed_precision.set_global_policy("mixed_float16")
|
|
75
|
-
config.addinivalue_line(
|
|
76
|
-
"markers", "large: mark test as being slow or requiring a network"
|
|
77
|
-
)
|
|
78
44
|
config.addinivalue_line(
|
|
79
45
|
"markers",
|
|
80
|
-
"
|
|
46
|
+
"large: mark test as being slow or requiring a network",
|
|
81
47
|
)
|
|
82
48
|
config.addinivalue_line(
|
|
83
49
|
"markers",
|
|
84
|
-
"
|
|
50
|
+
"extra_large: mark test as being too large to run continuously",
|
|
85
51
|
)
|
|
86
52
|
config.addinivalue_line(
|
|
87
53
|
"markers",
|
|
@@ -93,7 +59,6 @@ def pytest_collection_modifyitems(config, items):
|
|
|
93
59
|
run_extra_large_tests = config.getoption("--run_extra_large")
|
|
94
60
|
# Run large tests for --run_extra_large or --run_large.
|
|
95
61
|
run_large_tests = config.getoption("--run_large") or run_extra_large_tests
|
|
96
|
-
run_tpu = config.getoption("--run_tpu")
|
|
97
62
|
|
|
98
63
|
# Messages to annotate skipped tests with.
|
|
99
64
|
skip_large = pytest.mark.skipif(
|
|
@@ -104,32 +69,27 @@ def pytest_collection_modifyitems(config, items):
|
|
|
104
69
|
not run_extra_large_tests,
|
|
105
70
|
reason="need --run_extra_large option to run",
|
|
106
71
|
)
|
|
107
|
-
|
|
108
|
-
not run_tpu,
|
|
109
|
-
reason="need --run_tpu option to run",
|
|
110
|
-
)
|
|
111
|
-
skip_tf_only = pytest.mark.skipif(
|
|
72
|
+
tf_only = pytest.mark.skipif(
|
|
112
73
|
not backend_config.backend() == "tensorflow",
|
|
113
74
|
reason="tests only run on tf backend",
|
|
114
75
|
)
|
|
76
|
+
keras_3_only = pytest.mark.skipif(
|
|
77
|
+
not backend_config.keras_3(),
|
|
78
|
+
reason="tests only run on with multi-backend keras",
|
|
79
|
+
)
|
|
115
80
|
for item in items:
|
|
116
81
|
if "large" in item.keywords:
|
|
117
82
|
item.add_marker(skip_large)
|
|
118
83
|
if "extra_large" in item.keywords:
|
|
119
84
|
item.add_marker(skip_extra_large)
|
|
120
|
-
if "tpu" in item.keywords:
|
|
121
|
-
item.add_marker(skip_tpu)
|
|
122
85
|
if "tf_only" in item.keywords:
|
|
123
|
-
item.add_marker(
|
|
86
|
+
item.add_marker(tf_only)
|
|
87
|
+
if "keras_3_only" in item.keywords:
|
|
88
|
+
item.add_marker(keras_3_only)
|
|
124
89
|
|
|
125
90
|
|
|
126
91
|
# Disable traceback filtering for quicker debugging of tests failures.
|
|
127
92
|
tf.debugging.disable_traceback_filtering()
|
|
128
|
-
if backend_config.
|
|
93
|
+
if backend_config.keras_3():
|
|
129
94
|
keras.config.disable_traceback_filtering()
|
|
130
95
|
|
|
131
|
-
# One off setup for dtensor tests.
|
|
132
|
-
if not backend_config.multi_backend():
|
|
133
|
-
keras.backend.experimental.enable_tf_random_generator()
|
|
134
|
-
keras.utils.set_random_seed(1337)
|
|
135
|
-
|
|
@@ -18,6 +18,7 @@ from keras_nlp.src.layers.modeling.cached_multi_head_attention import (
|
|
|
18
18
|
from keras_nlp.src.layers.modeling.f_net_encoder import FNetEncoder
|
|
19
19
|
from keras_nlp.src.layers.modeling.masked_lm_head import MaskedLMHead
|
|
20
20
|
from keras_nlp.src.layers.modeling.position_embedding import PositionEmbedding
|
|
21
|
+
from keras_nlp.src.layers.modeling.reversible_embedding import ReversibleEmbedding
|
|
21
22
|
from keras_nlp.src.layers.modeling.rotary_embedding import RotaryEmbedding
|
|
22
23
|
from keras_nlp.src.layers.modeling.sine_position_encoding import (
|
|
23
24
|
SinePositionEncoding,
|
|
@@ -36,9 +36,9 @@ class CachedMultiHeadAttentionTest(TestCase):
|
|
|
36
36
|
expected_output_shape=(2, 4, 6),
|
|
37
37
|
expected_num_trainable_weights=8,
|
|
38
38
|
expected_num_non_trainable_variables=1,
|
|
39
|
-
#
|
|
39
|
+
# Keras 2 does not handle mixed precision correctly when not set
|
|
40
40
|
# globally.
|
|
41
|
-
run_mixed_precision_check=config.
|
|
41
|
+
run_mixed_precision_check=config.keras_3(),
|
|
42
42
|
)
|
|
43
43
|
|
|
44
44
|
def test_cache_call_is_correct(self):
|
{keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/albert/albert_backbone_test.py
RENAMED
|
@@ -102,34 +102,3 @@ class AlbertBackboneTest(TestCase):
|
|
|
102
102
|
model_output["pooled_output"], restored_output["pooled_output"]
|
|
103
103
|
)
|
|
104
104
|
|
|
105
|
-
|
|
106
|
-
@pytest.mark.tpu
|
|
107
|
-
@pytest.mark.usefixtures("tpu_test_class")
|
|
108
|
-
class AlbertBackboneTPUTest(TestCase):
|
|
109
|
-
def setUp(self):
|
|
110
|
-
with self.tpu_strategy.scope():
|
|
111
|
-
self.backbone = AlbertBackbone(
|
|
112
|
-
vocabulary_size=10,
|
|
113
|
-
num_layers=2,
|
|
114
|
-
num_heads=2,
|
|
115
|
-
num_groups=1,
|
|
116
|
-
num_inner_repetitions=1,
|
|
117
|
-
embedding_dim=16,
|
|
118
|
-
hidden_dim=2,
|
|
119
|
-
intermediate_dim=2,
|
|
120
|
-
max_sequence_length=4,
|
|
121
|
-
)
|
|
122
|
-
|
|
123
|
-
self.input_batch = {
|
|
124
|
-
"token_ids": np.ones((8, 128), dtype="int32"),
|
|
125
|
-
"segment_ids": np.ones((8, 128), dtype="int32"),
|
|
126
|
-
"padding_mask": np.ones((8, 128), dtype="int32"),
|
|
127
|
-
}
|
|
128
|
-
self.input_dataset = tf.data.Dataset.from_tensor_slices(
|
|
129
|
-
self.input_batch
|
|
130
|
-
).batch(2)
|
|
131
|
-
|
|
132
|
-
def test_predict(self):
|
|
133
|
-
self.backbone.compile()
|
|
134
|
-
self.backbone.predict(self.input_dataset)
|
|
135
|
-
|
{keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bart/bart_backbone_test.py
RENAMED
|
@@ -92,31 +92,3 @@ class BartBackboneTest(TestCase):
|
|
|
92
92
|
restored_output["decoder_sequence_output"],
|
|
93
93
|
)
|
|
94
94
|
|
|
95
|
-
|
|
96
|
-
@pytest.mark.tpu
|
|
97
|
-
@pytest.mark.usefixtures("tpu_test_class")
|
|
98
|
-
class BartBackboneTPUTest(TestCase):
|
|
99
|
-
def setUp(self):
|
|
100
|
-
with self.tpu_strategy.scope():
|
|
101
|
-
self.backbone = BartBackbone(
|
|
102
|
-
vocabulary_size=1000,
|
|
103
|
-
num_layers=2,
|
|
104
|
-
num_heads=2,
|
|
105
|
-
hidden_dim=64,
|
|
106
|
-
intermediate_dim=128,
|
|
107
|
-
max_sequence_length=128,
|
|
108
|
-
)
|
|
109
|
-
self.input_batch = {
|
|
110
|
-
"encoder_token_ids": np.ones((8, 128), dtype="int32"),
|
|
111
|
-
"encoder_padding_mask": np.ones((8, 128), dtype="int32"),
|
|
112
|
-
"decoder_token_ids": np.ones((8, 128), dtype="int32"),
|
|
113
|
-
"decoder_padding_mask": np.ones((8, 128), dtype="int32"),
|
|
114
|
-
}
|
|
115
|
-
self.input_dataset = tf.data.Dataset.from_tensor_slices(
|
|
116
|
-
self.input_batch
|
|
117
|
-
).batch(2)
|
|
118
|
-
|
|
119
|
-
def test_predict(self):
|
|
120
|
-
self.backbone.compile()
|
|
121
|
-
self.backbone.predict(self.input_dataset)
|
|
122
|
-
|
{keras-nlp-0.6.3.dev0 → keras-nlp-0.6.4.dev0}/keras_nlp/src/models/bert/bert_backbone_test.py
RENAMED
|
@@ -86,30 +86,3 @@ class BertBackboneTest(TestCase):
|
|
|
86
86
|
restored_output = restored_model(self.input_batch)
|
|
87
87
|
self.assertAllClose(model_output, restored_output)
|
|
88
88
|
|
|
89
|
-
|
|
90
|
-
@pytest.mark.tpu
|
|
91
|
-
@pytest.mark.usefixtures("tpu_test_class")
|
|
92
|
-
class BertBackboneTPUTest(TestCase):
|
|
93
|
-
def setUp(self):
|
|
94
|
-
with self.tpu_strategy.scope():
|
|
95
|
-
self.backbone = BertBackbone(
|
|
96
|
-
vocabulary_size=1000,
|
|
97
|
-
num_layers=2,
|
|
98
|
-
num_heads=2,
|
|
99
|
-
hidden_dim=64,
|
|
100
|
-
intermediate_dim=128,
|
|
101
|
-
max_sequence_length=128,
|
|
102
|
-
)
|
|
103
|
-
self.input_batch = {
|
|
104
|
-
"token_ids": np.ones((8, 128), dtype="int32"),
|
|
105
|
-
"segment_ids": np.ones((8, 128), dtype="int32"),
|
|
106
|
-
"padding_mask": np.ones((8, 128), dtype="int32"),
|
|
107
|
-
}
|
|
108
|
-
self.input_dataset = tf.data.Dataset.from_tensor_slices(
|
|
109
|
-
self.input_batch
|
|
110
|
-
).batch(2)
|
|
111
|
-
|
|
112
|
-
def test_predict(self):
|
|
113
|
-
self.backbone.compile()
|
|
114
|
-
self.backbone.predict(self.input_dataset)
|
|
115
|
-
|
|
@@ -91,30 +91,3 @@ class DebertaV3BackboneTest(TestCase):
|
|
|
91
91
|
restored_output = restored_model(self.input_batch)
|
|
92
92
|
self.assertAllClose(model_output, restored_output)
|
|
93
93
|
|
|
94
|
-
|
|
95
|
-
@pytest.mark.tpu
|
|
96
|
-
@pytest.mark.usefixtures("tpu_test_class")
|
|
97
|
-
class DebertaV3BackboneTPUTest(TestCase):
|
|
98
|
-
def setUp(self):
|
|
99
|
-
with self.tpu_strategy.scope():
|
|
100
|
-
self.backbone = DebertaV3Backbone(
|
|
101
|
-
vocabulary_size=10,
|
|
102
|
-
num_layers=2,
|
|
103
|
-
num_heads=2,
|
|
104
|
-
hidden_dim=2,
|
|
105
|
-
intermediate_dim=4,
|
|
106
|
-
max_sequence_length=5,
|
|
107
|
-
bucket_size=2,
|
|
108
|
-
)
|
|
109
|
-
self.input_batch = {
|
|
110
|
-
"token_ids": np.ones((2, 5), dtype="int32"),
|
|
111
|
-
"padding_mask": np.ones((2, 5), dtype="int32"),
|
|
112
|
-
}
|
|
113
|
-
self.input_dataset = tf.data.Dataset.from_tensor_slices(
|
|
114
|
-
self.input_batch
|
|
115
|
-
).batch(2)
|
|
116
|
-
|
|
117
|
-
def test_predict(self):
|
|
118
|
-
self.backbone.compile()
|
|
119
|
-
self.backbone.predict(self.input_dataset)
|
|
120
|
-
|
|
@@ -232,12 +232,13 @@ class DisentangledSelfAttention(keras.layers.Layer):
|
|
|
232
232
|
x1=rel_pos,
|
|
233
233
|
x2=log_pos * sign,
|
|
234
234
|
)
|
|
235
|
-
bucket_pos = ops.cast(bucket_pos, dtype="
|
|
235
|
+
bucket_pos = ops.cast(bucket_pos, dtype="int")
|
|
236
236
|
|
|
237
237
|
return bucket_pos
|
|
238
238
|
|
|
239
239
|
def _get_rel_pos(self, num_positions):
|
|
240
|
-
ids = ops.arange(num_positions
|
|
240
|
+
ids = ops.arange(num_positions)
|
|
241
|
+
ids = ops.cast(ids, dtype="int")
|
|
241
242
|
query_ids = ops.expand_dims(ids, axis=-1)
|
|
242
243
|
key_ids = ops.expand_dims(ids, axis=0)
|
|
243
244
|
key_ids = ops.repeat(key_ids, repeats=num_positions, axis=0)
|
|
@@ -84,29 +84,3 @@ class DistilBertTest(TestCase):
|
|
|
84
84
|
restored_output = restored_model(self.input_batch)
|
|
85
85
|
self.assertAllClose(model_output, restored_output)
|
|
86
86
|
|
|
87
|
-
|
|
88
|
-
@pytest.mark.tpu
|
|
89
|
-
@pytest.mark.usefixtures("tpu_test_class")
|
|
90
|
-
class DistilBertTPUTest(TestCase):
|
|
91
|
-
def setUp(self):
|
|
92
|
-
with self.tpu_strategy.scope():
|
|
93
|
-
self.backbone = DistilBertBackbone(
|
|
94
|
-
vocabulary_size=1000,
|
|
95
|
-
num_layers=2,
|
|
96
|
-
num_heads=2,
|
|
97
|
-
hidden_dim=64,
|
|
98
|
-
intermediate_dim=128,
|
|
99
|
-
max_sequence_length=128,
|
|
100
|
-
)
|
|
101
|
-
self.input_batch = {
|
|
102
|
-
"token_ids": np.ones((8, 128), dtype="int32"),
|
|
103
|
-
"padding_mask": np.ones((8, 128), dtype="int32"),
|
|
104
|
-
}
|
|
105
|
-
self.input_dataset = tf.data.Dataset.from_tensor_slices(
|
|
106
|
-
self.input_batch
|
|
107
|
-
).batch(2)
|
|
108
|
-
|
|
109
|
-
def test_predict(self):
|
|
110
|
-
self.backbone.compile()
|
|
111
|
-
self.backbone.predict(self.input_dataset)
|
|
112
|
-
|