spark-nlp 4.2.6__py2.py3-none-any.whl → 6.2.1__py2.py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- com/johnsnowlabs/ml/__init__.py +0 -0
- com/johnsnowlabs/ml/ai/__init__.py +10 -0
- spark_nlp-6.2.1.dist-info/METADATA +362 -0
- spark_nlp-6.2.1.dist-info/RECORD +292 -0
- {spark_nlp-4.2.6.dist-info → spark_nlp-6.2.1.dist-info}/WHEEL +1 -1
- sparknlp/__init__.py +81 -28
- sparknlp/annotation.py +3 -2
- sparknlp/annotator/__init__.py +6 -0
- sparknlp/annotator/audio/__init__.py +2 -0
- sparknlp/annotator/audio/hubert_for_ctc.py +188 -0
- sparknlp/annotator/audio/wav2vec2_for_ctc.py +14 -14
- sparknlp/annotator/audio/whisper_for_ctc.py +251 -0
- sparknlp/{base → annotator}/chunk2_doc.py +4 -7
- sparknlp/annotator/chunker.py +1 -2
- sparknlp/annotator/classifier_dl/__init__.py +17 -0
- sparknlp/annotator/classifier_dl/albert_for_multiple_choice.py +161 -0
- sparknlp/annotator/classifier_dl/albert_for_question_answering.py +3 -15
- sparknlp/annotator/classifier_dl/albert_for_sequence_classification.py +4 -18
- sparknlp/annotator/classifier_dl/albert_for_token_classification.py +3 -17
- sparknlp/annotator/classifier_dl/albert_for_zero_shot_classification.py +211 -0
- sparknlp/annotator/classifier_dl/bart_for_zero_shot_classification.py +225 -0
- sparknlp/annotator/classifier_dl/bert_for_multiple_choice.py +161 -0
- sparknlp/annotator/classifier_dl/bert_for_question_answering.py +6 -20
- sparknlp/annotator/classifier_dl/bert_for_sequence_classification.py +3 -17
- sparknlp/annotator/classifier_dl/bert_for_token_classification.py +3 -17
- sparknlp/annotator/classifier_dl/bert_for_zero_shot_classification.py +212 -0
- sparknlp/annotator/classifier_dl/camembert_for_question_answering.py +168 -0
- sparknlp/annotator/classifier_dl/camembert_for_sequence_classification.py +5 -19
- sparknlp/annotator/classifier_dl/camembert_for_token_classification.py +5 -19
- sparknlp/annotator/classifier_dl/camembert_for_zero_shot_classification.py +202 -0
- sparknlp/annotator/classifier_dl/classifier_dl.py +4 -4
- sparknlp/annotator/classifier_dl/deberta_for_question_answering.py +3 -17
- sparknlp/annotator/classifier_dl/deberta_for_sequence_classification.py +4 -19
- sparknlp/annotator/classifier_dl/deberta_for_token_classification.py +5 -21
- sparknlp/annotator/classifier_dl/deberta_for_zero_shot_classification.py +193 -0
- sparknlp/annotator/classifier_dl/distil_bert_for_question_answering.py +3 -17
- sparknlp/annotator/classifier_dl/distil_bert_for_sequence_classification.py +4 -18
- sparknlp/annotator/classifier_dl/distil_bert_for_token_classification.py +3 -17
- sparknlp/annotator/classifier_dl/distil_bert_for_zero_shot_classification.py +211 -0
- sparknlp/annotator/classifier_dl/distilbert_for_multiple_choice.py +161 -0
- sparknlp/annotator/classifier_dl/longformer_for_question_answering.py +3 -17
- sparknlp/annotator/classifier_dl/longformer_for_sequence_classification.py +4 -18
- sparknlp/annotator/classifier_dl/longformer_for_token_classification.py +3 -17
- sparknlp/annotator/classifier_dl/mpnet_for_question_answering.py +148 -0
- sparknlp/annotator/classifier_dl/mpnet_for_sequence_classification.py +188 -0
- sparknlp/annotator/classifier_dl/mpnet_for_token_classification.py +173 -0
- sparknlp/annotator/classifier_dl/multi_classifier_dl.py +3 -3
- sparknlp/annotator/classifier_dl/roberta_for_multiple_choice.py +161 -0
- sparknlp/annotator/classifier_dl/roberta_for_question_answering.py +3 -17
- sparknlp/annotator/classifier_dl/roberta_for_sequence_classification.py +4 -18
- sparknlp/annotator/classifier_dl/roberta_for_token_classification.py +1 -1
- sparknlp/annotator/classifier_dl/roberta_for_zero_shot_classification.py +225 -0
- sparknlp/annotator/classifier_dl/sentiment_dl.py +4 -4
- sparknlp/annotator/classifier_dl/tapas_for_question_answering.py +2 -2
- sparknlp/annotator/classifier_dl/xlm_roberta_for_multiple_choice.py +149 -0
- sparknlp/annotator/classifier_dl/xlm_roberta_for_question_answering.py +3 -17
- sparknlp/annotator/classifier_dl/xlm_roberta_for_sequence_classification.py +4 -18
- sparknlp/annotator/classifier_dl/xlm_roberta_for_token_classification.py +6 -20
- sparknlp/annotator/classifier_dl/xlm_roberta_for_zero_shot_classification.py +225 -0
- sparknlp/annotator/classifier_dl/xlnet_for_sequence_classification.py +4 -18
- sparknlp/annotator/classifier_dl/xlnet_for_token_classification.py +3 -17
- sparknlp/annotator/cleaners/__init__.py +15 -0
- sparknlp/annotator/cleaners/cleaner.py +202 -0
- sparknlp/annotator/cleaners/extractor.py +191 -0
- sparknlp/annotator/coref/spanbert_coref.py +4 -18
- sparknlp/annotator/cv/__init__.py +15 -0
- sparknlp/annotator/cv/blip_for_question_answering.py +172 -0
- sparknlp/annotator/cv/clip_for_zero_shot_classification.py +193 -0
- sparknlp/annotator/cv/convnext_for_image_classification.py +269 -0
- sparknlp/annotator/cv/florence2_transformer.py +180 -0
- sparknlp/annotator/cv/gemma3_for_multimodal.py +346 -0
- sparknlp/annotator/cv/internvl_for_multimodal.py +280 -0
- sparknlp/annotator/cv/janus_for_multimodal.py +351 -0
- sparknlp/annotator/cv/llava_for_multimodal.py +328 -0
- sparknlp/annotator/cv/mllama_for_multimodal.py +340 -0
- sparknlp/annotator/cv/paligemma_for_multimodal.py +308 -0
- sparknlp/annotator/cv/phi3_vision_for_multimodal.py +328 -0
- sparknlp/annotator/cv/qwen2vl_transformer.py +332 -0
- sparknlp/annotator/cv/smolvlm_transformer.py +426 -0
- sparknlp/annotator/cv/swin_for_image_classification.py +242 -0
- sparknlp/annotator/cv/vision_encoder_decoder_for_image_captioning.py +240 -0
- sparknlp/annotator/cv/vit_for_image_classification.py +36 -4
- sparknlp/annotator/dataframe_optimizer.py +216 -0
- sparknlp/annotator/date2_chunk.py +88 -0
- sparknlp/annotator/dependency/dependency_parser.py +2 -3
- sparknlp/annotator/dependency/typed_dependency_parser.py +3 -4
- sparknlp/annotator/document_character_text_splitter.py +228 -0
- sparknlp/annotator/document_normalizer.py +37 -1
- sparknlp/annotator/document_token_splitter.py +175 -0
- sparknlp/annotator/document_token_splitter_test.py +85 -0
- sparknlp/annotator/embeddings/__init__.py +11 -0
- sparknlp/annotator/embeddings/albert_embeddings.py +4 -18
- sparknlp/annotator/embeddings/auto_gguf_embeddings.py +539 -0
- sparknlp/annotator/embeddings/bert_embeddings.py +9 -22
- sparknlp/annotator/embeddings/bert_sentence_embeddings.py +12 -24
- sparknlp/annotator/embeddings/bge_embeddings.py +199 -0
- sparknlp/annotator/embeddings/camembert_embeddings.py +4 -20
- sparknlp/annotator/embeddings/chunk_embeddings.py +1 -2
- sparknlp/annotator/embeddings/deberta_embeddings.py +2 -16
- sparknlp/annotator/embeddings/distil_bert_embeddings.py +5 -19
- sparknlp/annotator/embeddings/doc2vec.py +7 -1
- sparknlp/annotator/embeddings/e5_embeddings.py +195 -0
- sparknlp/annotator/embeddings/e5v_embeddings.py +138 -0
- sparknlp/annotator/embeddings/elmo_embeddings.py +2 -2
- sparknlp/annotator/embeddings/instructor_embeddings.py +204 -0
- sparknlp/annotator/embeddings/longformer_embeddings.py +3 -17
- sparknlp/annotator/embeddings/minilm_embeddings.py +189 -0
- sparknlp/annotator/embeddings/mpnet_embeddings.py +192 -0
- sparknlp/annotator/embeddings/mxbai_embeddings.py +184 -0
- sparknlp/annotator/embeddings/nomic_embeddings.py +181 -0
- sparknlp/annotator/embeddings/roberta_embeddings.py +9 -21
- sparknlp/annotator/embeddings/roberta_sentence_embeddings.py +7 -21
- sparknlp/annotator/embeddings/sentence_embeddings.py +2 -3
- sparknlp/annotator/embeddings/snowflake_embeddings.py +202 -0
- sparknlp/annotator/embeddings/uae_embeddings.py +211 -0
- sparknlp/annotator/embeddings/universal_sentence_encoder.py +3 -3
- sparknlp/annotator/embeddings/word2vec.py +7 -1
- sparknlp/annotator/embeddings/word_embeddings.py +4 -5
- sparknlp/annotator/embeddings/xlm_roberta_embeddings.py +9 -21
- sparknlp/annotator/embeddings/xlm_roberta_sentence_embeddings.py +7 -21
- sparknlp/annotator/embeddings/xlnet_embeddings.py +4 -18
- sparknlp/annotator/er/entity_ruler.py +37 -23
- sparknlp/annotator/keyword_extraction/yake_keyword_extraction.py +2 -3
- sparknlp/annotator/ld_dl/language_detector_dl.py +2 -2
- sparknlp/annotator/lemmatizer.py +3 -4
- sparknlp/annotator/matcher/date_matcher.py +35 -3
- sparknlp/annotator/matcher/multi_date_matcher.py +1 -2
- sparknlp/annotator/matcher/regex_matcher.py +3 -3
- sparknlp/annotator/matcher/text_matcher.py +2 -3
- sparknlp/annotator/n_gram_generator.py +1 -2
- sparknlp/annotator/ner/__init__.py +3 -1
- sparknlp/annotator/ner/ner_converter.py +18 -0
- sparknlp/annotator/ner/ner_crf.py +4 -5
- sparknlp/annotator/ner/ner_dl.py +10 -5
- sparknlp/annotator/ner/ner_dl_graph_checker.py +293 -0
- sparknlp/annotator/ner/ner_overwriter.py +2 -2
- sparknlp/annotator/ner/zero_shot_ner_model.py +173 -0
- sparknlp/annotator/normalizer.py +2 -2
- sparknlp/annotator/openai/__init__.py +16 -0
- sparknlp/annotator/openai/openai_completion.py +349 -0
- sparknlp/annotator/openai/openai_embeddings.py +106 -0
- sparknlp/annotator/pos/perceptron.py +6 -7
- sparknlp/annotator/sentence/sentence_detector.py +2 -2
- sparknlp/annotator/sentence/sentence_detector_dl.py +3 -3
- sparknlp/annotator/sentiment/sentiment_detector.py +4 -5
- sparknlp/annotator/sentiment/vivekn_sentiment.py +4 -5
- sparknlp/annotator/seq2seq/__init__.py +17 -0
- sparknlp/annotator/seq2seq/auto_gguf_model.py +304 -0
- sparknlp/annotator/seq2seq/auto_gguf_reranker.py +334 -0
- sparknlp/annotator/seq2seq/auto_gguf_vision_model.py +336 -0
- sparknlp/annotator/seq2seq/bart_transformer.py +420 -0
- sparknlp/annotator/seq2seq/cohere_transformer.py +357 -0
- sparknlp/annotator/seq2seq/cpm_transformer.py +321 -0
- sparknlp/annotator/seq2seq/gpt2_transformer.py +1 -1
- sparknlp/annotator/seq2seq/llama2_transformer.py +343 -0
- sparknlp/annotator/seq2seq/llama3_transformer.py +381 -0
- sparknlp/annotator/seq2seq/m2m100_transformer.py +392 -0
- sparknlp/annotator/seq2seq/marian_transformer.py +124 -3
- sparknlp/annotator/seq2seq/mistral_transformer.py +348 -0
- sparknlp/annotator/seq2seq/nllb_transformer.py +420 -0
- sparknlp/annotator/seq2seq/olmo_transformer.py +326 -0
- sparknlp/annotator/seq2seq/phi2_transformer.py +326 -0
- sparknlp/annotator/seq2seq/phi3_transformer.py +330 -0
- sparknlp/annotator/seq2seq/phi4_transformer.py +387 -0
- sparknlp/annotator/seq2seq/qwen_transformer.py +340 -0
- sparknlp/annotator/seq2seq/starcoder_transformer.py +335 -0
- sparknlp/annotator/seq2seq/t5_transformer.py +54 -4
- sparknlp/annotator/similarity/__init__.py +0 -0
- sparknlp/annotator/similarity/document_similarity_ranker.py +379 -0
- sparknlp/annotator/spell_check/context_spell_checker.py +116 -17
- sparknlp/annotator/spell_check/norvig_sweeting.py +3 -6
- sparknlp/annotator/spell_check/symmetric_delete.py +1 -1
- sparknlp/annotator/stemmer.py +2 -3
- sparknlp/annotator/stop_words_cleaner.py +3 -4
- sparknlp/annotator/tf_ner_dl_graph_builder.py +1 -1
- sparknlp/annotator/token/__init__.py +0 -1
- sparknlp/annotator/token/recursive_tokenizer.py +2 -3
- sparknlp/annotator/token/tokenizer.py +2 -3
- sparknlp/annotator/ws/word_segmenter.py +35 -10
- sparknlp/base/__init__.py +2 -3
- sparknlp/base/doc2_chunk.py +0 -3
- sparknlp/base/document_assembler.py +5 -5
- sparknlp/base/embeddings_finisher.py +14 -2
- sparknlp/base/finisher.py +15 -4
- sparknlp/base/gguf_ranking_finisher.py +234 -0
- sparknlp/base/image_assembler.py +69 -0
- sparknlp/base/light_pipeline.py +53 -21
- sparknlp/base/multi_document_assembler.py +9 -13
- sparknlp/base/prompt_assembler.py +207 -0
- sparknlp/base/token_assembler.py +1 -2
- sparknlp/common/__init__.py +2 -0
- sparknlp/common/annotator_type.py +1 -0
- sparknlp/common/completion_post_processing.py +37 -0
- sparknlp/common/match_strategy.py +33 -0
- sparknlp/common/properties.py +914 -9
- sparknlp/internal/__init__.py +841 -116
- sparknlp/internal/annotator_java_ml.py +1 -1
- sparknlp/internal/annotator_transformer.py +3 -0
- sparknlp/logging/comet.py +2 -2
- sparknlp/partition/__init__.py +16 -0
- sparknlp/partition/partition.py +244 -0
- sparknlp/partition/partition_properties.py +902 -0
- sparknlp/partition/partition_transformer.py +200 -0
- sparknlp/pretrained/pretrained_pipeline.py +1 -1
- sparknlp/pretrained/resource_downloader.py +126 -2
- sparknlp/reader/__init__.py +15 -0
- sparknlp/reader/enums.py +19 -0
- sparknlp/reader/pdf_to_text.py +190 -0
- sparknlp/reader/reader2doc.py +124 -0
- sparknlp/reader/reader2image.py +136 -0
- sparknlp/reader/reader2table.py +44 -0
- sparknlp/reader/reader_assembler.py +159 -0
- sparknlp/reader/sparknlp_reader.py +461 -0
- sparknlp/training/__init__.py +1 -0
- sparknlp/training/conll.py +8 -2
- sparknlp/training/spacy_to_annotation.py +57 -0
- sparknlp/util.py +26 -0
- spark_nlp-4.2.6.dist-info/METADATA +0 -1256
- spark_nlp-4.2.6.dist-info/RECORD +0 -196
- {spark_nlp-4.2.6.dist-info → spark_nlp-6.2.1.dist-info}/top_level.txt +0 -0
- /sparknlp/annotator/{token/token2_chunk.py → token2_chunk.py} +0 -0
sparknlp/internal/__init__.py
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# Copyright 2017-
|
|
1
|
+
# Copyright 2017-2023 John Snow Labs
|
|
2
2
|
#
|
|
3
3
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
4
|
# you may not use this file except in compliance with the License.
|
|
@@ -24,264 +24,632 @@ from sparknlp.internal.recursive import *
|
|
|
24
24
|
# Wrapper Definitions
|
|
25
25
|
class _AlbertLoader(ExtendedJavaWrapper):
|
|
26
26
|
def __init__(self, path, jspark):
|
|
27
|
-
super(_AlbertLoader, self).__init__(
|
|
28
|
-
|
|
27
|
+
super(_AlbertLoader, self).__init__(
|
|
28
|
+
"com.johnsnowlabs.nlp.embeddings.AlbertEmbeddings.loadSavedModel",
|
|
29
|
+
path,
|
|
30
|
+
jspark,
|
|
31
|
+
)
|
|
29
32
|
|
|
30
33
|
|
|
31
34
|
class _AlbertSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
32
35
|
def __init__(self, path, jspark):
|
|
33
36
|
super(_AlbertSequenceClassifierLoader, self).__init__(
|
|
34
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForSequenceClassification.loadSavedModel",
|
|
35
|
-
|
|
37
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForSequenceClassification.loadSavedModel",
|
|
38
|
+
path,
|
|
39
|
+
jspark,
|
|
40
|
+
)
|
|
36
41
|
|
|
37
42
|
|
|
38
43
|
class _AlbertTokenClassifierLoader(ExtendedJavaWrapper):
|
|
39
44
|
def __init__(self, path, jspark):
|
|
40
45
|
super(_AlbertTokenClassifierLoader, self).__init__(
|
|
41
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForTokenClassification.loadSavedModel",
|
|
46
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForTokenClassification.loadSavedModel",
|
|
47
|
+
path,
|
|
48
|
+
jspark,
|
|
49
|
+
)
|
|
42
50
|
|
|
43
51
|
|
|
44
52
|
class _AlbertQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
45
53
|
def __init__(self, path, jspark):
|
|
46
54
|
super(_AlbertQuestionAnsweringLoader, self).__init__(
|
|
47
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForQuestionAnswering.loadSavedModel",
|
|
48
|
-
|
|
55
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForQuestionAnswering.loadSavedModel",
|
|
56
|
+
path,
|
|
57
|
+
jspark,
|
|
58
|
+
)
|
|
49
59
|
|
|
50
60
|
|
|
51
|
-
class
|
|
61
|
+
class _AlbertForZeroShotClassificationLoader(ExtendedJavaWrapper):
|
|
52
62
|
def __init__(self, path, jspark):
|
|
53
|
-
super(
|
|
63
|
+
super(_AlbertForZeroShotClassificationLoader, self).__init__(
|
|
64
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForZeroShotClassification.loadSavedModel",
|
|
65
|
+
path,
|
|
66
|
+
jspark,
|
|
67
|
+
)
|
|
54
68
|
|
|
55
69
|
|
|
56
|
-
class
|
|
70
|
+
class _AlbertMultipleChoiceLoader(ExtendedJavaWrapper):
|
|
57
71
|
def __init__(self, path, jspark):
|
|
72
|
+
super(_AlbertMultipleChoiceLoader, self).__init__(
|
|
73
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForMultipleChoice.loadSavedModel",
|
|
74
|
+
path,
|
|
75
|
+
jspark,
|
|
76
|
+
)
|
|
77
|
+
|
|
78
|
+
|
|
79
|
+
class _BertLoader(ExtendedJavaWrapper):
|
|
80
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
81
|
+
super(_BertLoader, self).__init__(
|
|
82
|
+
"com.johnsnowlabs.nlp.embeddings.BertEmbeddings.loadSavedModel",
|
|
83
|
+
path,
|
|
84
|
+
jspark,
|
|
85
|
+
use_openvino,
|
|
86
|
+
)
|
|
87
|
+
|
|
88
|
+
|
|
89
|
+
class _BertSentenceLoader(ExtendedJavaWrapper):
|
|
90
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
58
91
|
super(_BertSentenceLoader, self).__init__(
|
|
59
|
-
"com.johnsnowlabs.nlp.embeddings.BertSentenceEmbeddings.loadSavedModel",
|
|
92
|
+
"com.johnsnowlabs.nlp.embeddings.BertSentenceEmbeddings.loadSavedModel",
|
|
93
|
+
path,
|
|
94
|
+
jspark,
|
|
95
|
+
use_openvino,
|
|
96
|
+
)
|
|
60
97
|
|
|
61
98
|
|
|
62
99
|
class _BertSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
63
100
|
def __init__(self, path, jspark):
|
|
64
101
|
super(_BertSequenceClassifierLoader, self).__init__(
|
|
65
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForSequenceClassification.loadSavedModel",
|
|
102
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForSequenceClassification.loadSavedModel",
|
|
103
|
+
path,
|
|
104
|
+
jspark,
|
|
105
|
+
)
|
|
66
106
|
|
|
67
107
|
|
|
68
108
|
class _BertTokenClassifierLoader(ExtendedJavaWrapper):
|
|
69
109
|
def __init__(self, path, jspark):
|
|
70
110
|
super(_BertTokenClassifierLoader, self).__init__(
|
|
71
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForTokenClassification.loadSavedModel",
|
|
111
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForTokenClassification.loadSavedModel",
|
|
112
|
+
path,
|
|
113
|
+
jspark,
|
|
114
|
+
)
|
|
72
115
|
|
|
73
116
|
|
|
74
117
|
class _BertQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
75
118
|
def __init__(self, path, jspark):
|
|
76
119
|
super(_BertQuestionAnsweringLoader, self).__init__(
|
|
77
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForQuestionAnswering.loadSavedModel",
|
|
120
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForQuestionAnswering.loadSavedModel",
|
|
121
|
+
path,
|
|
122
|
+
jspark,
|
|
123
|
+
)
|
|
124
|
+
|
|
125
|
+
class _BertMultipleChoiceLoader(ExtendedJavaWrapper):
|
|
126
|
+
def __init__(self, path, jspark):
|
|
127
|
+
super(_BertMultipleChoiceLoader, self).__init__(
|
|
128
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForMultipleChoice.loadSavedModel",
|
|
129
|
+
path,
|
|
130
|
+
jspark,
|
|
131
|
+
)
|
|
78
132
|
|
|
133
|
+
class _CoHereLoader(ExtendedJavaWrapper):
|
|
134
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
135
|
+
super(_CoHereLoader, self).__init__(
|
|
136
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.CoHereTransformer.loadSavedModel",
|
|
137
|
+
path,
|
|
138
|
+
jspark,
|
|
139
|
+
use_openvino,
|
|
140
|
+
)
|
|
79
141
|
|
|
80
142
|
class _DeBERTaLoader(ExtendedJavaWrapper):
|
|
81
143
|
def __init__(self, path, jspark):
|
|
82
144
|
super(_DeBERTaLoader, self).__init__(
|
|
83
|
-
"com.johnsnowlabs.nlp.embeddings.DeBertaEmbeddings.loadSavedModel",
|
|
84
|
-
|
|
145
|
+
"com.johnsnowlabs.nlp.embeddings.DeBertaEmbeddings.loadSavedModel",
|
|
146
|
+
path,
|
|
147
|
+
jspark,
|
|
148
|
+
)
|
|
85
149
|
|
|
86
150
|
|
|
87
151
|
class _DeBertaSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
88
152
|
def __init__(self, path, jspark):
|
|
89
153
|
super(_DeBertaSequenceClassifierLoader, self).__init__(
|
|
90
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForSequenceClassification.loadSavedModel",
|
|
91
|
-
|
|
154
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForSequenceClassification.loadSavedModel",
|
|
155
|
+
path,
|
|
156
|
+
jspark,
|
|
157
|
+
)
|
|
92
158
|
|
|
93
159
|
|
|
94
160
|
class _DeBertTokenClassifierLoader(ExtendedJavaWrapper):
|
|
95
161
|
def __init__(self, path, jspark):
|
|
96
162
|
super(_DeBertTokenClassifierLoader, self).__init__(
|
|
97
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForTokenClassification.loadSavedModel",
|
|
163
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForTokenClassification.loadSavedModel",
|
|
164
|
+
path,
|
|
165
|
+
jspark,
|
|
166
|
+
)
|
|
98
167
|
|
|
99
168
|
|
|
100
169
|
class _DeBertaQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
101
170
|
def __init__(self, path, jspark):
|
|
102
171
|
super(_DeBertaQuestionAnsweringLoader, self).__init__(
|
|
103
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForQuestionAnswering.loadSavedModel",
|
|
104
|
-
|
|
172
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForQuestionAnswering.loadSavedModel",
|
|
173
|
+
path,
|
|
174
|
+
jspark,
|
|
175
|
+
)
|
|
105
176
|
|
|
106
177
|
|
|
107
178
|
class _CamemBertLoader(ExtendedJavaWrapper):
|
|
108
179
|
def __init__(self, path, jspark):
|
|
109
|
-
super(_CamemBertLoader, self).__init__(
|
|
110
|
-
|
|
111
|
-
|
|
180
|
+
super(_CamemBertLoader, self).__init__(
|
|
181
|
+
"com.johnsnowlabs.nlp.embeddings.CamemBertEmbeddings.loadSavedModel",
|
|
182
|
+
path,
|
|
183
|
+
jspark,
|
|
184
|
+
)
|
|
185
|
+
|
|
186
|
+
class _CPMLoader(ExtendedJavaWrapper):
|
|
187
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
188
|
+
super(_CPMLoader, self).__init__(
|
|
189
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.CPMTransformer.loadSavedModel",
|
|
190
|
+
path,
|
|
191
|
+
jspark,
|
|
192
|
+
use_openvino
|
|
193
|
+
)
|
|
112
194
|
|
|
113
195
|
|
|
114
196
|
class _DistilBertLoader(ExtendedJavaWrapper):
|
|
115
197
|
def __init__(self, path, jspark):
|
|
116
|
-
super(_DistilBertLoader, self).__init__(
|
|
117
|
-
|
|
198
|
+
super(_DistilBertLoader, self).__init__(
|
|
199
|
+
"com.johnsnowlabs.nlp.embeddings.DistilBertEmbeddings.loadSavedModel",
|
|
200
|
+
path,
|
|
201
|
+
jspark,
|
|
202
|
+
)
|
|
118
203
|
|
|
119
204
|
|
|
120
205
|
class _DistilBertSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
121
206
|
def __init__(self, path, jspark):
|
|
122
207
|
super(_DistilBertSequenceClassifierLoader, self).__init__(
|
|
123
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForSequenceClassification.loadSavedModel",
|
|
124
|
-
|
|
208
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForSequenceClassification.loadSavedModel",
|
|
209
|
+
path,
|
|
210
|
+
jspark,
|
|
211
|
+
)
|
|
125
212
|
|
|
126
213
|
|
|
127
214
|
class _DistilBertTokenClassifierLoader(ExtendedJavaWrapper):
|
|
128
215
|
def __init__(self, path, jspark):
|
|
129
216
|
super(_DistilBertTokenClassifierLoader, self).__init__(
|
|
130
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForTokenClassification.loadSavedModel",
|
|
131
|
-
|
|
217
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForTokenClassification.loadSavedModel",
|
|
218
|
+
path,
|
|
219
|
+
jspark,
|
|
220
|
+
)
|
|
132
221
|
|
|
133
222
|
|
|
134
223
|
class _DistilBertQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
135
224
|
def __init__(self, path, jspark):
|
|
136
225
|
super(_DistilBertQuestionAnsweringLoader, self).__init__(
|
|
137
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForQuestionAnswering.loadSavedModel",
|
|
138
|
-
|
|
226
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForQuestionAnswering.loadSavedModel",
|
|
227
|
+
path,
|
|
228
|
+
jspark,
|
|
229
|
+
)
|
|
230
|
+
|
|
231
|
+
|
|
232
|
+
class _DistilBertMultipleChoiceLoader(ExtendedJavaWrapper):
|
|
233
|
+
def __init__(self, path, jspark):
|
|
234
|
+
super(_DistilBertMultipleChoiceLoader, self).__init__(
|
|
235
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForMultipleChoice.loadSavedModel",
|
|
236
|
+
path,
|
|
237
|
+
jspark,
|
|
238
|
+
)
|
|
139
239
|
|
|
140
240
|
|
|
141
241
|
class _ElmoLoader(ExtendedJavaWrapper):
|
|
142
242
|
def __init__(self, path, jspark):
|
|
143
|
-
super(_ElmoLoader, self).__init__(
|
|
243
|
+
super(_ElmoLoader, self).__init__(
|
|
244
|
+
"com.johnsnowlabs.nlp.embeddings.ElmoEmbeddings.loadSavedModel",
|
|
245
|
+
path,
|
|
246
|
+
jspark,
|
|
247
|
+
)
|
|
248
|
+
|
|
249
|
+
|
|
250
|
+
class _E5Loader(ExtendedJavaWrapper):
|
|
251
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
252
|
+
super(_E5Loader, self).__init__(
|
|
253
|
+
"com.johnsnowlabs.nlp.embeddings.E5Embeddings.loadSavedModel",
|
|
254
|
+
path,
|
|
255
|
+
jspark,
|
|
256
|
+
use_openvino,
|
|
257
|
+
)
|
|
258
|
+
|
|
259
|
+
|
|
260
|
+
class _MiniLMLoader(ExtendedJavaWrapper):
|
|
261
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
262
|
+
super(_MiniLMLoader, self).__init__(
|
|
263
|
+
"com.johnsnowlabs.nlp.embeddings.MiniLMEmbeddings.loadSavedModel",
|
|
264
|
+
path,
|
|
265
|
+
jspark,
|
|
266
|
+
use_openvino,
|
|
267
|
+
)
|
|
268
|
+
|
|
269
|
+
|
|
270
|
+
class _BGELoader(ExtendedJavaWrapper):
|
|
271
|
+
def __init__(self, path, jspark):
|
|
272
|
+
super(_BGELoader, self).__init__(
|
|
273
|
+
"com.johnsnowlabs.nlp.embeddings.BGEEmbeddings.loadSavedModel", path, jspark
|
|
274
|
+
)
|
|
144
275
|
|
|
145
276
|
|
|
146
277
|
class _GPT2Loader(ExtendedJavaWrapper):
|
|
147
278
|
def __init__(self, path, jspark):
|
|
148
279
|
super(_GPT2Loader, self).__init__(
|
|
149
|
-
"com.johnsnowlabs.nlp.annotators.seq2seq.GPT2Transformer.loadSavedModel",
|
|
280
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.GPT2Transformer.loadSavedModel",
|
|
281
|
+
path,
|
|
282
|
+
jspark,
|
|
283
|
+
)
|
|
284
|
+
|
|
285
|
+
class _Gemma3ForMultiModalLoader(ExtendedJavaWrapper):
|
|
286
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
287
|
+
super(_Gemma3ForMultiModalLoader, self).__init__(
|
|
288
|
+
"com.johnsnowlabs.nlp.annotators.cv.Gemma3ForMultiModal.loadSavedModel",
|
|
289
|
+
path,
|
|
290
|
+
jspark,
|
|
291
|
+
use_openvino
|
|
292
|
+
)
|
|
293
|
+
|
|
294
|
+
class _InternVLForMultiModalLoader(ExtendedJavaWrapper):
|
|
295
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
296
|
+
super(_InternVLForMultiModalLoader, self).__init__(
|
|
297
|
+
"com.johnsnowlabs.nlp.annotators.cv.InternVLForMultiModal.loadSavedModel",
|
|
298
|
+
path,
|
|
299
|
+
jspark,
|
|
300
|
+
use_openvino
|
|
301
|
+
)
|
|
150
302
|
|
|
151
303
|
|
|
304
|
+
class _JanusForMultiModalLoader(ExtendedJavaWrapper):
|
|
305
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
306
|
+
super(_JanusForMultiModalLoader, self).__init__(
|
|
307
|
+
"com.johnsnowlabs.nlp.annotators.cv.JanusForMultiModal.loadSavedModel",
|
|
308
|
+
path,
|
|
309
|
+
jspark,
|
|
310
|
+
use_openvino
|
|
311
|
+
)
|
|
312
|
+
|
|
313
|
+
class _LLAMA2Loader(ExtendedJavaWrapper):
|
|
314
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
315
|
+
super(_LLAMA2Loader, self).__init__(
|
|
316
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.LLAMA2Transformer.loadSavedModel",
|
|
317
|
+
path,
|
|
318
|
+
jspark,
|
|
319
|
+
use_openvino,
|
|
320
|
+
)
|
|
321
|
+
|
|
322
|
+
class _LLAMA3Loader(ExtendedJavaWrapper):
|
|
323
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
324
|
+
super(_LLAMA3Loader, self).__init__(
|
|
325
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.LLAMA3Transformer.loadSavedModel",
|
|
326
|
+
path,
|
|
327
|
+
jspark,
|
|
328
|
+
use_openvino,
|
|
329
|
+
)
|
|
330
|
+
|
|
152
331
|
class _LongformerLoader(ExtendedJavaWrapper):
|
|
153
332
|
def __init__(self, path, jspark):
|
|
154
|
-
super(_LongformerLoader, self).__init__(
|
|
155
|
-
|
|
156
|
-
|
|
333
|
+
super(_LongformerLoader, self).__init__(
|
|
334
|
+
"com.johnsnowlabs.nlp.embeddings.LongformerEmbeddings.loadSavedModel",
|
|
335
|
+
path,
|
|
336
|
+
jspark,
|
|
337
|
+
)
|
|
157
338
|
|
|
158
339
|
|
|
159
340
|
class _LongformerSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
160
341
|
def __init__(self, path, jspark):
|
|
161
342
|
super(_LongformerSequenceClassifierLoader, self).__init__(
|
|
162
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.LongformerForSequenceClassification.loadSavedModel",
|
|
163
|
-
|
|
343
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.LongformerForSequenceClassification.loadSavedModel",
|
|
344
|
+
path,
|
|
345
|
+
jspark,
|
|
346
|
+
)
|
|
164
347
|
|
|
165
348
|
|
|
166
349
|
class _LongformerTokenClassifierLoader(ExtendedJavaWrapper):
|
|
167
350
|
def __init__(self, path, jspark):
|
|
168
351
|
super(_LongformerTokenClassifierLoader, self).__init__(
|
|
169
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.LongformerForTokenClassification.loadSavedModel",
|
|
170
|
-
|
|
352
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.LongformerForTokenClassification.loadSavedModel",
|
|
353
|
+
path,
|
|
354
|
+
jspark,
|
|
355
|
+
)
|
|
171
356
|
|
|
172
357
|
|
|
173
358
|
class _LongformerQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
174
359
|
def __init__(self, path, jspark):
|
|
175
360
|
super(_LongformerQuestionAnsweringLoader, self).__init__(
|
|
176
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.LongformerForQuestionAnswering.loadSavedModel",
|
|
177
|
-
|
|
361
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.LongformerForQuestionAnswering.loadSavedModel",
|
|
362
|
+
path,
|
|
363
|
+
jspark,
|
|
364
|
+
)
|
|
365
|
+
|
|
366
|
+
class _LLAVAForMultiModalLoader(ExtendedJavaWrapper):
|
|
367
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
368
|
+
super(_LLAVAForMultiModalLoader, self).__init__(
|
|
369
|
+
"com.johnsnowlabs.nlp.annotators.cv.LLAVAForMultiModal.loadSavedModel",
|
|
370
|
+
path,
|
|
371
|
+
jspark,
|
|
372
|
+
use_openvino
|
|
373
|
+
)
|
|
374
|
+
|
|
375
|
+
class _M2M100Loader(ExtendedJavaWrapper):
|
|
376
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
377
|
+
super(_M2M100Loader, self).__init__(
|
|
378
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.M2M100Transformer.loadSavedModel",
|
|
379
|
+
path,
|
|
380
|
+
jspark,
|
|
381
|
+
)
|
|
178
382
|
|
|
179
383
|
|
|
384
|
+
class _MistralLoader(ExtendedJavaWrapper):
|
|
385
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
386
|
+
super(_MistralLoader, self).__init__(
|
|
387
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.MistralTransformer.loadSavedModel",
|
|
388
|
+
path,
|
|
389
|
+
jspark,
|
|
390
|
+
use_openvino,
|
|
391
|
+
)
|
|
392
|
+
|
|
393
|
+
class _MLLamaForMultimodalLoader(ExtendedJavaWrapper):
|
|
394
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
395
|
+
super(_MLLamaForMultimodalLoader, self).__init__(
|
|
396
|
+
"com.johnsnowlabs.nlp.annotators.cv.MLLamaForMultimodal.loadSavedModel",
|
|
397
|
+
path,
|
|
398
|
+
jspark,
|
|
399
|
+
use_openvino
|
|
400
|
+
)
|
|
401
|
+
|
|
402
|
+
class _NLLBLoader(ExtendedJavaWrapper):
|
|
403
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
404
|
+
super(_NLLBLoader, self).__init__(
|
|
405
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.NLLBTransformer.loadSavedModel",
|
|
406
|
+
path,
|
|
407
|
+
jspark,
|
|
408
|
+
use_openvino)
|
|
409
|
+
|
|
180
410
|
class _MarianLoader(ExtendedJavaWrapper):
|
|
181
411
|
def __init__(self, path, jspark):
|
|
182
412
|
super(_MarianLoader, self).__init__(
|
|
183
|
-
"com.johnsnowlabs.nlp.annotators.seq2seq.MarianTransformer.loadSavedModel",
|
|
413
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.MarianTransformer.loadSavedModel",
|
|
414
|
+
path,
|
|
415
|
+
jspark,
|
|
416
|
+
)
|
|
184
417
|
|
|
185
418
|
|
|
186
|
-
class
|
|
419
|
+
class _MPNetLoader(ExtendedJavaWrapper):
|
|
187
420
|
def __init__(self, path, jspark):
|
|
188
|
-
super(
|
|
189
|
-
|
|
421
|
+
super(_MPNetLoader, self).__init__(
|
|
422
|
+
"com.johnsnowlabs.nlp.embeddings.MPNetEmbeddings.loadSavedModel",
|
|
423
|
+
path,
|
|
424
|
+
jspark,
|
|
425
|
+
)
|
|
426
|
+
|
|
427
|
+
|
|
428
|
+
class _OLMoLoader(ExtendedJavaWrapper):
|
|
429
|
+
def __init__(self, path, jspark):
|
|
430
|
+
super(_OLMoLoader, self).__init__(
|
|
431
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.OLMoTransformer.loadSavedModel", path, jspark)
|
|
432
|
+
class _Phi2Loader(ExtendedJavaWrapper):
|
|
433
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
434
|
+
super(_Phi2Loader, self).__init__(
|
|
435
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.Phi2Transformer.loadSavedModel",
|
|
436
|
+
path,
|
|
437
|
+
jspark,
|
|
438
|
+
use_openvino,
|
|
439
|
+
)
|
|
440
|
+
|
|
441
|
+
class _Phi3Loader(ExtendedJavaWrapper):
|
|
442
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
443
|
+
super(_Phi3Loader, self).__init__(
|
|
444
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.Phi3Transformer.loadSavedModel",
|
|
445
|
+
path,
|
|
446
|
+
jspark,
|
|
447
|
+
use_openvino,
|
|
448
|
+
)
|
|
449
|
+
|
|
450
|
+
class _Phi3VisionLoader(ExtendedJavaWrapper):
|
|
451
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
452
|
+
super(_Phi3VisionLoader, self).__init__(
|
|
453
|
+
"com.johnsnowlabs.nlp.annotators.cv.Phi3Vision.loadSavedModel",
|
|
454
|
+
path,
|
|
455
|
+
jspark,
|
|
456
|
+
use_openvino
|
|
457
|
+
)
|
|
458
|
+
|
|
459
|
+
class _RoBertaLoader(ExtendedJavaWrapper):
|
|
460
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
461
|
+
super(_RoBertaLoader, self).__init__(
|
|
462
|
+
"com.johnsnowlabs.nlp.embeddings.RoBertaEmbeddings.loadSavedModel",
|
|
463
|
+
path,
|
|
464
|
+
jspark,
|
|
465
|
+
use_openvino,
|
|
466
|
+
)
|
|
190
467
|
|
|
191
468
|
|
|
192
469
|
class _RoBertaSentenceLoader(ExtendedJavaWrapper):
|
|
193
470
|
def __init__(self, path, jspark):
|
|
194
471
|
super(_RoBertaSentenceLoader, self).__init__(
|
|
195
|
-
"com.johnsnowlabs.nlp.embeddings.RoBertaSentenceEmbeddings.loadSavedModel",
|
|
472
|
+
"com.johnsnowlabs.nlp.embeddings.RoBertaSentenceEmbeddings.loadSavedModel",
|
|
473
|
+
path,
|
|
474
|
+
jspark,
|
|
475
|
+
)
|
|
196
476
|
|
|
197
477
|
|
|
198
478
|
class _RoBertaSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
199
479
|
def __init__(self, path, jspark):
|
|
200
480
|
super(_RoBertaSequenceClassifierLoader, self).__init__(
|
|
201
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForSequenceClassification.loadSavedModel",
|
|
202
|
-
|
|
481
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForSequenceClassification.loadSavedModel",
|
|
482
|
+
path,
|
|
483
|
+
jspark,
|
|
484
|
+
)
|
|
203
485
|
|
|
204
486
|
|
|
205
487
|
class _RoBertaTokenClassifierLoader(ExtendedJavaWrapper):
|
|
206
488
|
def __init__(self, path, jspark):
|
|
207
489
|
super(_RoBertaTokenClassifierLoader, self).__init__(
|
|
208
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForTokenClassification.loadSavedModel",
|
|
490
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForTokenClassification.loadSavedModel",
|
|
491
|
+
path,
|
|
492
|
+
jspark,
|
|
493
|
+
)
|
|
209
494
|
|
|
210
495
|
|
|
211
496
|
class _RoBertaQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
212
497
|
def __init__(self, path, jspark):
|
|
213
498
|
super(_RoBertaQuestionAnsweringLoader, self).__init__(
|
|
214
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForQuestionAnswering.loadSavedModel",
|
|
499
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForQuestionAnswering.loadSavedModel",
|
|
500
|
+
path,
|
|
501
|
+
jspark,
|
|
502
|
+
)
|
|
503
|
+
|
|
215
504
|
|
|
505
|
+
class _RoBertaMultipleChoiceLoader(ExtendedJavaWrapper):
|
|
506
|
+
def __init__(self, path, jspark):
|
|
507
|
+
super(_RoBertaMultipleChoiceLoader, self).__init__(
|
|
508
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForMultipleChoice.loadSavedModel",
|
|
509
|
+
path,
|
|
510
|
+
jspark,
|
|
511
|
+
)
|
|
512
|
+
|
|
513
|
+
|
|
514
|
+
class _StarCoderLoader(ExtendedJavaWrapper):
|
|
515
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
516
|
+
super(_StarCoderLoader, self).__init__(
|
|
517
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.StarCoderTransformer.loadSavedModel",
|
|
518
|
+
path,
|
|
519
|
+
jspark,
|
|
520
|
+
use_openvino,
|
|
521
|
+
)
|
|
216
522
|
|
|
217
523
|
class _T5Loader(ExtendedJavaWrapper):
|
|
218
524
|
def __init__(self, path, jspark):
|
|
219
525
|
super(_T5Loader, self).__init__(
|
|
220
|
-
"com.johnsnowlabs.nlp.annotators.seq2seq.T5Transformer.loadSavedModel",
|
|
526
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.T5Transformer.loadSavedModel",
|
|
527
|
+
path,
|
|
528
|
+
jspark,
|
|
529
|
+
)
|
|
530
|
+
|
|
531
|
+
|
|
532
|
+
class _BartLoader(ExtendedJavaWrapper):
|
|
533
|
+
def __init__(self, path, jspark, useCache):
|
|
534
|
+
super(_BartLoader, self).__init__(
|
|
535
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.BartTransformer.loadSavedModel",
|
|
536
|
+
path,
|
|
537
|
+
jspark,
|
|
538
|
+
useCache,
|
|
539
|
+
)
|
|
540
|
+
|
|
541
|
+
|
|
542
|
+
class _NomicLoader(ExtendedJavaWrapper):
|
|
543
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
544
|
+
super(_NomicLoader, self).__init__("com.johnsnowlabs.nlp.embeddings.NomicEmbeddings.loadSavedModel", path, jspark, use_openvino)
|
|
545
|
+
|
|
546
|
+
|
|
547
|
+
class _QwenLoader(ExtendedJavaWrapper):
|
|
548
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
549
|
+
super(_QwenLoader, self).__init__(
|
|
550
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.QwenTransformer.loadSavedModel", path, jspark, use_openvino)
|
|
221
551
|
|
|
222
552
|
|
|
223
553
|
class _USELoader(ExtendedJavaWrapper):
|
|
224
554
|
def __init__(self, path, jspark, loadsp):
|
|
225
|
-
super(_USELoader, self).__init__(
|
|
226
|
-
|
|
555
|
+
super(_USELoader, self).__init__(
|
|
556
|
+
"com.johnsnowlabs.nlp.embeddings.UniversalSentenceEncoder.loadSavedModel",
|
|
557
|
+
path,
|
|
558
|
+
jspark,
|
|
559
|
+
loadsp,
|
|
560
|
+
)
|
|
227
561
|
|
|
228
562
|
|
|
229
563
|
class _XlmRoBertaLoader(ExtendedJavaWrapper):
|
|
230
|
-
def __init__(self, path, jspark):
|
|
231
|
-
super(_XlmRoBertaLoader, self).__init__(
|
|
232
|
-
|
|
564
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
565
|
+
super(_XlmRoBertaLoader, self).__init__(
|
|
566
|
+
"com.johnsnowlabs.nlp.embeddings.XlmRoBertaEmbeddings.loadSavedModel",
|
|
567
|
+
path,
|
|
568
|
+
jspark,
|
|
569
|
+
use_openvino,
|
|
570
|
+
)
|
|
233
571
|
|
|
234
572
|
|
|
235
573
|
class _XlmRoBertaSentenceLoader(ExtendedJavaWrapper):
|
|
236
574
|
def __init__(self, path, jspark):
|
|
237
575
|
super(_XlmRoBertaSentenceLoader, self).__init__(
|
|
238
|
-
"com.johnsnowlabs.nlp.embeddings.XlmRoBertaSentenceEmbeddings.loadSavedModel",
|
|
576
|
+
"com.johnsnowlabs.nlp.embeddings.XlmRoBertaSentenceEmbeddings.loadSavedModel",
|
|
577
|
+
path,
|
|
578
|
+
jspark,
|
|
579
|
+
)
|
|
239
580
|
|
|
240
581
|
|
|
241
582
|
class _XlmRoBertaSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
242
583
|
def __init__(self, path, jspark):
|
|
243
584
|
super(_XlmRoBertaSequenceClassifierLoader, self).__init__(
|
|
244
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForSequenceClassification.loadSavedModel",
|
|
245
|
-
|
|
585
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForSequenceClassification.loadSavedModel",
|
|
586
|
+
path,
|
|
587
|
+
jspark,
|
|
588
|
+
)
|
|
246
589
|
|
|
247
590
|
|
|
248
591
|
class _XlmRoBertaTokenClassifierLoader(ExtendedJavaWrapper):
|
|
249
592
|
def __init__(self, path, jspark):
|
|
250
593
|
super(_XlmRoBertaTokenClassifierLoader, self).__init__(
|
|
251
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForTokenClassification.loadSavedModel",
|
|
252
|
-
|
|
594
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForTokenClassification.loadSavedModel",
|
|
595
|
+
path,
|
|
596
|
+
jspark,
|
|
597
|
+
)
|
|
253
598
|
|
|
254
599
|
|
|
255
600
|
class _XlmRoBertaQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
256
601
|
def __init__(self, path, jspark):
|
|
257
602
|
super(_XlmRoBertaQuestionAnsweringLoader, self).__init__(
|
|
258
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForQuestionAnswering.loadSavedModel",
|
|
259
|
-
|
|
603
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForQuestionAnswering.loadSavedModel",
|
|
604
|
+
path,
|
|
605
|
+
jspark,
|
|
606
|
+
)
|
|
607
|
+
|
|
608
|
+
|
|
609
|
+
class _XlmRoBertaMultipleChoiceLoader(ExtendedJavaWrapper):
|
|
610
|
+
def __init__(self, path, jspark):
|
|
611
|
+
super(_XlmRoBertaMultipleChoiceLoader, self).__init__(
|
|
612
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForMultipleChoice.loadSavedModel",
|
|
613
|
+
path,
|
|
614
|
+
jspark,
|
|
615
|
+
)
|
|
260
616
|
|
|
261
617
|
|
|
262
618
|
class _XlnetLoader(ExtendedJavaWrapper):
|
|
263
619
|
def __init__(self, path, jspark):
|
|
264
|
-
super(_XlnetLoader, self).__init__(
|
|
265
|
-
|
|
620
|
+
super(_XlnetLoader, self).__init__(
|
|
621
|
+
"com.johnsnowlabs.nlp.embeddings.XlnetEmbeddings.loadSavedModel",
|
|
622
|
+
path,
|
|
623
|
+
jspark,
|
|
624
|
+
)
|
|
266
625
|
|
|
267
626
|
|
|
268
627
|
class _XlnetSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
269
628
|
def __init__(self, path, jspark):
|
|
270
629
|
super(_XlnetSequenceClassifierLoader, self).__init__(
|
|
271
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlnetForSequenceClassification.loadSavedModel",
|
|
272
|
-
|
|
630
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlnetForSequenceClassification.loadSavedModel",
|
|
631
|
+
path,
|
|
632
|
+
jspark,
|
|
633
|
+
)
|
|
273
634
|
|
|
274
635
|
|
|
275
636
|
class _XlnetTokenClassifierLoader(ExtendedJavaWrapper):
|
|
276
637
|
def __init__(self, path, jspark):
|
|
277
638
|
super(_XlnetTokenClassifierLoader, self).__init__(
|
|
278
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlnetForTokenClassification.loadSavedModel",
|
|
639
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlnetForTokenClassification.loadSavedModel",
|
|
640
|
+
path,
|
|
641
|
+
jspark,
|
|
642
|
+
)
|
|
279
643
|
|
|
280
644
|
|
|
281
645
|
class _ClearCache(ExtendedJavaWrapper):
|
|
282
646
|
def __init__(self, name, language, remote_loc):
|
|
283
|
-
super(_ClearCache, self).__init__(
|
|
284
|
-
|
|
647
|
+
super(_ClearCache, self).__init__(
|
|
648
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.clearCache",
|
|
649
|
+
name,
|
|
650
|
+
language,
|
|
651
|
+
remote_loc,
|
|
652
|
+
)
|
|
285
653
|
|
|
286
654
|
|
|
287
655
|
class _CoNLLGeneratorExportFromTargetAndPipeline(ExtendedJavaWrapper):
|
|
@@ -293,50 +661,76 @@ class _CoNLLGeneratorExportFromTargetAndPipeline(ExtendedJavaWrapper):
|
|
|
293
661
|
if type(target) == DataFrame:
|
|
294
662
|
super(_CoNLLGeneratorExportFromTargetAndPipeline, self).__init__(
|
|
295
663
|
"com.johnsnowlabs.util.CoNLLGenerator.exportConllFiles",
|
|
296
|
-
target._jdf,
|
|
664
|
+
target._jdf,
|
|
665
|
+
pipeline,
|
|
666
|
+
output_path,
|
|
667
|
+
)
|
|
297
668
|
else:
|
|
298
669
|
super(_CoNLLGeneratorExportFromTargetAndPipeline, self).__init__(
|
|
299
670
|
"com.johnsnowlabs.util.CoNLLGenerator.exportConllFiles",
|
|
300
|
-
spark._jsparkSession,
|
|
671
|
+
spark._jsparkSession,
|
|
672
|
+
target,
|
|
673
|
+
pipeline,
|
|
674
|
+
output_path,
|
|
675
|
+
)
|
|
301
676
|
|
|
302
677
|
|
|
303
678
|
class _CoNLLGeneratorExportFromDataFrameAndField(ExtendedJavaWrapper):
|
|
304
679
|
|
|
305
680
|
def __init__(self, dataframe, output_path, metadata_sentence_key):
|
|
306
681
|
super(_CoNLLGeneratorExportFromDataFrameAndField, self).__init__(
|
|
307
|
-
"com.johnsnowlabs.util.CoNLLGenerator.exportConllFilesFromField",
|
|
308
|
-
|
|
682
|
+
"com.johnsnowlabs.util.CoNLLGenerator.exportConllFilesFromField",
|
|
683
|
+
dataframe,
|
|
684
|
+
output_path,
|
|
685
|
+
metadata_sentence_key,
|
|
686
|
+
)
|
|
309
687
|
|
|
310
688
|
|
|
311
689
|
class _CoNLLGeneratorExportFromDataFrame(ExtendedJavaWrapper):
|
|
312
690
|
def __init__(self, dataframe, output_path):
|
|
313
691
|
super(_CoNLLGeneratorExportFromDataFrame, self).__init__(
|
|
314
692
|
"com.johnsnowlabs.util.CoNLLGenerator.exportConllFiles",
|
|
315
|
-
dataframe,
|
|
693
|
+
dataframe,
|
|
694
|
+
output_path,
|
|
695
|
+
)
|
|
316
696
|
|
|
317
697
|
|
|
318
698
|
class _CoverageResult(ExtendedJavaWrapper):
|
|
319
699
|
def __init__(self, covered, total, percentage):
|
|
320
|
-
super(_CoverageResult, self).__init__(
|
|
321
|
-
|
|
700
|
+
super(_CoverageResult, self).__init__(
|
|
701
|
+
"com.johnsnowlabs.nlp.embeddings.CoverageResult", covered, total, percentage
|
|
702
|
+
)
|
|
322
703
|
|
|
323
704
|
|
|
324
705
|
class _DownloadModelDirectly(ExtendedJavaWrapper):
|
|
325
|
-
def __init__(self, name, remote_loc="public/models"):
|
|
706
|
+
def __init__(self, name, remote_loc="public/models", unzip=True):
|
|
326
707
|
super(_DownloadModelDirectly, self).__init__(
|
|
327
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.downloadModelDirectly",
|
|
708
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.downloadModelDirectly",
|
|
709
|
+
name,
|
|
710
|
+
remote_loc,
|
|
711
|
+
unzip,
|
|
712
|
+
)
|
|
328
713
|
|
|
329
714
|
|
|
330
715
|
class _DownloadModel(ExtendedJavaWrapper):
|
|
331
716
|
def __init__(self, reader, name, language, remote_loc, validator):
|
|
332
|
-
super(_DownloadModel, self).__init__(
|
|
333
|
-
|
|
717
|
+
super(_DownloadModel, self).__init__(
|
|
718
|
+
"com.johnsnowlabs.nlp.pretrained." + validator + ".downloadModel",
|
|
719
|
+
reader,
|
|
720
|
+
name,
|
|
721
|
+
language,
|
|
722
|
+
remote_loc,
|
|
723
|
+
)
|
|
334
724
|
|
|
335
725
|
|
|
336
726
|
class _DownloadPipeline(ExtendedJavaWrapper):
|
|
337
727
|
def __init__(self, name, language, remote_loc):
|
|
338
728
|
super(_DownloadPipeline, self).__init__(
|
|
339
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.downloadPipeline",
|
|
729
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.downloadPipeline",
|
|
730
|
+
name,
|
|
731
|
+
language,
|
|
732
|
+
remote_loc,
|
|
733
|
+
)
|
|
340
734
|
|
|
341
735
|
|
|
342
736
|
class _DownloadPredefinedPipeline(ExtendedJavaWrapper):
|
|
@@ -347,116 +741,215 @@ class _DownloadPredefinedPipeline(ExtendedJavaWrapper):
|
|
|
347
741
|
class _EmbeddingsCoverageColumn(ExtendedJavaWrapper):
|
|
348
742
|
def __init__(self, dataset, embeddings_col, output_col):
|
|
349
743
|
super(_EmbeddingsCoverageColumn, self).__init__(
|
|
350
|
-
"com.johnsnowlabs.nlp.embeddings.WordEmbeddingsModel.withCoverageColumn",
|
|
351
|
-
|
|
744
|
+
"com.johnsnowlabs.nlp.embeddings.WordEmbeddingsModel.withCoverageColumn",
|
|
745
|
+
dataset._jdf,
|
|
746
|
+
embeddings_col,
|
|
747
|
+
output_col,
|
|
748
|
+
)
|
|
352
749
|
|
|
353
750
|
|
|
354
751
|
class _EmbeddingsOverallCoverage(ExtendedJavaWrapper):
|
|
355
752
|
def __init__(self, dataset, embeddings_col):
|
|
356
753
|
super(_EmbeddingsOverallCoverage, self).__init__(
|
|
357
|
-
"com.johnsnowlabs.nlp.embeddings.WordEmbeddingsModel.overallCoverage",
|
|
754
|
+
"com.johnsnowlabs.nlp.embeddings.WordEmbeddingsModel.overallCoverage",
|
|
755
|
+
dataset._jdf,
|
|
756
|
+
embeddings_col,
|
|
757
|
+
)
|
|
358
758
|
|
|
359
759
|
|
|
360
760
|
class _ExternalResource(ExtendedJavaWrapper):
|
|
361
761
|
def __init__(self, path, read_as, options):
|
|
362
|
-
super(_ExternalResource, self).__init__(
|
|
363
|
-
|
|
762
|
+
super(_ExternalResource, self).__init__(
|
|
763
|
+
"com.johnsnowlabs.nlp.util.io.ExternalResource.fromJava",
|
|
764
|
+
path,
|
|
765
|
+
read_as,
|
|
766
|
+
options,
|
|
767
|
+
)
|
|
364
768
|
|
|
365
769
|
|
|
366
770
|
class _ConfigLoaderGetter(ExtendedJavaWrapper):
|
|
367
771
|
def __init__(self):
|
|
368
|
-
super(_ConfigLoaderGetter, self).__init__(
|
|
772
|
+
super(_ConfigLoaderGetter, self).__init__(
|
|
773
|
+
"com.johnsnowlabs.util.ConfigLoader.getConfigPath"
|
|
774
|
+
)
|
|
369
775
|
|
|
370
776
|
|
|
371
777
|
class _GetResourceSize(ExtendedJavaWrapper):
|
|
372
778
|
def __init__(self, name, language, remote_loc):
|
|
373
779
|
super(_GetResourceSize, self).__init__(
|
|
374
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.getDownloadSize",
|
|
780
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.getDownloadSize",
|
|
781
|
+
name,
|
|
782
|
+
language,
|
|
783
|
+
remote_loc,
|
|
784
|
+
)
|
|
375
785
|
|
|
376
786
|
|
|
377
787
|
class _LightPipeline(ExtendedJavaWrapper):
|
|
378
788
|
def __init__(self, pipelineModel, parse_embeddings):
|
|
379
|
-
super(_LightPipeline, self).__init__(
|
|
380
|
-
|
|
789
|
+
super(_LightPipeline, self).__init__(
|
|
790
|
+
"com.johnsnowlabs.nlp.LightPipeline",
|
|
791
|
+
pipelineModel._to_java(),
|
|
792
|
+
parse_embeddings,
|
|
793
|
+
)
|
|
381
794
|
|
|
382
795
|
|
|
383
796
|
class _RegexRule(ExtendedJavaWrapper):
|
|
384
797
|
def __init__(self, rule, identifier):
|
|
385
|
-
super(_RegexRule, self).__init__(
|
|
798
|
+
super(_RegexRule, self).__init__(
|
|
799
|
+
"com.johnsnowlabs.nlp.util.regex.RegexRule", rule, identifier
|
|
800
|
+
)
|
|
386
801
|
|
|
387
802
|
|
|
388
803
|
class _ShowAvailableAnnotators(ExtendedJavaWrapper):
|
|
389
804
|
def __init__(self):
|
|
390
805
|
super(_ShowAvailableAnnotators, self).__init__(
|
|
391
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showAvailableAnnotators"
|
|
806
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showAvailableAnnotators"
|
|
807
|
+
)
|
|
392
808
|
|
|
393
809
|
|
|
394
810
|
class _ShowPublicModels(ExtendedJavaWrapper):
|
|
395
811
|
def __init__(self, annotator, lang, version):
|
|
396
812
|
super(_ShowPublicModels, self).__init__(
|
|
397
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showPublicModels",
|
|
813
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showPublicModels",
|
|
814
|
+
annotator,
|
|
815
|
+
lang,
|
|
816
|
+
version,
|
|
817
|
+
)
|
|
398
818
|
|
|
399
819
|
|
|
400
820
|
class _ShowPublicPipelines(ExtendedJavaWrapper):
|
|
401
821
|
def __init__(self, lang, version):
|
|
402
822
|
super(_ShowPublicPipelines, self).__init__(
|
|
403
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showPublicPipelines",
|
|
823
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showPublicPipelines",
|
|
824
|
+
lang,
|
|
825
|
+
version,
|
|
826
|
+
)
|
|
404
827
|
|
|
405
828
|
|
|
406
829
|
class _ShowUnCategorizedResources(ExtendedJavaWrapper):
|
|
407
830
|
def __init__(self):
|
|
408
831
|
super(_ShowUnCategorizedResources, self).__init__(
|
|
409
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showUnCategorizedResources"
|
|
832
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showUnCategorizedResources"
|
|
833
|
+
)
|
|
410
834
|
|
|
411
835
|
|
|
412
836
|
class _StorageHelper(ExtendedJavaWrapper):
|
|
413
837
|
def __init__(self, path, spark, database, storage_ref, within_storage):
|
|
414
|
-
super(_StorageHelper, self).__init__(
|
|
415
|
-
|
|
838
|
+
super(_StorageHelper, self).__init__(
|
|
839
|
+
"com.johnsnowlabs.storage.StorageHelper.load",
|
|
840
|
+
path,
|
|
841
|
+
spark._jsparkSession,
|
|
842
|
+
database,
|
|
843
|
+
storage_ref,
|
|
844
|
+
within_storage,
|
|
845
|
+
)
|
|
416
846
|
|
|
417
847
|
|
|
418
848
|
class _SpanBertCorefLoader(ExtendedJavaWrapper):
|
|
419
849
|
def __init__(self, path, jspark):
|
|
420
850
|
super(_SpanBertCorefLoader, self).__init__(
|
|
421
|
-
"com.johnsnowlabs.nlp.annotators.coref.SpanBertCorefModel.loadSavedModel",
|
|
851
|
+
"com.johnsnowlabs.nlp.annotators.coref.SpanBertCorefModel.loadSavedModel",
|
|
852
|
+
path,
|
|
853
|
+
jspark,
|
|
854
|
+
)
|
|
422
855
|
|
|
423
856
|
|
|
424
857
|
class _NerDLGraphBuilder(ExtendedJavaWrapper):
|
|
425
858
|
def __init__(self, dataset, input_col, label_col):
|
|
426
859
|
super(_NerDLGraphBuilder, self).__init__(
|
|
427
860
|
"com.johnsnowlabs.nlp.annotators.ner.dl.NerDLApproach.getGraphParams",
|
|
428
|
-
dataset,
|
|
861
|
+
dataset,
|
|
862
|
+
input_col,
|
|
863
|
+
label_col,
|
|
864
|
+
)
|
|
429
865
|
|
|
430
866
|
|
|
431
867
|
class _ResourceHelper_moveFile(ExtendedJavaWrapper):
|
|
432
868
|
def __init__(self, local_file, hdfs_file):
|
|
433
869
|
super(_ResourceHelper_moveFile, self).__init__(
|
|
434
|
-
"com.johnsnowlabs.nlp.util.io.ResourceHelper.moveFile",
|
|
870
|
+
"com.johnsnowlabs.nlp.util.io.ResourceHelper.moveFile",
|
|
871
|
+
local_file,
|
|
872
|
+
hdfs_file,
|
|
873
|
+
)
|
|
435
874
|
|
|
436
875
|
|
|
437
876
|
class _ResourceHelper_validFile(ExtendedJavaWrapper):
|
|
438
877
|
def __init__(self, path):
|
|
439
878
|
super(_ResourceHelper_validFile, self).__init__(
|
|
440
|
-
"com.johnsnowlabs.nlp.util.io.ResourceHelper.validFile", path
|
|
879
|
+
"com.johnsnowlabs.nlp.util.io.ResourceHelper.validFile", path
|
|
880
|
+
)
|
|
441
881
|
|
|
442
882
|
|
|
443
883
|
class _ViTForImageClassification(ExtendedJavaWrapper):
|
|
444
884
|
def __init__(self, path, jspark):
|
|
445
885
|
super(_ViTForImageClassification, self).__init__(
|
|
446
|
-
"com.johnsnowlabs.nlp.annotators.cv.ViTForImageClassification.loadSavedModel",
|
|
886
|
+
"com.johnsnowlabs.nlp.annotators.cv.ViTForImageClassification.loadSavedModel",
|
|
887
|
+
path,
|
|
888
|
+
jspark,
|
|
889
|
+
)
|
|
890
|
+
|
|
891
|
+
|
|
892
|
+
class _VisionEncoderDecoderForImageCaptioning(ExtendedJavaWrapper):
|
|
893
|
+
def __init__(self, path, jspark):
|
|
894
|
+
super(_VisionEncoderDecoderForImageCaptioning, self).__init__(
|
|
895
|
+
"com.johnsnowlabs.nlp.annotators.cv.VisionEncoderDecoderForImageCaptioning.loadSavedModel",
|
|
896
|
+
path,
|
|
897
|
+
jspark,
|
|
898
|
+
)
|
|
899
|
+
|
|
900
|
+
|
|
901
|
+
class _SwinForImageClassification(ExtendedJavaWrapper):
|
|
902
|
+
def __init__(self, path, jspark):
|
|
903
|
+
super(_SwinForImageClassification, self).__init__(
|
|
904
|
+
"com.johnsnowlabs.nlp.annotators.cv.SwinForImageClassification.loadSavedModel",
|
|
905
|
+
path,
|
|
906
|
+
jspark,
|
|
907
|
+
)
|
|
908
|
+
|
|
909
|
+
|
|
910
|
+
class _ConvNextForImageClassification(ExtendedJavaWrapper):
|
|
911
|
+
def __init__(self, path, jspark):
|
|
912
|
+
super(_ConvNextForImageClassification, self).__init__(
|
|
913
|
+
"com.johnsnowlabs.nlp.annotators.cv.ConvNextForImageClassification.loadSavedModel",
|
|
914
|
+
path,
|
|
915
|
+
jspark,
|
|
916
|
+
)
|
|
447
917
|
|
|
448
918
|
|
|
449
919
|
class _Wav2Vec2ForCTC(ExtendedJavaWrapper):
|
|
450
920
|
def __init__(self, path, jspark):
|
|
451
921
|
super(_Wav2Vec2ForCTC, self).__init__(
|
|
452
|
-
"com.johnsnowlabs.nlp.annotators.audio.Wav2Vec2ForCTC.loadSavedModel",
|
|
922
|
+
"com.johnsnowlabs.nlp.annotators.audio.Wav2Vec2ForCTC.loadSavedModel",
|
|
923
|
+
path,
|
|
924
|
+
jspark,
|
|
925
|
+
)
|
|
926
|
+
|
|
927
|
+
|
|
928
|
+
class _HubertForCTC(ExtendedJavaWrapper):
|
|
929
|
+
def __init__(self, path, jspark):
|
|
930
|
+
super(_HubertForCTC, self).__init__(
|
|
931
|
+
"com.johnsnowlabs.nlp.annotators.audio.HubertForCTC.loadSavedModel",
|
|
932
|
+
path,
|
|
933
|
+
jspark,
|
|
934
|
+
)
|
|
453
935
|
|
|
454
936
|
|
|
455
|
-
class
|
|
937
|
+
class _WhisperForCTC(ExtendedJavaWrapper):
|
|
456
938
|
def __init__(self, path, jspark):
|
|
457
|
-
super(
|
|
458
|
-
"com.johnsnowlabs.nlp.annotators.
|
|
459
|
-
|
|
939
|
+
super(_WhisperForCTC, self).__init__(
|
|
940
|
+
"com.johnsnowlabs.nlp.annotators.audio.WhisperForCTC.loadSavedModel",
|
|
941
|
+
path,
|
|
942
|
+
jspark,
|
|
943
|
+
)
|
|
944
|
+
|
|
945
|
+
|
|
946
|
+
class _CamemBertForTokenClassificationLoader(ExtendedJavaWrapper):
|
|
947
|
+
def __init__(self, path, jspark):
|
|
948
|
+
super(_CamemBertForTokenClassificationLoader, self).__init__(
|
|
949
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.CamemBertForTokenClassification.loadSavedModel",
|
|
950
|
+
path,
|
|
951
|
+
jspark,
|
|
952
|
+
)
|
|
460
953
|
|
|
461
954
|
|
|
462
955
|
class _TapasForQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
@@ -464,11 +957,243 @@ class _TapasForQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
|
464
957
|
super(_TapasForQuestionAnsweringLoader, self).__init__(
|
|
465
958
|
"com.johnsnowlabs.nlp.annotators.classifier.dl.TapasForQuestionAnswering.loadSavedModel",
|
|
466
959
|
path,
|
|
467
|
-
jspark
|
|
960
|
+
jspark,
|
|
961
|
+
)
|
|
468
962
|
|
|
469
963
|
|
|
470
|
-
class
|
|
964
|
+
class _CamemBertForSequenceClassificationLoader(ExtendedJavaWrapper):
|
|
965
|
+
def __init__(self, path, jspark):
|
|
966
|
+
super(_CamemBertForSequenceClassificationLoader, self).__init__(
|
|
967
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.CamemBertForSequenceClassification.loadSavedModel",
|
|
968
|
+
path,
|
|
969
|
+
jspark,
|
|
970
|
+
)
|
|
971
|
+
|
|
972
|
+
|
|
973
|
+
class _CamemBertQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
974
|
+
def __init__(self, path, jspark):
|
|
975
|
+
super(_CamemBertQuestionAnsweringLoader, self).__init__(
|
|
976
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.CamemBertForQuestionAnswering.loadSavedModel",
|
|
977
|
+
path,
|
|
978
|
+
jspark,
|
|
979
|
+
)
|
|
980
|
+
|
|
981
|
+
class _CamemBertForZeroShotClassificationLoader(ExtendedJavaWrapper):
|
|
982
|
+
def __init__(self, path, jspark):
|
|
983
|
+
super(_CamemBertForZeroShotClassificationLoader, self).__init__(
|
|
984
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.CamemBertForZeroShotClassification.loadSavedModel",
|
|
985
|
+
path,
|
|
986
|
+
jspark,
|
|
987
|
+
)
|
|
988
|
+
|
|
989
|
+
class _RobertaQAToZeroShotNerLoader(ExtendedJavaWrapper):
|
|
990
|
+
def __init__(self, path):
|
|
991
|
+
super(_RobertaQAToZeroShotNerLoader, self).__init__(
|
|
992
|
+
"com.johnsnowlabs.nlp.annotators.ner.dl.ZeroShotNerModel.load", path
|
|
993
|
+
)
|
|
994
|
+
|
|
995
|
+
|
|
996
|
+
class _BertZeroShotClassifierLoader(ExtendedJavaWrapper):
|
|
997
|
+
def __init__(self, path, jspark):
|
|
998
|
+
super(_BertZeroShotClassifierLoader, self).__init__(
|
|
999
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForZeroShotClassification.loadSavedModel",
|
|
1000
|
+
path,
|
|
1001
|
+
jspark,
|
|
1002
|
+
)
|
|
1003
|
+
|
|
1004
|
+
|
|
1005
|
+
class _DistilBertForZeroShotClassification(ExtendedJavaWrapper):
|
|
1006
|
+
def __init__(self, path, jspark):
|
|
1007
|
+
super(_DistilBertForZeroShotClassification, self).__init__(
|
|
1008
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForZeroShotClassification.loadSavedModel",
|
|
1009
|
+
path,
|
|
1010
|
+
jspark,
|
|
1011
|
+
)
|
|
1012
|
+
|
|
1013
|
+
|
|
1014
|
+
class _RoBertaForZeroShotClassification(ExtendedJavaWrapper):
|
|
1015
|
+
def __init__(self, path, jspark):
|
|
1016
|
+
super(_RoBertaForZeroShotClassification, self).__init__(
|
|
1017
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForZeroShotClassification.loadSavedModel",
|
|
1018
|
+
path,
|
|
1019
|
+
jspark,
|
|
1020
|
+
)
|
|
1021
|
+
|
|
1022
|
+
|
|
1023
|
+
class _XlmRoBertaForZeroShotClassification(ExtendedJavaWrapper):
|
|
1024
|
+
def __init__(self, path, jspark):
|
|
1025
|
+
super(_XlmRoBertaForZeroShotClassification, self).__init__(
|
|
1026
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForZeroShotClassification.loadSavedModel",
|
|
1027
|
+
path,
|
|
1028
|
+
jspark,
|
|
1029
|
+
)
|
|
1030
|
+
|
|
1031
|
+
|
|
1032
|
+
class _InstructorLoader(ExtendedJavaWrapper):
|
|
1033
|
+
def __init__(self, path, jspark):
|
|
1034
|
+
super(_InstructorLoader, self).__init__(
|
|
1035
|
+
"com.johnsnowlabs.nlp.embeddings.InstructorEmbeddings.loadSavedModel",
|
|
1036
|
+
path,
|
|
1037
|
+
jspark,
|
|
1038
|
+
)
|
|
1039
|
+
|
|
1040
|
+
|
|
1041
|
+
class _BartForZeroShotClassification(ExtendedJavaWrapper):
|
|
1042
|
+
def __init__(self, path, jspark):
|
|
1043
|
+
super(_BartForZeroShotClassification, self).__init__(
|
|
1044
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.BartForZeroShotClassification.loadSavedModel",
|
|
1045
|
+
path,
|
|
1046
|
+
jspark,
|
|
1047
|
+
)
|
|
1048
|
+
|
|
1049
|
+
|
|
1050
|
+
class _CLIPForZeroShotClassification(ExtendedJavaWrapper):
|
|
1051
|
+
def __init__(self, path, jspark):
|
|
1052
|
+
super(_CLIPForZeroShotClassification, self).__init__(
|
|
1053
|
+
"com.johnsnowlabs.nlp.annotators.cv.CLIPForZeroShotClassification.loadSavedModel",
|
|
1054
|
+
path,
|
|
1055
|
+
jspark,
|
|
1056
|
+
)
|
|
1057
|
+
|
|
1058
|
+
|
|
1059
|
+
class _DeBertaForZeroShotClassification(ExtendedJavaWrapper):
|
|
1060
|
+
def __init__(self, path, jspark):
|
|
1061
|
+
super(_DeBertaForZeroShotClassification, self).__init__(
|
|
1062
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForZeroShotClassification.loadSavedModel",
|
|
1063
|
+
path,
|
|
1064
|
+
jspark,
|
|
1065
|
+
)
|
|
1066
|
+
|
|
1067
|
+
|
|
1068
|
+
class _MPNetForSequenceClassificationLoader(ExtendedJavaWrapper):
|
|
1069
|
+
def __init__(self, path, jspark):
|
|
1070
|
+
super(_MPNetForSequenceClassificationLoader, self).__init__(
|
|
1071
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.MPNetForSequenceClassification.loadSavedModel",
|
|
1072
|
+
path,
|
|
1073
|
+
jspark,
|
|
1074
|
+
)
|
|
1075
|
+
|
|
1076
|
+
|
|
1077
|
+
class _MPNetForQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
1078
|
+
def __init__(self, path, jspark):
|
|
1079
|
+
super(_MPNetForQuestionAnsweringLoader, self).__init__(
|
|
1080
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.MPNetForQuestionAnswering.loadSavedModel",
|
|
1081
|
+
path,
|
|
1082
|
+
jspark,
|
|
1083
|
+
)
|
|
1084
|
+
|
|
1085
|
+
|
|
1086
|
+
class _MPNetForTokenClassifierLoader(ExtendedJavaWrapper):
|
|
1087
|
+
def __init__(self, path, jspark):
|
|
1088
|
+
super(_MPNetForTokenClassifierLoader, self).__init__(
|
|
1089
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.MPNetForTokenClassification.loadSavedModel",
|
|
1090
|
+
path,
|
|
1091
|
+
jspark,
|
|
1092
|
+
)
|
|
1093
|
+
|
|
1094
|
+
|
|
1095
|
+
class _UAEEmbeddingsLoader(ExtendedJavaWrapper):
|
|
1096
|
+
def __init__(self, path, jspark):
|
|
1097
|
+
super(_UAEEmbeddingsLoader, self).__init__(
|
|
1098
|
+
"com.johnsnowlabs.nlp.embeddings.UAEEmbeddings.loadSavedModel", path, jspark
|
|
1099
|
+
)
|
|
1100
|
+
|
|
1101
|
+
|
|
1102
|
+
class _AutoGGUFLoader(ExtendedJavaWrapper):
|
|
1103
|
+
def __init__(self, path, jspark):
|
|
1104
|
+
super(_AutoGGUFLoader, self).__init__(
|
|
1105
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.AutoGGUFModel.loadSavedModel", path, jspark)
|
|
1106
|
+
|
|
1107
|
+
|
|
1108
|
+
class _MxbaiEmbeddingsLoader(ExtendedJavaWrapper):
|
|
1109
|
+
def __init__(self, path, jspark):
|
|
1110
|
+
super(_MxbaiEmbeddingsLoader, self).__init__(
|
|
1111
|
+
"com.johnsnowlabs.nlp.embeddings.MxbaiEmbeddings.loadSavedModel", path, jspark
|
|
1112
|
+
)
|
|
1113
|
+
|
|
1114
|
+
|
|
1115
|
+
class _SnowFlakeEmbeddingsLoader(ExtendedJavaWrapper):
|
|
1116
|
+
def __init__(self, path, jspark):
|
|
1117
|
+
super(_SnowFlakeEmbeddingsLoader, self).__init__(
|
|
1118
|
+
"com.johnsnowlabs.nlp.embeddings.SnowFlakeEmbeddings.loadSavedModel", path, jspark
|
|
1119
|
+
)
|
|
1120
|
+
|
|
1121
|
+
|
|
1122
|
+
class _AutoGGUFEmbeddingsLoader(ExtendedJavaWrapper):
|
|
1123
|
+
def __init__(self, path, jspark):
|
|
1124
|
+
super(_AutoGGUFEmbeddingsLoader, self).__init__(
|
|
1125
|
+
"com.johnsnowlabs.nlp.embeddings.AutoGGUFEmbeddings.loadSavedModel", path, jspark)
|
|
1126
|
+
|
|
1127
|
+
|
|
1128
|
+
class _BLIPForQuestionAnswering(ExtendedJavaWrapper):
|
|
1129
|
+
def __init__(self, path, jspark):
|
|
1130
|
+
super(_BLIPForQuestionAnswering, self).__init__(
|
|
1131
|
+
"com.johnsnowlabs.nlp.annotators.cv.BLIPForQuestionAnswering.loadSavedModel",
|
|
1132
|
+
path,
|
|
1133
|
+
jspark,
|
|
1134
|
+
)
|
|
1135
|
+
|
|
1136
|
+
|
|
1137
|
+
class _AutoGGUFVisionLoader(ExtendedJavaWrapper):
|
|
1138
|
+
def __init__(self, modelPath, mmprojPath, jspark):
|
|
1139
|
+
super(_AutoGGUFVisionLoader, self).__init__(
|
|
1140
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.AutoGGUFVisionModel.loadSavedModel", modelPath, mmprojPath, jspark)
|
|
1141
|
+
|
|
1142
|
+
|
|
1143
|
+
class _Qwen2VLTransformerLoader(ExtendedJavaWrapper):
    """Wrapper built around the ``Qwen2VLTransformer.loadSavedModel`` Java method name.

    The fully qualified method name, ``path``, ``jspark`` and ``use_openvino``
    are handed to ``ExtendedJavaWrapper.__init__`` unchanged and in that order.
    ``use_openvino`` defaults to ``False``.
    """

    def __init__(self, path, jspark, use_openvino=False):
        # NOTE(review): `use_openvino` presumably selects the OpenVINO
        # backend on the Java side -- confirm against the Scala API.
        java_method = (
            "com.johnsnowlabs.nlp.annotators.cv.Qwen2VLTransformer.loadSavedModel"
        )
        super(_Qwen2VLTransformerLoader, self).__init__(
            java_method, path, jspark, use_openvino
        )
|
|
1151
|
+
|
|
1152
|
+
class _PaliGemmaForMultiModalLoader(ExtendedJavaWrapper):
    """Wrapper built around the ``PaliGemmaForMultiModal.loadSavedModel`` Java method name.

    The fully qualified method name, ``path``, ``jspark`` and ``use_openvino``
    are handed to ``ExtendedJavaWrapper.__init__`` unchanged and in that order.
    ``use_openvino`` defaults to ``False``.
    """

    def __init__(self, path, jspark, use_openvino=False):
        # NOTE(review): `use_openvino` presumably selects the OpenVINO
        # backend on the Java side -- confirm against the Scala API.
        java_method = (
            "com.johnsnowlabs.nlp.annotators.cv.PaliGemmaForMultiModal.loadSavedModel"
        )
        super(_PaliGemmaForMultiModalLoader, self).__init__(
            java_method, path, jspark, use_openvino
        )
|
|
1160
|
+
|
|
1161
|
+
class _SmolVLMTransformerLoader(ExtendedJavaWrapper):
    """Wrapper built around the ``SmolVLMTransformer.loadSavedModel`` Java method name.

    The fully qualified method name, ``path``, ``jspark`` and ``use_openvino``
    are handed to ``ExtendedJavaWrapper.__init__`` unchanged and in that order.
    ``use_openvino`` defaults to ``False``.
    """

    def __init__(self, path, jspark, use_openvino=False):
        # NOTE(review): `use_openvino` presumably selects the OpenVINO
        # backend on the Java side -- confirm against the Scala API.
        java_method = (
            "com.johnsnowlabs.nlp.annotators.cv.SmolVLMTransformer.loadSavedModel"
        )
        super(_SmolVLMTransformerLoader, self).__init__(
            java_method, path, jspark, use_openvino
        )
|
|
1169
|
+
|
|
1170
|
+
class _Florence2TransformerLoader(ExtendedJavaWrapper):
    """Wrapper built around the ``Florence2Transformer.loadSavedModel`` Java method name.

    The fully qualified method name, ``path``, ``jspark`` and ``use_openvino``
    are handed to ``ExtendedJavaWrapper.__init__`` unchanged and in that order.
    ``use_openvino`` defaults to ``False``.
    """

    def __init__(self, path, jspark, use_openvino=False):
        # NOTE(review): `use_openvino` presumably selects the OpenVINO
        # backend on the Java side -- confirm against the Scala API.
        java_method = (
            "com.johnsnowlabs.nlp.annotators.cv.Florence2Transformer.loadSavedModel"
        )
        super(_Florence2TransformerLoader, self).__init__(
            java_method, path, jspark, use_openvino
        )
|
|
1178
|
+
class _E5VEmbeddingsLoader(ExtendedJavaWrapper):
    """Wrapper built around the ``E5VEmbeddings.loadSavedModel`` Java method name.

    The fully qualified method name, ``path``, ``jspark`` and ``use_openvino``
    are handed to ``ExtendedJavaWrapper.__init__`` unchanged and in that order.
    ``use_openvino`` defaults to ``False``.
    """

    def __init__(self, path, jspark, use_openvino=False):
        # NOTE(review): `use_openvino` presumably selects the OpenVINO
        # backend on the Java side -- confirm against the Scala API.
        java_method = "com.johnsnowlabs.nlp.embeddings.E5VEmbeddings.loadSavedModel"
        super(_E5VEmbeddingsLoader, self).__init__(
            java_method, path, jspark, use_openvino
        )
|
|
1186
|
+
|
|
1187
|
+
class _Phi4Loader(ExtendedJavaWrapper):
    """Wrapper built around the ``Phi4Transformer.loadSavedModel`` Java method name.

    The fully qualified method name, ``path``, ``jspark`` and ``use_openvino``
    are handed to ``ExtendedJavaWrapper.__init__`` unchanged and in that order.
    ``use_openvino`` defaults to ``False``.
    """

    def __init__(self, path, jspark, use_openvino=False):
        # NOTE(review): `use_openvino` presumably selects the OpenVINO
        # backend on the Java side -- confirm against the Scala API.
        java_method = (
            "com.johnsnowlabs.nlp.annotators.seq2seq.Phi4Transformer.loadSavedModel"
        )
        super(_Phi4Loader, self).__init__(java_method, path, jspark, use_openvino)
|
|
1195
|
+
|
|
1196
|
+
class _AutoGGUFRerankerLoader(ExtendedJavaWrapper):
    """Wrapper built around the ``AutoGGUFReranker.loadSavedModel`` Java method name.

    The fully qualified method name, ``path`` and ``jspark`` are handed to
    ``ExtendedJavaWrapper.__init__`` unchanged and in that order.
    """

    def __init__(self, path, jspark):
        # NOTE(review): `path` is presumably the saved-model location and
        # `jspark` the JVM-side Spark session -- confirm against callers.
        java_method = (
            "com.johnsnowlabs.nlp.annotators.seq2seq.AutoGGUFReranker.loadSavedModel"
        )
        super(_AutoGGUFRerankerLoader, self).__init__(java_method, path, jspark)
|