spark-nlp 5.3.2__py2.py3-none-any.whl → 5.4.0__py2.py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of spark-nlp might be problematic. Click here for more details.
- com/johnsnowlabs/ml/__init__.py +0 -0
- com/johnsnowlabs/ml/ai/__init__.py +10 -0
- {spark_nlp-5.3.2.dist-info → spark_nlp-5.4.0.dist-info}/METADATA +50 -60
- {spark_nlp-5.3.2.dist-info → spark_nlp-5.4.0.dist-info}/RECORD +28 -22
- sparknlp/__init__.py +3 -2
- sparknlp/annotator/classifier_dl/__init__.py +1 -0
- sparknlp/annotator/classifier_dl/mpnet_for_token_classification.py +173 -0
- sparknlp/annotator/classifier_dl/xlm_roberta_for_token_classification.py +3 -3
- sparknlp/annotator/embeddings/__init__.py +1 -0
- sparknlp/annotator/embeddings/bert_embeddings.py +4 -2
- sparknlp/annotator/embeddings/bert_sentence_embeddings.py +4 -2
- sparknlp/annotator/embeddings/bge_embeddings.py +2 -0
- sparknlp/annotator/embeddings/e5_embeddings.py +6 -2
- sparknlp/annotator/embeddings/mpnet_embeddings.py +2 -0
- sparknlp/annotator/embeddings/roberta_embeddings.py +4 -2
- sparknlp/annotator/embeddings/uae_embeddings.py +211 -0
- sparknlp/annotator/embeddings/xlm_roberta_embeddings.py +4 -2
- sparknlp/annotator/openai/openai_embeddings.py +43 -69
- sparknlp/annotator/seq2seq/__init__.py +2 -0
- sparknlp/annotator/seq2seq/llama2_transformer.py +2 -2
- sparknlp/annotator/seq2seq/m2m100_transformer.py +2 -2
- sparknlp/annotator/seq2seq/mistral_transformer.py +349 -0
- sparknlp/annotator/seq2seq/phi2_transformer.py +326 -0
- sparknlp/internal/__init__.py +443 -148
- sparknlp/pretrained/resource_downloader.py +2 -3
- {spark_nlp-5.3.2.dist-info → spark_nlp-5.4.0.dist-info}/.uuid +0 -0
- {spark_nlp-5.3.2.dist-info → spark_nlp-5.4.0.dist-info}/WHEEL +0 -0
- {spark_nlp-5.3.2.dist-info → spark_nlp-5.4.0.dist-info}/top_level.txt +0 -0
sparknlp/internal/__init__.py
CHANGED
|
@@ -24,296 +24,452 @@ from sparknlp.internal.recursive import *
|
|
|
24
24
|
# Wrapper Definitions
|
|
25
25
|
class _AlbertLoader(ExtendedJavaWrapper):
|
|
26
26
|
def __init__(self, path, jspark):
|
|
27
|
-
super(_AlbertLoader, self).__init__(
|
|
28
|
-
|
|
27
|
+
super(_AlbertLoader, self).__init__(
|
|
28
|
+
"com.johnsnowlabs.nlp.embeddings.AlbertEmbeddings.loadSavedModel",
|
|
29
|
+
path,
|
|
30
|
+
jspark,
|
|
31
|
+
)
|
|
29
32
|
|
|
30
33
|
|
|
31
34
|
class _AlbertSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
32
35
|
def __init__(self, path, jspark):
|
|
33
36
|
super(_AlbertSequenceClassifierLoader, self).__init__(
|
|
34
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForSequenceClassification.loadSavedModel",
|
|
35
|
-
|
|
37
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForSequenceClassification.loadSavedModel",
|
|
38
|
+
path,
|
|
39
|
+
jspark,
|
|
40
|
+
)
|
|
36
41
|
|
|
37
42
|
|
|
38
43
|
class _AlbertTokenClassifierLoader(ExtendedJavaWrapper):
|
|
39
44
|
def __init__(self, path, jspark):
|
|
40
45
|
super(_AlbertTokenClassifierLoader, self).__init__(
|
|
41
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForTokenClassification.loadSavedModel",
|
|
46
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForTokenClassification.loadSavedModel",
|
|
47
|
+
path,
|
|
48
|
+
jspark,
|
|
49
|
+
)
|
|
42
50
|
|
|
43
51
|
|
|
44
52
|
class _AlbertQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
45
53
|
def __init__(self, path, jspark):
|
|
46
54
|
super(_AlbertQuestionAnsweringLoader, self).__init__(
|
|
47
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForQuestionAnswering.loadSavedModel",
|
|
48
|
-
|
|
55
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.AlbertForQuestionAnswering.loadSavedModel",
|
|
56
|
+
path,
|
|
57
|
+
jspark,
|
|
58
|
+
)
|
|
49
59
|
|
|
50
60
|
|
|
51
61
|
class _BertLoader(ExtendedJavaWrapper):
|
|
52
|
-
def __init__(self, path, jspark):
|
|
53
|
-
super(_BertLoader, self).__init__(
|
|
62
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
63
|
+
super(_BertLoader, self).__init__(
|
|
64
|
+
"com.johnsnowlabs.nlp.embeddings.BertEmbeddings.loadSavedModel",
|
|
65
|
+
path,
|
|
66
|
+
jspark,
|
|
67
|
+
use_openvino,
|
|
68
|
+
)
|
|
54
69
|
|
|
55
70
|
|
|
56
71
|
class _BertSentenceLoader(ExtendedJavaWrapper):
|
|
57
|
-
def __init__(self, path, jspark):
|
|
72
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
58
73
|
super(_BertSentenceLoader, self).__init__(
|
|
59
|
-
"com.johnsnowlabs.nlp.embeddings.BertSentenceEmbeddings.loadSavedModel",
|
|
74
|
+
"com.johnsnowlabs.nlp.embeddings.BertSentenceEmbeddings.loadSavedModel",
|
|
75
|
+
path,
|
|
76
|
+
jspark,
|
|
77
|
+
use_openvino,
|
|
78
|
+
)
|
|
60
79
|
|
|
61
80
|
|
|
62
81
|
class _BertSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
63
82
|
def __init__(self, path, jspark):
|
|
64
83
|
super(_BertSequenceClassifierLoader, self).__init__(
|
|
65
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForSequenceClassification.loadSavedModel",
|
|
84
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForSequenceClassification.loadSavedModel",
|
|
85
|
+
path,
|
|
86
|
+
jspark,
|
|
87
|
+
)
|
|
66
88
|
|
|
67
89
|
|
|
68
90
|
class _BertTokenClassifierLoader(ExtendedJavaWrapper):
|
|
69
91
|
def __init__(self, path, jspark):
|
|
70
92
|
super(_BertTokenClassifierLoader, self).__init__(
|
|
71
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForTokenClassification.loadSavedModel",
|
|
93
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForTokenClassification.loadSavedModel",
|
|
94
|
+
path,
|
|
95
|
+
jspark,
|
|
96
|
+
)
|
|
72
97
|
|
|
73
98
|
|
|
74
99
|
class _BertQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
75
100
|
def __init__(self, path, jspark):
|
|
76
101
|
super(_BertQuestionAnsweringLoader, self).__init__(
|
|
77
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForQuestionAnswering.loadSavedModel",
|
|
102
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForQuestionAnswering.loadSavedModel",
|
|
103
|
+
path,
|
|
104
|
+
jspark,
|
|
105
|
+
)
|
|
78
106
|
|
|
79
107
|
|
|
80
108
|
class _DeBERTaLoader(ExtendedJavaWrapper):
|
|
81
109
|
def __init__(self, path, jspark):
|
|
82
110
|
super(_DeBERTaLoader, self).__init__(
|
|
83
|
-
"com.johnsnowlabs.nlp.embeddings.DeBertaEmbeddings.loadSavedModel",
|
|
84
|
-
|
|
111
|
+
"com.johnsnowlabs.nlp.embeddings.DeBertaEmbeddings.loadSavedModel",
|
|
112
|
+
path,
|
|
113
|
+
jspark,
|
|
114
|
+
)
|
|
85
115
|
|
|
86
116
|
|
|
87
117
|
class _DeBertaSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
88
118
|
def __init__(self, path, jspark):
|
|
89
119
|
super(_DeBertaSequenceClassifierLoader, self).__init__(
|
|
90
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForSequenceClassification.loadSavedModel",
|
|
91
|
-
|
|
120
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForSequenceClassification.loadSavedModel",
|
|
121
|
+
path,
|
|
122
|
+
jspark,
|
|
123
|
+
)
|
|
92
124
|
|
|
93
125
|
|
|
94
126
|
class _DeBertTokenClassifierLoader(ExtendedJavaWrapper):
|
|
95
127
|
def __init__(self, path, jspark):
|
|
96
128
|
super(_DeBertTokenClassifierLoader, self).__init__(
|
|
97
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForTokenClassification.loadSavedModel",
|
|
129
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForTokenClassification.loadSavedModel",
|
|
130
|
+
path,
|
|
131
|
+
jspark,
|
|
132
|
+
)
|
|
98
133
|
|
|
99
134
|
|
|
100
135
|
class _DeBertaQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
101
136
|
def __init__(self, path, jspark):
|
|
102
137
|
super(_DeBertaQuestionAnsweringLoader, self).__init__(
|
|
103
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForQuestionAnswering.loadSavedModel",
|
|
104
|
-
|
|
138
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForQuestionAnswering.loadSavedModel",
|
|
139
|
+
path,
|
|
140
|
+
jspark,
|
|
141
|
+
)
|
|
105
142
|
|
|
106
143
|
|
|
107
144
|
class _CamemBertLoader(ExtendedJavaWrapper):
|
|
108
145
|
def __init__(self, path, jspark):
|
|
109
|
-
super(_CamemBertLoader, self).__init__(
|
|
110
|
-
|
|
111
|
-
|
|
146
|
+
super(_CamemBertLoader, self).__init__(
|
|
147
|
+
"com.johnsnowlabs.nlp.embeddings.CamemBertEmbeddings.loadSavedModel",
|
|
148
|
+
path,
|
|
149
|
+
jspark,
|
|
150
|
+
)
|
|
112
151
|
|
|
113
152
|
|
|
114
153
|
class _DistilBertLoader(ExtendedJavaWrapper):
|
|
115
154
|
def __init__(self, path, jspark):
|
|
116
|
-
super(_DistilBertLoader, self).__init__(
|
|
117
|
-
|
|
155
|
+
super(_DistilBertLoader, self).__init__(
|
|
156
|
+
"com.johnsnowlabs.nlp.embeddings.DistilBertEmbeddings.loadSavedModel",
|
|
157
|
+
path,
|
|
158
|
+
jspark,
|
|
159
|
+
)
|
|
118
160
|
|
|
119
161
|
|
|
120
162
|
class _DistilBertSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
121
163
|
def __init__(self, path, jspark):
|
|
122
164
|
super(_DistilBertSequenceClassifierLoader, self).__init__(
|
|
123
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForSequenceClassification.loadSavedModel",
|
|
124
|
-
|
|
165
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForSequenceClassification.loadSavedModel",
|
|
166
|
+
path,
|
|
167
|
+
jspark,
|
|
168
|
+
)
|
|
125
169
|
|
|
126
170
|
|
|
127
171
|
class _DistilBertTokenClassifierLoader(ExtendedJavaWrapper):
|
|
128
172
|
def __init__(self, path, jspark):
|
|
129
173
|
super(_DistilBertTokenClassifierLoader, self).__init__(
|
|
130
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForTokenClassification.loadSavedModel",
|
|
131
|
-
|
|
174
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForTokenClassification.loadSavedModel",
|
|
175
|
+
path,
|
|
176
|
+
jspark,
|
|
177
|
+
)
|
|
132
178
|
|
|
133
179
|
|
|
134
180
|
class _DistilBertQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
135
181
|
def __init__(self, path, jspark):
|
|
136
182
|
super(_DistilBertQuestionAnsweringLoader, self).__init__(
|
|
137
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForQuestionAnswering.loadSavedModel",
|
|
138
|
-
|
|
183
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForQuestionAnswering.loadSavedModel",
|
|
184
|
+
path,
|
|
185
|
+
jspark,
|
|
186
|
+
)
|
|
139
187
|
|
|
140
188
|
|
|
141
189
|
class _ElmoLoader(ExtendedJavaWrapper):
|
|
142
190
|
def __init__(self, path, jspark):
|
|
143
|
-
super(_ElmoLoader, self).__init__(
|
|
191
|
+
super(_ElmoLoader, self).__init__(
|
|
192
|
+
"com.johnsnowlabs.nlp.embeddings.ElmoEmbeddings.loadSavedModel",
|
|
193
|
+
path,
|
|
194
|
+
jspark,
|
|
195
|
+
)
|
|
144
196
|
|
|
145
197
|
|
|
146
198
|
class _E5Loader(ExtendedJavaWrapper):
|
|
147
|
-
def __init__(self, path, jspark):
|
|
148
|
-
super(_E5Loader, self).__init__(
|
|
199
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
200
|
+
super(_E5Loader, self).__init__(
|
|
201
|
+
"com.johnsnowlabs.nlp.embeddings.E5Embeddings.loadSavedModel",
|
|
202
|
+
path,
|
|
203
|
+
jspark,
|
|
204
|
+
use_openvino,
|
|
205
|
+
)
|
|
149
206
|
|
|
150
207
|
|
|
151
208
|
class _BGELoader(ExtendedJavaWrapper):
|
|
152
209
|
def __init__(self, path, jspark):
|
|
153
|
-
super(_BGELoader, self).__init__(
|
|
210
|
+
super(_BGELoader, self).__init__(
|
|
211
|
+
"com.johnsnowlabs.nlp.embeddings.BGEEmbeddings.loadSavedModel", path, jspark
|
|
212
|
+
)
|
|
154
213
|
|
|
155
214
|
|
|
156
215
|
class _GPT2Loader(ExtendedJavaWrapper):
|
|
157
216
|
def __init__(self, path, jspark):
|
|
158
217
|
super(_GPT2Loader, self).__init__(
|
|
159
|
-
"com.johnsnowlabs.nlp.annotators.seq2seq.GPT2Transformer.loadSavedModel",
|
|
218
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.GPT2Transformer.loadSavedModel",
|
|
219
|
+
path,
|
|
220
|
+
jspark,
|
|
221
|
+
)
|
|
222
|
+
|
|
160
223
|
|
|
161
224
|
class _LLAMA2Loader(ExtendedJavaWrapper):
|
|
162
|
-
def __init__(self, path, jspark):
|
|
225
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
163
226
|
super(_LLAMA2Loader, self).__init__(
|
|
164
|
-
"com.johnsnowlabs.nlp.annotators.seq2seq.LLAMA2Transformer.loadSavedModel",
|
|
227
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.LLAMA2Transformer.loadSavedModel",
|
|
228
|
+
path,
|
|
229
|
+
jspark,
|
|
230
|
+
use_openvino,
|
|
231
|
+
)
|
|
232
|
+
|
|
165
233
|
|
|
166
234
|
class _LongformerLoader(ExtendedJavaWrapper):
|
|
167
235
|
def __init__(self, path, jspark):
|
|
168
|
-
super(_LongformerLoader, self).__init__(
|
|
169
|
-
|
|
170
|
-
|
|
236
|
+
super(_LongformerLoader, self).__init__(
|
|
237
|
+
"com.johnsnowlabs.nlp.embeddings.LongformerEmbeddings.loadSavedModel",
|
|
238
|
+
path,
|
|
239
|
+
jspark,
|
|
240
|
+
)
|
|
171
241
|
|
|
172
242
|
|
|
173
243
|
class _LongformerSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
174
244
|
def __init__(self, path, jspark):
|
|
175
245
|
super(_LongformerSequenceClassifierLoader, self).__init__(
|
|
176
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.LongformerForSequenceClassification.loadSavedModel",
|
|
177
|
-
|
|
246
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.LongformerForSequenceClassification.loadSavedModel",
|
|
247
|
+
path,
|
|
248
|
+
jspark,
|
|
249
|
+
)
|
|
178
250
|
|
|
179
251
|
|
|
180
252
|
class _LongformerTokenClassifierLoader(ExtendedJavaWrapper):
|
|
181
253
|
def __init__(self, path, jspark):
|
|
182
254
|
super(_LongformerTokenClassifierLoader, self).__init__(
|
|
183
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.LongformerForTokenClassification.loadSavedModel",
|
|
184
|
-
|
|
255
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.LongformerForTokenClassification.loadSavedModel",
|
|
256
|
+
path,
|
|
257
|
+
jspark,
|
|
258
|
+
)
|
|
185
259
|
|
|
186
260
|
|
|
187
261
|
class _LongformerQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
188
262
|
def __init__(self, path, jspark):
|
|
189
263
|
super(_LongformerQuestionAnsweringLoader, self).__init__(
|
|
190
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.LongformerForQuestionAnswering.loadSavedModel",
|
|
191
|
-
|
|
264
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.LongformerForQuestionAnswering.loadSavedModel",
|
|
265
|
+
path,
|
|
266
|
+
jspark,
|
|
267
|
+
)
|
|
192
268
|
|
|
193
269
|
|
|
194
270
|
class _M2M100Loader(ExtendedJavaWrapper):
|
|
195
|
-
def __init__(self, path, jspark):
|
|
271
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
196
272
|
super(_M2M100Loader, self).__init__(
|
|
197
|
-
"com.johnsnowlabs.nlp.annotators.seq2seq.M2M100Transformer.loadSavedModel",
|
|
273
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.M2M100Transformer.loadSavedModel",
|
|
274
|
+
path,
|
|
275
|
+
jspark,
|
|
276
|
+
)
|
|
277
|
+
|
|
278
|
+
|
|
279
|
+
class _MistralLoader(ExtendedJavaWrapper):
|
|
280
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
281
|
+
super(_MistralLoader, self).__init__(
|
|
282
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.MistralTransformer.loadSavedModel",
|
|
283
|
+
path,
|
|
284
|
+
jspark,
|
|
285
|
+
use_openvino,
|
|
286
|
+
)
|
|
198
287
|
|
|
199
288
|
|
|
200
289
|
class _MarianLoader(ExtendedJavaWrapper):
|
|
201
290
|
def __init__(self, path, jspark):
|
|
202
291
|
super(_MarianLoader, self).__init__(
|
|
203
|
-
"com.johnsnowlabs.nlp.annotators.seq2seq.MarianTransformer.loadSavedModel",
|
|
292
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.MarianTransformer.loadSavedModel",
|
|
293
|
+
path,
|
|
294
|
+
jspark,
|
|
295
|
+
)
|
|
204
296
|
|
|
205
297
|
|
|
206
298
|
class _MPNetLoader(ExtendedJavaWrapper):
|
|
207
299
|
def __init__(self, path, jspark):
|
|
208
300
|
super(_MPNetLoader, self).__init__(
|
|
209
|
-
"com.johnsnowlabs.nlp.embeddings.MPNetEmbeddings.loadSavedModel",
|
|
301
|
+
"com.johnsnowlabs.nlp.embeddings.MPNetEmbeddings.loadSavedModel",
|
|
302
|
+
path,
|
|
303
|
+
jspark,
|
|
304
|
+
)
|
|
305
|
+
|
|
306
|
+
|
|
307
|
+
class _Phi2Loader(ExtendedJavaWrapper):
|
|
308
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
309
|
+
super(_Phi2Loader, self).__init__(
|
|
310
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.Phi2Transformer.loadSavedModel",
|
|
311
|
+
path,
|
|
312
|
+
jspark,
|
|
313
|
+
use_openvino,
|
|
314
|
+
)
|
|
210
315
|
|
|
211
316
|
|
|
212
317
|
class _RoBertaLoader(ExtendedJavaWrapper):
|
|
213
|
-
def __init__(self, path, jspark):
|
|
214
|
-
super(_RoBertaLoader, self).__init__(
|
|
215
|
-
|
|
318
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
319
|
+
super(_RoBertaLoader, self).__init__(
|
|
320
|
+
"com.johnsnowlabs.nlp.embeddings.RoBertaEmbeddings.loadSavedModel",
|
|
321
|
+
path,
|
|
322
|
+
jspark,
|
|
323
|
+
use_openvino,
|
|
324
|
+
)
|
|
216
325
|
|
|
217
326
|
|
|
218
327
|
class _RoBertaSentenceLoader(ExtendedJavaWrapper):
|
|
219
328
|
def __init__(self, path, jspark):
|
|
220
329
|
super(_RoBertaSentenceLoader, self).__init__(
|
|
221
|
-
"com.johnsnowlabs.nlp.embeddings.RoBertaSentenceEmbeddings.loadSavedModel",
|
|
330
|
+
"com.johnsnowlabs.nlp.embeddings.RoBertaSentenceEmbeddings.loadSavedModel",
|
|
331
|
+
path,
|
|
332
|
+
jspark,
|
|
333
|
+
)
|
|
222
334
|
|
|
223
335
|
|
|
224
336
|
class _RoBertaSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
225
337
|
def __init__(self, path, jspark):
|
|
226
338
|
super(_RoBertaSequenceClassifierLoader, self).__init__(
|
|
227
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForSequenceClassification.loadSavedModel",
|
|
228
|
-
|
|
339
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForSequenceClassification.loadSavedModel",
|
|
340
|
+
path,
|
|
341
|
+
jspark,
|
|
342
|
+
)
|
|
229
343
|
|
|
230
344
|
|
|
231
345
|
class _RoBertaTokenClassifierLoader(ExtendedJavaWrapper):
|
|
232
346
|
def __init__(self, path, jspark):
|
|
233
347
|
super(_RoBertaTokenClassifierLoader, self).__init__(
|
|
234
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForTokenClassification.loadSavedModel",
|
|
348
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForTokenClassification.loadSavedModel",
|
|
349
|
+
path,
|
|
350
|
+
jspark,
|
|
351
|
+
)
|
|
235
352
|
|
|
236
353
|
|
|
237
354
|
class _RoBertaQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
238
355
|
def __init__(self, path, jspark):
|
|
239
356
|
super(_RoBertaQuestionAnsweringLoader, self).__init__(
|
|
240
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForQuestionAnswering.loadSavedModel",
|
|
357
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForQuestionAnswering.loadSavedModel",
|
|
358
|
+
path,
|
|
359
|
+
jspark,
|
|
360
|
+
)
|
|
241
361
|
|
|
242
362
|
|
|
243
363
|
class _T5Loader(ExtendedJavaWrapper):
|
|
244
364
|
def __init__(self, path, jspark):
|
|
245
365
|
super(_T5Loader, self).__init__(
|
|
246
|
-
"com.johnsnowlabs.nlp.annotators.seq2seq.T5Transformer.loadSavedModel",
|
|
366
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.T5Transformer.loadSavedModel",
|
|
367
|
+
path,
|
|
368
|
+
jspark,
|
|
369
|
+
)
|
|
247
370
|
|
|
248
371
|
|
|
249
372
|
class _BartLoader(ExtendedJavaWrapper):
|
|
250
373
|
def __init__(self, path, jspark, useCache):
|
|
251
374
|
super(_BartLoader, self).__init__(
|
|
252
|
-
"com.johnsnowlabs.nlp.annotators.seq2seq.BartTransformer.loadSavedModel",
|
|
375
|
+
"com.johnsnowlabs.nlp.annotators.seq2seq.BartTransformer.loadSavedModel",
|
|
376
|
+
path,
|
|
377
|
+
jspark,
|
|
378
|
+
useCache,
|
|
379
|
+
)
|
|
253
380
|
|
|
254
381
|
|
|
255
382
|
class _USELoader(ExtendedJavaWrapper):
|
|
256
383
|
def __init__(self, path, jspark, loadsp):
|
|
257
|
-
super(_USELoader, self).__init__(
|
|
258
|
-
|
|
384
|
+
super(_USELoader, self).__init__(
|
|
385
|
+
"com.johnsnowlabs.nlp.embeddings.UniversalSentenceEncoder.loadSavedModel",
|
|
386
|
+
path,
|
|
387
|
+
jspark,
|
|
388
|
+
loadsp,
|
|
389
|
+
)
|
|
259
390
|
|
|
260
391
|
|
|
261
392
|
class _XlmRoBertaLoader(ExtendedJavaWrapper):
|
|
262
|
-
def __init__(self, path, jspark):
|
|
263
|
-
super(_XlmRoBertaLoader, self).__init__(
|
|
264
|
-
|
|
393
|
+
def __init__(self, path, jspark, use_openvino=False):
|
|
394
|
+
super(_XlmRoBertaLoader, self).__init__(
|
|
395
|
+
"com.johnsnowlabs.nlp.embeddings.XlmRoBertaEmbeddings.loadSavedModel",
|
|
396
|
+
path,
|
|
397
|
+
jspark,
|
|
398
|
+
use_openvino,
|
|
399
|
+
)
|
|
265
400
|
|
|
266
401
|
|
|
267
402
|
class _XlmRoBertaSentenceLoader(ExtendedJavaWrapper):
|
|
268
403
|
def __init__(self, path, jspark):
|
|
269
404
|
super(_XlmRoBertaSentenceLoader, self).__init__(
|
|
270
|
-
"com.johnsnowlabs.nlp.embeddings.XlmRoBertaSentenceEmbeddings.loadSavedModel",
|
|
405
|
+
"com.johnsnowlabs.nlp.embeddings.XlmRoBertaSentenceEmbeddings.loadSavedModel",
|
|
406
|
+
path,
|
|
407
|
+
jspark,
|
|
408
|
+
)
|
|
271
409
|
|
|
272
410
|
|
|
273
411
|
class _XlmRoBertaSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
274
412
|
def __init__(self, path, jspark):
|
|
275
413
|
super(_XlmRoBertaSequenceClassifierLoader, self).__init__(
|
|
276
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForSequenceClassification.loadSavedModel",
|
|
277
|
-
|
|
414
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForSequenceClassification.loadSavedModel",
|
|
415
|
+
path,
|
|
416
|
+
jspark,
|
|
417
|
+
)
|
|
278
418
|
|
|
279
419
|
|
|
280
420
|
class _XlmRoBertaTokenClassifierLoader(ExtendedJavaWrapper):
|
|
281
421
|
def __init__(self, path, jspark):
|
|
282
422
|
super(_XlmRoBertaTokenClassifierLoader, self).__init__(
|
|
283
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForTokenClassification.loadSavedModel",
|
|
284
|
-
|
|
423
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForTokenClassification.loadSavedModel",
|
|
424
|
+
path,
|
|
425
|
+
jspark,
|
|
426
|
+
)
|
|
285
427
|
|
|
286
428
|
|
|
287
429
|
class _XlmRoBertaQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
288
430
|
def __init__(self, path, jspark):
|
|
289
431
|
super(_XlmRoBertaQuestionAnsweringLoader, self).__init__(
|
|
290
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForQuestionAnswering.loadSavedModel",
|
|
291
|
-
|
|
432
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForQuestionAnswering.loadSavedModel",
|
|
433
|
+
path,
|
|
434
|
+
jspark,
|
|
435
|
+
)
|
|
292
436
|
|
|
293
437
|
|
|
294
438
|
class _XlnetLoader(ExtendedJavaWrapper):
|
|
295
439
|
def __init__(self, path, jspark):
|
|
296
|
-
super(_XlnetLoader, self).__init__(
|
|
297
|
-
|
|
440
|
+
super(_XlnetLoader, self).__init__(
|
|
441
|
+
"com.johnsnowlabs.nlp.embeddings.XlnetEmbeddings.loadSavedModel",
|
|
442
|
+
path,
|
|
443
|
+
jspark,
|
|
444
|
+
)
|
|
298
445
|
|
|
299
446
|
|
|
300
447
|
class _XlnetSequenceClassifierLoader(ExtendedJavaWrapper):
|
|
301
448
|
def __init__(self, path, jspark):
|
|
302
449
|
super(_XlnetSequenceClassifierLoader, self).__init__(
|
|
303
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlnetForSequenceClassification.loadSavedModel",
|
|
304
|
-
|
|
450
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlnetForSequenceClassification.loadSavedModel",
|
|
451
|
+
path,
|
|
452
|
+
jspark,
|
|
453
|
+
)
|
|
305
454
|
|
|
306
455
|
|
|
307
456
|
class _XlnetTokenClassifierLoader(ExtendedJavaWrapper):
|
|
308
457
|
def __init__(self, path, jspark):
|
|
309
458
|
super(_XlnetTokenClassifierLoader, self).__init__(
|
|
310
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlnetForTokenClassification.loadSavedModel",
|
|
459
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlnetForTokenClassification.loadSavedModel",
|
|
460
|
+
path,
|
|
461
|
+
jspark,
|
|
462
|
+
)
|
|
311
463
|
|
|
312
464
|
|
|
313
465
|
class _ClearCache(ExtendedJavaWrapper):
|
|
314
466
|
def __init__(self, name, language, remote_loc):
|
|
315
|
-
super(_ClearCache, self).__init__(
|
|
316
|
-
|
|
467
|
+
super(_ClearCache, self).__init__(
|
|
468
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.clearCache",
|
|
469
|
+
name,
|
|
470
|
+
language,
|
|
471
|
+
remote_loc,
|
|
472
|
+
)
|
|
317
473
|
|
|
318
474
|
|
|
319
475
|
class _CoNLLGeneratorExportFromTargetAndPipeline(ExtendedJavaWrapper):
|
|
@@ -325,50 +481,76 @@ class _CoNLLGeneratorExportFromTargetAndPipeline(ExtendedJavaWrapper):
|
|
|
325
481
|
if type(target) == DataFrame:
|
|
326
482
|
super(_CoNLLGeneratorExportFromTargetAndPipeline, self).__init__(
|
|
327
483
|
"com.johnsnowlabs.util.CoNLLGenerator.exportConllFiles",
|
|
328
|
-
target._jdf,
|
|
484
|
+
target._jdf,
|
|
485
|
+
pipeline,
|
|
486
|
+
output_path,
|
|
487
|
+
)
|
|
329
488
|
else:
|
|
330
489
|
super(_CoNLLGeneratorExportFromTargetAndPipeline, self).__init__(
|
|
331
490
|
"com.johnsnowlabs.util.CoNLLGenerator.exportConllFiles",
|
|
332
|
-
spark._jsparkSession,
|
|
491
|
+
spark._jsparkSession,
|
|
492
|
+
target,
|
|
493
|
+
pipeline,
|
|
494
|
+
output_path,
|
|
495
|
+
)
|
|
333
496
|
|
|
334
497
|
|
|
335
498
|
class _CoNLLGeneratorExportFromDataFrameAndField(ExtendedJavaWrapper):
|
|
336
499
|
|
|
337
500
|
def __init__(self, dataframe, output_path, metadata_sentence_key):
|
|
338
501
|
super(_CoNLLGeneratorExportFromDataFrameAndField, self).__init__(
|
|
339
|
-
"com.johnsnowlabs.util.CoNLLGenerator.exportConllFilesFromField",
|
|
340
|
-
|
|
502
|
+
"com.johnsnowlabs.util.CoNLLGenerator.exportConllFilesFromField",
|
|
503
|
+
dataframe,
|
|
504
|
+
output_path,
|
|
505
|
+
metadata_sentence_key,
|
|
506
|
+
)
|
|
341
507
|
|
|
342
508
|
|
|
343
509
|
class _CoNLLGeneratorExportFromDataFrame(ExtendedJavaWrapper):
|
|
344
510
|
def __init__(self, dataframe, output_path):
|
|
345
511
|
super(_CoNLLGeneratorExportFromDataFrame, self).__init__(
|
|
346
512
|
"com.johnsnowlabs.util.CoNLLGenerator.exportConllFiles",
|
|
347
|
-
dataframe,
|
|
513
|
+
dataframe,
|
|
514
|
+
output_path,
|
|
515
|
+
)
|
|
348
516
|
|
|
349
517
|
|
|
350
518
|
class _CoverageResult(ExtendedJavaWrapper):
|
|
351
519
|
def __init__(self, covered, total, percentage):
|
|
352
|
-
super(_CoverageResult, self).__init__(
|
|
353
|
-
|
|
520
|
+
super(_CoverageResult, self).__init__(
|
|
521
|
+
"com.johnsnowlabs.nlp.embeddings.CoverageResult", covered, total, percentage
|
|
522
|
+
)
|
|
354
523
|
|
|
355
524
|
|
|
356
525
|
class _DownloadModelDirectly(ExtendedJavaWrapper):
|
|
357
526
|
def __init__(self, name, remote_loc="public/models", unzip=True):
|
|
358
527
|
super(_DownloadModelDirectly, self).__init__(
|
|
359
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.downloadModelDirectly",
|
|
528
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.downloadModelDirectly",
|
|
529
|
+
name,
|
|
530
|
+
remote_loc,
|
|
531
|
+
unzip,
|
|
532
|
+
)
|
|
360
533
|
|
|
361
534
|
|
|
362
535
|
class _DownloadModel(ExtendedJavaWrapper):
|
|
363
536
|
def __init__(self, reader, name, language, remote_loc, validator):
|
|
364
|
-
super(_DownloadModel, self).__init__(
|
|
365
|
-
|
|
537
|
+
super(_DownloadModel, self).__init__(
|
|
538
|
+
"com.johnsnowlabs.nlp.pretrained." + validator + ".downloadModel",
|
|
539
|
+
reader,
|
|
540
|
+
name,
|
|
541
|
+
language,
|
|
542
|
+
remote_loc,
|
|
543
|
+
)
|
|
366
544
|
|
|
367
545
|
|
|
368
546
|
class _DownloadPipeline(ExtendedJavaWrapper):
|
|
369
547
|
def __init__(self, name, language, remote_loc):
|
|
370
548
|
super(_DownloadPipeline, self).__init__(
|
|
371
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.downloadPipeline",
|
|
549
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.downloadPipeline",
|
|
550
|
+
name,
|
|
551
|
+
language,
|
|
552
|
+
remote_loc,
|
|
553
|
+
)
|
|
372
554
|
|
|
373
555
|
|
|
374
556
|
class _DownloadPredefinedPipeline(ExtendedJavaWrapper):
|
|
@@ -379,146 +561,215 @@ class _DownloadPredefinedPipeline(ExtendedJavaWrapper):
|
|
|
379
561
|
class _EmbeddingsCoverageColumn(ExtendedJavaWrapper):
|
|
380
562
|
def __init__(self, dataset, embeddings_col, output_col):
|
|
381
563
|
super(_EmbeddingsCoverageColumn, self).__init__(
|
|
382
|
-
"com.johnsnowlabs.nlp.embeddings.WordEmbeddingsModel.withCoverageColumn",
|
|
383
|
-
|
|
564
|
+
"com.johnsnowlabs.nlp.embeddings.WordEmbeddingsModel.withCoverageColumn",
|
|
565
|
+
dataset._jdf,
|
|
566
|
+
embeddings_col,
|
|
567
|
+
output_col,
|
|
568
|
+
)
|
|
384
569
|
|
|
385
570
|
|
|
386
571
|
class _EmbeddingsOverallCoverage(ExtendedJavaWrapper):
|
|
387
572
|
def __init__(self, dataset, embeddings_col):
|
|
388
573
|
super(_EmbeddingsOverallCoverage, self).__init__(
|
|
389
|
-
"com.johnsnowlabs.nlp.embeddings.WordEmbeddingsModel.overallCoverage",
|
|
574
|
+
"com.johnsnowlabs.nlp.embeddings.WordEmbeddingsModel.overallCoverage",
|
|
575
|
+
dataset._jdf,
|
|
576
|
+
embeddings_col,
|
|
577
|
+
)
|
|
390
578
|
|
|
391
579
|
|
|
392
580
|
class _ExternalResource(ExtendedJavaWrapper):
|
|
393
581
|
def __init__(self, path, read_as, options):
|
|
394
|
-
super(_ExternalResource, self).__init__(
|
|
395
|
-
|
|
582
|
+
super(_ExternalResource, self).__init__(
|
|
583
|
+
"com.johnsnowlabs.nlp.util.io.ExternalResource.fromJava",
|
|
584
|
+
path,
|
|
585
|
+
read_as,
|
|
586
|
+
options,
|
|
587
|
+
)
|
|
396
588
|
|
|
397
589
|
|
|
398
590
|
class _ConfigLoaderGetter(ExtendedJavaWrapper):
|
|
399
591
|
def __init__(self):
|
|
400
|
-
super(_ConfigLoaderGetter, self).__init__(
|
|
592
|
+
super(_ConfigLoaderGetter, self).__init__(
|
|
593
|
+
"com.johnsnowlabs.util.ConfigLoader.getConfigPath"
|
|
594
|
+
)
|
|
401
595
|
|
|
402
596
|
|
|
403
597
|
class _GetResourceSize(ExtendedJavaWrapper):
|
|
404
598
|
def __init__(self, name, language, remote_loc):
|
|
405
599
|
super(_GetResourceSize, self).__init__(
|
|
406
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.getDownloadSize",
|
|
600
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.getDownloadSize",
|
|
601
|
+
name,
|
|
602
|
+
language,
|
|
603
|
+
remote_loc,
|
|
604
|
+
)
|
|
407
605
|
|
|
408
606
|
|
|
409
607
|
class _LightPipeline(ExtendedJavaWrapper):
|
|
410
608
|
def __init__(self, pipelineModel, parse_embeddings):
|
|
411
|
-
super(_LightPipeline, self).__init__(
|
|
412
|
-
|
|
609
|
+
super(_LightPipeline, self).__init__(
|
|
610
|
+
"com.johnsnowlabs.nlp.LightPipeline",
|
|
611
|
+
pipelineModel._to_java(),
|
|
612
|
+
parse_embeddings,
|
|
613
|
+
)
|
|
413
614
|
|
|
414
615
|
|
|
415
616
|
class _RegexRule(ExtendedJavaWrapper):
|
|
416
617
|
def __init__(self, rule, identifier):
|
|
417
|
-
super(_RegexRule, self).__init__(
|
|
618
|
+
super(_RegexRule, self).__init__(
|
|
619
|
+
"com.johnsnowlabs.nlp.util.regex.RegexRule", rule, identifier
|
|
620
|
+
)
|
|
418
621
|
|
|
419
622
|
|
|
420
623
|
class _ShowAvailableAnnotators(ExtendedJavaWrapper):
|
|
421
624
|
def __init__(self):
|
|
422
625
|
super(_ShowAvailableAnnotators, self).__init__(
|
|
423
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showAvailableAnnotators"
|
|
626
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showAvailableAnnotators"
|
|
627
|
+
)
|
|
424
628
|
|
|
425
629
|
|
|
426
630
|
class _ShowPublicModels(ExtendedJavaWrapper):
|
|
427
631
|
def __init__(self, annotator, lang, version):
|
|
428
632
|
super(_ShowPublicModels, self).__init__(
|
|
429
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showPublicModels",
|
|
633
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showPublicModels",
|
|
634
|
+
annotator,
|
|
635
|
+
lang,
|
|
636
|
+
version,
|
|
637
|
+
)
|
|
430
638
|
|
|
431
639
|
|
|
432
640
|
class _ShowPublicPipelines(ExtendedJavaWrapper):
|
|
433
641
|
def __init__(self, lang, version):
|
|
434
642
|
super(_ShowPublicPipelines, self).__init__(
|
|
435
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showPublicPipelines",
|
|
643
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showPublicPipelines",
|
|
644
|
+
lang,
|
|
645
|
+
version,
|
|
646
|
+
)
|
|
436
647
|
|
|
437
648
|
|
|
438
649
|
class _ShowUnCategorizedResources(ExtendedJavaWrapper):
|
|
439
650
|
def __init__(self):
|
|
440
651
|
super(_ShowUnCategorizedResources, self).__init__(
|
|
441
|
-
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showUnCategorizedResources"
|
|
652
|
+
"com.johnsnowlabs.nlp.pretrained.PythonResourceDownloader.showUnCategorizedResources"
|
|
653
|
+
)
|
|
442
654
|
|
|
443
655
|
|
|
444
656
|
class _StorageHelper(ExtendedJavaWrapper):
|
|
445
657
|
def __init__(self, path, spark, database, storage_ref, within_storage):
|
|
446
|
-
super(_StorageHelper, self).__init__(
|
|
447
|
-
|
|
658
|
+
super(_StorageHelper, self).__init__(
|
|
659
|
+
"com.johnsnowlabs.storage.StorageHelper.load",
|
|
660
|
+
path,
|
|
661
|
+
spark._jsparkSession,
|
|
662
|
+
database,
|
|
663
|
+
storage_ref,
|
|
664
|
+
within_storage,
|
|
665
|
+
)
|
|
448
666
|
|
|
449
667
|
|
|
450
668
|
class _SpanBertCorefLoader(ExtendedJavaWrapper):
|
|
451
669
|
def __init__(self, path, jspark):
|
|
452
670
|
super(_SpanBertCorefLoader, self).__init__(
|
|
453
|
-
"com.johnsnowlabs.nlp.annotators.coref.SpanBertCorefModel.loadSavedModel",
|
|
671
|
+
"com.johnsnowlabs.nlp.annotators.coref.SpanBertCorefModel.loadSavedModel",
|
|
672
|
+
path,
|
|
673
|
+
jspark,
|
|
674
|
+
)
|
|
454
675
|
|
|
455
676
|
|
|
456
677
|
class _NerDLGraphBuilder(ExtendedJavaWrapper):
|
|
457
678
|
def __init__(self, dataset, input_col, label_col):
|
|
458
679
|
super(_NerDLGraphBuilder, self).__init__(
|
|
459
680
|
"com.johnsnowlabs.nlp.annotators.ner.dl.NerDLApproach.getGraphParams",
|
|
460
|
-
dataset,
|
|
681
|
+
dataset,
|
|
682
|
+
input_col,
|
|
683
|
+
label_col,
|
|
684
|
+
)
|
|
461
685
|
|
|
462
686
|
|
|
463
687
|
class _ResourceHelper_moveFile(ExtendedJavaWrapper):
|
|
464
688
|
def __init__(self, local_file, hdfs_file):
|
|
465
689
|
super(_ResourceHelper_moveFile, self).__init__(
|
|
466
|
-
"com.johnsnowlabs.nlp.util.io.ResourceHelper.moveFile",
|
|
690
|
+
"com.johnsnowlabs.nlp.util.io.ResourceHelper.moveFile",
|
|
691
|
+
local_file,
|
|
692
|
+
hdfs_file,
|
|
693
|
+
)
|
|
467
694
|
|
|
468
695
|
|
|
469
696
|
class _ResourceHelper_validFile(ExtendedJavaWrapper):
|
|
470
697
|
def __init__(self, path):
|
|
471
698
|
super(_ResourceHelper_validFile, self).__init__(
|
|
472
|
-
"com.johnsnowlabs.nlp.util.io.ResourceHelper.validFile", path
|
|
699
|
+
"com.johnsnowlabs.nlp.util.io.ResourceHelper.validFile", path
|
|
700
|
+
)
|
|
473
701
|
|
|
474
702
|
|
|
475
703
|
class _ViTForImageClassification(ExtendedJavaWrapper):
|
|
476
704
|
def __init__(self, path, jspark):
|
|
477
705
|
super(_ViTForImageClassification, self).__init__(
|
|
478
|
-
"com.johnsnowlabs.nlp.annotators.cv.ViTForImageClassification.loadSavedModel",
|
|
706
|
+
"com.johnsnowlabs.nlp.annotators.cv.ViTForImageClassification.loadSavedModel",
|
|
707
|
+
path,
|
|
708
|
+
jspark,
|
|
709
|
+
)
|
|
479
710
|
|
|
480
711
|
|
|
481
712
|
class _VisionEncoderDecoderForImageCaptioning(ExtendedJavaWrapper):
|
|
482
713
|
def __init__(self, path, jspark):
|
|
483
714
|
super(_VisionEncoderDecoderForImageCaptioning, self).__init__(
|
|
484
|
-
"com.johnsnowlabs.nlp.annotators.cv.VisionEncoderDecoderForImageCaptioning.loadSavedModel",
|
|
715
|
+
"com.johnsnowlabs.nlp.annotators.cv.VisionEncoderDecoderForImageCaptioning.loadSavedModel",
|
|
716
|
+
path,
|
|
717
|
+
jspark,
|
|
718
|
+
)
|
|
485
719
|
|
|
486
720
|
|
|
487
721
|
class _SwinForImageClassification(ExtendedJavaWrapper):
|
|
488
722
|
def __init__(self, path, jspark):
|
|
489
723
|
super(_SwinForImageClassification, self).__init__(
|
|
490
|
-
"com.johnsnowlabs.nlp.annotators.cv.SwinForImageClassification.loadSavedModel",
|
|
724
|
+
"com.johnsnowlabs.nlp.annotators.cv.SwinForImageClassification.loadSavedModel",
|
|
725
|
+
path,
|
|
726
|
+
jspark,
|
|
727
|
+
)
|
|
491
728
|
|
|
492
729
|
|
|
493
730
|
class _ConvNextForImageClassification(ExtendedJavaWrapper):
|
|
494
731
|
def __init__(self, path, jspark):
|
|
495
732
|
super(_ConvNextForImageClassification, self).__init__(
|
|
496
|
-
"com.johnsnowlabs.nlp.annotators.cv.ConvNextForImageClassification.loadSavedModel",
|
|
733
|
+
"com.johnsnowlabs.nlp.annotators.cv.ConvNextForImageClassification.loadSavedModel",
|
|
734
|
+
path,
|
|
735
|
+
jspark,
|
|
736
|
+
)
|
|
497
737
|
|
|
498
738
|
|
|
499
739
|
class _Wav2Vec2ForCTC(ExtendedJavaWrapper):
|
|
500
740
|
def __init__(self, path, jspark):
|
|
501
741
|
super(_Wav2Vec2ForCTC, self).__init__(
|
|
502
|
-
"com.johnsnowlabs.nlp.annotators.audio.Wav2Vec2ForCTC.loadSavedModel",
|
|
742
|
+
"com.johnsnowlabs.nlp.annotators.audio.Wav2Vec2ForCTC.loadSavedModel",
|
|
743
|
+
path,
|
|
744
|
+
jspark,
|
|
745
|
+
)
|
|
503
746
|
|
|
504
747
|
|
|
505
748
|
class _HubertForCTC(ExtendedJavaWrapper):
|
|
506
749
|
def __init__(self, path, jspark):
|
|
507
750
|
super(_HubertForCTC, self).__init__(
|
|
508
|
-
"com.johnsnowlabs.nlp.annotators.audio.HubertForCTC.loadSavedModel",
|
|
751
|
+
"com.johnsnowlabs.nlp.annotators.audio.HubertForCTC.loadSavedModel",
|
|
752
|
+
path,
|
|
753
|
+
jspark,
|
|
754
|
+
)
|
|
509
755
|
|
|
510
756
|
|
|
511
757
|
class _WhisperForCTC(ExtendedJavaWrapper):
|
|
512
758
|
def __init__(self, path, jspark):
|
|
513
759
|
super(_WhisperForCTC, self).__init__(
|
|
514
|
-
"com.johnsnowlabs.nlp.annotators.audio.WhisperForCTC.loadSavedModel",
|
|
760
|
+
"com.johnsnowlabs.nlp.annotators.audio.WhisperForCTC.loadSavedModel",
|
|
761
|
+
path,
|
|
762
|
+
jspark,
|
|
763
|
+
)
|
|
515
764
|
|
|
516
765
|
|
|
517
766
|
class _CamemBertForTokenClassificationLoader(ExtendedJavaWrapper):
|
|
518
767
|
def __init__(self, path, jspark):
|
|
519
768
|
super(_CamemBertForTokenClassificationLoader, self).__init__(
|
|
520
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.CamemBertForTokenClassification.loadSavedModel",
|
|
521
|
-
|
|
769
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.CamemBertForTokenClassification.loadSavedModel",
|
|
770
|
+
path,
|
|
771
|
+
jspark,
|
|
772
|
+
)
|
|
522
773
|
|
|
523
774
|
|
|
524
775
|
class _TapasForQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
@@ -526,92 +777,136 @@ class _TapasForQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
|
526
777
|
super(_TapasForQuestionAnsweringLoader, self).__init__(
|
|
527
778
|
"com.johnsnowlabs.nlp.annotators.classifier.dl.TapasForQuestionAnswering.loadSavedModel",
|
|
528
779
|
path,
|
|
529
|
-
jspark
|
|
780
|
+
jspark,
|
|
781
|
+
)
|
|
530
782
|
|
|
531
783
|
|
|
532
784
|
class _CamemBertForSequenceClassificationLoader(ExtendedJavaWrapper):
|
|
533
785
|
def __init__(self, path, jspark):
|
|
534
786
|
super(_CamemBertForSequenceClassificationLoader, self).__init__(
|
|
535
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.CamemBertForSequenceClassification.loadSavedModel",
|
|
536
|
-
|
|
787
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.CamemBertForSequenceClassification.loadSavedModel",
|
|
788
|
+
path,
|
|
789
|
+
jspark,
|
|
790
|
+
)
|
|
537
791
|
|
|
538
792
|
|
|
539
793
|
class _CamemBertQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
540
794
|
def __init__(self, path, jspark):
|
|
541
795
|
super(_CamemBertQuestionAnsweringLoader, self).__init__(
|
|
542
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.CamemBertForQuestionAnswering.loadSavedModel",
|
|
543
|
-
|
|
796
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.CamemBertForQuestionAnswering.loadSavedModel",
|
|
797
|
+
path,
|
|
798
|
+
jspark,
|
|
799
|
+
)
|
|
544
800
|
|
|
545
801
|
|
|
546
802
|
class _RobertaQAToZeroShotNerLoader(ExtendedJavaWrapper):
|
|
547
803
|
def __init__(self, path):
|
|
548
804
|
super(_RobertaQAToZeroShotNerLoader, self).__init__(
|
|
549
|
-
"com.johnsnowlabs.nlp.annotators.ner.dl.ZeroShotNerModel.load", path
|
|
805
|
+
"com.johnsnowlabs.nlp.annotators.ner.dl.ZeroShotNerModel.load", path
|
|
806
|
+
)
|
|
550
807
|
|
|
551
808
|
|
|
552
809
|
class _BertZeroShotClassifierLoader(ExtendedJavaWrapper):
|
|
553
810
|
def __init__(self, path, jspark):
|
|
554
811
|
super(_BertZeroShotClassifierLoader, self).__init__(
|
|
555
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForZeroShotClassification.loadSavedModel",
|
|
812
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.BertForZeroShotClassification.loadSavedModel",
|
|
813
|
+
path,
|
|
814
|
+
jspark,
|
|
815
|
+
)
|
|
556
816
|
|
|
557
817
|
|
|
558
818
|
class _DistilBertForZeroShotClassification(ExtendedJavaWrapper):
|
|
559
819
|
def __init__(self, path, jspark):
|
|
560
820
|
super(_DistilBertForZeroShotClassification, self).__init__(
|
|
561
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForZeroShotClassification.loadSavedModel",
|
|
562
|
-
|
|
821
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DistilBertForZeroShotClassification.loadSavedModel",
|
|
822
|
+
path,
|
|
823
|
+
jspark,
|
|
824
|
+
)
|
|
563
825
|
|
|
564
826
|
|
|
565
827
|
class _RoBertaForZeroShotClassification(ExtendedJavaWrapper):
|
|
566
828
|
def __init__(self, path, jspark):
|
|
567
829
|
super(_RoBertaForZeroShotClassification, self).__init__(
|
|
568
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForZeroShotClassification.loadSavedModel",
|
|
569
|
-
|
|
830
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.RoBertaForZeroShotClassification.loadSavedModel",
|
|
831
|
+
path,
|
|
832
|
+
jspark,
|
|
833
|
+
)
|
|
570
834
|
|
|
571
835
|
|
|
572
836
|
class _XlmRoBertaForZeroShotClassification(ExtendedJavaWrapper):
|
|
573
837
|
def __init__(self, path, jspark):
|
|
574
838
|
super(_XlmRoBertaForZeroShotClassification, self).__init__(
|
|
575
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForZeroShotClassification.loadSavedModel",
|
|
576
|
-
|
|
839
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.XlmRoBertaForZeroShotClassification.loadSavedModel",
|
|
840
|
+
path,
|
|
841
|
+
jspark,
|
|
842
|
+
)
|
|
577
843
|
|
|
578
844
|
|
|
579
845
|
class _InstructorLoader(ExtendedJavaWrapper):
|
|
580
846
|
def __init__(self, path, jspark):
|
|
581
|
-
super(_InstructorLoader, self).__init__(
|
|
582
|
-
|
|
847
|
+
super(_InstructorLoader, self).__init__(
|
|
848
|
+
"com.johnsnowlabs.nlp.embeddings.InstructorEmbeddings.loadSavedModel",
|
|
849
|
+
path,
|
|
850
|
+
jspark,
|
|
851
|
+
)
|
|
583
852
|
|
|
584
853
|
|
|
585
854
|
class _BartForZeroShotClassification(ExtendedJavaWrapper):
|
|
586
855
|
def __init__(self, path, jspark):
|
|
587
856
|
super(_BartForZeroShotClassification, self).__init__(
|
|
588
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.BartForZeroShotClassification.loadSavedModel",
|
|
589
|
-
|
|
857
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.BartForZeroShotClassification.loadSavedModel",
|
|
858
|
+
path,
|
|
859
|
+
jspark,
|
|
860
|
+
)
|
|
590
861
|
|
|
591
862
|
|
|
592
863
|
class _CLIPForZeroShotClassification(ExtendedJavaWrapper):
|
|
593
864
|
def __init__(self, path, jspark):
|
|
594
865
|
super(_CLIPForZeroShotClassification, self).__init__(
|
|
595
|
-
"com.johnsnowlabs.nlp.annotators.cv.CLIPForZeroShotClassification.loadSavedModel",
|
|
596
|
-
|
|
866
|
+
"com.johnsnowlabs.nlp.annotators.cv.CLIPForZeroShotClassification.loadSavedModel",
|
|
867
|
+
path,
|
|
868
|
+
jspark,
|
|
869
|
+
)
|
|
597
870
|
|
|
598
871
|
|
|
599
872
|
class _DeBertaForZeroShotClassification(ExtendedJavaWrapper):
|
|
600
873
|
def __init__(self, path, jspark):
|
|
601
874
|
super(_DeBertaForZeroShotClassification, self).__init__(
|
|
602
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForZeroShotClassification.loadSavedModel",
|
|
603
|
-
|
|
604
|
-
|
|
605
|
-
|
|
875
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.DeBertaForZeroShotClassification.loadSavedModel",
|
|
876
|
+
path,
|
|
877
|
+
jspark,
|
|
878
|
+
)
|
|
879
|
+
|
|
880
|
+
|
|
606
881
|
class _MPNetForSequenceClassificationLoader(ExtendedJavaWrapper):
|
|
607
882
|
def __init__(self, path, jspark):
|
|
608
883
|
super(_MPNetForSequenceClassificationLoader, self).__init__(
|
|
609
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.MPNetForSequenceClassification.loadSavedModel",
|
|
610
|
-
|
|
884
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.MPNetForSequenceClassification.loadSavedModel",
|
|
885
|
+
path,
|
|
886
|
+
jspark,
|
|
887
|
+
)
|
|
611
888
|
|
|
612
889
|
|
|
613
890
|
class _MPNetForQuestionAnsweringLoader(ExtendedJavaWrapper):
|
|
614
891
|
def __init__(self, path, jspark):
|
|
615
892
|
super(_MPNetForQuestionAnsweringLoader, self).__init__(
|
|
616
|
-
"com.johnsnowlabs.nlp.annotators.classifier.dl.MPNetForQuestionAnswering.loadSavedModel",
|
|
617
|
-
|
|
893
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.MPNetForQuestionAnswering.loadSavedModel",
|
|
894
|
+
path,
|
|
895
|
+
jspark,
|
|
896
|
+
)
|
|
897
|
+
|
|
898
|
+
|
|
899
|
+
class _MPNetForTokenClassifierLoader(ExtendedJavaWrapper):
|
|
900
|
+
def __init__(self, path, jspark):
|
|
901
|
+
super(_MPNetForTokenClassifierLoader, self).__init__(
|
|
902
|
+
"com.johnsnowlabs.nlp.annotators.classifier.dl.MPNetForTokenClassification.loadSavedModel",
|
|
903
|
+
path,
|
|
904
|
+
jspark,
|
|
905
|
+
)
|
|
906
|
+
|
|
907
|
+
|
|
908
|
+
class _UAEEmbeddingsLoader(ExtendedJavaWrapper):
|
|
909
|
+
def __init__(self, path, jspark):
|
|
910
|
+
super(_UAEEmbeddingsLoader, self).__init__(
|
|
911
|
+
"com.johnsnowlabs.nlp.embeddings.UAEEmbeddings.loadSavedModel", path, jspark
|
|
912
|
+
)
|