dstklib 2.0.0__py3-none-any.whl → 2.0.2__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- dstk/models/models.py +0 -1
- dstk/templates/templates.py +0 -6
- {dstklib-2.0.0.dist-info → dstklib-2.0.2.dist-info}/METADATA +7 -5
- {dstklib-2.0.0.dist-info → dstklib-2.0.2.dist-info}/RECORD +7 -7
- {dstklib-2.0.0.dist-info → dstklib-2.0.2.dist-info}/LICENSE +0 -0
- {dstklib-2.0.0.dist-info → dstklib-2.0.2.dist-info}/WHEEL +0 -0
- {dstklib-2.0.0.dist-info → dstklib-2.0.2.dist-info}/top_level.txt +0 -0
dstk/models/models.py
CHANGED
dstk/templates/templates.py
CHANGED
@@ -129,12 +129,6 @@ WeightMatrixTemplate: WorkflowTemplate = {
|
|
129
129
|
CountModelsTemplate: WorkflowTemplate = {
|
130
130
|
"steps": {
|
131
131
|
0: {
|
132
|
-
"include": ["scale_matrix"],
|
133
|
-
"repeat": False,
|
134
|
-
"chaining": False,
|
135
|
-
"step_name": "scale_matrix"
|
136
|
-
},
|
137
|
-
1: {
|
138
132
|
"include": "*",
|
139
133
|
"repeat": False,
|
140
134
|
"chaining": False,
|
@@ -1,7 +1,7 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: dstklib
|
3
|
-
Version: 2.0.0
|
4
|
-
Requires-Python: <3.
|
3
|
+
Version: 2.0.2
|
4
|
+
Requires-Python: <3.13
|
5
5
|
Description-Content-Type: text/markdown
|
6
6
|
License-File: LICENSE
|
7
7
|
Requires-Dist: spacy
|
@@ -28,7 +28,7 @@ This library is based on the book *Distributional Semantics* by Alessandro Lenci
|
|
28
28
|
|
29
29
|
## Documentation
|
30
30
|
|
31
|
-
You can find the (temporary) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html).
|
31
|
+
You can find the (temporary) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html). You can also find a demonstration of how to use it on Google Colab (in Spanish) [here](https://colab.research.google.com/drive/1xN6AzovxQICDpdyFatFeJDIuZcNdCxC3?usp=sharing).
|
32
32
|
|
33
33
|
## Installation
|
34
34
|
|
@@ -209,6 +209,7 @@ Some common tasks in distributional semantics require the use of more than one m
|
|
209
209
|
|
210
210
|
```python
|
211
211
|
from dstk.workflows.workflow_tools import WorkflowBuilder
|
212
|
+
from dstk.workflows.stage_workflows import TextProcessing
|
212
213
|
|
213
214
|
text = "The quick brown fox jumps over the lazy dog while the sun sets behind the hills."
|
214
215
|
model = "my_spacy_model"
|
@@ -219,7 +220,7 @@ TextProcessorWorkflow = TextProcessing(
|
|
219
220
|
"tokenizer": [
|
220
221
|
{"apply_model": {"model": model}},
|
221
222
|
{"get_tokens": {}},
|
222
|
-
{"remove_stop_words": {"custom_stop_words":
|
223
|
+
{"remove_stop_words": {"custom_stop_words": {}}},
|
223
224
|
],
|
224
225
|
"ngrams": [
|
225
226
|
{"extract_ngrams": {"window_size": 3}}
|
@@ -233,8 +234,9 @@ TextProcessorWorkflow = TextProcessing(
|
|
233
234
|
}
|
234
235
|
)
|
235
236
|
|
236
|
-
tokens =
|
237
|
+
tokens = TextProcessorWorkflow(input_data=text)
|
237
238
|
|
239
|
+
print(tokens)
|
238
240
|
|
239
241
|
# Output: ['the quick brown', 'quick brown fox', 'brown fox jumps', 'fox jumps over', 'jumps over the', 'over the lazy', 'the lazy dog', 'lazy dog while', 'dog while the', 'while the sun', 'the sun set', 'sun set behind', 'set behind the', 'behind the hills']
|
240
242
|
```
|
@@ -17,7 +17,7 @@ dstk/lib_types/sklearn_types.py,sha256=W59yIEkZM_E_tW061x1bY-LpRC2aCzLgtYmXANNSN
|
|
17
17
|
dstk/lib_types/spacy_types.py,sha256=hUiaw4AywSW8o42h5lp3t6a4yosG_GasdJX2RCKgW7o,125
|
18
18
|
dstk/models/__init__.py,sha256=27_6lGFl0BAZp3rgXnbazEX_uxK9jQ0lf3RkjomzICA,48
|
19
19
|
dstk/models/model_tools.py,sha256=IYTG4I1oNhnW3JX4bzXxgBa8phhvO7l0haTxeVMeYhM,3279
|
20
|
-
dstk/models/models.py,sha256=
|
20
|
+
dstk/models/models.py,sha256=1O8ZZ7LnjFB1JBD65FFKCRYa_QgQ1nCUeaKm5FLEqt4,8118
|
21
21
|
dstk/modules/__init__.py,sha256=NKI_C2D86x25lUmcM2r6e0M31rV1-8FZBFHRP2oXF2Q,267
|
22
22
|
dstk/modules/count_models.py,sha256=VY8YRao78pmh_3WBX8zWQ94B13J1cSL6Pg91c3qUUyg,4288
|
23
23
|
dstk/modules/geometric_distance.py,sha256=Zj9O0p6glJOqcNGkdjP_qucj_en-QeejbbQ8Hr5oUVM,4621
|
@@ -32,12 +32,12 @@ dstk/modules/data_visualization/clustering.py,sha256=tyUQtFayH7Jh4uisheaeWkIEn9X
|
|
32
32
|
dstk/modules/data_visualization/embeddings.py,sha256=8lPMUB-saog0c3PWiHvuz1sC5YYkqFjn5wCJilnyBfQ,4237
|
33
33
|
dstk/templates/__init__.py,sha256=t7R-RKxq-EZukHV7U9zj7dbIrbxGKTIJyRzh-Tm1PiM,45
|
34
34
|
dstk/templates/rules.py,sha256=Rg8uUBwWlG0b6P-ObnahImb-ZOphMkXB5COWLRQgZSg,1757
|
35
|
-
dstk/templates/templates.py,sha256=
|
35
|
+
dstk/templates/templates.py,sha256=8Hewqdu8a6ILKVnSex_X6ew3rz_Jt5a3IuoN9NNZJWk,6282
|
36
36
|
dstk/workflows/__init__.py,sha256=sP8X_nwRIquC4NHSyUZ5L8DbxZfUCtD8qBekykcBuW8,61
|
37
37
|
dstk/workflows/stage_workflows.py,sha256=LkNRgEHRLmpCNIXJJiUERu45trS3zGv2zC7hcIxUl_s,2639
|
38
38
|
dstk/workflows/workflow_tools.py,sha256=M1wcJ5UGeEKf6TSE0-Z2AA2CetmFUrgCGdV5Z4LvD4Y,16101
|
39
|
-
dstklib-2.0.
|
40
|
-
dstklib-2.0.
|
41
|
-
dstklib-2.0.
|
42
|
-
dstklib-2.0.
|
43
|
-
dstklib-2.0.
|
39
|
+
dstklib-2.0.2.dist-info/LICENSE,sha256=LpSgNPBfwn5F4CVhnTbhpiX2f0YgRMzGWQ7Sphuuwuc,35139
|
40
|
+
dstklib-2.0.2.dist-info/METADATA,sha256=rZU1I5jWni-bqijthZQeW5b08lEGu8jTViQj-RybyJk,13110
|
41
|
+
dstklib-2.0.2.dist-info/WHEEL,sha256=VyG4dJCdJcxE1baiVBm9NET3Nj7Wne1lZZq7UFNxRpg,97
|
42
|
+
dstklib-2.0.2.dist-info/top_level.txt,sha256=b_MNmKso0-ra2M7snsy5fZBW-l9MItjrwMYBd-tiOYo,5
|
43
|
+
dstklib-2.0.2.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|