dstklib 2.0.0__tar.gz → 2.0.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {dstklib-2.0.0 → dstklib-2.0.2}/PKG-INFO +7 -5
- {dstklib-2.0.0 → dstklib-2.0.2}/README.md +5 -3
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/models/models.py +0 -1
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/templates/templates.py +0 -6
- {dstklib-2.0.0 → dstklib-2.0.2}/dstklib.egg-info/PKG-INFO +7 -5
- {dstklib-2.0.0 → dstklib-2.0.2}/setup.py +2 -2
- {dstklib-2.0.0 → dstklib-2.0.2}/LICENSE +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/__init__.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/adaptors/__init__.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/adaptors/adaptors.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/adaptors/typeguards.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/hooks/__init__.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/hooks/hook_tools.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/hooks/type_conversion.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/__init__.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/dstk_types.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/fasttext_types.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/gensim_types.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/numpy_types.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/pandas_types.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/plotly_types.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/sklearn_types.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/spacy_types.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/method_index.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/models/__init__.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/models/model_tools.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/__init__.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/count_models.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/data_visualization/__init__.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/data_visualization/clustering.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/data_visualization/embeddings.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/geometric_distance.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/ngrams.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/predict_models.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/text_matrix_builder.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/text_processor.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/tokenizer.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/weight_matrix.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/templates/__init__.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/templates/rules.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/workflows/__init__.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/workflows/stage_workflows.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstk/workflows/workflow_tools.py +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstklib.egg-info/SOURCES.txt +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstklib.egg-info/dependency_links.txt +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstklib.egg-info/requires.txt +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/dstklib.egg-info/top_level.txt +0 -0
- {dstklib-2.0.0 → dstklib-2.0.2}/setup.cfg +0 -0
@@ -1,7 +1,7 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: dstklib
|
3
|
-
Version: 2.0.0
|
4
|
-
Requires-Python: <3.
|
3
|
+
Version: 2.0.2
|
4
|
+
Requires-Python: <3.13
|
5
5
|
Description-Content-Type: text/markdown
|
6
6
|
License-File: LICENSE
|
7
7
|
Requires-Dist: spacy
|
@@ -28,7 +28,7 @@ This library is based on the book *Distributional Semantics* by Alessandro Lenci
|
|
28
28
|
|
29
29
|
## Documentation
|
30
30
|
|
31
|
-
You can find the (temporal) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html).
|
31
|
+
You can find the (temporary) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html). You can also find a demonstration of how to use it on Google Colab (in Spanish) [here](https://colab.research.google.com/drive/1xN6AzovxQICDpdyFatFeJDIuZcNdCxC3?usp=sharing).
|
32
32
|
|
33
33
|
## Installation
|
34
34
|
|
@@ -209,6 +209,7 @@ Some common tasks in distributional semantics require the use of more than one m
|
|
209
209
|
|
210
210
|
```python
|
211
211
|
from dstk.workflows.workflow_tools import WorkflowBuilder
|
212
|
+
from dstk.workflows.stage_workflows import TextProcessing
|
212
213
|
|
213
214
|
text = "The quick brown fox jumps over the lazy dog while the sun sets behind the hills."
|
214
215
|
model = "my_spacy_model"
|
@@ -219,7 +220,7 @@ TextProcessorWorkflow = TextProcessing(
|
|
219
220
|
"tokenizer": [
|
220
221
|
{"apply_model": {"model": model}},
|
221
222
|
{"get_tokens": {}},
|
222
|
-
{"remove_stop_words": {"custom_stop_words":
|
223
|
+
{"remove_stop_words": {"custom_stop_words": {}}},
|
223
224
|
],
|
224
225
|
"ngrams": [
|
225
226
|
{"extract_ngrams": {"window_size": 3}}
|
@@ -233,8 +234,9 @@ TextProcessorWorkflow = TextProcessing(
|
|
233
234
|
}
|
234
235
|
)
|
235
236
|
|
236
|
-
tokens =
|
237
|
+
tokens = TextProcessorWorkflow(input_data=text)
|
237
238
|
|
239
|
+
print(tokens)
|
238
240
|
|
239
241
|
# Output: ['the quick brown', 'quick brown fox', 'brown fox jumps', 'fox jumps over', 'jumps over the', 'over the lazy', 'the lazy dog', 'lazy dog while', 'dog while the', 'while the sun', 'the sun set', 'sun set behind', 'set behind the', 'behind the hills']
|
240
242
|
```
|
@@ -12,7 +12,7 @@ This library is based on the book *Distributional Semantics* by Alessandro Lenci
|
|
12
12
|
|
13
13
|
## Documentation
|
14
14
|
|
15
|
-
You can find the (temporal) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html).
|
15
|
+
You can find the (temporary) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html). You can also find a demonstration of how to use it on Google Colab (in Spanish) [here](https://colab.research.google.com/drive/1xN6AzovxQICDpdyFatFeJDIuZcNdCxC3?usp=sharing).
|
16
16
|
|
17
17
|
## Installation
|
18
18
|
|
@@ -193,6 +193,7 @@ Some common tasks in distributional semantics require the use of more than one m
|
|
193
193
|
|
194
194
|
```python
|
195
195
|
from dstk.workflows.workflow_tools import WorkflowBuilder
|
196
|
+
from dstk.workflows.stage_workflows import TextProcessing
|
196
197
|
|
197
198
|
text = "The quick brown fox jumps over the lazy dog while the sun sets behind the hills."
|
198
199
|
model = "my_spacy_model"
|
@@ -203,7 +204,7 @@ TextProcessorWorkflow = TextProcessing(
|
|
203
204
|
"tokenizer": [
|
204
205
|
{"apply_model": {"model": model}},
|
205
206
|
{"get_tokens": {}},
|
206
|
-
{"remove_stop_words": {"custom_stop_words":
|
207
|
+
{"remove_stop_words": {"custom_stop_words": {}}},
|
207
208
|
],
|
208
209
|
"ngrams": [
|
209
210
|
{"extract_ngrams": {"window_size": 3}}
|
@@ -217,8 +218,9 @@ TextProcessorWorkflow = TextProcessing(
|
|
217
218
|
}
|
218
219
|
)
|
219
220
|
|
220
|
-
tokens =
|
221
|
+
tokens = TextProcessorWorkflow(input_data=text)
|
221
222
|
|
223
|
+
print(tokens)
|
222
224
|
|
223
225
|
# Output: ['the quick brown', 'quick brown fox', 'brown fox jumps', 'fox jumps over', 'jumps over the', 'over the lazy', 'the lazy dog', 'lazy dog while', 'dog while the', 'while the sun', 'the sun set', 'sun set behind', 'set behind the', 'behind the hills']
|
224
226
|
```
|
@@ -129,12 +129,6 @@ WeightMatrixTemplate: WorkflowTemplate = {
|
|
129
129
|
CountModelsTemplate: WorkflowTemplate = {
|
130
130
|
"steps": {
|
131
131
|
0: {
|
132
|
-
"include": ["scale_matrix"],
|
133
|
-
"repeat": False,
|
134
|
-
"chaining": False,
|
135
|
-
"step_name": "scale_matrix"
|
136
|
-
},
|
137
|
-
1: {
|
138
132
|
"include": "*",
|
139
133
|
"repeat": False,
|
140
134
|
"chaining": False,
|
@@ -1,7 +1,7 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: dstklib
|
3
|
-
Version: 2.0.0
|
4
|
-
Requires-Python: <3.
|
3
|
+
Version: 2.0.2
|
4
|
+
Requires-Python: <3.13
|
5
5
|
Description-Content-Type: text/markdown
|
6
6
|
License-File: LICENSE
|
7
7
|
Requires-Dist: spacy
|
@@ -28,7 +28,7 @@ This library is based on the book *Distributional Semantics* by Alessandro Lenci
|
|
28
28
|
|
29
29
|
## Documentation
|
30
30
|
|
31
|
-
You can find the (temporal) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html).
|
31
|
+
You can find the (temporary) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html). You can also find a demonstration of how to use it on Google Colab (in Spanish) [here](https://colab.research.google.com/drive/1xN6AzovxQICDpdyFatFeJDIuZcNdCxC3?usp=sharing).
|
32
32
|
|
33
33
|
## Installation
|
34
34
|
|
@@ -209,6 +209,7 @@ Some common tasks in distributional semantics require the use of more than one m
|
|
209
209
|
|
210
210
|
```python
|
211
211
|
from dstk.workflows.workflow_tools import WorkflowBuilder
|
212
|
+
from dstk.workflows.stage_workflows import TextProcessing
|
212
213
|
|
213
214
|
text = "The quick brown fox jumps over the lazy dog while the sun sets behind the hills."
|
214
215
|
model = "my_spacy_model"
|
@@ -219,7 +220,7 @@ TextProcessorWorkflow = TextProcessing(
|
|
219
220
|
"tokenizer": [
|
220
221
|
{"apply_model": {"model": model}},
|
221
222
|
{"get_tokens": {}},
|
222
|
-
{"remove_stop_words": {"custom_stop_words":
|
223
|
+
{"remove_stop_words": {"custom_stop_words": {}}},
|
223
224
|
],
|
224
225
|
"ngrams": [
|
225
226
|
{"extract_ngrams": {"window_size": 3}}
|
@@ -233,8 +234,9 @@ TextProcessorWorkflow = TextProcessing(
|
|
233
234
|
}
|
234
235
|
)
|
235
236
|
|
236
|
-
tokens =
|
237
|
+
tokens = TextProcessorWorkflow(input_data=text)
|
237
238
|
|
239
|
+
print(tokens)
|
238
240
|
|
239
241
|
# Output: ['the quick brown', 'quick brown fox', 'brown fox jumps', 'fox jumps over', 'jumps over the', 'over the lazy', 'the lazy dog', 'lazy dog while', 'dog while the', 'while the sun', 'the sun set', 'sun set behind', 'set behind the', 'behind the hills']
|
240
242
|
```
|
@@ -5,7 +5,7 @@ with open("README.md", "r") as file:
|
|
5
5
|
|
6
6
|
setup(
|
7
7
|
name="dstklib",
|
8
|
-
version="2.0.0",
|
8
|
+
version="2.0.2",
|
9
9
|
packages=find_packages(),
|
10
10
|
install_requires=[
|
11
11
|
"spacy",
|
@@ -18,7 +18,7 @@ setup(
|
|
18
18
|
"kneed",
|
19
19
|
"umap-learn"
|
20
20
|
],
|
21
|
-
python_requires="<3.
|
21
|
+
python_requires="<3.13",
|
22
22
|
long_description=description,
|
23
23
|
long_description_content_type="text/markdown"
|
24
24
|
)
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|