dstklib 2.0.0__tar.gz → 2.0.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (48)
  1. {dstklib-2.0.0 → dstklib-2.0.2}/PKG-INFO +7 -5
  2. {dstklib-2.0.0 → dstklib-2.0.2}/README.md +5 -3
  3. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/models/models.py +0 -1
  4. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/templates/templates.py +0 -6
  5. {dstklib-2.0.0 → dstklib-2.0.2}/dstklib.egg-info/PKG-INFO +7 -5
  6. {dstklib-2.0.0 → dstklib-2.0.2}/setup.py +2 -2
  7. {dstklib-2.0.0 → dstklib-2.0.2}/LICENSE +0 -0
  8. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/__init__.py +0 -0
  9. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/adaptors/__init__.py +0 -0
  10. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/adaptors/adaptors.py +0 -0
  11. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/adaptors/typeguards.py +0 -0
  12. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/hooks/__init__.py +0 -0
  13. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/hooks/hook_tools.py +0 -0
  14. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/hooks/type_conversion.py +0 -0
  15. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/__init__.py +0 -0
  16. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/dstk_types.py +0 -0
  17. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/fasttext_types.py +0 -0
  18. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/gensim_types.py +0 -0
  19. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/numpy_types.py +0 -0
  20. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/pandas_types.py +0 -0
  21. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/plotly_types.py +0 -0
  22. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/sklearn_types.py +0 -0
  23. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/lib_types/spacy_types.py +0 -0
  24. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/method_index.py +0 -0
  25. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/models/__init__.py +0 -0
  26. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/models/model_tools.py +0 -0
  27. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/__init__.py +0 -0
  28. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/count_models.py +0 -0
  29. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/data_visualization/__init__.py +0 -0
  30. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/data_visualization/clustering.py +0 -0
  31. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/data_visualization/embeddings.py +0 -0
  32. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/geometric_distance.py +0 -0
  33. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/ngrams.py +0 -0
  34. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/predict_models.py +0 -0
  35. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/text_matrix_builder.py +0 -0
  36. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/text_processor.py +0 -0
  37. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/tokenizer.py +0 -0
  38. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/modules/weight_matrix.py +0 -0
  39. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/templates/__init__.py +0 -0
  40. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/templates/rules.py +0 -0
  41. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/workflows/__init__.py +0 -0
  42. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/workflows/stage_workflows.py +0 -0
  43. {dstklib-2.0.0 → dstklib-2.0.2}/dstk/workflows/workflow_tools.py +0 -0
  44. {dstklib-2.0.0 → dstklib-2.0.2}/dstklib.egg-info/SOURCES.txt +0 -0
  45. {dstklib-2.0.0 → dstklib-2.0.2}/dstklib.egg-info/dependency_links.txt +0 -0
  46. {dstklib-2.0.0 → dstklib-2.0.2}/dstklib.egg-info/requires.txt +0 -0
  47. {dstklib-2.0.0 → dstklib-2.0.2}/dstklib.egg-info/top_level.txt +0 -0
  48. {dstklib-2.0.0 → dstklib-2.0.2}/setup.cfg +0 -0
@@ -1,7 +1,7 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: dstklib
3
- Version: 2.0.0
4
- Requires-Python: <3.12
3
+ Version: 2.0.2
4
+ Requires-Python: <3.13
5
5
  Description-Content-Type: text/markdown
6
6
  License-File: LICENSE
7
7
  Requires-Dist: spacy
@@ -28,7 +28,7 @@ This library is based on the book *Distributional Semantics* by Alessandro Lenci
28
28
 
29
29
  ## Documentation
30
30
 
31
- You can find the (temporal) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html).
31
+ You can find the (temporary) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html). You can also find a demonstration of how to use it on Google Colab (in Spanish) [here](https://colab.research.google.com/drive/1xN6AzovxQICDpdyFatFeJDIuZcNdCxC3?usp=sharing).
32
32
 
33
33
  ## Installation
34
34
 
@@ -209,6 +209,7 @@ Some common tasks in distributional semantics require the use of more than one m
209
209
 
210
210
  ```python
211
211
  from dstk.workflows.workflow_tools import WorkflowBuilder
212
+ from dstk.workflows.stage_workflows import TextProcessing
212
213
 
213
214
  text = "The quick brown fox jumps over the lazy dog while the sun sets behind the hills."
214
215
  model = "my_spacy_model"
@@ -219,7 +220,7 @@ TextProcessorWorkflow = TextProcessing(
219
220
  "tokenizer": [
220
221
  {"apply_model": {"model": model}},
221
222
  {"get_tokens": {}},
222
- {"remove_stop_words": {"custom_stop_words": stops}},
223
+ {"remove_stop_words": {"custom_stop_words": {}}},
223
224
  ],
224
225
  "ngrams": [
225
226
  {"extract_ngrams": {"window_size": 3}}
@@ -233,8 +234,9 @@ TextProcessorWorkflow = TextProcessing(
233
234
  }
234
235
  )
235
236
 
236
- tokens = TokenizerWorkflow(input_data=text)
237
+ tokens = TextProcessorWorkflow(input_data=text)
237
238
 
239
+ print(tokens)
238
240
 
239
241
  # Output: ['the quick brown', 'quick brown fox', 'brown fox jumps', 'fox jumps over', 'jumps over the', 'over the lazy', 'the lazy dog', 'lazy dog while', 'dog while the', 'while the sun', 'the sun set', 'sun set behind', 'set behind the', 'behind the hills']
240
242
  ```
@@ -12,7 +12,7 @@ This library is based on the book *Distributional Semantics* by Alessandro Lenci
12
12
 
13
13
  ## Documentation
14
14
 
15
- You can find the (temporal) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html).
15
+ You can find the (temporary) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html). You can also find a demonstration of how to use it on Google Colab (in Spanish) [here](https://colab.research.google.com/drive/1xN6AzovxQICDpdyFatFeJDIuZcNdCxC3?usp=sharing).
16
16
 
17
17
  ## Installation
18
18
 
@@ -193,6 +193,7 @@ Some common tasks in distributional semantics require the use of more than one m
193
193
 
194
194
  ```python
195
195
  from dstk.workflows.workflow_tools import WorkflowBuilder
196
+ from dstk.workflows.stage_workflows import TextProcessing
196
197
 
197
198
  text = "The quick brown fox jumps over the lazy dog while the sun sets behind the hills."
198
199
  model = "my_spacy_model"
@@ -203,7 +204,7 @@ TextProcessorWorkflow = TextProcessing(
203
204
  "tokenizer": [
204
205
  {"apply_model": {"model": model}},
205
206
  {"get_tokens": {}},
206
- {"remove_stop_words": {"custom_stop_words": stops}},
207
+ {"remove_stop_words": {"custom_stop_words": {}}},
207
208
  ],
208
209
  "ngrams": [
209
210
  {"extract_ngrams": {"window_size": 3}}
@@ -217,8 +218,9 @@ TextProcessorWorkflow = TextProcessing(
217
218
  }
218
219
  )
219
220
 
220
- tokens = TokenizerWorkflow(input_data=text)
221
+ tokens = TextProcessorWorkflow(input_data=text)
221
222
 
223
+ print(tokens)
222
224
 
223
225
  # Output: ['the quick brown', 'quick brown fox', 'brown fox jumps', 'fox jumps over', 'jumps over the', 'over the lazy', 'the lazy dog', 'lazy dog while', 'dog while the', 'while the sun', 'the sun set', 'sun set behind', 'set behind the', 'behind the hills']
224
226
  ```
@@ -83,7 +83,6 @@ def StandardModel(text: str, model: str | Language, custom_stop_words: list[str]
83
83
  module_name="count_models",
84
84
  template=CountModelsTemplate,
85
85
  workflow=[
86
- {"scale_matrix": {}},
87
86
  {"svd_embeddings": {"n_components": n_components}}
88
87
  ]
89
88
  )
@@ -129,12 +129,6 @@ WeightMatrixTemplate: WorkflowTemplate = {
129
129
  CountModelsTemplate: WorkflowTemplate = {
130
130
  "steps": {
131
131
  0: {
132
- "include": ["scale_matrix"],
133
- "repeat": False,
134
- "chaining": False,
135
- "step_name": "scale_matrix"
136
- },
137
- 1: {
138
132
  "include": "*",
139
133
  "repeat": False,
140
134
  "chaining": False,
@@ -1,7 +1,7 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: dstklib
3
- Version: 2.0.0
4
- Requires-Python: <3.12
3
+ Version: 2.0.2
4
+ Requires-Python: <3.13
5
5
  Description-Content-Type: text/markdown
6
6
  License-File: LICENSE
7
7
  Requires-Dist: spacy
@@ -28,7 +28,7 @@ This library is based on the book *Distributional Semantics* by Alessandro Lenci
28
28
 
29
29
  ## Documentation
30
30
 
31
- You can find the (temporal) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html).
31
+ You can find the (temporary) basic documentation [here](https://distributional-semantics-toolkit-30269b.gitlab.io/index.html). You can also find a demonstration of how to use it on Google Colab (in Spanish) [here](https://colab.research.google.com/drive/1xN6AzovxQICDpdyFatFeJDIuZcNdCxC3?usp=sharing).
32
32
 
33
33
  ## Installation
34
34
 
@@ -209,6 +209,7 @@ Some common tasks in distributional semantics require the use of more than one m
209
209
 
210
210
  ```python
211
211
  from dstk.workflows.workflow_tools import WorkflowBuilder
212
+ from dstk.workflows.stage_workflows import TextProcessing
212
213
 
213
214
  text = "The quick brown fox jumps over the lazy dog while the sun sets behind the hills."
214
215
  model = "my_spacy_model"
@@ -219,7 +220,7 @@ TextProcessorWorkflow = TextProcessing(
219
220
  "tokenizer": [
220
221
  {"apply_model": {"model": model}},
221
222
  {"get_tokens": {}},
222
- {"remove_stop_words": {"custom_stop_words": stops}},
223
+ {"remove_stop_words": {"custom_stop_words": {}}},
223
224
  ],
224
225
  "ngrams": [
225
226
  {"extract_ngrams": {"window_size": 3}}
@@ -233,8 +234,9 @@ TextProcessorWorkflow = TextProcessing(
233
234
  }
234
235
  )
235
236
 
236
- tokens = TokenizerWorkflow(input_data=text)
237
+ tokens = TextProcessorWorkflow(input_data=text)
237
238
 
239
+ print(tokens)
238
240
 
239
241
  # Output: ['the quick brown', 'quick brown fox', 'brown fox jumps', 'fox jumps over', 'jumps over the', 'over the lazy', 'the lazy dog', 'lazy dog while', 'dog while the', 'while the sun', 'the sun set', 'sun set behind', 'set behind the', 'behind the hills']
240
242
  ```
@@ -5,7 +5,7 @@ with open("README.md", "r") as file:
5
5
 
6
6
  setup(
7
7
  name="dstklib",
8
- version="2.0.0",
8
+ version="2.0.2",
9
9
  packages=find_packages(),
10
10
  install_requires=[
11
11
  "spacy",
@@ -18,7 +18,7 @@ setup(
18
18
  "kneed",
19
19
  "umap-learn"
20
20
  ],
21
- python_requires="<3.12",
21
+ python_requires="<3.13",
22
22
  long_description=description,
23
23
  long_description_content_type="text/markdown"
24
24
  )
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes