teradataml 20.0.0.4__py3-none-any.whl → 20.0.0.5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of teradataml might be problematic. Click here for more details.
- teradataml/LICENSE-3RD-PARTY.pdf +0 -0
- teradataml/README.md +86 -13
- teradataml/__init__.py +2 -1
- teradataml/_version.py +2 -2
- teradataml/analytics/analytic_function_executor.py +7 -12
- teradataml/analytics/json_parser/analytic_functions_argument.py +4 -0
- teradataml/analytics/sqle/__init__.py +16 -1
- teradataml/analytics/utils.py +15 -1
- teradataml/automl/__init__.py +290 -106
- teradataml/automl/autodataprep/__init__.py +471 -0
- teradataml/automl/data_preparation.py +29 -10
- teradataml/automl/data_transformation.py +11 -0
- teradataml/automl/feature_engineering.py +64 -4
- teradataml/automl/feature_exploration.py +639 -25
- teradataml/automl/model_training.py +1 -1
- teradataml/clients/auth_client.py +2 -2
- teradataml/common/constants.py +61 -26
- teradataml/common/messagecodes.py +2 -1
- teradataml/common/messages.py +5 -4
- teradataml/common/utils.py +255 -37
- teradataml/context/context.py +225 -87
- teradataml/data/apriori_example.json +22 -0
- teradataml/data/docs/sqle/docs_17_20/Apriori.py +138 -0
- teradataml/data/docs/sqle/docs_17_20/NERExtractor.py +121 -0
- teradataml/data/docs/sqle/docs_17_20/NGramSplitter.py +3 -3
- teradataml/data/docs/sqle/docs_17_20/SMOTE.py +212 -0
- teradataml/data/docs/sqle/docs_17_20/TextMorph.py +119 -0
- teradataml/data/docs/sqle/docs_17_20/TextParser.py +54 -3
- teradataml/data/docs/uaf/docs_17_20/ACF.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/ArimaEstimate.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/ArimaXEstimate.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/DFFT.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/DFFT2.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/DFFT2Conv.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/DFFTConv.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/FilterFactory1d.py +4 -4
- teradataml/data/docs/uaf/docs_17_20/GenseriesSinusoids.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/GoldfeldQuandt.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/HoltWintersForecaster.py +6 -6
- teradataml/data/docs/uaf/docs_17_20/LineSpec.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/LinearRegr.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/Matrix2Image.py +4 -4
- teradataml/data/docs/uaf/docs_17_20/MultivarRegr.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/PACF.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/PowerSpec.py +2 -2
- teradataml/data/docs/uaf/docs_17_20/PowerTransform.py +3 -3
- teradataml/data/docs/uaf/docs_17_20/Resample.py +5 -5
- teradataml/data/docs/uaf/docs_17_20/SAX.py +3 -3
- teradataml/data/docs/uaf/docs_17_20/SignifPeriodicities.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/SimpleExp.py +1 -1
- teradataml/data/docs/uaf/docs_17_20/Smoothma.py +3 -3
- teradataml/data/docs/uaf/docs_17_20/UNDIFF.py +1 -1
- teradataml/data/jsons/sqle/17.20/NGramSplitter.json +6 -6
- teradataml/data/jsons/sqle/17.20/TD_Apriori.json +181 -0
- teradataml/data/jsons/sqle/17.20/TD_NERExtractor.json +145 -0
- teradataml/data/jsons/sqle/17.20/TD_SMOTE.json +267 -0
- teradataml/data/jsons/sqle/17.20/TD_TextMorph.json +134 -0
- teradataml/data/jsons/sqle/17.20/TD_TextParser.json +114 -9
- teradataml/data/jsons/sqle/20.00/AI_AnalyzeSentiment.json +328 -0
- teradataml/data/jsons/sqle/20.00/AI_AskLLM.json +420 -0
- teradataml/data/jsons/sqle/20.00/AI_DetectLanguage.json +343 -0
- teradataml/data/jsons/sqle/20.00/AI_ExtractKeyPhrases.json +328 -0
- teradataml/data/jsons/sqle/20.00/AI_MaskPII.json +328 -0
- teradataml/data/jsons/sqle/20.00/AI_RecognizeEntities.json +328 -0
- teradataml/data/jsons/sqle/20.00/AI_RecognizePIIEntities.json +328 -0
- teradataml/data/jsons/sqle/20.00/AI_TextClassifier.json +359 -0
- teradataml/data/jsons/sqle/20.00/AI_TextEmbeddings.json +360 -0
- teradataml/data/jsons/sqle/20.00/AI_TextSummarize.json +343 -0
- teradataml/data/jsons/sqle/20.00/AI_TextTranslate.json +343 -0
- teradataml/data/jsons/sqle/20.00/TD_SMOTE.json +2 -2
- teradataml/data/jsons/sqle/20.00/TD_VectorDistance.json +1 -1
- teradataml/data/ner_dict.csv +8 -0
- teradataml/data/ner_input_eng.csv +7 -0
- teradataml/data/ner_rule.csv +5 -0
- teradataml/data/pos_input.csv +40 -0
- teradataml/data/tdnerextractor_example.json +14 -0
- teradataml/data/teradataml_example.json +13 -0
- teradataml/data/textmorph_example.json +5 -0
- teradataml/data/to_num_data.csv +4 -0
- teradataml/data/tochar_data.csv +5 -0
- teradataml/data/trans_dense.csv +16 -0
- teradataml/data/trans_sparse.csv +55 -0
- teradataml/dataframe/copy_to.py +37 -26
- teradataml/dataframe/data_transfer.py +61 -45
- teradataml/dataframe/dataframe.py +130 -50
- teradataml/dataframe/dataframe_utils.py +15 -2
- teradataml/dataframe/functions.py +109 -9
- teradataml/dataframe/sql.py +328 -76
- teradataml/dbutils/dbutils.py +33 -13
- teradataml/dbutils/filemgr.py +14 -10
- teradataml/lib/aed_0_1.dll +0 -0
- teradataml/opensource/_base.py +6 -157
- teradataml/options/configure.py +4 -5
- teradataml/scriptmgmt/UserEnv.py +305 -38
- teradataml/scriptmgmt/lls_utils.py +376 -130
- teradataml/store/__init__.py +1 -1
- teradataml/table_operators/Apply.py +16 -1
- teradataml/table_operators/Script.py +20 -1
- teradataml/table_operators/table_operator_util.py +58 -9
- teradataml/utils/dtypes.py +2 -1
- teradataml/utils/internal_buffer.py +22 -2
- teradataml/utils/validators.py +313 -57
- {teradataml-20.0.0.4.dist-info → teradataml-20.0.0.5.dist-info}/METADATA +89 -14
- {teradataml-20.0.0.4.dist-info → teradataml-20.0.0.5.dist-info}/RECORD +107 -77
- {teradataml-20.0.0.4.dist-info → teradataml-20.0.0.5.dist-info}/WHEEL +0 -0
- {teradataml-20.0.0.4.dist-info → teradataml-20.0.0.5.dist-info}/top_level.txt +0 -0
- {teradataml-20.0.0.4.dist-info → teradataml-20.0.0.5.dist-info}/zip-safe +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: teradataml
|
|
3
|
-
Version: 20.0.0.4
|
|
3
|
+
Version: 20.0.0.5
|
|
4
4
|
Summary: Teradata Vantage Python package for Advanced Analytics
|
|
5
5
|
Home-page: http://www.teradata.com/
|
|
6
6
|
Author: Teradata Corporation
|
|
@@ -17,14 +17,16 @@ Classifier: Topic :: Database :: Front-Ends
|
|
|
17
17
|
Classifier: License :: Other/Proprietary License
|
|
18
18
|
Requires-Python: >=3.8
|
|
19
19
|
Description-Content-Type: text/markdown
|
|
20
|
-
Requires-Dist: teradatasql (>=20.0.0.
|
|
21
|
-
Requires-Dist: teradatasqlalchemy (>=20.0.0.
|
|
20
|
+
Requires-Dist: teradatasql (>=20.0.0.26)
|
|
21
|
+
Requires-Dist: teradatasqlalchemy (>=20.0.0.5)
|
|
22
22
|
Requires-Dist: pandas (>=0.22)
|
|
23
23
|
Requires-Dist: psutil
|
|
24
24
|
Requires-Dist: requests (>=2.25.1)
|
|
25
25
|
Requires-Dist: scikit-learn (>=0.24.2)
|
|
26
26
|
Requires-Dist: IPython (>=8.10.0)
|
|
27
27
|
Requires-Dist: imbalanced-learn (>=0.8.0)
|
|
28
|
+
Requires-Dist: matplotlib (>=3.7.5)
|
|
29
|
+
Requires-Dist: seaborn (>=0.13.0)
|
|
28
30
|
Requires-Dist: pyjwt (>=2.8.0)
|
|
29
31
|
Requires-Dist: cryptography (>=42.0.5)
|
|
30
32
|
Requires-Dist: sqlalchemy (>=2.0)
|
|
@@ -40,7 +42,7 @@ For community support, please visit the [Teradata Community](https://support.ter
|
|
|
40
42
|
|
|
41
43
|
For Teradata customer support, please visit [Teradata Support](https://support.teradata.com/csm).
|
|
42
44
|
|
|
43
|
-
Copyright 2024, Teradata. All Rights Reserved.
|
|
45
|
+
Copyright 2025, Teradata. All Rights Reserved.
|
|
44
46
|
|
|
45
47
|
### Table of Contents
|
|
46
48
|
* [Release Notes](#release-notes)
|
|
@@ -51,10 +53,83 @@ Copyright 2024, Teradata. All Rights Reserved.
|
|
|
51
53
|
|
|
52
54
|
## Release Notes:
|
|
53
55
|
|
|
56
|
+
#### teradataml 20.00.00.05
|
|
57
|
+
* ##### New Features/Functionality
|
|
58
|
+
* ##### teradataml: AutoML
|
|
59
|
+
* New methods added for `AutoML()`, `AutoRegressor()` and `AutoClassifier()`:
|
|
60
|
+
* `get_persisted_tables()` - List the persisted tables created during AutoML execution.
|
|
61
|
+
* `visualize()` - Generates visualizations to analyze and understand the underlying patterns in the data.
|
|
62
|
+
|
|
63
|
+
* ##### AutoDataPrep - Automated Data Preparation
|
|
64
|
+
AutoDataPrep simplifies the data preparation process by automating the different aspects of
|
|
65
|
+
data cleaning and transformation, enabling seamless exploration, transformation, and optimization of datasets.
|
|
66
|
+
* `AutoDataPrep`
|
|
67
|
+
* Methods of AutoDataPrep
|
|
68
|
+
* `__init__()` - Instantiate an object of AutoDataPrep with given parameters.
|
|
69
|
+
* `fit()` - Perform fit on specified data and target column.
|
|
70
|
+
* `get_data()` - Retrieve the data after AutoDataPrep.
|
|
71
|
+
* `load()` - Load the saved datasets from Teradata Vantage.
|
|
72
|
+
* `deploy()` - Persist the datasets generated by AutoDataPrep in Teradata Vantage.
|
|
73
|
+
* `delete_data()` - Deletes the deployed dataset from Teradata Vantage.
|
|
74
|
+
* `visualize()` - Generates visualizations to analyze and understand the underlying patterns in the data.
|
|
75
|
+
|
|
76
|
+
* ##### teradataml: SQLE Engine Analytic Functions
|
|
77
|
+
* New Analytics Database Analytic Functions:
|
|
78
|
+
* `Apriori()`
|
|
79
|
+
* `NERExtractor()`
|
|
80
|
+
* `TextMorph()`
|
|
81
|
+
|
|
82
|
+
* ##### teradataml: Functions
|
|
83
|
+
* `td_range()` - Creates a DataFrame with a specified range of numbers.
|
|
84
|
+
|
|
85
|
+
* ##### teradataml DataFrameColumn a.k.a. ColumnExpression
|
|
86
|
+
* `DataFrameColumn.to_number()` - Function converts a string-like representation of a number to NUMBER type.
|
|
87
|
+
|
|
88
|
+
* ##### Updates
|
|
89
|
+
* ###### teradataml: DataFrame function
|
|
90
|
+
* `DataFrame.agg()`: User can now request different percentiles while running the agg function.
|
|
91
|
+
* New argument `debug` is added to `DataFrame.map_row()`, `DataFrame.map_partition()`, `DataFrame.apply()` and `udf()`. During the execution of these functions, teradataml internally generates scripts, which are garbage collected implicitly. To help debug failures, this argument lets the user control garbage collection of the generated script. When set to False (default), the generated script is garbage collected; otherwise, the script is retained, its path is displayed, and the user is responsible for removing it if required.
|
|
92
|
+
* `map_row()`, `map_partition()` and `apply()`
|
|
93
|
+
* Raises a TeradataMlException, if the Python interpreter major version is different between the Vantage Python environment and the local user environment.
|
|
94
|
+
* Displays a warning, if `dill` package version is different between the Vantage Python environment and the local user environment.
|
|
95
|
+
* `DataFrame.describe()`: Argument `include` is no longer supported.
|
|
96
|
+
* `assign()` - Optimized SQL query to enhance the performance for consecutive assign calls.
|
|
97
|
+
|
|
98
|
+
* ###### teradataml: Context Creation
|
|
99
|
+
* `create_context()`
|
|
100
|
+
* Enables user to set the authentication token while creating the connection. This authentication token is required to access services running on Teradata Vantage.
|
|
101
|
+
* New argument `sql_timeout` is added to specify timeout for SQL statement execution triggered from the current session.
|
|
102
|
+
|
|
103
|
+
* ###### teradataml: UAF Functions
|
|
104
|
+
* Integer type value is now accepted as a valid value for function arguments accepting float type.
|
|
105
|
+
|
|
106
|
+
* ###### General functions
|
|
107
|
+
* `set_auth_token()`
|
|
108
|
+
* Added argument `kid` to accept the name of the key used while generating `pem_file`.
|
|
109
|
+
* New keyword argument `auth_mech` accepts the authentication mechanism to be used for generating authentication token.
|
|
110
|
+
* Basic authentication is now supported as well. New keyword argument `password` accepts password for database user in such case.
|
|
111
|
+
* `copy_to_sql()` and `read_csv()` support the VECTOR data type.
|
|
112
|
+
|
|
113
|
+
* ###### Open Analytics Framework (OpenAF) APIs:
|
|
114
|
+
* `create_env()`:
|
|
115
|
+
* Supports creation of conda R environment.
|
|
116
|
+
|
|
117
|
+
* ###### teradataml DataFrameColumn a.k.a. ColumnExpression
|
|
118
|
+
* _String Functions_
|
|
119
|
+
* `DataFrameColumn.substr()` - Arguments `start_pos` and `length` now accept DataFrameColumn as input.
|
|
120
|
+
* `DataFrameColumn.to_char()` - Argument `formatter` now accepts DataFrameColumn as input.
|
|
121
|
+
|
|
122
|
+
* ###### teradataml: SQLE Engine Analytic Functions
|
|
123
|
+
* Updated Analytics Database Analytic Functions:
|
|
124
|
+
* `SMOTE()` is now supported on 17.20.00.00 as well.
|
|
125
|
+
* `TextParser()`
|
|
126
|
+
* New arguments added: `enforce_token_limit`, `delimiter_regex`, `doc_id_column`,
|
|
127
|
+
`list_positions`, `token_frequency`, `output_by_word`
|
|
128
|
+
|
|
54
129
|
#### teradataml 20.00.00.04
|
|
55
130
|
* ##### New Features/Functionality
|
|
56
131
|
* ###### teradataml OTF Support:
|
|
57
|
-
* This release has enabled the support for accessing OTF data from teradataml.
|
|
132
|
+
* This release has enabled the support for accessing OTF data from teradataml.
|
|
58
133
|
* User can now create a teradataml DataFrame on OTF table, allowing user to use teradataml functions.
|
|
59
134
|
* Example usage below:
|
|
60
135
|
* Creation of view on OTF/datalake table is not supported. Hence, user has to set `configure.temp_object_type` to `VT` using below-mentioned statement.
|
|
@@ -82,7 +157,7 @@ Copyright 2024, Teradata. All Rights Reserved.
|
|
|
82
157
|
```
|
|
83
158
|
* ###### teradataml: DataFrame
|
|
84
159
|
* Introduced a new feature 'Exploratory Data Analysis UI' (EDA-UI), which enhances
|
|
85
|
-
the user experience of teradataml with Jupyter notebook. EDA-UI is displayed by default
|
|
160
|
+
the user experience of teradataml with Jupyter notebook. EDA-UI is displayed by default
|
|
86
161
|
when a teradataml DataFrame is printed in the Jupyter notebook.
|
|
87
162
|
* User can control the EDA-UI using a new configuration option `display.enable_ui`.
|
|
88
163
|
It can be disabled by setting `display.enable_ui` to False.
|
|
@@ -99,7 +174,7 @@ Copyright 2024, Teradata. All Rights Reserved.
|
|
|
99
174
|
* `td_lightgbm.load()` - Load the deployed model in the current session.
|
|
100
175
|
|
|
101
176
|
* ###### FeatureStore
|
|
102
|
-
* New function `FeatureStore.delete()` is added to drop the Feature Store and corresponding repo from Vantage.
|
|
177
|
+
* New function `FeatureStore.delete()` is added to drop the Feature Store and corresponding repo from Vantage.
|
|
103
178
|
|
|
104
179
|
* ###### Database Utility
|
|
105
180
|
* `db_python_version_diff()` - Identifies the Python interpreter major version difference between the interpreter installed on Vantage vs interpreter on the local user environment.
|
|
@@ -112,13 +187,13 @@ Copyright 2024, Teradata. All Rights Reserved.
|
|
|
112
187
|
* Configuration Options
|
|
113
188
|
* `configure.temp_object_type` - Allows user to choose between creating volatile tables or views for teradataml internal use. By default, teradataml internally creates the views for some of the operations. Now, with new configuration option, user can opt to create Volatile tables instead of views. This provides greater flexibility for users who lack the necessary permissions to create view or need to create views on tables without WITH GRANT permissions.
|
|
114
189
|
* Display Options
|
|
115
|
-
* `display.enable_ui` - Specifies whether to display exploratory data analysis UI when DataFrame is printed. By default, this option is enabled (True), allowing exploratory data analysis UI to be displayed. When set to False, exploratory data analysis UI is hidden.
|
|
190
|
+
* `display.enable_ui` - Specifies whether to display exploratory data analysis UI when DataFrame is printed. By default, this option is enabled (True), allowing exploratory data analysis UI to be displayed. When set to False, exploratory data analysis UI is hidden.
|
|
116
191
|
|
|
117
192
|
* ##### Updates
|
|
118
193
|
* ###### teradataml: DataFrame function
|
|
119
194
|
* `describe()`
|
|
120
195
|
* New argument added: `pivot`.
|
|
121
|
-
* When argument `pivot` is set to False, Non-numeric columns are no longer supported for generating statistics.
|
|
196
|
+
* When argument `pivot` is set to False, Non-numeric columns are no longer supported for generating statistics.
|
|
122
197
|
Use `CategoricalSummary` and `ColumnSummary`.
|
|
123
198
|
* `fillna()` - Accepts new argument `partition_column` to partition the data and impute null values accordingly.
|
|
124
199
|
* Optimised performance for `DataFrame.plot()`.
|
|
@@ -128,8 +203,8 @@ Copyright 2024, Teradata. All Rights Reserved.
|
|
|
128
203
|
* ###### teradataml: DataFrame Utilities
|
|
129
204
|
* `in_schema()`: New argument `datalake_name` added to accept datalake name.
|
|
130
205
|
|
|
131
|
-
* ###### Table Operator
|
|
132
|
-
* `Apply()` no longer looks at authentication token by default. Authentication token is now required only if user
|
|
206
|
+
* ###### Table Operator
|
|
207
|
+
* `Apply()` no longer looks at authentication token by default. Authentication token is now required only if user wants to consume Open Analytics Framework REST APIs.
|
|
133
208
|
|
|
134
209
|
* ###### Hyper Parameter Tuner
|
|
135
210
|
* `GridSearch()` and `RandomSearch()` now display a message to refer to `get_error_log()` api when model training fails in HPT.
|
|
@@ -147,7 +222,7 @@ Copyright 2024, Teradata. All Rights Reserved.
|
|
|
147
222
|
|
|
148
223
|
* ###### OpensourceML
|
|
149
224
|
* Raises a TeradataMlException, if the Python interpreter major version is different between the Vantage Python environment and the local user environment.
|
|
150
|
-
* Displays a warning, if specific Python package versions are different between the Vantage Python environment and the local user environment.
|
|
225
|
+
* Displays a warning, if specific Python package versions are different between the Vantage Python environment and the local user environment.
|
|
151
226
|
|
|
152
227
|
* ###### Database Utility
|
|
153
228
|
* `db_list_tables()`: New argument `datalake_name` added to accept datalake name to list tables from.
|
|
@@ -165,10 +240,10 @@ Copyright 2024, Teradata. All Rights Reserved.
|
|
|
165
240
|
* `DataFrame.set_index()` no longer modifies the original DataFrame's index when argument `append` is used.
|
|
166
241
|
* `concat()` function now supports DataFrames whose column names start with a digit, contain special characters, or are reserved keywords.
|
|
167
242
|
* `create_env()` proceeds to install other files even if current file installation fails.
|
|
168
|
-
* Corrected the error message being raised in `create_env()` when authentication is not set.
|
|
243
|
+
* Corrected the error message being raised in `create_env()` when authentication token is not set.
|
|
169
244
|
* Added missing argument `charset` for Vantage Analytic Library functions.
|
|
170
245
|
* New argument `seed` is added to `AutoML`, `AutoRegressor` and `AutoClassifier` to ensure consistency of results.
|
|
171
|
-
* Analytic functions now work even if name of columns for underlying tables
|
|
246
|
+
* Analytic functions now work even if the column names of the underlying tables contain non-ASCII characters.
|
|
172
247
|
|
|
173
248
|
#### teradataml 20.00.00.03
|
|
174
249
|
|