teradataml 20.0.0.0__py3-none-any.whl → 20.0.0.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of teradataml might be problematic; see the package registry's advisory page for more details.

Files changed (263) hide show
  1. teradataml/LICENSE-3RD-PARTY.pdf +0 -0
  2. teradataml/LICENSE.pdf +0 -0
  3. teradataml/README.md +183 -0
  4. teradataml/__init__.py +6 -3
  5. teradataml/_version.py +2 -2
  6. teradataml/analytics/__init__.py +3 -2
  7. teradataml/analytics/analytic_function_executor.py +275 -40
  8. teradataml/analytics/analytic_query_generator.py +92 -0
  9. teradataml/analytics/byom/__init__.py +3 -2
  10. teradataml/analytics/json_parser/metadata.py +1 -0
  11. teradataml/analytics/json_parser/utils.py +17 -21
  12. teradataml/analytics/meta_class.py +40 -1
  13. teradataml/analytics/sqle/DecisionTreePredict.py +1 -1
  14. teradataml/analytics/sqle/__init__.py +10 -2
  15. teradataml/analytics/table_operator/__init__.py +3 -2
  16. teradataml/analytics/uaf/__init__.py +21 -2
  17. teradataml/analytics/utils.py +62 -1
  18. teradataml/analytics/valib.py +1 -1
  19. teradataml/automl/__init__.py +1553 -319
  20. teradataml/automl/custom_json_utils.py +139 -61
  21. teradataml/automl/data_preparation.py +276 -319
  22. teradataml/automl/data_transformation.py +163 -81
  23. teradataml/automl/feature_engineering.py +402 -239
  24. teradataml/automl/feature_exploration.py +9 -2
  25. teradataml/automl/model_evaluation.py +48 -51
  26. teradataml/automl/model_training.py +291 -189
  27. teradataml/catalog/byom.py +8 -8
  28. teradataml/catalog/model_cataloging_utils.py +1 -1
  29. teradataml/clients/auth_client.py +133 -0
  30. teradataml/clients/pkce_client.py +1 -1
  31. teradataml/common/aed_utils.py +3 -2
  32. teradataml/common/constants.py +48 -6
  33. teradataml/common/deprecations.py +13 -7
  34. teradataml/common/garbagecollector.py +156 -120
  35. teradataml/common/messagecodes.py +6 -1
  36. teradataml/common/messages.py +3 -1
  37. teradataml/common/sqlbundle.py +1 -1
  38. teradataml/common/utils.py +103 -11
  39. teradataml/common/wrapper_utils.py +1 -1
  40. teradataml/context/context.py +121 -31
  41. teradataml/data/advertising.csv +201 -0
  42. teradataml/data/bank_marketing.csv +11163 -0
  43. teradataml/data/bike_sharing.csv +732 -0
  44. teradataml/data/boston2cols.csv +721 -0
  45. teradataml/data/breast_cancer.csv +570 -0
  46. teradataml/data/complaints_test_tokenized.csv +353 -0
  47. teradataml/data/complaints_tokens_model.csv +348 -0
  48. teradataml/data/covid_confirm_sd.csv +83 -0
  49. teradataml/data/customer_segmentation_test.csv +2628 -0
  50. teradataml/data/customer_segmentation_train.csv +8069 -0
  51. teradataml/data/dataframe_example.json +10 -0
  52. teradataml/data/docs/sqle/docs_17_10/OneHotEncodingFit.py +3 -1
  53. teradataml/data/docs/sqle/docs_17_10/OneHotEncodingTransform.py +6 -0
  54. teradataml/data/docs/sqle/docs_17_10/OutlierFilterTransform.py +5 -1
  55. teradataml/data/docs/sqle/docs_17_20/ANOVA.py +61 -1
  56. teradataml/data/docs/sqle/docs_17_20/CFilter.py +132 -0
  57. teradataml/data/docs/sqle/docs_17_20/ColumnTransformer.py +2 -0
  58. teradataml/data/docs/sqle/docs_17_20/FTest.py +105 -26
  59. teradataml/data/docs/sqle/docs_17_20/GLM.py +162 -1
  60. teradataml/data/docs/sqle/docs_17_20/GetFutileColumns.py +5 -3
  61. teradataml/data/docs/sqle/docs_17_20/KMeans.py +48 -1
  62. teradataml/data/docs/sqle/docs_17_20/NaiveBayes.py +162 -0
  63. teradataml/data/docs/sqle/docs_17_20/NonLinearCombineFit.py +3 -2
  64. teradataml/data/docs/sqle/docs_17_20/OneHotEncodingFit.py +5 -0
  65. teradataml/data/docs/sqle/docs_17_20/OneHotEncodingTransform.py +6 -0
  66. teradataml/data/docs/sqle/docs_17_20/OutlierFilterFit.py +2 -0
  67. teradataml/data/docs/sqle/docs_17_20/Pivoting.py +279 -0
  68. teradataml/data/docs/sqle/docs_17_20/ROC.py +3 -2
  69. teradataml/data/docs/sqle/docs_17_20/SVMPredict.py +13 -2
  70. teradataml/data/docs/sqle/docs_17_20/ScaleFit.py +119 -1
  71. teradataml/data/docs/sqle/docs_17_20/ScaleTransform.py +93 -1
  72. teradataml/data/docs/sqle/docs_17_20/Shap.py +197 -0
  73. teradataml/data/docs/sqle/docs_17_20/TDGLMPredict.py +163 -1
  74. teradataml/data/docs/sqle/docs_17_20/TDNaiveBayesPredict.py +189 -0
  75. teradataml/data/docs/sqle/docs_17_20/TFIDF.py +142 -0
  76. teradataml/data/docs/sqle/docs_17_20/Unpivoting.py +216 -0
  77. teradataml/data/docs/sqle/docs_17_20/XGBoost.py +12 -4
  78. teradataml/data/docs/sqle/docs_17_20/XGBoostPredict.py +7 -1
  79. teradataml/data/docs/sqle/docs_17_20/ZTest.py +72 -7
  80. teradataml/data/docs/uaf/docs_17_20/ACF.py +1 -10
  81. teradataml/data/docs/uaf/docs_17_20/ArimaEstimate.py +1 -1
  82. teradataml/data/docs/uaf/docs_17_20/ArimaForecast.py +35 -5
  83. teradataml/data/docs/uaf/docs_17_20/ArimaValidate.py +3 -1
  84. teradataml/data/docs/uaf/docs_17_20/ArimaXEstimate.py +293 -0
  85. teradataml/data/docs/uaf/docs_17_20/AutoArima.py +354 -0
  86. teradataml/data/docs/uaf/docs_17_20/BreuschGodfrey.py +3 -2
  87. teradataml/data/docs/uaf/docs_17_20/BreuschPaganGodfrey.py +1 -1
  88. teradataml/data/docs/uaf/docs_17_20/Convolve.py +13 -10
  89. teradataml/data/docs/uaf/docs_17_20/Convolve2.py +4 -1
  90. teradataml/data/docs/uaf/docs_17_20/CumulPeriodogram.py +5 -4
  91. teradataml/data/docs/uaf/docs_17_20/DFFT2Conv.py +4 -4
  92. teradataml/data/docs/uaf/docs_17_20/DWT.py +235 -0
  93. teradataml/data/docs/uaf/docs_17_20/DWT2D.py +214 -0
  94. teradataml/data/docs/uaf/docs_17_20/DurbinWatson.py +1 -1
  95. teradataml/data/docs/uaf/docs_17_20/ExtractResults.py +1 -1
  96. teradataml/data/docs/uaf/docs_17_20/FilterFactory1d.py +160 -0
  97. teradataml/data/docs/uaf/docs_17_20/GenseriesSinusoids.py +1 -1
  98. teradataml/data/docs/uaf/docs_17_20/GoldfeldQuandt.py +9 -31
  99. teradataml/data/docs/uaf/docs_17_20/HoltWintersForecaster.py +4 -2
  100. teradataml/data/docs/uaf/docs_17_20/IDFFT2.py +1 -8
  101. teradataml/data/docs/uaf/docs_17_20/IDWT.py +236 -0
  102. teradataml/data/docs/uaf/docs_17_20/IDWT2D.py +226 -0
  103. teradataml/data/docs/uaf/docs_17_20/IQR.py +134 -0
  104. teradataml/data/docs/uaf/docs_17_20/LineSpec.py +1 -1
  105. teradataml/data/docs/uaf/docs_17_20/LinearRegr.py +2 -2
  106. teradataml/data/docs/uaf/docs_17_20/MAMean.py +3 -3
  107. teradataml/data/docs/uaf/docs_17_20/Matrix2Image.py +297 -0
  108. teradataml/data/docs/uaf/docs_17_20/MatrixMultiply.py +15 -6
  109. teradataml/data/docs/uaf/docs_17_20/PACF.py +0 -1
  110. teradataml/data/docs/uaf/docs_17_20/Portman.py +2 -2
  111. teradataml/data/docs/uaf/docs_17_20/PowerSpec.py +2 -2
  112. teradataml/data/docs/uaf/docs_17_20/Resample.py +9 -1
  113. teradataml/data/docs/uaf/docs_17_20/SAX.py +246 -0
  114. teradataml/data/docs/uaf/docs_17_20/SeasonalNormalize.py +17 -10
  115. teradataml/data/docs/uaf/docs_17_20/SignifPeriodicities.py +1 -1
  116. teradataml/data/docs/uaf/docs_17_20/WhitesGeneral.py +3 -1
  117. teradataml/data/docs/uaf/docs_17_20/WindowDFFT.py +368 -0
  118. teradataml/data/dwt2d_dataTable.csv +65 -0
  119. teradataml/data/dwt_dataTable.csv +8 -0
  120. teradataml/data/dwt_filterTable.csv +3 -0
  121. teradataml/data/finance_data4.csv +13 -0
  122. teradataml/data/glm_example.json +28 -1
  123. teradataml/data/grocery_transaction.csv +19 -0
  124. teradataml/data/housing_train_segment.csv +201 -0
  125. teradataml/data/idwt2d_dataTable.csv +5 -0
  126. teradataml/data/idwt_dataTable.csv +8 -0
  127. teradataml/data/idwt_filterTable.csv +3 -0
  128. teradataml/data/insect2Cols.csv +61 -0
  129. teradataml/data/interval_data.csv +5 -0
  130. teradataml/data/jsons/paired_functions.json +14 -0
  131. teradataml/data/jsons/sqle/17.20/TD_ANOVA.json +99 -27
  132. teradataml/data/jsons/sqle/17.20/TD_CFilter.json +118 -0
  133. teradataml/data/jsons/sqle/17.20/TD_FTest.json +166 -83
  134. teradataml/data/jsons/sqle/17.20/TD_GLM.json +90 -14
  135. teradataml/data/jsons/sqle/17.20/TD_GLMPREDICT.json +48 -5
  136. teradataml/data/jsons/sqle/17.20/TD_GetFutileColumns.json +5 -3
  137. teradataml/data/jsons/sqle/17.20/TD_KMeans.json +31 -11
  138. teradataml/data/jsons/sqle/17.20/TD_NaiveBayes.json +193 -0
  139. teradataml/data/jsons/sqle/17.20/TD_NaiveBayesPredict.json +212 -0
  140. teradataml/data/jsons/sqle/17.20/TD_NonLinearCombineFit.json +3 -2
  141. teradataml/data/jsons/sqle/17.20/TD_OneClassSVM.json +9 -9
  142. teradataml/data/jsons/sqle/17.20/TD_Pivoting.json +280 -0
  143. teradataml/data/jsons/sqle/17.20/TD_ROC.json +2 -1
  144. teradataml/data/jsons/sqle/17.20/TD_SVM.json +16 -16
  145. teradataml/data/jsons/sqle/17.20/TD_SVMPredict.json +19 -1
  146. teradataml/data/jsons/sqle/17.20/TD_ScaleFit.json +168 -15
  147. teradataml/data/jsons/sqle/17.20/TD_ScaleTransform.json +50 -1
  148. teradataml/data/jsons/sqle/17.20/TD_Shap.json +222 -0
  149. teradataml/data/jsons/sqle/17.20/TD_TFIDF.json +162 -0
  150. teradataml/data/jsons/sqle/17.20/TD_Unpivoting.json +235 -0
  151. teradataml/data/jsons/sqle/17.20/TD_XGBoost.json +25 -7
  152. teradataml/data/jsons/sqle/17.20/TD_XGBoostPredict.json +17 -4
  153. teradataml/data/jsons/sqle/17.20/TD_ZTest.json +157 -80
  154. teradataml/data/jsons/storedprocedure/17.20/TD_FILTERFACTORY1D.json +150 -0
  155. teradataml/data/jsons/uaf/17.20/TD_ACF.json +1 -18
  156. teradataml/data/jsons/uaf/17.20/TD_ARIMAESTIMATE.json +3 -16
  157. teradataml/data/jsons/uaf/17.20/TD_ARIMAFORECAST.json +0 -3
  158. teradataml/data/jsons/uaf/17.20/TD_ARIMAVALIDATE.json +5 -3
  159. teradataml/data/jsons/uaf/17.20/TD_ARIMAXESTIMATE.json +362 -0
  160. teradataml/data/jsons/uaf/17.20/TD_AUTOARIMA.json +469 -0
  161. teradataml/data/jsons/uaf/17.20/TD_BINARYMATRIXOP.json +0 -3
  162. teradataml/data/jsons/uaf/17.20/TD_BINARYSERIESOP.json +0 -2
  163. teradataml/data/jsons/uaf/17.20/TD_BREUSCH_GODFREY.json +2 -1
  164. teradataml/data/jsons/uaf/17.20/TD_BREUSCH_PAGAN_GODFREY.json +2 -5
  165. teradataml/data/jsons/uaf/17.20/TD_CONVOLVE.json +3 -6
  166. teradataml/data/jsons/uaf/17.20/TD_CONVOLVE2.json +1 -3
  167. teradataml/data/jsons/uaf/17.20/TD_CUMUL_PERIODOGRAM.json +0 -5
  168. teradataml/data/jsons/uaf/17.20/TD_DFFT.json +1 -4
  169. teradataml/data/jsons/uaf/17.20/TD_DFFT2.json +2 -7
  170. teradataml/data/jsons/uaf/17.20/TD_DFFT2CONV.json +1 -2
  171. teradataml/data/jsons/uaf/17.20/TD_DFFTCONV.json +0 -2
  172. teradataml/data/jsons/uaf/17.20/TD_DTW.json +3 -6
  173. teradataml/data/jsons/uaf/17.20/TD_DWT.json +173 -0
  174. teradataml/data/jsons/uaf/17.20/TD_DWT2D.json +160 -0
  175. teradataml/data/jsons/uaf/17.20/TD_FITMETRICS.json +1 -1
  176. teradataml/data/jsons/uaf/17.20/TD_GOLDFELD_QUANDT.json +16 -30
  177. teradataml/data/jsons/uaf/17.20/{TD_HOLT_WINTERS_FORECAST.json → TD_HOLT_WINTERS_FORECASTER.json} +1 -2
  178. teradataml/data/jsons/uaf/17.20/TD_IDFFT2.json +1 -15
  179. teradataml/data/jsons/uaf/17.20/TD_IDWT.json +162 -0
  180. teradataml/data/jsons/uaf/17.20/TD_IDWT2D.json +149 -0
  181. teradataml/data/jsons/uaf/17.20/TD_IQR.json +117 -0
  182. teradataml/data/jsons/uaf/17.20/TD_LINEAR_REGR.json +1 -1
  183. teradataml/data/jsons/uaf/17.20/TD_LINESPEC.json +1 -1
  184. teradataml/data/jsons/uaf/17.20/TD_MAMEAN.json +1 -3
  185. teradataml/data/jsons/uaf/17.20/TD_MATRIX2IMAGE.json +209 -0
  186. teradataml/data/jsons/uaf/17.20/TD_PACF.json +2 -2
  187. teradataml/data/jsons/uaf/17.20/TD_POWERSPEC.json +5 -5
  188. teradataml/data/jsons/uaf/17.20/TD_RESAMPLE.json +48 -28
  189. teradataml/data/jsons/uaf/17.20/TD_SAX.json +208 -0
  190. teradataml/data/jsons/uaf/17.20/TD_SEASONALNORMALIZE.json +12 -6
  191. teradataml/data/jsons/uaf/17.20/TD_SIMPLEEXP.json +0 -1
  192. teradataml/data/jsons/uaf/17.20/TD_TRACKINGOP.json +8 -8
  193. teradataml/data/jsons/uaf/17.20/TD_UNDIFF.json +1 -1
  194. teradataml/data/jsons/uaf/17.20/TD_UNNORMALIZE.json +1 -1
  195. teradataml/data/jsons/uaf/17.20/TD_WINDOWDFFT.json +400 -0
  196. teradataml/data/kmeans_example.json +5 -0
  197. teradataml/data/kmeans_table.csv +10 -0
  198. teradataml/data/load_example_data.py +8 -2
  199. teradataml/data/naivebayestextclassifier_example.json +1 -1
  200. teradataml/data/naivebayestextclassifierpredict_example.json +11 -0
  201. teradataml/data/onehot_encoder_train.csv +4 -0
  202. teradataml/data/openml_example.json +29 -0
  203. teradataml/data/peppers.png +0 -0
  204. teradataml/data/real_values.csv +14 -0
  205. teradataml/data/sax_example.json +8 -0
  206. teradataml/data/scale_attributes.csv +3 -0
  207. teradataml/data/scale_example.json +52 -1
  208. teradataml/data/scale_input_part_sparse.csv +31 -0
  209. teradataml/data/scale_input_partitioned.csv +16 -0
  210. teradataml/data/scale_input_sparse.csv +11 -0
  211. teradataml/data/scale_parameters.csv +3 -0
  212. teradataml/data/scripts/deploy_script.py +21 -2
  213. teradataml/data/scripts/sklearn/sklearn_fit.py +40 -37
  214. teradataml/data/scripts/sklearn/sklearn_fit_predict.py +22 -30
  215. teradataml/data/scripts/sklearn/sklearn_function.template +42 -24
  216. teradataml/data/scripts/sklearn/sklearn_model_selection_split.py +23 -33
  217. teradataml/data/scripts/sklearn/sklearn_neighbors.py +19 -28
  218. teradataml/data/scripts/sklearn/sklearn_score.py +32 -32
  219. teradataml/data/scripts/sklearn/sklearn_transform.py +85 -42
  220. teradataml/data/star_pivot.csv +8 -0
  221. teradataml/data/templates/open_source_ml.json +2 -1
  222. teradataml/data/teradataml_example.json +97 -1
  223. teradataml/data/timestamp_data.csv +4 -0
  224. teradataml/data/titanic_dataset_unpivoted.csv +19 -0
  225. teradataml/data/uaf_example.json +55 -1
  226. teradataml/data/unpivot_example.json +15 -0
  227. teradataml/data/url_data.csv +9 -0
  228. teradataml/data/windowdfft.csv +16 -0
  229. teradataml/data/ztest_example.json +16 -0
  230. teradataml/dataframe/copy_to.py +9 -4
  231. teradataml/dataframe/data_transfer.py +125 -64
  232. teradataml/dataframe/dataframe.py +575 -57
  233. teradataml/dataframe/dataframe_utils.py +47 -9
  234. teradataml/dataframe/fastload.py +273 -90
  235. teradataml/dataframe/functions.py +339 -0
  236. teradataml/dataframe/row.py +160 -0
  237. teradataml/dataframe/setop.py +2 -2
  238. teradataml/dataframe/sql.py +740 -18
  239. teradataml/dataframe/window.py +1 -1
  240. teradataml/dbutils/dbutils.py +324 -18
  241. teradataml/geospatial/geodataframe.py +1 -1
  242. teradataml/geospatial/geodataframecolumn.py +1 -1
  243. teradataml/hyperparameter_tuner/optimizer.py +13 -13
  244. teradataml/lib/aed_0_1.dll +0 -0
  245. teradataml/opensource/sklearn/_sklearn_wrapper.py +254 -122
  246. teradataml/options/__init__.py +16 -5
  247. teradataml/options/configure.py +39 -6
  248. teradataml/options/display.py +2 -2
  249. teradataml/plot/axis.py +4 -4
  250. teradataml/scriptmgmt/UserEnv.py +26 -19
  251. teradataml/scriptmgmt/lls_utils.py +120 -16
  252. teradataml/table_operators/Script.py +4 -5
  253. teradataml/table_operators/TableOperator.py +160 -26
  254. teradataml/table_operators/table_operator_util.py +88 -41
  255. teradataml/table_operators/templates/dataframe_udf.template +63 -0
  256. teradataml/telemetry_utils/__init__.py +0 -0
  257. teradataml/telemetry_utils/queryband.py +52 -0
  258. teradataml/utils/validators.py +41 -3
  259. {teradataml-20.0.0.0.dist-info → teradataml-20.0.0.2.dist-info}/METADATA +191 -6
  260. {teradataml-20.0.0.0.dist-info → teradataml-20.0.0.2.dist-info}/RECORD +263 -185
  261. {teradataml-20.0.0.0.dist-info → teradataml-20.0.0.2.dist-info}/WHEEL +0 -0
  262. {teradataml-20.0.0.0.dist-info → teradataml-20.0.0.2.dist-info}/top_level.txt +0 -0
  263. {teradataml-20.0.0.0.dist-info → teradataml-20.0.0.2.dist-info}/zip-safe +0 -0
@@ -0,0 +1,189 @@
1
def TDNaiveBayesPredict(data = None, object = None, id_column = None,
                        numeric_inputs = None, categorical_inputs = None,
                        attribute_name_column = None, attribute_value_column = None,
                        responses = None, output_prob = False, accumulate = None,
                        **generic_arguments):
    """
    DESCRIPTION:
        Function predicts classification label using model generated by NaiveBayes function
        for a test set of data.

    PARAMETERS:
        data:
            Required Argument.
            Specifies the input teradataml DataFrame.
            Types: teradataml DataFrame

        object:
            Required Argument.
            Specifies the teradataml DataFrame containing the model data
            or instance of NaiveBayes.
            Types: teradataml DataFrame or NaiveBayes

        id_column:
            Required Argument.
            Specifies the name of the column that uniquely identifies an
            observation in the "data".
            Types: str

        numeric_inputs:
            Optional Argument.
            Specifies the name of the columns in "data" containing numeric attributes values.
            Types: str OR list of Strings (str)

        categorical_inputs:
            Optional Argument.
            Specifies the name of the columns in "data" containing categorical attributes values.
            Types: str OR list of Strings (str)

        attribute_name_column:
            Optional Argument.
            Specifies the name of the columns in "data" containing attributes names.
            Types: str

        attribute_value_column:
            Optional Argument.
            Specifies the name of the columns in "data" containing attributes values.
            Types: str

        responses:
            Optional Argument.
            Specifies a list of responses to output.
            Types: str OR list of strs

        output_prob:
            Optional Argument.
            Specifies whether to output the probability for each response.
            Default Value: False
            Types: bool

        accumulate:
            Optional Argument.
            Specifies the names of the columns in "data" that need to be copied
            from the input to output teradataml DataFrame.
            Types: str OR list of Strings (str)

        **generic_arguments:
            Specifies the generic keyword arguments SQLE functions accept. Below
            are the generic keyword arguments:
                persist:
                    Optional Argument.
                    Specifies whether to persist the results of the
                    function in a table or not. When set to True,
                    results are persisted in a table; otherwise,
                    results are garbage collected at the end of the
                    session.
                    Default Value: False
                    Types: bool

                volatile:
                    Optional Argument.
                    Specifies whether to put the results of the
                    function in a volatile table or not. When set to
                    True, results are stored in a volatile table,
                    otherwise not.
                    Default Value: False
                    Types: bool

            Function allows the user to partition, hash, order or local
            order the input data. These generic arguments are available
            for each argument that accepts teradataml DataFrame as
            input and can be accessed as:
                * "<input_data_arg_name>_partition_column" accepts str or
                  list of str (Strings)
                * "<input_data_arg_name>_hash_column" accepts str or list
                  of str (Strings)
                * "<input_data_arg_name>_order_column" accepts str or list
                  of str (Strings)
                * "local_order_<input_data_arg_name>" accepts boolean
            Note:
                These generic arguments are supported by teradataml if
                the underlying SQL Engine function supports, else an
                exception is raised.

    RETURNS:
        Instance of NaiveBayesPredict.
        Output teradataml DataFrames can be accessed using attribute
        references, such as NaiveBayesPredictObj.<attribute_name>.
        Output teradataml DataFrame attribute name is:
            result


    RAISES:
        TeradataMlException, TypeError, ValueError


    EXAMPLES:
        # Notes:
        #     1. Get the connection to Vantage, before importing the
        #        function in user space.
        #     2. User can import the function, if it is available on
        #        Vantage user is connected to.
        #     3. To check the list of analytic functions available on
        #        Vantage user connected to, use
        #        "display_analytic_functions()".

        # Load the example data.
        load_example_data("decisionforestpredict", ["housing_train", "housing_test"])

        # Create teradataml DataFrame objects.
        housing_train = DataFrame.from_table("housing_train")
        housing_test = DataFrame.from_table("housing_test")

        # Check the list of available analytic functions.
        display_analytic_functions()

        # Import function NaiveBayesPredict.
        from teradataml import NaiveBayesPredict

        # Example 1: NaiveBayesPredict function to predict the classification label using Dense input.
        NaiveBayes_out = NaiveBayes(data=housing_train, response_column='homestyle',
                                    numeric_inputs=['price','lotsize','bedrooms','bathrms','stories','garagepl'],
                                    categorical_inputs=['driveway','recroom','fullbase','gashw','airco','prefarea'])

        NaiveBayesPredict_out = TDNaiveBayesPredict(data=housing_test, object=NaiveBayes_out.result, id_column='sn',
                                                    numeric_inputs=['price','lotsize','bedrooms','bathrms','stories','garagepl'],
                                                    categorical_inputs=['driveway','recroom','fullbase','gashw','airco','prefarea'],
                                                    responses=['Classic', 'Eclectic', 'bungalow'],
                                                    accumulate='homestyle',
                                                    output_prob=True
                                                    )

        # Print the result DataFrame.
        print( NaiveBayesPredict_out.result)

        # Example 2: NaiveBayesPredict function to predict the classification label using Sparse input.

        # Unpivoting the data for sparse input to naive bayes.
        upvt_train = Unpivoting(data = housing_train, id_column = 'sn',
                                target_columns = ['price','lotsize','bedrooms','bathrms','stories','garagepl',
                                                  'driveway','recroom','fullbase','gashw','airco','prefarea'],
                                attribute_column = "AttributeName",
                                value_column = "AttributeValue",
                                accumulate = 'homestyle')

        upvt_test = Unpivoting(data = housing_test, id_column = 'sn',
                               target_columns = ['price','lotsize','bedrooms','bathrms','stories','garagepl','driveway',
                                                 'recroom','fullbase','gashw','airco','prefarea'],
                               attribute_column = "AttributeName", value_column = "AttributeValue",
                               accumulate = 'homestyle')

        NaiveBayes_out1 = NaiveBayes(data=upvt_train.result,
                                     response_column='homestyle',
                                     attribute_name_column='AttributeName',
                                     attribute_value_column='AttributeValue',
                                     numeric_attributes=['price','lotsize','bedrooms','bathrms','stories','garagepl'],
                                     categorical_attributes=['driveway','recroom','fullbase','gashw','airco','prefarea'])

        NaiveBayesPredict_out1 = TDNaiveBayesPredict(data=upvt_test.result, object=NaiveBayes_out1, id_column='sn',
                                                     attribute_name_column='AttributeName',
                                                     attribute_value_column='AttributeValue',
                                                     responses=['Classic', 'Eclectic', 'bungalow'],
                                                     accumulate='homestyle',
                                                     output_prob=True
                                                     )

        # Print the result DataFrame.
        print( NaiveBayesPredict_out1.result)

    """
@@ -0,0 +1,142 @@
1
def TFIDF(data = None, doc_id_column = None, token_column = None,
          tf_normalization = "NORMAL", idf_normalization = "LOG",
          regularization = "NONE", accumulate = None,
          **generic_arguments):

    """
    DESCRIPTION:
        Function takes any document set and computes the Term Frequency (TF),
        Inverse Document Frequency (IDF), and Term Frequency Inverse Document
        Frequency (TF-IDF) scores for each term.

    PARAMETERS:
        data:
            Required Argument.
            Specifies the input teradataml DataFrame that contains
            the document id and the term.
            Types: teradataml DataFrame

        doc_id_column:
            Required Argument.
            Specifies the name of the column in "data" that contains the
            document identifier.
            Types: str

        token_column:
            Required Argument.
            Specifies the name of the column in "data" that contains the tokens.
            Types: str

        tf_normalization:
            Optional Argument.
            Specifies the normalization method for calculating the term frequency (TF).
            Default Value: "NORMAL"
            Permitted Values: BOOL, COUNT, NORMAL, LOG, AUGMENT
            Types: str

        idf_normalization:
            Optional Argument.
            Specifies the normalization method for calculating the inverse
            document frequency (IDF).
            Default Value: "LOG"
            Permitted Values: UNARY, LOG, LOGNORM, SMOOTH
            Types: str

        regularization:
            Optional Argument.
            Specifies the regularization method for calculating the TF-IDF score.
            Default Value: "NONE"
            Permitted Values: L2, L1, NONE
            Types: str

        accumulate:
            Optional Argument.
            Specifies the name(s) of input teradataml DataFrame column(s) to copy to the
            output.
            Types: str OR list of Strings (str)

        **generic_arguments:
            Specifies the generic keyword arguments SQLE functions accept. Below
            are the generic keyword arguments:
                persist:
                    Optional Argument.
                    Specifies whether to persist the results of the
                    function in a table or not. When set to True,
                    results are persisted in a table; otherwise,
                    results are garbage collected at the end of the
                    session.
                    Default Value: False
                    Types: bool

                volatile:
                    Optional Argument.
                    Specifies whether to put the results of the
                    function in a volatile table or not. When set to
                    True, results are stored in a volatile table,
                    otherwise not.
                    Default Value: False
                    Types: bool

            Function allows the user to partition, hash, order or local
            order the input data. These generic arguments are available
            for each argument that accepts teradataml DataFrame as
            input and can be accessed as:
                * "<input_data_arg_name>_partition_column" accepts str or
                  list of str (Strings)
                * "<input_data_arg_name>_hash_column" accepts str or list
                  of str (Strings)
                * "<input_data_arg_name>_order_column" accepts str or list
                  of str (Strings)
                * "local_order_<input_data_arg_name>" accepts boolean
            Note:
                These generic arguments are supported by teradataml if
                the underlying SQL Engine function supports, else an
                exception is raised.

    RETURNS:
        Instance of TFIDF.
        Output teradataml DataFrames can be accessed using attribute
        references, such as TFIDFObj.<attribute_name>.
        Output teradataml DataFrame attribute name is:
            result


    RAISES:
        TeradataMlException, TypeError, ValueError


    EXAMPLES:
        # Notes:
        #     1. Get the connection to Vantage, before importing the
        #        function in user space.
        #     2. User can import the function, if it is available on
        #        Vantage user is connected to.
        #     3. To check the list of analytic functions available on
        #        Vantage user connected to, use
        #        "display_analytic_functions()".

        # Load the example data.
        load_example_data('naivebayestextclassifier',"token_table")

        # Create teradataml DataFrame objects.
        inp = DataFrame.from_table('token_table')

        # Check the list of available analytic functions.
        display_analytic_functions()

        # Import function TFIDF.
        from teradataml import TFIDF

        # Example 1 : Compute the TF, IDF and TF-IDF scores
        #             for each term in the input data.
        TFIDF_out = TFIDF(data=inp,
                          doc_id_column='doc_id',
                          token_column='token',
                          tf_normalization = "LOG",
                          idf_normalization = "SMOOTH",
                          regularization = "L2",
                          accumulate=['category'])

        # Print the result DataFrame.
        print(TFIDF_out.result)
    """
@@ -0,0 +1,216 @@
1
def Unpivoting(data = None, id_column = None, target_columns = None,
               alias_names = None, attribute_column = "AttributeName", value_column = "AttributeValue",
               accumulate = None, include_nulls = False, input_types = False, output_varchar = False,
               indexed_attribute = False, include_datatypes = False,
               **generic_arguments):

    """
    DESCRIPTION:
        Function unpivots the data, that is, changes the data from
        dense format to sparse format.

    PARAMETERS:
        data:
            Required Argument.
            Specifies the input teradataml DataFrame.
            Types: teradataml DataFrame

        id_column:
            Required Argument.
            Specifies the name of the column in "data" which contains the input data identifier.
            Types: str

        target_columns:
            Required Argument.
            Specifies the name(s) of input teradataml DataFrame column(s) which contains the data for
            unpivoting.
            Types: str OR list of Strings (str)

        alias_names:
            Optional Argument.
            Specifies alternate names for the values in the 'attribute_column' column.
            Types: str OR list of strs

        attribute_column:
            Optional Argument.
            Specifies the name of the column in the output DataFrame, which holds the names of pivoted columns.
            Default Value: "AttributeName"
            Types: str

        value_column:
            Optional Argument.
            Specifies the name of the column in the output DataFrame, which holds the values of pivoted columns.
            Default Value: "AttributeValue"
            Types: str

        accumulate:
            Optional Argument.
            Specifies the name(s) of input teradataml DataFrame column(s) to copy to the output.
            By default, the function copies no input teradataml DataFrame columns to the output.
            Types: str OR list of Strings (str)

        include_nulls:
            Optional Argument.
            Specifies whether or not to include nulls in the transformation.
            Default Value: False
            Types: bool

        input_types:
            Optional Argument.
            Specifies whether attribute values should be organized into multiple columns based on data type groups.
            Note:
                * 'input_types' argument cannot be used when output_varchar is set to True.
            Default Value: False
            Types: bool

        output_varchar:
            Optional Argument.
            Specifies whether to output the 'value_column' in varchar format regardless of its data type.
            Note:
                * 'output_varchar' argument cannot be used when input_types is set to True.
            Default Value: False
            Types: bool

        indexed_attribute:
            Optional Argument.
            Specifies whether to output the column indexes instead of column names in AttributeName column.
            When set to True, outputs the column indexes instead of column names.
            Default Value: False
            Types: bool

        include_datatypes:
            Optional Argument.
            Specifies whether to output the original datatype name. When set to True,
            outputs the original datatype name.
            Default Value: False
            Types: bool

        **generic_arguments:
            Specifies the generic keyword arguments SQLE functions accept. Below
            are the generic keyword arguments:
                persist:
                    Optional Argument.
                    Specifies whether to persist the results of the
                    function in a table or not. When set to True,
                    results are persisted in a table; otherwise,
                    results are garbage collected at the end of the
                    session.
                    Default Value: False
                    Types: bool

                volatile:
                    Optional Argument.
                    Specifies whether to put the results of the
                    function in a volatile table or not. When set to
                    True, results are stored in a volatile table,
                    otherwise not.
                    Default Value: False
                    Types: bool

            Function allows the user to partition, hash, order or local
            order the input data. These generic arguments are available
            for each argument that accepts teradataml DataFrame as
            input and can be accessed as:
                * "<input_data_arg_name>_partition_column" accepts str or
                  list of str (Strings)
                * "<input_data_arg_name>_hash_column" accepts str or list
                  of str (Strings)
                * "<input_data_arg_name>_order_column" accepts str or list
                  of str (Strings)
                * "local_order_<input_data_arg_name>" accepts boolean
            Note:
                These generic arguments are supported by teradataml if
                the underlying SQL Engine function supports, else an
                exception is raised.

    RETURNS:
        Instance of Unpivoting.
        Output teradataml DataFrames can be accessed using attribute
        references, such as UnpivotingObj.<attribute_name>.
        Output teradataml DataFrame attribute name is:
            result


    RAISES:
        TeradataMlException, TypeError, ValueError


    EXAMPLES:
        # Notes:
        #     1. Get the connection to Vantage, before importing the
        #        function in user space.
        #     2. User can import the function, if it is available on
        #        Vantage user is connected to.
        #     3. To check the list of analytic functions available on
        #        Vantage user connected to, use
        #        "display_analytic_functions()".

        # Load the example data.
        load_example_data('unpivot', 'unpivot_input')

        # Create teradataml DataFrame objects.
        upvt_inp = DataFrame('unpivot_input')

        # Check the list of available analytic functions.
        display_analytic_functions()

        # Import function Unpivoting.
        from teradataml import Unpivoting

        # Example 1 : Unpivot the data.
        upvt1 = Unpivoting(data = upvt_inp,
                           id_column = 'sn',
                           target_columns = 'city',
                           accumulate = 'week',
                           include_nulls = True)

        # Print the result DataFrame.
        print( upvt1.result)

        # Example 2 : Unpivot the data with alternate names for the values in
        #             the AttributeName output column.
        upvt2= Unpivoting(data = upvt_inp,
                          id_column = 'sn',
                          target_columns = 'city',
                          alias_names = 'city_us',
                          attribute_column = "Attribute",
                          value_column = "value",
                          accumulate = 'week',
                          include_nulls = True)

        # Print the result DataFrame.
        print( upvt2.result)

        # Example 3 : Unpivot the data with multiple target columns and output
        #             data types.
        upvt3 = Unpivoting(data = upvt_inp,
                           id_column = 'sn',
                           target_columns = ['city','pressure'],
                           attribute_column = "Attribute",
                           value_column = "value",
                           accumulate = 'week',
                           include_nulls = True,
                           indexed_attribute = True,
                           include_datatypes = True)

        # Print the result DataFrame.
        print( upvt3.result)

        # Example 4 : Unpivot the data with multiple target columns and output
        #             the input types.
        upvt4 = Unpivoting(data = upvt_inp,
                           id_column = 'sn',
                           target_columns = ['city','temp'],
                           accumulate = 'week',
                           include_nulls = True,
                           input_types = True)

        # Print the result DataFrame.
        print( upvt4.result)

    """
@@ -1,7 +1,7 @@
1
1
  def XGBoost(formula=None, data=None, input_columns=None, response_column=None, max_depth=5,
2
2
  num_boosted_trees=-1, min_node_size=1, seed=1, model_type='REGRESSION',
3
- coverage_factor=1.0, min_impurity=0.0, lambda1=100000,
4
- shrinkage_factor=0.1, column_sampling=1.0, iter_num=10, tree_size=-1,
3
+ coverage_factor=1.0, min_impurity=0.0, lambda1=1, shrinkage_factor=0.5,
4
+ column_sampling=1.0, iter_num=10, tree_size=-1, base_score=0.0,
5
5
  **generic_arguments):
6
6
  """
7
7
  DESCRIPTION:
@@ -174,7 +174,7 @@ def XGBoost(formula=None, data=None, input_columns=None, response_column=None, m
174
174
  Notes:
175
175
  * The "lambda1" must be in the range [0, 100000].
176
176
  * The value 0 specifies no regularization.
177
- Default Value: 100000
177
+ Default Value: 1
178
178
  Types: float OR int
179
179
 
180
180
  shrinkage_factor:
@@ -185,7 +185,7 @@ def XGBoost(formula=None, data=None, input_columns=None, response_column=None, m
185
185
  Notes:
186
186
  * The "shrinkage_factor" is a DOUBLE PRECISION value in the range (0, 1].
187
187
  * The value 1 specifies no shrinkage.
188
- Default Value: 0.1
188
+ Default Value: 0.5
189
189
  Types: float
190
190
 
191
191
  column_sampling:
@@ -217,6 +217,14 @@ def XGBoost(formula=None, data=None, input_columns=None, response_column=None, m
217
217
  Default Value: -1
218
218
  Types: int
219
219
 
220
+ base_score:
221
+ Optional Argument.
222
+ Specifies the initial prediction value for all data points.
223
+ Note:
224
+ * The "base_score" must be in the range [-1e50, 1e50].
225
+ Default Value: 0.0
226
+ Types: float
227
+
220
228
  **generic_arguments:
221
229
  Specifies the generic keyword arguments SQLE functions accept. Below
222
230
  are the generic keyword arguments:
@@ -1,6 +1,6 @@
1
1
  def XGBoostPredict(newdata=None, object=None, id_column=None, num_boosted_tree=1000,
2
2
  iter_num=3, accumulate=None, output_prob=False, model_type="REGRESSION",
3
- output_responses=None, **generic_arguments):
3
+ output_responses=None, detailed=False, **generic_arguments):
4
4
  """
5
5
  DESCRIPTION:
6
6
  The XGBoostPredict() function runs the predictive algorithm based on the model generated
@@ -123,6 +123,12 @@ def XGBoostPredict(newdata=None, object=None, id_column=None, num_boosted_tree=1
123
123
  'Classification'.
124
124
  Types: str OR list of str(s)
125
125
 
126
+ detailed:
127
+ Optional Argument.
128
+ Specifies whether to output detailed information of each prediction.
129
+ Default Value: False
130
+ Types: bool
131
+
126
132
  **generic_arguments:
127
133
  Specifies the generic keyword arguments SQLE functions accept. Below
128
134
  are the generic keyword arguments: