teradataml 17.20.0.6__py3-none-any.whl → 20.0.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of teradataml might be problematic.

Files changed (432)
  1. teradataml/LICENSE-3RD-PARTY.pdf +0 -0
  2. teradataml/LICENSE.pdf +0 -0
  3. teradataml/README.md +238 -1
  4. teradataml/__init__.py +13 -3
  5. teradataml/_version.py +1 -1
  6. teradataml/analytics/Transformations.py +4 -4
  7. teradataml/analytics/__init__.py +0 -2
  8. teradataml/analytics/analytic_function_executor.py +3 -0
  9. teradataml/analytics/json_parser/utils.py +13 -12
  10. teradataml/analytics/sqle/DecisionTreePredict.py +15 -30
  11. teradataml/analytics/sqle/NaiveBayesPredict.py +11 -20
  12. teradataml/analytics/sqle/__init__.py +0 -13
  13. teradataml/analytics/utils.py +1 -0
  14. teradataml/analytics/valib.py +3 -0
  15. teradataml/automl/__init__.py +1628 -0
  16. teradataml/automl/custom_json_utils.py +1270 -0
  17. teradataml/automl/data_preparation.py +993 -0
  18. teradataml/automl/data_transformation.py +727 -0
  19. teradataml/automl/feature_engineering.py +1648 -0
  20. teradataml/automl/feature_exploration.py +547 -0
  21. teradataml/automl/model_evaluation.py +163 -0
  22. teradataml/automl/model_training.py +887 -0
  23. teradataml/catalog/__init__.py +0 -2
  24. teradataml/catalog/byom.py +49 -6
  25. teradataml/catalog/function_argument_mapper.py +0 -2
  26. teradataml/catalog/model_cataloging_utils.py +2 -1021
  27. teradataml/common/aed_utils.py +6 -2
  28. teradataml/common/constants.py +50 -58
  29. teradataml/common/deprecations.py +160 -0
  30. teradataml/common/garbagecollector.py +61 -104
  31. teradataml/common/messagecodes.py +27 -36
  32. teradataml/common/messages.py +11 -15
  33. teradataml/common/utils.py +205 -287
  34. teradataml/common/wrapper_utils.py +1 -110
  35. teradataml/context/context.py +150 -78
  36. teradataml/data/bank_churn.csv +10001 -0
  37. teradataml/data/bmi.csv +501 -0
  38. teradataml/data/docs/sqle/docs_17_10/BincodeFit.py +3 -3
  39. teradataml/data/docs/sqle/docs_17_10/BincodeTransform.py +6 -5
  40. teradataml/data/docs/sqle/docs_17_10/Fit.py +1 -1
  41. teradataml/data/docs/sqle/docs_17_10/OneHotEncodingTransform.py +1 -1
  42. teradataml/data/docs/sqle/docs_17_10/OutlierFilterTransform.py +1 -1
  43. teradataml/data/docs/sqle/docs_17_10/PolynomialFeaturesTransform.py +2 -2
  44. teradataml/data/docs/sqle/docs_17_10/RowNormalizeTransform.py +2 -1
  45. teradataml/data/docs/sqle/docs_17_10/ScaleTransform.py +1 -0
  46. teradataml/data/docs/sqle/docs_17_10/SimpleImputeTransform.py +1 -1
  47. teradataml/data/docs/sqle/docs_17_10/Transform.py +2 -1
  48. teradataml/data/docs/sqle/docs_17_20/BincodeFit.py +3 -3
  49. teradataml/data/docs/sqle/docs_17_20/BincodeTransform.py +6 -5
  50. teradataml/data/docs/sqle/docs_17_20/Fit.py +1 -1
  51. teradataml/data/docs/sqle/docs_17_20/GLM.py +1 -1
  52. teradataml/data/docs/sqle/docs_17_20/GLMPredictPerSegment.py +9 -10
  53. teradataml/data/docs/sqle/docs_17_20/KMeansPredict.py +3 -2
  54. teradataml/data/docs/sqle/docs_17_20/NaiveBayesTextClassifierPredict.py +16 -15
  55. teradataml/data/docs/sqle/docs_17_20/NaiveBayesTextClassifierTrainer.py +2 -2
  56. teradataml/data/docs/sqle/docs_17_20/NonLinearCombineFit.py +2 -2
  57. teradataml/data/docs/sqle/docs_17_20/NonLinearCombineTransform.py +8 -8
  58. teradataml/data/docs/sqle/docs_17_20/OneClassSVMPredict.py +21 -20
  59. teradataml/data/docs/sqle/docs_17_20/OneHotEncodingTransform.py +1 -1
  60. teradataml/data/docs/sqle/docs_17_20/OutlierFilterTransform.py +8 -3
  61. teradataml/data/docs/sqle/docs_17_20/PolynomialFeaturesTransform.py +6 -5
  62. teradataml/data/docs/sqle/docs_17_20/RandomProjectionTransform.py +6 -6
  63. teradataml/data/docs/sqle/docs_17_20/RowNormalizeTransform.py +2 -1
  64. teradataml/data/docs/sqle/docs_17_20/SVM.py +1 -1
  65. teradataml/data/docs/sqle/docs_17_20/SVMPredict.py +16 -16
  66. teradataml/data/docs/sqle/docs_17_20/ScaleTransform.py +1 -0
  67. teradataml/data/docs/sqle/docs_17_20/SimpleImputeTransform.py +3 -2
  68. teradataml/data/docs/sqle/docs_17_20/TDDecisionForestPredict.py +4 -4
  69. teradataml/data/docs/sqle/docs_17_20/TDGLMPredict.py +19 -19
  70. teradataml/data/docs/sqle/docs_17_20/TargetEncodingTransform.py +5 -4
  71. teradataml/data/docs/sqle/docs_17_20/Transform.py +2 -2
  72. teradataml/data/docs/sqle/docs_17_20/XGBoostPredict.py +9 -9
  73. teradataml/data/fish.csv +160 -0
  74. teradataml/data/glass_types.csv +215 -0
  75. teradataml/data/insurance.csv +1 -1
  76. teradataml/data/iris_data.csv +151 -0
  77. teradataml/data/jsons/sqle/17.10/TD_FunctionTransform.json +1 -0
  78. teradataml/data/jsons/sqle/17.10/TD_OneHotEncodingTransform.json +1 -0
  79. teradataml/data/jsons/sqle/17.10/TD_OutlierFilterTransform.json +1 -0
  80. teradataml/data/jsons/sqle/17.10/TD_PolynomialFeaturesTransform.json +1 -0
  81. teradataml/data/jsons/sqle/17.10/TD_RowNormalizeTransform.json +1 -0
  82. teradataml/data/jsons/sqle/17.10/TD_ScaleTransform.json +1 -0
  83. teradataml/data/jsons/sqle/17.10/TD_SimpleImputeTransform.json +1 -0
  84. teradataml/data/load_example_data.py +3 -0
  85. teradataml/data/multi_model_classification.csv +401 -0
  86. teradataml/data/multi_model_regression.csv +401 -0
  87. teradataml/data/openml_example.json +63 -0
  88. teradataml/data/scripts/deploy_script.py +65 -0
  89. teradataml/data/scripts/mapper.R +20 -0
  90. teradataml/data/scripts/sklearn/__init__.py +0 -0
  91. teradataml/data/scripts/sklearn/sklearn_fit.py +175 -0
  92. teradataml/data/scripts/sklearn/sklearn_fit_predict.py +135 -0
  93. teradataml/data/scripts/sklearn/sklearn_function.template +113 -0
  94. teradataml/data/scripts/sklearn/sklearn_model_selection_split.py +158 -0
  95. teradataml/data/scripts/sklearn/sklearn_neighbors.py +152 -0
  96. teradataml/data/scripts/sklearn/sklearn_score.py +128 -0
  97. teradataml/data/scripts/sklearn/sklearn_transform.py +179 -0
  98. teradataml/data/templates/open_source_ml.json +9 -0
  99. teradataml/data/teradataml_example.json +73 -1
  100. teradataml/data/test_classification.csv +101 -0
  101. teradataml/data/test_prediction.csv +101 -0
  102. teradataml/data/test_regression.csv +101 -0
  103. teradataml/data/train_multiclass.csv +101 -0
  104. teradataml/data/train_regression.csv +101 -0
  105. teradataml/data/train_regression_multiple_labels.csv +101 -0
  106. teradataml/data/wine_data.csv +1600 -0
  107. teradataml/dataframe/copy_to.py +79 -13
  108. teradataml/dataframe/data_transfer.py +8 -0
  109. teradataml/dataframe/dataframe.py +910 -311
  110. teradataml/dataframe/dataframe_utils.py +102 -5
  111. teradataml/dataframe/fastload.py +11 -3
  112. teradataml/dataframe/setop.py +15 -2
  113. teradataml/dataframe/sql.py +3735 -77
  114. teradataml/dataframe/sql_function_parameters.py +56 -5
  115. teradataml/dataframe/vantage_function_types.py +45 -1
  116. teradataml/dataframe/window.py +30 -29
  117. teradataml/dbutils/dbutils.py +18 -1
  118. teradataml/geospatial/geodataframe.py +18 -7
  119. teradataml/geospatial/geodataframecolumn.py +5 -0
  120. teradataml/hyperparameter_tuner/optimizer.py +910 -120
  121. teradataml/hyperparameter_tuner/utils.py +131 -37
  122. teradataml/lib/aed_0_1.dll +0 -0
  123. teradataml/lib/libaed_0_1.dylib +0 -0
  124. teradataml/lib/libaed_0_1.so +0 -0
  125. teradataml/libaed_0_1.dylib +0 -0
  126. teradataml/libaed_0_1.so +0 -0
  127. teradataml/opensource/__init__.py +1 -0
  128. teradataml/opensource/sklearn/__init__.py +1 -0
  129. teradataml/opensource/sklearn/_class.py +255 -0
  130. teradataml/opensource/sklearn/_sklearn_wrapper.py +1668 -0
  131. teradataml/opensource/sklearn/_wrapper_utils.py +268 -0
  132. teradataml/opensource/sklearn/constants.py +54 -0
  133. teradataml/options/__init__.py +3 -6
  134. teradataml/options/configure.py +21 -20
  135. teradataml/scriptmgmt/UserEnv.py +61 -5
  136. teradataml/scriptmgmt/lls_utils.py +135 -53
  137. teradataml/table_operators/Apply.py +38 -6
  138. teradataml/table_operators/Script.py +45 -308
  139. teradataml/table_operators/TableOperator.py +182 -591
  140. teradataml/table_operators/__init__.py +0 -1
  141. teradataml/table_operators/table_operator_util.py +32 -40
  142. teradataml/utils/validators.py +127 -3
  143. {teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/METADATA +243 -3
  144. {teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/RECORD +147 -391
  145. teradataml/analytics/mle/AdaBoost.py +0 -651
  146. teradataml/analytics/mle/AdaBoostPredict.py +0 -564
  147. teradataml/analytics/mle/Antiselect.py +0 -342
  148. teradataml/analytics/mle/Arima.py +0 -641
  149. teradataml/analytics/mle/ArimaPredict.py +0 -477
  150. teradataml/analytics/mle/Attribution.py +0 -1070
  151. teradataml/analytics/mle/Betweenness.py +0 -658
  152. teradataml/analytics/mle/Burst.py +0 -711
  153. teradataml/analytics/mle/CCM.py +0 -600
  154. teradataml/analytics/mle/CCMPrepare.py +0 -324
  155. teradataml/analytics/mle/CFilter.py +0 -460
  156. teradataml/analytics/mle/ChangePointDetection.py +0 -572
  157. teradataml/analytics/mle/ChangePointDetectionRT.py +0 -477
  158. teradataml/analytics/mle/Closeness.py +0 -737
  159. teradataml/analytics/mle/ConfusionMatrix.py +0 -420
  160. teradataml/analytics/mle/Correlation.py +0 -477
  161. teradataml/analytics/mle/Correlation2.py +0 -573
  162. teradataml/analytics/mle/CoxHazardRatio.py +0 -679
  163. teradataml/analytics/mle/CoxPH.py +0 -556
  164. teradataml/analytics/mle/CoxSurvival.py +0 -478
  165. teradataml/analytics/mle/CumulativeMovAvg.py +0 -363
  166. teradataml/analytics/mle/DTW.py +0 -623
  167. teradataml/analytics/mle/DWT.py +0 -564
  168. teradataml/analytics/mle/DWT2D.py +0 -599
  169. teradataml/analytics/mle/DecisionForest.py +0 -716
  170. teradataml/analytics/mle/DecisionForestEvaluator.py +0 -363
  171. teradataml/analytics/mle/DecisionForestPredict.py +0 -561
  172. teradataml/analytics/mle/DecisionTree.py +0 -830
  173. teradataml/analytics/mle/DecisionTreePredict.py +0 -528
  174. teradataml/analytics/mle/ExponentialMovAvg.py +0 -418
  175. teradataml/analytics/mle/FMeasure.py +0 -402
  176. teradataml/analytics/mle/FPGrowth.py +0 -734
  177. teradataml/analytics/mle/FrequentPaths.py +0 -695
  178. teradataml/analytics/mle/GLM.py +0 -558
  179. teradataml/analytics/mle/GLML1L2.py +0 -547
  180. teradataml/analytics/mle/GLML1L2Predict.py +0 -519
  181. teradataml/analytics/mle/GLMPredict.py +0 -529
  182. teradataml/analytics/mle/HMMDecoder.py +0 -945
  183. teradataml/analytics/mle/HMMEvaluator.py +0 -901
  184. teradataml/analytics/mle/HMMSupervised.py +0 -521
  185. teradataml/analytics/mle/HMMUnsupervised.py +0 -572
  186. teradataml/analytics/mle/Histogram.py +0 -561
  187. teradataml/analytics/mle/IDWT.py +0 -476
  188. teradataml/analytics/mle/IDWT2D.py +0 -493
  189. teradataml/analytics/mle/IdentityMatch.py +0 -763
  190. teradataml/analytics/mle/Interpolator.py +0 -918
  191. teradataml/analytics/mle/KMeans.py +0 -485
  192. teradataml/analytics/mle/KNN.py +0 -627
  193. teradataml/analytics/mle/KNNRecommender.py +0 -488
  194. teradataml/analytics/mle/KNNRecommenderPredict.py +0 -581
  195. teradataml/analytics/mle/LAR.py +0 -439
  196. teradataml/analytics/mle/LARPredict.py +0 -478
  197. teradataml/analytics/mle/LDA.py +0 -548
  198. teradataml/analytics/mle/LDAInference.py +0 -492
  199. teradataml/analytics/mle/LDATopicSummary.py +0 -464
  200. teradataml/analytics/mle/LevenshteinDistance.py +0 -450
  201. teradataml/analytics/mle/LinReg.py +0 -433
  202. teradataml/analytics/mle/LinRegPredict.py +0 -438
  203. teradataml/analytics/mle/MinHash.py +0 -544
  204. teradataml/analytics/mle/Modularity.py +0 -587
  205. teradataml/analytics/mle/NEREvaluator.py +0 -410
  206. teradataml/analytics/mle/NERExtractor.py +0 -595
  207. teradataml/analytics/mle/NERTrainer.py +0 -458
  208. teradataml/analytics/mle/NGrams.py +0 -570
  209. teradataml/analytics/mle/NPath.py +0 -634
  210. teradataml/analytics/mle/NTree.py +0 -549
  211. teradataml/analytics/mle/NaiveBayes.py +0 -462
  212. teradataml/analytics/mle/NaiveBayesPredict.py +0 -513
  213. teradataml/analytics/mle/NaiveBayesTextClassifier.py +0 -607
  214. teradataml/analytics/mle/NaiveBayesTextClassifier2.py +0 -531
  215. teradataml/analytics/mle/NaiveBayesTextClassifierPredict.py +0 -799
  216. teradataml/analytics/mle/NamedEntityFinder.py +0 -529
  217. teradataml/analytics/mle/NamedEntityFinderEvaluator.py +0 -414
  218. teradataml/analytics/mle/NamedEntityFinderTrainer.py +0 -396
  219. teradataml/analytics/mle/POSTagger.py +0 -417
  220. teradataml/analytics/mle/Pack.py +0 -411
  221. teradataml/analytics/mle/PageRank.py +0 -535
  222. teradataml/analytics/mle/PathAnalyzer.py +0 -426
  223. teradataml/analytics/mle/PathGenerator.py +0 -367
  224. teradataml/analytics/mle/PathStart.py +0 -464
  225. teradataml/analytics/mle/PathSummarizer.py +0 -470
  226. teradataml/analytics/mle/Pivot.py +0 -471
  227. teradataml/analytics/mle/ROC.py +0 -425
  228. teradataml/analytics/mle/RandomSample.py +0 -637
  229. teradataml/analytics/mle/RandomWalkSample.py +0 -490
  230. teradataml/analytics/mle/SAX.py +0 -779
  231. teradataml/analytics/mle/SVMDense.py +0 -677
  232. teradataml/analytics/mle/SVMDensePredict.py +0 -536
  233. teradataml/analytics/mle/SVMDenseSummary.py +0 -437
  234. teradataml/analytics/mle/SVMSparse.py +0 -557
  235. teradataml/analytics/mle/SVMSparsePredict.py +0 -553
  236. teradataml/analytics/mle/SVMSparseSummary.py +0 -435
  237. teradataml/analytics/mle/Sampling.py +0 -549
  238. teradataml/analytics/mle/Scale.py +0 -565
  239. teradataml/analytics/mle/ScaleByPartition.py +0 -496
  240. teradataml/analytics/mle/ScaleMap.py +0 -378
  241. teradataml/analytics/mle/ScaleSummary.py +0 -320
  242. teradataml/analytics/mle/SentenceExtractor.py +0 -363
  243. teradataml/analytics/mle/SentimentEvaluator.py +0 -432
  244. teradataml/analytics/mle/SentimentExtractor.py +0 -578
  245. teradataml/analytics/mle/SentimentTrainer.py +0 -405
  246. teradataml/analytics/mle/SeriesSplitter.py +0 -641
  247. teradataml/analytics/mle/Sessionize.py +0 -475
  248. teradataml/analytics/mle/SimpleMovAvg.py +0 -397
  249. teradataml/analytics/mle/StringSimilarity.py +0 -425
  250. teradataml/analytics/mle/TF.py +0 -389
  251. teradataml/analytics/mle/TFIDF.py +0 -504
  252. teradataml/analytics/mle/TextChunker.py +0 -414
  253. teradataml/analytics/mle/TextClassifier.py +0 -399
  254. teradataml/analytics/mle/TextClassifierEvaluator.py +0 -413
  255. teradataml/analytics/mle/TextClassifierTrainer.py +0 -565
  256. teradataml/analytics/mle/TextMorph.py +0 -494
  257. teradataml/analytics/mle/TextParser.py +0 -623
  258. teradataml/analytics/mle/TextTagger.py +0 -530
  259. teradataml/analytics/mle/TextTokenizer.py +0 -502
  260. teradataml/analytics/mle/UnivariateStatistics.py +0 -488
  261. teradataml/analytics/mle/Unpack.py +0 -526
  262. teradataml/analytics/mle/Unpivot.py +0 -438
  263. teradataml/analytics/mle/VarMax.py +0 -776
  264. teradataml/analytics/mle/VectorDistance.py +0 -762
  265. teradataml/analytics/mle/WeightedMovAvg.py +0 -400
  266. teradataml/analytics/mle/XGBoost.py +0 -842
  267. teradataml/analytics/mle/XGBoostPredict.py +0 -627
  268. teradataml/analytics/mle/__init__.py +0 -123
  269. teradataml/analytics/mle/json/adaboost_mle.json +0 -135
  270. teradataml/analytics/mle/json/adaboostpredict_mle.json +0 -85
  271. teradataml/analytics/mle/json/antiselect_mle.json +0 -34
  272. teradataml/analytics/mle/json/antiselect_mle_mle.json +0 -34
  273. teradataml/analytics/mle/json/arima_mle.json +0 -172
  274. teradataml/analytics/mle/json/arimapredict_mle.json +0 -52
  275. teradataml/analytics/mle/json/attribution_mle_mle.json +0 -143
  276. teradataml/analytics/mle/json/betweenness_mle.json +0 -97
  277. teradataml/analytics/mle/json/burst_mle.json +0 -140
  278. teradataml/analytics/mle/json/ccm_mle.json +0 -124
  279. teradataml/analytics/mle/json/ccmprepare_mle.json +0 -14
  280. teradataml/analytics/mle/json/cfilter_mle.json +0 -93
  281. teradataml/analytics/mle/json/changepointdetection_mle.json +0 -92
  282. teradataml/analytics/mle/json/changepointdetectionrt_mle.json +0 -78
  283. teradataml/analytics/mle/json/closeness_mle.json +0 -104
  284. teradataml/analytics/mle/json/confusionmatrix_mle.json +0 -79
  285. teradataml/analytics/mle/json/correlation_mle.json +0 -86
  286. teradataml/analytics/mle/json/correlationreduce_mle.json +0 -49
  287. teradataml/analytics/mle/json/coxhazardratio_mle.json +0 -89
  288. teradataml/analytics/mle/json/coxph_mle.json +0 -98
  289. teradataml/analytics/mle/json/coxsurvival_mle.json +0 -79
  290. teradataml/analytics/mle/json/cumulativemovavg_mle.json +0 -34
  291. teradataml/analytics/mle/json/decisionforest_mle.json +0 -167
  292. teradataml/analytics/mle/json/decisionforestevaluator_mle.json +0 -33
  293. teradataml/analytics/mle/json/decisionforestpredict_mle_mle.json +0 -74
  294. teradataml/analytics/mle/json/decisiontree_mle.json +0 -194
  295. teradataml/analytics/mle/json/decisiontreepredict_mle_mle.json +0 -86
  296. teradataml/analytics/mle/json/dtw_mle.json +0 -97
  297. teradataml/analytics/mle/json/dwt2d_mle.json +0 -116
  298. teradataml/analytics/mle/json/dwt_mle.json +0 -101
  299. teradataml/analytics/mle/json/exponentialmovavg_mle.json +0 -55
  300. teradataml/analytics/mle/json/fmeasure_mle.json +0 -58
  301. teradataml/analytics/mle/json/fpgrowth_mle.json +0 -159
  302. teradataml/analytics/mle/json/frequentpaths_mle.json +0 -129
  303. teradataml/analytics/mle/json/glm_mle.json +0 -111
  304. teradataml/analytics/mle/json/glml1l2_mle.json +0 -106
  305. teradataml/analytics/mle/json/glml1l2predict_mle.json +0 -57
  306. teradataml/analytics/mle/json/glmpredict_mle_mle.json +0 -74
  307. teradataml/analytics/mle/json/histogram_mle.json +0 -100
  308. teradataml/analytics/mle/json/hmmdecoder_mle.json +0 -192
  309. teradataml/analytics/mle/json/hmmevaluator_mle.json +0 -206
  310. teradataml/analytics/mle/json/hmmsupervised_mle.json +0 -91
  311. teradataml/analytics/mle/json/hmmunsupervised_mle.json +0 -114
  312. teradataml/analytics/mle/json/identitymatch_mle.json +0 -88
  313. teradataml/analytics/mle/json/idwt2d_mle.json +0 -73
  314. teradataml/analytics/mle/json/idwt_mle.json +0 -66
  315. teradataml/analytics/mle/json/interpolator_mle.json +0 -151
  316. teradataml/analytics/mle/json/kmeans_mle.json +0 -97
  317. teradataml/analytics/mle/json/knn_mle.json +0 -141
  318. teradataml/analytics/mle/json/knnrecommender_mle.json +0 -111
  319. teradataml/analytics/mle/json/knnrecommenderpredict_mle.json +0 -75
  320. teradataml/analytics/mle/json/lar_mle.json +0 -78
  321. teradataml/analytics/mle/json/larpredict_mle.json +0 -69
  322. teradataml/analytics/mle/json/lda_mle.json +0 -130
  323. teradataml/analytics/mle/json/ldainference_mle.json +0 -78
  324. teradataml/analytics/mle/json/ldatopicsummary_mle.json +0 -64
  325. teradataml/analytics/mle/json/levenshteindistance_mle.json +0 -92
  326. teradataml/analytics/mle/json/linreg_mle.json +0 -42
  327. teradataml/analytics/mle/json/linregpredict_mle.json +0 -56
  328. teradataml/analytics/mle/json/minhash_mle.json +0 -113
  329. teradataml/analytics/mle/json/modularity_mle.json +0 -91
  330. teradataml/analytics/mle/json/naivebayespredict_mle_mle.json +0 -85
  331. teradataml/analytics/mle/json/naivebayesreduce_mle.json +0 -52
  332. teradataml/analytics/mle/json/naivebayestextclassifierpredict_mle_mle.json +0 -147
  333. teradataml/analytics/mle/json/naivebayestextclassifiertrainer2_mle.json +0 -108
  334. teradataml/analytics/mle/json/naivebayestextclassifiertrainer_mle.json +0 -102
  335. teradataml/analytics/mle/json/namedentityfinder_mle.json +0 -84
  336. teradataml/analytics/mle/json/namedentityfinderevaluatorreduce_mle.json +0 -43
  337. teradataml/analytics/mle/json/namedentityfindertrainer_mle.json +0 -64
  338. teradataml/analytics/mle/json/nerevaluator_mle.json +0 -54
  339. teradataml/analytics/mle/json/nerextractor_mle.json +0 -87
  340. teradataml/analytics/mle/json/nertrainer_mle.json +0 -89
  341. teradataml/analytics/mle/json/ngrams_mle.json +0 -137
  342. teradataml/analytics/mle/json/ngramsplitter_mle_mle.json +0 -137
  343. teradataml/analytics/mle/json/npath@coprocessor_mle.json +0 -73
  344. teradataml/analytics/mle/json/ntree@coprocessor_mle.json +0 -123
  345. teradataml/analytics/mle/json/pack_mle.json +0 -58
  346. teradataml/analytics/mle/json/pack_mle_mle.json +0 -58
  347. teradataml/analytics/mle/json/pagerank_mle.json +0 -81
  348. teradataml/analytics/mle/json/pathanalyzer_mle.json +0 -63
  349. teradataml/analytics/mle/json/pathgenerator_mle.json +0 -40
  350. teradataml/analytics/mle/json/pathstart_mle.json +0 -62
  351. teradataml/analytics/mle/json/pathsummarizer_mle.json +0 -72
  352. teradataml/analytics/mle/json/pivoting_mle.json +0 -71
  353. teradataml/analytics/mle/json/postagger_mle.json +0 -51
  354. teradataml/analytics/mle/json/randomsample_mle.json +0 -131
  355. teradataml/analytics/mle/json/randomwalksample_mle.json +0 -85
  356. teradataml/analytics/mle/json/roc_mle.json +0 -73
  357. teradataml/analytics/mle/json/sampling_mle.json +0 -75
  358. teradataml/analytics/mle/json/sax_mle.json +0 -154
  359. teradataml/analytics/mle/json/scale_mle.json +0 -93
  360. teradataml/analytics/mle/json/scalebypartition_mle.json +0 -89
  361. teradataml/analytics/mle/json/scalemap_mle.json +0 -44
  362. teradataml/analytics/mle/json/scalesummary_mle.json +0 -14
  363. teradataml/analytics/mle/json/sentenceextractor_mle.json +0 -41
  364. teradataml/analytics/mle/json/sentimentevaluator_mle.json +0 -43
  365. teradataml/analytics/mle/json/sentimentextractor_mle.json +0 -100
  366. teradataml/analytics/mle/json/sentimenttrainer_mle.json +0 -68
  367. teradataml/analytics/mle/json/seriessplitter_mle.json +0 -133
  368. teradataml/analytics/mle/json/sessionize_mle_mle.json +0 -62
  369. teradataml/analytics/mle/json/simplemovavg_mle.json +0 -48
  370. teradataml/analytics/mle/json/stringsimilarity_mle.json +0 -50
  371. teradataml/analytics/mle/json/stringsimilarity_mle_mle.json +0 -50
  372. teradataml/analytics/mle/json/svmdense_mle.json +0 -165
  373. teradataml/analytics/mle/json/svmdensepredict_mle.json +0 -95
  374. teradataml/analytics/mle/json/svmdensesummary_mle.json +0 -58
  375. teradataml/analytics/mle/json/svmsparse_mle.json +0 -148
  376. teradataml/analytics/mle/json/svmsparsepredict_mle_mle.json +0 -103
  377. teradataml/analytics/mle/json/svmsparsesummary_mle.json +0 -57
  378. teradataml/analytics/mle/json/textchunker_mle.json +0 -40
  379. teradataml/analytics/mle/json/textclassifier_mle.json +0 -51
  380. teradataml/analytics/mle/json/textclassifierevaluator_mle.json +0 -43
  381. teradataml/analytics/mle/json/textclassifiertrainer_mle.json +0 -103
  382. teradataml/analytics/mle/json/textmorph_mle.json +0 -63
  383. teradataml/analytics/mle/json/textparser_mle.json +0 -166
  384. teradataml/analytics/mle/json/texttagger_mle.json +0 -81
  385. teradataml/analytics/mle/json/texttokenizer_mle.json +0 -91
  386. teradataml/analytics/mle/json/tf_mle.json +0 -33
  387. teradataml/analytics/mle/json/tfidf_mle.json +0 -34
  388. teradataml/analytics/mle/json/univariatestatistics_mle.json +0 -81
  389. teradataml/analytics/mle/json/unpack_mle.json +0 -91
  390. teradataml/analytics/mle/json/unpack_mle_mle.json +0 -91
  391. teradataml/analytics/mle/json/unpivoting_mle.json +0 -63
  392. teradataml/analytics/mle/json/varmax_mle.json +0 -176
  393. teradataml/analytics/mle/json/vectordistance_mle.json +0 -179
  394. teradataml/analytics/mle/json/weightedmovavg_mle.json +0 -48
  395. teradataml/analytics/mle/json/xgboost_mle.json +0 -178
  396. teradataml/analytics/mle/json/xgboostpredict_mle.json +0 -104
  397. teradataml/analytics/sqle/Antiselect.py +0 -321
  398. teradataml/analytics/sqle/Attribution.py +0 -603
  399. teradataml/analytics/sqle/DecisionForestPredict.py +0 -408
  400. teradataml/analytics/sqle/GLMPredict.py +0 -430
  401. teradataml/analytics/sqle/MovingAverage.py +0 -543
  402. teradataml/analytics/sqle/NGramSplitter.py +0 -548
  403. teradataml/analytics/sqle/NPath.py +0 -632
  404. teradataml/analytics/sqle/NaiveBayesTextClassifierPredict.py +0 -515
  405. teradataml/analytics/sqle/Pack.py +0 -388
  406. teradataml/analytics/sqle/SVMSparsePredict.py +0 -464
  407. teradataml/analytics/sqle/Sessionize.py +0 -390
  408. teradataml/analytics/sqle/StringSimilarity.py +0 -400
  409. teradataml/analytics/sqle/Unpack.py +0 -503
  410. teradataml/analytics/sqle/json/antiselect_sqle.json +0 -21
  411. teradataml/analytics/sqle/json/attribution_sqle.json +0 -92
  412. teradataml/analytics/sqle/json/decisionforestpredict_sqle.json +0 -48
  413. teradataml/analytics/sqle/json/glmpredict_sqle.json +0 -48
  414. teradataml/analytics/sqle/json/h2opredict_sqle.json +0 -63
  415. teradataml/analytics/sqle/json/movingaverage_sqle.json +0 -58
  416. teradataml/analytics/sqle/json/naivebayestextclassifierpredict_sqle.json +0 -76
  417. teradataml/analytics/sqle/json/ngramsplitter_sqle.json +0 -126
  418. teradataml/analytics/sqle/json/npath_sqle.json +0 -67
  419. teradataml/analytics/sqle/json/pack_sqle.json +0 -47
  420. teradataml/analytics/sqle/json/pmmlpredict_sqle.json +0 -55
  421. teradataml/analytics/sqle/json/sessionize_sqle.json +0 -43
  422. teradataml/analytics/sqle/json/stringsimilarity_sqle.json +0 -39
  423. teradataml/analytics/sqle/json/svmsparsepredict_sqle.json +0 -74
  424. teradataml/analytics/sqle/json/unpack_sqle.json +0 -80
  425. teradataml/catalog/model_cataloging.py +0 -980
  426. teradataml/config/mlengine_alias_definitions_v1.0 +0 -118
  427. teradataml/config/mlengine_alias_definitions_v1.1 +0 -127
  428. teradataml/config/mlengine_alias_definitions_v1.3 +0 -129
  429. teradataml/table_operators/sandbox_container_util.py +0 -643
  430. {teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/WHEEL +0 -0
  431. {teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/top_level.txt +0 -0
  432. {teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/zip-safe +0 -0
teradataml/LICENSE-3RD-PARTY.pdf CHANGED
Binary file
teradataml/LICENSE.pdf CHANGED
Binary file
teradataml/README.md CHANGED
@@ -6,7 +6,7 @@ For community support, please visit the [Teradata Community](https://support.ter
 
 For Teradata customer support, please visit [Teradata Support](https://support.teradata.com/csm).
 
- Copyright 2023, Teradata. All Rights Reserved.
+ Copyright 2024, Teradata. All Rights Reserved.
 
 ### Table of Contents
 * [Release Notes](#release-notes)
@@ -16,6 +16,243 @@ Copyright 2023, Teradata. All Rights Reserved.
 * [License](#license)
 
 ## Release Notes:
+ #### teradataml 20.00.00.00
+ * ##### New Features/Functionality
+ * ###### teradataml OpenML: Run Opensource packages through Teradata Vantage
+ `OpenML` dynamically exposes opensource packages through Teradata Vantage. `OpenML` provides an
+ interface object through which exposed classes and functions of opensource packages can be accessed
+ with the same syntax and arguments.
+ The following functionality is added in the current release:
+ * `td_sklearn` - Interface object to run scikit-learn functions and classes through Teradata Vantage.
+ Example usage below:
+ ```
+ from teradataml import td_sklearn, DataFrame
+
+ df_train = DataFrame("multi_model_classification")
+
+ feature_columns = ["col1", "col2", "col3", "col4"]
+ label_columns = ["label"]
+ part_columns = ["partition_column_1", "partition_column_2"]
+
+ linear_svc = td_sklearn.LinearSVC()
+ ```
+ * `OpenML` is supported in both Teradata Vantage Enterprise and Teradata Vantage Lake.
+ * Argument Support:
+ * `Use of X and y arguments` - Scikit-learn users are familiar with using `X` and `y` as argument names,
+ which take data as pandas DataFrames, numpy arrays, lists, etc. However, in OpenML, teradataml
+ DataFrames are passed for the arguments `X` and `y`.
+ ```
+ df_x = df_train.select(feature_columns)
+ df_y = df_train.select(label_columns)
+
+ linear_svc = linear_svc.fit(X=df_x, y=df_y)
+ ```
+ * `Additional support for data, feature_columns, label_columns and group_columns arguments` -
+ Apart from the traditional arguments, OpenML supports additional arguments - `data`,
+ `feature_columns`, `label_columns` and `group_columns`. These are used as alternatives to `X`, `y`
+ and `groups`.
+ ```
+ linear_svc = linear_svc.fit(data=df_train, feature_columns=feature_columns, label_columns=label_columns)
+ ```
+ * `Support for classification and regression metrics` - Metrics functions for classification and
+ regression in the `sklearn.metrics` module are supported. Support for other metrics functions will be
+ added in future releases.
+ * `Distributed Modeling and partition_columns argument support` - Existing scikit-learn supports
+ only single model generation. However, OpenML supports both the single model use case and the
+ distributed (multi) model use case. For this, the user additionally passes the `partition_columns`
+ argument to the existing `fit()`, `predict()` or any other function to be run. This generates one
+ model per partition, using the data in the corresponding partition.
+ ```
+ df_x_1 = df_train.select(feature_columns + part_columns)
+ linear_svc = linear_svc.fit(X=df_x_1, y=df_y, partition_columns=part_columns)
+ ```
+ * `Support for load and deploy models` - OpenML provides additional support for saving (deploying) the
+ trained models. These models can be loaded later to perform operations like prediction, scoring, etc. The
+ following functions are provided by OpenML:
+ * `<obj>.deploy()` - Used to deploy/save the model created and/or trained by OpenML.
+ * `td_sklearn.deploy()` - Used to deploy/save the model created and/or trained outside teradataml.
+ * `td_sklearn.load()` - Used to load the saved models.
+
+ <br>Refer to the Teradata Python Package User Guide for more details on this feature: arguments, usage, examples, and supportability in both VantageCloud Enterprise and VantageCloud Lake.
+
+ * ###### teradataml: AutoML - Automated end-to-end Machine Learning flow.
+ AutoML is an approach to automate the process of building, training, and validating machine learning models.
+ It involves automation of various aspects of the machine learning workflow, such as feature exploration,
+ feature engineering, data preparation, model training and evaluation for a given dataset.
+ The teradataml AutoML feature offers best model identification, model leaderboard generation, parallel execution,
+ early stopping, model evaluation, model prediction, live logging, and customization of the default process.
+ * `AutoML`
+ AutoML is a generic algorithm that supports all three tasks, i.e. 'Regression',
+ 'Binary Classification' and 'Multiclass Classification'.
+ * Methods of AutoML
+ * `__init__()` - Instantiate an object of AutoML with given parameters.
+ * `fit()` - Perform fit on specified data and target column.
+ * `leaderboard()` - Get the leaderboard for the AutoML. Presents diverse models, feature
+ selection method, and performance metrics.
+ * `leader()` - Show the best performing model and its details, such as feature
+ selection method and performance metrics.
+ * `predict()` - Perform prediction on the data using the best model or the model of the user's
+ choice from the leaderboard.
+ * `generate_custom_config()` - Generate the custom config JSON file required for a customized
+ run of AutoML.
+ * `AutoRegressor`
+ AutoRegressor is a special purpose AutoML feature to run regression specific tasks.
+ * Methods of AutoRegressor
+ * `__init__()` - Instantiate an object of AutoRegressor with given parameters.
+ * `fit()` - Perform fit on specified data and target column.
+ * `leaderboard()` - Get the leaderboard for the AutoRegressor. Presents diverse models, feature
+ selection method, and performance metrics.
+ * `leader()` - Show the best performing model and its details, such as feature
+ selection method and performance metrics.
+ * `predict()` - Perform prediction on the data using the best model or the model of the user's
+ choice from the leaderboard.
+ * `generate_custom_config()` - Generate the custom config JSON file required for a customized
+ run of AutoRegressor.
+ * `AutoClassifier`
+ AutoClassifier is a special purpose AutoML feature to run classification specific tasks.
+ * Methods of AutoClassifier
+ * `__init__()` - Instantiate an object of AutoClassifier with given parameters.
+ * `fit()` - Perform fit on specified data and target column.
+ * `leaderboard()` - Get the leaderboard for the AutoClassifier. Presents diverse models, feature
+ selection method, and performance metrics.
+ * `leader()` - Show the best performing model and its details, such as feature
+ selection method and performance metrics.
+ * `predict()` - Perform prediction on the data using the best model or the model of the user's
+ choice from the leaderboard.
+ * `generate_custom_config()` - Generate the custom config JSON file required for a customized
+ run of AutoClassifier.
+
+ * ###### teradataml: DataFrame
+ * `fillna` - Replace the null values in a column with the value specified.
+ * Data Manipulation
+ * `cube()` - Analyzes data by grouping it into multiple dimensions.
+ * `rollup()` - Analyzes a set of data across a single dimension with more than one level of detail.
+ * `replace()` - Replaces the values for columns.
+
+ * ###### teradataml: Script and Apply
+ * `deploy()` - Deploys the model generated after `execute_script()` in the database or in a user
+ environment in lake. The function is available in both Script and Apply.
+
+ * ###### teradataml: DataFrameColumn
+ * `fillna` - Replaces every occurrence of a null value in the column with the value specified.
+
+ * ###### teradataml DataFrameColumn a.k.a. ColumnExpression
+ * _Date Time Functions_
+ * `DataFrameColumn.week_start()` - Returns the first date or timestamp of the week that begins immediately before the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.week_begin()` - An alias for the `DataFrameColumn.week_start()` function.
+ * `DataFrameColumn.week_end()` - Returns the last date or timestamp of the week that ends immediately after the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.month_start()` - Returns the first date or timestamp of the month that begins immediately before the specified date or timestamp value in a column or as a literal.
+ * `DataFrameColumn.month_begin()` - An alias for the `DataFrameColumn.month_start()` function.
+ * `DataFrameColumn.month_end()` - Returns the last date or timestamp of the month that ends immediately after the specified date or timestamp value in a column or as a literal.
+ * `DataFrameColumn.year_start()` - Returns the first date or timestamp of the year that begins immediately before the specified date or timestamp value in a column or as a literal.
+ * `DataFrameColumn.year_begin()` - An alias for the `DataFrameColumn.year_start()` function.
+ * `DataFrameColumn.year_end()` - Returns the last date or timestamp of the year that ends immediately after the specified date or timestamp value in a column or as a literal.
+ * `DataFrameColumn.quarter_start()` - Returns the first date or timestamp of the quarter that begins immediately before the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.quarter_begin()` - An alias for the `DataFrameColumn.quarter_start()` function.
+ * `DataFrameColumn.quarter_end()` - Returns the last date or timestamp of the quarter that ends immediately after the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.last_sunday()` - Returns the date or timestamp of Sunday that falls immediately before the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.last_monday()` - Returns the date or timestamp of Monday that falls immediately before the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.last_tuesday()` - Returns the date or timestamp of Tuesday that falls immediately before the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.last_wednesday()` - Returns the date or timestamp of Wednesday that falls immediately before the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.last_thursday()` - Returns the date or timestamp of Thursday that falls immediately before the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.last_friday()` - Returns the date or timestamp of Friday that falls immediately before the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.last_saturday()` - Returns the date or timestamp of Saturday that falls immediately before the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.day_of_week()` - Returns the number of days from the beginning of the week to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.day_of_month()` - Returns the number of days from the beginning of the month to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.day_of_year()` - Returns the number of days from the beginning of the year to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.day_of_calendar()` - Returns the number of days from the beginning of the business calendar to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.week_of_month()` - Returns the number of weeks from the beginning of the month to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.week_of_quarter()` - Returns the number of weeks from the beginning of the quarter to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.week_of_year()` - Returns the number of weeks from the beginning of the year to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.week_of_calendar()` - Returns the number of weeks from the beginning of the calendar to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.month_of_year()` - Returns the number of months from the beginning of the year to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.month_of_calendar()` - Returns the number of months from the beginning of the calendar to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.month_of_quarter()` - Returns the number of months from the beginning of the quarter to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.quarter_of_year()` - Returns the number of quarters from the beginning of the year to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.quarter_of_calendar()` - Returns the number of quarters from the beginning of the calendar to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.year_of_calendar()` - Returns the year of the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.day_occurrence_of_month()` - Returns the nth occurrence of the weekday in the month for the date to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.year()` - Returns the integer value for year in the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.month()` - Returns the integer value for month in the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.hour()` - Returns the integer value for hour in the specified timestamp value in a column as a literal.
+ * `DataFrameColumn.minute()` - Returns the integer value for minute in the specified timestamp value in a column as a literal.
+ * `DataFrameColumn.second()` - Returns the integer value for seconds in the specified timestamp value in a column as a literal.
+ * `DataFrameColumn.week()` - Returns the number of weeks from the beginning of the year to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.next_day()` - Returns the date of the first weekday specified as 'day_value' that is later than the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.months_between()` - Returns the number of months between the value in the specified date or timestamp value in a column as a literal and the date or timestamp value in the argument.
+ * `DataFrameColumn.add_months()` - Adds an integer number of months to the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.oadd_months()` - Adds an integer number of months, date or timestamp value in the specified date or timestamp value in a column as a literal.
+ * `DataFrameColumn.to_date()` - Converts a string-like representation of a DATE or PERIOD type to Date type.
+ * _String Functions_
+ * `DataFrameColumn.concat()` - Function to concatenate the columns with a separator.
+ * `DataFrameColumn.like()` - Function to match the string pattern. String match is case sensitive.
+ * `DataFrameColumn.ilike()` - Function to match the string pattern. String match is not case sensitive.
+ * `DataFrameColumn.substr()` - Returns the substring from a string column.
+ * `DataFrameColumn.startswith()` - Function to check if the column value starts with the specified value or not.
+ * `DataFrameColumn.endswith()` - Function to check if the column value ends with the specified value or not.
+ * `DataFrameColumn.format()` - Function to format the values in the column based on a formatter.
+ * `DataFrameColumn.to_char()` - Converts numeric type or date type to character type.
+ * `DataFrameColumn.trim()` - Trims the string values in the column.
+ * _Regular Arithmetic Functions_
+ * `DataFrameColumn.cbrt()` - Computes the cube root of values in the column.
+ * `DataFrameColumn.hex()` - Computes the hexadecimal from decimal for the values in the column.
+ * `DataFrameColumn.hypot()` - Computes the hypotenuse for the values between two columns.
+ * `DataFrameColumn.unhex()` - Computes the decimal from hexadecimal for the values in the column.
+ * _Bit Byte Manipulation Functions_
+ * `DataFrameColumn.from_byte()` - Encodes a sequence of bits into a sequence of characters.
+ * _Comparison Functions_
+ * `DataFrameColumn.greatest()` - Returns the greatest values from columns.
+ * `DataFrameColumn.least()` - Returns the least values from columns.
+ * Behaviour of `DataFrameColumn.replace()` is changed.
+ * Behaviour of `DataFrameColumn.to_byte()` is changed. It now decodes a sequence of characters in a given encoding into a sequence of bits.
+ * Behaviour of `DataFrameColumn.trunc()` is changed. It now accepts Date type columns.
+
+ * ##### Bug Fixes
+ * Argument `url_encode` is no longer used in `create_context()` and is deprecated.
+ * **Important notes**
+ * Users do not need to encode the password even if it contains special characters.
+ * Pass the password to the `create_context()` function argument `password` as is, without changing special characters.
+ * `fillna()` in VAL transformations now allows replacing NULL values with an empty string.
+
+ * ##### Updates
+ * Support for the following deprecated functionality is removed:
+ * ML Engine functions
+ * STO and APPLY sandbox feature support for testing the script.
+ * `sandbox_container_util` is removed. The following methods can no longer be used:
+ * `setup_sandbox_env()`
+ * `copy_files_from_container()`
+ * `cleanup_sandbox_env()`
+ * Model Cataloging APIs can no longer be used:
+ * `describe_model()`
+ * `delete_model()`
+ * `list_models()`
+ * `publish_model()`
+ * `retrieve_model()`
+ * `save_model()`
+ * `DataFrame.join()`
+ * Arguments `lsuffix` and `rsuffix` now add suffixes to new column names for the join operation.
+ * `DataFrame.describe()`
+ * New argument `columns` is added to generate statistics on only those columns instead of all applicable columns.
+ * `DataFrame.groupby()`
+ * Supports `CUBE` and `ROLLUP` with the additional optional argument `option`.
+ * `DataFrame.column.window()`
+ * Supports ColumnExpressions for the `partition_columns` and `order_columns` arguments.
+ * `DataFrame.column.contains()` allows ColumnExpressions for the `pattern` argument.
+ * `DataFrame.window()`
+ * Supports ColumnExpressions for the `partition_columns` and `order_columns` arguments.
+
+ #### teradataml 17.20.00.07
+ * ##### New Features/Functionality
+ * ###### Open Analytics Framework (OpenAF) APIs:
+ * Manage all user environments.
+ * `create_env()`:
+ * New argument `conda_env` is added to create a conda environment.
+ * `list_user_envs()`:
+ * Users can list conda environments by filtering with the new argument `conda_env`.
+ * Conda environments can be managed using APIs for installing, updating, and removing files/libraries.
+ * ##### Bug Fixes
+ * The `columns` argument for the `FillNa` function is made optional.
+
 #### teradataml 17.20.00.06
 * ##### New Features/Functionality
 * ###### teradataml DataFrameColumn a.k.a. ColumnExpression
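Putting the OpenML items from the release notes together, a complete round trip could look like the sketch below. It is illustrative only: it reuses the DataFrames and column names from the release-note snippets, and the `model_name` keyword passed to `deploy()`/`load()` (as well as whether `predict()` needs `partition_columns` again) is an assumption to verify against the Teradata Python Package User Guide rather than a documented signature.

```
from teradataml import td_sklearn, DataFrame

df_train = DataFrame("multi_model_classification")
feature_columns = ["col1", "col2", "col3", "col4"]
label_columns = ["label"]
part_columns = ["partition_column_1", "partition_column_2"]

df_x = df_train.select(feature_columns + part_columns)
df_y = df_train.select(label_columns)

# One model per partition: passing partition_columns triggers the distributed
# (multi-model) code path described in the release notes.
linear_svc = td_sklearn.LinearSVC()
linear_svc = linear_svc.fit(X=df_x, y=df_y, partition_columns=part_columns)

# Score rows with the per-partition models.
predictions = linear_svc.predict(X=df_x, partition_columns=part_columns)

# Persist the trained object and load it back later; "model_name" is an
# assumed keyword, check the User Guide for the exact signature.
linear_svc.deploy(model_name="linear_svc_demo")
restored = td_sklearn.load(model_name="linear_svc_demo")
```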
teradataml/__init__.py CHANGED
@@ -7,7 +7,6 @@ from teradataml.dbutils.filemgr import *
 from teradataml.dataframe.copy_to import *
 from teradataml.dataframe.fastload import fastload
 from teradataml.data.load_example_data import *
- from teradataml.catalog.model_cataloging import *
 from teradataml.catalog.byom import *
 from teradataml.dataframe.data_transfer import fastexport, read_csv
 
@@ -16,7 +15,6 @@ from teradataml.dataframe.sql_functions import *
 
 # import Analytical Function to User's workspace.
 from teradataml.analytics.byom import *
- from teradataml.analytics.mle import *
 from teradataml.analytics.sqle import *
 from teradataml.analytics.table_operator import *
 from teradataml.analytics.uaf import *
@@ -45,7 +43,6 @@ __version__ = v.version
 # Import Table Operator to User's workspace.
 from teradataml.table_operators.Script import *
 from teradataml.table_operators.Apply import *
- from teradataml.table_operators.sandbox_container_util import *
 
 # Import Geospatial APIs, modules
 from teradataml.geospatial import *
@@ -58,3 +55,16 @@ from teradataml.scriptmgmt import *
 
 # Import utility functions.
 from teradataml.utils.utils import execute_sql, async_run_status
+
+ import os
+ _TDML_DIRECTORY = os.path.dirname(v.__file__)
+
+ from teradataml.opensource import *
+
+ # Import AutoML
+ from teradataml.automl import AutoML, AutoRegressor, AutoClassifier
+
+
+ # Configure app name and app version for querybands
+ from teradatasqlalchemy.telemetry.queryband import session_queryband
+ session_queryband.configure_queryband_parameters(app_name="TDML", app_version=__version__)
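The `teradataml.automl` import added above is what makes the AutoML classes described in the release notes available at the top level. A minimal, illustrative `AutoClassifier` run is sketched below; the `fit()` keyword names (`data`, `target_column`) are assumptions based on the release-note description ("perform fit on specified data and target column"), so the exact signatures should be checked in the User Guide.

```
from teradataml import AutoClassifier, DataFrame

df_train = DataFrame("multi_model_classification")

# Default settings; the release notes list __init__, fit, leaderboard,
# leader, predict and generate_custom_config as the public methods.
aclf = AutoClassifier()

# Argument names here are assumed from the release notes, not verified.
aclf.fit(data=df_train, target_column="label")

print(aclf.leaderboard())            # ranked models, feature selection method, metrics
print(aclf.leader())                 # best-performing model only
predictions = aclf.predict(data=df_train)
```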
teradataml/_version.py CHANGED
@@ -8,4 +8,4 @@
 #
 # ##################################################################
 
- version = "17.20.00.06"
+ version = "20.00.00.00"
teradataml/analytics/Transformations.py CHANGED
@@ -209,7 +209,7 @@ class FillNa(_Transformations):
 Types: teradataml DataFrame, bool, int, str, float, datetime.date
 
 columns:
- Required Argument.
+ Optional Argument.
 Specifies the names of the columns.
 Types: str or list of str
 
@@ -484,7 +484,7 @@ class FillNa(_Transformations):
 >>>
 """
 # Call super()
- super().__init__(columns=columns, out_columns=out_columns, datatype=datatype, columns_optional=False)
+ super().__init__(columns=columns, out_columns=out_columns, datatype=datatype, columns_optional=True)
 # Initialize style and value as data members.
 self.style = style
 self.value = value
@@ -557,8 +557,8 @@ class FillNa(_Transformations):
 
 nullstyle_args = self.style.lower()
 if self.style.upper() in ["LITERAL", "IMPUTED"]:
- nullstyle_args = "{}, {}".format(self.style.lower(), self.value)
-
+ nullstyle_args = "{}, {}".format(self.style.lower(), '\'\'\'\'' if isinstance(self.value, str) and len(
+ self.value) == 0 else self.value)
 return nullstyle_fmt.format(nullstyle_args)
 
 def _val_sql_syntax(self):
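These two FillNa changes back the release-note items about the optional `columns` argument and empty-string replacement in VAL transformations. A sketch of how that surfaces to users, assuming the usual `valib.Transform()` entry point and a hypothetical table name:

```
from teradataml import DataFrame, FillNa, valib

df = DataFrame("customer_comments")   # hypothetical table with NULLs in a VARCHAR column

# An empty string is now accepted as the literal replacement value, and
# "columns" may be omitted (columns_optional=True in the hunk above).
fillna_blank = FillNa(style="literal", value="", columns="comments")

transformed = valib.Transform(data=df, fillna=fillna_blank)
print(transformed.result)
```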
teradataml/analytics/__init__.py CHANGED
@@ -14,7 +14,6 @@ based on the json data and attach it to teradataml.
 and function _get_executor_class_name, Internal function to get executor class name for function_type provided.
 """
 from .byom import *
- from .mle import *
 from .sqle import *
 from .table_operator import *
 from .uaf import *
@@ -24,7 +23,6 @@ from .Transformations import Binning, Derive, OneHotEncoder, FillNa, LabelEncode
 from teradataml.analytics.json_parser.utils import _get_json_data_from_tdml_repo, _process_paired_functions
 from teradataml.analytics.analytic_function_executor import _SQLEFunctionExecutor, _TableOperatorExecutor,\
 _UAFFunctionExecutor, _BYOMFunctionExecutor
- import sys
 from teradataml.common.constants import TeradataAnalyticFunctionTypes
 
 
teradataml/analytics/analytic_function_executor.py CHANGED
@@ -29,6 +29,7 @@ from teradataml.common.wrapper_utils import AnalyticsWrapperUtils
 from teradataml.common.utils import UtilFuncs
 from teradataml.context.context import _get_context_temp_databasename
 from teradataml.table_operators.table_operator_query_generator import TableOperatorQueryGenerator
+ from teradatasqlalchemy.telemetry.queryband import collect_queryband
 from teradataml.utils.dtypes import _ListOf
 from teradataml.utils.validators import _Validators
 
@@ -150,6 +151,7 @@ class _AnlyticFunctionExecutor:
 # Validate the function arguments.
 _Validators._validate_function_arguments([argument_info])
 
+ @collect_queryband(attr="func_name")
 def _execute_query(self, persist=False, volatile=False):
 """
 DESCRIPTION:
@@ -1906,6 +1908,7 @@ class _UAFFunctionExecutor(_SQLEFunctionExecutor):
 self.__process_individual_argument(output_fmt_argument,
 **kwargs))
 
+ @collect_queryband(attr="func_name")
 def _execute_query(self, persist=False, volatile=None):
 """
 DESCRIPTION:
teradataml/analytics/json_parser/utils.py CHANGED
@@ -551,26 +551,27 @@ class _KNNPredict:
 
 res = KNN_out.evaluate(test_data=computers_train1_encoded.result.iloc[10:])
 """
- # response_column is required when the model_type is classification or regression.
- # accumulate is optional in case user specifies accumulate then consider the value specified by the user,
- # else consider the value specified for response_column.
-
 params = {"test_data": kwargs.get("test_data"),
 "id_column": self.id_column,
- "voting_weight": self.voting_weight,
- "k": self.k,
- "tolerance": self.tolerance,
- "output_prob": self.output_prob,
- "output_responses": self.output_responses,
- "emit_neighbors": self.emit_neighbors,
- "emit_distances": self.emit_distances,
 "train_data": self.train_data,
 "input_columns": self.input_columns,
- "model_type": self.model_type,
 "response_column": kwargs.get("response_column", self.response_column),
 "accumulate": kwargs.get("accumulate", kwargs.get("response_column", self.response_column)
 if getattr(self.obj, "accumulate") is None else self.accumulate)}
 
+ # KNN works in a different way. predict calls the same function with test data along with
+ # the arguments passed to the actual function. The above parameters are required
+ # arguments so we expect them to be available in output of KNN. However, the below
+ # ones are optional arguments. They can be available or not based on user input. So, before
+ # passing those to KNN again, check whether that argument is passed or not.
+ optional_args = ["model_type", "k", "voting_weight",
+ "tolerance", "output_prob", "output_responses",
+ "emit_neighbors", "emit_distances"]
+
+ for optional_arg in optional_args:
+ if hasattr(self, optional_arg):
+ params[optional_arg] = getattr(self, optional_arg)
+
 return getattr(module, "KNN")(**params)
 
 
teradataml/analytics/sqle/DecisionTreePredict.py CHANGED
@@ -26,7 +26,6 @@ from teradataml.common.messagecodes import MessageCodes
 from teradataml.common.constants import TeradataConstants
 from teradataml.dataframe.dataframe_utils import DataFrameUtils as df_utils
 from teradataml.options.display import display
- from teradataml.analytics.mle.DecisionTree import DecisionTree
 
 class DecisionTreePredict:
 
@@ -52,7 +51,7 @@ class DecisionTreePredict:
 object:
 Required Argument.
 Specifies the name of the teradataml DataFrame containing the output
- model from DecisionTree or instance of DecisionTree.
+ model from DecisionTree.
 
 object_order_column:
 Optional Argument.
@@ -132,40 +131,28 @@ class DecisionTreePredict:
 
 EXAMPLES:
 # Load the data to run the example.
- load_example_data("DecisionTreePredict", ["iris_attribute_train",
- "iris_response_train",
- "iris_attribute_test"])
-
+ load_example_data("DecisionTreePredict", ["iris_response_train",
+ "iris_attribute_test",
+ "iris_attribute_output"])
+
+
 # Create teradataml DataFrame.
 iris_attribute_test = DataFrame.from_table("iris_attribute_test")
- iris_attribute_train = DataFrame.from_table("iris_attribute_train")
 iris_response_train = DataFrame.from_table("iris_response_train")
-
+ iris_attribute_output = DataFrame.from_table("iris_attribute_output")
+
 # Example 1 -
- # First train the data, i.e., create a decision tree Model
- td_decision_tree_out = DecisionTree(attribute_name_columns = 'attribute',
- attribute_value_column = 'attrvalue',
- id_columns = 'pid',
- attribute_table = iris_attribute_train,
- response_table = iris_response_train,
- response_column = 'response',
- approx_splits = True,
- nodesize = 100,
- max_depth = 5,
- weighted = False,
- split_measure = "gini",
- output_response_probdist = False)
 
- # Run predict on the output of decision tree
+ # Run predict on the output of decision tree in iris_attribute_output
 decision_tree_predict_out = DecisionTreePredict(newdata=iris_attribute_test,
 newdata_partition_column='pid',
- object=td_decision_tree_out,
+ object=iris_attribute_output,
 attr_table_groupby_columns='attribute',
 attr_table_pid_columns='pid',
 attr_table_val_column='attrvalue',
- accumulate='pid',
- output_response_probdist=False,
- output_responses=['pid','attribute'])
+ accumulate='attribute',
+ output_response_probdist=True,
+ output_responses=['1', '2', '3'])
 
 # Print output dataframes
 print(decision_tree_predict_out.result)
@@ -227,9 +214,7 @@ class DecisionTreePredict:
 arguments, input argument and table types. Also processes the
 argument values.
 """
- if isinstance(self.object, DecisionTree):
- self.object = self.object._mlresults[0]
-
+
 # Make sure that a non-NULL value has been supplied for all mandatory arguments
 self.__awu._validate_missing_required_arguments(self.__arg_info_matrix)
 
@@ -238,7 +223,7 @@ class DecisionTreePredict:
 
 # Check to make sure input table types are strings or data frame objects or of valid type.
 self.__awu._validate_input_table_datatype(self.newdata, "newdata", None)
- self.__awu._validate_input_table_datatype(self.object, "object", DecisionTree)
+ self.__awu._validate_input_table_datatype(self.object, "object", DataFrame)
 
 # Check whether the input columns passed to the argument are not empty.
 # Also check whether the input columns passed to the argument valid or not.
teradataml/analytics/sqle/NaiveBayesPredict.py CHANGED
@@ -27,7 +27,6 @@ from teradataml.common.constants import TeradataConstants
 from teradataml.dataframe.dataframe_utils import DataFrameUtils as df_utils
 from teradataml.options.display import display
 from teradataml.common.formula import Formula
- from teradataml.analytics.mle.NaiveBayes import NaiveBayes
 
 class NaiveBayesPredict:
 
@@ -104,21 +103,20 @@ class NaiveBayesPredict:
 
 EXAMPLES:
 # Load the data to run the example
- load_example_data("NaiveBayesPredict",["nb_iris_input_test","nb_iris_input_train"])
-
+ load_example_data("NaiveBayesPredict",["nb_iris_input_test"])
+ load_example_data("teradataml","nbp_iris_model")
+
 # Create teradataml DataFrame objects.
- nb_iris_input_train = DataFrame.from_table("nb_iris_input_train")
 nb_iris_input_test = DataFrame.from_table("nb_iris_input_test")
-
+ nbp_iris_model = DataFrame.from_table("nbp_iris_model")
+
 # Example 1 -
- # Run the train function
- naivebayes_train = NaiveBayes(formula="species ~ petal_length + sepal_width + petal_width + sepal_length",
- data=nb_iris_input_train)
-
- # Generate prediction using output of train function
+
+ # Generate prediction using output of train stored in nbp_iris_model.
 naivebayes_predict_result = NaiveBayesPredict(newdata=nb_iris_input_test,
- modeldata = naivebayes_train,
+ modeldata = nbp_iris_model,
 id_col = "id",
+ formula="species ~ .",
 responses = ["virginica","setosa","versicolor"]
 )
 
@@ -174,14 +172,7 @@ class NaiveBayesPredict:
 arguments, input argument and table types. Also processes the
 argument values.
 """
- if isinstance(self.modeldata, NaiveBayes):
- self.formula = self.modeldata.formula
- self.modeldata = self.modeldata._mlresults[0]
- else:
- if self.formula is None:
- raise TeradataMlException(Messages.get_message(MessageCodes.MISSING_ARGS, "formula"),
- MessageCodes.MISSING_ARGS)
-
+
 # Make sure that a non-NULL value has been supplied for all mandatory arguments
 self.__awu._validate_missing_required_arguments(self.__arg_info_matrix)
 
@@ -190,7 +181,7 @@ class NaiveBayesPredict:
 
 # Check to make sure input table types are strings or data frame objects or of valid type.
 self.__awu._validate_input_table_datatype(self.newdata, "newdata", None)
- self.__awu._validate_input_table_datatype(self.modeldata, "modeldata", NaiveBayes)
+ self.__awu._validate_input_table_datatype(self.modeldata, "modeldata", None)
 
 # Check whether the input columns passed to the argument are not empty.
 # Also check whether the input columns passed to the argument valid or not.
teradataml/analytics/sqle/__init__.py CHANGED
@@ -1,18 +1,5 @@
- from teradataml.analytics.sqle.Antiselect import Antiselect
- from teradataml.analytics.sqle.Attribution import Attribution
- from teradataml.analytics.sqle.DecisionForestPredict import DecisionForestPredict
 from teradataml.analytics.sqle.DecisionTreePredict import DecisionTreePredict
- from teradataml.analytics.sqle.GLMPredict import GLMPredict
- from teradataml.analytics.sqle.MovingAverage import MovingAverage
- from teradataml.analytics.sqle.NGramSplitter import NGramSplitter
- from teradataml.analytics.sqle.NPath import NPath
 from teradataml.analytics.sqle.NaiveBayesPredict import NaiveBayesPredict
- from teradataml.analytics.sqle.NaiveBayesTextClassifierPredict import NaiveBayesTextClassifierPredict
- from teradataml.analytics.sqle.Pack import Pack
- from teradataml.analytics.sqle.Sessionize import Sessionize
- from teradataml.analytics.sqle.StringSimilarity import StringSimilarity
- from teradataml.analytics.sqle.SVMSparsePredict import SVMSparsePredict
- from teradataml.analytics.sqle.Unpack import Unpack
 
 from teradataml.analytics.meta_class import _AnalyticFunction
 from teradataml.analytics.meta_class import _common_init
teradataml/analytics/utils.py CHANGED
@@ -264,6 +264,7 @@ def _display_functions(func_type_category_name_dict, func_types=None, search_key
 
 # Check for type of 'type'. If str, convert it to list.
 func_types = UtilFuncs._as_list(func_types)
+ func_types = list(map(lambda x: x.upper(), func_types))
 
 # Map to store function types and corresponding type to be printed.
 func_type_display_type_map = {"SQLE": "Analytics Database",
teradataml/analytics/valib.py CHANGED
@@ -12,6 +12,8 @@ Library (VALIB) Function.
 import time
 import uuid
 from math import floor
+
+ from teradatasqlalchemy.telemetry.queryband import collect_queryband
 from teradataml.common import messages
 from teradataml.common.constants import TeradataConstants, ValibConstants as VC
 from teradataml.common.exceptions import TeradataMlException
@@ -230,6 +232,7 @@ class _VALIB():
 self.__dyn_cls_data_members[out_var]._index_query_required = False
 self.__dyn_cls_data_members[VC.OUTPUT_DATAFRAME_RESULTS.value].append(out_var)
 
+ @collect_queryband(attr="_VALIB__sql_func_name")
 def __generate_execute_sp_query(self):
 """
 DESCRIPTION:
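The `collect_queryband` decorator added here, together with the `session_queryband.configure_queryband_parameters(...)` call in `__init__.py`, tags generated requests with TDML telemetry. A rough way to look at the query band from a connected session is sketched below; whether the TDML entries appear in the `GetQueryBand()` output depends on how the telemetry band is scoped, so treat this as exploratory rather than documented behavior.

```
from teradataml import create_context, execute_sql

# Assumes valid credentials; per the release notes, the password no longer
# needs to be URL-encoded even if it contains special characters.
create_context(host="<host>", username="<user>", password="<password>")

# GetQueryBand() is a standard Teradata built-in; inspect what the session reports.
cursor = execute_sql("SELECT GetQueryBand();")
print(cursor.fetchall())
```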