PyPI - teradataml - Versions diffs - 17.20.0.6__py3-none-any.whl → 20.0.0.0__py3-none-any.whl - Mend

teradataml 17.20.0.6__py3-none-any.whl → 20.0.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of teradataml might be problematic. Click here for more details.

Files changed (432)

teradataml/LICENSE-3RD-PARTY.pdf +0 -0
teradataml/LICENSE.pdf +0 -0
teradataml/README.md +238 -1
teradataml/__init__.py +13 -3
teradataml/_version.py +1 -1
teradataml/analytics/Transformations.py +4 -4
teradataml/analytics/__init__.py +0 -2
teradataml/analytics/analytic_function_executor.py +3 -0
teradataml/analytics/json_parser/utils.py +13 -12
teradataml/analytics/sqle/DecisionTreePredict.py +15 -30
teradataml/analytics/sqle/NaiveBayesPredict.py +11 -20
teradataml/analytics/sqle/__init__.py +0 -13
teradataml/analytics/utils.py +1 -0
teradataml/analytics/valib.py +3 -0
teradataml/automl/__init__.py +1628 -0
teradataml/automl/custom_json_utils.py +1270 -0
teradataml/automl/data_preparation.py +993 -0
teradataml/automl/data_transformation.py +727 -0
teradataml/automl/feature_engineering.py +1648 -0
teradataml/automl/feature_exploration.py +547 -0
teradataml/automl/model_evaluation.py +163 -0
teradataml/automl/model_training.py +887 -0
teradataml/catalog/__init__.py +0 -2
teradataml/catalog/byom.py +49 -6
teradataml/catalog/function_argument_mapper.py +0 -2
teradataml/catalog/model_cataloging_utils.py +2 -1021
teradataml/common/aed_utils.py +6 -2
teradataml/common/constants.py +50 -58
teradataml/common/deprecations.py +160 -0
teradataml/common/garbagecollector.py +61 -104
teradataml/common/messagecodes.py +27 -36
teradataml/common/messages.py +11 -15
teradataml/common/utils.py +205 -287
teradataml/common/wrapper_utils.py +1 -110
teradataml/context/context.py +150 -78
teradataml/data/bank_churn.csv +10001 -0
teradataml/data/bmi.csv +501 -0
teradataml/data/docs/sqle/docs_17_10/BincodeFit.py +3 -3
teradataml/data/docs/sqle/docs_17_10/BincodeTransform.py +6 -5
teradataml/data/docs/sqle/docs_17_10/Fit.py +1 -1
teradataml/data/docs/sqle/docs_17_10/OneHotEncodingTransform.py +1 -1
teradataml/data/docs/sqle/docs_17_10/OutlierFilterTransform.py +1 -1
teradataml/data/docs/sqle/docs_17_10/PolynomialFeaturesTransform.py +2 -2
teradataml/data/docs/sqle/docs_17_10/RowNormalizeTransform.py +2 -1
teradataml/data/docs/sqle/docs_17_10/ScaleTransform.py +1 -0
teradataml/data/docs/sqle/docs_17_10/SimpleImputeTransform.py +1 -1
teradataml/data/docs/sqle/docs_17_10/Transform.py +2 -1
teradataml/data/docs/sqle/docs_17_20/BincodeFit.py +3 -3
teradataml/data/docs/sqle/docs_17_20/BincodeTransform.py +6 -5
teradataml/data/docs/sqle/docs_17_20/Fit.py +1 -1
teradataml/data/docs/sqle/docs_17_20/GLM.py +1 -1
teradataml/data/docs/sqle/docs_17_20/GLMPredictPerSegment.py +9 -10
teradataml/data/docs/sqle/docs_17_20/KMeansPredict.py +3 -2
teradataml/data/docs/sqle/docs_17_20/NaiveBayesTextClassifierPredict.py +16 -15
teradataml/data/docs/sqle/docs_17_20/NaiveBayesTextClassifierTrainer.py +2 -2
teradataml/data/docs/sqle/docs_17_20/NonLinearCombineFit.py +2 -2
teradataml/data/docs/sqle/docs_17_20/NonLinearCombineTransform.py +8 -8
teradataml/data/docs/sqle/docs_17_20/OneClassSVMPredict.py +21 -20
teradataml/data/docs/sqle/docs_17_20/OneHotEncodingTransform.py +1 -1
teradataml/data/docs/sqle/docs_17_20/OutlierFilterTransform.py +8 -3
teradataml/data/docs/sqle/docs_17_20/PolynomialFeaturesTransform.py +6 -5
teradataml/data/docs/sqle/docs_17_20/RandomProjectionTransform.py +6 -6
teradataml/data/docs/sqle/docs_17_20/RowNormalizeTransform.py +2 -1
teradataml/data/docs/sqle/docs_17_20/SVM.py +1 -1
teradataml/data/docs/sqle/docs_17_20/SVMPredict.py +16 -16
teradataml/data/docs/sqle/docs_17_20/ScaleTransform.py +1 -0
teradataml/data/docs/sqle/docs_17_20/SimpleImputeTransform.py +3 -2
teradataml/data/docs/sqle/docs_17_20/TDDecisionForestPredict.py +4 -4
teradataml/data/docs/sqle/docs_17_20/TDGLMPredict.py +19 -19
teradataml/data/docs/sqle/docs_17_20/TargetEncodingTransform.py +5 -4
teradataml/data/docs/sqle/docs_17_20/Transform.py +2 -2
teradataml/data/docs/sqle/docs_17_20/XGBoostPredict.py +9 -9
teradataml/data/fish.csv +160 -0
teradataml/data/glass_types.csv +215 -0
teradataml/data/insurance.csv +1 -1
teradataml/data/iris_data.csv +151 -0
teradataml/data/jsons/sqle/17.10/TD_FunctionTransform.json +1 -0
teradataml/data/jsons/sqle/17.10/TD_OneHotEncodingTransform.json +1 -0
teradataml/data/jsons/sqle/17.10/TD_OutlierFilterTransform.json +1 -0
teradataml/data/jsons/sqle/17.10/TD_PolynomialFeaturesTransform.json +1 -0
teradataml/data/jsons/sqle/17.10/TD_RowNormalizeTransform.json +1 -0
teradataml/data/jsons/sqle/17.10/TD_ScaleTransform.json +1 -0
teradataml/data/jsons/sqle/17.10/TD_SimpleImputeTransform.json +1 -0
teradataml/data/load_example_data.py +3 -0
teradataml/data/multi_model_classification.csv +401 -0
teradataml/data/multi_model_regression.csv +401 -0
teradataml/data/openml_example.json +63 -0
teradataml/data/scripts/deploy_script.py +65 -0
teradataml/data/scripts/mapper.R +20 -0
teradataml/data/scripts/sklearn/__init__.py +0 -0
teradataml/data/scripts/sklearn/sklearn_fit.py +175 -0
teradataml/data/scripts/sklearn/sklearn_fit_predict.py +135 -0
teradataml/data/scripts/sklearn/sklearn_function.template +113 -0
teradataml/data/scripts/sklearn/sklearn_model_selection_split.py +158 -0
teradataml/data/scripts/sklearn/sklearn_neighbors.py +152 -0
teradataml/data/scripts/sklearn/sklearn_score.py +128 -0
teradataml/data/scripts/sklearn/sklearn_transform.py +179 -0
teradataml/data/templates/open_source_ml.json +9 -0
teradataml/data/teradataml_example.json +73 -1
teradataml/data/test_classification.csv +101 -0
teradataml/data/test_prediction.csv +101 -0
teradataml/data/test_regression.csv +101 -0
teradataml/data/train_multiclass.csv +101 -0
teradataml/data/train_regression.csv +101 -0
teradataml/data/train_regression_multiple_labels.csv +101 -0
teradataml/data/wine_data.csv +1600 -0
teradataml/dataframe/copy_to.py +79 -13
teradataml/dataframe/data_transfer.py +8 -0
teradataml/dataframe/dataframe.py +910 -311
teradataml/dataframe/dataframe_utils.py +102 -5
teradataml/dataframe/fastload.py +11 -3
teradataml/dataframe/setop.py +15 -2
teradataml/dataframe/sql.py +3735 -77
teradataml/dataframe/sql_function_parameters.py +56 -5
teradataml/dataframe/vantage_function_types.py +45 -1
teradataml/dataframe/window.py +30 -29
teradataml/dbutils/dbutils.py +18 -1
teradataml/geospatial/geodataframe.py +18 -7
teradataml/geospatial/geodataframecolumn.py +5 -0
teradataml/hyperparameter_tuner/optimizer.py +910 -120
teradataml/hyperparameter_tuner/utils.py +131 -37
teradataml/lib/aed_0_1.dll +0 -0
teradataml/lib/libaed_0_1.dylib +0 -0
teradataml/lib/libaed_0_1.so +0 -0
teradataml/libaed_0_1.dylib +0 -0
teradataml/libaed_0_1.so +0 -0
teradataml/opensource/__init__.py +1 -0
teradataml/opensource/sklearn/__init__.py +1 -0
teradataml/opensource/sklearn/_class.py +255 -0
teradataml/opensource/sklearn/_sklearn_wrapper.py +1668 -0
teradataml/opensource/sklearn/_wrapper_utils.py +268 -0
teradataml/opensource/sklearn/constants.py +54 -0
teradataml/options/__init__.py +3 -6
teradataml/options/configure.py +21 -20
teradataml/scriptmgmt/UserEnv.py +61 -5
teradataml/scriptmgmt/lls_utils.py +135 -53
teradataml/table_operators/Apply.py +38 -6
teradataml/table_operators/Script.py +45 -308
teradataml/table_operators/TableOperator.py +182 -591
teradataml/table_operators/__init__.py +0 -1
teradataml/table_operators/table_operator_util.py +32 -40
teradataml/utils/validators.py +127 -3
{teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/METADATA +243 -3
{teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/RECORD +147 -391
teradataml/analytics/mle/AdaBoost.py +0 -651
teradataml/analytics/mle/AdaBoostPredict.py +0 -564
teradataml/analytics/mle/Antiselect.py +0 -342
teradataml/analytics/mle/Arima.py +0 -641
teradataml/analytics/mle/ArimaPredict.py +0 -477
teradataml/analytics/mle/Attribution.py +0 -1070
teradataml/analytics/mle/Betweenness.py +0 -658
teradataml/analytics/mle/Burst.py +0 -711
teradataml/analytics/mle/CCM.py +0 -600
teradataml/analytics/mle/CCMPrepare.py +0 -324
teradataml/analytics/mle/CFilter.py +0 -460
teradataml/analytics/mle/ChangePointDetection.py +0 -572
teradataml/analytics/mle/ChangePointDetectionRT.py +0 -477
teradataml/analytics/mle/Closeness.py +0 -737
teradataml/analytics/mle/ConfusionMatrix.py +0 -420
teradataml/analytics/mle/Correlation.py +0 -477
teradataml/analytics/mle/Correlation2.py +0 -573
teradataml/analytics/mle/CoxHazardRatio.py +0 -679
teradataml/analytics/mle/CoxPH.py +0 -556
teradataml/analytics/mle/CoxSurvival.py +0 -478
teradataml/analytics/mle/CumulativeMovAvg.py +0 -363
teradataml/analytics/mle/DTW.py +0 -623
teradataml/analytics/mle/DWT.py +0 -564
teradataml/analytics/mle/DWT2D.py +0 -599
teradataml/analytics/mle/DecisionForest.py +0 -716
teradataml/analytics/mle/DecisionForestEvaluator.py +0 -363
teradataml/analytics/mle/DecisionForestPredict.py +0 -561
teradataml/analytics/mle/DecisionTree.py +0 -830
teradataml/analytics/mle/DecisionTreePredict.py +0 -528
teradataml/analytics/mle/ExponentialMovAvg.py +0 -418
teradataml/analytics/mle/FMeasure.py +0 -402
teradataml/analytics/mle/FPGrowth.py +0 -734
teradataml/analytics/mle/FrequentPaths.py +0 -695
teradataml/analytics/mle/GLM.py +0 -558
teradataml/analytics/mle/GLML1L2.py +0 -547
teradataml/analytics/mle/GLML1L2Predict.py +0 -519
teradataml/analytics/mle/GLMPredict.py +0 -529
teradataml/analytics/mle/HMMDecoder.py +0 -945
teradataml/analytics/mle/HMMEvaluator.py +0 -901
teradataml/analytics/mle/HMMSupervised.py +0 -521
teradataml/analytics/mle/HMMUnsupervised.py +0 -572
teradataml/analytics/mle/Histogram.py +0 -561
teradataml/analytics/mle/IDWT.py +0 -476
teradataml/analytics/mle/IDWT2D.py +0 -493
teradataml/analytics/mle/IdentityMatch.py +0 -763
teradataml/analytics/mle/Interpolator.py +0 -918
teradataml/analytics/mle/KMeans.py +0 -485
teradataml/analytics/mle/KNN.py +0 -627
teradataml/analytics/mle/KNNRecommender.py +0 -488
teradataml/analytics/mle/KNNRecommenderPredict.py +0 -581
teradataml/analytics/mle/LAR.py +0 -439
teradataml/analytics/mle/LARPredict.py +0 -478
teradataml/analytics/mle/LDA.py +0 -548
teradataml/analytics/mle/LDAInference.py +0 -492
teradataml/analytics/mle/LDATopicSummary.py +0 -464
teradataml/analytics/mle/LevenshteinDistance.py +0 -450
teradataml/analytics/mle/LinReg.py +0 -433
teradataml/analytics/mle/LinRegPredict.py +0 -438
teradataml/analytics/mle/MinHash.py +0 -544
teradataml/analytics/mle/Modularity.py +0 -587
teradataml/analytics/mle/NEREvaluator.py +0 -410
teradataml/analytics/mle/NERExtractor.py +0 -595
teradataml/analytics/mle/NERTrainer.py +0 -458
teradataml/analytics/mle/NGrams.py +0 -570
teradataml/analytics/mle/NPath.py +0 -634
teradataml/analytics/mle/NTree.py +0 -549
teradataml/analytics/mle/NaiveBayes.py +0 -462
teradataml/analytics/mle/NaiveBayesPredict.py +0 -513
teradataml/analytics/mle/NaiveBayesTextClassifier.py +0 -607
teradataml/analytics/mle/NaiveBayesTextClassifier2.py +0 -531
teradataml/analytics/mle/NaiveBayesTextClassifierPredict.py +0 -799
teradataml/analytics/mle/NamedEntityFinder.py +0 -529
teradataml/analytics/mle/NamedEntityFinderEvaluator.py +0 -414
teradataml/analytics/mle/NamedEntityFinderTrainer.py +0 -396
teradataml/analytics/mle/POSTagger.py +0 -417
teradataml/analytics/mle/Pack.py +0 -411
teradataml/analytics/mle/PageRank.py +0 -535
teradataml/analytics/mle/PathAnalyzer.py +0 -426
teradataml/analytics/mle/PathGenerator.py +0 -367
teradataml/analytics/mle/PathStart.py +0 -464
teradataml/analytics/mle/PathSummarizer.py +0 -470
teradataml/analytics/mle/Pivot.py +0 -471
teradataml/analytics/mle/ROC.py +0 -425
teradataml/analytics/mle/RandomSample.py +0 -637
teradataml/analytics/mle/RandomWalkSample.py +0 -490
teradataml/analytics/mle/SAX.py +0 -779
teradataml/analytics/mle/SVMDense.py +0 -677
teradataml/analytics/mle/SVMDensePredict.py +0 -536
teradataml/analytics/mle/SVMDenseSummary.py +0 -437
teradataml/analytics/mle/SVMSparse.py +0 -557
teradataml/analytics/mle/SVMSparsePredict.py +0 -553
teradataml/analytics/mle/SVMSparseSummary.py +0 -435
teradataml/analytics/mle/Sampling.py +0 -549
teradataml/analytics/mle/Scale.py +0 -565
teradataml/analytics/mle/ScaleByPartition.py +0 -496
teradataml/analytics/mle/ScaleMap.py +0 -378
teradataml/analytics/mle/ScaleSummary.py +0 -320
teradataml/analytics/mle/SentenceExtractor.py +0 -363
teradataml/analytics/mle/SentimentEvaluator.py +0 -432
teradataml/analytics/mle/SentimentExtractor.py +0 -578
teradataml/analytics/mle/SentimentTrainer.py +0 -405
teradataml/analytics/mle/SeriesSplitter.py +0 -641
teradataml/analytics/mle/Sessionize.py +0 -475
teradataml/analytics/mle/SimpleMovAvg.py +0 -397
teradataml/analytics/mle/StringSimilarity.py +0 -425
teradataml/analytics/mle/TF.py +0 -389
teradataml/analytics/mle/TFIDF.py +0 -504
teradataml/analytics/mle/TextChunker.py +0 -414
teradataml/analytics/mle/TextClassifier.py +0 -399
teradataml/analytics/mle/TextClassifierEvaluator.py +0 -413
teradataml/analytics/mle/TextClassifierTrainer.py +0 -565
teradataml/analytics/mle/TextMorph.py +0 -494
teradataml/analytics/mle/TextParser.py +0 -623
teradataml/analytics/mle/TextTagger.py +0 -530
teradataml/analytics/mle/TextTokenizer.py +0 -502
teradataml/analytics/mle/UnivariateStatistics.py +0 -488
teradataml/analytics/mle/Unpack.py +0 -526
teradataml/analytics/mle/Unpivot.py +0 -438
teradataml/analytics/mle/VarMax.py +0 -776
teradataml/analytics/mle/VectorDistance.py +0 -762
teradataml/analytics/mle/WeightedMovAvg.py +0 -400
teradataml/analytics/mle/XGBoost.py +0 -842
teradataml/analytics/mle/XGBoostPredict.py +0 -627
teradataml/analytics/mle/__init__.py +0 -123
teradataml/analytics/mle/json/adaboost_mle.json +0 -135
teradataml/analytics/mle/json/adaboostpredict_mle.json +0 -85
teradataml/analytics/mle/json/antiselect_mle.json +0 -34
teradataml/analytics/mle/json/antiselect_mle_mle.json +0 -34
teradataml/analytics/mle/json/arima_mle.json +0 -172
teradataml/analytics/mle/json/arimapredict_mle.json +0 -52
teradataml/analytics/mle/json/attribution_mle_mle.json +0 -143
teradataml/analytics/mle/json/betweenness_mle.json +0 -97
teradataml/analytics/mle/json/burst_mle.json +0 -140
teradataml/analytics/mle/json/ccm_mle.json +0 -124
teradataml/analytics/mle/json/ccmprepare_mle.json +0 -14
teradataml/analytics/mle/json/cfilter_mle.json +0 -93
teradataml/analytics/mle/json/changepointdetection_mle.json +0 -92
teradataml/analytics/mle/json/changepointdetectionrt_mle.json +0 -78
teradataml/analytics/mle/json/closeness_mle.json +0 -104
teradataml/analytics/mle/json/confusionmatrix_mle.json +0 -79
teradataml/analytics/mle/json/correlation_mle.json +0 -86
teradataml/analytics/mle/json/correlationreduce_mle.json +0 -49
teradataml/analytics/mle/json/coxhazardratio_mle.json +0 -89
teradataml/analytics/mle/json/coxph_mle.json +0 -98
teradataml/analytics/mle/json/coxsurvival_mle.json +0 -79
teradataml/analytics/mle/json/cumulativemovavg_mle.json +0 -34
teradataml/analytics/mle/json/decisionforest_mle.json +0 -167
teradataml/analytics/mle/json/decisionforestevaluator_mle.json +0 -33
teradataml/analytics/mle/json/decisionforestpredict_mle_mle.json +0 -74
teradataml/analytics/mle/json/decisiontree_mle.json +0 -194
teradataml/analytics/mle/json/decisiontreepredict_mle_mle.json +0 -86
teradataml/analytics/mle/json/dtw_mle.json +0 -97
teradataml/analytics/mle/json/dwt2d_mle.json +0 -116
teradataml/analytics/mle/json/dwt_mle.json +0 -101
teradataml/analytics/mle/json/exponentialmovavg_mle.json +0 -55
teradataml/analytics/mle/json/fmeasure_mle.json +0 -58
teradataml/analytics/mle/json/fpgrowth_mle.json +0 -159
teradataml/analytics/mle/json/frequentpaths_mle.json +0 -129
teradataml/analytics/mle/json/glm_mle.json +0 -111
teradataml/analytics/mle/json/glml1l2_mle.json +0 -106
teradataml/analytics/mle/json/glml1l2predict_mle.json +0 -57
teradataml/analytics/mle/json/glmpredict_mle_mle.json +0 -74
teradataml/analytics/mle/json/histogram_mle.json +0 -100
teradataml/analytics/mle/json/hmmdecoder_mle.json +0 -192
teradataml/analytics/mle/json/hmmevaluator_mle.json +0 -206
teradataml/analytics/mle/json/hmmsupervised_mle.json +0 -91
teradataml/analytics/mle/json/hmmunsupervised_mle.json +0 -114
teradataml/analytics/mle/json/identitymatch_mle.json +0 -88
teradataml/analytics/mle/json/idwt2d_mle.json +0 -73
teradataml/analytics/mle/json/idwt_mle.json +0 -66
teradataml/analytics/mle/json/interpolator_mle.json +0 -151
teradataml/analytics/mle/json/kmeans_mle.json +0 -97
teradataml/analytics/mle/json/knn_mle.json +0 -141
teradataml/analytics/mle/json/knnrecommender_mle.json +0 -111
teradataml/analytics/mle/json/knnrecommenderpredict_mle.json +0 -75
teradataml/analytics/mle/json/lar_mle.json +0 -78
teradataml/analytics/mle/json/larpredict_mle.json +0 -69
teradataml/analytics/mle/json/lda_mle.json +0 -130
teradataml/analytics/mle/json/ldainference_mle.json +0 -78
teradataml/analytics/mle/json/ldatopicsummary_mle.json +0 -64
teradataml/analytics/mle/json/levenshteindistance_mle.json +0 -92
teradataml/analytics/mle/json/linreg_mle.json +0 -42
teradataml/analytics/mle/json/linregpredict_mle.json +0 -56
teradataml/analytics/mle/json/minhash_mle.json +0 -113
teradataml/analytics/mle/json/modularity_mle.json +0 -91
teradataml/analytics/mle/json/naivebayespredict_mle_mle.json +0 -85
teradataml/analytics/mle/json/naivebayesreduce_mle.json +0 -52
teradataml/analytics/mle/json/naivebayestextclassifierpredict_mle_mle.json +0 -147
teradataml/analytics/mle/json/naivebayestextclassifiertrainer2_mle.json +0 -108
teradataml/analytics/mle/json/naivebayestextclassifiertrainer_mle.json +0 -102
teradataml/analytics/mle/json/namedentityfinder_mle.json +0 -84
teradataml/analytics/mle/json/namedentityfinderevaluatorreduce_mle.json +0 -43
teradataml/analytics/mle/json/namedentityfindertrainer_mle.json +0 -64
teradataml/analytics/mle/json/nerevaluator_mle.json +0 -54
teradataml/analytics/mle/json/nerextractor_mle.json +0 -87
teradataml/analytics/mle/json/nertrainer_mle.json +0 -89
teradataml/analytics/mle/json/ngrams_mle.json +0 -137
teradataml/analytics/mle/json/ngramsplitter_mle_mle.json +0 -137
teradataml/analytics/mle/json/npath@coprocessor_mle.json +0 -73
teradataml/analytics/mle/json/ntree@coprocessor_mle.json +0 -123
teradataml/analytics/mle/json/pack_mle.json +0 -58
teradataml/analytics/mle/json/pack_mle_mle.json +0 -58
teradataml/analytics/mle/json/pagerank_mle.json +0 -81
teradataml/analytics/mle/json/pathanalyzer_mle.json +0 -63
teradataml/analytics/mle/json/pathgenerator_mle.json +0 -40
teradataml/analytics/mle/json/pathstart_mle.json +0 -62
teradataml/analytics/mle/json/pathsummarizer_mle.json +0 -72
teradataml/analytics/mle/json/pivoting_mle.json +0 -71
teradataml/analytics/mle/json/postagger_mle.json +0 -51
teradataml/analytics/mle/json/randomsample_mle.json +0 -131
teradataml/analytics/mle/json/randomwalksample_mle.json +0 -85
teradataml/analytics/mle/json/roc_mle.json +0 -73
teradataml/analytics/mle/json/sampling_mle.json +0 -75
teradataml/analytics/mle/json/sax_mle.json +0 -154
teradataml/analytics/mle/json/scale_mle.json +0 -93
teradataml/analytics/mle/json/scalebypartition_mle.json +0 -89
teradataml/analytics/mle/json/scalemap_mle.json +0 -44
teradataml/analytics/mle/json/scalesummary_mle.json +0 -14
teradataml/analytics/mle/json/sentenceextractor_mle.json +0 -41
teradataml/analytics/mle/json/sentimentevaluator_mle.json +0 -43
teradataml/analytics/mle/json/sentimentextractor_mle.json +0 -100
teradataml/analytics/mle/json/sentimenttrainer_mle.json +0 -68
teradataml/analytics/mle/json/seriessplitter_mle.json +0 -133
teradataml/analytics/mle/json/sessionize_mle_mle.json +0 -62
teradataml/analytics/mle/json/simplemovavg_mle.json +0 -48
teradataml/analytics/mle/json/stringsimilarity_mle.json +0 -50
teradataml/analytics/mle/json/stringsimilarity_mle_mle.json +0 -50
teradataml/analytics/mle/json/svmdense_mle.json +0 -165
teradataml/analytics/mle/json/svmdensepredict_mle.json +0 -95
teradataml/analytics/mle/json/svmdensesummary_mle.json +0 -58
teradataml/analytics/mle/json/svmsparse_mle.json +0 -148
teradataml/analytics/mle/json/svmsparsepredict_mle_mle.json +0 -103
teradataml/analytics/mle/json/svmsparsesummary_mle.json +0 -57
teradataml/analytics/mle/json/textchunker_mle.json +0 -40
teradataml/analytics/mle/json/textclassifier_mle.json +0 -51
teradataml/analytics/mle/json/textclassifierevaluator_mle.json +0 -43
teradataml/analytics/mle/json/textclassifiertrainer_mle.json +0 -103
teradataml/analytics/mle/json/textmorph_mle.json +0 -63
teradataml/analytics/mle/json/textparser_mle.json +0 -166
teradataml/analytics/mle/json/texttagger_mle.json +0 -81
teradataml/analytics/mle/json/texttokenizer_mle.json +0 -91
teradataml/analytics/mle/json/tf_mle.json +0 -33
teradataml/analytics/mle/json/tfidf_mle.json +0 -34
teradataml/analytics/mle/json/univariatestatistics_mle.json +0 -81
teradataml/analytics/mle/json/unpack_mle.json +0 -91
teradataml/analytics/mle/json/unpack_mle_mle.json +0 -91
teradataml/analytics/mle/json/unpivoting_mle.json +0 -63
teradataml/analytics/mle/json/varmax_mle.json +0 -176
teradataml/analytics/mle/json/vectordistance_mle.json +0 -179
teradataml/analytics/mle/json/weightedmovavg_mle.json +0 -48
teradataml/analytics/mle/json/xgboost_mle.json +0 -178
teradataml/analytics/mle/json/xgboostpredict_mle.json +0 -104
teradataml/analytics/sqle/Antiselect.py +0 -321
teradataml/analytics/sqle/Attribution.py +0 -603
teradataml/analytics/sqle/DecisionForestPredict.py +0 -408
teradataml/analytics/sqle/GLMPredict.py +0 -430
teradataml/analytics/sqle/MovingAverage.py +0 -543
teradataml/analytics/sqle/NGramSplitter.py +0 -548
teradataml/analytics/sqle/NPath.py +0 -632
teradataml/analytics/sqle/NaiveBayesTextClassifierPredict.py +0 -515
teradataml/analytics/sqle/Pack.py +0 -388
teradataml/analytics/sqle/SVMSparsePredict.py +0 -464
teradataml/analytics/sqle/Sessionize.py +0 -390
teradataml/analytics/sqle/StringSimilarity.py +0 -400
teradataml/analytics/sqle/Unpack.py +0 -503
teradataml/analytics/sqle/json/antiselect_sqle.json +0 -21
teradataml/analytics/sqle/json/attribution_sqle.json +0 -92
teradataml/analytics/sqle/json/decisionforestpredict_sqle.json +0 -48
teradataml/analytics/sqle/json/glmpredict_sqle.json +0 -48
teradataml/analytics/sqle/json/h2opredict_sqle.json +0 -63
teradataml/analytics/sqle/json/movingaverage_sqle.json +0 -58
teradataml/analytics/sqle/json/naivebayestextclassifierpredict_sqle.json +0 -76
teradataml/analytics/sqle/json/ngramsplitter_sqle.json +0 -126
teradataml/analytics/sqle/json/npath_sqle.json +0 -67
teradataml/analytics/sqle/json/pack_sqle.json +0 -47
teradataml/analytics/sqle/json/pmmlpredict_sqle.json +0 -55
teradataml/analytics/sqle/json/sessionize_sqle.json +0 -43
teradataml/analytics/sqle/json/stringsimilarity_sqle.json +0 -39
teradataml/analytics/sqle/json/svmsparsepredict_sqle.json +0 -74
teradataml/analytics/sqle/json/unpack_sqle.json +0 -80
teradataml/catalog/model_cataloging.py +0 -980
teradataml/config/mlengine_alias_definitions_v1.0 +0 -118
teradataml/config/mlengine_alias_definitions_v1.1 +0 -127
teradataml/config/mlengine_alias_definitions_v1.3 +0 -129
teradataml/table_operators/sandbox_container_util.py +0 -643
{teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/WHEEL +0 -0
{teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/top_level.txt +0 -0
{teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/zip-safe +0 -0

teradataml/catalog/model_cataloging_utils.py CHANGED Viewed

@@ -308,91 +308,6 @@ def __check_if_client_specific_use(key, function_arg_map, is_sql_name=False):
     else:
         return False, None
-def __get_model_parameters(model, function_arg_map):
-    """
-    DESCRIPTION:
-        Internal function to get parameter information of the model to be saved.
-    PARAMETERS:
-        model:
-            Required argument.
-            The model (analytic function object instance) to be saved.
-            Types: teradataml Analytic Function object.
-        function_arg_map:
-            Required argument.
-            The teradataml-sql map for the function obtained using function_argument_mapper.
-            Types: dict
-    RETURNS:
-        A dict containing the information about parameters passed to model.
-    EXAMPLES:
-        >>> model_parameters = __get_model_parameters(model, function_arg_map)
-    """
-    parameter_json = {}
-    # Get the attributes that are specific to the SQL syntax of the model algorithm
-    sql_specific_attributes = model._get_sql_specific_attributes()
-    # First, let's identify the parameters
-    nonsql_argument_counter = 1
-    for key in model.__dict__:
-        if not key.startswith('_'):
-            member = getattr(model, key)
-            # Check if this is an attribute, not a DataFrame
-            if not isinstance(member, DataFrame) and key != "sqlmr_query":
-                # Check if it is a special or client specific argument
-                special_use, used_in = __check_if_client_specific_use(key, function_arg_map)
-                value = member
-                # Add quotes to Boolean values as they tend to be handled in unintended way with JSON.
-                if type(member) == bool or key == famc.TDML_FORMULA_NAME.value:
-                    value = str(member)
-                else:
-                    if isinstance(member, list):
-                        # We try to save the list as a string representation that could readily be used,
-                        # in SQL, and has no language specific representation.
-                        # Here, we remove the '[' and ']' from the string representation.
-                        # We also avoid adding quotes around single-item list.
-                        if len(member) == 1:
-                            value = str(member[0]) if type(member[0]) == bool else member[0]
-                        elif len(member) > 1:
-                            if type(member[0]) == bool:
-                                member = ['{}'.format(val) for val in member]
-                            value = str(member).lstrip('[').rstrip(']')
-                        else:
-                            # Empty list has no meaning, but no chance of running into this with the validation
-                            # in the function wrappers.
-                            value = None
-                if value is not None:
-                    if special_use:
-                        sql_name = '__nonsql_argument_{}__'.format(nonsql_argument_counter)
-                        nonsql_argument_counter = nonsql_argument_counter + 1
-                    else:
-                        sql_name = __get_arg_sql_name_from_tdml(function_arg_map,arg_type=famc.ARGUMENTS.value,name=key)
-                    parameter_json[sql_name] = {}
-                    parameter_json[sql_name]["value"] = value
-                    parameter_json[sql_name]["client_specific_name"] = key
-    sql_name = '__nonsql_argument_{}__'.format(nonsql_argument_counter)
-    parameter_json[sql_name] = {}
-    parameter_json[sql_name]["value"] = model.__class__.__name__
-    parameter_json[sql_name]["client_specific_name"] = "__class_name__"
-    # Add the SQL specific arguments
-    for sql_name in sql_specific_attributes:
-        parameter_json[sql_name] = {}
-        parameter_json[sql_name]["value"] = sql_specific_attributes[sql_name]
-        # Also save the formula related property names for corresponding SQL arguments
-        if hasattr(model, '_sql_formula_attribute_mapper'):
-            if sql_name in model._sql_formula_attribute_mapper:
-                parameter_json[sql_name]["client_specific_name"] = model._sql_formula_attribute_mapper[sql_name]
-    return parameter_json
 def __check_if_model_exists(name, created=False, accessible=False,
                             raise_error_if_exists=False, raise_error_if_model_not_found=False):
     """
@@ -477,89 +392,6 @@ def __check_if_model_exists(name, created=False, accessible=False,
                                                                name, ' or not created by user'),
                                           MessageCodes.MODEL_NOT_FOUND)
-def __check_if_model_cataloging_tables_exists(raise_error_if_does_not_exists=True):
-    """
-    DESCRIPTION:
-        Check whether Model Cataloging tables (one of the views - ModelCataloging.ModelsV) exists or not.
-    PARAMETERS:
-        raise_error_if_does_not_exists:
-            Optional Argument.
-            Specifies the flag to decide whether to raise error when Model Cataloging tables does not exist.
-            Default Value: True (Raise exception)
-            Types: bool
-    RAISES:
-        None.
-    RETURNS:
-        True, if the view exists, else False.
-    EXAMPLES:
-        >>>  __check_if_model_cataloging_tables_exists()
-    """
-    # Get current connection().
-    conn = get_connection()
-    # Check whether tables exists on the system or not.
-    model_table_exists = conn.dialect.has_view(conn, view_name=mac.MODELS.value,
-                                                schema=mac.MODEL_CATALOG_DB.value)
-    # If both tables exist, return True.
-    if model_table_exists:
-        return True
-    # We are here means the Model Cataloging view does not exist.
-    # Let's raise error if 'raise_error_if_does_not_exists' set to True.
-    if raise_error_if_does_not_exists:
-        # Raise error, as one or both Model Cataloging tables does not exist.
-        # MODEL_CATALOGING_TABLE_DOES_EXIST
-        raise TeradataMlException(
-            Messages.get_message(MessageCodes.MODEL_CATALOGING_TABLE_DOES_EXIST),
-            MessageCodes.MODEL_CATALOGING_TABLE_DOES_EXIST)
-def __get_tables_for_model(name, current_user):
-    """
-    DESCRIPTION:
-        Function to get model tables for a given model name.
-    PARAMETERS:
-        name:
-            Required Argument.
-            Specifies the name of the model to get the model tables for.
-            Types: str
-        current_user:
-            Required Argument.
-            Specifies the name of the current Vantage user.
-            Types: str
-    RETURNS:
-        A list of model tables associated with the model.
-    EXAMPLES:
-        >>> table_list = __get_tables_for_model(name, current_user)
-    """
-    # Get list of tables
-    model_object_info = DataFrame(in_schema(mac.MODEL_CATALOG_DB.value, mac.MODELS_OBJECTS.value))
-    model_info = DataFrame(in_schema(mac.MODEL_CATALOG_DB.value, mac.MODELSX.value))
-    model_info = model_info[model_info[mac.CREATED_BY.value].str.lower() == current_user.lower()]
-    model_info = model_info[model_info[mac.MODEL_NAME.value] == name]
-    model_objects_to_publish = model_info.join(model_object_info,
-                                               on=[model_info.Name == model_object_info.ModelName],
-                                               how='inner').select([mac.MODEL_OBJ_TABLE_NAME.value])
-    model_objects_to_publish = model_objects_to_publish.to_pandas().squeeze()
-    if isinstance(model_objects_to_publish, str):
-        # If there is only one output table
-        return [model_objects_to_publish]
-    else:
-        # For multiple or no output tables
-        return model_objects_to_publish.tolist()
 def __get_current_user(conn=None):
     """
     DESCRIPTION:
@@ -619,36 +451,6 @@ def __get_like_filter_expression_on_col(metaexpr, column_name, like):
     return metaexpr._filter(0, 'like', [column_name], like = like, match_arg='i')
-def __get_model_engine(model):
-    """
-    DESCRIPTION:
-        Internal function to return the engine name on which the model was generated.
-    PARAMETERS:
-        model:
-            Required Argument.
-            Model object, for which engine is to be found.
-            Types: str
-    RETURNS:
-        Engine name ('ML Engine' or 'Advanced SQL Engine')
-    RAISES:
-        TeradataMlException
-    EXAMPLES:
-        >>> __get_model_engine(model)
-    """
-    if ".mle." in str(type(model)):
-        return mac.MODEL_ENGINE_ML.value
-    elif ".sqle." in str(type(model)):
-        return mac.MODEL_ENGINE_ADVSQL.value
-    else:
-        raise TeradataMlException(Messages.get_message(MessageCodes.UNKNOWN_MODEL_ENGINE,
-                                                       str(type(model))),
-                                  MessageCodes.UNKNOWN_MODEL_ENGINE)
 def __get_wrapper_class(model_engine, model_class):
     """
     DESCRIPTION:
@@ -674,11 +476,9 @@ def __get_wrapper_class(model_engine, model_class):
         AttributeError - When model_class wrapper function, does is not from model_engine.
     EXAMPLES:
-        >>> __get_wrapper_class("ML Engine", "GLM")
+        >>> __get_wrapper_class("SQL Engine", "GLM")
     """
-    if model_engine == mac.MODEL_ENGINE_ML.value:
-        module_name = "teradataml.analytics.mle"
-    elif model_engine == mac.MODEL_ENGINE_ADVSQL.value:
+    if model_engine == mac.MODEL_ENGINE_ADVSQL.value:
         module_name = "teradataml.analytics.sqle"
     else:
         raise ValueError("Invalid Engine found in Model Cataloging table.")
@@ -688,823 +488,4 @@ def __get_wrapper_class(model_engine, model_class):
     return getattr(wrapper_module, model_class)
-def __is_view(tablename):
-    """
-    DESCRIPTION:
-        Internal function to check whether the object is view or not.
-    PARAMETERS:
-        tablename:
-            Required Argument.
-            Table name or view name to be checked.
-            Types: str
-    RAISES:
-        None.
-    RETURNS:
-        True when the tablename is view, else false.
-    EXAMPLES:
-        >>> __is_view('"dbaname"."tablename"')
-    """
-    db_name = UtilFuncs._teradata_unquote_arg(UtilFuncs._extract_db_name(tablename), "\"")
-    table_view_name = UtilFuncs._teradata_unquote_arg(UtilFuncs._extract_table_name(tablename), "\"")
-    query = SQLBundle._build_select_table_kind(db_name, "{0}".format(table_view_name), "'V'")
-    pdf = pd.read_sql(query, get_context())
-    if pdf.shape[0] > 0:
-        return True
-    else:
-        return False
-def __delete_model_tableview(tableviewname):
-    """
-    DESCRIPTION:
-        Internal function to remove table name or view.
-    PARAMETERS:
-        tableviewname:
-            Required Argument.
-            Table name or view name to be deleted.
-            Types: str
-    RAISES:
-        None.
-    RETURNS:
-        bool
-    EXAMPLES:
-        >>> __delete_model_tableview('"dbname"."tableviewname"')
-    """
-    if not __is_view(tableviewname):
-        try:
-            UtilFuncs._drop_table(tableviewname)
-        except:
-            return False
-    else:
-        try:
-            UtilFuncs._drop_view(tableviewname)
-        except:
-            return False
-    return True
-def __get_all_formula_related_args(function_arg_map):
-    """
-    DESCRIPTION:
-        Internal function to find a list of all formula related arguments for a function.
-    PARAMETERS:
-        function_arg_map:
-            Required Argument.
-            The teradataml-sql map for the function obtained using function_argument_mapper.
-            Types: dict
-    RETURNS:
-         A dictionary mapping all SQL Arguments for the function related to formula to its role in formula.
-    EXAMPLE:
-        >>> __get_all_formula_related_args(function_arg_map)
-    """
-    formula_args = {}
-    for arg_name in function_arg_map[famc.ARGUMENTS.value][famc.SQL_TO_TDML.value]:
-        arg = function_arg_map[famc.ARGUMENTS.value][famc.SQL_TO_TDML.value][arg_name]
-        # Ignore alternate names
-        if famc.ALTERNATE_TO.value in arg:
-            alternate_name = arg[famc.ALTERNATE_TO.value]
-            arg = function_arg_map[famc.ARGUMENTS.value][famc.SQL_TO_TDML.value][alternate_name]
-        if famc.USED_IN_FORMULA.value in arg:
-            formula_args[arg_name] = {}
-            formula_args[arg_name][famc.USED_IN_FORMULA.value] = arg[famc.USED_IN_FORMULA.value]
-            formula_args[arg_name]['arg_value'] = None
-    return formula_args
-def __fix_imbalanced_quotes(arg):
-    """
-    DESCRIPTION:
-        Internal function to fix imbalanced quotes around a string.
-    PARAMETERS:
-        arg:
-            Required Argument.
-            The string to fix the imbalanced quotes for, if any.
-            Types: str
-    RETURNS:
-         The input string with any imbalanced quotes stripped.
-    EXAMPLE:
-        >>> __fix_imbalanced_quotes('hello"')
-        hello
-    """
-    for quote in ["'", '"']:
-        if (arg.startswith(quote) and not arg.endswith(quote)) or (not arg.startswith(quote) and arg.endswith(quote)):
-            return arg.strip(quote)
-    return arg
-def __get_tdml_parameter_value_for_sequence(function_arg_map, attr_value):
-    """
-    DESCRIPTION:
-        Internal function to form sequence_column teradataml argument from SQL arguments.
-    PARAMETERS:
-        function_arg_map:
-            Required Argument.
-            The teradataml-sql map for the function obtained using function_argument_mapper.
-            Types: dict
-        attr_value:
-            Required Argument.
-            The value of the SQL sequence argument.
-    RETURNS:
-         A dictionary mapping the teradataml sequence argument to its values.
-    EXAMPLES:
-        >>> tdml_sequence_args = __get_tdml_parameter_value_for_sequence(function_arg_map, sql_sequence_arg)
-    """
-    sequence_dict = {}
-    tdml_name = None
-    for column in attr_value.split(','):
-        if len(column) == 0:
-            continue
-        if ':' in column:
-            input_name, col_val = column.split(':')
-            input_name = __fix_imbalanced_quotes(input_name)
-            col_val = __fix_imbalanced_quotes(col_val)
-            tdml_name = '{}_{}'.format(__get_arg_tdml_name_from_sql(function_arg_map, famc.INPUTS.value,
-                                                                    input_name.lower()),
-                                       'sequence_column')
-            tdml_name = __fix_imbalanced_quotes(tdml_name)
-            sequence_dict[tdml_name] = [col_val]
-        else:
-            if tdml_name not in sequence_dict:
-                # This means there is only one input and the input name was not specified in the
-                # SequenceInputBy clause. So we get the only input name.
-                tdml_name = list(function_arg_map[famc.INPUTS.value][famc.TDML_TO_SQL.value].keys())[0]
-                tdml_name = '{}_{}'.format(tdml_name, 'sequence_column')
-                sequence_dict[tdml_name] = []
-            column = __fix_imbalanced_quotes(column)
-            sequence_dict[tdml_name].append(column)
-    return sequence_dict
-def __get_target_column(name):
-    """
-    DESCRIPTION:
-        Internal function to get the target column of a saved model.
-    PARAMETERS:
-        name:
-            Required Argument.
-            Specifies the name used to save the model.
-            Types: str
-    RETURNS:
-         A String representing the name of the target column.
-    EXAMPLES:
-        >>> target_column = __get_target_column('GLMModel')
-    """
-    model_details = DataFrame(in_schema(mac.MODEL_CATALOG_DB.value, mac.MODELS_DETAILSX.value))
-    model_details = model_details[model_details[mac.MODEL_DERIVED_NAME.value] == name]
-    target_column = model_details.select([mac.MODEL_DERIVED_TARGET_COLUMN.value]).squeeze()
-    return target_column
-def __get_tdml_parameter_value_for_formula(formula_args, target_column):
-    """
-    DESCRIPTION:
-        Internal function to build the formula argument based on the SQL equivalent inputs.
-    PARAMETERS:
-        formula_args:
-            Required Argument.
-            A dictionary mapping all SQL Arguments for the function related to formula to its role in formula.
-            Types: dict
-        target_column:
-            Required Argument.
-            The target column for the model, if any.
-            Types: str
-    RETURNS:
-         A String representing the formula argument to be used with teradataml.
-    EXAMPLES:
-        >>> formula = __get_tdml_parameter_value_for_formula(formula_args, target_column)
-    """
-    dependent_var = target_column
-    all_vars = []
-    for arg in formula_args:
-        if formula_args[arg]['arg_value'] is not None:
-            if formula_args[arg][famc.USED_IN_FORMULA.value] == famc.DEPENDENT_ATTR.value:
-                dependent_var = formula_args[arg]['arg_value'].strip("'")
-            else:
-                all_vars.extend(formula_args[arg]['arg_value'].split(','))
-    # Remove duplicates
-    all_vars = list(set(all_vars))
-    all_vars = [var.strip("'") for var in all_vars]
-    # Remove dependent variable if it occurs in all_vars
-    if dependent_var in all_vars:
-        all_vars.pop(all_vars.index(dependent_var))
-    formula = '{} ~ {}'.format(dependent_var, ' + '. join(all_vars))
-    return formula
-def __cast_arg_values_to_tdml_types(value, type_):
-    """
-    DESCRIPTION:
-        Internal function used by retrieve_model() to cast the retrieved model parameters to the expected python types.
-    PARAMETERS:
-        value:
-            Required Argument.
-            Specifies the value retrieved that needs a type cast.
-            Types: str
-        type_:
-            Required Argument.
-            Specifies the Python type the value needs to be cast to.
-            Type: Python type or tuple of Python types
-    RETURNS:
-        The value cast to the required Python type.
-    RAISES:
-        None
-    EXAMPLE:
-        >>> cast_value = __cast_arg_values_to_tdml_types('0.1', float)
-    """
-    return_value = None
-    required_type = type_
-    accepted_bool_values = ['1', 't', 'true', 'y', 'yes']
-    # If the required_type is a tuple, we need to consider the possibility of the value being a list
-    if isinstance(required_type, tuple):
-        # The function_argument_mapper adds the type of the object in the list as the first value in the tuple
-        required_type = required_type[0]
-        # Use regex to split the string value into a list.
-        # This is required only when we expect the values to be a list as well, in which case,
-        # the 'value' will be a comma-separated list of strings.
-        # The pattern matches anything but whitespace and comma and not in quotes, or anything in quotes,
-        # basically avoiding splitting on a comma when surrounded by quotes.
-        pattern = r"[^',\s]+|'[^']*'"
-        values = re.findall(pattern, value)
-        if len(values) > 1:
-            if required_type == bool:
-                # Remove the quotes surrounding items in a list,
-                # and check for their presence in the acceptable TRUE values.
-                return_value = [val.strip().strip("'").lower() in accepted_bool_values for val in values]
-            else:
-                # Remove the quotes surrounding items in a list cast them to the required type.
-                return_value = [required_type(val.strip().strip("'")) for val in values]
-        else:
-            value = values[0]
-    if return_value is None:
-        if required_type == bool:
-            # Remove the quotes surrounding the value,
-            # and check for their presence in the acceptable TRUE values.
-            return_value = value.strip().strip("'").lower() in accepted_bool_values
-        else:
-            # Remove the quotes surrounding the value and cast it to the required type.
-            return_value = required_type(value.strip().strip("'"))
-    return return_value
-def __get_model_access(name):
-    """
-    DESCRIPTION:
-        Internal function to get the current access level of a saved model.
-    PARAMETERS:
-        name:
-            Required Argument.
-            Specifies the name of the saved model to get the access level for.
-            Types: str
-    RAISES:
-        None.
-    RETURNS:
-        A String representing the access level of the saved model.
-    EXAMPLES:
-        >>> __get_model_access('saved_glm_model')
-    """
-    df = DataFrame(in_schema(mac.MODEL_CATALOG_DB.value, mac.MODELS_DETAILS.value))
-    return df[df[mac.MODEL_DERIVED_NAME.value] == name].select([mac.MODEL_ACCESS.value]).squeeze()
-def __get_tdml_type_for_tdml_arg(name, function_arg_map):
-    """
-    DESCRIPTION:
-        Internal function to get the Python type for the given teradataml model class attribute.
-    PARAMETERS:
-        name:
-            Required Argument.
-            Specifies the teradataml name for the attribute to get the expected python type for.
-            Types: str
-        function_arg_map:
-            Required Argument.
-            Specifies the teradataml-sql map for the function obtained using function_argument_mapper.
-            Types: dict
-    RETURNS:
-        Python type for the given teradataml model class attribute name.
-        None when argument name not found.
-    RAISES:
-        None
-    EXAMPLES:
-        >>> from teradataml.catalog.function_argument_mapper import _argument_mapper
-        >>> function_arg_map = _argument_mapper._get_function_map('ML Engine', 'glm')
-        >>> tdml_type = __get_tdml_type_for_tdml_arg('linkfunction', function_arg_map)
-    """
-    # Let's check if the function argument mapper has the information about the argument we are looking for.
-    # If not, let's return None.
-    if name not in function_arg_map[famc.ARGUMENTS.value][famc.TDML_TO_SQL.value]:
-        return None
-    tdml_type = str
-    sql_name = function_arg_map[famc.ARGUMENTS.value][famc.TDML_TO_SQL.value][name]
-    # We can ignore formula letting it default to str
-    special_use, used_in = __check_if_client_specific_use(name, function_arg_map)
-    if not special_use or used_in == famc.USED_IN_SEQUENCE_INPUT_BY.value:
-        tdml_type = function_arg_map[famc.ARGUMENTS.value][famc.SQL_TO_TDML.value][sql_name][famc.TDML_TYPE.value]
-    return tdml_type
-def __retrieve_model_class(name, model_client, function_arg_map):
-    """
-    DESCRIPTION:
-        Internal function to get the teradataml class used for generating model given it's name.
-    PARAMETERS:
-        name:
-            Optional Argument. Required when model was saved by teradataml.
-            Specifies the name of the model to retrieve the model attributes and output information for.
-            Types: str
-        model_client:
-            Required Argument.
-            Specified the name of the client used to generate the model.
-            Types: str
-        function_arg_map:
-            Optional Argument. Required when model was not saved by teradataml.
-            Specifies the teradataml-sql map for the function obtained using function_argument_mapper.
-            Types: dict
-    RETURNS:
-        A String representing the teradataml class name corresponding to the model.
-    EXAMPLES:
-        >>> model_class = __retrieve_model_class(name, model_client, function_arg_map)
-    """
-    if model_client == mac.MODEL_TDML.value:
-        # Create DF on top of ModelAttributesV view
-        model_arguments = DataFrame(in_schema(mac.MODEL_CATALOG_DB.value, mac.MODELS_ATTRS.value))
-        model_arguments = model_arguments[model_arguments[mac.MODEL_DERIVED_NAME.value] == name]
-        model_class = model_arguments[model_arguments.ClientSpecificAttributeName.str.
-                                          contains(mac.MODEL_CLIENT_CLASS_KEY.value) == 1].\
-            select([mac.MODEL_ATTR_VALUE.value]).squeeze()
-    else:
-        model_class = function_arg_map[famc.FUNCTION_TDML_NAME.value]
-    return model_class
-def __retrieve_model_client_engine_algorithm(name, return_details=False):
-    """
-    DESCRIPTION:
-        Internal function to get the the model generating engine, client, algorithm, and optionally the model details
-        given the model name.
-    PARAMETERS:
-        name:
-            Required Argument.
-            Specifies the name of the model to retrieve the model attributes and output information for.
-            Types: str
-        return_details:
-            Optional Argument.
-            Specifies whether to also return the row from the ModelDetailsV corresponding to the model.
-            Types: bool
-            Default Value: False
-    RETURNS:
-        A tuple containing:
-        * the name of the client that was used to generate the model,
-        * the name of the engine that generated the model, and
-        * the name of the algorithm used to generate the model.
-        * If return_details=True, then additionally, the ModelDetailsV row related to the model.
-    EXAMPLES:
-        >>> model_client, model_engine, algorithm = __retrieve_model_client_engine_algorithm(name)
-    """
-    model_details = DataFrame(in_schema(mac.MODEL_CATALOG_DB.value, mac.MODELS_DETAILS.value))
-    model_details = model_details[model_details[mac.MODEL_DERIVED_NAME.value] == name]
-    model_algorithm = model_details.select([mac.MODEL_DERIVED_ALGORITHM.value]).squeeze().lower()
-    model_client_and_eng = model_details.select([mac.MODEL_DERIVED_GENCLIENT.value,
-                                                 mac.MODEL_DERIVED_GENENG.value]).squeeze()
-    model_client = model_client_and_eng.select([mac.MODEL_DERIVED_GENCLIENT.value]).squeeze()
-    model_engine = model_client_and_eng.select([mac.MODEL_DERIVED_GENENG.value]).squeeze()
-    if return_details:
-        return model_client, model_engine, model_algorithm, model_details
-    else:
-        return model_client, model_engine, model_algorithm
-def __retrieve_model_attributes(name, model_client, function_arg_map):
-    """
-    DESCRIPTION:
-        Internal function to get the the attributes used for generating model given it's name.
-    PARAMETERS:
-        name:
-            Required Argument.
-            Specifies the name of the model to retrieve the model attributes and output information for.
-            Types: str
-        model_client:
-            Required Argument.
-            Specified the name of the engine that generated the model.
-            Types: str
-        function_arg_map:
-            Required Argument.
-            Specifies the teradataml-sql map for the function obtained using function_argument_mapper.
-            Types: dict
-    RETURNS:
-        A tuple of dictionaries:
-        * the first one containing the attribute names and their values, and
-        * the second one containing the formula related properties and their values, if the model saving client was
-          teradataml.
-    EXAMPLES:
-        >>> model_parameters, formula_related_params = __retrieve_model_attributes(name, model_client, function_arg_map)
-    """
-    # Create DF on top of ModelAttributesV view and
-    # 1. get only rows related to the model named 'name'.
-    model_arguments = DataFrame(in_schema(mac.MODEL_CATALOG_DB.value, mac.MODELS_ATTRS.value))
-    model_arguments = model_arguments[model_arguments[mac.MODEL_DERIVED_NAME.value] == name]
-    if model_client == mac.MODEL_TDML.value:
-        attr_name_to_use = mac.MODEL_ATTR_CLIENT_NAME.value
-    else:
-        attr_name_to_use = mac.MODEL_ATTR_NAME.value
-    if model_client != mac.MODEL_TDML.value:
-        # 2. Filter out the the row where "AttributeName" is not like __nonsql_argument_
-        model_arguments = model_arguments.assign(notSqlonly=model_arguments.AttributeName.str.contains('__nonsql_argument_'))
-        model_arguments = model_arguments[model_arguments.notSqlonly == 0]
-    else:
-        # 2. Filter out the the row where "ClientSpecificAttributeName" is not NULL
-        model_arguments = model_arguments[model_arguments[attr_name_to_use] != None]
-    # Make sure the non-lazy view exists before SQLAlchemy construct can be used
-    if model_arguments._table_name is None:
-        model_arguments._table_name = df_utils._execute_node_return_db_object_name(model_arguments._nodeid,
-                                                                                   model_arguments._metaexpr)
-    # Since lengthier arguments can be a clob column, casting the smaller to clob
-    # to select one of the two as applicable without values being truncated.
-    select_expression = [model_arguments[attr_name_to_use].expression.label("AttrName"),
-                         case_when([(model_arguments[mac.MODEL_ATTR_VALUE.value].expression == None,
-                                     model_arguments[mac.MODEL_ATTR_VALUEC.value].expression)],
-                                   else_=func.cast(model_arguments[mac.MODEL_ATTR_VALUE.value].expression,
-                                                   type_=CLOB)).expression.label("AttrValue")]
-    # Get the final list of AttNames (Client/SQL) and their values  (CLOB type)
-    final_list = DataFrame.from_query(str(select(select_expression).compile(compile_kwargs={"literal_binds": True})))
-    # Model Parameters
-    final_list = final_list[final_list["AttrName"] != mac.MODEL_CLIENT_CLASS_KEY.value]
-    params = final_list.to_pandas().to_dict()
-    model_parameters = {}
-    formula_related_params = {}
-    index_len = len(params["AttrName"])
-    if model_client == mac.MODEL_TDML.value:
-        for i in range(index_len):
-            # Check if the arguments are related to formula
-            if params["AttrName"][i] == '__all_columns':
-                formula_related_params['__all_columns'] = __cast_arg_values_to_tdml_types(params["AttrValue"][i],
-                                                                                          (str, list))
-            elif params["AttrName"][i] == '__numeric_columns':
-                formula_related_params['__numeric_columns'] = __cast_arg_values_to_tdml_types(params["AttrValue"][i],
-                                                                                              (str, list))
-            elif params["AttrName"][i] == '__categorical_columns':
-                formula_related_params['__categorical_columns'] = __cast_arg_values_to_tdml_types(params["AttrValue"]
-                                                                                                  [i], (str, list))
-            elif params["AttrName"][i] == '__response_column':
-                formula_related_params['__response_column'] = __cast_arg_values_to_tdml_types(params["AttrValue"][i],
-                                                                                              str)
-            else:
-                tdml_type = __get_tdml_type_for_tdml_arg(params["AttrName"][i], function_arg_map)
-                # tdml_type can be None when we do not have information about the argument in
-                # the function argument mapper. Let's ignore it in the retrieval.
-                if tdml_type is not None:
-                    model_parameters[params["AttrName"][i]] = __cast_arg_values_to_tdml_types(params["AttrValue"][i],
-                                                                                              tdml_type)
-    else:
-        formula_args = None
-        for i in range(index_len):
-            model_param_name = __get_arg_tdml_name_from_sql(function_arg_map,
-                                                            arg_type=famc.ARGUMENTS.value,
-                                                            name=params["AttrName"][i].lower())
-            attr_value = params["AttrValue"][i]
-            special_use, used_in = __check_if_client_specific_use(params["AttrName"][i].lower(),
-                                                                  function_arg_map, is_sql_name=True)
-            if special_use:
-                if used_in == famc.USED_IN_FORMULA.value:
-                    # Get formula
-                    if formula_args is None:
-                        formula_args = __get_all_formula_related_args(function_arg_map)
-                    formula_args[params["AttrName"][i].lower()]['arg_value'] = attr_value
-                else:
-                    # Get dictionary of sequence_column arguments
-                    sequence_by = __get_tdml_parameter_value_for_sequence(function_arg_map, attr_value)
-                    if sequence_by:
-                        for seq_key in sequence_by:
-                            model_parameters[seq_key] = sequence_by[seq_key]
-            else:
-                # tdml_name can be None when we do not have information about the SQL argument in
-                # the function argument mapper. Let's ignore it in the retrieval.
-                if model_param_name is None:
-                    warnings.warn(Messages.get_message(MessageCodes.CANNOT_TRANSLATE_TO_TDML_NAME,
-                                                       params["AttrName"][i]))
-                    continue
-                model_param_type = model_param_name[famc.TDML_TYPE.value]
-                model_param_name = model_param_name[famc.TDML_NAME.value]
-                model_parameters[model_param_name] = __cast_arg_values_to_tdml_types(attr_value,
-                                                                                     model_param_type)
-        if formula_args is not None:
-            formula = __get_tdml_parameter_value_for_formula(formula_args, __get_target_column(name))
-            model_parameters[famc.TDML_FORMULA_NAME.value] = formula
-    return model_parameters, formula_related_params
-def __retrieve_model_outputs(name, model_client, function_arg_map):
-    """
-    DESCRIPTION:
-        Internal function to get the output DataFrames corresponding to a saved model given it's name.
-    PARAMETERS:
-        name:
-            Required Argument.
-            Specifies the name of the model to retrieve the model output information for.
-            Types: str
-        model_client:
-            Required Argument.
-            Specifies the name of the client that generated the model.
-            Types: str
-        function_arg_map:
-            Required Argument.
-            Specifies the teradataml-sql map for the function obtained using function_argument_mapper.
-            Types: dict
-    RAISES:
-        TeradataMlException
-    RETURNS:
-        A Pandas DataFrame with the teradataml specific name for the output, and the underlying
-        table names corresponding to them.
-    EXAMPLES:
-        >>> output_df = __retrieve_model_outputs(name, model_client, function_arg_map)
-    """
-    # Let's also get the output table map
-    model_outputs = DataFrame(in_schema(mac.MODEL_CATALOG_DB.value, mac.MODELS_OBJECTS.value))
-    model_outputs = model_outputs[model_outputs[mac.MODEL_DERIVED_NAME.value] == name]
-    if model_client == mac.MODEL_TDML.value:
-        model_outputs = model_outputs.assign(drop_columns=True,
-                                             OutputName=model_outputs[mac.MODEL_OBJ_CLIENT_NAME.value],
-                                             OutputTableName=model_outputs[mac.MODEL_OBJ_TABLE_NAME.value]).to_pandas()
-    else:
-        model_outputs = model_outputs.assign(drop_columns=True,
-                                             OutputName=model_outputs[mac.MODEL_OBJ_NAME.value],
-                                             OutputTableName=model_outputs[mac.MODEL_OBJ_TABLE_NAME.value]).to_pandas()
-        output_names = []
-        output_table_names = []
-        index_len = len(model_outputs["OutputName"])
-        for i in range(index_len):
-            output_name = __get_arg_tdml_name_from_sql(function_arg_map, famc.OUTPUTS.value,
-                                                       model_outputs["OutputName"][i].lower())
-            # We raise an exception when we are not able to get the teradataml name
-            # for the SQL name of the output table.
-            if output_name is None:
-                raise TeradataMlException(Messages.get_message(MessageCodes.CANNOT_TRANSLATE_TO_TDML_NAME),
-                                          MessageCodes.CANNOT_TRANSLATE_TO_TDML_NAME)
-            output_names.append(output_name)
-            output_table_names.append(model_outputs["OutputTableName"][i])
-        model_outputs = pd.DataFrame({'OutputName': output_names, 'OutputTableName': output_table_names})
-    return model_outputs
-def __retrieve_model_inputs(name, model_client, function_arg_map):
-    """
-    DESCRIPTION:
-        Internal function to get the input DataFrames corresponding to a saved model given it's name.
-    PARAMETERS:
-        name:
-            Required Argument.
-            Specifies the name of the model to retrieve the model input information for.
-            Types: str
-        model_client:
-            Required Argument.
-            Specifies the name of the client that generated the model.
-            Types: str
-        function_arg_map:
-            Required Argument.
-            Specifies the teradataml-sql map for the function obtained using function_argument_mapper.
-            Types: dict
-    RETURNS:
-        A dict mapping the teradataml specific name for the input to actual input DataFrame.
-        The dictionary is of the following form:
-            {
-                <tdml_input_name> :
-                    {
-                        'TableName' : <actual_table_name>,
-                        'NRows': <number of rows>,
-                        'NCols': <number of columns>
-                    }
-            }
-    EXAMPLES:
-        >>> input_info = __retrieve_model_inputs(name, model_client, function_arg_map)
-    """
-    model_inputs = {}
-    # First get the model_id
-    model_id = DataFrame(in_schema(mac.MODEL_CATALOG_DB.value, mac.MODELS.value))
-    model_id = model_id[model_id[mac.MODEL_NAME.value] == name].select([mac.MODEL_ID.value]).squeeze().item()
-    # Now find the inputs related to the model
-    model_training_data = DataFrame(in_schema(mac.MODEL_CATALOG_DB.value, mac.MODELS_INPUTSX.value))
-    model_training_data = model_training_data[model_training_data[mac.MODEL_ID.value] == model_id]
-    model_training_data = model_training_data.to_pandas().to_dict()
-    index_len = len(model_training_data[mac.MODEL_ID.value])
-    for i in range(index_len):
-        if model_client == mac.MODEL_TDML.value:
-            input_name = model_training_data[mac.MODEL_INPUT_CLIENT_NAME.value][i]
-            table_name = model_training_data[mac.MODEL_INPUT_TABLE_NAME.value][i]
-        else:
-            input_name = __get_arg_tdml_name_from_sql(function_arg_map, famc.INPUTS.value,
-                                                      model_training_data[mac.MODEL_INPUT_NAME.value][i].lower())
-            # if input_name is None then we have been unable to get the tdml name from the SQL name
-            # for the input. In this case, we ignore the input initialization and continue.
-            if input_name is None:
-                warnings.warn(Messages.get_message(MessageCodes.CANNOT_TRANSLATE_TO_TDML_NAME,
-                                                   model_training_data[mac.MODEL_INPUT_NAME.value][i]))
-                continue
-            table_name = model_training_data[mac.MODEL_INPUT_TABLE_NAME.value][i]
-        # No need for further processing if the TableName associated with an input is None.
-        if table_name is None:
-            continue
-        nrows = model_training_data[mac.MODEL_INPUT_NROWS.value][i]
-        ncols = model_training_data[mac.MODEL_INPUT_NCOLS.value][i]
-        model_inputs[input_name] = {}
-        model_inputs[input_name][mac.MODEL_OBJ_TABLE_NAME.value] = table_name
-        model_inputs[input_name][mac.MODEL_INPUT_NROWS.value] = nrows
-        model_inputs[input_name][mac.MODEL_INPUT_NCOLS.value] = ncols
-    return model_inputs
-def __retrieve_argument_and_output_map(name):
-    """
-    DESCRIPTION:
-        Internal function to get the teradataml function class corresponding to the model to retrieve,
-        along with the attributes and output objects to initialize the model with.
-        The work is delegated to the sibling helpers that look up the model's client/engine/algorithm,
-        its class, its attributes, its inputs and its outputs; this function stitches their results
-        together into a single dictionary.
-    PARAMETERS:
-        name:
-            Required Argument.
-            Specifies the name of the model to retrieve the model attributes and output information for.
-            Types: str
-    RETURNS:
-        A tuple with the following elements:
-        * the function class to initialize for the model,
-        * the model generating engine to help with the initialization, and
-        * the dictionary containing the attributes and their values including output table objects.
-          The dictionary is built by merging, in this order, the model inputs (a DataFrame per input,
-          or None when the DataFrame could not be created), the model parameters, and the output
-          table map; on a key collision the later group wins.
-    EXAMPLES:
-        >>> model_class, model_engine, attribute_dictionary = __retrieve_argument_and_output_map(name)
-    """
-    # First, let's get the model engine, client, algorithm, and other details.
-    model_client, model_engine, model_algorithm, model_details = __retrieve_model_client_engine_algorithm(name, True)
-    # Get the build_time, algorithm_name/model_class, target_column, prediction_type to be returned later as parameters.
-    # model_algorithm is also used to figure out the Python class to be instantiated.
-    build_time = model_details.select([mac.MODEL_DERIVED_BUILD_TIME.value]).squeeze()
-    prediction_type = model_details.select([mac.MODEL_DERIVED_PREDICTION_TYPE.value]).squeeze()
-    target_column = model_details.select([mac.MODEL_DERIVED_TARGET_COLUMN.value]).squeeze()
-    # Get the teradataml model class corresponding to the model
-    function_arg_map = _argument_mapper._get_function_map(engine=model_engine,
-                                                          function_name=model_algorithm.lower())
-    model_class = __retrieve_model_class(name, model_client, function_arg_map)
-    # Get the model attributes and formula related arguments
-    model_parameters, formula_related_args = __retrieve_model_attributes(name, model_client, function_arg_map)
-    # Also append the algorithm_name, build_time, target_column, and prediction_type for the function
-    model_parameters['__algorithm_name'] = model_algorithm
-    # NOTE(review): only build_time is unwrapped with .item(); presumably it is a numpy scalar while
-    # target_column and prediction_type are plain values - confirm against the catalog schema.
-    if build_time is not None:
-        model_parameters['__build_time'] = build_time.item()
-    if target_column is not None:
-        model_parameters['__target_column'] = target_column
-    if prediction_type is not None:
-        model_parameters['__prediction_type'] = prediction_type
-    # Merge the formula related arguments.
-    # On a key collision the formula related value replaces the one already in model_parameters.
-    model_parameters = {**model_parameters, **formula_related_args}
-    # Try plugging in the input DataFrames as well
-    model_inputs = __retrieve_model_inputs(name, model_client, function_arg_map)
-    for input_name in model_inputs:
-        table_name = model_inputs[input_name][mac.MODEL_OBJ_TABLE_NAME.value]
-        sname = UtilFuncs._extract_db_name(table_name)
-        tname = UtilFuncs._extract_table_name(table_name)
-        # Add quotes around the DB and Table names if necessary.
-        # Each name is unquoted first and then passed through the dialect preparer's quote().
-        tdp = preparer(td_dialect)
-        if sname is not None:
-            sname = tdp.quote(UtilFuncs._teradata_unquote_arg(sname, quote='"'))
-        if tname is not None:
-            tname = tdp.quote(UtilFuncs._teradata_unquote_arg(tname, quote='"'))
-        # Try creating the input DataFrames.
-        # The per-input metadata dictionary stored in model_inputs is overwritten here with
-        # either the DataFrame itself or None.
-        try:
-            if sname is None:
-                input = DataFrame(tname)
-            else:
-                input = DataFrame(in_schema(sname, tname))
-            model_inputs[input_name] = input
-        except Exception as err:
-            # We are most likely not able to create a DataFrame on the input as the input may no longer exist.
-            # In this case, we just initialize it to None.
-            # The caught exception itself is not reported; only the generic warning below is issued.
-            warnings.warn("Unable to fetch input details for the '{}' argument "
-                          "from underlying object named '{}'".format(input_name, table_name))
-            model_inputs[input_name] = None
-    # Let's also get the output table map
-    model_outputs = __retrieve_model_outputs(name, model_client, function_arg_map)
-    # NOTE(review): the indexing below assumes to_dict() yields {column: {row_index: value}} with
-    # row indices 0..n-1 - confirm the type returned by __retrieve_model_outputs.
-    tables = model_outputs.to_dict()
-    model_tables = {}
-    index_len = len(tables["OutputName"])
-    for i in range(index_len):
-        output_name = tables["OutputName"][i]
-        # NOTE(review): whether this value is a table name or a table object cannot be told from here.
-        model_tables[output_name] = tables["OutputTableName"][i]
-    # Later groups override earlier ones on a key collision: outputs over parameters over inputs.
-    return model_class, model_engine, {**model_inputs, **model_parameters, **model_tables}
 from teradataml.dataframe.dataframe import DataFrame, in_schema

teradataml 17.20.0.6__py3-none-any.whl → 20.0.0.0__py3-none-any.whl

Potentially problematic release.

teradataml 17.20.0.6py3-none-any.whl → 20.0.0.0py3-none-any.whl