PyPI - teradataml - Versions diffs - 17.20.0.6__py3-none-any.whl → 20.0.0.0__py3-none-any.whl - Mend

teradataml 17.20.0.6-py3-none-any.whl → 20.0.0.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of teradataml might be problematic. Click here for more details.

Files changed (432)

teradataml/LICENSE-3RD-PARTY.pdf +0 -0
teradataml/LICENSE.pdf +0 -0
teradataml/README.md +238 -1
teradataml/__init__.py +13 -3
teradataml/_version.py +1 -1
teradataml/analytics/Transformations.py +4 -4
teradataml/analytics/__init__.py +0 -2
teradataml/analytics/analytic_function_executor.py +3 -0
teradataml/analytics/json_parser/utils.py +13 -12
teradataml/analytics/sqle/DecisionTreePredict.py +15 -30
teradataml/analytics/sqle/NaiveBayesPredict.py +11 -20
teradataml/analytics/sqle/__init__.py +0 -13
teradataml/analytics/utils.py +1 -0
teradataml/analytics/valib.py +3 -0
teradataml/automl/__init__.py +1628 -0
teradataml/automl/custom_json_utils.py +1270 -0
teradataml/automl/data_preparation.py +993 -0
teradataml/automl/data_transformation.py +727 -0
teradataml/automl/feature_engineering.py +1648 -0
teradataml/automl/feature_exploration.py +547 -0
teradataml/automl/model_evaluation.py +163 -0
teradataml/automl/model_training.py +887 -0
teradataml/catalog/__init__.py +0 -2
teradataml/catalog/byom.py +49 -6
teradataml/catalog/function_argument_mapper.py +0 -2
teradataml/catalog/model_cataloging_utils.py +2 -1021
teradataml/common/aed_utils.py +6 -2
teradataml/common/constants.py +50 -58
teradataml/common/deprecations.py +160 -0
teradataml/common/garbagecollector.py +61 -104
teradataml/common/messagecodes.py +27 -36
teradataml/common/messages.py +11 -15
teradataml/common/utils.py +205 -287
teradataml/common/wrapper_utils.py +1 -110
teradataml/context/context.py +150 -78
teradataml/data/bank_churn.csv +10001 -0
teradataml/data/bmi.csv +501 -0
teradataml/data/docs/sqle/docs_17_10/BincodeFit.py +3 -3
teradataml/data/docs/sqle/docs_17_10/BincodeTransform.py +6 -5
teradataml/data/docs/sqle/docs_17_10/Fit.py +1 -1
teradataml/data/docs/sqle/docs_17_10/OneHotEncodingTransform.py +1 -1
teradataml/data/docs/sqle/docs_17_10/OutlierFilterTransform.py +1 -1
teradataml/data/docs/sqle/docs_17_10/PolynomialFeaturesTransform.py +2 -2
teradataml/data/docs/sqle/docs_17_10/RowNormalizeTransform.py +2 -1
teradataml/data/docs/sqle/docs_17_10/ScaleTransform.py +1 -0
teradataml/data/docs/sqle/docs_17_10/SimpleImputeTransform.py +1 -1
teradataml/data/docs/sqle/docs_17_10/Transform.py +2 -1
teradataml/data/docs/sqle/docs_17_20/BincodeFit.py +3 -3
teradataml/data/docs/sqle/docs_17_20/BincodeTransform.py +6 -5
teradataml/data/docs/sqle/docs_17_20/Fit.py +1 -1
teradataml/data/docs/sqle/docs_17_20/GLM.py +1 -1
teradataml/data/docs/sqle/docs_17_20/GLMPredictPerSegment.py +9 -10
teradataml/data/docs/sqle/docs_17_20/KMeansPredict.py +3 -2
teradataml/data/docs/sqle/docs_17_20/NaiveBayesTextClassifierPredict.py +16 -15
teradataml/data/docs/sqle/docs_17_20/NaiveBayesTextClassifierTrainer.py +2 -2
teradataml/data/docs/sqle/docs_17_20/NonLinearCombineFit.py +2 -2
teradataml/data/docs/sqle/docs_17_20/NonLinearCombineTransform.py +8 -8
teradataml/data/docs/sqle/docs_17_20/OneClassSVMPredict.py +21 -20
teradataml/data/docs/sqle/docs_17_20/OneHotEncodingTransform.py +1 -1
teradataml/data/docs/sqle/docs_17_20/OutlierFilterTransform.py +8 -3
teradataml/data/docs/sqle/docs_17_20/PolynomialFeaturesTransform.py +6 -5
teradataml/data/docs/sqle/docs_17_20/RandomProjectionTransform.py +6 -6
teradataml/data/docs/sqle/docs_17_20/RowNormalizeTransform.py +2 -1
teradataml/data/docs/sqle/docs_17_20/SVM.py +1 -1
teradataml/data/docs/sqle/docs_17_20/SVMPredict.py +16 -16
teradataml/data/docs/sqle/docs_17_20/ScaleTransform.py +1 -0
teradataml/data/docs/sqle/docs_17_20/SimpleImputeTransform.py +3 -2
teradataml/data/docs/sqle/docs_17_20/TDDecisionForestPredict.py +4 -4
teradataml/data/docs/sqle/docs_17_20/TDGLMPredict.py +19 -19
teradataml/data/docs/sqle/docs_17_20/TargetEncodingTransform.py +5 -4
teradataml/data/docs/sqle/docs_17_20/Transform.py +2 -2
teradataml/data/docs/sqle/docs_17_20/XGBoostPredict.py +9 -9
teradataml/data/fish.csv +160 -0
teradataml/data/glass_types.csv +215 -0
teradataml/data/insurance.csv +1 -1
teradataml/data/iris_data.csv +151 -0
teradataml/data/jsons/sqle/17.10/TD_FunctionTransform.json +1 -0
teradataml/data/jsons/sqle/17.10/TD_OneHotEncodingTransform.json +1 -0
teradataml/data/jsons/sqle/17.10/TD_OutlierFilterTransform.json +1 -0
teradataml/data/jsons/sqle/17.10/TD_PolynomialFeaturesTransform.json +1 -0
teradataml/data/jsons/sqle/17.10/TD_RowNormalizeTransform.json +1 -0
teradataml/data/jsons/sqle/17.10/TD_ScaleTransform.json +1 -0
teradataml/data/jsons/sqle/17.10/TD_SimpleImputeTransform.json +1 -0
teradataml/data/load_example_data.py +3 -0
teradataml/data/multi_model_classification.csv +401 -0
teradataml/data/multi_model_regression.csv +401 -0
teradataml/data/openml_example.json +63 -0
teradataml/data/scripts/deploy_script.py +65 -0
teradataml/data/scripts/mapper.R +20 -0
teradataml/data/scripts/sklearn/__init__.py +0 -0
teradataml/data/scripts/sklearn/sklearn_fit.py +175 -0
teradataml/data/scripts/sklearn/sklearn_fit_predict.py +135 -0
teradataml/data/scripts/sklearn/sklearn_function.template +113 -0
teradataml/data/scripts/sklearn/sklearn_model_selection_split.py +158 -0
teradataml/data/scripts/sklearn/sklearn_neighbors.py +152 -0
teradataml/data/scripts/sklearn/sklearn_score.py +128 -0
teradataml/data/scripts/sklearn/sklearn_transform.py +179 -0
teradataml/data/templates/open_source_ml.json +9 -0
teradataml/data/teradataml_example.json +73 -1
teradataml/data/test_classification.csv +101 -0
teradataml/data/test_prediction.csv +101 -0
teradataml/data/test_regression.csv +101 -0
teradataml/data/train_multiclass.csv +101 -0
teradataml/data/train_regression.csv +101 -0
teradataml/data/train_regression_multiple_labels.csv +101 -0
teradataml/data/wine_data.csv +1600 -0
teradataml/dataframe/copy_to.py +79 -13
teradataml/dataframe/data_transfer.py +8 -0
teradataml/dataframe/dataframe.py +910 -311
teradataml/dataframe/dataframe_utils.py +102 -5
teradataml/dataframe/fastload.py +11 -3
teradataml/dataframe/setop.py +15 -2
teradataml/dataframe/sql.py +3735 -77
teradataml/dataframe/sql_function_parameters.py +56 -5
teradataml/dataframe/vantage_function_types.py +45 -1
teradataml/dataframe/window.py +30 -29
teradataml/dbutils/dbutils.py +18 -1
teradataml/geospatial/geodataframe.py +18 -7
teradataml/geospatial/geodataframecolumn.py +5 -0
teradataml/hyperparameter_tuner/optimizer.py +910 -120
teradataml/hyperparameter_tuner/utils.py +131 -37
teradataml/lib/aed_0_1.dll +0 -0
teradataml/lib/libaed_0_1.dylib +0 -0
teradataml/lib/libaed_0_1.so +0 -0
teradataml/libaed_0_1.dylib +0 -0
teradataml/libaed_0_1.so +0 -0
teradataml/opensource/__init__.py +1 -0
teradataml/opensource/sklearn/__init__.py +1 -0
teradataml/opensource/sklearn/_class.py +255 -0
teradataml/opensource/sklearn/_sklearn_wrapper.py +1668 -0
teradataml/opensource/sklearn/_wrapper_utils.py +268 -0
teradataml/opensource/sklearn/constants.py +54 -0
teradataml/options/__init__.py +3 -6
teradataml/options/configure.py +21 -20
teradataml/scriptmgmt/UserEnv.py +61 -5
teradataml/scriptmgmt/lls_utils.py +135 -53
teradataml/table_operators/Apply.py +38 -6
teradataml/table_operators/Script.py +45 -308
teradataml/table_operators/TableOperator.py +182 -591
teradataml/table_operators/__init__.py +0 -1
teradataml/table_operators/table_operator_util.py +32 -40
teradataml/utils/validators.py +127 -3
{teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/METADATA +243 -3
{teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/RECORD +147 -391
teradataml/analytics/mle/AdaBoost.py +0 -651
teradataml/analytics/mle/AdaBoostPredict.py +0 -564
teradataml/analytics/mle/Antiselect.py +0 -342
teradataml/analytics/mle/Arima.py +0 -641
teradataml/analytics/mle/ArimaPredict.py +0 -477
teradataml/analytics/mle/Attribution.py +0 -1070
teradataml/analytics/mle/Betweenness.py +0 -658
teradataml/analytics/mle/Burst.py +0 -711
teradataml/analytics/mle/CCM.py +0 -600
teradataml/analytics/mle/CCMPrepare.py +0 -324
teradataml/analytics/mle/CFilter.py +0 -460
teradataml/analytics/mle/ChangePointDetection.py +0 -572
teradataml/analytics/mle/ChangePointDetectionRT.py +0 -477
teradataml/analytics/mle/Closeness.py +0 -737
teradataml/analytics/mle/ConfusionMatrix.py +0 -420
teradataml/analytics/mle/Correlation.py +0 -477
teradataml/analytics/mle/Correlation2.py +0 -573
teradataml/analytics/mle/CoxHazardRatio.py +0 -679
teradataml/analytics/mle/CoxPH.py +0 -556
teradataml/analytics/mle/CoxSurvival.py +0 -478
teradataml/analytics/mle/CumulativeMovAvg.py +0 -363
teradataml/analytics/mle/DTW.py +0 -623
teradataml/analytics/mle/DWT.py +0 -564
teradataml/analytics/mle/DWT2D.py +0 -599
teradataml/analytics/mle/DecisionForest.py +0 -716
teradataml/analytics/mle/DecisionForestEvaluator.py +0 -363
teradataml/analytics/mle/DecisionForestPredict.py +0 -561
teradataml/analytics/mle/DecisionTree.py +0 -830
teradataml/analytics/mle/DecisionTreePredict.py +0 -528
teradataml/analytics/mle/ExponentialMovAvg.py +0 -418
teradataml/analytics/mle/FMeasure.py +0 -402
teradataml/analytics/mle/FPGrowth.py +0 -734
teradataml/analytics/mle/FrequentPaths.py +0 -695
teradataml/analytics/mle/GLM.py +0 -558
teradataml/analytics/mle/GLML1L2.py +0 -547
teradataml/analytics/mle/GLML1L2Predict.py +0 -519
teradataml/analytics/mle/GLMPredict.py +0 -529
teradataml/analytics/mle/HMMDecoder.py +0 -945
teradataml/analytics/mle/HMMEvaluator.py +0 -901
teradataml/analytics/mle/HMMSupervised.py +0 -521
teradataml/analytics/mle/HMMUnsupervised.py +0 -572
teradataml/analytics/mle/Histogram.py +0 -561
teradataml/analytics/mle/IDWT.py +0 -476
teradataml/analytics/mle/IDWT2D.py +0 -493
teradataml/analytics/mle/IdentityMatch.py +0 -763
teradataml/analytics/mle/Interpolator.py +0 -918
teradataml/analytics/mle/KMeans.py +0 -485
teradataml/analytics/mle/KNN.py +0 -627
teradataml/analytics/mle/KNNRecommender.py +0 -488
teradataml/analytics/mle/KNNRecommenderPredict.py +0 -581
teradataml/analytics/mle/LAR.py +0 -439
teradataml/analytics/mle/LARPredict.py +0 -478
teradataml/analytics/mle/LDA.py +0 -548
teradataml/analytics/mle/LDAInference.py +0 -492
teradataml/analytics/mle/LDATopicSummary.py +0 -464
teradataml/analytics/mle/LevenshteinDistance.py +0 -450
teradataml/analytics/mle/LinReg.py +0 -433
teradataml/analytics/mle/LinRegPredict.py +0 -438
teradataml/analytics/mle/MinHash.py +0 -544
teradataml/analytics/mle/Modularity.py +0 -587
teradataml/analytics/mle/NEREvaluator.py +0 -410
teradataml/analytics/mle/NERExtractor.py +0 -595
teradataml/analytics/mle/NERTrainer.py +0 -458
teradataml/analytics/mle/NGrams.py +0 -570
teradataml/analytics/mle/NPath.py +0 -634
teradataml/analytics/mle/NTree.py +0 -549
teradataml/analytics/mle/NaiveBayes.py +0 -462
teradataml/analytics/mle/NaiveBayesPredict.py +0 -513
teradataml/analytics/mle/NaiveBayesTextClassifier.py +0 -607
teradataml/analytics/mle/NaiveBayesTextClassifier2.py +0 -531
teradataml/analytics/mle/NaiveBayesTextClassifierPredict.py +0 -799
teradataml/analytics/mle/NamedEntityFinder.py +0 -529
teradataml/analytics/mle/NamedEntityFinderEvaluator.py +0 -414
teradataml/analytics/mle/NamedEntityFinderTrainer.py +0 -396
teradataml/analytics/mle/POSTagger.py +0 -417
teradataml/analytics/mle/Pack.py +0 -411
teradataml/analytics/mle/PageRank.py +0 -535
teradataml/analytics/mle/PathAnalyzer.py +0 -426
teradataml/analytics/mle/PathGenerator.py +0 -367
teradataml/analytics/mle/PathStart.py +0 -464
teradataml/analytics/mle/PathSummarizer.py +0 -470
teradataml/analytics/mle/Pivot.py +0 -471
teradataml/analytics/mle/ROC.py +0 -425
teradataml/analytics/mle/RandomSample.py +0 -637
teradataml/analytics/mle/RandomWalkSample.py +0 -490
teradataml/analytics/mle/SAX.py +0 -779
teradataml/analytics/mle/SVMDense.py +0 -677
teradataml/analytics/mle/SVMDensePredict.py +0 -536
teradataml/analytics/mle/SVMDenseSummary.py +0 -437
teradataml/analytics/mle/SVMSparse.py +0 -557
teradataml/analytics/mle/SVMSparsePredict.py +0 -553
teradataml/analytics/mle/SVMSparseSummary.py +0 -435
teradataml/analytics/mle/Sampling.py +0 -549
teradataml/analytics/mle/Scale.py +0 -565
teradataml/analytics/mle/ScaleByPartition.py +0 -496
teradataml/analytics/mle/ScaleMap.py +0 -378
teradataml/analytics/mle/ScaleSummary.py +0 -320
teradataml/analytics/mle/SentenceExtractor.py +0 -363
teradataml/analytics/mle/SentimentEvaluator.py +0 -432
teradataml/analytics/mle/SentimentExtractor.py +0 -578
teradataml/analytics/mle/SentimentTrainer.py +0 -405
teradataml/analytics/mle/SeriesSplitter.py +0 -641
teradataml/analytics/mle/Sessionize.py +0 -475
teradataml/analytics/mle/SimpleMovAvg.py +0 -397
teradataml/analytics/mle/StringSimilarity.py +0 -425
teradataml/analytics/mle/TF.py +0 -389
teradataml/analytics/mle/TFIDF.py +0 -504
teradataml/analytics/mle/TextChunker.py +0 -414
teradataml/analytics/mle/TextClassifier.py +0 -399
teradataml/analytics/mle/TextClassifierEvaluator.py +0 -413
teradataml/analytics/mle/TextClassifierTrainer.py +0 -565
teradataml/analytics/mle/TextMorph.py +0 -494
teradataml/analytics/mle/TextParser.py +0 -623
teradataml/analytics/mle/TextTagger.py +0 -530
teradataml/analytics/mle/TextTokenizer.py +0 -502
teradataml/analytics/mle/UnivariateStatistics.py +0 -488
teradataml/analytics/mle/Unpack.py +0 -526
teradataml/analytics/mle/Unpivot.py +0 -438
teradataml/analytics/mle/VarMax.py +0 -776
teradataml/analytics/mle/VectorDistance.py +0 -762
teradataml/analytics/mle/WeightedMovAvg.py +0 -400
teradataml/analytics/mle/XGBoost.py +0 -842
teradataml/analytics/mle/XGBoostPredict.py +0 -627
teradataml/analytics/mle/__init__.py +0 -123
teradataml/analytics/mle/json/adaboost_mle.json +0 -135
teradataml/analytics/mle/json/adaboostpredict_mle.json +0 -85
teradataml/analytics/mle/json/antiselect_mle.json +0 -34
teradataml/analytics/mle/json/antiselect_mle_mle.json +0 -34
teradataml/analytics/mle/json/arima_mle.json +0 -172
teradataml/analytics/mle/json/arimapredict_mle.json +0 -52
teradataml/analytics/mle/json/attribution_mle_mle.json +0 -143
teradataml/analytics/mle/json/betweenness_mle.json +0 -97
teradataml/analytics/mle/json/burst_mle.json +0 -140
teradataml/analytics/mle/json/ccm_mle.json +0 -124
teradataml/analytics/mle/json/ccmprepare_mle.json +0 -14
teradataml/analytics/mle/json/cfilter_mle.json +0 -93
teradataml/analytics/mle/json/changepointdetection_mle.json +0 -92
teradataml/analytics/mle/json/changepointdetectionrt_mle.json +0 -78
teradataml/analytics/mle/json/closeness_mle.json +0 -104
teradataml/analytics/mle/json/confusionmatrix_mle.json +0 -79
teradataml/analytics/mle/json/correlation_mle.json +0 -86
teradataml/analytics/mle/json/correlationreduce_mle.json +0 -49
teradataml/analytics/mle/json/coxhazardratio_mle.json +0 -89
teradataml/analytics/mle/json/coxph_mle.json +0 -98
teradataml/analytics/mle/json/coxsurvival_mle.json +0 -79
teradataml/analytics/mle/json/cumulativemovavg_mle.json +0 -34
teradataml/analytics/mle/json/decisionforest_mle.json +0 -167
teradataml/analytics/mle/json/decisionforestevaluator_mle.json +0 -33
teradataml/analytics/mle/json/decisionforestpredict_mle_mle.json +0 -74
teradataml/analytics/mle/json/decisiontree_mle.json +0 -194
teradataml/analytics/mle/json/decisiontreepredict_mle_mle.json +0 -86
teradataml/analytics/mle/json/dtw_mle.json +0 -97
teradataml/analytics/mle/json/dwt2d_mle.json +0 -116
teradataml/analytics/mle/json/dwt_mle.json +0 -101
teradataml/analytics/mle/json/exponentialmovavg_mle.json +0 -55
teradataml/analytics/mle/json/fmeasure_mle.json +0 -58
teradataml/analytics/mle/json/fpgrowth_mle.json +0 -159
teradataml/analytics/mle/json/frequentpaths_mle.json +0 -129
teradataml/analytics/mle/json/glm_mle.json +0 -111
teradataml/analytics/mle/json/glml1l2_mle.json +0 -106
teradataml/analytics/mle/json/glml1l2predict_mle.json +0 -57
teradataml/analytics/mle/json/glmpredict_mle_mle.json +0 -74
teradataml/analytics/mle/json/histogram_mle.json +0 -100
teradataml/analytics/mle/json/hmmdecoder_mle.json +0 -192
teradataml/analytics/mle/json/hmmevaluator_mle.json +0 -206
teradataml/analytics/mle/json/hmmsupervised_mle.json +0 -91
teradataml/analytics/mle/json/hmmunsupervised_mle.json +0 -114
teradataml/analytics/mle/json/identitymatch_mle.json +0 -88
teradataml/analytics/mle/json/idwt2d_mle.json +0 -73
teradataml/analytics/mle/json/idwt_mle.json +0 -66
teradataml/analytics/mle/json/interpolator_mle.json +0 -151
teradataml/analytics/mle/json/kmeans_mle.json +0 -97
teradataml/analytics/mle/json/knn_mle.json +0 -141
teradataml/analytics/mle/json/knnrecommender_mle.json +0 -111
teradataml/analytics/mle/json/knnrecommenderpredict_mle.json +0 -75
teradataml/analytics/mle/json/lar_mle.json +0 -78
teradataml/analytics/mle/json/larpredict_mle.json +0 -69
teradataml/analytics/mle/json/lda_mle.json +0 -130
teradataml/analytics/mle/json/ldainference_mle.json +0 -78
teradataml/analytics/mle/json/ldatopicsummary_mle.json +0 -64
teradataml/analytics/mle/json/levenshteindistance_mle.json +0 -92
teradataml/analytics/mle/json/linreg_mle.json +0 -42
teradataml/analytics/mle/json/linregpredict_mle.json +0 -56
teradataml/analytics/mle/json/minhash_mle.json +0 -113
teradataml/analytics/mle/json/modularity_mle.json +0 -91
teradataml/analytics/mle/json/naivebayespredict_mle_mle.json +0 -85
teradataml/analytics/mle/json/naivebayesreduce_mle.json +0 -52
teradataml/analytics/mle/json/naivebayestextclassifierpredict_mle_mle.json +0 -147
teradataml/analytics/mle/json/naivebayestextclassifiertrainer2_mle.json +0 -108
teradataml/analytics/mle/json/naivebayestextclassifiertrainer_mle.json +0 -102
teradataml/analytics/mle/json/namedentityfinder_mle.json +0 -84
teradataml/analytics/mle/json/namedentityfinderevaluatorreduce_mle.json +0 -43
teradataml/analytics/mle/json/namedentityfindertrainer_mle.json +0 -64
teradataml/analytics/mle/json/nerevaluator_mle.json +0 -54
teradataml/analytics/mle/json/nerextractor_mle.json +0 -87
teradataml/analytics/mle/json/nertrainer_mle.json +0 -89
teradataml/analytics/mle/json/ngrams_mle.json +0 -137
teradataml/analytics/mle/json/ngramsplitter_mle_mle.json +0 -137
teradataml/analytics/mle/json/npath@coprocessor_mle.json +0 -73
teradataml/analytics/mle/json/ntree@coprocessor_mle.json +0 -123
teradataml/analytics/mle/json/pack_mle.json +0 -58
teradataml/analytics/mle/json/pack_mle_mle.json +0 -58
teradataml/analytics/mle/json/pagerank_mle.json +0 -81
teradataml/analytics/mle/json/pathanalyzer_mle.json +0 -63
teradataml/analytics/mle/json/pathgenerator_mle.json +0 -40
teradataml/analytics/mle/json/pathstart_mle.json +0 -62
teradataml/analytics/mle/json/pathsummarizer_mle.json +0 -72
teradataml/analytics/mle/json/pivoting_mle.json +0 -71
teradataml/analytics/mle/json/postagger_mle.json +0 -51
teradataml/analytics/mle/json/randomsample_mle.json +0 -131
teradataml/analytics/mle/json/randomwalksample_mle.json +0 -85
teradataml/analytics/mle/json/roc_mle.json +0 -73
teradataml/analytics/mle/json/sampling_mle.json +0 -75
teradataml/analytics/mle/json/sax_mle.json +0 -154
teradataml/analytics/mle/json/scale_mle.json +0 -93
teradataml/analytics/mle/json/scalebypartition_mle.json +0 -89
teradataml/analytics/mle/json/scalemap_mle.json +0 -44
teradataml/analytics/mle/json/scalesummary_mle.json +0 -14
teradataml/analytics/mle/json/sentenceextractor_mle.json +0 -41
teradataml/analytics/mle/json/sentimentevaluator_mle.json +0 -43
teradataml/analytics/mle/json/sentimentextractor_mle.json +0 -100
teradataml/analytics/mle/json/sentimenttrainer_mle.json +0 -68
teradataml/analytics/mle/json/seriessplitter_mle.json +0 -133
teradataml/analytics/mle/json/sessionize_mle_mle.json +0 -62
teradataml/analytics/mle/json/simplemovavg_mle.json +0 -48
teradataml/analytics/mle/json/stringsimilarity_mle.json +0 -50
teradataml/analytics/mle/json/stringsimilarity_mle_mle.json +0 -50
teradataml/analytics/mle/json/svmdense_mle.json +0 -165
teradataml/analytics/mle/json/svmdensepredict_mle.json +0 -95
teradataml/analytics/mle/json/svmdensesummary_mle.json +0 -58
teradataml/analytics/mle/json/svmsparse_mle.json +0 -148
teradataml/analytics/mle/json/svmsparsepredict_mle_mle.json +0 -103
teradataml/analytics/mle/json/svmsparsesummary_mle.json +0 -57
teradataml/analytics/mle/json/textchunker_mle.json +0 -40
teradataml/analytics/mle/json/textclassifier_mle.json +0 -51
teradataml/analytics/mle/json/textclassifierevaluator_mle.json +0 -43
teradataml/analytics/mle/json/textclassifiertrainer_mle.json +0 -103
teradataml/analytics/mle/json/textmorph_mle.json +0 -63
teradataml/analytics/mle/json/textparser_mle.json +0 -166
teradataml/analytics/mle/json/texttagger_mle.json +0 -81
teradataml/analytics/mle/json/texttokenizer_mle.json +0 -91
teradataml/analytics/mle/json/tf_mle.json +0 -33
teradataml/analytics/mle/json/tfidf_mle.json +0 -34
teradataml/analytics/mle/json/univariatestatistics_mle.json +0 -81
teradataml/analytics/mle/json/unpack_mle.json +0 -91
teradataml/analytics/mle/json/unpack_mle_mle.json +0 -91
teradataml/analytics/mle/json/unpivoting_mle.json +0 -63
teradataml/analytics/mle/json/varmax_mle.json +0 -176
teradataml/analytics/mle/json/vectordistance_mle.json +0 -179
teradataml/analytics/mle/json/weightedmovavg_mle.json +0 -48
teradataml/analytics/mle/json/xgboost_mle.json +0 -178
teradataml/analytics/mle/json/xgboostpredict_mle.json +0 -104
teradataml/analytics/sqle/Antiselect.py +0 -321
teradataml/analytics/sqle/Attribution.py +0 -603
teradataml/analytics/sqle/DecisionForestPredict.py +0 -408
teradataml/analytics/sqle/GLMPredict.py +0 -430
teradataml/analytics/sqle/MovingAverage.py +0 -543
teradataml/analytics/sqle/NGramSplitter.py +0 -548
teradataml/analytics/sqle/NPath.py +0 -632
teradataml/analytics/sqle/NaiveBayesTextClassifierPredict.py +0 -515
teradataml/analytics/sqle/Pack.py +0 -388
teradataml/analytics/sqle/SVMSparsePredict.py +0 -464
teradataml/analytics/sqle/Sessionize.py +0 -390
teradataml/analytics/sqle/StringSimilarity.py +0 -400
teradataml/analytics/sqle/Unpack.py +0 -503
teradataml/analytics/sqle/json/antiselect_sqle.json +0 -21
teradataml/analytics/sqle/json/attribution_sqle.json +0 -92
teradataml/analytics/sqle/json/decisionforestpredict_sqle.json +0 -48
teradataml/analytics/sqle/json/glmpredict_sqle.json +0 -48
teradataml/analytics/sqle/json/h2opredict_sqle.json +0 -63
teradataml/analytics/sqle/json/movingaverage_sqle.json +0 -58
teradataml/analytics/sqle/json/naivebayestextclassifierpredict_sqle.json +0 -76
teradataml/analytics/sqle/json/ngramsplitter_sqle.json +0 -126
teradataml/analytics/sqle/json/npath_sqle.json +0 -67
teradataml/analytics/sqle/json/pack_sqle.json +0 -47
teradataml/analytics/sqle/json/pmmlpredict_sqle.json +0 -55
teradataml/analytics/sqle/json/sessionize_sqle.json +0 -43
teradataml/analytics/sqle/json/stringsimilarity_sqle.json +0 -39
teradataml/analytics/sqle/json/svmsparsepredict_sqle.json +0 -74
teradataml/analytics/sqle/json/unpack_sqle.json +0 -80
teradataml/catalog/model_cataloging.py +0 -980
teradataml/config/mlengine_alias_definitions_v1.0 +0 -118
teradataml/config/mlengine_alias_definitions_v1.1 +0 -127
teradataml/config/mlengine_alias_definitions_v1.3 +0 -129
teradataml/table_operators/sandbox_container_util.py +0 -643
{teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/WHEEL +0 -0
{teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/top_level.txt +0 -0
{teradataml-17.20.0.6.dist-info → teradataml-20.0.0.0.dist-info}/zip-safe +0 -0

teradataml/table_operators/TableOperator.py CHANGED Viewed

@@ -13,6 +13,9 @@
 # ##################################################################
 import os
+import time
+import uuid
+from math import floor
 import tarfile
 import subprocess
 from pathlib import Path
@@ -495,177 +498,9 @@ class TableOperator:
                 awu_matrix_returns.append(["values in returns", self.returns[key], False, self._supported_returns_datatypes])
             _Validators._validate_function_arguments(awu_matrix_returns)
-    def setup_test_env(self, docker_image_location):
-        """
-                DESCRIPTION:
-                    Function enables user to load already downloaded sandbox image.
-                    This will enable users to run the Python scripts on client machine outside of
-                    Open Analytics Framework.
-                PARAMETERS:
-                    docker_image_location:
-                        Required Argument.
-                        Specifies the location of image on user's system.
-                        Types: str
-                        Note:
-                            For location to download docker image refer teradataml User Guide.
-                RETURNS:
-                    None.
-                RAISES:
-                    TeradataMlException
-                EXAMPLES:
-                    # Load example data.
-                    load_example_data("Script", ["barrier"])
-                    # Example - The script mapper.py reads in a line of text input ("Old Macdonald Had A Farm") from csv and
-                    # splits the line into individual words, emitting a new row for each word.
-                    # Create teradataml DataFrame objects.
-                    >>> barrierdf = DataFrame.from_table("barrier")
-                    # Create remote user environment.
-                    >>> test_env = create_env('test_env', 'python_3.7.9', 'Demo environment');
-                    User environment test_env created.
-                    # Create an Apply object that allows user to execute script using Open Analytics Framework.
-                    >>> apply_obj = Apply(data=barrierdf,
-                                script_name='mapper.py',
-                                files_local_path='data/scripts',
-                                apply_command='python mapper.py',
-                                delimiter=',',
-                                env_name = "test_env",
-                                data_partition_column="Id",
-                                returns={"word": VARCHAR(15), "count_input": VARCHAR(2)}
-                                )
-                    # Run user script locally within docker container and using data from csv.
-                    # This helps the user to fix script level issues outside of Open Analytics Framework.
-                    # Setup the environment by providing local path to docker image file.
-                    >>> apply_obj.setup_test_env(docker_image_location='/tmp/sto_sandbox_docker_image.tar'))
-                    Loading image from /tmp/sto_sandbox_docker_image.tar. It may take few minutes.
-                    Image loaded successfully.
-        """
-        self.awu_matrix_setup=[]
-        self.awu_matrix_setup.append((["docker_image_location", docker_image_location, False, (str), True]))
-        # Validate missing arguments
-        _Validators._validate_missing_required_arguments(self.awu_matrix_setup)
-        # Validate argument types
-        _Validators._validate_function_arguments(self.awu_matrix_setup)
-        # get the frame object of the function.
-        import inspect
-        frame = inspect.currentframe()
-        # Validate argument types.
-        _Validators._validate_module_presence('docker', frame.f_code.co_name)
-        import docker
-        # Load image from user provided location
-        client = docker.from_env()
-        if not Path(docker_image_location).exists():
-            raise TeradataMlException(
-                Messages.get_message(MessageCodes.INPUT_FILE_NOT_FOUND).format(docker_image_location),
-                MessageCodes.INPUT_FILE_NOT_FOUND)
-        else:
-            try:
-                print("Loading image from {0}. It may take few minutes.".format(docker_image_location))
-                with open(docker_image_location, 'rb') as f:
-                    client.images.load(f)
-                print("Image loaded successfully.")
-            except:
-                raise
-        # Set _latest_sandbox_exists to True - which indicates sandbox image for STO exists on the system
-        configure._latest_sandbox_exists = True
-    def setup_sto_env(self, docker_image_location):
-        """
-        DESCRIPTION:
-            Function enables user to load already downloaded sandbox image.
-        PARAMETERS:
-            docker_image_location:
-                Required Argument.
-                Specifies the location of image on user's system.
-                Types: str
-                Note:
-                    For location to download docker image refer teradataml User Guide.
-        RETURNS:
-            None.
-        RAISES:
-            TeradataMlException
-        EXAMPLES:
-            # Note - Refer to User Guide for setting search path and required permissions.
-            # Load example data.
-            load_example_data("Script", ["barrier"])
-            # Example - The script mapper.py reads in a line of text input
-            # ("Old Macdonald Had A Farm") from csv and
-            # splits the line into individual words, emitting a new row for each word.
-            # Create teradataml DataFrame objects.
-            >>> barrierdf = DataFrame.from_table("barrier")
-            # Set SEARCHUIFDBPATH.
-            >>> execute_sql("SET SESSION SEARCHUIFDBPATH = alice;")
-            # Create a Script object that allows us to execute script on Vantage.
-            >>> import os
-            >>> td_path = os.path.dirname(teradataml.__file__)
-            >>> from teradatasqlalchemy import VARCHAR
-            >>> sto = Script(data=barrierdf,
-            ...              script_name='mapper.py',
-            ...              files_local_path= os.path.join(td_path, 'data', 'scripts'),
-            ...              script_command='python ./alice/mapper.py',
-            ...              data_order_column="Id",
-            ...              is_local_order=False,
-            ...              nulls_first=False,
-            ...              sort_ascending=False,
-            ...              charset='latin',
-            ...              returns=OrderedDict([("word", VARCHAR(15)),("count_input", VARCHAR(2))]))
-            # Run user script locally within docker container and using data from csv.
-            # This helps the user to fix script level issues outside Vantage.
-            # Setup the environment by providing local path to docker image file.
-            >>> sto.setup_sto_env(docker_image_location='/tmp/sto_sandbox_docker_image.tar')
-            Loading image from /tmp/sto_sandbox_docker_image.tar. It may take few minutes.
-            Image loaded successfully.
-            Starting a container for stosandbox:1.0 image.
-            Container d7c73cb498c79a082180576bb5b10bb07b52efdd3026856146fc15e91147b19f
-            started successfully.
-        """
-        self.awu_matrix_setup = []
-        self.awu_matrix_setup.append((["docker_image_location", docker_image_location,
-                                       False, (str), True]))
-        # Validate missing arguments.
-        _Validators._validate_missing_required_arguments(self.awu_matrix_setup)
-        # Validate argument types.
-        _Validators._validate_function_arguments(self.awu_matrix_setup)
-        from teradataml.table_operators.sandbox_container_util import setup_sandbox_env
-        setup_sandbox_env(sandbox_image_location=docker_image_location,
-                          sandbox_image_name='stosandbox:1.0')
-        # Set _latest_sandbox_exists to True - which indicates sandbox image for STO
-        # exists on the system.
-        from teradataml.options.configure import configure
-        configure._latest_sandbox_exists = True
     def test_script(self, supporting_files=None, input_data_file=None, script_args="",
-                    exec_mode='sandbox', **kwargs):
+                    exec_mode='local', **kwargs):
         """
         DESCRIPTION:
             Function enables user to run script in docker container environment outside
@@ -697,10 +532,9 @@ class TableOperator:
             exec_mode:
                 Optional Argument.
                 Specifies the mode in which user wants to test the script.
-                If set to 'sandbox', the user script will run within the sandbox
-                environment, else it will run locally on user's system.
-                Permitted Values: 'sandbox', 'local'
-                Default Value: 'sandbox'
+                If set to 'local', the user script will run locally on user's system.
+                Permitted Values: 'local'
+                Default Value: 'local'
                 Types: str
             kwargs:
@@ -734,13 +568,6 @@ class TableOperator:
                         Default Value: True
                         Types: bool
-                    timeout:
-                        Optional Argument.
-                        Specifies the timeout for docker API calls when running in
-                        sandbox mode.
-                        Default Value: 5000
-                        Types: int
                     data_file_quote_char:
                         Optional Argument.
                         Specifies the quotechar used in the input data file.
@@ -811,23 +638,6 @@ class TableOperator:
         EXAMPLES:
             # Assumption - sto is Script() object. Please refer to help(Script)
             # for creating Script object.
-            # Run user script in sandbox mode with input from data file.
-            >>> sto.test_script(input_data_file='../barrier.csv',
-            ...                 data_file_delimiter=',',
-            ...                 data_file_quote_char='"',
-            ...                 data_file_header=True,
-            ...                 exec_mode='sandbox')
-            ############ STDOUT Output ############
-                    word  count_input
-            0          1            1
-            1        Old            1
-            2  Macdonald            1
-            3        Had            1
-            4          A            1
-            5       Farm            1
-            >>>
             # Run user script in local mode with input from table.
             >>> sto.test_script(data_row_limit=300, password='alice', exec_mode='local')
@@ -841,19 +651,19 @@ class TableOperator:
             4          A            1
             5       Farm            1
-            # Run user script in sandbox mode with logmech as 'TD2'.
+            # Run user script in local mode with logmech as 'TD2'.
             >>> sto.test_script(script_args="4 5 10 6 480", password="alice", logmech="TD2")
-            # Run user script in sandbox mode with logmech as 'TDNEGO'.
+            # Run user script in local mode with logmech as 'TDNEGO'.
             >>> sto.test_script(script_args="4 5 10 6 480", password="alice", logmech="TDNEGO")
-            # Run user script in sandbox mode with logmech as 'LDAP'.
+            # Run user script in local mode with logmech as 'LDAP'.
             >>> sto.test_script(script_args="4 5 10 6 480", password="alice", logmech="LDAP")
-            # Run user script in sandbox mode with logmech as 'KRB5'.
+            # Run user script in local mode with logmech as 'KRB5'.
             >>> sto.test_script(script_args="4 5 10 6 480", password="alice", logmech="KRB5")
-            # Run user script in sandbox mode with logmech as 'JWT'.
+            # Run user script in local mode with logmech as 'JWT'.
             >>> sto.test_script(script_args="4 5 10 6 480", password="alice",
                                 logmech='JWT', logdata='token=eyJpc...h8dA')
@@ -866,8 +676,7 @@ class TableOperator:
         awu_matrix_test.append((["input_data_file", input_data_file, True, (str), True]))
         awu_matrix_test.append((["script_args", script_args, True, (str), False]))
         awu_matrix_test.append((["exec_mode", exec_mode, True, (str), True,
-                                 [TableOperatorConstants.SANDBOX_EXEC.value,
-                                  TableOperatorConstants.LOCAL_EXEC.value]]))
+                                 [TableOperatorConstants.LOCAL_EXEC.value]]))
         data_row_limit = kwargs.pop("data_row_limit", 1000)
         awu_matrix_test.append((["data_row_limit", data_row_limit, True, (int), True]))
@@ -883,9 +692,6 @@ class TableOperator:
         data_file_header = kwargs.pop("data_file_header", True)
         awu_matrix_test.append((["data_file_header", data_file_header, True, (bool)]))
-        timeout = kwargs.pop("timeout", 5000)
-        awu_matrix_test.append((["timeout", timeout, True, (int), True]))
         logmech = kwargs.pop("logmech", "TD2")
         awu_matrix_test.append(
             ["logmech", logmech, True, (str), True, logmech_valid_values])
@@ -896,9 +702,6 @@ class TableOperator:
         # Validate argument types.
         _Validators._validate_function_arguments(awu_matrix_test)
-        # Validate timeout value.
-        _Validators._validate_positive_int(timeout, "timeout")
         self._validate()
         if logmech == "JWT" and not logdata:
@@ -914,14 +717,8 @@ class TableOperator:
         # Either of 'input_data_file' or 'password' argument is required.
         password = kwargs.pop("password", None)
-        # The check of EITHER_THIS_OR_THAT_ARGUMENT is applicable only when the exec_mode is sandbox.
-        # Hence adding the check exec_mode != "local".
         # When exec_mode is local, the connection object is used to get the values in the table.
-        if exec_mode != "local" and not (input_data_file or (self.data and password)):
-            message = Messages.get_message(MessageCodes.EITHER_THIS_OR_THAT_ARGUMENT,
-                                           "input_data_file", "Script data and password")
-            raise TeradataMlException(message, MessageCodes.EITHER_THIS_OR_THAT_ARGUMENT)
-        elif exec_mode == "local" and not (input_data_file or self.data):
+        if exec_mode == "local" and not (input_data_file or self.data):
             message = Messages.get_message(MessageCodes.EITHER_THIS_OR_THAT_ARGUMENT,
                                            "input_data_file", "Script data")
             raise TeradataMlException(message, MessageCodes.EITHER_THIS_OR_THAT_ARGUMENT)
@@ -984,171 +781,6 @@ class TableOperator:
                     return self.__process_test_script_output(exec_cmd_output)
                 except Exception as exp:
                     raise
-        else:
-            # Execution Mode - sandbox.
-            # get the frame object of the function.
-            import inspect
-            frame = inspect.currentframe()
-            # Validate argument types.
-            _Validators._validate_module_presence('docker', frame.f_code.co_name)
-            # Read container_id from configure.sandbox_container_id, if it is None then
-            # raise an exception
-            container_id = configure.sandbox_container_id
-            if container_id is None:
-                message = Messages.get_message(MessageCodes.SANDBOX_CONTAINER_NOT_FOUND)
-                raise TeradataMlException(message,
-                                          MessageCodes.SANDBOX_CONTAINER_NOT_FOUND)
-            # Set path inside docker container. This is where files will be copied to.
-            # os.path.join() will not work here because the path is not dependent on
-            # client platform. Sandbox environment is linux based here.
-            _path_in_docker_container = "/home/tdatuser"
-            user_script_path = "{}/{}".format(_path_in_docker_container, self.script_name)
-            if input_data_file is not None:
-                input_file_name = os.path.basename(input_data_file)
-                input_file_path = "{}/{}".format(_path_in_docker_container,
-                                                 input_file_name)
-                # Create script_executor.
-                self._create_executor_script(user_script_path=user_script_path,
-                                             user_script_args=script_args,
-                                             data_file_path=input_file_path,
-                                             data_file_delimiter=data_file_delimiter,
-                                             data_file_quote_char=data_file_quote_char,
-                                             data_file_header=data_file_header)
-            else:
-                # Read input from db.
-                if self.data.shape[0] > data_row_limit:
-                    raise ValueError(
-                        Messages.get_message(MessageCodes.DATAFRAME_LIMIT_ERROR,
-                                             'data_row_limit', 'data_row_limit',
-                                             data_row_limit))
-                db_host = get_context().url.host
-                user_name = get_context().url.username
-                if not self.data._table_name:
-                    self.data._table_name = df_utils._execute_node_return_db_object_name(
-                        self.data._nodeid, self.data._metaexpr)
-                table_name = UtilFuncs._extract_table_name(self.data._table_name)
-                db_name = _get_current_databasename()
-                # Create script_executor.
-                self._create_executor_script(user_script_path=user_script_path,
-                                             user_script_args=script_args,
-                                             db_host=db_host,
-                                             user_name=user_name,
-                                             passwd=password,
-                                             table_name=table_name,
-                                             db_name=db_name,
-                                             logmech=logmech,
-                                             logdata=logdata)
-            import docker
-            client = docker.APIClient(timeout=timeout)
-            # Copy files to container indicated in configure.sandbox_container_id.
-            files_to_copy = [self.script_name]
-            if supporting_files is not None:
-                if isinstance(supporting_files, str):
-                    supporting_files = [supporting_files]
-                if len(supporting_files) == 0 \
-                        or any(file in [None, "None", ""] for file in supporting_files):
-                    raise ValueError(
-                        Messages.get_message(MessageCodes.LIST_SELECT_NONE_OR_EMPTY,
-                                             'supporting_files'))
-                else:
-                    files_to_copy.extend(supporting_files)
-            if input_data_file is not None:
-                files_to_copy.append(input_data_file)
-            for filename in files_to_copy:
-                file_path = os.path.join(self.files_local_path, filename)
-                # Check if file exists.
-                _Validators._validate_file_exists(file_path)
-                # Copy file to docker container.
-                self._copy_to_docker_container(client, file_path,
-                                               _path_in_docker_container,
-                                               container_id)
-            # Copy script_executor to docker container.
-            self._copy_to_docker_container(client, self.script_path,
-                                           _path_in_docker_container,
-                                           container_id)
-            script_executor_file_name = os.path.basename(self.script_path)
-            exec_cmd = ("python3 {0}/{1}".format(_path_in_docker_container,
-                                                 script_executor_file_name))
-            try:
-                # Setup an exec instance in the container.
-                exec_cmd_create = client.exec_create(container_id, exec_cmd)
-                # Start exec instance and run user script.
-                exec_cmd_output = client.exec_start(exec_cmd_create, demux=True)
-                # Inspect the output for success or failure.
-                inspect_out = client.exec_inspect(exec_cmd_create)
-                # Extract the exit code.
-                exit_code = inspect_out['ExitCode']
-                if exec_cmd_output[0] is not None:
-                    executor_output = exec_cmd_output[0].decode()
-                executor_error = ""
-                if exec_cmd_output[1] is not None:
-                    executor_error = exec_cmd_output[1].decode()
-                # Exit code 1 indicates any error thrown by subprocess.
-                # Exit code 126 indicates permission problem or command is not executable.
-                # Exit code 127 indicates possible typos in shell script with
-                # unrecognizable characters.
-                if exit_code == 1 or exit_code == 126 or exit_code == 127:
-                    message = Messages.get_message(
-                        MessageCodes.SANDBOX_SCRIPT_ERROR).format(executor_error)
-                    raise TeradataMlException(message,
-                                              MessageCodes.SANDBOX_SCRIPT_ERROR)
-                # Exit code 2 indicates either username or password is invalid.
-                elif exit_code == 2:
-                    message = Messages.get_message(
-                        MessageCodes.SANDBOX_CONNECTION_ERROR).format(executor_error)
-                    raise TeradataMlException(message,
-                                              MessageCodes.SANDBOX_CONNECTION_ERROR)
-                # Exit code 3 indicates problem with query.
-                elif exit_code == 3:
-                    message = Messages.get_message(
-                        MessageCodes.SANDBOX_QUERY_ERROR).format(executor_error)
-                    raise TeradataMlException(message,
-                                              MessageCodes.SANDBOX_QUERY_ERROR)
-                # Exit code 4 indicates all other exceptions / errors.
-                elif exit_code == 4:
-                    message = Messages.get_message(
-                        MessageCodes.SANDBOX_CONTAINER_ERROR).format(executor_error)
-                    raise TeradataMlException(message,
-                                              MessageCodes.SANDBOX_CONTAINER_ERROR)
-                elif exit_code != 0:
-                    # Any error other than exit code 1, 2, 3, 4
-                    message = Messages.get_message(
-                        MessageCodes.SANDBOX_CONTAINER_ERROR).format(executor_error)
-                    raise TeradataMlException(message,
-                                              MessageCodes.SANDBOX_CONTAINER_ERROR)
-                else:
-                    return self.__process_test_script_output(executor_output)
-            except Exception as exp:
-                message = Messages.get_message(
-                    MessageCodes.SANDBOX_CONTAINER_ERROR).format(str(exp))
-                raise TeradataMlException(message,
-                                          MessageCodes.SANDBOX_CONTAINER_ERROR)
     def __local_run_user_script_input_file(self, cmd, input_file_path,
                                            data_file_delimiter='\t',
@@ -1369,248 +1001,207 @@ class TableOperator:
         return self.__run_user_script_subprocess(cmd, db_data_handle)
-    def _create_executor_script(self, user_script_path,
-                                 user_script_args=None,
-                                 data_file_path=None,
-                                 data_file_delimiter='\t',
-                                 data_file_quote_char='"',
-                                 data_file_header=True,
-                                 db_name=None,
-                                 db_host=None,
-                                 user_name=None,
-                                 passwd=None,
-                                 logmech=None,
-                                 logdata=None,
-                                 table_name=None):
+    def __repr__(self):
+        """
+        Returns the string representation for the class instance.
+        """
+        if self.result is None:
+            repr_string = "Result is empty. Please run execute_script first."
+        else:
+            repr_string = "############ STDOUT Output ############"
+            repr_string = "{}\n\n{}".format(repr_string, self.result)
+        return repr_string
+    def deploy(self, model_column, partition_columns=None, model_file_prefix=None):
         """
         DESCRIPTION:
-            Internal function that will generate 'script_executor.py' to be copied to
-            sandbox environment.
+            Function deploys the model generated after `execute_script()` in database or user
+            environment in lake.
         PARAMETERS:
-            user_script_path:
-                Required Argument.
-                Specifies the path to user script inside docker container.
-                Types: str
-            user_script_args:
-                Optional Argument.
-                Specifies command line arguments required by the user script.
-                Types: str
-            data_file_path:
+            model_column:
                 Required Argument.
-                Specifies the path to input data file inside docker container.
-                Types: str
-            data_file_delimiter:
-                Optional Argument.
-                Specifies the delimiter used in input data file.
-                Default Value: "\t" (tab)
-                Types: character of length 1
-            data_file_quote_char:
-                Optional Argument.
-                Specifies the quote character used in input data file.
-                Default Value: '"'
-                Types: character of length 1
-            data_file_header:
-                Optional Argument.
-                Specifies whether the input data file has header.
-                Default Value: True
-                Types: bool
-            db_name:
-                Optional Argument.
-                Specifies the current database name.
-                Default Value: None
-                Types: str
-            db_host:
-                Optional Argument.
-                Specifies the host name.
-                Default Value: None
-                Types: str
-            user_name:
-                Optional Argument.
-                Specifies the user name.
-                Default Value: None
+                Specifies the column name in which model is present.
+                Supported types of model in this column are CLOB and BLOB.
+                Note:
+                    The column mentioned in this argument should be present in
+                    <apply_obj/script_obj>.result.
                 Types: str
-            passwd:
+            partition_columns:
                 Optional Argument.
-                Specifies the password for user name in "user_name".
-                Default Value: None
-                Types: str
+                Specifies the columns on which data is partitioned.
+                Note:
+                    The columns mentioned in this argument should be present in
+                    <apply_obj/script_obj>.result.
+                Types: str OR list of str
-            table_name:
+            model_file_prefix:
                 Optional Argument.
-                Specifies the table name where input data is present.
-                Default Value: None
+                Specifies the prefix to be used for the generated model file.
+                If this argument is None, prefix is auto-generated.
+                If the argument "model_column" contains multiple models and
+                    * "partition_columns" is None - model file prefix is appended with
+                      underscore(_) and numbers starting from one(1) to get model file
+                      names.
+                    * "partition_columns" is NOT None - model file prefix is appended
+                      with underscore(_) and unique values in partition_columns are joined
+                      with underscore(_) to generate model file names.
                 Types: str
         RETURNS:
-            None.
+            List of generated file names.
         RAISES:
-            None.
+            TeradataMlException
         EXAMPLES:
-            # Example 1: Create executor script when input data is to be read from a file.
-            self._create_executor_script(user_script_path=user_script_path,
-                                          user_script_args=script_args,
-                                          data_file_path=input_file_path,
-                                          data_file_delimiter=data_file_delimiter,
-                                          data_file_quote_char=data_file_quote_char,
-                                          data_file_header=data_file_header)
-            # Example 2: Create executor script when input data is to be read from db.
-            self._create_executor_script(user_script_path=user_script_path,
-                                          user_script_args=script_args,
-                                          db_host=db_host,
-                                          user_name=user_name,
-                                          passwd=password,
-                                          table_name=table_name,
-                                          db_name=db_name)
+            >>> load_example_data("openml", "multi_model_classification")
+            >>> df = DataFrame("multi_model_classification")
+            >>> df
+                           col2      col3      col4  label  group_column  partition_column_1  partition_column_2
+            col1
+            -1.013454  0.855765 -0.256920 -0.085301      1             9                   0                  10
+            -3.146552 -1.805530 -0.071515 -2.093998      0            10                   0                  10
+            -1.175097 -0.950745  0.018280 -0.895335      1            10                   0                  11
+             0.218497 -0.968924  0.183037 -0.303142      0            11                   0                  11
+            -1.471908 -0.029195 -0.166141 -0.645309      1            11                   1                  10
+             1.082336  0.846357 -0.012063  0.812633      1            11                   1                  11
+            -1.132068 -1.209750  0.065422 -0.982986      0            10                   1                  10
+            -0.440339  2.290676 -0.423878  0.749467      1             8                   1                  10
+            -0.615226 -0.546472  0.017496 -0.488720      0            12                   0                  10
+             0.579671 -0.573365  0.160603  0.014404      0             9                   1                  10
+            # Install Script file.
+            >>> file_location = os.path.join(os.path.dirname(teradataml.__file__), "data", "scripts", "deploy_script.py")
+            >>> install_file("deploy_script", file_location, replace=True)
+            # Variables needed for Script execution.
+            >>> script_command = '/opt/teradata/languages/Python/bin/python3 ./ALICE/deploy_script.py'
+            >>> partition_columns = ["partition_column_1", "partition_column_2"]
+            >>> columns = ["col1", "col2", "col3", "col4", "label",
+                           "partition_column_1", "partition_column_2"]
+            >>> returns = OrderedDict([("partition_column_1", INTEGER()),
+                                       ("partition_column_2", INTEGER()),
+                                       ("model", CLOB())])
+            # Script execution.
+            >>> obj = Script(data=df.select(columns),
+                             script_command=script_command,
+                             data_partition_column=partition_columns,
+                             returns=returns
+                             )
+            >>> opt = obj.execute_script()
+            >>> opt
+            partition_column_1  partition_column_2               model
+                            0                  10   b'gAejc1.....drIr'
+                            0                  11   b'gANjcw.....qWIu'
+                            1                  10   b'abdwcd.....dWIz'
+                            1                  11   b'gA4jc4.....agfu'
+            # Example 1: Provide only "partition_columns" argument. Here, "model_file_prefix"
+            #            is auto generated.
+            >>> obj.deploy(model_column="model",
+                           partition_columns=["partition_column_1", "partition_column_2"])
+            ['model_file_1710436227163427__0_10',
+             'model_file_1710436227163427__1_10',
+             'model_file_1710436227163427__0_11',
+             'model_file_1710436227163427__1_11']
+            # Example 2: Provide only "model_file_prefix" argument. Here, filenames are suffixed
+            #            with 1, 2, 3, ... for multiple models.
+            >>> obj.deploy(model_column="model", model_file_prefix="my_prefix_new_")
+            ['my_prefix_new__1',
+             'my_prefix_new__2',
+             'my_prefix_new__3',
+             'my_prefix_new__4']
+            # Example 3: Without both "partition_columns" and "model_file_prefix" arguments.
+            >>> obj.deploy(model_column="model")
+            ['model_file_1710438346528596__1',
+             'model_file_1710438346528596__2',
+             'model_file_1710438346528596__3',
+             'model_file_1710438346528596__4']
+            # Example 4: Provide both "partition_columns" and "model_file_prefix" arguments.
+            >>> obj.deploy(model_column="model", model_file_prefix="my_prefix_new_",
+                           partition_columns=["partition_column_1", "partition_column_2"])
+            ['my_prefix_new__0_10',
+             'my_prefix_new__0_11',
+             'my_prefix_new__1_10',
+             'my_prefix_new__1_11']
         """
-        __data_source = "db"
-        if data_file_path:
-            __data_source = "file"
-        temp_script_name = UtilFuncs._generate_temp_script_name(prefix="script_executor",
-                                                                use_default_database=True,
-                                                                gc_on_quit=True,
-                                                                quote=True,
-                                                                script_type=TeradataConstants.TERADATA_LOCAL_SCRIPT)
+        arg_info_matrix = []
+        arg_info_matrix.append(["model_column", model_column, False, (str)])
+        arg_info_matrix.append(["partition_columns", partition_columns, True, (str, list)])
+        arg_info_matrix.append(["model_file_prefix", model_file_prefix, True, (str)])
+        _Validators._validate_function_arguments(arg_info_matrix)
-        # Remove quotes from the file name after removing the database name.
-        script_alias = UtilFuncs._teradata_unquote_arg(
-            UtilFuncs._extract_table_name(temp_script_name), quote='"')
+        if self.result is None:
+            return "Result is empty. Please run execute_script first."
-        # script_name is the actual file name (basename).
-        script_name = "{script_name}.py".format(script_name=script_alias)
+        if partition_columns is None:
+            partition_columns = []
+        partition_columns = UtilFuncs._as_list(partition_columns)
-        # Create script in .teradataml directory.
-        ###
+        req_columns = [model_column] + partition_columns
-        script_dir = GarbageCollector._get_temp_dir_name()
+        _Validators._validate_column_exists_in_dataframe(columns=req_columns, metaexpr=self.result._metaexpr)
-        # script_path is the actual path where we want to generate the user script at.
-        self.script_path = os.path.join(script_dir, script_name)
+        data = self.result.select(req_columns)
+        data._index_column = None # Without this, first column i.e., model column will be index column.
-        template_dir = os.path.join(os.path.dirname(
-            os.path.dirname(os.path.abspath(__file__))),
-            "table_operators", "templates")
-        try:
-            # Write to the script based on the template.
-            #
-            from teradataml.common.constants import TableOperatorConstants
-            executor_file = os.path.join(template_dir,
-                                         TableOperatorConstants.SCRIPT_TEMPLATE.value)
-            with open(executor_file, 'r') as input_file:
-                with open(self.script_path, 'w') as output_file:
-                    os.chmod(self.script_path, 0o644)
-                    output_file.write(
-                        input_file.read().format(
-                            DATA_SOURCE=UtilFuncs._serialize_and_encode(__data_source),
-                            DELIMITER=UtilFuncs._serialize_and_encode(self.delimiter),
-                            QUOTECHAR=UtilFuncs._serialize_and_encode(self.quotechar),
-                            USER_SCRIPT_PATH=UtilFuncs._serialize_and_encode(
-                                user_script_path),
-                            SCRIPT_ARGS=UtilFuncs._serialize_and_encode(user_script_args),
-                            DATA_FILE_PATH=UtilFuncs._serialize_and_encode(
-                                data_file_path),
-                            INPUT_DATA_FILE_DELIMITER=UtilFuncs._serialize_and_encode(
-                                data_file_delimiter),
-                            INPUT_DATA_FILE_QUOTE_CHAR=UtilFuncs._serialize_and_encode(
-                                data_file_quote_char),
-                            INPUT_DATA_FILE_HEADER=UtilFuncs._serialize_and_encode(
-                                data_file_header),
-                            DB_HOST=UtilFuncs._serialize_and_encode(db_host),
-                            DB_USER=UtilFuncs._serialize_and_encode(user_name),
-                            DB_PASS=UtilFuncs._serialize_and_encode(passwd),
-                            DB_NAME=UtilFuncs._serialize_and_encode(db_name),
-                            TABLE_NAME=UtilFuncs._serialize_and_encode(table_name),
-                            LOGMECH=UtilFuncs._serialize_and_encode(logmech),
-                            LOGDATA=UtilFuncs._serialize_and_encode(logdata)
-                        ))
-        except Exception:
-            # Cleanup if we end up here in case of an error.
-            GarbageCollector._delete_local_file(self.script_path)
-            raise
-    def _copy_to_docker_container(self, client,
-                                   local_file_path,
-                                   path_in_docker_container,
-                                   container):
-        """
-        DESCRIPTION:
-            Function to copy files to docker container.
-        PARAMETERS:
-            client:
-                Required Argument.
-                Specifies the connection object for docker.
-                Types: str
+        if model_file_prefix is None:
+            timestamp = time.time()
+            tmp = "{}{}".format(floor(timestamp / 1000000),
+                                floor(timestamp % 1000000 * 1000000 +
+                                    int(str(uuid.uuid4().fields[-1])[:10])))
+            model_file_prefix = f"model_file_{tmp}_"
-            local_file_path:
-                Required Argument.
-                Specifies the path to the file to be copied.
-                Types: str
+        vals = data.get_values()
-            path_in_docker_container:
-                Required Argument.
-                Specifies destination path in the docker container where file will be
-                copied to.
-                Types: str
+        model_column_type = data._td_column_names_and_sqlalchemy_types[model_column.lower()].__class__.__name__
-            container:
-                Required Argument.
-                Specifies container id.
-                Types: str
+        n_models = len(vals)
+        all_files = []
-            RETURNS:
-                None.
+        for i, row in enumerate(vals):
+            model = row[0]
+            partition_values = ""
+            if partition_columns:
+                partition_values = "_".join([str(x) for x in row[1:]])
+            elif n_models > 1:
+                partition_values = str(i+1)
-            RAISES:
-                TeradataMLException.
+            model_file = f"{model_file_prefix}_{partition_values}"
+            model_file_path = os.path.join(os.path.expanduser("~"), ".teradataml", model_file)
-        """
-        # Create tar file.
-        tar_file_path = "{}.tar".format(local_file_path)
-        file_name = os.path.basename(local_file_path)
-        tar = tarfile.open(tar_file_path, mode='w')
-        try:
-            tar.add(local_file_path, arcname=file_name)
-        finally:
-            tar.close()
-        data = open(tar_file_path, 'rb').read()
+            if model_column_type == "CLOB":
+                import base64
+                model = base64.b64decode(model.partition("'")[2])
+            elif model_column_type == "BLOB":
+                # No operation needed.
+                # Apply model training returns BLOB type.
+                pass
+            else:
+                raise ValueError(f"Model column type {model_column_type} is not supported.")
-        try:
-            # Copy file to docker container.
-            copy_status = client.put_archive(container, path_in_docker_container, data)
-            os.remove(tar_file_path)
+            with open(model_file_path, "wb") as f:
+                f.write(model)
-            if copy_status:
-                return
-        except Exception as exp:
-            message = Messages.get_message(
-                MessageCodes.SANDBOX_CONTAINER_ERROR).format(str(exp))
-            raise TeradataMlException(message, MessageCodes.SANDBOX_CONTAINER_ERROR)
+            if self.__class__.__name__ == "Script":
+                from teradataml import install_file
+                install_file(file_identifier=model_file, file_path=model_file_path,
+                             is_binary=True, suppress_output=True)
+            elif self.__class__.__name__ == "Apply":
+                self.env.install_file(file_name=model_file_path)
-    def __repr__(self):
-        """
-        Returns the string representation for the class instance.
-        """
-        if self.result is None:
-            repr_string = "Result is empty. Please run execute_script first."
-        else:
-            repr_string = "############ STDOUT Output ############"
-            repr_string = "{}\n\n{}".format(repr_string, self.result)
-        return repr_string
+            all_files.append(model_file)
+            os.remove(model_file_path)
+        return all_files

teradataml 17.20.0.6__py3-none-any.whl → 20.0.0.0__py3-none-any.whl

Potentially problematic release.

teradataml 17.20.0.6py3-none-any.whl → 20.0.0.0py3-none-any.whl